opencv/samples/dnn/optical_flow.py

#!/usr/bin/env python
'''
This sample using FlowNet v2 model to calculate optical flow.
Original paper: https://arxiv.org/abs/1612.01925.
Original repo:  https://github.com/lmb-freiburg/flownet2.

Download the converted .caffemodel model from https://drive.google.com/open?id=16qvE9VNmU39NttpZwZs81Ga8VYQJDaWZ
and .prototxt from https://drive.google.com/open?id=19bo6SWU2p8ZKvjXqMKiCPdK8mghwDy9b.
Otherwise download original model from https://lmb.informatik.uni-freiburg.de/resources/binaries/flownet2/flownet2-models.tar.gz,
convert .h5 model to .caffemodel and modify original .prototxt using .prototxt from link above.
'''

import argparse
import os.path
import numpy as np
import cv2 as cv


class OpticalFlow(object):
    def __init__(self, proto, model, height, width):
        self.net = cv.dnn.readNet(proto, model)
        self.net.setPreferableBackend(cv.dnn.DNN_BACKEND_OPENCV)
        self.height = height
        self.width = width

    def compute_flow(self, first_img, second_img):
        inp0 = cv.dnn.blobFromImage(first_img, size=(self.width, self.height))
        inp1 = cv.dnn.blobFromImage(second_img, size=(self.width, self.height))
        self.net.setInput(inp0, "img0")
        self.net.setInput(inp1, "img1")
        flow = self.net.forward()
        output = self.motion_to_color(flow)
        return output

    def motion_to_color(self, flow):
        arr = np.arange(0, 255, dtype=np.uint8)
        colormap = cv.applyColorMap(arr, cv.COLORMAP_HSV)
        colormap = colormap.squeeze(1)

        flow = flow.squeeze(0)
        fx, fy = flow[0, ...], flow[1, ...]
        rad = np.sqrt(fx**2 + fy**2)
        maxrad = rad.max() if rad.max() != 0 else 1

        ncols = arr.size
        rad = rad[..., np.newaxis] / maxrad
        a = np.arctan2(-fy / maxrad, -fx / maxrad) / np.pi
        fk = (a + 1) / 2.0 * (ncols - 1)
        k0 = fk.astype(np.int)
        k1 = (k0 + 1) % ncols
        f = fk[..., np.newaxis] - k0[..., np.newaxis]

        col0 = colormap[k0] / 255.0
        col1 = colormap[k1] / 255.0
        col = (1 - f) * col0 + f * col1
        col = np.where(rad <= 1, 1 - rad * (1 - col), col * 0.75)
        output = (255.0 * col).astype(np.uint8)
        return output


if __name__ == '__main__':
    parser = argparse.ArgumentParser(description='Use this script to calculate optical flow using FlowNetv2',
                                     formatter_class=argparse.ArgumentDefaultsHelpFormatter)
    parser.add_argument('-input', '-i', required=True, help='Path to input video file. Skip this argument to capture frames from a camera.')
    parser.add_argument('--height', default=320, help='Input height')
    parser.add_argument('--width',  default=448, help='Input width')
    parser.add_argument('--proto', '-p', default='FlowNet2_deploy.prototxt', help='Path to prototxt.')
    parser.add_argument('--model', '-m', default='FlowNet2_weights.caffemodel', help='Path to caffemodel.')
    args, _ = parser.parse_known_args()

    if not os.path.isfile(args.model) or not os.path.isfile(args.proto):
        raise OSError("Prototxt or caffemodel not exist")

    winName = 'Calculation optical flow in OpenCV'
    cv.namedWindow(winName, cv.WINDOW_NORMAL)
    cap = cv.VideoCapture(args.input if args.input else 0)
    hasFrame, first_frame = cap.read()
    opt_flow = OpticalFlow(args.proto, args.model, args.height, args.width)
    while cv.waitKey(1) < 0:
        hasFrame, second_frame = cap.read()
        if not hasFrame:
            break
        flow = opt_flow.compute_flow(first_frame, second_frame)
        first_frame = second_frame
        cv.imshow(winName, flow)
Merge pull request #16575 from l-bat:flownet2 Support FlowNet2 model * Support DataAugmentation layer * Fix warnings * Fix comments * Support Correlation layer * TEST * Support Correlation layer * Supported Accum and FlowWarp layers * Supported ChannelNorm layer * Supported Resample with inputs.size() > 1 * Fixed comments * Refactoring * Added tests * Add resample test * Added asserts in resize layer * Updated DataAugmentation layer * Update convolution layer * Refactoring * Fix data augmentation layer * Fix caffe importer * Fix resize * Switch to Mat ptr * Remove useless resize type * Used ResizeLayer in Accum * Split ChannelNormLayer * Delete duplicate assert * Add sample * Fix sample * Added colormap 5 years ago			`#!/usr/bin/env python`
			`'''`
			`This sample using FlowNet v2 model to calculate optical flow.`
			`Original paper: https://arxiv.org/abs/1612.01925.`
			`Original repo: https://github.com/lmb-freiburg/flownet2.`

			`Download the converted .caffemodel model from https://drive.google.com/open?id=16qvE9VNmU39NttpZwZs81Ga8VYQJDaWZ`
			`and .prototxt from https://drive.google.com/open?id=19bo6SWU2p8ZKvjXqMKiCPdK8mghwDy9b.`
			`Otherwise download original model from https://lmb.informatik.uni-freiburg.de/resources/binaries/flownet2/flownet2-models.tar.gz,`
			`convert .h5 model to .caffemodel and modify original .prototxt using .prototxt from link above.`
			`'''`

			`import argparse`
			`import os.path`
			`import numpy as np`
			`import cv2 as cv`


			`class OpticalFlow(object):`
			`def __init__(self, proto, model, height, width):`
			`self.net = cv.dnn.readNet(proto, model)`
			`self.net.setPreferableBackend(cv.dnn.DNN_BACKEND_OPENCV)`
			`self.height = height`
			`self.width = width`

			`def compute_flow(self, first_img, second_img):`
			`inp0 = cv.dnn.blobFromImage(first_img, size=(self.width, self.height))`
			`inp1 = cv.dnn.blobFromImage(second_img, size=(self.width, self.height))`
			`self.net.setInput(inp0, "img0")`
			`self.net.setInput(inp1, "img1")`
			`flow = self.net.forward()`
			`output = self.motion_to_color(flow)`
			`return output`

			`def motion_to_color(self, flow):`
			`arr = np.arange(0, 255, dtype=np.uint8)`
			`colormap = cv.applyColorMap(arr, cv.COLORMAP_HSV)`
			`colormap = colormap.squeeze(1)`

			`flow = flow.squeeze(0)`
			`fx, fy = flow[0, ...], flow[1, ...]`
			`rad = np.sqrt(fx2 + fy2)`
			`maxrad = rad.max() if rad.max() != 0 else 1`

			`ncols = arr.size`
			`rad = rad[..., np.newaxis] / maxrad`
			`a = np.arctan2(-fy / maxrad, -fx / maxrad) / np.pi`
			`fk = (a + 1) / 2.0 * (ncols - 1)`
			`k0 = fk.astype(np.int)`
			`k1 = (k0 + 1) % ncols`
			`f = fk[..., np.newaxis] - k0[..., np.newaxis]`

			`col0 = colormap[k0] / 255.0`
			`col1 = colormap[k1] / 255.0`
			`col = (1 - f) * col0 + f * col1`
			`col = np.where(rad <= 1, 1 - rad * (1 - col), col * 0.75)`
			`output = (255.0 * col).astype(np.uint8)`
			`return output`


			`if __name__ == '__main__':`
			`parser = argparse.ArgumentParser(description='Use this script to calculate optical flow using FlowNetv2',`
			`formatter_class=argparse.ArgumentDefaultsHelpFormatter)`
			`parser.add_argument('-input', '-i', required=True, help='Path to input video file. Skip this argument to capture frames from a camera.')`
			`parser.add_argument('--height', default=320, help='Input height')`
			`parser.add_argument('--width', default=448, help='Input width')`
			`parser.add_argument('--proto', '-p', default='FlowNet2_deploy.prototxt', help='Path to prototxt.')`
			`parser.add_argument('--model', '-m', default='FlowNet2_weights.caffemodel', help='Path to caffemodel.')`
			`args, _ = parser.parse_known_args()`

			`if not os.path.isfile(args.model) or not os.path.isfile(args.proto):`
			`raise OSError("Prototxt or caffemodel not exist")`

			`winName = 'Calculation optical flow in OpenCV'`
			`cv.namedWindow(winName, cv.WINDOW_NORMAL)`
			`cap = cv.VideoCapture(args.input if args.input else 0)`
			`hasFrame, first_frame = cap.read()`
			`opt_flow = OpticalFlow(args.proto, args.model, args.height, args.width)`
			`while cv.waitKey(1) < 0:`
			`hasFrame, second_frame = cap.read()`
			`if not hasFrame:`
			`break`
			`flow = opt_flow.compute_flow(first_frame, second_frame)`
			`first_frame = second_frame`
			`cv.imshow(winName, flow)`