VPI - Vision Programming Interface

1.2 Release

Dense Optical Flow

Overview

This application fetches frames from an input video source, runs the dense optical flow algorithm on each pair of previous and current frames, and calculates the motion vector for every 4x4 pixel block. The output motion vectors are mapped to the HSV color space, where hue encodes the motion angle and value encodes the motion speed, and the result is saved to a video file.
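
To make that mapping concrete, the fragment below is a minimal sketch (not part of the installed sample) that turns a dense flow field into such a heatmap with OpenCV and NumPy; the helper name flow_to_heatmap and the magnitude clip of 5.0 are illustrative choices. The sample code further below does the equivalent work in process_motion_vectors (Python) and ProcessMotionVector (C++), after first converting the S10.5 fixed-point motion vectors to float.

    import cv2
    import numpy as np

    def flow_to_heatmap(flow):
        """Map an HxWx2 float32 flow field (one vector per 4x4 block) to a BGR heatmap."""
        # Angle becomes hue, magnitude becomes value (brightness)
        magnitude, angle = cv2.cartToPolar(flow[:,:,0], flow[:,:,1], angleInDegrees=True)

        clip = 5.0  # cap the magnitude so small motions stay visible
        magnitude = np.minimum(magnitude, clip)

        hsv = np.empty((flow.shape[0], flow.shape[1], 3), np.float32)
        hsv[:,:,0] = angle             # hue: motion direction, in degrees
        hsv[:,:,1] = 1.0               # saturation: fixed at maximum
        hsv[:,:,2] = magnitude / clip  # value: motion speed, normalized to [0, 1]

        bgr = cv2.cvtColor(hsv, cv2.COLOR_HSV2BGR)
        return np.uint8(bgr * 255)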

Instructions

The command line parameters are:

<backend> <input video> <quality>

where

  • backend: Defines the backend that will perform the processing. Only nvenc is currently supported.
  • input video: Input video file name; it accepts .mp4, .avi, and possibly other formats, depending on OpenCV's support.
  • quality: Specifies the quality setting the algorithm will use. Available options are: low (fastest), medium (balanced performance and quality), and high (slowest).

Here's one example:

  • C++
    ./vpi_sample_13_optflow_dense nvenc ../assets/pedestrians.mp4 high
  • Python
    python main.py nvenc ../assets/pedestrians.mp4 high

The application will process pedestrians.mp4 and create denseoptflow_mv_nvenc.mp4.

Note
If using OpenCV-2.4 or older (e.g., on Ubuntu 16.04), the output file is denseoptflow_mv_nvenc.avi.
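
For reference, here is a minimal sketch (assuming only that cv2 is importable) of the version check both samples use to pick the output container; the AVI/MPEG fallback mirrors the sample code below:

    import cv2

    # OpenCV 3+ writes H.264 MP4; OpenCV 2.4 falls back to AVI/MPEG
    if int(cv2.__version__.split('.')[0]) >= 3:
        extOutputVideo, fourcc = '.mp4', cv2.VideoWriter_fourcc(*'avc1')
    else:
        extOutputVideo, fourcc = '.avi', cv2.cv.CV_FOURCC('M', 'P', 'E', 'G')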

Results

Input video and motion vector video (shown side by side in the original documentation page).

Source Code

For convenience, here's the code that is also installed in the samples directory.

Python:
import cv2
import sys
import vpi
import numpy as np
from os import path
from argparse import ArgumentParser
from contextlib import contextmanager

# ----------------------------
# Some utility functions

def process_motion_vectors(mv):
    with mv.rlock():
        # Convert S10.5 format to float
        flow = np.float32(mv.cpu())/(1<<5)

    # Create an image where the motion vector angle is
    # mapped to a color hue, and intensity is proportional
    # to the vector's magnitude
    magnitude, angle = cv2.cartToPolar(flow[:,:,0], flow[:,:,1], angleInDegrees=True)

    clip = 5.0
    cv2.threshold(magnitude, clip, clip, cv2.THRESH_TRUNC, magnitude)

    # Build the HSV image
    hsv = np.ndarray([flow.shape[0], flow.shape[1], 3], np.float32)
    hsv[:,:,0] = angle
    hsv[:,:,1] = np.ones((angle.shape[0], angle.shape[1]), np.float32)
    hsv[:,:,2] = magnitude / clip

    # Convert HSV to BGR8
    bgr = cv2.cvtColor(hsv, cv2.COLOR_HSV2BGR)
    return np.uint8(bgr*255)

# ----------------------------
# Parse command line arguments

parser = ArgumentParser()
parser.add_argument('backend', choices=['nvenc'],
                    help='Backend to be used for processing')

parser.add_argument('input',
                    help='Input video to be processed')

parser.add_argument('quality', choices=['low', 'medium', 'high'],
                    help='Quality setting')

args = parser.parse_args()

assert args.backend == 'nvenc'
backend = vpi.Backend.NVENC

if args.quality == "low":
    quality = vpi.OptFlowQuality.LOW
elif args.quality == "medium":
    quality = vpi.OptFlowQuality.MEDIUM
else:
    assert args.quality == "high"
    quality = vpi.OptFlowQuality.HIGH

# -----------------------------
# Open input and output videos

inVideo = cv2.VideoCapture(args.input)

if int(cv2.__version__.split('.')[0]) >= 3:
    extOutputVideo = '.mp4'
    fourcc = cv2.VideoWriter_fourcc(*'avc1')
    inSize = (int(inVideo.get(cv2.CAP_PROP_FRAME_WIDTH)), int(inVideo.get(cv2.CAP_PROP_FRAME_HEIGHT)))
    fps = inVideo.get(cv2.CAP_PROP_FPS)
else:
    # MP4 support with OpenCV-2.4 has issues, we'll use
    # avi/mpeg instead.
    extOutputVideo = '.avi'
    fourcc = cv2.cv.CV_FOURCC('M','P','E','G')
    inSize = (int(inVideo.get(cv2.cv.CV_CAP_PROP_FRAME_WIDTH)), int(inVideo.get(cv2.cv.CV_CAP_PROP_FRAME_HEIGHT)))
    fps = inVideo.get(cv2.cv.CV_CAP_PROP_FPS)

if backend == vpi.Backend.NVENC:
    # NVENC always returns 1/4th resolution
    outSize = (inSize[0]//4, inSize[1]//4)
else:
    outSize = inSize

outVideo = cv2.VideoWriter('denseoptflow_mv_python'+str(sys.version_info[0])+'_'+args.backend+extOutputVideo,
                           fourcc, fps, outSize)

#---------------------------------
# Main processing loop

prevFrame = None

idFrame = 0
while True:
    # Read one input frame
    ret, cvFrame = inVideo.read()
    if not ret:
        break

    # Convert it to NV12_ER format to be used by VPI.
    # No single backend can convert from OpenCV's BGR8 to the NV12_ER_BL
    # required by the algorithm. We must do it in two steps using CUDA and VIC.
    curFrame = vpi.asimage(cvFrame, vpi.Format.BGR8) \
                  .convert(vpi.Format.NV12_ER, backend=vpi.Backend.CUDA) \
                  .convert(vpi.Format.NV12_ER_BL, backend=vpi.Backend.VIC)

    # Need at least 2 frames to start processing
    if prevFrame is not None:
        print("Processing frame {}".format(idFrame))

        # Calculate the motion vectors from previous to current frame
        with backend:
            motion_vectors = vpi.optflow_dense(prevFrame, curFrame, quality=quality)

        # Turn motion vectors into an image
        motion_image = process_motion_vectors(motion_vectors)

        # Save it to output video
        outVideo.write(motion_image)

    # Prepare next iteration
    prevFrame = curFrame
    idFrame += 1

# vim: ts=8:sw=4:sts=4:et:ai
C++:

#include <opencv2/core/version.hpp>
#if CV_MAJOR_VERSION >= 3
#    include <opencv2/imgcodecs.hpp>
#    include <opencv2/videoio.hpp>
#else
#    include <opencv2/highgui/highgui.hpp>
#endif

#include <opencv2/imgproc/imgproc.hpp>
#include <vpi/OpenCVInterop.hpp>

#include <vpi/Array.h>
#include <vpi/Image.h>
#include <vpi/ImageFormat.h>
#include <vpi/Pyramid.h>
#include <vpi/Status.h>
#include <vpi/Stream.h>
#include <vpi/algo/ConvertImageFormat.h>
#include <vpi/algo/OpticalFlowDense.h>

#include <iostream>
#include <sstream>

#define CHECK_STATUS(STMT)                                    \
    do                                                        \
    {                                                         \
        VPIStatus status = (STMT);                            \
        if (status != VPI_SUCCESS)                            \
        {                                                     \
            char buffer[VPI_MAX_STATUS_MESSAGE_LENGTH];       \
            vpiGetLastStatusMessage(buffer, sizeof(buffer));  \
            std::ostringstream ss;                            \
            ss << vpiStatusGetName(status) << ": " << buffer; \
            throw std::runtime_error(ss.str());               \
        }                                                     \
    } while (0);

static void ProcessMotionVector(VPIImage mvImg, cv::Mat &outputImage)
{
    // Lock the input image to access it from the CPU
    VPIImageData mvData;
    CHECK_STATUS(vpiImageLock(mvImg, VPI_LOCK_READ, &mvData));

    // Create a cv::Mat that points to the input image data
    cv::Mat mvImage;
    CHECK_STATUS(vpiImageDataExportOpenCVMat(mvData, &mvImage));

    // Convert S10.5 format to float
    cv::Mat flow(mvImage.size(), CV_32FC2);
    mvImage.convertTo(flow, CV_32F, 1.0f / (1 << 5));

    // Image not needed anymore, we can unlock it.
    CHECK_STATUS(vpiImageUnlock(mvImg));

    // Create an image where the motion vector angle is
    // mapped to a color hue, and intensity is proportional
    // to the vector's magnitude.
    cv::Mat magnitude, angle;
    {
        cv::Mat flowChannels[2];
        split(flow, flowChannels);
        cv::cartToPolar(flowChannels[0], flowChannels[1], magnitude, angle, true);
    }

    float clip = 5;
    cv::threshold(magnitude, magnitude, clip, clip, cv::THRESH_TRUNC);

    // Build the HSV image
    cv::Mat _hsv[3], hsv, bgr;
    _hsv[0] = angle;
    _hsv[1] = cv::Mat::ones(angle.size(), CV_32F);
    _hsv[2] = magnitude / clip; // intensity must vary from 0 to 1
    merge(_hsv, 3, hsv);

    cv::cvtColor(hsv, bgr, cv::COLOR_HSV2BGR);
    bgr.convertTo(outputImage, CV_8U, 255.0);
}

int main(int argc, char *argv[])
{
    // OpenCV image that will be wrapped by a VPIImage.
    // Define it here so that it's destroyed *after* the wrapper is destroyed.
    cv::Mat cvPrevFrame, cvCurFrame;

    // VPI objects that will be used
    VPIStream stream         = NULL;
    VPIImage imgPrevFramePL  = NULL;
    VPIImage imgPrevFrameTmp = NULL;
    VPIImage imgPrevFrameBL  = NULL;
    VPIImage imgCurFramePL   = NULL;
    VPIImage imgCurFrameTmp  = NULL;
    VPIImage imgCurFrameBL   = NULL;
    VPIImage imgMotionVecBL  = NULL;
    VPIPayload payload       = NULL;

    int retval = 0;

    try
    {
        if (argc != 4)
        {
            throw std::runtime_error(std::string("Usage: ") + argv[0] + " <nvenc> <input_video> <low|medium|high>");
        }

        // Parse input parameters
        std::string strBackend    = argv[1];
        std::string strInputVideo = argv[2];
        std::string strQuality    = argv[3];

        VPIOpticalFlowQuality quality;
        if (strQuality == "low")
        {
            quality = VPI_OPTICAL_FLOW_QUALITY_LOW;
        }
        else if (strQuality == "medium")
        {
            quality = VPI_OPTICAL_FLOW_QUALITY_MEDIUM;
        }
        else if (strQuality == "high")
        {
            quality = VPI_OPTICAL_FLOW_QUALITY_HIGH;
        }
        else
        {
            throw std::runtime_error("Unknown quality provided");
        }

        VPIBackend backend;
        if (strBackend == "nvenc")
        {
            backend = VPI_BACKEND_NVENC;
        }
        else
        {
            throw std::runtime_error("Backend '" + strBackend + "' not recognized, it must be nvenc.");
        }

        // Load the input video
        cv::VideoCapture invid;
        if (!invid.open(strInputVideo))
        {
            throw std::runtime_error("Can't open '" + strInputVideo + "'");
        }

        // Create the stream where processing will happen. We'll use the user-provided backend
        // for Optical Flow, and CUDA/VIC for image format conversions.
        CHECK_STATUS(vpiStreamCreate(backend | VPI_BACKEND_CUDA | VPI_BACKEND_VIC, &stream));

        // Fetch the first frame
        if (!invid.read(cvPrevFrame))
        {
            throw std::runtime_error("Cannot read frame from input video");
        }

        // Create the previous and current frame wrappers using the first frame. These wrappers will
        // be set to point to every new frame in the main loop.
        CHECK_STATUS(vpiImageCreateOpenCVMatWrapper(cvPrevFrame, 0, &imgPrevFramePL));
        CHECK_STATUS(vpiImageCreateOpenCVMatWrapper(cvPrevFrame, 0, &imgCurFramePL));

        // Define the image formats we'll use throughout this sample.
        VPIImageFormat imgFmt   = VPI_IMAGE_FORMAT_NV12_ER;
        VPIImageFormat imgFmtBL = VPI_IMAGE_FORMAT_NV12_ER_BL;

        int32_t width  = cvPrevFrame.cols;
        int32_t height = cvPrevFrame.rows;

        // Create the Dense Optical Flow payload to be executed on the given backend
        CHECK_STATUS(vpiCreateOpticalFlowDense(backend, width, height, imgFmtBL, quality, &payload));

        // The Dense Optical Flow on the NVENC backend expects the input to be in block-linear format.
        // Since the Convert Image Format algorithm doesn't currently support direct BGR
        // pitch-linear (from OpenCV) to NV12 block-linear conversion, it must be done in two
        // passes, first from BGR/PL to NV12/PL using CUDA, then from NV12/PL to NV12/BL using VIC.
        // The temporary image buffers below will store the intermediate NV12/PL representation.
        CHECK_STATUS(vpiImageCreate(width, height, imgFmt, 0, &imgPrevFrameTmp));
        CHECK_STATUS(vpiImageCreate(width, height, imgFmt, 0, &imgCurFrameTmp));

        // Now create the final block-linear buffers that'll be used as input to the
        // algorithm.
        CHECK_STATUS(vpiImageCreate(width, height, imgFmtBL, 0, &imgPrevFrameBL));
        CHECK_STATUS(vpiImageCreate(width, height, imgFmtBL, 0, &imgCurFrameBL));

        // Motion vector image width and height, aligned to be a multiple of 4
        int32_t mvWidth  = (width + 3) / 4;
        int32_t mvHeight = (height + 3) / 4;

        // The output video will be a heatmap of the motion vector image
#if CV_MAJOR_VERSION >= 3
        int fourcc = cv::VideoWriter::fourcc('a', 'v', 'c', '1');
        double fps = invid.get(cv::CAP_PROP_FPS);
        std::string extOutputVideo = ".mp4";
#else
        // MP4 support with OpenCV-2.4 has issues, we'll use
        // avi/mpeg instead.
        int fourcc = CV_FOURCC('M', 'P', 'E', 'G');
        double fps = invid.get(CV_CAP_PROP_FPS);
        std::string extOutputVideo = ".avi";
#endif

        cv::VideoWriter outVideo("denseoptflow_mv_" + strBackend + extOutputVideo, fourcc, fps,
                                 cv::Size(mvWidth, mvHeight));
        if (!outVideo.isOpened())
        {
            throw std::runtime_error("Can't create output video");
        }

        // Create the output motion vector buffer
        CHECK_STATUS(vpiImageCreate(mvWidth, mvHeight, VPI_IMAGE_FORMAT_2S16_BL, 0, &imgMotionVecBL));

        // First convert the first frame to NV12_BL. It'll be used as the previous frame when the algorithm is called.
        CHECK_STATUS(vpiSubmitConvertImageFormat(stream, VPI_BACKEND_CUDA, imgPrevFramePL, imgPrevFrameTmp, nullptr));
        CHECK_STATUS(vpiSubmitConvertImageFormat(stream, VPI_BACKEND_VIC, imgPrevFrameTmp, imgPrevFrameBL, nullptr));

        // Create an output image which holds the rendered motion vector image.
        cv::Mat mvOutputImage;

        // Fetch a new frame until the video ends
        int idxFrame = 1;
        while (invid.read(cvCurFrame))
        {
            printf("Processing frame %d\n", idxFrame++);

            // Wrap the frame into a VPIImage, reusing the existing imgCurFramePL.
            CHECK_STATUS(vpiImageSetWrappedOpenCVMat(imgCurFramePL, cvCurFrame));

            // Convert the current frame to NV12_BL format
            CHECK_STATUS(vpiSubmitConvertImageFormat(stream, VPI_BACKEND_CUDA, imgCurFramePL, imgCurFrameTmp, nullptr));
            CHECK_STATUS(vpiSubmitConvertImageFormat(stream, VPI_BACKEND_VIC, imgCurFrameTmp, imgCurFrameBL, nullptr));

            CHECK_STATUS(
                vpiSubmitOpticalFlowDense(stream, backend, payload, imgPrevFrameBL, imgCurFrameBL, imgMotionVecBL));

            // Wait for processing to finish.
            CHECK_STATUS(vpiStreamSync(stream));

            // Render the resulting motion vectors in the output image
            ProcessMotionVector(imgMotionVecBL, mvOutputImage);

            // Save to the output video
            outVideo << mvOutputImage;

            // Swap the previous and current frames for the next iteration
            std::swap(cvPrevFrame, cvCurFrame);
            std::swap(imgPrevFramePL, imgCurFramePL);
            std::swap(imgPrevFrameBL, imgCurFrameBL);
        }
    }
    catch (std::exception &e)
    {
        std::cerr << e.what() << std::endl;
        retval = 1;
    }

    // Destroy all resources used
    vpiStreamDestroy(stream);
    vpiPayloadDestroy(payload);

    vpiImageDestroy(imgPrevFramePL);
    vpiImageDestroy(imgPrevFrameTmp);
    vpiImageDestroy(imgPrevFrameBL);
    vpiImageDestroy(imgCurFramePL);
    vpiImageDestroy(imgCurFrameTmp);
    vpiImageDestroy(imgCurFrameBL);
    vpiImageDestroy(imgMotionVecBL);

    return retval;
}

// vim: ts=8:sw=4:sts=4:et:ai