Overview

This application fetches frames from an input video source, runs the background subtraction algorithm on each frame, and calculates the foreground mask and the background image estimate. Both outputs are saved to video files.

Instructions

The command line parameters are:

<backend> <input video>

where

backend: Defines the backend that will perform the processing. Only cpu and cuda are currently supported.
input video: Input video file name. It accepts .mp4, .avi and possibly other formats, depending on OpenCV's support.

Here's one example:

C++
./vpi_sample_14_background_subtractor cpu ../assets/pedestrians.mp4
Python
python main.py cpu ../assets/pedestrians.mp4

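The C++ application will process pedestrians.mp4 and create fgmask_cpu.mp4 and bgimage_cpu.mp4. The Python script names its outputs fgmask_pythonN_cpu.mp4 and bgimage_pythonN_cpu.mp4, where N is the major version of the Python interpreter.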

Note: If using OpenCV-2.4 or older (i.e. on Ubuntu 16.04), the output files use the .avi extension instead, e.g. fgmask_cpu.avi and bgimage_cpu.avi.

Results

Input video	Foreground video	Background video

Source Code

For convenience, here's the code that is also installed in the samples directory.

Language: C++ Python

 import cv2
 import sys
 import vpi
 import numpy as np
 from argparse import ArgumentParser
  
 # ----------------------------
 # Parse command line arguments
  
 parser = ArgumentParser()
 parser.add_argument('backend', choices=['cpu','cuda'],
                     help='Backend to be used for processing')
  
 parser.add_argument('input',
                     help='Input video to be denoised')
  
 args = parser.parse_args();
  
 if args.backend == 'cuda':
     backend = vpi.Backend.CUDA
 else:
     assert args.backend == 'cpu'
     backend = vpi.Backend.CPU
  
 # -----------------------------
 # Open input and output videos
  
 inVideo = cv2.VideoCapture(args.input)
  
 if int(cv2.__version__.split('.')[0]) >= 3:
     extOutputVideo = '.mp4'
     fourcc = cv2.VideoWriter_fourcc(*'avc1')
     inSize = (int(inVideo.get(cv2.CAP_PROP_FRAME_WIDTH)), int(inVideo.get(cv2.CAP_PROP_FRAME_HEIGHT)))
     fps = inVideo.get(cv2.CAP_PROP_FPS)
 else:
     # MP4 support with OpenCV-2.4 has issues, we'll use
     # avi/mpeg instead.
     extOutputVideo = '.avi'
     fourcc = cv2.cv.CV_FOURCC('M','P','E','G')
     inSize = (int(inVideo.get(cv2.cv.CV_CAP_PROP_FRAME_WIDTH)), int(inVideo.get(cv2.cv.CV_CAP_PROP_FRAME_HEIGHT)))
     fps = inVideo.get(cv2.cv.CV_CAP_PROP_FPS)
  
 outVideoFGMask = cv2.VideoWriter('fgmask_python'+str(sys.version_info[0])+'_'+args.backend+extOutputVideo,
                                  fourcc, fps, inSize)
  
 outVideoBGImage = cv2.VideoWriter('bgimage_python'+str(sys.version_info[0])+'_'+args.backend+extOutputVideo,
                                   fourcc, fps, inSize)
  
 #--------------------------------------------------------------
 # Create the Background Subtractor object using the backend specified by the user
 with backend:
     bgsub = vpi.BackgroundSubtractor(inSize, vpi.Format.BGR8)
  
 #--------------------------------------------------------------
 # Main processing loop
 idxFrame = 0
 while True:
     print("Processing frame {}".format(idxFrame))
     idxFrame+=1
  
     # Read one input frame
     ret, cvFrame = inVideo.read()
     if not ret:
         break
  
     # Get the foreground mask and background image estimates
     fgmask, bgimage = bgsub(vpi.asimage(cvFrame, vpi.Format.BGR8), learnrate=0.01)
  
     # Mask needs to be converted to BGR8 for output
     fgmask = fgmask.convert(vpi.Format.BGR8, backend=vpi.Backend.CUDA);
  
     # Write images to output videos
     with fgmask.rlock(), bgimage.rlock():
         outVideoFGMask.write(fgmask.cpu())
         outVideoBGImage.write(bgimage.cpu())
  
 # vim: ts=8:sw=4:sts=4:et:ai

 #include <opencv2/core/version.hpp>
 #if CV_MAJOR_VERSION >= 3
 #    include <opencv2/imgcodecs.hpp>
 #    include <opencv2/videoio.hpp>
 #else
 #    include <opencv2/highgui/highgui.hpp>
 #endif
  
 #include <opencv2/imgproc/imgproc.hpp>
 #include <vpi/OpenCVInterop.hpp>
  
 #include <vpi/Array.h>
 #include <vpi/Image.h>
 #include <vpi/ImageFormat.h>
 #include <vpi/Pyramid.h>
 #include <vpi/Status.h>
 #include <vpi/Stream.h>
 #include <vpi/algo/BackgroundSubtractor.h>
 #include <vpi/algo/ConvertImageFormat.h>
  
 #include <cstdint>
 #include <cstdio>
 #include <iostream>
 #include <sstream>
 #include <stdexcept>
 #include <string>
  
 #define CHECK_STATUS(STMT)                                    \
     do                                                        \
     {                                                         \
         VPIStatus status = (STMT);                            \
         if (status != VPI_SUCCESS)                            \
         {                                                     \
             char buffer[VPI_MAX_STATUS_MESSAGE_LENGTH];       \
             vpiGetLastStatusMessage(buffer, sizeof(buffer));  \
             std::ostringstream ss;                            \
             ss << vpiStatusGetName(status) << ": " << buffer; \
             throw std::runtime_error(ss.str());               \
         }                                                     \
     } while (0);
  
 int main(int argc, char *argv[])
 {
     // OpenCV image that will be wrapped by a VPIImage.
     // Define it here so that it's destroyed *after* wrapper is destroyed
     cv::Mat cvCurFrame;
  
     // VPI objects that will be used
     VPIStream stream     = NULL;
     VPIImage imgCurFrame = NULL;
     VPIImage bgimage     = NULL;
     VPIImage fgmask      = NULL;
     VPIPayload payload   = NULL;
  
     int retval = 0;
  
     try
     {
         if (argc != 3)
         {
             throw std::runtime_error(std::string("Usage: ") + argv[0] + " <cpu|cuda> <input_video>");
         }
  
         // Parse input parameters
         std::string strBackend    = argv[1];
         std::string strInputVideo = argv[2];
  
         VPIBackend backend;
         if (strBackend == "cpu")
         {
             backend = VPI_BACKEND_CPU;
         }
         else if (strBackend == "cuda")
         {
             backend = VPI_BACKEND_CUDA;
         }
         else
         {
             throw std::runtime_error("Backend '" + strBackend + "' not recognized.");
         }
  
         // Load the input video
         cv::VideoCapture invid;
         if (!invid.open(strInputVideo))
         {
             throw std::runtime_error("Can't open '" + strInputVideo + "'");
         }
  
 #if CV_MAJOR_VERSION >= 3
         int32_t width  = invid.get(cv::CAP_PROP_FRAME_WIDTH);
         int32_t height = invid.get(cv::CAP_PROP_FRAME_HEIGHT);
  
         int fourcc                 = cv::VideoWriter::fourcc('a', 'v', 'c', '1');
         double fps                 = invid.get(cv::CAP_PROP_FPS);
         std::string extOutputVideo = ".mp4";
 #else
         int32_t width  = invid.get(CV_CAP_PROP_FRAME_WIDTH);
         int32_t height = invid.get(CV_CAP_PROP_FRAME_HEIGHT);
  
         // MP4 support with OpenCV-2.4 has issues, we'll use
         // avi/mpeg instead.
         int fourcc                 = CV_FOURCC('M', 'P', 'E', 'G');
         double fps                 = invid.get(CV_CAP_PROP_FPS);
         std::string extOutputVideo = ".avi";
 #endif
  
         // Create the stream where processing will happen. We'll use user-provided backend.
         CHECK_STATUS(vpiStreamCreate(backend, &stream));
  
         // Create background subtractor payload to be executed on the given backend
         // OpenCV delivers us BGR8 images, so the algorithm is configured to accept that.
         CHECK_STATUS(vpiCreateBackgroundSubtractor(backend, width, height, VPI_IMAGE_FORMAT_BGR8, &payload));
  
         // Create foreground image
         CHECK_STATUS(vpiImageCreate(width, height, VPI_IMAGE_FORMAT_U8, 0, &fgmask));
  
         // Create background image
         CHECK_STATUS(vpiImageCreate(width, height, VPI_IMAGE_FORMAT_BGR8, 0, &bgimage));
  
         cv::VideoWriter outVideo("fgmask_" + strBackend + extOutputVideo, fourcc, fps, cv::Size(width, height), false);
         if (!outVideo.isOpened())
         {
             throw std::runtime_error("Can't create output video");
         }
  
         cv::VideoWriter bgimageVideo("bgimage_" + strBackend + extOutputVideo, fourcc, fps, cv::Size(width, height));
         if (!outVideo.isOpened())
         {
             throw std::runtime_error("Can't create output video");
         }
  
         // Fetch a new frame until video ends
         int idxFrame = 1;
  
         while (invid.read(cvCurFrame))
         {
             printf("Processing frame %d\n", idxFrame++);
             // Wrap frame into a VPIImage
             if (imgCurFrame == NULL)
             {
                 CHECK_STATUS(vpiImageCreateOpenCVMatWrapper(cvCurFrame, 0, &imgCurFrame));
             }
             else
             {
                 CHECK_STATUS(vpiImageSetWrappedOpenCVMat(imgCurFrame, cvCurFrame));
             }
  
             VPIBackgroundSubtractorParams params;
             CHECK_STATUS(vpiInitBackgroundSubtractorParams(&params));
             params.learningRate = 0.01;
  
             CHECK_STATUS(
                 vpiSubmitBackgroundSubtractor(stream, backend, payload, imgCurFrame, fgmask, bgimage, &params));
  
             // Wait for processing to finish.
             CHECK_STATUS(vpiStreamSync(stream));
  
             {
                 // Now add it to the output video stream
                 VPIImageData imgdata;
                 CHECK_STATUS(vpiImageLock(fgmask, VPI_LOCK_READ, &imgdata));
  
                 cv::Mat outFrame;
                 CHECK_STATUS(vpiImageDataExportOpenCVMat(imgdata, &outFrame));
  
                 outVideo << outFrame;
  
                 CHECK_STATUS(vpiImageUnlock(fgmask));
             }
  
             {
                 VPIImageData bgdata;
                 CHECK_STATUS(vpiImageLock(bgimage, VPI_LOCK_READ, &bgdata));
  
                 cv::Mat outFrame;
                 CHECK_STATUS(vpiImageDataExportOpenCVMat(bgdata, &outFrame));
  
                 bgimageVideo << outFrame;
  
                 CHECK_STATUS(vpiImageUnlock(bgimage));
             }
         }
     }
     catch (std::exception &e)
     {
         std::cerr << e.what() << std::endl;
         retval = 1;
     }
  
     // Destroy all resources used
     vpiStreamDestroy(stream);
     vpiPayloadDestroy(payload);
  
     vpiImageDestroy(imgCurFrame);
     vpiImageDestroy(fgmask);
     vpiImageDestroy(bgimage);
  
     return retval;
 }
  
 // vim: ts=8:sw=4:sts=4:et:ai

VPI - Vision Programming Interface

1.2 Release

Overview

Instructions

Results

Source Code