Merge pull request #7873 from addisonElliott:Mat_Range_InitializerList

[platform/upstream/opencv.git] / samples / gpu / hog.cpp
diff --git a/samples/gpu/hog.cpp b/samples/gpu/hog.cpp

index 59ea44f..8f857da 100644 (file)
--- a/samples/gpu/hog.cpp
+++ b/samples/gpu/hog.cpp
@@ -5,7 +5,7 @@
  #include <iomanip>
  #include <stdexcept>
  #include <opencv2/core/utility.hpp>
-#include "opencv2/cuda.hpp"
+#include "opencv2/cudaobjdetect.hpp"
  #include "opencv2/highgui.hpp"
  #include "opencv2/objdetect.hpp"
  #include "opencv2/imgproc.hpp"
@@ -22,10 +22,14 @@ public:
      static Args read(int argc, char** argv);
  
      string src;
+    bool src_is_folder;
      bool src_is_video;
      bool src_is_camera;
      int camera_id;
  
+    bool svm_load;
+    string svm;
+
      bool write_video;
      string dst_video;
      double dst_video_fps;
@@ -44,6 +48,10 @@ public:
  
      int win_width;
      int win_stride_width, win_stride_height;
+    int block_width;
+    int block_stride_width, block_stride_height;
+    int cell_width;
+    int nbins;
  
      bool gamma_corr;
  };
@@ -93,6 +101,9 @@ static void printHelp()
      cout << "Histogram of Oriented Gradients descriptor and detector sample.\n"
           << "\nUsage: hog_gpu\n"
           << "  (<image>|--video <vide>|--camera <camera_id>) # frames source\n"
+         << "  or"
+         << "  (--folder <folder_path>) # load images from folder\n"
+         << "  [--svm <file> # load svm file"
           << "  [--make_gray <true/false>] # convert image to gray one or not\n"
           << "  [--resize_src <true/false>] # do resize of the source image or not\n"
           << "  [--width <int>] # resized image width\n"
@@ -100,9 +111,14 @@ static void printHelp()
           << "  [--hit_threshold <double>] # classifying plane distance threshold (0.0 usually)\n"
           << "  [--scale <double>] # HOG window scale factor\n"
           << "  [--nlevels <int>] # max number of HOG window scales\n"
-         << "  [--win_width <int>] # width of the window (48 or 64)\n"
+         << "  [--win_width <int>] # width of the window\n"
           << "  [--win_stride_width <int>] # distance by OX axis between neighbour wins\n"
           << "  [--win_stride_height <int>] # distance by OY axis between neighbour wins\n"
+         << "  [--block_width <int>] # width of the block\n"
+         << "  [--block_stride_width <int>] # distance by 0X axis between neighbour blocks\n"
+         << "  [--block_stride_height <int>] # distance by 0Y axis between neighbour blocks\n"
+         << "  [--cell_width <int>] # width of the cell\n"
+         << "  [--nbins <int>] # number of bins\n"
           << "  [--gr_threshold <int>] # merging similar rects constant\n"
           << "  [--gamma_correct <int>] # do gamma correction or not\n"
           << "  [--write_video <bool>] # write video or not\n"
@@ -115,11 +131,19 @@ int main(int argc, char** argv)
  {
      try
      {
+        Args args;
          if (argc < 2)
+        {
              printHelp();
-        Args args = Args::read(argc, argv);
-        if (help_showed)
-            return -1;
+            args.camera_id = 0;
+            args.src_is_camera = true;
+        }
+        else
+        {
+            args = Args::read(argc, argv);
+            if (help_showed)
+                return -1;
+        }
          App app(args);
          app.run();
      }
@@ -134,6 +158,8 @@ Args::Args()
  {
      src_is_video = false;
      src_is_camera = false;
+    src_is_folder = false;
+    svm_load = false;
      camera_id = 0;
  
      write_video = false;
@@ -154,6 +180,11 @@ Args::Args()
      win_width = 48;
      win_stride_width = 8;
      win_stride_height = 8;
+    block_width = 16;
+    block_stride_width = 8;
+    block_stride_height = 8;
+    cell_width = 8;
+    nbins = 9;
  
      gamma_corr = true;
  }
@@ -178,6 +209,11 @@ Args Args::read(int argc, char** argv)
          else if (string(argv[i]) == "--win_width") args.win_width = atoi(argv[++i]);
          else if (string(argv[i]) == "--win_stride_width") args.win_stride_width = atoi(argv[++i]);
          else if (string(argv[i]) == "--win_stride_height") args.win_stride_height = atoi(argv[++i]);
+        else if (string(argv[i]) == "--block_width") args.block_width = atoi(argv[++i]);
+        else if (string(argv[i]) == "--block_stride_width") args.block_stride_width = atoi(argv[++i]);
+        else if (string(argv[i]) == "--block_stride_height") args.block_stride_height = atoi(argv[++i]);
+        else if (string(argv[i]) == "--cell_width") args.cell_width = atoi(argv[++i]);
+        else if (string(argv[i]) == "--nbins") args.nbins = atoi(argv[++i]);
          else if (string(argv[i]) == "--gr_threshold") args.gr_threshold = atoi(argv[++i]);
          else if (string(argv[i]) == "--gamma_correct") args.gamma_corr = (string(argv[++i]) == "true");
          else if (string(argv[i]) == "--write_video") args.write_video = (string(argv[++i]) == "true");
@@ -186,6 +222,8 @@ Args Args::read(int argc, char** argv)
          else if (string(argv[i]) == "--help") printHelp();
          else if (string(argv[i]) == "--video") { args.src = argv[++i]; args.src_is_video = true; }
          else if (string(argv[i]) == "--camera") { args.camera_id = atoi(argv[++i]); args.src_is_camera = true; }
+        else if (string(argv[i]) == "--folder") { args.src = argv[++i]; args.src_is_folder = true;}
+        else if (string(argv[i]) == "--svm") { args.svm = argv[++i]; args.svm_load = true;}
          else if (args.src.empty()) args.src = argv[i];
          else throw runtime_error((string("unknown key: ") + argv[i]));
      }
@@ -220,16 +258,17 @@ App::App(const Args& s)
  
      gamma_corr = args.gamma_corr;
  
-    if (args.win_width != 64 && args.win_width != 48)
-        args.win_width = 64;
-
      cout << "Scale: " << scale << endl;
      if (args.resize_src)
          cout << "Resized source: (" << args.width << ", " << args.height << ")\n";
      cout << "Group threshold: " << gr_threshold << endl;
      cout << "Levels number: " << nlevels << endl;
-    cout << "Win width: " << args.win_width << endl;
+    cout << "Win size: (" << args.win_width << ", " << args.win_width*2 << ")\n";
      cout << "Win stride: (" << args.win_stride_width << ", " << args.win_stride_height << ")\n";
+    cout << "Block size: (" << args.block_width << ", " << args.block_width << ")\n";
+    cout << "Block stride: (" << args.block_stride_width << ", " << args.block_stride_height << ")\n";
+    cout << "Cell size: (" << args.cell_width << ", " << args.cell_width << ")\n";
+    cout << "Bins number: " << args.nbins << endl;
      cout << "Hit threshold: " << hit_threshold << endl;
      cout << "Gamma correction: " << gamma_corr << endl;
      cout << endl;
@@ -241,28 +280,58 @@ void App::run()
      running = true;
      cv::VideoWriter video_writer;
  
-    Size win_size(args.win_width, args.win_width * 2); //(64, 128) or (48, 96)
      Size win_stride(args.win_stride_width, args.win_stride_height);
+    Size win_size(args.win_width, args.win_width * 2);
+    Size block_size(args.block_width, args.block_width);
+    Size block_stride(args.block_stride_width, args.block_stride_height);
+    Size cell_size(args.cell_width, args.cell_width);
+
+    cv::Ptr<cv::cuda::HOG> gpu_hog = cv::cuda::HOG::create(win_size, block_size, block_stride, cell_size, args.nbins);
+    cv::HOGDescriptor cpu_hog(win_size, block_size, block_stride, cell_size, args.nbins);
+
+    if(args.svm_load) {
+        std::vector<float> svm_model;
+        const std::string model_file_name = args.svm;
+        FileStorage ifs(model_file_name, FileStorage::READ);
+        if (ifs.isOpened()) {
+            ifs["svm_detector"] >> svm_model;
+        } else {
+            const std::string what =
+                    "could not load model for hog classifier from file: "
+                    + model_file_name;
+            throw std::runtime_error(what);
+        }
+
+        // check if the variables are initialized
+        if (svm_model.empty()) {
+            const std::string what =
+                    "HoG classifier: svm model could not be loaded from file"
+                    + model_file_name;
+            throw std::runtime_error(what);
+        }
+
+        gpu_hog->setSVMDetector(svm_model);
+        cpu_hog.setSVMDetector(svm_model);
+    } else {
+        // Create HOG descriptors and detectors here
+        Mat detector = gpu_hog->getDefaultPeopleDetector();
  
-    // Create HOG descriptors and detectors here
-    vector<float> detector;
-    if (win_size == Size(64, 128))
-        detector = cv::cuda::HOGDescriptor::getPeopleDetector64x128();
-    else
-        detector = cv::cuda::HOGDescriptor::getPeopleDetector48x96();
-
-    cv::cuda::HOGDescriptor gpu_hog(win_size, Size(16, 16), Size(8, 8), Size(8, 8), 9,
-                                   cv::cuda::HOGDescriptor::DEFAULT_WIN_SIGMA, 0.2, gamma_corr,
-                                   cv::cuda::HOGDescriptor::DEFAULT_NLEVELS);
-    cv::HOGDescriptor cpu_hog(win_size, Size(16, 16), Size(8, 8), Size(8, 8), 9, 1, -1,
-                              HOGDescriptor::L2Hys, 0.2, gamma_corr, cv::HOGDescriptor::DEFAULT_NLEVELS);
-    gpu_hog.setSVMDetector(detector);
-    cpu_hog.setSVMDetector(detector);
+        gpu_hog->setSVMDetector(detector);
+        cpu_hog.setSVMDetector(detector);
+    }
+
+    cout << "gpusvmDescriptorSize : " << gpu_hog->getDescriptorSize()
+         << endl;
+    cout << "cpusvmDescriptorSize : " << cpu_hog.getDescriptorSize()
+         << endl;
  
      while (running)
      {
          VideoCapture vc;
          Mat frame;
+        vector<String> filenames;
+
+        unsigned int count = 1;
  
          if (args.src_is_video)
          {
@@ -271,6 +340,14 @@ void App::run()
                  throw runtime_error(string("can't open video file: " + args.src));
              vc >> frame;
          }
+        else if (args.src_is_folder) {
+            String folder = args.src;
+            cout << folder << endl;
+            glob(folder, filenames);
+            frame = imread(filenames[count]);  // 0 --> .gitignore
+            if (!frame.data)
+                cerr << "Problem loading image from folder!!!" << endl;
+        }
          else if (args.src_is_camera)
          {
              vc.open(args.camera_id);
@@ -307,9 +384,6 @@ void App::run()
              else img = img_aux;
              img_to_show = img;
  
-            gpu_hog.nlevels = nlevels;
-            cpu_hog.nlevels = nlevels;
-
              vector<Rect> found;
  
              // Perform HOG classification
@@ -317,11 +391,19 @@ void App::run()
              if (use_gpu)
              {
                  gpu_img.upload(img);
-                gpu_hog.detectMultiScale(gpu_img, found, hit_threshold, win_stride,
+                gpu_hog->setNumLevels(nlevels);
+                gpu_hog->setHitThreshold(hit_threshold);
+                gpu_hog->setWinStride(win_stride);
+                gpu_hog->setScaleFactor(scale);
+                gpu_hog->setGroupThreshold(gr_threshold);
+                gpu_hog->detectMultiScale(gpu_img, found);
+            }
+            else
+            {
+                cpu_hog.nlevels = nlevels;
+                cpu_hog.detectMultiScale(img, found, hit_threshold, win_stride,
                                           Size(0, 0), scale, gr_threshold);
              }
-            else cpu_hog.detectMultiScale(img, found, hit_threshold, win_stride,
-                                          Size(0, 0), scale, gr_threshold);
              hogWorkEnd();
  
              // Draw positive classified windows
@@ -335,11 +417,20 @@ void App::run()
                  putText(img_to_show, "Mode: GPU", Point(5, 25), FONT_HERSHEY_SIMPLEX, 1., Scalar(255, 100, 0), 2);
              else
                  putText(img_to_show, "Mode: CPU", Point(5, 25), FONT_HERSHEY_SIMPLEX, 1., Scalar(255, 100, 0), 2);
-            putText(img_to_show, "FPS (HOG only): " + hogWorkFps(), Point(5, 65), FONT_HERSHEY_SIMPLEX, 1., Scalar(255, 100, 0), 2);
-            putText(img_to_show, "FPS (total): " + workFps(), Point(5, 105), FONT_HERSHEY_SIMPLEX, 1., Scalar(255, 100, 0), 2);
+            putText(img_to_show, "FPS HOG: " + hogWorkFps(), Point(5, 65), FONT_HERSHEY_SIMPLEX, 1., Scalar(255, 100, 0), 2);
+            putText(img_to_show, "FPS total: " + workFps(), Point(5, 105), FONT_HERSHEY_SIMPLEX, 1., Scalar(255, 100, 0), 2);
              imshow("opencv_gpu_hog", img_to_show);
  
              if (args.src_is_video || args.src_is_camera) vc >> frame;
+            if (args.src_is_folder) {
+                count++;
+                if (count < filenames.size()) {
+                    frame = imread(filenames[count]);
+                } else {
+                    Mat empty;
+                    frame = empty;
+                }
+            }
  
              workEnd();