Move scale and async_res variables to ThreadCtx

author Michal Sojka <michal.sojka@cvut.cz>

Tue, 11 Sep 2018 23:01:58 +0000 (01:01 +0200)

committer Michal Sojka <michal.sojka@cvut.cz>

Wed, 12 Sep 2018 05:06:44 +0000 (07:06 +0200)
author Michal Sojka <michal.sojka@cvut.cz>
Tue, 11 Sep 2018 23:01:58 +0000 (01:01 +0200)
committer Michal Sojka <michal.sojka@cvut.cz>
Wed, 12 Sep 2018 05:06:44 +0000 (07:06 +0200)
diff --git a/src/kcf.cpp b/src/kcf.cpp

index 7dacb2c20b8619c2ff5e305fad0fe315f513c584..8a1d98005dd18a00cdadee87eeac6cea7d27d062 100644 (file)
--- a/src/kcf.cpp
+++ b/src/kcf.cpp
@@ -1,7 +1,6 @@
  #include "kcf.h"
  #include <numeric>
  #include <thread>
-#include <future>
  #include <algorithm>
  
  #ifdef FFTW
@@ -321,59 +320,45 @@ void KCF_Tracker::track(cv::Mat &img)
      }
  
      double max_response = -1.;
-    uint scale_index = 0;
+    ThreadCtx *max = nullptr;
      cv::Point2i *max_response_pt = nullptr;
      cv::Mat *max_response_map = nullptr;
  
-    if (m_use_multithreading) {
-        std::vector<std::future<void>> async_res(p_scales.size());
-        for (auto it = p_threadctxs.begin(); it != p_threadctxs.end(); ++it) {
-            uint index = uint(std::distance(p_threadctxs.begin(), it));
-            async_res[index] = std::async(std::launch::async, [this, &input_gray, &input_rgb, index, it]() -> void {
-                return scale_track(*it, input_rgb, input_gray, this->p_scales[index]);
-            });
-        }
-        for (auto it = p_threadctxs.begin(); it != p_threadctxs.end(); ++it) {
-            uint index = uint(std::distance(p_threadctxs.begin(), it));
-            async_res[index].wait();
-            if (it->max_response > max_response) {
-                max_response = it->max_response;
-                max_response_pt = &it->max_loc;
-                max_response_map = &it->response;
-                scale_index = index;
-            }
+#ifdef ASYNC
+    for (auto &it : p_threadctxs)
+        it.async_res = std::async(std::launch::async, [this, &input_gray, &input_rgb, &it]() -> void {
+            scale_track(it, input_rgb, input_gray);
+        });
+    for (auto const &it : p_threadctxs)
+        it.async_res.wait();
+
+#else  // !ASYNC
+    // FIXME: Iterate correctly in big batch mode - perhaps have only one element in the list
+    NORMAL_OMP_PARALLEL_FOR
+    for (uint i = 0; i < p_threadctxs.size(); ++i)
+        scale_track(p_threadctxs[i], input_rgb, input_gray);
+#endif
+
+#ifndef BIG_BATCH
+    for (auto &it : p_threadctxs) {
+        if (it.max_response > max_response) {
+            max_response = it.max_response;
+            max_response_pt = &it.max_loc;
+            max_response_map = &it.response;
+            max = &it;
          }
-    } else {
-        uint start = m_use_big_batch ? 1 : 0;
-        uint end = m_use_big_batch ? 2 : uint(p_num_scales);
-        NORMAL_OMP_PARALLEL_FOR
-        for (uint i = start; i < end; ++i) {
-            auto it = p_threadctxs.begin();
-            std::advance(it, i);
-            scale_track(*it, input_rgb, input_gray, this->p_scales[i]);
-
-            if (m_use_big_batch) {
-                for (size_t j = 0; j < p_scales.size(); ++j) {
-                    if (it->max_responses[j] > max_response) {
-                        max_response = it->max_responses[j];
-                        max_response_pt = &it->max_locs[j];
-                        max_response_map = &it->response_maps[j];
-                        scale_index = j;
-                    }
-                }
-            } else {
-                NORMAL_OMP_CRITICAL
-                {
-                    if (it->max_response > max_response) {
-                        max_response = it->max_response;
-                        max_response_pt = &it->max_loc;
-                        max_response_map = &it->response;
-                        scale_index = i;
-                    }
-                }
-            }
+    }
+#else
+    // FIXME: Iterate correctly in big batch mode - perhaps have only one element in the list
+    for (uint j = 0; j < p_scales.size(); ++j) {
+        if (p_threadctxs[0].max_responses[j] > max_response) {
+            max_response = p_threadctxs[0].max_responses[j];
+            max_response_pt = &p_threadctxs[0].max_locs[j];
+            max_response_map = &p_threadctxs[0].response_maps[j];
+            max = &p_threadctxs[0];
          }
      }
+#endif
  
      DEBUG_PRINTM(*max_response_map);
      DEBUG_PRINT(*max_response_pt);
@@ -406,11 +391,13 @@ void KCF_Tracker::track(cv::Mat &img)
      }
  
      // sub grid scale interpolation
-    double new_scale = p_scales[scale_index];
-    if (m_use_subgrid_scale)
-        new_scale = sub_grid_scale(scale_index);
+    if (m_use_subgrid_scale) {
+        auto it = std::find_if(p_threadctxs.begin(), p_threadctxs.end(), [max](ThreadCtx &ctx) { return &ctx == max; });
+        p_current_scale *= sub_grid_scale(std::distance(p_threadctxs.begin(), it));
+    } else {
+        p_current_scale *= max->scale;
+    }
  
-    p_current_scale *= new_scale;
  
      if (p_current_scale < p_min_max_scale[0]) p_current_scale = p_min_max_scale[0];
      if (p_current_scale > p_min_max_scale[1]) p_current_scale = p_min_max_scale[1];
@@ -455,7 +442,7 @@ void KCF_Tracker::track(cv::Mat &img)
  #endif
  }
  
-void KCF_Tracker::scale_track(ThreadCtx &vars, cv::Mat &input_rgb, cv::Mat &input_gray, double scale)
+void KCF_Tracker::scale_track(ThreadCtx &vars, cv::Mat &input_rgb, cv::Mat &input_gray)
  {
      if (m_use_big_batch) {
          vars.patch_feats.clear();
@@ -467,7 +454,7 @@ void KCF_Tracker::scale_track(ThreadCtx &vars, cv::Mat &input_rgb, cv::Mat &inpu
      } else {
          vars.patch_feats.clear();
          get_features(input_rgb, input_gray, int(this->p_pose.cx), int(this->p_pose.cy), this->p_windows_size.width,
-                     this->p_windows_size.height, vars, this->p_current_scale *scale);
+                     this->p_windows_size.height, vars, this->p_current_scale * vars.scale);
      }
  
      fft.forward_window(vars.patch_feats, vars.zf, vars.fw_all, m_use_cuda ? vars.data_features.deviceMem() : nullptr,
@@ -516,7 +503,7 @@ void KCF_Tracker::scale_track(ThreadCtx &vars, cv::Mat &input_rgb, cv::Mat &inpu
  
          DEBUG_PRINT(vars.max_loc);
  
-        double weight = scale < 1. ? scale : 1. / scale;
+        double weight = vars.scale < 1. ? vars.scale : 1. / vars.scale;
          vars.max_response = vars.max_val * weight;
      }
      return;
diff --git a/src/kcf.h b/src/kcf.h

index 23ff04b8ba16a43716a1bb903aa6c9866f980691..044934592a8e1210bec435c2dc32a834c92c5917 100644 (file)
--- a/src/kcf.h
+++ b/src/kcf.h
@@ -142,7 +142,7 @@ private:
      ComplexMat p_model_xf;
      ComplexMat p_xf;
      //helping functions
-    void scale_track(ThreadCtx & vars, cv::Mat & input_rgb, cv::Mat & input_gray, double scale);
+    void scale_track(ThreadCtx & vars, cv::Mat & input_rgb, cv::Mat & input_gray);
      cv::Mat get_subwindow(const cv::Mat & input, int cx, int cy, int size_x, int size_y);
      cv::Mat gaussian_shaped_labels(double sigma, int dim1, int dim2);
      void gaussian_correlation(struct ThreadCtx &vars, const ComplexMat & xf, const ComplexMat & yf, double sigma, bool auto_correlation = false);
diff --git a/src/threadctx.hpp b/src/threadctx.hpp

index dc6921c14f1c28de254beb95f161253e90e22459..c4bb5356484925b34a5871ba6e134bd69812ff86 100644 (file)
--- a/src/threadctx.hpp
+++ b/src/threadctx.hpp
@@ -1,6 +1,7 @@
  #ifndef SCALE_VARS_HPP
  #define SCALE_VARS_HPP
  
+#include <future>
  #include "dynmem.hpp"
  
  #ifdef CUFFT
@@ -15,7 +16,8 @@ typedef int *cudaStream_t;
  
  struct ThreadCtx {
    public:
-    ThreadCtx(cv::Size windows_size, uint cell_size, uint num_of_feats, uint num_of_scales = 1)
+    ThreadCtx(cv::Size windows_size, uint cell_size, uint num_of_feats, double scale, uint num_of_scales = 1)
+        : scale(scale)
      {
          this->xf_sqr_norm = DynMem(num_of_scales * sizeof(float));
          this->yf_sqr_norm = DynMem(sizeof(float));
@@ -80,6 +82,11 @@ struct ThreadCtx {
  #endif
      }
  
+    const double scale;
+#ifdef ASYNC
+    std::future<void> async_res;
+#endif
+
      DynMem xf_sqr_norm, yf_sqr_norm;
      std::vector<cv::Mat> patch_feats;
author	Michal Sojka <michal.sojka@cvut.cz>
	Tue, 11 Sep 2018 23:01:58 +0000 (01:01 +0200)
committer	Michal Sojka <michal.sojka@cvut.cz>
	Wed, 12 Sep 2018 05:06:44 +0000 (07:06 +0200)
src/kcf.cpp		patch | blob | history
src/kcf.h		patch | blob | history
src/threadctx.hpp		patch | blob | history