]> rtime.felk.cvut.cz Git - hercules2020/kcf.git/blobdiff - main_vot.cpp
Simplify scale initialization
[hercules2020/kcf.git] / main_vot.cpp
index 1af98e8663a87ad975318d90099ce4adc3eff2ab..3a846e86af00aa4999de8d8c4e904781596c6f97 100644 (file)
@@ -2,10 +2,36 @@
 #include <getopt.h>
 #include <libgen.h>
 #include <unistd.h>
+#include <iomanip>
 
 #include "kcf.h"
 #include "vot.hpp"
 
+double calcAccuracy(std::string line, cv::Rect bb_rect, cv::Rect &groundtruth_rect)
+{
+    std::vector<float> numbers;
+    std::istringstream s(line);
+    float x;
+    char ch;
+
+    while (s >> x) {
+        numbers.push_back(x);
+        s >> ch;
+    }
+    double x1 = std::min(numbers[0], std::min(numbers[2], std::min(numbers[4], numbers[6])));
+    double x2 = std::max(numbers[0], std::max(numbers[2], std::max(numbers[4], numbers[6])));
+    double y1 = std::min(numbers[1], std::min(numbers[3], std::min(numbers[5], numbers[7])));
+    double y2 = std::max(numbers[1], std::max(numbers[3], std::max(numbers[5], numbers[7])));
+
+    groundtruth_rect = cv::Rect(x1, y1, x2 - x1, y2 - y1);
+
+    double rects_intersection = (groundtruth_rect & bb_rect).area();
+    double rects_union = (groundtruth_rect | bb_rect).area();
+    double accuracy = rects_intersection / rects_union;
+
+    return accuracy;
+}
+
 int main(int argc, char *argv[])
 {
     //load region, images and prepare for output
@@ -24,8 +50,7 @@ int main(int argc, char *argv[])
             {0,           0,                 0,  0 }
         };
 
-        int c = getopt_long(argc, argv, "dhv::f::o:",
-                        long_options, &option_index);
+        int c = getopt_long(argc, argv, "dhv::f::o:", long_options, &option_index);
         if (c == -1)
             break;
 
@@ -59,7 +84,7 @@ int main(int argc, char *argv[])
             sizes.erase(0, pos + delimiter.length());
 
             fit_size_x = stol(first_argument);
-           fit_size_y = stol(sizes);
+            fit_size_y = stol(sizes);
             break;
         }
     }
@@ -95,12 +120,9 @@ int main(int argc, char *argv[])
     }
     VOT vot_io(region, images, output);
 
-// if groundtruth.txt is used use intersection over union (IOU) to calculate tracker accuracy
-    bool use_iou = false;
+    // if groundtruth.txt is used use intersection over union (IOU) to calculate tracker accuracy
     std::ifstream groundtruth_stream;
     if (region.compare("groundtruth.txt") == 0) {
-        std::cout << region << std::endl;
-        use_iou = true;
         groundtruth_stream.open(region.c_str());
         std::string line;
         std::getline(groundtruth_stream, line);
@@ -116,14 +138,18 @@ int main(int argc, char *argv[])
     tracker.init(image, init_rect, fit_size_x, fit_size_y);
 
     BBox_c bb;
-    cv::Rect bb_rect, groundtruth_rect;
-    double avg_time = 0., avg_inter = 0.;
+    cv::Rect bb_rect;
+    double avg_time = 0., sum_accuracy = 0.;
     int frames = 0;
+
+    std::cout << std::fixed << std::setprecision(2);
+
     while (vot_io.getNextImage(image) == 1){
         double time_profile_counter = cv::getCPUTickCount();
         tracker.track(image);
         time_profile_counter = cv::getCPUTickCount() - time_profile_counter;
-         std::cout << "  -> speed : " <<  time_profile_counter/((double)cvGetTickFrequency()*1000) << "ms. per frame" << std::endl;
+         std::cout << "  -> speed : " <<  time_profile_counter/((double)cvGetTickFrequency()*1000) << "ms per frame, "
+                      "response : " << tracker.getFilterResponse();
         avg_time += time_profile_counter/((double)cvGetTickFrequency()*1000);
         frames++;
 
@@ -131,32 +157,20 @@ int main(int argc, char *argv[])
         bb_rect = cv::Rect(bb.cx - bb.w/2., bb.cy - bb.h/2., bb.w, bb.h);
         vot_io.outputBoundingBox(bb_rect);
 
-        if (use_iou) {
+        if (groundtruth_stream.is_open()) {
             std::string line;
             std::getline(groundtruth_stream, line);
-            std::vector<float> numbers;
-            std::istringstream s( line );
-            float x;
-            char ch;
-            while (s >> x){
-                numbers.push_back(x);
-                s >> ch;
-            }
-            double x1 = std::min(numbers[0], std::min(numbers[2], std::min(numbers[4], numbers[6])));
-            double x2 = std::max(numbers[0], std::max(numbers[2], std::max(numbers[4], numbers[6])));
-            double y1 = std::min(numbers[1], std::min(numbers[3], std::min(numbers[5], numbers[7])));
-            double y2 = std::max(numbers[1], std::max(numbers[3], std::max(numbers[5], numbers[7])));
-
-            groundtruth_rect = cv::Rect(x1, y1, x2-x1, y2-y1);
-//             cv::rectangle(image, groundtruth_rect, CV_RGB(255,0,0), 2);
-
-            double rects_intersection = (groundtruth_rect & bb_rect).area();
-            double rects_union = (groundtruth_rect | bb_rect).area();
-            double union_over_inter = rects_intersection/rects_union;
-            std::cout << "   ->intersection ratio " << union_over_inter << std::endl;
-            avg_inter +=union_over_inter;
+
+            cv::Rect groundtruthRect;
+            double accuracy = calcAccuracy(line, bb_rect, groundtruthRect);
+            if (visualize_delay >= 0)
+                cv::rectangle(image, groundtruthRect, CV_RGB(255, 0,0), 1);
+            std::cout << ", accuracy: " << accuracy;
+            sum_accuracy += accuracy;
         }
 
+        std::cout << std::endl;
+
         if (visualize_delay >= 0) {
             cv::rectangle(image, bb_rect, CV_RGB(0,255,0), 2);
             cv::imshow("output", image);
@@ -186,11 +200,12 @@ int main(int argc, char *argv[])
 //        cv::imwrite(ss.c_str(), image, compression_params);
     }
 
-    std::cout << "Average processing speed " << avg_time/frames <<  "ms. (" << 1./(avg_time/frames)*1000 << " fps)" << std::endl;
-    if (use_iou) {
-        std::cout << "Average intersection ratio " << avg_inter/frames << std::endl;
+    std::cout << "Average processing speed: " << avg_time / frames << "ms (" << 1. / (avg_time / frames) * 1000 << " fps)";
+    if (groundtruth_stream.is_open()) {
+        std::cout << "; Average accuracy: " << sum_accuracy/frames << std::endl;
         groundtruth_stream.close();
     }
+    std::cout << std::endl;
 
     return EXIT_SUCCESS;
 }