AlexeyAB
2018-02-07 4373f897f1a5efd1a58746c44430dc33df925415
src/yolo_console_dll.cpp
@@ -11,10 +11,10 @@
#ifdef _WIN32
#define OPENCV
#include "windows.h"
#endif
#define TRACK_OPTFLOW
// To use tracking - uncomment the following line. Tracking is supported only by OpenCV 3.x
//#define TRACK_OPTFLOW
#include "yolo_v2_class.hpp"  // imported functions from DLL
@@ -38,16 +38,156 @@
#endif
cv::Scalar obj_id_to_color(int obj_id) {
   int const colors[6][3] = { { 1,0,1 },{ 0,0,1 },{ 0,1,1 },{ 0,1,0 },{ 1,1,0 },{ 1,0,0 } };
   int const offset = obj_id * 123457 % 6;
   int const color_scale = 150 + (obj_id * 123457) % 100;
   cv::Scalar color(colors[offset][0], colors[offset][1], colors[offset][2]);
   color *= color_scale;
   return color;
}
class preview_boxes_t {
   enum { frames_history = 30 }; // how long to keep the history saved
   struct preview_box_track_t {
      unsigned int track_id, obj_id, last_showed_frames_ago;
      bool current_detection;
      bbox_t bbox;
      cv::Mat mat_obj, mat_resized_obj;
      preview_box_track_t() : track_id(0), obj_id(0), last_showed_frames_ago(frames_history), current_detection(false){}
   };
   std::vector<preview_box_track_t> preview_box_track_id;
   size_t const preview_box_size, bottom_offset;
   bool const one_off_detections;
public:
   preview_boxes_t(size_t _preview_box_size = 100, size_t _bottom_offset = 100, bool _one_off_detections = false) :
      preview_box_size(_preview_box_size), bottom_offset(_bottom_offset), one_off_detections(_one_off_detections)
   {}
   void set(cv::Mat src_mat, std::vector<bbox_t> result_vec)
   {
      size_t const count_preview_boxes = src_mat.cols / preview_box_size;
      if (preview_box_track_id.size() != count_preview_boxes) preview_box_track_id.resize(count_preview_boxes);
      // increment frames history
      for (auto &i : preview_box_track_id)
         i.last_showed_frames_ago = std::min((unsigned)frames_history, i.last_showed_frames_ago + 1);
      // occupy empty boxes
      for (auto &k : result_vec) {
         bool found = false;
         // find the same (track_id)
         for (auto &i : preview_box_track_id) {
            if (i.track_id == k.track_id) {
               if (!one_off_detections) i.last_showed_frames_ago = 0; // for tracked objects
               found = true;
               break;
            }
         }
         if (!found) {
            // find empty box
            for (auto &i : preview_box_track_id) {
               if (i.last_showed_frames_ago == frames_history) {
                  if (!one_off_detections && k.frames_counter == 0) break; // don't show if obj isn't tracked yet
                  i.track_id = k.track_id;
                  i.obj_id = k.obj_id;
                  i.bbox = k;
                  i.last_showed_frames_ago = 0;
                  break;
               }
            }
         }
      }
      // draw preview box (from old or current frame)
      for (size_t i = 0; i < preview_box_track_id.size(); ++i)
      {
         // get object image
         cv::Mat dst = preview_box_track_id[i].mat_resized_obj;
         preview_box_track_id[i].current_detection = false;
         for (auto &k : result_vec) {
            if (preview_box_track_id[i].track_id == k.track_id) {
               if (one_off_detections && preview_box_track_id[i].last_showed_frames_ago > 0) {
                  preview_box_track_id[i].last_showed_frames_ago = frames_history; break;
               }
               bbox_t b = k;
               cv::Rect r(b.x, b.y, b.w, b.h);
               cv::Rect img_rect(cv::Point2i(0, 0), src_mat.size());
               cv::Rect rect_roi = r & img_rect;
               if (rect_roi.width > 1 || rect_roi.height > 1) {
                  cv::Mat roi = src_mat(rect_roi);
                  cv::resize(roi, dst, cv::Size(preview_box_size, preview_box_size));
                  preview_box_track_id[i].mat_obj = roi.clone();
                  preview_box_track_id[i].mat_resized_obj = dst.clone();
                  preview_box_track_id[i].current_detection = true;
                  preview_box_track_id[i].bbox = k;
               }
               break;
            }
         }
      }
   }
   void draw(cv::Mat draw_mat, bool show_small_boxes = false)
   {
      // draw preview box (from old or current frame)
      for (size_t i = 0; i < preview_box_track_id.size(); ++i)
      {
         auto &prev_box = preview_box_track_id[i];
         // draw object image
         cv::Mat dst = prev_box.mat_resized_obj;
         if (prev_box.last_showed_frames_ago < frames_history &&
            dst.size() == cv::Size(preview_box_size, preview_box_size))
         {
            cv::Rect dst_rect_roi(cv::Point2i(i * preview_box_size, draw_mat.rows - bottom_offset), dst.size());
            cv::Mat dst_roi = draw_mat(dst_rect_roi);
            dst.copyTo(dst_roi);
            cv::Scalar color = obj_id_to_color(prev_box.obj_id);
            int thickness = (prev_box.current_detection) ? 5 : 1;
            cv::rectangle(draw_mat, dst_rect_roi, color, thickness);
            unsigned int const track_id = prev_box.track_id;
            std::string track_id_str = (track_id > 0)? std::to_string(track_id):"";
            putText(draw_mat, track_id_str, dst_rect_roi.tl() - cv::Point2i(0, 10), cv::FONT_HERSHEY_COMPLEX_SMALL, 1.0, cv::Scalar(0, 0, 0), 2);
            std::string size_str = std::to_string(prev_box.bbox.w) + "x" + std::to_string(prev_box.bbox.h);
            putText(draw_mat, size_str, dst_rect_roi.tl() + cv::Point2i(0, 12), cv::FONT_HERSHEY_COMPLEX_SMALL, 0.8, cv::Scalar(0, 0, 0), 1);
            if (!one_off_detections && prev_box.current_detection) {
               cv::line(draw_mat, dst_rect_roi.tl() + cv::Point2i(preview_box_size, 0),
                  cv::Point2i(prev_box.bbox.x, prev_box.bbox.y + prev_box.bbox.h),
                  color);
            }
            if (one_off_detections && show_small_boxes) {
               cv::Rect src_rect_roi(cv::Point2i(prev_box.bbox.x, prev_box.bbox.y),
               cv::Size(prev_box.bbox.w, prev_box.bbox.h));
               unsigned int const color_history = (255 * prev_box.last_showed_frames_ago) / frames_history;
               color = cv::Scalar(255 - 3* color_history, 255 - 2 * color_history,  255 - 1 * color_history);
               if (prev_box.mat_obj.size() == src_rect_roi.size()) {
                  prev_box.mat_obj.copyTo(draw_mat(src_rect_roi));
               }
               cv::rectangle(draw_mat, src_rect_roi, color, thickness);
               putText(draw_mat, track_id_str, src_rect_roi.tl() - cv::Point2i(0, 10), cv::FONT_HERSHEY_COMPLEX_SMALL, 0.8, cv::Scalar(0, 0, 0), 1);
            }
         }
      }
   }
};
void draw_boxes(cv::Mat mat_img, std::vector<bbox_t> result_vec, std::vector<std::string> obj_names, 
   unsigned int wait_msec = 0, int current_det_fps = -1, int current_cap_fps = -1)
   int current_det_fps = -1, int current_cap_fps = -1)
{
   int const colors[6][3] = { { 1,0,1 },{ 0,0,1 },{ 0,1,1 },{ 0,1,0 },{ 1,1,0 },{ 1,0,0 } };
   for (auto &i : result_vec) {
      int const offset = i.obj_id * 123457 % 6;
      int const color_scale = 150 + (i.obj_id * 123457) % 100;
      cv::Scalar color(colors[offset][0], colors[offset][1], colors[offset][2]);
      color *= color_scale;
      cv::Scalar color = obj_id_to_color(i.obj_id);
      cv::rectangle(mat_img, cv::Rect(i.x, i.y, i.w, i.h), color, 5);
      if (obj_names.size() > i.obj_id) {
         std::string obj_name = obj_names[i.obj_id];
@@ -64,8 +204,6 @@
      std::string fps_str = "FPS detection: " + std::to_string(current_det_fps) + "   FPS capture: " + std::to_string(current_cap_fps);
      putText(mat_img, fps_str, cv::Point2f(10, 20), cv::FONT_HERSHEY_COMPLEX_SMALL, 1.2, cv::Scalar(50, 255, 0), 2);
   }
   cv::imshow("window name", mat_img);
   cv::waitKey(wait_msec);
}
#endif   // OPENCV
@@ -91,17 +229,29 @@
int main(int argc, char *argv[])
{
   std::string  names_file = "data/voc.names";
   std::string  cfg_file = "cfg/yolo-voc.cfg";
   std::string  weights_file = "yolo-voc.weights";
   std::string filename;
   if (argc > 1) filename = argv[1];
   //Detector detector("cfg/yolo-voc.cfg", "yolo-voc.weights");
   Detector detector("tiny-yolo-voc_air.cfg", "backup/tiny-yolo-voc_air_5000.weights");
   if (argc > 4) {   //voc.names yolo-voc.cfg yolo-voc.weights test.mp4
      names_file = argv[1];
      cfg_file = argv[2];
      weights_file = argv[3];
      filename = argv[4];
   }
   else if (argc > 1) filename = argv[1];
   auto obj_names = objects_names_from_file("data/voc.names");
   float const thresh = (argc > 5) ? std::stof(argv[5]) : 0.20;
   Detector detector(cfg_file, weights_file);
   auto obj_names = objects_names_from_file(names_file);
   std::string out_videofile = "result.avi";
   bool const save_output_videofile = false;
#ifdef TRACK_OPTFLOW
   Tracker_optflow tracker_flow;
   detector.wait_stream = true;
#endif
   while (true) 
@@ -112,6 +262,9 @@
      
      try {
#ifdef OPENCV
         preview_boxes_t large_preview(100, 150, false), small_preview(50, 50, true);
         bool show_small_boxes = false;
         std::string const file_ext = filename.substr(filename.find_last_of(".") + 1);
         std::string const protocol = filename.substr(0, 7);
         if (file_ext == "avi" || file_ext == "mp4" || file_ext == "mjpg" || file_ext == "mov" ||  // video file
@@ -156,26 +309,48 @@
               {
                  std::unique_lock<std::mutex> lock(mtx);
                  det_image = detector.mat_to_image_resize(cur_frame);
                  result_vec = thread_result_vec;
                  result_vec = detector.tracking(result_vec);  // comment it - if track_id is not required
                  //auto old_result_vec = result_vec;
                  auto old_result_vec = detector.tracking_id(result_vec);
                  auto detected_result_vec = thread_result_vec;
                  result_vec = detected_result_vec;
#ifdef TRACK_OPTFLOW
                  // track optical flow
                  if (track_optflow_queue.size() > 0) {
                     std::queue<cv::Mat> new_track_optflow_queue;
                     //std::cout << "\n !!!! all = " << track_optflow_queue.size() << ", cur = " << passed_flow_frames << std::endl;
                     tracker_flow.update_tracking_flow(track_optflow_queue.front());
                     cv::Mat first_frame = track_optflow_queue.front();
                     tracker_flow.update_tracking_flow(track_optflow_queue.front(), result_vec);
                     while (track_optflow_queue.size() > 1) {
                        track_optflow_queue.pop();
                        result_vec = tracker_flow.tracking_flow(track_optflow_queue.front(), result_vec);
                        if (track_optflow_queue.size() <= passed_flow_frames && new_track_optflow_queue.size() == 0)
                           new_track_optflow_queue = track_optflow_queue;
                        result_vec = tracker_flow.tracking_flow(track_optflow_queue.front(), false);
                     }
                     track_optflow_queue = new_track_optflow_queue;
                     new_track_optflow_queue.swap(std::queue<cv::Mat>());
                     track_optflow_queue.pop();
                     passed_flow_frames = 0;
                     result_vec = detector.tracking_id(result_vec);
                     auto tmp_result_vec = detector.tracking_id(detected_result_vec);
                     small_preview.set(first_frame, tmp_result_vec);
                  }
#endif
                  result_vec = detector.tracking_id(result_vec);  // comment it - if track_id is not required
                  // add old tracked objects
                  for (auto &i : old_result_vec) {
                     auto it = std::find_if(result_vec.begin(), result_vec.end(),
                        [&i](bbox_t const& b) { return b.track_id == i.track_id && b.obj_id == i.obj_id; });
                     bool track_id_absent = (it == result_vec.end());
                     if (track_id_absent) {
                        if (i.frames_counter-- > 1)
                           result_vec.push_back(i);
                     }
                     else {
                        it->frames_counter = std::min((unsigned)3, i.frames_counter + 1);
                     }
                  }
#ifdef TRACK_OPTFLOW
                  tracker_flow.update_cur_bbox_vec(result_vec);
                  result_vec = tracker_flow.tracking_flow(cur_frame, false);  // track optical flow
#endif
                  consumed = false;
                  cv_pre_tracked.notify_all();
               }
@@ -185,20 +360,20 @@
                     auto current_image = det_image;
                     consumed = true;
                     while (current_image.use_count() > 0) {
                        //std::vector<bbox_t> result;
                        auto result = detector.detect_resized(*current_image, frame_size, 0.24, false);  // true
                        //Sleep(200);
                        //Sleep(50);
                        auto result = detector.detect_resized(*current_image, frame_size, thresh, false);   // true
                        ++fps_det_counter;
                        std::unique_lock<std::mutex> lock(mtx);
                        thread_result_vec = result;
                        current_image = det_image;
                        consumed = true;
                        cv_detected.notify_all();
                        while (consumed) cv_pre_tracked.wait(lock);
                        if (detector.wait_stream) {
                           while (consumed) cv_pre_tracked.wait(lock);
                        }
                        current_image = det_image;
                     }
                  });
               }
               //while (!consumed); // sync detection
               if (!cur_frame.empty()) {
                  steady_end = std::chrono::steady_clock::now();
@@ -210,14 +385,21 @@
                     fps_cap_counter = 0;
                  }
                  large_preview.set(cur_frame, result_vec);
#ifdef TRACK_OPTFLOW
                  ++passed_flow_frames;
                  track_optflow_queue.push(cur_frame.clone());
                  result_vec = tracker_flow.tracking_flow(cur_frame, result_vec);   // track optical flow
#endif
                  result_vec = tracker_flow.tracking_flow(cur_frame);   // track optical flow
                  small_preview.draw(cur_frame, show_small_boxes);
#endif
                  draw_boxes(cur_frame, result_vec, obj_names, 3, current_det_fps, current_cap_fps);
                  draw_boxes(cur_frame, result_vec, obj_names, current_det_fps, current_cap_fps);
                  //show_console_result(result_vec, obj_names);
                  large_preview.draw(cur_frame);
                  cv::imshow("window name", cur_frame);
                  int key = cv::waitKey(3);  // 3 or 16ms
                  if (key == 'f') show_small_boxes = !show_small_boxes;
                  if (output_video.isOpened() && videowrite_ready) {
                     if (t_videowrite.joinable()) t_videowrite.join();
@@ -229,11 +411,13 @@
                  }
               }
#ifndef TRACK_OPTFLOW
               // wait detection result for video-file only (not for net-cam)
               //if (protocol != "rtsp://" && protocol != "http://" && protocol != "https:/") {
               // std::unique_lock<std::mutex> lock(mtx);
               // while (!consumed) cv_detected.wait(lock);
               //}
               if (protocol != "rtsp://" && protocol != "http://" && protocol != "https:/") {
                  std::unique_lock<std::mutex> lock(mtx);
                  while (!consumed) cv_detected.wait(lock);
               }
#endif
            }
            if (t_cap.joinable()) t_cap.join();
            if (t_detect.joinable()) t_detect.join();
@@ -257,8 +441,10 @@
         else {   // image file
            cv::Mat mat_img = cv::imread(filename);
            std::vector<bbox_t> result_vec = detector.detect(mat_img);
            result_vec = detector.tracking(result_vec);  // comment it - if track_id is not required
            result_vec = detector.tracking_id(result_vec);  // comment it - if track_id is not required
            draw_boxes(mat_img, result_vec, obj_names);
            cv::imshow("window name", mat_img);
            cv::waitKey(3);   // 3 or 16ms
            show_console_result(result_vec, obj_names);
         }
#else