AlexeyAB
2018-01-24 cc6ab9b3ccf48322b97f7fe096381d5594d198f7
src/yolo_console_dll.cpp
@@ -2,6 +2,7 @@
#include <iomanip> 
#include <string>
#include <vector>
#include <queue>
#include <fstream>
#include <thread>
#include <atomic>
@@ -12,6 +13,9 @@
#define OPENCV
#endif
// To use tracking - uncomment the following line. Tracking is supported only by OpenCV 3.x
//#define TRACK_OPTFLOW
#include "yolo_v2_class.hpp"  // imported functions from DLL
#ifdef OPENCV
@@ -19,24 +23,109 @@
#include "opencv2/core/version.hpp"
#ifndef CV_VERSION_EPOCH
#include "opencv2/videoio/videoio.hpp"
#pragma comment(lib, "opencv_world320.lib")
#define OPENCV_VERSION CVAUX_STR(CV_VERSION_MAJOR)""CVAUX_STR(CV_VERSION_MINOR)""CVAUX_STR(CV_VERSION_REVISION)
#pragma comment(lib, "opencv_world" OPENCV_VERSION ".lib")
#pragma comment(lib, "opencv_cudaoptflow" OPENCV_VERSION ".lib")
#pragma comment(lib, "opencv_cudaimgproc" OPENCV_VERSION ".lib")
#pragma comment(lib, "opencv_core" OPENCV_VERSION ".lib")
#pragma comment(lib, "opencv_imgproc" OPENCV_VERSION ".lib")
#pragma comment(lib, "opencv_highgui" OPENCV_VERSION ".lib")
#else
#pragma comment(lib, "opencv_core2413.lib")
#pragma comment(lib, "opencv_imgproc2413.lib")
#pragma comment(lib, "opencv_highgui2413.lib")
#define OPENCV_VERSION CVAUX_STR(CV_VERSION_EPOCH)""CVAUX_STR(CV_VERSION_MAJOR)""CVAUX_STR(CV_VERSION_MINOR)
#pragma comment(lib, "opencv_core" OPENCV_VERSION ".lib")
#pragma comment(lib, "opencv_imgproc" OPENCV_VERSION ".lib")
#pragma comment(lib, "opencv_highgui" OPENCV_VERSION ".lib")
#endif
cv::Scalar obj_id_to_color(int obj_id) {
   int const colors[6][3] = { { 1,0,1 },{ 0,0,1 },{ 0,1,1 },{ 0,1,0 },{ 1,1,0 },{ 1,0,0 } };
   int const offset = obj_id * 123457 % 6;
   int const color_scale = 150 + (obj_id * 123457) % 100;
   cv::Scalar color(colors[offset][0], colors[offset][1], colors[offset][2]);
   color *= color_scale;
   return color;
}
void draw_preview_boxes(cv::Mat src_mat, cv::Mat draw_mat, std::vector<bbox_t> result_vec)
{
   size_t const preview_box_size = 100;   // size of preview box in ptx
   size_t const count_preview_boxes = draw_mat.cols / preview_box_size;
   unsigned int const frames_history = 30;   // how long to keep the history saved
   struct preview_box_track_t {
      unsigned int track_id, obj_id, last_showed_frames_ago;
      cv::Mat mat_obj;
      preview_box_track_t() : track_id(0), obj_id(0), last_showed_frames_ago(frames_history) {}
   };
   static std::vector<preview_box_track_t> preview_box_track_id(count_preview_boxes);
   // increment frames history
   for (auto &i : preview_box_track_id)
      i.last_showed_frames_ago = std::min(frames_history, i.last_showed_frames_ago + 1);
   // occupy empty boxes
   for (auto &k : result_vec) {
      bool found = false;
      for (auto &i : preview_box_track_id) {
         if (i.track_id == k.track_id) {
            i.last_showed_frames_ago = 0;
            found = true;
            break;
         }
      }
      if (!found) {
         for (auto &i : preview_box_track_id) {
            if (i.last_showed_frames_ago == frames_history) {
               i.track_id = k.track_id;
               i.obj_id = k.obj_id;
               i.last_showed_frames_ago = 0;
               break;
            }
         }
      }
   }
   // draw preview box (from old or current frame)
   for (size_t i = 0; i < preview_box_track_id.size(); ++i) {
      // get object image
      cv::Mat dst = preview_box_track_id[i].mat_obj;
      for (auto &k : result_vec) {
         if (preview_box_track_id[i].track_id == k.track_id) {
            bbox_t b = k;
            cv::Rect r(b.x, b.y, b.w, b.h);
            cv::Rect img_rect(cv::Point2i(0, 0), src_mat.size());
            cv::Rect rect_roi = r & img_rect;
            if (rect_roi.width > 1 || rect_roi.height > 1) {
               cv::Mat roi = src_mat(rect_roi);
               cv::resize(roi, dst, cv::Size(preview_box_size, preview_box_size));
               preview_box_track_id[i].mat_obj = dst;
            }
            break;
         }
      }
      // draw object image
      if (preview_box_track_id[i].last_showed_frames_ago < frames_history &&
         dst.size() == cv::Size(preview_box_size, preview_box_size))
      {
         cv::Rect dst_rect_roi(cv::Point2i(i * preview_box_size, draw_mat.rows - preview_box_size), dst.size());
         cv::Mat dst_roi = draw_mat(dst_rect_roi);
         dst.copyTo(dst_roi);
         cv::Scalar color = obj_id_to_color(preview_box_track_id[i].obj_id);
         cv::rectangle(draw_mat, dst_rect_roi, color, 5);
      }
   }
}
void draw_boxes(cv::Mat mat_img, std::vector<bbox_t> result_vec, std::vector<std::string> obj_names, 
   unsigned int wait_msec = 0, int current_det_fps = -1, int current_cap_fps = -1)
{
   int const colors[6][3] = { { 1,0,1 },{ 0,0,1 },{ 0,1,1 },{ 0,1,0 },{ 1,1,0 },{ 1,0,0 } };
   for (auto &i : result_vec) {
      int const offset = i.obj_id * 123457 % 6;
      int const color_scale = 150 + (i.obj_id * 123457) % 100;
      cv::Scalar color(colors[offset][0], colors[offset][1], colors[offset][2]);
      color *= color_scale;
      cv::Scalar color = obj_id_to_color(i.obj_id);
      cv::rectangle(mat_img, cv::Rect(i.x, i.y, i.w, i.h), color, 5);
      if (obj_names.size() > i.obj_id) {
         std::string obj_name = obj_names[i.obj_id];
@@ -53,6 +142,7 @@
      std::string fps_str = "FPS detection: " + std::to_string(current_det_fps) + "   FPS capture: " + std::to_string(current_cap_fps);
      putText(mat_img, fps_str, cv::Point2f(10, 20), cv::FONT_HERSHEY_COMPLEX_SMALL, 1.2, cv::Scalar(50, 255, 0), 2);
   }
   cv::imshow("window name", mat_img);
   cv::waitKey(wait_msec);
}
@@ -80,14 +170,28 @@
int main(int argc, char *argv[])
{
   std::string  names_file = "data/voc.names";
   std::string  cfg_file = "cfg/yolo-voc.cfg";
   std::string  weights_file = "yolo-voc.weights";
   std::string filename;
   if (argc > 1) filename = argv[1];
   Detector detector("yolo-voc.cfg", "yolo-voc.weights");
   if (argc > 4) {   //voc.names yolo-voc.cfg yolo-voc.weights test.mp4
      names_file = argv[1];
      cfg_file = argv[2];
      weights_file = argv[3];
      filename = argv[4];
   }
   else if (argc > 1) filename = argv[1];
   auto obj_names = objects_names_from_file("data/voc.names");
   Detector detector(cfg_file, weights_file);
   auto obj_names = objects_names_from_file(names_file);
   std::string out_videofile = "result.avi";
   bool const save_output_videofile = false;
#ifdef TRACK_OPTFLOW
   Tracker_optflow tracker_flow;
   detector.wait_stream = true;
#endif
   while (true) 
   {     
@@ -103,6 +207,8 @@
            protocol == "rtmp://" || protocol == "rtsp://" || protocol == "http://" || protocol == "https:/")  // video network stream
         {
            cv::Mat cap_frame, cur_frame, det_frame, write_frame;
            std::queue<cv::Mat> track_optflow_queue;
            int passed_flow_frames = 0;
            std::shared_ptr<image_t> det_image;
            std::vector<bbox_t> result_vec, thread_result_vec;
            detector.nms = 0.02; // comment it - if track_id is not required
@@ -115,7 +221,7 @@
            int current_det_fps = 0, current_cap_fps = 0;
            std::thread t_detect, t_cap, t_videowrite;
            std::mutex mtx;
            std::condition_variable cv;
            std::condition_variable cv_detected, cv_pre_tracked;
            std::chrono::steady_clock::time_point steady_start, steady_end;
            cv::VideoCapture cap(filename); cap >> cur_frame;
            int const video_fps = cap.get(CV_CAP_PROP_FPS);
@@ -124,7 +230,9 @@
            if (save_output_videofile)
               output_video.open(out_videofile, CV_FOURCC('D', 'I', 'V', 'X'), std::max(35, video_fps), frame_size, true);
            while (!cur_frame.empty()) {
            while (!cur_frame.empty())
            {
               // always sync
               if (t_cap.joinable()) {
                  t_cap.join();
                  ++fps_cap_counter;
@@ -132,28 +240,50 @@
               }
               t_cap = std::thread([&]() { cap >> cap_frame; });
               // swap result and input-frame
               // swap result bouned-boxes and input-frame
               if(consumed)
               {
                  std::unique_lock<std::mutex> lock(mtx);
                  det_image = detector.mat_to_image_resize(cur_frame);
                  result_vec = thread_result_vec;
                  result_vec = detector.tracking(result_vec);  // comment it - if track_id is not required
#ifdef TRACK_OPTFLOW
                  // track optical flow
                  if (track_optflow_queue.size() > 0) {
                     //draw_preview_boxes(track_optflow_queue.front(), cur_frame, result_vec);
                     std::queue<cv::Mat> new_track_optflow_queue;
                     //std::cout << "\n !!!! all = " << track_optflow_queue.size() << ", cur = " << passed_flow_frames << std::endl;
                     tracker_flow.update_tracking_flow(track_optflow_queue.front());
                     while (track_optflow_queue.size() > 1) {
                        track_optflow_queue.pop();
                        result_vec = tracker_flow.tracking_flow(track_optflow_queue.front(), result_vec);
                        if (track_optflow_queue.size() <= passed_flow_frames && new_track_optflow_queue.size() == 0)
                           new_track_optflow_queue = track_optflow_queue;
                     }
                     track_optflow_queue = new_track_optflow_queue;
                     passed_flow_frames = 0;
                  }
#endif
                  consumed = false;
                  cv_pre_tracked.notify_all();
               }
               // launch thread once
               // launch thread once - Detection
               if (!t_detect.joinable()) {
                  t_detect = std::thread([&]() {
                     auto current_image = det_image;
                     consumed = true;
                     while (current_image.use_count() > 0) {
                        auto result = detector.detect_resized(*current_image, frame_size, 0.24, true);
                        auto result = detector.detect_resized(*current_image, frame_size, 0.20, false);  // true
                        ++fps_det_counter;
                        std::unique_lock<std::mutex> lock(mtx);
                        thread_result_vec = result;
                        current_image = det_image;
                        consumed = true;
                        cv.notify_all();
                        cv_detected.notify_all();
                        if(detector.wait_stream)
                           while (consumed) cv_pre_tracked.wait(lock);
                     }
                  });
               }
@@ -167,7 +297,14 @@
                     fps_det_counter = 0;
                     fps_cap_counter = 0;
                  }
                  draw_boxes(cur_frame, result_vec, obj_names, 3, current_det_fps, current_cap_fps);
#ifdef TRACK_OPTFLOW
                  ++passed_flow_frames;
                  track_optflow_queue.push(cur_frame.clone());
                  result_vec = tracker_flow.tracking_flow(cur_frame, result_vec);   // track optical flow
#endif
                  //draw_preview_boxes(cur_frame, cur_frame, result_vec);
                  draw_boxes(cur_frame, result_vec, obj_names, 3, current_det_fps, current_cap_fps);  // 3 or 16ms
                  //show_console_result(result_vec, obj_names);
                  if (output_video.isOpened() && videowrite_ready) {
@@ -180,11 +317,13 @@
                  }
               }
#ifndef TRACK_OPTFLOW
               // wait detection result for video-file only (not for net-cam)
               if (protocol != "rtsp://" && protocol != "http://" && protocol != "https:/") {
                  std::unique_lock<std::mutex> lock(mtx);
                  while (!consumed) cv.wait(lock);
                  while (!consumed) cv_detected.wait(lock);
               }
#endif
            }
            if (t_cap.joinable()) t_cap.join();
            if (t_detect.joinable()) t_detect.join();