181 lines
		
	
	
		
			6.2 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
			
		
		
	
	
			181 lines
		
	
	
		
			6.2 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
| #include <opencv2/core/utility.hpp>
 | |
| #include <opencv2/imgproc.hpp>
 | |
| #include <opencv2/objdetect.hpp>
 | |
| #include <opencv2/highgui.hpp>
 | |
| #include <opencv2/softcascade.hpp>
 | |
| 
 | |
| #include <iostream>
 | |
| #include <vector>
 | |
| #include <string>
 | |
| #include <fstream>
 | |
| 
 | |
| void filter_rects(const std::vector<cv::Rect>& candidates, std::vector<cv::Rect>& objects);
 | |
| 
 | |
| int main(int argc, char** argv)
 | |
| {
 | |
|     const std::string keys =
 | |
|     "{help h usage ?    |     | print this message and exit }"
 | |
|     "{cascade c         |     | path to cascade xml, if empty HOG detector will be executed }"
 | |
|     "{frame f           |     | wildchart pattern to frame source}"
 | |
|     "{min_scale         |0.4  | minimum scale to detect }"
 | |
|     "{max_scale         |5.0  | maxamum scale to detect }"
 | |
|     "{total_scales      |55   | prefered number of scales between min and max }"
 | |
|     "{write_file wf     |0    | write to .txt. Disabled by default.}"
 | |
|     "{write_image wi    |0    | write to image. Disabled by default.}"
 | |
|     "{show_image si     |1    | show image. Enabled by default.}"
 | |
|     "{threshold thr     |-1   | detection threshold. Detections with score less then threshold will be ignored.}"
 | |
|     ;
 | |
| 
 | |
|     cv::CommandLineParser parser(argc, argv, keys);
 | |
|     parser.about("Soft cascade training application.");
 | |
| 
 | |
|     if (parser.has("help"))
 | |
|     {
 | |
|         parser.printMessage();
 | |
|         return 0;
 | |
|     }
 | |
| 
 | |
|     if (!parser.check())
 | |
|     {
 | |
|         parser.printErrors();
 | |
|         return 1;
 | |
|     }
 | |
| 
 | |
|     int wf = parser.get<int>("write_file");
 | |
|     if (wf) std::cout << "resulte will be stored to .txt file with the same name as image." << std::endl;
 | |
| 
 | |
|     int wi = parser.get<int>("write_image");
 | |
|     if (wi) std::cout << "resulte will be stored to image with the same name as input plus dt." << std::endl;
 | |
| 
 | |
|     int si = parser.get<int>("show_image");
 | |
| 
 | |
|     float minScale =  parser.get<float>("min_scale");
 | |
|     float maxScale =  parser.get<float>("max_scale");
 | |
|     int scales     =  parser.get<int>("total_scales");
 | |
|     int thr        =  parser.get<int>("threshold");
 | |
| 
 | |
|     cv::HOGDescriptor hog;
 | |
|     cv::softcascade::Detector cascade;
 | |
| 
 | |
|     bool useHOG = false;
 | |
|     std::string cascadePath = parser.get<std::string>("cascade");
 | |
|     if (cascadePath.empty())
 | |
|     {
 | |
|         useHOG = true;
 | |
|         hog.setSVMDetector(cv::HOGDescriptor::getDefaultPeopleDetector());
 | |
|         std::cout << "going to use HOG detector." << std::endl;
 | |
|     }
 | |
|     else
 | |
|     {
 | |
|         cv::FileStorage fs(cascadePath, cv::FileStorage::READ);
 | |
|         if( !fs.isOpened())
 | |
|         {
 | |
|             std::cout << "Soft Cascade file " << cascadePath << " can't be opened." << std::endl << std::flush;
 | |
|             return 1;
 | |
|         }
 | |
| 
 | |
|         cascade = cv::softcascade::Detector(minScale, maxScale, scales, cv::softcascade::Detector::DOLLAR);
 | |
| 
 | |
|         if (!cascade.load(fs.getFirstTopLevelNode()))
 | |
|         {
 | |
|             std::cout << "Soft Cascade can't be parsed." << std::endl << std::flush;
 | |
|             return 1;
 | |
|         }
 | |
|     }
 | |
| 
 | |
|     std::string src = parser.get<std::string>("frame");
 | |
|     std::vector<cv::String> frames;
 | |
|     cv::glob(parser.get<std::string>("frame"), frames);
 | |
|     std::cout << "collected " << src << " " << frames.size() << " frames." << std::endl;
 | |
| 
 | |
|     for (int i = 0; i < (int)frames.size(); ++i)
 | |
|     {
 | |
|         std::string frame_sourse = frames[i];
 | |
|         cv::Mat frame = cv::imread(frame_sourse);
 | |
| 
 | |
|         if(frame.empty())
 | |
|         {
 | |
|             std::cout << "Frame source " << frame_sourse << " can't be opened." << std::endl << std::flush;
 | |
|             continue;
 | |
|         }
 | |
| 
 | |
|         std::ofstream myfile;
 | |
|         if (wf)
 | |
|             myfile.open((frame_sourse.replace(frame_sourse.end() - 3, frame_sourse.end(), "txt")).c_str(), std::ios::out);
 | |
| 
 | |
|         ////
 | |
|         if (useHOG)
 | |
|         {
 | |
|             std::vector<cv::Rect> found, found_filtered;
 | |
|             // run the detector with default parameters. to get a higher hit-rate
 | |
|             // (and more false alarms, respectively), decrease the hitThreshold and
 | |
|             // groupThreshold (set groupThreshold to 0 to turn off the grouping completely).
 | |
|             hog.detectMultiScale(frame, found, 0, cv::Size(8,8), cv::Size(32,32), 1.05, 2);
 | |
| 
 | |
|             filter_rects(found, found_filtered);
 | |
|             std::cout << "collected: " << (int)found_filtered.size() << " detections." << std::endl;
 | |
| 
 | |
|             for (size_t ff = 0; ff < found_filtered.size(); ++ff)
 | |
|             {
 | |
|                 cv::Rect r = found_filtered[ff];
 | |
|                 cv::rectangle(frame, r.tl(), r.br(), cv::Scalar(0,255,0), 3);
 | |
| 
 | |
|                 if (wf) myfile << r.x << "," << r.y << "," << r.width << "," << r.height << "," << 0.f << "\n";
 | |
|             }
 | |
|         }
 | |
|         else
 | |
|         {
 | |
|             std::vector<cv::softcascade::Detection> objects;
 | |
|             cascade.detect(frame,  cv::noArray(), objects);
 | |
|             std::cout << "collected: " << (int)objects.size() << " detections." << std::endl;
 | |
| 
 | |
|             for (int obj = 0; obj  < (int)objects.size(); ++obj)
 | |
|             {
 | |
|                 cv::softcascade::Detection d = objects[obj];
 | |
| 
 | |
|                 if(d.confidence > thr)
 | |
|                 {
 | |
|                     float b = d.confidence * 1.5f;
 | |
| 
 | |
|                     std::stringstream conf(std::stringstream::in | std::stringstream::out);
 | |
|                     conf << d.confidence;
 | |
| 
 | |
|                     cv::rectangle(frame, cv::Rect((int)d.x, (int)d.y, (int)d.w, (int)d.h), cv::Scalar(b, 0, 255 - b, 255), 2);
 | |
|                     cv::putText(frame, conf.str() , cv::Point((int)d.x + 10, (int)d.y - 5),1, 1.1, cv::Scalar(25, 133, 255, 0), 1, cv::LINE_AA);
 | |
| 
 | |
|                     if (wf)
 | |
|                         myfile << d.x << "," <<  d.y << "," << d.w << "," <<  d.h << "," << d.confidence << "\n";
 | |
|                 }
 | |
|             }
 | |
|         }
 | |
| 
 | |
|         if (wi) cv::imwrite(frame_sourse + ".dt.png", frame);
 | |
|         if (wf) myfile.close();
 | |
| 
 | |
|         if (si)
 | |
|         {
 | |
|             cv::imshow("pedestrian detector", frame);
 | |
|             cv::waitKey(10);
 | |
|         }
 | |
|     }
 | |
| 
 | |
|     if (si) cv::waitKey(0);
 | |
|     return 0;
 | |
| }
 | |
| 
 | |
| void filter_rects(const std::vector<cv::Rect>& candidates, std::vector<cv::Rect>& objects)
 | |
| {
 | |
|     size_t i, j;
 | |
|     for (i = 0; i < candidates.size(); ++i)
 | |
|     {
 | |
|         cv::Rect r = candidates[i];
 | |
| 
 | |
|         for (j = 0; j < candidates.size(); ++j)
 | |
|             if (j != i && (r & candidates[j]) == r)
 | |
|                 break;
 | |
| 
 | |
|         if (j == candidates.size())
 | |
|             objects.push_back(r);
 | |
|     }
 | |
| }
 | 
