#include #include #include #include using namespace cv; using namespace dnn; const char* keys = "{ help h | | print help message }" "{ proto p | | path to .prototxt }" "{ model m | | path to .caffemodel }" "{ image i | | path to input image }" "{ conf c | 0.8 | minimal confidence }"; const char* classNames[] = { "__background__", "aeroplane", "bicycle", "bird", "boat", "bottle", "bus", "car", "cat", "chair", "cow", "diningtable", "dog", "horse", "motorbike", "person", "pottedplant", "sheep", "sofa", "train", "tvmonitor" }; static const int kInpWidth = 800; static const int kInpHeight = 600; int main(int argc, char** argv) { // Parse command line arguments. CommandLineParser parser(argc, argv, keys); parser.about("This sample is used to run Faster-RCNN and R-FCN object detection " "models with OpenCV. You can get required models from " "https://github.com/rbgirshick/py-faster-rcnn (Faster-RCNN) and from " "https://github.com/YuwenXiong/py-R-FCN (R-FCN). Corresponding .prototxt " "files may be found at https://github.com/opencv/opencv_extra/tree/master/testdata/dnn."); if (argc == 1 || parser.has("help")) { parser.printMessage(); return 0; } String protoPath = parser.get("proto"); String modelPath = parser.get("model"); String imagePath = parser.get("image"); float confThreshold = parser.get("conf"); CV_Assert(!protoPath.empty(), !modelPath.empty(), !imagePath.empty()); // Load a model. Net net = readNetFromCaffe(protoPath, modelPath); Mat img = imread(imagePath); resize(img, img, Size(kInpWidth, kInpHeight)); Mat blob = blobFromImage(img, 1.0, Size(), Scalar(102.9801, 115.9465, 122.7717), false, false); Mat imInfo = (Mat_(1, 3) << img.rows, img.cols, 1.6f); net.setInput(blob, "data"); net.setInput(imInfo, "im_info"); // Draw detections. Mat detections = net.forward(); const float* data = (float*)detections.data; for (size_t i = 0; i < detections.total(); i += 7) { // An every detection is a vector [id, classId, confidence, left, top, right, bottom] float confidence = data[i + 2]; if (confidence > confThreshold) { int classId = (int)data[i + 1]; int left = max(0, min((int)data[i + 3], img.cols - 1)); int top = max(0, min((int)data[i + 4], img.rows - 1)); int right = max(0, min((int)data[i + 5], img.cols - 1)); int bottom = max(0, min((int)data[i + 6], img.rows - 1)); // Draw a bounding box. rectangle(img, Point(left, top), Point(right, bottom), Scalar(0, 255, 0)); // Put a label with a class name and confidence. String label = cv::format("%s, %.3f", classNames[classId], confidence); int baseLine; Size labelSize = cv::getTextSize(label, FONT_HERSHEY_SIMPLEX, 0.5, 1, &baseLine); top = max(top, labelSize.height); rectangle(img, Point(left, top - labelSize.height), Point(left + labelSize.width, top + baseLine), Scalar(255, 255, 255), FILLED); putText(img, label, Point(left, top), FONT_HERSHEY_SIMPLEX, 0.5, Scalar(0, 0, 0)); } } imshow("frame", img); waitKey(); return 0; }