#include #include #include #include #include #include #include #include #include #include #include #include #include #include #include const std::string keys = "{ h help | | Print this help message }" "{ input | | Path to the input video file }" "{ facem | face-detection-adas-0001.xml | Path to OpenVINO IE face detection model (.xml) }" "{ faced | CPU | Target device for face detection model (e.g. CPU, GPU, VPU, ...) }" "{ r roi | -1,-1,-1,-1 | Region of interest (ROI) to use for inference. Identified automatically when not set }"; namespace { std::string weights_path(const std::string &model_path) { const auto EXT_LEN = 4u; const auto sz = model_path.size(); CV_Assert(sz > EXT_LEN); auto ext = model_path.substr(sz - EXT_LEN); std::transform(ext.begin(), ext.end(), ext.begin(), [](unsigned char c){ return static_cast(std::tolower(c)); }); CV_Assert(ext == ".xml"); return model_path.substr(0u, sz - EXT_LEN) + ".bin"; } cv::util::optional parse_roi(const std::string &rc) { cv::Rect rv; char delim[3]; std::stringstream is(rc); is >> rv.x >> delim[0] >> rv.y >> delim[1] >> rv.width >> delim[2] >> rv.height; if (is.bad()) { return cv::util::optional(); // empty value } const auto is_delim = [](char c) { return c == ','; }; if (!std::all_of(std::begin(delim), std::end(delim), is_delim)) { return cv::util::optional(); // empty value } if (rv.x < 0 || rv.y < 0 || rv.width <= 0 || rv.height <= 0) { return cv::util::optional(); // empty value } return cv::util::make_optional(std::move(rv)); } } // namespace namespace custom { G_API_NET(FaceDetector, , "face-detector"); using GDetections = cv::GArray; using GRect = cv::GOpaque; using GSize = cv::GOpaque; using GPrims = cv::GArray; G_API_OP(LocateROI, , "sample.custom.locate-roi") { static cv::GOpaqueDesc outMeta(const cv::GMatDesc &) { return cv::empty_gopaque_desc(); } }; G_API_OP(BBoxes, , "sample.custom.b-boxes") { static cv::GArrayDesc outMeta(const cv::GArrayDesc &, const cv::GOpaqueDesc &) { return cv::empty_array_desc(); } }; GAPI_OCV_KERNEL(OCVLocateROI, LocateROI) { // This is the place where we can run extra analytics // on the input image frame and select the ROI (region // of interest) where we want to detect our objects (or // run any other inference). // // Currently it doesn't do anything intelligent, // but only crops the input image to square (this is // the most convenient aspect ratio for detectors to use) static void run(const cv::Mat &in_mat, cv::Rect &out_rect) { // Identify the central point & square size (- some padding) const auto center = cv::Point{in_mat.cols/2, in_mat.rows/2}; auto sqside = std::min(in_mat.cols, in_mat.rows); // Now build the central square ROI out_rect = cv::Rect{ center.x - sqside/2 , center.y - sqside/2 , sqside , sqside }; } }; GAPI_OCV_KERNEL(OCVBBoxes, BBoxes) { // This kernel converts the rectangles into G-API's // rendering primitives static void run(const std::vector &in_face_rcs, const cv::Rect &in_roi, std::vector &out_prims) { out_prims.clear(); const auto cvt = [](const cv::Rect &rc, const cv::Scalar &clr) { return cv::gapi::wip::draw::Rect(rc, clr, 2); }; out_prims.emplace_back(cvt(in_roi, CV_RGB(0,255,255))); // cyan for (auto &&rc : in_face_rcs) { out_prims.emplace_back(cvt(rc, CV_RGB(0,255,0))); // green } } }; } // namespace custom int main(int argc, char *argv[]) { cv::CommandLineParser cmd(argc, argv, keys); if (cmd.has("help")) { cmd.printMessage(); return 0; } // Prepare parameters first const std::string input = cmd.get("input"); const auto opt_roi = parse_roi(cmd.get("roi")); const auto face_model_path = cmd.get("facem"); auto face_net = cv::gapi::ie::Params { face_model_path, // path to topology IR weights_path(face_model_path), // path to weights cmd.get("faced"), // device specifier }; auto kernels = cv::gapi::kernels (); auto networks = cv::gapi::networks(face_net); // Now build the graph. The graph structure may vary // passed on the input parameters cv::GStreamingCompiled pipeline; auto inputs = cv::gin(cv::gapi::wip::make_src(input)); cv::GMat in; cv::GOpaque sz = cv::gapi::streaming::size(in); if (opt_roi.has_value()) { // Use the value provided by user std::cout << "Will run inference for static region " << opt_roi.value() << " only" << std::endl; cv::GOpaque in_roi; auto blob = cv::gapi::infer(in_roi, in); cv::GArray rcs = cv::gapi::parseSSD(blob, sz, 0.5f, true, true); auto out = cv::gapi::wip::draw::render3ch(in, custom::BBoxes::on(rcs, in_roi)); pipeline = cv::GComputation(cv::GIn(in, in_roi), cv::GOut(out)) .compileStreaming(cv::compile_args(kernels, networks)); // Since the ROI to detect is manual, make it part of the input vector inputs.push_back(cv::gin(opt_roi.value())[0]); } else { // Automatically detect ROI to infer. Make it output parameter std::cout << "ROI is not set or invalid. Locating it automatically" << std::endl; cv::GOpaque roi = custom::LocateROI::on(in); auto blob = cv::gapi::infer(roi, in); cv::GArray rcs = cv::gapi::parseSSD(blob, sz, 0.5f, true, true); auto out = cv::gapi::wip::draw::render3ch(in, custom::BBoxes::on(rcs, roi)); pipeline = cv::GComputation(cv::GIn(in), cv::GOut(out)) .compileStreaming(cv::compile_args(kernels, networks)); } // The execution part pipeline.setSource(std::move(inputs)); pipeline.start(); cv::Mat out; size_t frames = 0u; cv::TickMeter tm; tm.start(); while (pipeline.pull(cv::gout(out))) { cv::imshow("Out", out); cv::waitKey(1); ++frames; } tm.stop(); std::cout << "Processed " << frames << " frames" << " (" << frames / tm.getTimeSec() << " FPS)" << std::endl; return 0; }