From ec461a2ff0a3ebd3fb3ff33f1972062d1ab5ae0b Mon Sep 17 00:00:00 2001 From: Ilya Lavrenov Date: Thu, 22 Aug 2013 17:37:48 +0400 Subject: [PATCH 1/4] added a test for ocl::norm --- modules/ocl/test/test_norm.cpp | 63 ++++++++++++++++++++++++++++++++++ 1 file changed, 63 insertions(+) create mode 100644 modules/ocl/test/test_norm.cpp diff --git a/modules/ocl/test/test_norm.cpp b/modules/ocl/test/test_norm.cpp new file mode 100644 index 0000000000..2bd847068e --- /dev/null +++ b/modules/ocl/test/test_norm.cpp @@ -0,0 +1,63 @@ +/*M/////////////////////////////////////////////////////////////////////////////////////// +// +// IMPORTANT: READ BEFORE DOWNLOADING, COPYING, INSTALLING OR USING. +// +// By downloading, copying, installing or using the software you agree to this license. +// If you do not agree to this license, do not download, install, +// copy or use the software. +// +// +// Intel License Agreement +// For Open Source Computer Vision Library +// +// Copyright (C) 2000, Intel Corporation, all rights reserved. +// Third party copyrights are property of their respective owners. +// +// Redistribution and use in source and binary forms, with or without modification, +// are permitted provided that the following conditions are met: +// +// * Redistribution's of source code must retain the above copyright notice, +// this list of conditions and the following disclaimer. +// +// * Redistribution's in binary form must reproduce the above copyright notice, +// this list of conditions and the following disclaimer in the documentation +// and/or other materials provided with the distribution. +// +// * The name of Intel Corporation may not be used to endorse or promote products +// derived from this software without specific prior written permission. +// +// This software is provided by the copyright holders and contributors "as is" and +// any express or implied warranties, including, but not limited to, the implied +// warranties of merchantability and fitness for a particular purpose are disclaimed. +// In no event shall the Intel Corporation or contributors be liable for any direct, +// indirect, incidental, special, exemplary, or consequential damages +// (including, but not limited to, procurement of substitute goods or services; +// loss of use, data, or profits; or business interruption) however caused +// and on any theory of liability, whether in contract, strict liability, +// or tort (including negligence or otherwise) arising in any way out of +// the use of this software, even if advised of the possibility of such damage. +// +//M*/ + +#include "test_precomp.hpp" + +typedef ::testing::TestWithParam normFixture; + +TEST_P(normFixture, DISABLED_accuracy) +{ + const cv::Size srcSize = GetParam(); + + cv::Mat src1(srcSize, CV_8UC1), src2(srcSize, CV_8UC1); + cv::randu(src1, 0, 2); + cv::randu(src2, 0, 2); + + cv::ocl::oclMat oclSrc1(src1), oclSrc2(src2); + + double value = cv::norm(src1, src2, cv::NORM_INF); + double oclValue = cv::ocl::norm(oclSrc1, oclSrc2, cv::NORM_INF); + + ASSERT_EQ(value, oclValue); +} + +INSTANTIATE_TEST_CASE_P(oclNormTest, normFixture, + ::testing::Values(cv::Size(500, 500), cv::Size(1000, 1000))); From 6c4ad9b597e6ca656d6c832f027f650663d1ecd5 Mon Sep 17 00:00:00 2001 From: Ilya Lavrenov Date: Thu, 22 Aug 2013 17:38:55 +0400 Subject: [PATCH 2/4] fixer error with incorrect condition --- modules/ocl/src/arithm.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/modules/ocl/src/arithm.cpp b/modules/ocl/src/arithm.cpp index a591c82319..11e9c50f43 100644 --- a/modules/ocl/src/arithm.cpp +++ b/modules/ocl/src/arithm.cpp @@ -2336,7 +2336,7 @@ void cv::ocl::pow(const oclMat &x, double p, oclMat &y) return; } - CV_Assert((x.type() == y.type() && x.size() == y.size() && x.depth() == CV_32F) || x.depth() == CV_64F); + CV_Assert(x.depth() == CV_32F || x.depth() == CV_64F); y.create(x.size(), x.type()); string kernelName = "arithm_pow"; From 4c28a6f0f651f3def96d6c10da2ebf9cd28a5068 Mon Sep 17 00:00:00 2001 From: ilya-lavrenov Date: Thu, 22 Aug 2013 18:03:05 +0400 Subject: [PATCH 3/4] most of the performance tests was rewritten in google-test manner --- modules/ocl/perf/main.cpp | 34 +- modules/ocl/perf/perf_arithm.cpp | 1700 ++++++++--------- modules/ocl/perf/perf_blend.cpp | 98 +- modules/ocl/perf/perf_brute_force_matcher.cpp | 291 ++- modules/ocl/perf/perf_calib3d.cpp | 67 +- modules/ocl/perf/perf_canny.cpp | 57 +- modules/ocl/perf/perf_color.cpp | 62 +- modules/ocl/perf/perf_fft.cpp | 62 +- modules/ocl/perf/perf_filters.cpp | 477 ++--- modules/ocl/perf/perf_gemm.cpp | 64 +- modules/ocl/perf/perf_gftt.cpp | 80 +- modules/ocl/perf/perf_haar.cpp | 76 +- modules/ocl/perf/perf_hog.cpp | 62 +- modules/ocl/perf/perf_imgproc.cpp | 1058 +++++----- modules/ocl/perf/perf_match_template.cpp | 160 +- modules/ocl/perf/perf_matrix_operation.cpp | 211 +- modules/ocl/perf/perf_moments.cpp | 73 +- modules/ocl/perf/perf_norm.cpp | 63 +- modules/ocl/perf/perf_opticalflow.cpp | 215 ++- modules/ocl/perf/perf_precomp.hpp | 35 +- modules/ocl/perf/perf_pyramid.cpp | 135 +- modules/ocl/perf/perf_split_merge.cpp | 186 +- 22 files changed, 2674 insertions(+), 2592 deletions(-) diff --git a/modules/ocl/perf/main.cpp b/modules/ocl/perf/main.cpp index 428ab97e43..f67961f87e 100644 --- a/modules/ocl/perf/main.cpp +++ b/modules/ocl/perf/main.cpp @@ -42,7 +42,7 @@ #include "perf_precomp.hpp" -int main(int argc, const char *argv[]) +static int old_main(int argc, const char *argv[]) { const char *keys = "{ h | help | false | print help message }" @@ -99,7 +99,7 @@ int main(int argc, const char *argv[]) // set this to overwrite binary cache every time the test starts ocl::setBinaryDiskCache(ocl::CACHE_UPDATE); - + if (cmd.get("verify")) { TestSystem::instance().setNumIters(1); @@ -162,3 +162,33 @@ END_DEV: return 0; } + +const char * impls[] = +{ + "ocl", + "plain", +#ifdef HAVE_OPENCV_GPU + "gpu" +#endif +}; + +int main(int argc, char **argv) +{ + // temp solution: if no '--gtest_' and '--perf_' args switch to old behavior + bool useGTest = false; + + for(int i=1; i LUTParams; +typedef TestBaseWithParam LUTFixture; - gen(src, size, size, all_type[j], 0, 256); - gen(lut, 1, 256, CV_8UC1, 0, 1); +PERF_TEST_P(LUTFixture, LUT, + ::testing::Combine(OCL_TYPICAL_MAT_SIZES, + LUTMatTypes::all())) +{ + // getting params + LUTParams params = GetParam(); + const Size srcSize = get<0>(params); + const int type = get<1>(params); - LUT(src, lut, dst); + const std::string impl = getSelectedImpl(); - CPU_ON; - LUT(src, lut, dst); - CPU_OFF; + // creating src data + Mat src(srcSize, type), lut(1, 256, CV_8UC1); + int dstType = CV_MAKETYPE(lut.depth(), src.channels()); + Mat dst(srcSize, dstType); - d_src.upload(src); - d_lut.upload(lut); + randu(lut, 0, 2); + declare.in(src, WARMUP_RNG).in(lut).out(dst); - WARMUP_ON; - ocl::LUT(d_src, d_lut, d_dst); - WARMUP_OFF; + // select implementation + if (impl == "ocl") + { + ocl::oclMat oclSrc(src), oclLut(lut), oclDst(srcSize, dstType); - GPU_ON; - ocl::LUT(d_src, d_lut, d_dst); - GPU_OFF; + TEST_CYCLE() cv::ocl::LUT(oclSrc, oclLut, oclDst); - GPU_FULL_ON; - d_src.upload(src); - d_lut.upload(lut); - ocl::LUT(d_src, d_lut, d_dst); - d_dst.download(ocl_dst); - GPU_FULL_OFF; + oclDst.download(dst); - TestSystem::instance().ExpectedMatNear(ocl_dst, dst, 0); - } + SANITY_CHECK(dst); + } + else if (impl == "plain") + { + TEST_CYCLE() cv::LUT(src, lut, dst); + SANITY_CHECK(dst); } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); } ///////////// Exp //////////////////////// -PERFTEST(Exp) -{ - Mat src, dst, ocl_dst; - ocl::oclMat d_src, d_dst; - for (int size = Min_Size; size <= Max_Size; size *= Multiple) - { - SUBTEST << size << 'x' << size << "; CV_32FC1"; +typedef TestBaseWithParam ExpFixture; + +PERF_TEST_P(ExpFixture, Exp, OCL_TYPICAL_MAT_SIZES) +{ + // getting params + const Size srcSize = GetParam(); - gen(src, size, size, CV_32FC1, 5, 16); + const std::string impl = getSelectedImpl(); - exp(src, dst); + // creating src data + Mat src(srcSize, CV_32FC1), dst(srcSize, CV_32FC1); + declare.in(src).out(dst); + randu(src, 5, 16); - CPU_ON; - exp(src, dst); - CPU_OFF; - d_src.upload(src); + // select implementation + if (impl == "ocl") + { + ocl::oclMat oclSrc(src), oclDst(srcSize, src.type()); - WARMUP_ON; - ocl::exp(d_src, d_dst); - WARMUP_OFF; + TEST_CYCLE() cv::ocl::exp(oclSrc, oclDst); - GPU_ON; - ocl::exp(d_src, d_dst); - GPU_OFF; + oclDst.download(dst); - GPU_FULL_ON; - d_src.upload(src); - ocl::exp(d_src, d_dst); - d_dst.download(ocl_dst); - GPU_FULL_OFF; + SANITY_CHECK(dst, 0.3); + } + else if (impl == "plain") + { + TEST_CYCLE() cv::exp(src, dst); - TestSystem::instance().ExpectedMatNear(ocl_dst, dst, 2); + SANITY_CHECK(dst, 0.3); } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); } ///////////// LOG //////////////////////// -PERFTEST(Log) -{ - Mat src, dst, ocl_dst; - ocl::oclMat d_src, d_dst; - for (int size = Min_Size; size <= Max_Size; size *= Multiple) - { - SUBTEST << size << 'x' << size << "; 32F"; +typedef TestBaseWithParam LogFixture; - gen(src, size, size, CV_32F, 1, 10); +PERF_TEST_P(LogFixture, Log, OCL_TYPICAL_MAT_SIZES) +{ + // getting params + const Size srcSize = GetParam(); + const std::string impl = getSelectedImpl(); - log(src, dst); + // creating src data + Mat src(srcSize, CV_32F), dst(srcSize, src.type()); + randu(src, 1, 10); + declare.in(src).out(dst); - CPU_ON; - log(src, dst); - CPU_OFF; - d_src.upload(src); + if (srcSize == OCL_SIZE_4000) + declare.time(3.6); - WARMUP_ON; - ocl::log(d_src, d_dst); - WARMUP_OFF; + // select implementation + if (impl == "ocl") + { + ocl::oclMat oclSrc(src), oclDst(srcSize, src.type()); - GPU_ON; - ocl::log(d_src, d_dst); - GPU_OFF; + TEST_CYCLE() cv::ocl::log(oclSrc, oclDst); - GPU_FULL_ON; - d_src.upload(src); - ocl::log(d_src, d_dst); - d_dst.download(ocl_dst); - GPU_FULL_OFF; + oclDst.download(dst); - TestSystem::instance().ExpectedMatNear(ocl_dst, dst, 1); + SANITY_CHECK(dst); } -} - -///////////// Add //////////////////////// -PERFTEST(Add) -{ - Mat src1, src2, dst, ocl_dst; - ocl::oclMat d_src1, d_src2, d_dst; - - int all_type[] = {CV_8UC1, CV_32FC1}; - std::string type_name[] = {"CV_8UC1", "CV_32FC1"}; - - for (int size = Min_Size; size <= Max_Size; size *= Multiple) + else if (impl == "plain") { - for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) - { - SUBTEST << size << 'x' << size << "; " << type_name[j]; + TEST_CYCLE() cv::log(src, dst); - gen(src1, size, size, all_type[j], 0, 1); - gen(src2, size, size, all_type[j], 0, 1); + SANITY_CHECK(dst); + } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); +} - add(src1, src2, dst); +///////////// Add //////////////////////// - CPU_ON; - add(src1, src2, dst); - CPU_OFF; +CV_ENUM(AddMatTypes, CV_8UC1, CV_32FC1) - d_src1.upload(src1); - d_src2.upload(src2); +typedef tuple AddParams; +typedef TestBaseWithParam AddFixture; - WARMUP_ON; - ocl::add(d_src1, d_src2, d_dst); - WARMUP_OFF; +PERF_TEST_P(AddFixture, Add, + ::testing::Combine(OCL_TYPICAL_MAT_SIZES, + AddMatTypes::all())) +{ + // getting params + AddParams params = GetParam(); + const Size srcSize = get<0>(params); + const int type = get<1>(params); + const string impl = getSelectedImpl(); + + // creating src data + Mat src1(srcSize, type), src2(srcSize, type), dst(srcSize, type); + randu(src1, 0, 1); + randu(src2, 0, 1); + declare.in(src1, src2).out(dst); + + // select implementation + if (impl == "ocl") + { + ocl::oclMat oclSrc1(src1), oclSrc2(src2), oclDst(srcSize, type); - GPU_ON; - ocl::add(d_src1, d_src2, d_dst); - GPU_OFF; + TEST_CYCLE() cv::ocl::add(oclSrc1, oclSrc2, oclDst); - GPU_FULL_ON; - d_src1.upload(src1); - d_src2.upload(src2); - ocl::add(d_src1, d_src2, d_dst); - d_dst.download(ocl_dst); - GPU_FULL_OFF; + oclDst.download(dst); - TestSystem::instance().ExpectedMatNear(ocl_dst, dst, 0.0); - } + SANITY_CHECK(dst); + } + else if (impl == "plain") + { + TEST_CYCLE() cv::add(src1, src2, dst); + SANITY_CHECK(dst); } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); } ///////////// Mul //////////////////////// -PERFTEST(Mul) -{ - Mat src1, src2, dst, ocl_dst; - ocl::oclMat d_src1, d_src2, d_dst; - - int all_type[] = {CV_8UC1, CV_8UC4}; - std::string type_name[] = {"CV_8UC1", "CV_8UC4"}; - - for (int size = Min_Size; size <= Max_Size; size *= Multiple) - { - for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) - { - SUBTEST << size << 'x' << size << "; " << type_name[j] ; - - gen(src1, size, size, all_type[j], 0, 256); - gen(src2, size, size, all_type[j], 0, 256); - multiply(src1, src2, dst); +CV_ENUM(MulMatTypes, CV_8UC1, CV_8UC4) - CPU_ON; - multiply(src1, src2, dst); - CPU_OFF; - d_src1.upload(src1); - d_src2.upload(src2); +typedef tuple MulParams; +typedef TestBaseWithParam MulFixture; - WARMUP_ON; - ocl::multiply(d_src1, d_src2, d_dst); - WARMUP_OFF; +PERF_TEST_P(MulFixture, Mul, ::testing::Combine(OCL_TYPICAL_MAT_SIZES, + MulMatTypes::all())) +{ + // getting params + MulParams params = GetParam(); + const Size srcSize = get<0>(params); + const int type = get<1>(params); + const string impl = getSelectedImpl(); + + // creating src data + Mat src1(srcSize, type), src2(srcSize, type), dst(srcSize, type); + randu(src1, 0, 256); + randu(src2, 0, 256); + declare.in(src1, src2).out(dst); + + // select implementation + if (impl == "ocl") + { + ocl::oclMat oclSrc1(src1), oclSrc2(src2), oclDst(srcSize, type); - GPU_ON; - ocl::multiply(d_src1, d_src2, d_dst); - GPU_OFF; + TEST_CYCLE() cv::ocl::multiply(oclSrc1, oclSrc2, oclDst); - GPU_FULL_ON; - d_src1.upload(src1); - d_src2.upload(src2); - ocl::multiply(d_src1, d_src2, d_dst); - d_dst.download(ocl_dst); - GPU_FULL_OFF; + oclDst.download(dst); - TestSystem::instance().ExpectedMatNear(ocl_dst, dst, 0.0); - } + SANITY_CHECK(dst); + } + else if (impl == "plain") + { + TEST_CYCLE() cv::multiply(src1, src2, dst); + SANITY_CHECK(dst); } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); } ///////////// Div //////////////////////// -PERFTEST(Div) -{ - Mat src1, src2, dst, ocl_dst; - ocl::oclMat d_src1, d_src2, d_dst; - int all_type[] = {CV_8UC1, CV_8UC4}; - std::string type_name[] = {"CV_8UC1", "CV_8UC4"}; - for (int size = Min_Size; size <= Max_Size; size *= Multiple) - { - for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) - { - SUBTEST << size << 'x' << size << "; " << type_name[j]; +typedef MulMatTypes DivMatTypes; +typedef tuple DivParams; +typedef TestBaseWithParam DivFixture; - gen(src1, size, size, all_type[j], 0, 256); - gen(src2, size, size, all_type[j], 0, 256); - - divide(src1, src2, dst); - - CPU_ON; - divide(src1, src2, dst); - CPU_OFF; - - d_src1.upload(src1); - d_src2.upload(src2); - - WARMUP_ON; - ocl::divide(d_src1, d_src2, d_dst); - WARMUP_OFF; +PERF_TEST_P(DivFixture, Div, ::testing::Combine(OCL_TYPICAL_MAT_SIZES, + DivMatTypes::all())) +{ + // getting params + DivParams params = GetParam(); + const Size srcSize = get<0>(params); + const int type = get<1>(params); + const string impl = getSelectedImpl(); + + // creating src data + Mat src1(srcSize, type), src2(srcSize, type), dst(srcSize, type); + declare.in(src1, src2).out(dst); + randu(src1, 0, 256); + randu(src2, 0, 256); + + if ((srcSize == OCL_SIZE_4000 && type == CV_8UC1) || + (srcSize == OCL_SIZE_2000 && type == CV_8UC4)) + declare.time(4.2); + else if (srcSize == OCL_SIZE_4000 && type == CV_8UC4) + declare.time(16.6); + + // select implementation + if (impl == "ocl") + { + ocl::oclMat oclSrc1(src1), oclSrc2(src2), oclDst(srcSize, type); - GPU_ON; - ocl::divide(d_src1, d_src2, d_dst); - GPU_OFF; + TEST_CYCLE() cv::ocl::divide(oclSrc1, oclSrc2, oclDst); - GPU_FULL_ON; - d_src1.upload(src1); - d_src2.upload(src2); - ocl::divide(d_src1, d_src2, d_dst); - d_dst.download(ocl_dst); - GPU_FULL_OFF; + oclDst.download(dst); - TestSystem::instance().ExpectedMatNear(ocl_dst, dst, 1); - } + SANITY_CHECK(dst); + } + else if (impl == "plain") + { + TEST_CYCLE() cv::divide(src1, src2, dst); + SANITY_CHECK(dst); } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); } ///////////// Absdiff //////////////////////// -PERFTEST(Absdiff) -{ - Mat src1, src2, dst, ocl_dst; - ocl::oclMat d_src1, d_src2, d_dst; - int all_type[] = {CV_8UC1, CV_8UC4}; - std::string type_name[] = {"CV_8UC1", "CV_8UC4"}; +typedef MulMatTypes AbsDiffMatTypes; +typedef tuple AbsDiffParams; +typedef TestBaseWithParam AbsDiffFixture; - for (int size = Min_Size; size <= Max_Size; size *= Multiple) +PERF_TEST_P(AbsDiffFixture, Absdiff, ::testing::Combine(OCL_TYPICAL_MAT_SIZES, + AbsDiffMatTypes::all())) +{ + // getting params + AbsDiffParams params = GetParam(); + const Size srcSize = get<0>(params); + const int type = get<1>(params); + const string impl = getSelectedImpl(); + + // creating src data + Mat src1(srcSize, type), src2(srcSize, type), dst(srcSize, type); + declare.in(src1, src2).in(dst); + randu(src1, 0, 256); + randu(src2, 0, 256); + + // select implementation + if (impl == "ocl") { - for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) - { - SUBTEST << size << 'x' << size << "; " << type_name[j] ; - - gen(src1, size, size, all_type[j], 0, 256); - gen(src2, size, size, all_type[j], 0, 256); - gen(dst, size, size, all_type[j], 0, 256); - - absdiff(src1, src2, dst); - - CPU_ON; - absdiff(src1, src2, dst); - CPU_OFF; - - d_src1.upload(src1); - d_src2.upload(src2); + ocl::oclMat oclSrc1(src1), oclSrc2(src2), oclDst(srcSize, type); - WARMUP_ON; - ocl::absdiff(d_src1, d_src2, d_dst); - WARMUP_OFF; + TEST_CYCLE() cv::ocl::absdiff(oclSrc1, oclSrc2, oclDst); - GPU_ON; - ocl::absdiff(d_src1, d_src2, d_dst); - GPU_OFF; + oclDst.download(dst); - GPU_FULL_ON; - d_src1.upload(src1); - d_src2.upload(src2); - ocl::absdiff(d_src1, d_src2, d_dst); - d_dst.download(ocl_dst); - GPU_FULL_OFF; - - TestSystem::instance().ExpectedMatNear(ocl_dst, dst, 0.0); - } + SANITY_CHECK(dst); + } + else if (impl == "plain") + { + TEST_CYCLE() cv::absdiff(src1, src2, dst); + SANITY_CHECK(dst); } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); } ///////////// CartToPolar //////////////////////// -PERFTEST(CartToPolar) -{ - Mat src1, src2, dst, dst1, ocl_dst, ocl_dst1; - ocl::oclMat d_src1, d_src2, d_dst, d_dst1; - int all_type[] = {CV_32FC1}; - std::string type_name[] = {"CV_32FC1"}; +typedef TestBaseWithParam CartToPolarFixture; - for (int size = Min_Size; size <= Max_Size; size *= Multiple) +PERF_TEST_P(CartToPolarFixture, CartToPolar, OCL_TYPICAL_MAT_SIZES) +{ + // getting params + const Size srcSize = GetParam(); + const string impl = getSelectedImpl(); + + // creating src data + Mat src1(srcSize, CV_32FC1), src2(srcSize, CV_32FC1), + dst1(srcSize, CV_32FC1), dst2(srcSize, CV_32FC1); + declare.in(src1, src2).out(dst1, dst2); + randu(src1, 0, 256); + randu(src2, 0, 256); + + if (srcSize == OCL_SIZE_4000) + declare.time(3.6); + + // select implementation + if (impl == "ocl") { - for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) - { - SUBTEST << size << 'x' << size << "; " << type_name[j]; - - gen(src1, size, size, all_type[j], 0, 256); - gen(src2, size, size, all_type[j], 0, 256); - gen(dst, size, size, all_type[j], 0, 256); - gen(dst1, size, size, all_type[j], 0, 256); - + ocl::oclMat oclSrc1(src1), oclSrc2(src2), + oclDst1(srcSize, src1.type()), oclDst2(srcSize, src1.type()); - cartToPolar(src1, src2, dst, dst1, 1); + TEST_CYCLE() cv::ocl::cartToPolar(oclSrc1, oclSrc2, oclDst1, oclDst2); - CPU_ON; - cartToPolar(src1, src2, dst, dst1, 1); - CPU_OFF; + oclDst1.download(dst1); + oclDst2.download(dst2); - d_src1.upload(src1); - d_src2.upload(src2); - - WARMUP_ON; - ocl::cartToPolar(d_src1, d_src2, d_dst, d_dst1, 1); - WARMUP_OFF; - - GPU_ON; - ocl::cartToPolar(d_src1, d_src2, d_dst, d_dst1, 1); - GPU_OFF; - - GPU_FULL_ON; - d_src1.upload(src1); - d_src2.upload(src2); - ocl::cartToPolar(d_src1, d_src2, d_dst, d_dst1, 1); - d_dst.download(ocl_dst); - d_dst1.download(ocl_dst1); - GPU_FULL_OFF; - - double diff1 = checkNorm(ocl_dst1, dst1); - double diff2 = checkNorm(ocl_dst, dst); - double max_diff = max(diff1, diff2); - TestSystem::instance().setAccurate(max_diff<=.5?1:0, max_diff); - - } + SANITY_CHECK(dst1, 5e-3); + SANITY_CHECK(dst2, 5e-3); + } + else if (impl == "plain") + { + TEST_CYCLE() cv::cartToPolar(src1, src2, dst1, dst2); + SANITY_CHECK(dst1, 5e-3); + SANITY_CHECK(dst2, 5e-3); } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); } ///////////// PolarToCart //////////////////////// -PERFTEST(PolarToCart) -{ - Mat src1, src2, dst, dst1, ocl_dst, ocl_dst1; - ocl::oclMat d_src1, d_src2, d_dst, d_dst1; - int all_type[] = {CV_32FC1}; - std::string type_name[] = {"CV_32FC1"}; +typedef TestBaseWithParam PolarToCartFixture; - for (int size = Min_Size; size <= Max_Size; size *= Multiple) +PERF_TEST_P(PolarToCartFixture, PolarToCart, OCL_TYPICAL_MAT_SIZES) +{ + // getting params + const Size srcSize = GetParam(); + const string impl = getSelectedImpl(); + + // creating src data + Mat src1(srcSize, CV_32FC1), src2(srcSize, CV_32FC1), + dst1(srcSize, CV_32FC1), dst2(srcSize, CV_32FC1); + declare.in(src1, src2).out(dst1, dst2); + randu(src1, 0, 256); + randu(src2, 0, 256); + + if (srcSize == OCL_SIZE_4000) + declare.time(5.4); + + // select implementation + if (impl == "ocl") { - for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) - { - SUBTEST << size << 'x' << size << "; " << type_name[j] ; - - gen(src1, size, size, all_type[j], 0, 256); - gen(src2, size, size, all_type[j], 0, 256); - gen(dst, size, size, all_type[j], 0, 256); - gen(dst1, size, size, all_type[j], 0, 256); - - - polarToCart(src1, src2, dst, dst1, 1); - - CPU_ON; - polarToCart(src1, src2, dst, dst1, 1); - CPU_OFF; - d_src1.upload(src1); - d_src2.upload(src2); - - WARMUP_ON; - ocl::polarToCart(d_src1, d_src2, d_dst, d_dst1, 1); - WARMUP_OFF; + ocl::oclMat oclSrc1(src1), oclSrc2(src2), + oclDst1(srcSize, src1.type()), oclDst2(srcSize, src1.type()); - GPU_ON; - ocl::polarToCart(d_src1, d_src2, d_dst, d_dst1, 1); - GPU_OFF; + TEST_CYCLE() cv::ocl::polarToCart(oclSrc1, oclSrc2, oclDst1, oclDst2); - GPU_FULL_ON; - d_src1.upload(src1); - d_src2.upload(src2); - ocl::polarToCart(d_src1, d_src2, d_dst, d_dst1, 1); - d_dst.download(ocl_dst); - d_dst1.download(ocl_dst1); - GPU_FULL_OFF; + oclDst1.download(dst1); + oclDst2.download(dst2); - double diff1 = checkNorm(ocl_dst1, dst1); - double diff2 = checkNorm(ocl_dst, dst); - double max_diff = max(diff1, diff2); - TestSystem::instance().setAccurate(max_diff<=.5?1:0, max_diff); - - } + SANITY_CHECK(dst1, 5e-5); + SANITY_CHECK(dst2, 5e-5); + } + else if (impl == "plain") + { + TEST_CYCLE() cv::polarToCart(src1, src2, dst1, dst2); + SANITY_CHECK(dst1, 5e-5); + SANITY_CHECK(dst2, 5e-5); } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); } ///////////// Magnitude //////////////////////// -PERFTEST(magnitude) -{ - Mat x, y, mag, ocl_mag; - ocl::oclMat d_x, d_y, d_mag; - int all_type[] = {CV_32FC1}; - std::string type_name[] = {"CV_32FC1"}; +typedef TestBaseWithParam MagnitudeFixture; - for (int size = Min_Size; size <= Max_Size; size *= Multiple) +PERF_TEST_P(MagnitudeFixture, Magnitude, OCL_TYPICAL_MAT_SIZES) +{ + // getting params + const Size srcSize = GetParam(); + const string impl = getSelectedImpl(); + + // creating src data + Mat src1(srcSize, CV_32FC1), src2(srcSize, CV_32FC1), + dst(srcSize, CV_32FC1); + randu(src1, 0, 1); + randu(src2, 0, 1); + declare.in(src1, src2).out(dst); + + // select implementation + if (impl == "ocl") { - for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) - { - SUBTEST << size << 'x' << size << "; " << type_name[j]; - - gen(x, size, size, all_type[j], 0, 1); - gen(y, size, size, all_type[j], 0, 1); + ocl::oclMat oclSrc1(src1), oclSrc2(src2), + oclDst(srcSize, src1.type()); - magnitude(x, y, mag); + TEST_CYCLE() cv::ocl::magnitude(oclSrc1, oclSrc2, oclDst); - CPU_ON; - magnitude(x, y, mag); - CPU_OFF; - d_x.upload(x); - d_y.upload(y); + oclDst.download(dst); - WARMUP_ON; - ocl::magnitude(d_x, d_y, d_mag); - WARMUP_OFF; - - GPU_ON; - ocl::magnitude(d_x, d_y, d_mag); - GPU_OFF; - - GPU_FULL_ON; - d_x.upload(x); - d_y.upload(y); - ocl::magnitude(d_x, d_y, d_mag); - d_mag.download(ocl_mag); - GPU_FULL_OFF; - - TestSystem::instance().ExpectedMatNear(ocl_mag, mag, 1e-5); - } + SANITY_CHECK(dst, 1e-6); + } + else if (impl == "plain") + { + TEST_CYCLE() cv::magnitude(src1, src2, dst); + SANITY_CHECK(dst, 1e-6); } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); } ///////////// Transpose //////////////////////// -PERFTEST(Transpose) -{ - Mat src, dst, ocl_dst; - ocl::oclMat d_src, d_dst; - int all_type[] = {CV_8UC1, CV_8UC4}; - std::string type_name[] = {"CV_8UC1", "CV_8UC4"}; +typedef MulMatTypes TransposeMatTypes; +typedef tuple TransposeParams; +typedef TestBaseWithParam TransposeFixture; - for (int size = Min_Size; size <= Max_Size; size *= Multiple) +PERF_TEST_P(TransposeFixture, Transpose, + ::testing::Combine(OCL_TYPICAL_MAT_SIZES, + TransposeMatTypes::all())) +{ + // getting params + TransposeParams params = GetParam(); + const Size srcSize = get<0>(params); + const int type = get<1>(params); + const string impl = getSelectedImpl(); + + // creating src data + Mat src(srcSize, type), dst(srcSize, type); + declare.in(src, WARMUP_RNG).out(dst); + + // select implementation + if (impl == "ocl") { - for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) - { - SUBTEST << size << 'x' << size << "; " << type_name[j]; + ocl::oclMat oclSrc(src), oclDst(srcSize, type); - gen(src, size, size, all_type[j], 0, 256); - gen(dst, size, size, all_type[j], 0, 256); + TEST_CYCLE() cv::ocl::transpose(oclSrc, oclDst); - transpose(src, dst); + oclDst.download(dst); - CPU_ON; - transpose(src, dst); - CPU_OFF; - d_src.upload(src); - - WARMUP_ON; - ocl::transpose(d_src, d_dst); - WARMUP_OFF; - - GPU_ON; - ocl::transpose(d_src, d_dst); - GPU_OFF; - - GPU_FULL_ON; - d_src.upload(src); - ocl::transpose(d_src, d_dst); - d_dst.download(ocl_dst); - GPU_FULL_OFF; - - TestSystem::instance().ExpectedMatNear(ocl_dst, dst, 1e-5); - } + SANITY_CHECK(dst); + } + else if (impl == "plain") + { + TEST_CYCLE() cv::transpose(src, dst); + SANITY_CHECK(dst); } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); } ///////////// Flip //////////////////////// -PERFTEST(Flip) -{ - Mat src, dst, ocl_dst; - ocl::oclMat d_src, d_dst; - int all_type[] = {CV_8UC1, CV_8UC4}; - std::string type_name[] = {"CV_8UC1", "CV_8UC4"}; +typedef MulMatTypes FlipMatTypes; +typedef tuple FlipParams; +typedef TestBaseWithParam FlipFixture; - for (int size = Min_Size; size <= Max_Size; size *= Multiple) +PERF_TEST_P(FlipFixture, Flip, + ::testing::Combine(OCL_TYPICAL_MAT_SIZES, + FlipMatTypes::all())) +{ + // getting params + TransposeParams params = GetParam(); + const Size srcSize = get<0>(params); + const int type = get<1>(params); + const string impl = getSelectedImpl(); + + // creating src data + Mat src(srcSize, type), dst(srcSize, type); + declare.in(src, WARMUP_RNG).out(dst); + + // select implementation + if (impl == "ocl") { - for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) - { - SUBTEST << size << 'x' << size << "; " << type_name[j] << " ; FLIP_BOTH"; - - gen(src, size, size, all_type[j], 0, 256); - gen(dst, size, size, all_type[j], 0, 256); - - flip(src, dst, 0); + ocl::oclMat oclSrc(src), oclDst(srcSize, type); - CPU_ON; - flip(src, dst, 0); - CPU_OFF; - d_src.upload(src); + TEST_CYCLE() cv::ocl::flip(oclSrc, oclDst, 0); - WARMUP_ON; - ocl::flip(d_src, d_dst, 0); - WARMUP_OFF; + oclDst.download(dst); - GPU_ON; - ocl::flip(d_src, d_dst, 0); - GPU_OFF; - - GPU_FULL_ON; - d_src.upload(src); - ocl::flip(d_src, d_dst, 0); - d_dst.download(ocl_dst); - GPU_FULL_OFF; - - TestSystem::instance().ExpectedMatNear(ocl_dst, dst, 1e-5); - } + SANITY_CHECK(dst); + } + else if (impl == "plain") + { + TEST_CYCLE() cv::flip(src, dst, 0); + SANITY_CHECK(dst); } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); } ///////////// minMax //////////////////////// -PERFTEST(minMax) -{ - Mat src; - ocl::oclMat d_src; - - double min_val = 0.0, max_val = 0.0; - double min_val_ = 0.0, max_val_ = 0.0; - Point min_loc, max_loc; - int all_type[] = {CV_8UC1, CV_32FC1}; - std::string type_name[] = {"CV_8UC1", "CV_32FC1"}; - for (int size = Min_Size; size <= Max_Size; size *= Multiple) - { - for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) - { - SUBTEST << size << 'x' << size << "; " << type_name[j]; +typedef AddMatTypes minMaxMatTypes; +typedef tuple minMaxParams; +typedef TestBaseWithParam minMaxFixture; - gen(src, size, size, all_type[j], 0, 256); +PERF_TEST_P(minMaxFixture, minMax, + ::testing::Combine(OCL_TYPICAL_MAT_SIZES, + minMaxMatTypes::all())) +{ + // getting params + minMaxParams params = GetParam(); + const Size srcSize = get<0>(params); + const int type = get<1>(params); + const string impl = getSelectedImpl(); - CPU_ON; - minMaxLoc(src, &min_val, &max_val, &min_loc, &max_loc); - CPU_OFF; - d_src.upload(src); + // creating src data + Mat src(srcSize, type); + declare.in(src, WARMUP_RNG); - WARMUP_ON; - ocl::minMax(d_src, &min_val_, &max_val_); - WARMUP_OFF; + double min_val = 0.0, max_val = 0.0; - if(EeceptDoubleEQ(max_val_, max_val) && EeceptDoubleEQ(min_val_, min_val)) - TestSystem::instance().setAccurate(1, max(fabs(max_val_-max_val), fabs(min_val_-min_val))); - else - TestSystem::instance().setAccurate(0, max(fabs(max_val_-max_val), fabs(min_val_-min_val))); + // select implementation + if (impl == "ocl") + { + ocl::oclMat oclSrc(src); - GPU_ON; - ocl::minMax(d_src, &min_val, &max_val); - GPU_OFF; + TEST_CYCLE() cv::ocl::minMax(oclSrc, &min_val, &max_val); - GPU_FULL_ON; - d_src.upload(src); - ocl::minMax(d_src, &min_val, &max_val); - GPU_FULL_OFF; + ASSERT_GE(max_val, min_val); + SANITY_CHECK(min_val); + SANITY_CHECK(max_val); + } + else if (impl == "plain") + { + Point min_loc, max_loc; - } + TEST_CYCLE() cv::minMaxLoc(src, &min_val, &max_val, &min_loc, &max_loc); + ASSERT_GE(max_val, min_val); + SANITY_CHECK(min_val); + SANITY_CHECK(max_val); } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); } ///////////// minMaxLoc //////////////////////// -PERFTEST(minMaxLoc) + +typedef AddMatTypes minMaxLocMatTypes; +typedef tuple minMaxLocParams; +typedef TestBaseWithParam minMaxLocFixture; + +PERF_TEST_P(minMaxLocFixture, minMaxLoc, + ::testing::Combine(OCL_TYPICAL_MAT_SIZES, + minMaxLocMatTypes::all())) { - Mat src; - ocl::oclMat d_src; + // getting params + minMaxLocParams params = GetParam(); + const Size srcSize = get<0>(params); + const int type = get<1>(params); + const string impl = getSelectedImpl(); + + // creating src data + Mat src(srcSize, type); + randu(src, 0, 1); + declare.in(src); double min_val = 0.0, max_val = 0.0; - double min_val_ = 0.0, max_val_ = 0.0; Point min_loc, max_loc; - Point min_loc_, max_loc_; - int all_type[] = {CV_8UC1, CV_32FC1}; - std::string type_name[] = {"CV_8UC1", "CV_32FC1"}; - for (int size = Min_Size; size <= Max_Size; size *= Multiple) + // select implementation + if (impl == "ocl") { - for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) - { - SUBTEST << size << 'x' << size << "; " << type_name[j] ; + ocl::oclMat oclSrc(src); - gen(src, size, size, all_type[j], 0, 1); + TEST_CYCLE() cv::ocl::minMaxLoc(oclSrc, &min_val, &max_val, &min_loc, &max_loc); - CPU_ON; - minMaxLoc(src, &min_val, &max_val, &min_loc, &max_loc); - CPU_OFF; - d_src.upload(src); - - WARMUP_ON; - ocl::minMaxLoc(d_src, &min_val_, &max_val_, &min_loc_, &max_loc_); - WARMUP_OFF; - - double error0 = 0., error1 = 0., minlocVal = 0., minlocVal_ = 0., maxlocVal = 0., maxlocVal_ = 0.; - if(src.depth() == 0) - { - minlocVal = src.at(min_loc); - minlocVal_ = src.at(min_loc_); - maxlocVal = src.at(max_loc); - maxlocVal_ = src.at(max_loc_); - } - if(src.depth() == 1) - { - minlocVal = src.at(min_loc); - minlocVal_ = src.at(min_loc_); - maxlocVal = src.at(max_loc); - maxlocVal_ = src.at(max_loc_); - } - if(src.depth() == 2) - { - minlocVal = src.at(min_loc); - minlocVal_ = src.at(min_loc_); - maxlocVal = src.at(max_loc); - maxlocVal_ = src.at(max_loc_); - } - if(src.depth() == 3) - { - minlocVal = src.at(min_loc); - minlocVal_ = src.at(min_loc_); - maxlocVal = src.at(max_loc); - maxlocVal_ = src.at(max_loc_); - } - if(src.depth() == 4) - { - minlocVal = src.at(min_loc); - minlocVal_ = src.at(min_loc_); - maxlocVal = src.at(max_loc); - maxlocVal_ = src.at(max_loc_); - } - if(src.depth() == 5) - { - minlocVal = src.at(min_loc); - minlocVal_ = src.at(min_loc_); - maxlocVal = src.at(max_loc); - maxlocVal_ = src.at(max_loc_); - } - if(src.depth() == 6) - { - minlocVal = src.at(min_loc); - minlocVal_ = src.at(min_loc_); - maxlocVal = src.at(max_loc); - maxlocVal_ = src.at(max_loc_); - } - error0 = ::abs(minlocVal_ - minlocVal); - error1 = ::abs(maxlocVal_ - maxlocVal); - if( EeceptDoubleEQ(maxlocVal_, maxlocVal) - &&EeceptDoubleEQ(minlocVal_, minlocVal) - &&EeceptDoubleEQ(max_val_, max_val) - &&EeceptDoubleEQ(min_val_, min_val)) - TestSystem::instance().setAccurate(1, 0.); - else - TestSystem::instance().setAccurate(0, max(error0, error1)); - - GPU_ON; - ocl::minMaxLoc(d_src, &min_val, &max_val, &min_loc, &max_loc); - GPU_OFF; - - GPU_FULL_ON; - d_src.upload(src); - ocl::minMaxLoc(d_src, &min_val, &max_val, &min_loc, &max_loc); - GPU_FULL_OFF; - } + ASSERT_GE(max_val, min_val); + SANITY_CHECK(min_val); + SANITY_CHECK(max_val); + } + else if (impl == "plain") + { + TEST_CYCLE() cv::minMaxLoc(src, &min_val, &max_val, &min_loc, &max_loc); + ASSERT_GE(max_val, min_val); + SANITY_CHECK(min_val); + SANITY_CHECK(max_val); } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); } ///////////// Sum //////////////////////// -PERFTEST(Sum) -{ - Mat src; - Scalar cpures, gpures; - ocl::oclMat d_src; - - int all_type[] = {CV_8UC1, CV_32SC1}; - std::string type_name[] = {"CV_8UC1", "CV_32SC1"}; - - for (int size = Min_Size; size <= Max_Size; size *= Multiple) - { - for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) - { - SUBTEST << size << 'x' << size << "; " << type_name[j] ; - gen(src, size, size, all_type[j], 0, 60); +CV_ENUM(SumMatTypes, CV_8UC1, CV_32SC1) - cpures = sum(src); +typedef tuple SumParams; +typedef TestBaseWithParam SumFixture; - CPU_ON; - cpures = sum(src); - CPU_OFF; - d_src.upload(src); - - WARMUP_ON; - gpures = ocl::sum(d_src); - WARMUP_OFF; - - vector diffs(4); - diffs[3] = fabs(cpures[3] - gpures[3]); - diffs[2] = fabs(cpures[2] - gpures[2]); - diffs[1] = fabs(cpures[1] - gpures[1]); - diffs[0] = fabs(cpures[0] - gpures[0]); - double max_diff = *max_element(diffs.begin(), diffs.end()); - TestSystem::instance().setAccurate(max_diff<0.1?1:0, max_diff); +PERF_TEST_P(SumFixture, Sum, + ::testing::Combine(OCL_TYPICAL_MAT_SIZES, + SumMatTypes::all())) +{ + // getting params + SumParams params = GetParam(); + const Size srcSize = get<0>(params); + const int type = get<1>(params); + const string impl = getSelectedImpl(); + + // creating src data + Mat src(srcSize, type); + Scalar result; + randu(src, 0, 60); + declare.in(src); + + // select implementation + if (impl == "ocl") + { + ocl::oclMat oclSrc(src); - GPU_ON; - gpures = ocl::sum(d_src); - GPU_OFF; + TEST_CYCLE() result = cv::ocl::sum(oclSrc); - GPU_FULL_ON; - d_src.upload(src); - gpures = ocl::sum(d_src); - GPU_FULL_OFF; - } + SANITY_CHECK(result); + } + else if (impl == "plain") + { + TEST_CYCLE() result = cv::sum(src); + SANITY_CHECK(result); } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); } ///////////// countNonZero //////////////////////// -PERFTEST(countNonZero) -{ - Mat src; - ocl::oclMat d_src; - int all_type[] = {CV_8UC1, CV_32FC1}; - std::string type_name[] = {"CV_8UC1", "CV_32FC1"}; +CV_ENUM(countNonZeroMatTypes, CV_8UC1, CV_32FC1) - for (int size = Min_Size; size <= Max_Size; size *= Multiple) - { - for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) - { - SUBTEST << size << 'x' << size << "; " << type_name[j] ; - - gen(src, size, size, all_type[j], 0, 256); - - countNonZero(src); - - int cpures = 0, gpures = 0; - CPU_ON; - cpures = countNonZero(src); - CPU_OFF; - d_src.upload(src); +typedef tuple countNonZeroParams; +typedef TestBaseWithParam countNonZeroFixture; - WARMUP_ON; - gpures = ocl::countNonZero(d_src); - WARMUP_OFF; - - int diff = abs(cpures - gpures); - if(diff == 0) - TestSystem::instance().setAccurate(1, 0); - else - TestSystem::instance().setAccurate(0, diff); +PERF_TEST_P(countNonZeroFixture, countNonZero, + ::testing::Combine(OCL_TYPICAL_MAT_SIZES, + countNonZeroMatTypes::all())) +{ + // getting params + countNonZeroParams params = GetParam(); + const Size srcSize = get<0>(params); + const int type = get<1>(params); + const string impl = getSelectedImpl(); + + // creating src data + Mat src(srcSize, type); + int result = 0; + randu(src, 0, 256); + declare.in(src); + + // select implementation + if (impl == "ocl") + { + ocl::oclMat oclSrc(src); - GPU_ON; - ocl::countNonZero(d_src); - GPU_OFF; + TEST_CYCLE() result = cv::ocl::countNonZero(oclSrc); - GPU_FULL_ON; - d_src.upload(src); - ocl::countNonZero(d_src); - GPU_FULL_OFF; - } + SANITY_CHECK(result); + } + else if (impl == "plain") + { + TEST_CYCLE() result = cv::countNonZero(src); + SANITY_CHECK(result); } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); } ///////////// Phase //////////////////////// -PERFTEST(Phase) -{ - Mat src1, src2, dst, ocl_dst; - ocl::oclMat d_src1, d_src2, d_dst; - int all_type[] = {CV_32FC1}; - std::string type_name[] = {"CV_32FC1"}; +typedef TestBaseWithParam PhaseFixture; - for (int size = Min_Size; size <= Max_Size; size *= Multiple) +PERF_TEST_P(PhaseFixture, Phase, OCL_TYPICAL_MAT_SIZES) +{ + // getting params + const Size srcSize = GetParam(); + const string impl = getSelectedImpl(); + + // creating src data + Mat src1(srcSize, CV_32FC1), src2(srcSize, CV_32FC1), + dst(srcSize, CV_32FC1); + declare.in(src1, src2).out(dst); + randu(src1, 0, 256); + randu(src2, 0, 256); + + // select implementation + if (impl == "ocl") { - for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) - { - SUBTEST << size << 'x' << size << "; " << type_name[j] ; - - gen(src1, size, size, all_type[j], 0, 256); - gen(src2, size, size, all_type[j], 0, 256); - gen(dst, size, size, all_type[j], 0, 256); - - phase(src1, src2, dst, 1); - - CPU_ON; - phase(src1, src2, dst, 1); - CPU_OFF; + ocl::oclMat oclSrc1(src1), oclSrc2(src2), + oclDst(srcSize, src1.type()); - d_src1.upload(src1); - d_src2.upload(src2); + TEST_CYCLE() cv::ocl::phase(oclSrc1, oclSrc2, oclDst, 1); - WARMUP_ON; - ocl::phase(d_src1, d_src2, d_dst, 1); - WARMUP_OFF; + oclDst.download(dst); - GPU_ON; - ocl::phase(d_src1, d_src2, d_dst, 1); - GPU_OFF; - - GPU_FULL_ON; - d_src1.upload(src1); - d_src2.upload(src2); - ocl::phase(d_src1, d_src2, d_dst, 1); - d_dst.download(ocl_dst); - GPU_FULL_OFF; - - TestSystem::instance().ExpectedMatNear(ocl_dst, dst, 1e-2); - } + SANITY_CHECK(dst, 1e-2); + } + else if (impl == "plain") + { + TEST_CYCLE() cv::phase(src1, src2, dst, 1); + SANITY_CHECK(dst, 1e-2); } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); } ///////////// bitwise_and//////////////////////// -PERFTEST(bitwise_and) -{ - Mat src1, src2, dst, ocl_dst; - ocl::oclMat d_src1, d_src2, d_dst; - int all_type[] = {CV_8UC1, CV_32SC1}; - std::string type_name[] = {"CV_8UC1", "CV_32SC1"}; +typedef SumMatTypes BitwiseAndMatTypes; +typedef tuple BitwiseAndParams; +typedef TestBaseWithParam BitwiseAndFixture; - for (int size = Min_Size; size <= Max_Size; size *= Multiple) +PERF_TEST_P(BitwiseAndFixture, bitwise_and, + ::testing::Combine(OCL_TYPICAL_MAT_SIZES, + BitwiseAndMatTypes::all())) +{ + // getting params + BitwiseAndParams params = GetParam(); + const Size srcSize = get<0>(params); + const int type = get<1>(params); + const string impl = getSelectedImpl(); + + // creating src data + Mat src1(srcSize, type), src2(srcSize, type), dst(srcSize, type); + declare.in(src1, src2).out(dst); + randu(src1, 0, 256); + randu(src2, 0, 256); + + // select implementation + if (impl == "ocl") { - for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) - { - SUBTEST << size << 'x' << size << "; " << type_name[j] ; + ocl::oclMat oclSrc1(src1), oclSrc2(src2), oclDst(srcSize, src1.type()); - gen(src1, size, size, all_type[j], 0, 256); - gen(src2, size, size, all_type[j], 0, 256); - gen(dst, size, size, all_type[j], 0, 256); + TEST_CYCLE() cv::ocl::bitwise_and(oclSrc1, oclSrc2, oclDst); - bitwise_and(src1, src2, dst); + oclDst.download(dst); - CPU_ON; - bitwise_and(src1, src2, dst); - CPU_OFF; - d_src1.upload(src1); - d_src2.upload(src2); - - WARMUP_ON; - ocl::bitwise_and(d_src1, d_src2, d_dst); - WARMUP_OFF; - - GPU_ON; - ocl::bitwise_and(d_src1, d_src2, d_dst); - GPU_OFF; - - GPU_FULL_ON; - d_src1.upload(src1); - d_src2.upload(src2); - ocl::bitwise_and(d_src1, d_src2, d_dst); - d_dst.download(ocl_dst); - GPU_FULL_OFF; - - TestSystem::instance().ExpectedMatNear(ocl_dst, dst, 0.0); - } + SANITY_CHECK(dst); + } + else if (impl == "plain") + { + TEST_CYCLE() cv::bitwise_and(src1, src2, dst); + SANITY_CHECK(dst); } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); } ///////////// bitwise_not//////////////////////// -PERFTEST(bitwise_not) -{ - Mat src1, dst, ocl_dst; - ocl::oclMat d_src1, d_dst; - int all_type[] = {CV_8UC1, CV_32SC1}; - std::string type_name[] = {"CV_8UC1", "CV_32SC1"}; +typedef SumMatTypes BitwiseNotMatTypes; +typedef tuple BitwiseNotParams; +typedef TestBaseWithParam BitwiseNotFixture; - for (int size = Min_Size; size <= Max_Size; size *= Multiple) +PERF_TEST_P(BitwiseAndFixture, bitwise_not, + ::testing::Combine(OCL_TYPICAL_MAT_SIZES, + BitwiseAndMatTypes::all())) +{ + // getting params + BitwiseNotParams params = GetParam(); + const Size srcSize = get<0>(params); + const int type = get<1>(params); + const string impl = getSelectedImpl(); + + // creating src data + Mat src(srcSize, type), dst(srcSize, type); + declare.in(src, WARMUP_RNG).out(dst); + + // select implementation + if (impl == "ocl") { - for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) - { - SUBTEST << size << 'x' << size << "; " << type_name[j] ; - - gen(src1, size, size, all_type[j], 0, 256); - gen(dst, size, size, all_type[j], 0, 256); - - bitwise_not(src1, dst); - - CPU_ON; - bitwise_not(src1, dst); - CPU_OFF; - d_src1.upload(src1); + ocl::oclMat oclSrc(src), oclDst(srcSize, type); - WARMUP_ON; - ocl::bitwise_not(d_src1, d_dst); - WARMUP_OFF; + TEST_CYCLE() cv::ocl::bitwise_not(oclSrc, oclDst); - GPU_ON; - ocl::bitwise_not(d_src1, d_dst); - GPU_OFF; + oclDst.download(dst); - GPU_FULL_ON; - d_src1.upload(src1); - ocl::bitwise_not(d_src1, d_dst); - d_dst.download(ocl_dst); - GPU_FULL_OFF; - - TestSystem::instance().ExpectedMatNear(ocl_dst, dst, 0.0); - } + SANITY_CHECK(dst); + } + else if (impl == "plain") + { + TEST_CYCLE() cv::bitwise_not(src, dst); + SANITY_CHECK(dst); } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); } ///////////// compare//////////////////////// -PERFTEST(compare) -{ - Mat src1, src2, dst, ocl_dst; - ocl::oclMat d_src1, d_src2, d_dst; - int CMP_EQ = 0; - int all_type[] = {CV_8UC1, CV_32FC1}; - std::string type_name[] = {"CV_8UC1", "CV_32FC1"}; +typedef countNonZeroMatTypes CompareMatTypes; +typedef tuple CompareParams; +typedef TestBaseWithParam CompareFixture; - for (int size = Min_Size; size <= Max_Size; size *= Multiple) +PERF_TEST_P(CompareFixture, compare, + ::testing::Combine(OCL_TYPICAL_MAT_SIZES, + CompareMatTypes::all())) +{ + // getting params + CompareParams params = GetParam(); + const Size srcSize = get<0>(params); + const int type = get<1>(params); + const string impl = getSelectedImpl(); + + // creating src data + Mat src1(srcSize, type), src2(srcSize, type), dst(srcSize, CV_8UC1); + declare.in(src1, src2, WARMUP_RNG).out(dst); + + // select implementation + if (impl == "ocl") { - for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) - { - SUBTEST << size << 'x' << size << "; " << type_name[j] ; - - gen(src1, size, size, all_type[j], 0, 256); - gen(src2, size, size, all_type[j], 0, 256); - gen(dst, size, size, all_type[j], 0, 256); - - compare(src1, src2, dst, CMP_EQ); - - CPU_ON; - compare(src1, src2, dst, CMP_EQ); - CPU_OFF; - - d_src1.upload(src1); - d_src2.upload(src2); - - WARMUP_ON; - ocl::compare(d_src1, d_src2, d_dst, CMP_EQ); - WARMUP_OFF; + ocl::oclMat oclSrc1(src1), oclSrc2(src2), oclDst(srcSize, CV_8UC1); - GPU_ON; - ocl::compare(d_src1, d_src2, d_dst, CMP_EQ); - GPU_OFF; + TEST_CYCLE() cv::ocl::compare(oclSrc1, oclSrc2, oclDst, CMP_EQ); - GPU_FULL_ON; - d_src1.upload(src1); - d_src2.upload(src2); - ocl::compare(d_src1, d_src2, d_dst, CMP_EQ); - d_dst.download(ocl_dst); - GPU_FULL_OFF; + oclDst.download(dst); - TestSystem::instance().ExpectedMatNear(ocl_dst, dst, 0.0); - } + SANITY_CHECK(dst); + } + else if (impl == "plain") + { + TEST_CYCLE() cv::compare(src1, src2, dst, CMP_EQ); + SANITY_CHECK(dst); } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); } ///////////// pow //////////////////////// -PERFTEST(pow) -{ - Mat src, dst, ocl_dst; - ocl::oclMat d_src, d_dst; - - int all_type[] = {CV_32FC1}; - std::string type_name[] = {"CV_32FC1"}; - - for (int size = Min_Size; size <= Max_Size; size *= Multiple) - { - for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) - { - SUBTEST << size << 'x' << size << "; " << type_name[j] ; - gen(src, size, size, all_type[j], 5, 16); +typedef TestBaseWithParam PowFixture; - pow(src, -2.0, dst); +PERF_TEST_P(PowFixture, pow, OCL_TYPICAL_MAT_SIZES) +{ + // getting params + const Size srcSize = GetParam(); + const string impl = getSelectedImpl(); - CPU_ON; - pow(src, -2.0, dst); - CPU_OFF; - d_src.upload(src); - d_dst.upload(dst); + // creating src data + Mat src(srcSize, CV_32F), dst(srcSize, CV_32F); + declare.in(src, WARMUP_RNG).out(dst); - WARMUP_ON; - ocl::pow(d_src, -2.0, d_dst); - WARMUP_OFF; + // select implementation + if (impl == "ocl") + { + ocl::oclMat oclSrc(src), oclDst(srcSize, src.type()); - GPU_ON; - ocl::pow(d_src, -2.0, d_dst); - GPU_OFF; + TEST_CYCLE() cv::ocl::pow(oclSrc, -2.0, oclDst); - GPU_FULL_ON; - d_src.upload(src); - ocl::pow(d_src, -2.0, d_dst); - d_dst.download(ocl_dst); - GPU_FULL_OFF; + oclDst.download(dst); - TestSystem::instance().ExpectedMatNear(ocl_dst, dst, 1.0); - } + SANITY_CHECK(dst, 5e-2); + } + else if (impl == "plain") + { + TEST_CYCLE() cv::pow(src, -2.0, dst); + SANITY_CHECK(dst, 5e-2); } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); } ///////////// MagnitudeSqr//////////////////////// -PERFTEST(MagnitudeSqr) -{ - Mat src1, src2, dst, ocl_dst; - ocl::oclMat d_src1, d_src2, d_dst; - - int all_type[] = {CV_32FC1}; - std::string type_name[] = {"CV_32FC1"}; - for (int size = Min_Size; size <= Max_Size; size *= Multiple) - { - for (size_t t = 0; t < sizeof(all_type) / sizeof(int); t++) - { - SUBTEST << size << 'x' << size << "; " << type_name[t]; +typedef TestBaseWithParam MagnitudeSqrFixture; - gen(src1, size, size, all_type[t], 0, 256); - gen(src2, size, size, all_type[t], 0, 256); - gen(dst, size, size, all_type[t], 0, 256); - - CPU_ON; - for (int i = 0; i < src1.rows; ++i) - for (int j = 0; j < src1.cols; ++j) - { - float val1 = src1.at(i, j); - float val2 = src2.at(i, j); - ((float *)(dst.data))[i * dst.step / 4 + j] = val1 * val1 + val2 * val2; +PERF_TEST_P(MagnitudeSqrFixture, MagnitudeSqr, OCL_TYPICAL_MAT_SIZES) +{ + // getting params + const Size srcSize = GetParam(); + const string impl = getSelectedImpl(); - } - CPU_OFF; + // creating src data + Mat src1(srcSize, CV_32FC1), src2(srcSize, CV_32FC1), + dst(srcSize, CV_32FC1); + declare.in(src1, src2, WARMUP_RNG).out(dst); - d_src1.upload(src1); - d_src2.upload(src2); + // select implementation + if (impl == "ocl") + { + ocl::oclMat oclSrc1(src1), oclSrc2(src2), oclDst(srcSize, src1.type()); - WARMUP_ON; - ocl::magnitudeSqr(d_src1, d_src2, d_dst); - WARMUP_OFF; + TEST_CYCLE() cv::ocl::magnitudeSqr(oclSrc1, oclSrc2, oclDst); - GPU_ON; - ocl::magnitudeSqr(d_src1, d_src2, d_dst); - GPU_OFF; + oclDst.download(dst); - GPU_FULL_ON; - d_src1.upload(src1); - d_src2.upload(src2); - ocl::magnitudeSqr(d_src1, d_src2, d_dst); - d_dst.download(ocl_dst); - GPU_FULL_OFF; + SANITY_CHECK(dst, 1e-6, ERROR_RELATIVE); + } + else if (impl == "plain") + { + ASSERT_EQ(1, src1.channels()); - TestSystem::instance().ExpectedMatNear(ocl_dst, dst, 1.0); + TEST_CYCLE() + { + for (int y = 0; y < srcSize.height; ++y) + { + const float * const src1Data = reinterpret_cast(src1.data + src1.step * y); + const float * const src2Data = reinterpret_cast(src2.data + src2.step * y); + float * const dstData = reinterpret_cast(dst.data + dst.step * y); + for (int x = 0; x < srcSize.width; ++x) + { + float t0 = src1Data[x] * src1Data[x]; + float t1 = src2Data[x] * src2Data[x]; + dstData[x] = t0 + t1; + } + } } + SANITY_CHECK(dst, 1e-6, ERROR_RELATIVE); } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); } ///////////// AddWeighted//////////////////////// -PERFTEST(AddWeighted) -{ - Mat src1, src2, dst, ocl_dst; - ocl::oclMat d_src1, d_src2, d_dst; +typedef countNonZeroMatTypes AddWeightedMatTypes; +typedef tuple AddWeightedParams; +typedef TestBaseWithParam AddWeightedFixture; + +PERF_TEST_P(AddWeightedFixture, AddWeighted, + ::testing::Combine(OCL_TYPICAL_MAT_SIZES, + AddWeightedMatTypes::all())) +{ + // getting params + AddWeightedParams params = GetParam(); + const Size srcSize = get<0>(params); + const int type = get<1>(params); + const string impl = getSelectedImpl(); + + // creating src data + Mat src1(srcSize, type), src2(srcSize, type), dst(srcSize, type); + declare.in(src1, src2, WARMUP_RNG).out(dst); double alpha = 2.0, beta = 1.0, gama = 3.0; - int all_type[] = {CV_8UC1, CV_32FC1}; - std::string type_name[] = {"CV_8UC1", "CV_32FC1"}; - for (int size = Min_Size; size <= Max_Size; size *= Multiple) + // select implementation + if (impl == "ocl") { - for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) - { - SUBTEST << size << 'x' << size << "; " << type_name[j] ; + ocl::oclMat oclSrc1(src1), oclSrc2(src2), oclDst(srcSize, type); - gen(src1, size, size, all_type[j], 0, 256); - gen(src2, size, size, all_type[j], 0, 256); - gen(dst, size, size, all_type[j], 0, 256); + TEST_CYCLE() cv::ocl::addWeighted(oclSrc1, alpha, oclSrc2, beta, gama, oclDst); + oclDst.download(dst); - addWeighted(src1, alpha, src2, beta, gama, dst); - - CPU_ON; - addWeighted(src1, alpha, src2, beta, gama, dst); - CPU_OFF; - d_src1.upload(src1); - d_src2.upload(src2); - - WARMUP_ON; - ocl::addWeighted(d_src1, alpha, d_src2, beta, gama, d_dst); - WARMUP_OFF; - - GPU_ON; - ocl::addWeighted(d_src1, alpha, d_src2, beta, gama, d_dst); - GPU_OFF; - - GPU_FULL_ON; - d_src1.upload(src1); - d_src2.upload(src2); - ocl::addWeighted(d_src1, alpha, d_src2, beta, gama, d_dst); - d_dst.download(ocl_dst); - GPU_FULL_OFF; - - TestSystem::instance().ExpectedMatNear(ocl_dst, dst, 1e-5); - } + SANITY_CHECK(dst); + } + else if (impl == "plain") + { + TEST_CYCLE() cv::addWeighted(src1, alpha, src2, beta, gama, dst); + SANITY_CHECK(dst); } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); } diff --git a/modules/ocl/perf/perf_blend.cpp b/modules/ocl/perf/perf_blend.cpp index 11eea64fbf..c8a7608148 100644 --- a/modules/ocl/perf/perf_blend.cpp +++ b/modules/ocl/perf/perf_blend.cpp @@ -45,9 +45,15 @@ //M*/ #include "perf_precomp.hpp" + +using namespace perf; + ///////////// blend //////////////////////// + template -void blendLinearGold(const cv::Mat &img1, const cv::Mat &img2, const cv::Mat &weights1, const cv::Mat &weights2, cv::Mat &result_gold) +static void blendLinearGold(const cv::Mat &img1, const cv::Mat &img2, + const cv::Mat &weights1, const cv::Mat &weights2, + cv::Mat &result_gold) { result_gold.create(img1.size(), img1.type()); @@ -63,60 +69,54 @@ void blendLinearGold(const cv::Mat &img1, const cv::Mat &img2, const cv::Mat &we for (int x = 0; x < img1.cols * cn; ++x) { - float w1 = weights1_row[x / cn]; - float w2 = weights2_row[x / cn]; - result_gold_row[x] = static_cast((img1_row[x] * w1 + img2_row[x] * w2) / (w1 + w2 + 1e-5f)); + int x1 = x * cn; + float w1 = weights1_row[x]; + float w2 = weights2_row[x]; + result_gold_row[x] = static_cast((img1_row[x1] * w1 + + img2_row[x1] * w2) / (w1 + w2 + 1e-5f)); } } } -PERFTEST(blend) + +typedef TestBaseWithParam blendLinearFixture; + +PERF_TEST_P(blendLinearFixture, blendLinear, OCL_TYPICAL_MAT_SIZES) { - Mat src1, src2, weights1, weights2, dst, ocl_dst; - ocl::oclMat d_src1, d_src2, d_weights1, d_weights2, d_dst; + // getting params + const Size srcSize = GetParam(); + const int type = CV_8UC1; + const std::string impl = getSelectedImpl(); + + // creating src data + Mat src1(srcSize, type), src2(srcSize, CV_8UC1), dst; + Mat weights1(srcSize, CV_32FC1), weights2(srcSize, CV_32FC1); - int all_type[] = {CV_8UC1, CV_8UC4}; - std::string type_name[] = {"CV_8UC1", "CV_8UC4"}; + declare.in(src1, src2, WARMUP_RNG); + randu(weights1, 0.0f, 1.0f); + randu(weights2, 0.0f, 1.0f); - for (int size = Min_Size; size <= Max_Size; size *= Multiple) + // select implementation + if (impl == "ocl") { - for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) - { - SUBTEST << size << 'x' << size << "; " << type_name[j] << " and CV_32FC1"; - - gen(src1, size, size, all_type[j], 0, 256); - gen(src2, size, size, all_type[j], 0, 256); - gen(weights1, size, size, CV_32FC1, 0, 1); - gen(weights2, size, size, CV_32FC1, 0, 1); - - blendLinearGold(src1, src2, weights1, weights2, dst); - - CPU_ON; - blendLinearGold(src1, src2, weights1, weights2, dst); - CPU_OFF; - - d_src1.upload(src1); - d_src2.upload(src2); - d_weights1.upload(weights1); - d_weights2.upload(weights2); - - WARMUP_ON; - ocl::blendLinear(d_src1, d_src2, d_weights1, d_weights2, d_dst); - WARMUP_OFF; - - GPU_ON; - ocl::blendLinear(d_src1, d_src2, d_weights1, d_weights2, d_dst); - GPU_OFF; - - GPU_FULL_ON; - d_src1.upload(src1); - d_src2.upload(src2); - d_weights1.upload(weights1); - d_weights2.upload(weights2); - ocl::blendLinear(d_src1, d_src2, d_weights1, d_weights2, d_dst); - d_dst.download(ocl_dst); - GPU_FULL_OFF; - - TestSystem::instance().ExpectedMatNear(dst, ocl_dst, 1.f); - } + ocl::oclMat oclSrc1(src1), oclSrc2(src2), oclDst; + ocl::oclMat oclWeights1(weights1), oclWeights2(weights2); + + TEST_CYCLE() cv::ocl::blendLinear(oclSrc1, oclSrc2, oclWeights1, oclWeights2, oclDst); + + oclDst.download(dst); + + SANITY_CHECK(dst); + } + else if (impl == "plain") + { + TEST_CYCLE() blendLinearGold(src1, src2, weights1, weights2, dst); + + SANITY_CHECK(dst); } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); } diff --git a/modules/ocl/perf/perf_brute_force_matcher.cpp b/modules/ocl/perf/perf_brute_force_matcher.cpp index 14df629e96..841fa64185 100644 --- a/modules/ocl/perf/perf_brute_force_matcher.cpp +++ b/modules/ocl/perf/perf_brute_force_matcher.cpp @@ -45,123 +45,242 @@ //M*/ #include "perf_precomp.hpp" +using namespace perf; + +#define OCL_BFMATCHER_TYPICAL_MAT_SIZES ::testing::Values(cv::Size(128, 500), cv::Size(128, 1000), cv::Size(128, 2000)) + //////////////////// BruteForceMatch ///////////////// -PERFTEST(BruteForceMatcher) + +typedef TestBaseWithParam BruteForceMatcherFixture; + +PERF_TEST_P(BruteForceMatcherFixture, match, + OCL_BFMATCHER_TYPICAL_MAT_SIZES) { - Mat trainIdx_cpu; - Mat distance_cpu; - Mat allDist_cpu; - Mat nMatches_cpu; + const Size srcSize = GetParam(); + const string impl = getSelectedImpl(); - for (int size = Min_Size; size <= Max_Size; size *= Multiple) - { - // Init CPU matcher - int desc_len = 64; + vector matches; + Mat query(srcSize, CV_32F), train(srcSize, CV_32F); + declare.in(query, train).time(srcSize.height == 2000 ? 8 : 4 ); + randu(query, 0.0f, 1.0f); + randu(train, 0.0f, 1.0f); + if (impl == "plain") + { BFMatcher matcher(NORM_L2); + TEST_CYCLE() matcher.match(query, train, matches); - Mat query; - gen(query, size, desc_len, CV_32F, 0, 1); - - Mat train; - gen(train, size, desc_len, CV_32F, 0, 1); - // Output - vector< vector > matches(2); - vector< vector > d_matches(2); + SANITY_CHECK_MATCHES(matches); + } + else if (impl == "ocl") + { // Init GPU matcher - ocl::BruteForceMatcher_OCL_base d_matcher(ocl::BruteForceMatcher_OCL_base::L2Dist); + ocl::BruteForceMatcher_OCL_base oclMatcher(ocl::BruteForceMatcher_OCL_base::L2Dist); + ocl::oclMat oclQuery(query), oclTrain(train); - ocl::oclMat d_query(query); - ocl::oclMat d_train(train); + TEST_CYCLE() oclMatcher.match(oclQuery, oclTrain, matches); - ocl::oclMat d_trainIdx, d_distance, d_allDist, d_nMatches; + SANITY_CHECK_MATCHES(matches); + } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); +} + +//PERF_TEST_P(BruteForceMatcherFixture, matchSingle, +// OCL_BFMATCHER_TYPICAL_MAT_SIZES) +//{ +// const Size srcSize = GetParam(); +// const string impl = getSelectedImpl(); + +// Mat query(srcSize, CV_32F), train(srcSize, CV_32F); +// Mat trainIdx, distance; - SUBTEST << size << "; match"; +// randu(query, 0.0f, 1.0f); +// randu(train, 0.0f, 1.0f); - matcher.match(query, train, matches[0]); +// if (impl == "plain") +// CV_TEST_FAIL_NO_IMPL(); +// else if (impl == "ocl") +// { +// ocl::oclMat oclQuery(query), oclTrain(train), oclTrainIdx, oclDistance; - CPU_ON; - matcher.match(query, train, matches[0]); - CPU_OFF; +// TEST_CYCLE() oclMatcher->matchSingle(oclQuery, oclTrain, oclTrainIdx, oclDistance); + +// oclTrainIdx.download(trainIdx); +// oclDistance.download(distance); + +// SANITY_CHECK(trainIdx); +// SANITY_CHECK(distance); +// } +//#ifdef HAVE_OPENCV_GPU +// else if (impl == "gpu") +// CV_TEST_FAIL_NO_IMPL(); +//#endif +// else +// CV_TEST_FAIL_NO_IMPL(); +//} + +PERF_TEST_P(BruteForceMatcherFixture, knnMatch, + OCL_BFMATCHER_TYPICAL_MAT_SIZES) +{ + const Size srcSize = GetParam(); + const string impl = getSelectedImpl(); - WARMUP_ON; - d_matcher.matchSingle(d_query, d_train, d_trainIdx, d_distance); - WARMUP_OFF; + vector > matches(2); + Mat query(srcSize, CV_32F), train(srcSize, CV_32F); + randu(query, 0.0f, 1.0f); + randu(train, 0.0f, 1.0f); - GPU_ON; - d_matcher.matchSingle(d_query, d_train, d_trainIdx, d_distance); - GPU_OFF; + declare.in(query, train); + if (srcSize.height == 2000) + declare.time(8); - GPU_FULL_ON; - d_query.upload(query); - d_train.upload(train); - d_matcher.match(d_query, d_train, d_matches[0]); - GPU_FULL_OFF; + if (impl == "plain") + { + BFMatcher matcher (NORM_L2); + TEST_CYCLE() matcher.knnMatch(query, train, matches, 2); - int diff = abs((int)d_matches[0].size() - (int)matches[0].size()); - if(diff == 0) - TestSystem::instance().setAccurate(1, 0); - else - TestSystem::instance().setAccurate(0, diff); + std::vector & matches0 = matches[0], & matches1 = matches[1]; + SANITY_CHECK_MATCHES(matches0); + SANITY_CHECK_MATCHES(matches1); + } + else if (impl == "ocl") + { + ocl::BruteForceMatcher_OCL_base oclMatcher(ocl::BruteForceMatcher_OCL_base::L2Dist); + ocl::oclMat oclQuery(query), oclTrain(train); - SUBTEST << size << "; knnMatch"; + TEST_CYCLE() oclMatcher.knnMatch(oclQuery, oclTrain, matches, 2); - matcher.knnMatch(query, train, matches, 2); + std::vector & matches0 = matches[0], & matches1 = matches[1]; + SANITY_CHECK_MATCHES(matches0); + SANITY_CHECK_MATCHES(matches1); + } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); +} - CPU_ON; - matcher.knnMatch(query, train, matches, 2); - CPU_OFF; +//PERF_TEST_P(BruteForceMatcherFixture, knnMatchSingle, +// OCL_BFMATCHER_TYPICAL_MAT_SIZES) +//{ +// const Size srcSize = GetParam(); +// const string impl = getSelectedImpl(); - WARMUP_ON; - d_matcher.knnMatchSingle(d_query, d_train, d_trainIdx, d_distance, d_allDist, 2); - WARMUP_OFF; +// Mat query(srcSize, CV_32F), train(srcSize, CV_32F); +// Mat trainIdx, distance, allDist; - GPU_ON; - d_matcher.knnMatchSingle(d_query, d_train, d_trainIdx, d_distance, d_allDist, 2); - GPU_OFF; +// randu(query, 0.0f, 1.0f); +// randu(train, 0.0f, 1.0f); - GPU_FULL_ON; - d_query.upload(query); - d_train.upload(train); - d_matcher.knnMatch(d_query, d_train, d_matches, 2); - GPU_FULL_OFF; +// if (impl == "plain") +// CV_TEST_FAIL_NO_IMPL(); +// else if (impl == "ocl") +// { +// ocl::oclMat oclQuery(query), oclTrain(train), oclTrainIdx, oclDistance, oclAllDist; - diff = abs((int)d_matches[0].size() - (int)matches[0].size()); - if(diff == 0) - TestSystem::instance().setAccurate(1, 0); - else - TestSystem::instance().setAccurate(0, diff); +// TEST_CYCLE() oclMatcher->knnMatchSingle(oclQuery, oclTrain, oclTrainIdx, oclDistance, oclAllDist, 2); - SUBTEST << size << "; radiusMatch"; +// oclTrainIdx.download(trainIdx); +// oclDistance.download(distance); +// oclAllDist.download(allDist); - float max_distance = 2.0f; +// SANITY_CHECK(trainIdx); +// SANITY_CHECK(distance); +// SANITY_CHECK(allDist); +// } +//#ifdef HAVE_OPENCV_GPU +// else if (impl == "gpu") +// CV_TEST_FAIL_NO_IMPL(); +//#endif +// else +// CV_TEST_FAIL_NO_IMPL(); +//} - matcher.radiusMatch(query, train, matches, max_distance); +PERF_TEST_P(BruteForceMatcherFixture, DISABLED_radiusMatch, + OCL_BFMATCHER_TYPICAL_MAT_SIZES) +{ + const Size srcSize = GetParam(); + const string impl = getSelectedImpl(); - CPU_ON; - matcher.radiusMatch(query, train, matches, max_distance); - CPU_OFF; + const float max_distance = 2.0f; + vector > matches(2); + Mat query(srcSize, CV_32F), train(srcSize, CV_32F); + declare.in(query, train); + Mat trainIdx, distance, allDist; - d_trainIdx.release(); + randu(query, 0.0f, 1.0f); + randu(train, 0.0f, 1.0f); - WARMUP_ON; - d_matcher.radiusMatchSingle(d_query, d_train, d_trainIdx, d_distance, d_nMatches, max_distance); - WARMUP_OFF; + if (impl == "plain") + { + BFMatcher matcher (NORM_L2); + TEST_CYCLE() matcher.radiusMatch(query, matches, max_distance); - GPU_ON; - d_matcher.radiusMatchSingle(d_query, d_train, d_trainIdx, d_distance, d_nMatches, max_distance); - GPU_OFF; + std::vector & matches0 = matches[0], & matches1 = matches[1]; + SANITY_CHECK_MATCHES(matches0); + SANITY_CHECK_MATCHES(matches1); + } + else if (impl == "ocl") + { + ocl::oclMat oclQuery(query), oclTrain(train); + ocl::BruteForceMatcher_OCL_base oclMatcher(ocl::BruteForceMatcher_OCL_base::L2Dist); - GPU_FULL_ON; - d_query.upload(query); - d_train.upload(train); - d_matcher.radiusMatch(d_query, d_train, d_matches, max_distance); - GPU_FULL_OFF; + TEST_CYCLE() oclMatcher.radiusMatch(oclQuery, oclTrain, matches, max_distance); - diff = abs((int)d_matches[0].size() - (int)matches[0].size()); - if(diff == 0) - TestSystem::instance().setAccurate(1, 0); - else - TestSystem::instance().setAccurate(0, diff); + std::vector & matches0 = matches[0], & matches1 = matches[1]; + SANITY_CHECK_MATCHES(matches0); + SANITY_CHECK_MATCHES(matches1); } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); } + +//PERF_TEST_P(BruteForceMatcherFixture, radiusMatchSingle, +// OCL_BFMATCHER_TYPICAL_MAT_SIZES) +//{ +// const Size srcSize = GetParam(); +// const string impl = getSelectedImpl(); + +// const float max_distance = 2.0f; +// Mat query(srcSize, CV_32F), train(srcSize, CV_32F); +// Mat trainIdx, distance, nMatches; + +// randu(query, 0.0f, 1.0f); +// randu(train, 0.0f, 1.0f); + +// if (impl == "plain") +// CV_TEST_FAIL_NO_IMPL(); +// else if (impl == "ocl") +// { +// ocl::oclMat oclQuery(query), oclTrain(train), oclTrainIdx, oclDistance, oclNMatches; + +// TEST_CYCLE() oclMatcher->radiusMatchSingle(oclQuery, oclTrain, oclTrainIdx, oclDistance, oclNMatches, max_distance); + +// oclTrainIdx.download(trainIdx); +// oclDistance.download(distance); +// oclNMatches.download(nMatches); + +// SANITY_CHECK(trainIdx); +// SANITY_CHECK(distance); +// SANITY_CHECK(nMatches); +// } +//#ifdef HAVE_OPENCV_GPU +// else if (impl == "gpu") +// CV_TEST_FAIL_NO_IMPL(); +//#endif +// else +// CV_TEST_FAIL_NO_IMPL(); +//} + +#undef OCL_BFMATCHER_TYPICAL_MAT_SIZES diff --git a/modules/ocl/perf/perf_calib3d.cpp b/modules/ocl/perf/perf_calib3d.cpp index ff6c6f2615..7288677bf7 100644 --- a/modules/ocl/perf/perf_calib3d.cpp +++ b/modules/ocl/perf/perf_calib3d.cpp @@ -45,48 +45,49 @@ //M*/ #include "perf_precomp.hpp" + ///////////// StereoMatchBM //////////////////////// -PERFTEST(StereoMatchBM) -{ - Mat left_image = imread(abspath("aloeL.jpg"), cv::IMREAD_GRAYSCALE); - Mat right_image = imread(abspath("aloeR.jpg"), cv::IMREAD_GRAYSCALE); - Mat disp,dst; - ocl::oclMat d_left, d_right,d_disp; - int n_disp= 128; - int winSize =19; - SUBTEST << left_image.cols << 'x' << left_image.rows << "; aloeL.jpg ;"<< right_image.cols << 'x' << right_image.rows << "; aloeR.jpg "; +PERF_TEST(StereoMatchBMFixture, DISABLED_StereoMatchBM) +{ + Mat left_image = imread(getDataPath("gpu/stereobm/aloe-L.png"), cv::IMREAD_GRAYSCALE); + Mat right_image = imread(getDataPath("gpu/stereobm/aloe-R.png"), cv::IMREAD_GRAYSCALE); - StereoBM bm(0, n_disp, winSize); - bm(left_image, right_image, dst); + ASSERT_TRUE(!left_image.empty()) << "no input image"; + ASSERT_TRUE(!right_image.empty()) << "no input image"; + ASSERT_TRUE(right_image.size() == left_image.size()); + ASSERT_TRUE(right_image.size() == left_image.size()); - CPU_ON; - bm(left_image, right_image, dst); - CPU_OFF; + const std::string impl = getSelectedImpl(); + const int n_disp = 128, winSize = 19; + Mat disp(left_image.size(), CV_16SC1); - d_left.upload(left_image); - d_right.upload(right_image); + declare.in(left_image, right_image).out(disp); - ocl::StereoBM_OCL d_bm(0, n_disp, winSize); + if (impl == "ocl") + { + ocl::oclMat oclLeft(left_image), oclRight(right_image), + oclDisp(left_image.size(), CV_16SC1); + ocl::StereoBM_OCL oclBM(0, n_disp, winSize); - WARMUP_ON; - d_bm(d_left, d_right, d_disp); - WARMUP_OFF; + TEST_CYCLE() oclBM(oclLeft, oclRight, oclDisp); - cv::Mat ocl_mat; - d_disp.download(ocl_mat); - ocl_mat.convertTo(ocl_mat, dst.type()); + oclDisp.download(disp); - GPU_ON; - d_bm(d_left, d_right, d_disp); - GPU_OFF; + SANITY_CHECK(disp); + } + else if (impl == "plain") + { + StereoBM bm(0, n_disp, winSize); - GPU_FULL_ON; - d_left.upload(left_image); - d_right.upload(right_image); - d_bm(d_left, d_right, d_disp); - d_disp.download(disp); - GPU_FULL_OFF; + TEST_CYCLE() bm(left_image, right_image, disp); - TestSystem::instance().setAccurate(-1, 0.); + SANITY_CHECK(disp); + } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); + #endif + else + CV_TEST_FAIL_NO_IMPL(); } diff --git a/modules/ocl/perf/perf_canny.cpp b/modules/ocl/perf/perf_canny.cpp index 6f85ee8a43..34a38efd8e 100644 --- a/modules/ocl/perf/perf_canny.cpp +++ b/modules/ocl/perf/perf_canny.cpp @@ -45,41 +45,38 @@ //M*/ #include "perf_precomp.hpp" -///////////// Canny //////////////////////// -PERFTEST(Canny) -{ - Mat img = imread(abspath("aloeL.jpg"), CV_LOAD_IMAGE_GRAYSCALE); - - if (img.empty()) - { - throw runtime_error("can't open aloeL.jpg"); - } - - SUBTEST << img.cols << 'x' << img.rows << "; aloeL.jpg" << "; edges" << "; CV_8UC1"; +using namespace perf; - Mat edges(img.size(), CV_8UC1), ocl_edges; +///////////// Canny //////////////////////// - CPU_ON; - Canny(img, edges, 50.0, 100.0); - CPU_OFF; +PERF_TEST(CannyFixture, Canny) +{ + Mat img = imread(getDataPath("gpu/stereobm/aloe-L.png"), cv::IMREAD_GRAYSCALE), + edges(img.size(), CV_8UC1); + ASSERT_TRUE(!img.empty()) << "can't open aloeL.jpg"; - ocl::oclMat d_img(img); - ocl::oclMat d_edges; - ocl::CannyBuf d_buf; + const std::string impl = getSelectedImpl(); + declare.in(img).out(edges); - WARMUP_ON; - ocl::Canny(d_img, d_buf, d_edges, 50.0, 100.0); - WARMUP_OFF; + if (impl == "ocl") + { + ocl::oclMat oclImg(img), oclEdges(img.size(), CV_8UC1); - GPU_ON; - ocl::Canny(d_img, d_buf, d_edges, 50.0, 100.0); - GPU_OFF; + TEST_CYCLE() Canny(oclImg, oclEdges, 50.0, 100.0); + oclEdges.download(edges); - GPU_FULL_ON; - d_img.upload(img); - ocl::Canny(d_img, d_buf, d_edges, 50.0, 100.0); - d_edges.download(ocl_edges); - GPU_FULL_OFF; + SANITY_CHECK(edges); + } + else if (impl == "plain") + { + TEST_CYCLE() Canny(img, edges, 50.0, 100.0); - TestSystem::instance().ExceptedMatSimilar(edges, ocl_edges, 2e-2); + SANITY_CHECK(edges); + } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); } diff --git a/modules/ocl/perf/perf_color.cpp b/modules/ocl/perf/perf_color.cpp index 1934417448..645b835dfa 100644 --- a/modules/ocl/perf/perf_color.cpp +++ b/modules/ocl/perf/perf_color.cpp @@ -45,49 +45,39 @@ //M*/ #include "perf_precomp.hpp" -///////////// cvtColor//////////////////////// -PERFTEST(cvtColor) -{ - Mat src, dst, ocl_dst; - ocl::oclMat d_src, d_dst; - - int all_type[] = {CV_8UC4}; - std::string type_name[] = {"CV_8UC4"}; - - for (int size = Min_Size; size <= Max_Size; size *= Multiple) - { - for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) - { - gen(src, size, size, all_type[j], 0, 256); - SUBTEST << size << "x" << size << "; " << type_name[j] << " ; CV_RGBA2GRAY"; - - cvtColor(src, dst, CV_RGBA2GRAY, 4); - - CPU_ON; - cvtColor(src, dst, CV_RGBA2GRAY, 4); - CPU_OFF; +using namespace perf; - d_src.upload(src); +///////////// cvtColor//////////////////////// - WARMUP_ON; - ocl::cvtColor(d_src, d_dst, CV_RGBA2GRAY, 4); - WARMUP_OFF; +typedef TestBaseWithParam cvtColorFixture; - GPU_ON; - ocl::cvtColor(d_src, d_dst, CV_RGBA2GRAY, 4); - GPU_OFF; +PERF_TEST_P(cvtColorFixture, cvtColor, OCL_TYPICAL_MAT_SIZES) +{ + const Size srcSize = GetParam(); + const std::string impl = getSelectedImpl(); - GPU_FULL_ON; - d_src.upload(src); - ocl::cvtColor(d_src, d_dst, CV_RGBA2GRAY, 4); - d_dst.download(ocl_dst); - GPU_FULL_OFF; + Mat src(srcSize, CV_8UC4), dst(srcSize, CV_8UC4); + declare.in(src).out(dst); - TestSystem::instance().ExceptedMatSimilar(dst, ocl_dst, 1e-5); - } + if (impl == "ocl") + { + ocl::oclMat oclSrc(src), oclDst(src.size(), CV_8UC4); + TEST_CYCLE() ocl::cvtColor(oclSrc, oclDst, CV_RGBA2GRAY, 4); + oclDst.download(dst); + SANITY_CHECK(dst); } + else if (impl == "plain") + { + TEST_CYCLE() cv::cvtColor(src, dst, CV_RGBA2GRAY, 4); - + SANITY_CHECK(dst); + } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); } diff --git a/modules/ocl/perf/perf_fft.cpp b/modules/ocl/perf/perf_fft.cpp index ce9949b7a0..e23450926a 100644 --- a/modules/ocl/perf/perf_fft.cpp +++ b/modules/ocl/perf/perf_fft.cpp @@ -45,47 +45,43 @@ //M*/ #include "perf_precomp.hpp" -///////////// dft //////////////////////// -PERFTEST(dft) -{ - Mat src, dst, ocl_dst; - ocl::oclMat d_src, d_dst; - - int all_type[] = {CV_32FC2}; - std::string type_name[] = {"CV_32FC2"}; - - for (int size = Min_Size; size <= Max_Size; size *= Multiple) - { - for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) - { - SUBTEST << size << 'x' << size << "; " << type_name[j] << " ; complex-to-complex"; +using namespace perf; - gen(src, size, size, all_type[j], Scalar::all(0), Scalar::all(1)); +///////////// dft //////////////////////// - dft(src, dst); +typedef TestBaseWithParam dftFixture; - CPU_ON; - dft(src, dst); - CPU_OFF; +PERF_TEST_P(dftFixture, DISABLED_dft, OCL_TYPICAL_MAT_SIZES) +{ + const std::string impl = getSelectedImpl(); + Size srcSize = GetParam(); - d_src.upload(src); + Mat src(srcSize, CV_32FC2), dst; + randu(src, 0.0f, 1.0f); + declare.in(src); - WARMUP_ON; - ocl::dft(d_src, d_dst, Size(size, size)); - WARMUP_OFF; + if (impl == "ocl") + { + ocl::oclMat oclSrc(src), oclDst; - GPU_ON; - ocl::dft(d_src, d_dst, Size(size, size)); - GPU_OFF; + EXPECT_NO_THROW({ + TEST_CYCLE() cv::ocl::dft(oclSrc, oclDst); + }); - GPU_FULL_ON; - d_src.upload(src); - ocl::dft(d_src, d_dst, Size(size, size)); - d_dst.download(ocl_dst); - GPU_FULL_OFF; + oclDst.download(dst); - TestSystem::instance().ExpectedMatNear(dst, ocl_dst, src.size().area() * 1e-4); - } + SANITY_CHECK(dst); + } + else if (impl == "plain") + { + TEST_CYCLE() cv::dft(src, dst); + SANITY_CHECK(dst); } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); } diff --git a/modules/ocl/perf/perf_filters.cpp b/modules/ocl/perf/perf_filters.cpp index e4204cbbd1..3d9be40aaa 100644 --- a/modules/ocl/perf/perf_filters.cpp +++ b/modules/ocl/perf/perf_filters.cpp @@ -45,333 +45,344 @@ //M*/ #include "perf_precomp.hpp" +using namespace perf; +using std::tr1::get; +using std::tr1::tuple; + ///////////// Blur//////////////////////// -PERFTEST(Blur) -{ - Mat src1, dst, ocl_dst; - ocl::oclMat d_src1, d_dst; - Size ksize = Size(3, 3); - int bordertype = BORDER_CONSTANT; - int all_type[] = {CV_8UC1, CV_8UC4}; - std::string type_name[] = {"CV_8UC1", "CV_8UC4"}; +CV_ENUM(BlurMatType, CV_8UC1, CV_8UC4) - for (int size = Min_Size; size <= Max_Size; size *= Multiple) - { - for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) - { - SUBTEST << size << 'x' << size << "; " << type_name[j] ; +typedef tuple BlurParams; +typedef TestBaseWithParam BlurFixture; - gen(src1, size, size, all_type[j], 0, 256); - gen(dst, size, size, all_type[j], 0, 256); +PERF_TEST_P(BlurFixture, Blur, + ::testing::Combine(OCL_TYPICAL_MAT_SIZES, + BlurMatType::all())) +{ + // getting params + BlurParams params = GetParam(); + const Size srcSize = get<0>(params), ksize(3, 3); + const int type = get<1>(params), bordertype = BORDER_CONSTANT; - blur(src1, dst, ksize, Point(-1, -1), bordertype); + const std::string impl = getSelectedImpl(); - CPU_ON; - blur(src1, dst, ksize, Point(-1, -1), bordertype); - CPU_OFF; + Mat src(srcSize, type), dst(srcSize, type); + declare.in(src, WARMUP_RNG).out(dst); - d_src1.upload(src1); + if (srcSize == OCL_SIZE_4000 && type == CV_8UC4) + declare.time(5); - WARMUP_ON; - ocl::blur(d_src1, d_dst, ksize, Point(-1, -1), bordertype); - WARMUP_OFF; + if (impl == "ocl") + { + ocl::oclMat oclSrc(src), oclDst(srcSize, type); - GPU_ON; - ocl::blur(d_src1, d_dst, ksize, Point(-1, -1), bordertype); - GPU_OFF; + TEST_CYCLE() cv::ocl::blur(oclSrc, oclDst, ksize, Point(-1, -1), bordertype); - GPU_FULL_ON; - d_src1.upload(src1); - ocl::blur(d_src1, d_dst, ksize, Point(-1, -1), bordertype); - d_dst.download(ocl_dst); - GPU_FULL_OFF; + oclDst.download(dst); - TestSystem::instance().ExpectedMatNear(ocl_dst, dst, 1.0); - } + SANITY_CHECK(dst, 1 + DBL_EPSILON); + } + else if (impl == "plain") + { + TEST_CYCLE() cv::blur(src, dst, ksize, Point(-1, -1), bordertype); + SANITY_CHECK(dst, 1 + DBL_EPSILON); } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); } -///////////// Laplacian//////////////////////// -PERFTEST(Laplacian) -{ - Mat src1, dst, ocl_dst; - ocl::oclMat d_src1, d_dst; - int ksize = 3; - int all_type[] = {CV_8UC1, CV_8UC4}; - std::string type_name[] = {"CV_8UC1", "CV_8UC4"}; +///////////// Laplacian//////////////////////// - for (int size = Min_Size; size <= Max_Size; size *= Multiple) - { - for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) - { - SUBTEST << size << 'x' << size << "; " << type_name[j] ; +typedef BlurMatType LaplacianMatType; +typedef tuple LaplacianParams; +typedef TestBaseWithParam LaplacianFixture; - gen(src1, size, size, all_type[j], 0, 256); - gen(dst, size, size, all_type[j], 0, 256); +PERF_TEST_P(LaplacianFixture, Laplacian, + ::testing::Combine(OCL_TYPICAL_MAT_SIZES, + LaplacianMatType::all())) +{ + // getting params + LaplacianParams params = GetParam(); + const Size srcSize = get<0>(params); + const int type = get<1>(params), ksize = 3; - Laplacian(src1, dst, -1, ksize, 1); + const std::string impl = getSelectedImpl(); - CPU_ON; - Laplacian(src1, dst, -1, ksize, 1); - CPU_OFF; + Mat src(srcSize, type), dst(srcSize, type); + declare.in(src, WARMUP_RNG).out(dst); - d_src1.upload(src1); + if (srcSize == OCL_SIZE_4000 && type == CV_8UC4) + declare.time(6); - WARMUP_ON; - ocl::Laplacian(d_src1, d_dst, -1, ksize, 1); - WARMUP_OFF; + if (impl == "ocl") + { + ocl::oclMat oclSrc(src), oclDst(srcSize, type); - GPU_ON; - ocl::Laplacian(d_src1, d_dst, -1, ksize, 1); - GPU_OFF; + TEST_CYCLE() cv::ocl::Laplacian(oclSrc, oclDst, -1, ksize, 1); - GPU_FULL_ON; - d_src1.upload(src1); - ocl::Laplacian(d_src1, d_dst, -1, ksize, 1); - d_dst.download(ocl_dst); - GPU_FULL_OFF; + oclDst.download(dst); - TestSystem::instance().ExpectedMatNear(ocl_dst, dst, 1e-5); - } + SANITY_CHECK(dst); + } + else if (impl == "plain") + { + TEST_CYCLE() cv::Laplacian(src, dst, -1, ksize, 1); + SANITY_CHECK(dst); } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); } ///////////// Erode //////////////////// -PERFTEST(Erode) -{ - Mat src, dst, ker, ocl_dst; - ocl::oclMat d_src, d_dst; - int all_type[] = {CV_8UC1, CV_8UC4, CV_32FC1, CV_32FC4}; - std::string type_name[] = {"CV_8UC1", "CV_8UC4", "CV_32FC1", "CV_32FC4"}; +CV_ENUM(ErodeMatType, CV_8UC1, CV_8UC4, CV_32FC1, CV_32FC4) - for (int size = Min_Size; size <= Max_Size; size *= Multiple) - { - for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) - { - SUBTEST << size << 'x' << size << "; " << type_name[j] ; +typedef tuple ErodeParams; +typedef TestBaseWithParam ErodeFixture; - gen(src, size, size, all_type[j], Scalar::all(0), Scalar::all(256)); - ker = getStructuringElement(MORPH_RECT, Size(3, 3)); +PERF_TEST_P(ErodeFixture, Erode, + ::testing::Combine(OCL_TYPICAL_MAT_SIZES, + ErodeMatType::all())) +{ + // getting params + ErodeParams params = GetParam(); + const Size srcSize = get<0>(params); + const int type = get<1>(params), ksize = 3; + const Mat ker = getStructuringElement(MORPH_RECT, Size(ksize, ksize)); - erode(src, dst, ker); + const std::string impl = getSelectedImpl(); - CPU_ON; - erode(src, dst, ker); - CPU_OFF; + Mat src(srcSize, type), dst(srcSize, type); + declare.in(src, WARMUP_RNG).out(dst).in(ker); - d_src.upload(src); + if (srcSize == OCL_SIZE_4000 && type == CV_8UC4) + declare.time(5); - WARMUP_ON; - ocl::erode(d_src, d_dst, ker); - WARMUP_OFF; + if (impl == "ocl") + { + ocl::oclMat oclSrc(src), oclDst(srcSize, type), oclKer(ker); - GPU_ON; - ocl::erode(d_src, d_dst, ker); - GPU_OFF; + TEST_CYCLE() cv::ocl::erode(oclSrc, oclDst, oclKer); - GPU_FULL_ON; - d_src.upload(src); - ocl::erode(d_src, d_dst, ker); - d_dst.download(ocl_dst); - GPU_FULL_OFF; + oclDst.download(dst); - TestSystem::instance().ExpectedMatNear(ocl_dst, dst, 1e-5); - } + SANITY_CHECK(dst); + } + else if (impl == "plain") + { + TEST_CYCLE() cv::erode(src, dst, ker); + SANITY_CHECK(dst); } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); } ///////////// Sobel //////////////////////// -PERFTEST(Sobel) -{ - Mat src, dst, ocl_dst; - ocl::oclMat d_src, d_dst; - - int dx = 1; - int dy = 1; - int all_type[] = {CV_8UC1, CV_8UC4}; - std::string type_name[] = {"CV_8UC1", "CV_8UC4"}; - for (int size = Min_Size; size <= Max_Size; size *= Multiple) - { - for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) - { - SUBTEST << size << 'x' << size << "; " << type_name[j] ; +typedef BlurMatType SobelMatType; +typedef tuple SobelMatParams; +typedef TestBaseWithParam SobelFixture; - gen(src, size, size, all_type[j], 0, 256); +PERF_TEST_P(SobelFixture, Sobel, + ::testing::Combine(OCL_TYPICAL_MAT_SIZES, + SobelMatType::all())) +{ + // getting params + SobelMatParams params = GetParam(); + const Size srcSize = get<0>(params); + const int type = get<1>(params), dx = 1, dy = 1; - Sobel(src, dst, -1, dx, dy); + const std::string impl = getSelectedImpl(); - CPU_ON; - Sobel(src, dst, -1, dx, dy); - CPU_OFF; + Mat src(srcSize, type), dst(srcSize, type); + declare.in(src, WARMUP_RNG).out(dst); - d_src.upload(src); + if ((srcSize == OCL_SIZE_2000 && type == CV_8UC4) || + (srcSize == OCL_SIZE_4000 && type == CV_8UC1)) + declare.time(5.5); + else if (srcSize == OCL_SIZE_4000 && type == CV_8UC4) + declare.time(20); - WARMUP_ON; - ocl::Sobel(d_src, d_dst, -1, dx, dy); - WARMUP_OFF; + if (impl == "ocl") + { + ocl::oclMat oclSrc(src), oclDst(srcSize, type); - GPU_ON; - ocl::Sobel(d_src, d_dst, -1, dx, dy); - GPU_OFF; + TEST_CYCLE() cv::ocl::Sobel(oclSrc, oclDst, -1, dx, dy); - GPU_FULL_ON; - d_src.upload(src); - ocl::Sobel(d_src, d_dst, -1, dx, dy); - d_dst.download(ocl_dst); - GPU_FULL_OFF; + oclDst.download(dst); - TestSystem::instance().ExpectedMatNear(ocl_dst, dst, 1); - } + SANITY_CHECK(dst); + } + else if (impl == "plain") + { + TEST_CYCLE() cv::Sobel(src, dst, -1, dx, dy); + SANITY_CHECK(dst); } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); } + ///////////// Scharr //////////////////////// -PERFTEST(Scharr) -{ - Mat src, dst, ocl_dst; - ocl::oclMat d_src, d_dst; - int dx = 1; - int dy = 0; - int all_type[] = {CV_8UC1, CV_8UC4}; - std::string type_name[] = {"CV_8UC1", "CV_8UC4"}; +typedef BlurMatType ScharrMatType; +typedef tuple ScharrParams; +typedef TestBaseWithParam ScharrFixture; - for (int size = Min_Size; size <= Max_Size; size *= Multiple) - { - for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) - { - SUBTEST << size << 'x' << size << "; " << type_name[j] ; - - gen(src, size, size, all_type[j], 0, 256); +PERF_TEST_P(ScharrFixture, Scharr, + ::testing::Combine(OCL_TYPICAL_MAT_SIZES, + ScharrMatType::all())) +{ + // getting params + ScharrParams params = GetParam(); + const Size srcSize = get<0>(params); + const int type = get<1>(params), dx = 1, dy = 0; - Scharr(src, dst, -1, dx, dy); + const std::string impl = getSelectedImpl(); - CPU_ON; - Scharr(src, dst, -1, dx, dy); - CPU_OFF; + Mat src(srcSize, type), dst(srcSize, type); + declare.in(src, WARMUP_RNG).out(dst); - d_src.upload(src); + if ((srcSize == OCL_SIZE_2000 && type == CV_8UC4) || + (srcSize == OCL_SIZE_4000 && type == CV_8UC1)) + declare.time(5.5); + else if (srcSize == OCL_SIZE_4000 && type == CV_8UC4) + declare.time(21); - WARMUP_ON; - ocl::Scharr(d_src, d_dst, -1, dx, dy); - WARMUP_OFF; + if (impl == "ocl") + { + ocl::oclMat oclSrc(src), oclDst(srcSize, type); - GPU_ON; - ocl::Scharr(d_src, d_dst, -1, dx, dy); - GPU_OFF; + TEST_CYCLE() cv::ocl::Scharr(oclSrc, oclDst, -1, dx, dy); - GPU_FULL_ON; - d_src.upload(src); - ocl::Scharr(d_src, d_dst, -1, dx, dy); - d_dst.download(ocl_dst); - GPU_FULL_OFF; + oclDst.download(dst); - TestSystem::instance().ExpectedMatNear(ocl_dst, dst, 1); - } + SANITY_CHECK(dst); + } + else if (impl == "plain") + { + TEST_CYCLE() cv::Scharr(src, dst, -1, dx, dy); + SANITY_CHECK(dst); } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); } ///////////// GaussianBlur //////////////////////// -PERFTEST(GaussianBlur) -{ - Mat src, dst, ocl_dst; - int all_type[] = {CV_8UC1, CV_8UC4, CV_32FC1, CV_32FC4}; - std::string type_name[] = {"CV_8UC1", "CV_8UC4", "CV_32FC1", "CV_32FC4"}; - const int ksize = 7; - for (int size = Min_Size; size <= Max_Size; size *= Multiple) - { - for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) - { - SUBTEST << size << 'x' << size << "; " << type_name[j] ; +typedef ErodeMatType GaussianBlurMatType; +typedef tuple GaussianBlurParams; +typedef TestBaseWithParam GaussianBlurFixture; - gen(src, size, size, all_type[j], 0, 256); +PERF_TEST_P(GaussianBlurFixture, GaussianBlur, + ::testing::Combine(::testing::Values(OCL_SIZE_1000, OCL_SIZE_2000), + GaussianBlurMatType::all())) +{ + // getting params + GaussianBlurParams params = GetParam(); + const Size srcSize = get<0>(params); + const int type = get<1>(params), ksize = 7; - GaussianBlur(src, dst, Size(ksize, ksize), 0); + const std::string impl = getSelectedImpl(); - CPU_ON; - GaussianBlur(src, dst, Size(ksize, ksize), 0); - CPU_OFF; + Mat src(srcSize, type), dst(srcSize, type); + declare.in(src, WARMUP_RNG).out(dst); - ocl::oclMat d_src(src); - ocl::oclMat d_dst; + const double eps = src.depth() == CV_8U ? 1 + DBL_EPSILON : 3e-4; - WARMUP_ON; - ocl::GaussianBlur(d_src, d_dst, Size(ksize, ksize), 0); - WARMUP_OFF; + if (impl == "ocl") + { + ocl::oclMat oclSrc(src), oclDst(srcSize, type); - GPU_ON; - ocl::GaussianBlur(d_src, d_dst, Size(ksize, ksize), 0); - GPU_OFF; + TEST_CYCLE() cv::ocl::GaussianBlur(oclSrc, oclDst, Size(ksize, ksize), 0); - GPU_FULL_ON; - d_src.upload(src); - ocl::GaussianBlur(d_src, d_dst, Size(ksize, ksize), 0); - d_dst.download(ocl_dst); - GPU_FULL_OFF; + oclDst.download(dst); - TestSystem::instance().ExpectedMatNear(ocl_dst, dst, 1.0); - } + SANITY_CHECK(dst, eps); + } + else if (impl == "plain") + { + TEST_CYCLE() cv::GaussianBlur(src, dst, Size(ksize, ksize), 0); + SANITY_CHECK(dst, eps); } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); } ///////////// filter2D//////////////////////// -PERFTEST(filter2D) -{ - Mat src; - - for (int size = Min_Size; size <= Max_Size; size *= Multiple) - { - int all_type[] = {CV_8UC1, CV_8UC4}; - std::string type_name[] = {"CV_8UC1", "CV_8UC4"}; - - for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) - { - gen(src, size, size, all_type[j], 0, 256); - - const int ksize = 3; - - SUBTEST << "ksize = " << ksize << "; " << size << 'x' << size << "; " << type_name[j] ; - Mat kernel; - gen(kernel, ksize, ksize, CV_32SC1, -3.0, 3.0); +typedef BlurMatType filter2DMatType; +typedef tuple filter2DParams; +typedef TestBaseWithParam filter2DFixture; - Mat dst, ocl_dst; - - cv::filter2D(src, dst, -1, kernel); - - CPU_ON; - cv::filter2D(src, dst, -1, kernel); - CPU_OFF; +PERF_TEST_P(filter2DFixture, filter2D, + ::testing::Combine(OCL_TYPICAL_MAT_SIZES, + filter2DMatType::all())) +{ + // getting params + filter2DParams params = GetParam(); + const Size srcSize = get<0>(params); + const int type = get<1>(params), ksize = 3; - ocl::oclMat d_src(src), d_dst; + const std::string impl = getSelectedImpl(); - WARMUP_ON; - ocl::filter2D(d_src, d_dst, -1, kernel); - WARMUP_OFF; + Mat src(srcSize, type), dst(srcSize, type), kernel(ksize, ksize, CV_32SC1); + declare.in(src, WARMUP_RNG).in(kernel).out(dst); + randu(kernel, -3.0, 3.0); - GPU_ON; - ocl::filter2D(d_src, d_dst, -1, kernel); - GPU_OFF; + if (srcSize == OCL_SIZE_4000 && type == CV_8UC4) + declare.time(8); - GPU_FULL_ON; - d_src.upload(src); - ocl::filter2D(d_src, d_dst, -1, kernel); - d_dst.download(ocl_dst); - GPU_FULL_OFF; + if (impl == "ocl") + { + ocl::oclMat oclSrc(src), oclDst(srcSize, type), oclKernel(kernel); - TestSystem::instance().ExpectedMatNear(ocl_dst, dst, 1e-5); + TEST_CYCLE() cv::ocl::filter2D(oclSrc, oclDst, -1, oclKernel); - } + oclDst.download(dst); + SANITY_CHECK(dst); + } + else if (impl == "plain") + { + TEST_CYCLE() cv::filter2D(src, dst, -1, kernel); + SANITY_CHECK(dst); } + #ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); } diff --git a/modules/ocl/perf/perf_gemm.cpp b/modules/ocl/perf/perf_gemm.cpp index aa04b9c3ae..1e765e85d9 100644 --- a/modules/ocl/perf/perf_gemm.cpp +++ b/modules/ocl/perf/perf_gemm.cpp @@ -45,46 +45,46 @@ //M*/ #include "perf_precomp.hpp" -///////////// gemm //////////////////////// -PERFTEST(gemm) -{ - Mat src1, src2, src3, dst, ocl_dst; - ocl::oclMat d_src1, d_src2, d_src3, d_dst; +using namespace perf; - for (int size = Min_Size; size <= Max_Size; size *= Multiple) - { - SUBTEST << size << 'x' << size; +///////////// gemm //////////////////////// - gen(src1, size, size, CV_32FC1, Scalar::all(-10), Scalar::all(10)); - gen(src2, size, size, CV_32FC1, Scalar::all(-10), Scalar::all(10)); - gen(src3, size, size, CV_32FC1, Scalar::all(-10), Scalar::all(10)); +typedef TestBaseWithParam gemmFixture; - gemm(src1, src2, 1.0, src3, 1.0, dst); +PERF_TEST_P(gemmFixture, DISABLED_gemm, OCL_TYPICAL_MAT_SIZES) +{ + // getting params + const Size srcSize = GetParam(); + const std::string impl = getSelectedImpl(); - CPU_ON; - gemm(src1, src2, 1.0, src3, 1.0, dst); - CPU_OFF; + Mat src1(srcSize, CV_32FC1), src2(srcSize, CV_32FC1), + src3(srcSize, CV_32FC1), dst(srcSize, CV_32FC1); + declare.in(src1, src2, src3).out(dst); + randu(src1, -10.0f, 10.0f); + randu(src2, -10.0f, 10.0f); + randu(src3, -10.0f, 10.0f); - d_src1.upload(src1); - d_src2.upload(src2); - d_src3.upload(src3); + if (impl == "ocl") + { + ocl::oclMat oclSrc1(src1), oclSrc2(src2), + oclSrc3(src3), oclDst(srcSize, CV_32FC1); - WARMUP_ON; - ocl::gemm(d_src1, d_src2, 1.0, d_src3, 1.0, d_dst); - WARMUP_OFF; + TEST_CYCLE() cv::ocl::gemm(oclSrc1, oclSrc2, 1.0, oclSrc3, 1.0, oclDst); - GPU_ON; - ocl::gemm(d_src1, d_src2, 1.0, d_src3, 1.0, d_dst); - GPU_OFF; + oclDst.download(dst); - GPU_FULL_ON; - d_src1.upload(src1); - d_src2.upload(src2); - d_src3.upload(src3); - ocl::gemm(d_src1, d_src2, 1.0, d_src3, 1.0, d_dst); - d_dst.download(ocl_dst); - GPU_FULL_OFF; + SANITY_CHECK(dst); + } + else if (impl == "plain") + { + TEST_CYCLE() cv::gemm(src1, src2, 1.0, src3, 1.0, dst); - TestSystem::instance().ExpectedMatNear(ocl_dst, dst, src1.cols * src1.rows * 1e-4); + SANITY_CHECK(dst); } + #ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); } diff --git a/modules/ocl/perf/perf_gftt.cpp b/modules/ocl/perf/perf_gftt.cpp index 430d441430..a314fc092a 100644 --- a/modules/ocl/perf/perf_gftt.cpp +++ b/modules/ocl/perf/perf_gftt.cpp @@ -46,56 +46,54 @@ #include "perf_precomp.hpp" -///////////// GoodFeaturesToTrack //////////////////////// -PERFTEST(GoodFeaturesToTrack) -{ - using namespace cv; - - int maxCorners = 2000; - double qualityLevel = 0.01; - - std::string images[] = { "rubberwhale1.png", "aloeL.jpg" }; - - std::vector pts_gold, pts_ocl; - - for(size_t imgIdx = 0; imgIdx < (sizeof(images)/sizeof(std::string)); ++imgIdx) - { - Mat frame = imread(abspath(images[imgIdx]), IMREAD_GRAYSCALE); - CV_Assert(!frame.empty()); +using namespace perf; +using std::tr1::tuple; +using std::tr1::get; - for(float minDistance = 0; minDistance < 4; minDistance += 3.0) - { - SUBTEST << "image = " << images[imgIdx] << "; "; - SUBTEST << "minDistance = " << minDistance << "; "; +///////////// GoodFeaturesToTrack //////////////////////// - cv::goodFeaturesToTrack(frame, pts_gold, maxCorners, qualityLevel, minDistance); +typedef tuple GoodFeaturesToTrackParams; +typedef TestBaseWithParam GoodFeaturesToTrackFixture; - CPU_ON; - cv::goodFeaturesToTrack(frame, pts_gold, maxCorners, qualityLevel, minDistance); - CPU_OFF; +PERF_TEST_P(GoodFeaturesToTrackFixture, GoodFeaturesToTrack, + ::testing::Combine(::testing::Values(string("gpu/opticalflow/rubberwhale1.png"), + string("gpu/stereobm/aloe-L.png")), + ::testing::Range(0.0, 4.0, 3.0))) +{ + std::vector pts_gold; - cv::ocl::GoodFeaturesToTrackDetector_OCL detector(maxCorners, qualityLevel, minDistance); + // getting params + GoodFeaturesToTrackParams param = GetParam(); + const string fileName = getDataPath(get<0>(param)), impl = getSelectedImpl(); + const int maxCorners = 2000; + const double qualityLevel = 0.01, minDistance = get<1>(param); - ocl::oclMat frame_ocl(frame), pts_oclmat; + Mat frame = imread(fileName, IMREAD_GRAYSCALE); + declare.in(frame); + ASSERT_TRUE(!frame.empty()) << "no input image"; - WARMUP_ON; - detector(frame_ocl, pts_oclmat); - WARMUP_OFF; + if (impl == "ocl") + { + ocl::oclMat oclFrame(frame), pts_oclmat; + cv::ocl::GoodFeaturesToTrackDetector_OCL detector(maxCorners, qualityLevel, minDistance); - detector.downloadPoints(pts_oclmat, pts_ocl); + TEST_CYCLE() detector(oclFrame, pts_oclmat); - double diff = abs(static_cast(pts_gold.size() - pts_ocl.size())); - TestSystem::instance().setAccurate(diff == 0.0, diff); + detector.downloadPoints(pts_oclmat, pts_gold); - GPU_ON; - detector(frame_ocl, pts_oclmat); - GPU_OFF; + SANITY_CHECK(pts_gold); + } + else if (impl == "plain") + { + TEST_CYCLE() cv::goodFeaturesToTrack(frame, pts_gold, + maxCorners, qualityLevel, minDistance); - GPU_FULL_ON; - frame_ocl.upload(frame); - detector(frame_ocl, pts_oclmat); - detector.downloadPoints(pts_oclmat, pts_ocl); - GPU_FULL_OFF; - } + SANITY_CHECK(pts_gold); } + #ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); } diff --git a/modules/ocl/perf/perf_haar.cpp b/modules/ocl/perf/perf_haar.cpp index ea1a4745a5..38917a0704 100644 --- a/modules/ocl/perf/perf_haar.cpp +++ b/modules/ocl/perf/perf_haar.cpp @@ -45,6 +45,8 @@ //M*/ #include "perf_precomp.hpp" +using namespace perf; + ///////////// Haar //////////////////////// namespace cv { @@ -83,61 +85,45 @@ public: } } -PERFTEST(Haar) -{ - Mat img = imread(abspath("basketball1.png"), CV_LOAD_IMAGE_GRAYSCALE); - if (img.empty()) - { - throw runtime_error("can't open basketball1.png"); - } +PERF_TEST(HaarFixture, Haar) +{ + const std::string impl = getSelectedImpl(); + vector faces; - CascadeClassifier faceCascadeCPU; + Mat img = imread(getDataPath("gpu/haarcascade/basketball1.png"), CV_LOAD_IMAGE_GRAYSCALE); + ASSERT_TRUE(!img.empty()) << "can't open basketball1.png"; + declare.in(img); - if (!faceCascadeCPU.load(abspath("haarcascade_frontalface_alt.xml"))) + if (impl == "plain") { - throw runtime_error("can't load haarcascade_frontalface_alt.xml"); - } + CascadeClassifier faceCascade; + ASSERT_TRUE(faceCascade.load(getDataPath("gpu/haarcascade/haarcascade_frontalface_alt.xml"))) + << "can't load haarcascade_frontalface_alt.xml"; - vector faces; + TEST_CYCLE() faceCascade.detectMultiScale(img, faces, + 1.1, 2, 0 | CV_HAAR_SCALE_IMAGE, Size(30, 30)); - SUBTEST << img.cols << "x" << img.rows << "; scale image"; - CPU_ON; - faceCascadeCPU.detectMultiScale(img, faces, - 1.1, 2, 0 | CV_HAAR_SCALE_IMAGE, Size(30, 30)); - CPU_OFF; + SANITY_CHECK(faces, 4 + 1e-4); + } + else if (impl == "ocl") + { + ocl::CascadeClassifier_GPU faceCascade; + ocl::oclMat oclImg(img); + ASSERT_TRUE(faceCascade.load(getDataPath("gpu/haarcascade/haarcascade_frontalface_alt.xml"))) + << "can't load haarcascade_frontalface_alt.xml"; - vector oclfaces; - ocl::CascadeClassifier_GPU faceCascade; + TEST_CYCLE() faceCascade.detectMultiScale(oclImg, faces, + 1.1, 2, 0 | CV_HAAR_SCALE_IMAGE, Size(30, 30)); - if (!faceCascade.load(abspath("haarcascade_frontalface_alt.xml"))) - { - throw runtime_error("can't load haarcascade_frontalface_alt.xml"); + SANITY_CHECK(faces, 4 + 1e-4); } - ocl::oclMat d_img(img); - - WARMUP_ON; - faceCascade.detectMultiScale(d_img, oclfaces, - 1.1, 2, 0 | CV_HAAR_SCALE_IMAGE, Size(30, 30)); - WARMUP_OFF; - - if(faces.size() == oclfaces.size()) - TestSystem::instance().setAccurate(1, 0); +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif else - TestSystem::instance().setAccurate(0, abs((int)faces.size() - (int)oclfaces.size())); - - faces.clear(); - - GPU_ON; - faceCascade.detectMultiScale(d_img, oclfaces, - 1.1, 2, 0 | CV_HAAR_SCALE_IMAGE, Size(30, 30)); - GPU_OFF; - - GPU_FULL_ON; - d_img.upload(img); - faceCascade.detectMultiScale(d_img, oclfaces, - 1.1, 2, 0 | CV_HAAR_SCALE_IMAGE, Size(30, 30)); - GPU_FULL_OFF; + CV_TEST_FAIL_NO_IMPL(); } diff --git a/modules/ocl/perf/perf_hog.cpp b/modules/ocl/perf/perf_hog.cpp index e6d85b5dc0..9f0dab9045 100644 --- a/modules/ocl/perf/perf_hog.cpp +++ b/modules/ocl/perf/perf_hog.cpp @@ -45,50 +45,42 @@ //M*/ #include "perf_precomp.hpp" +using namespace perf; + ///////////// HOG//////////////////////// -PERFTEST(HOG) +PERF_TEST(HOGFixture, HOG) { - Mat src = imread(abspath("road.png"), cv::IMREAD_GRAYSCALE); - - if (src.empty()) - { - throw runtime_error("can't open road.png"); - } + Mat src = imread(getDataPath("gpu/hog/road.png"), cv::IMREAD_GRAYSCALE); + ASSERT_TRUE(!src.empty()) << "can't open input image road.png"; - cv::HOGDescriptor hog; - hog.setSVMDetector(hog.getDefaultPeopleDetector()); + const std::string impl = getSelectedImpl(); std::vector found_locations; - std::vector d_found_locations; - - SUBTEST << src.cols << 'x' << src.rows << "; road.png"; + declare.in(src).time(5); - hog.detectMultiScale(src, found_locations); + if (impl == "plain") + { + cv::HOGDescriptor hog; + hog.setSVMDetector(hog.getDefaultPeopleDetector()); - CPU_ON; - hog.detectMultiScale(src, found_locations); - CPU_OFF; + TEST_CYCLE() hog.detectMultiScale(src, found_locations); - cv::ocl::HOGDescriptor ocl_hog; - ocl_hog.setSVMDetector(ocl_hog.getDefaultPeopleDetector()); - ocl::oclMat d_src; - d_src.upload(src); + SANITY_CHECK(found_locations, 1 + DBL_EPSILON); + } + else if (impl == "ocl") + { + cv::ocl::HOGDescriptor ocl_hog; + ocl_hog.setSVMDetector(ocl_hog.getDefaultPeopleDetector()); + ocl::oclMat oclSrc(src); - WARMUP_ON; - ocl_hog.detectMultiScale(d_src, d_found_locations); - WARMUP_OFF; + TEST_CYCLE() ocl_hog.detectMultiScale(oclSrc, found_locations); - if(d_found_locations.size() == found_locations.size()) - TestSystem::instance().setAccurate(1, 0); + SANITY_CHECK(found_locations, 1 + DBL_EPSILON); + } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif else - TestSystem::instance().setAccurate(0, abs((int)found_locations.size() - (int)d_found_locations.size())); - - GPU_ON; - ocl_hog.detectMultiScale(d_src, found_locations); - GPU_OFF; - - GPU_FULL_ON; - d_src.upload(src); - ocl_hog.detectMultiScale(d_src, found_locations); - GPU_FULL_OFF; + CV_TEST_FAIL_NO_IMPL(); } diff --git a/modules/ocl/perf/perf_imgproc.cpp b/modules/ocl/perf/perf_imgproc.cpp index 2ed64ce325..b33307818f 100644 --- a/modules/ocl/perf/perf_imgproc.cpp +++ b/modules/ocl/perf/perf_imgproc.cpp @@ -45,295 +45,299 @@ //M*/ #include "perf_precomp.hpp" -///////////// equalizeHist //////////////////////// -PERFTEST(equalizeHist) -{ - Mat src, dst, ocl_dst; - int all_type[] = {CV_8UC1}; - std::string type_name[] = {"CV_8UC1"}; +using namespace perf; +using std::tr1::tuple; +using std::tr1::get; - for (int size = Min_Size; size <= Max_Size; size *= Multiple) - { - for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) - { - SUBTEST << size << 'x' << size << "; " << type_name[j] ; - - gen(src, size, size, all_type[j], 0, 256); - - equalizeHist(src, dst); +///////////// equalizeHist //////////////////////// - CPU_ON; - equalizeHist(src, dst); - CPU_OFF; +typedef TestBaseWithParam equalizeHistFixture; - ocl::oclMat d_src(src); - ocl::oclMat d_dst; - ocl::oclMat d_hist; - ocl::oclMat d_buf; +PERF_TEST_P(equalizeHistFixture, equalizeHist, OCL_TYPICAL_MAT_SIZES) +{ + // getting params + const Size srcSize = GetParam(); + const string impl = getSelectedImpl(); - WARMUP_ON; - ocl::equalizeHist(d_src, d_dst); - WARMUP_OFF; + // creating src data + Mat src(srcSize, CV_8UC1), dst(srcSize, CV_8UC1); + declare.in(src, WARMUP_RNG).out(dst); - GPU_ON; - ocl::equalizeHist(d_src, d_dst); - GPU_OFF; + // select implementation + if (impl == "ocl") + { + ocl::oclMat oclSrc(src), oclDst(srcSize, src.type()); - GPU_FULL_ON; - d_src.upload(src); - ocl::equalizeHist(d_src, d_dst); - d_dst.download(ocl_dst); - GPU_FULL_OFF; + TEST_CYCLE() cv::ocl::equalizeHist(oclSrc, oclDst); - TestSystem::instance().ExpectedMatNear(dst, ocl_dst, 1.1); - } + oclDst.download(dst); + SANITY_CHECK(dst, 1 + DBL_EPSILON); } -} -/////////// CopyMakeBorder ////////////////////// -PERFTEST(CopyMakeBorder) -{ - Mat src, dst, ocl_dst; - ocl::oclMat d_dst; - - int bordertype = BORDER_CONSTANT; - int all_type[] = {CV_8UC1, CV_8UC4}; - std::string type_name[] = {"CV_8UC1", "CV_8UC4"}; - - for (int size = Min_Size; size <= Max_Size; size *= Multiple) + else if (impl == "plain") { - for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) - { - SUBTEST << size << 'x' << size << "; " << type_name[j] ; + TEST_CYCLE() cv::equalizeHist(src, dst); + SANITY_CHECK(dst, 1 + DBL_EPSILON); + } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); +} - gen(src, size, size, all_type[j], 0, 256); - - copyMakeBorder(src, dst, 7, 5, 5, 7, bordertype, cv::Scalar(1.0)); +/////////// CopyMakeBorder ////////////////////// - CPU_ON; - copyMakeBorder(src, dst, 7, 5, 5, 7, bordertype, cv::Scalar(1.0)); - CPU_OFF; +CV_ENUM(CopyMakeBorderMatType, CV_8UC1, CV_8UC4) - ocl::oclMat d_src(src); +typedef tuple CopyMakeBorderParams; +typedef TestBaseWithParam CopyMakeBorderFixture; - WARMUP_ON; - ocl::copyMakeBorder(d_src, d_dst, 7, 5, 5, 7, bordertype, cv::Scalar(1.0)); - WARMUP_OFF; +PERF_TEST_P(CopyMakeBorderFixture, CopyMakeBorder, + ::testing::Combine(OCL_TYPICAL_MAT_SIZES, + CopyMakeBorderMatType::all())) +{ + // getting params + CopyMakeBorderParams params = GetParam(); + const Size srcSize = get<0>(params); + const int type = get<1>(params), borderType = BORDER_CONSTANT; + const string impl = getSelectedImpl(); + + // creating src data + Mat src(srcSize, type), dst; + const Size dstSize = srcSize + Size(12, 12); + dst.create(dstSize, type); + declare.in(src, WARMUP_RNG).out(dst); + + // select implementation + if (impl == "ocl") + { + ocl::oclMat oclSrc(src), oclDst(dstSize, type); - GPU_ON; - ocl::copyMakeBorder(d_src, d_dst, 7, 5, 5, 7, bordertype, cv::Scalar(1.0)); - GPU_OFF; + TEST_CYCLE() cv::ocl::copyMakeBorder(oclSrc, oclDst, 7, 5, 5, 7, borderType, cv::Scalar(1.0)); - GPU_FULL_ON; - d_src.upload(src); - ocl::copyMakeBorder(d_src, d_dst, 7, 5, 5, 7, bordertype, cv::Scalar(1.0)); - d_dst.download(ocl_dst); - GPU_FULL_OFF; + oclDst.download(dst); - TestSystem::instance().ExpectedMatNear(dst, ocl_dst, 0.0); - } + SANITY_CHECK(dst); + } + else if (impl == "plain") + { + TEST_CYCLE() cv::copyMakeBorder(src, dst, 7, 5, 5, 7, borderType, cv::Scalar(1.0)); + SANITY_CHECK(dst); } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); } -///////////// cornerMinEigenVal //////////////////////// -PERFTEST(cornerMinEigenVal) -{ - Mat src, dst, ocl_dst; - ocl::oclMat d_dst; - int blockSize = 7, apertureSize = 1 + 2 * (rand() % 4); - int borderType = BORDER_REFLECT; - int all_type[] = {CV_8UC1, CV_32FC1}; - std::string type_name[] = {"CV_8UC1", "CV_32FC1"}; +///////////// cornerMinEigenVal //////////////////////// - for (int size = Min_Size; size <= Max_Size; size *= Multiple) - { - for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) - { - SUBTEST << size << 'x' << size << "; " << type_name[j] ; +CV_ENUM(cornerMinEigenValMatType, CV_8UC1, CV_32FC1) - gen(src, size, size, all_type[j], 0, 256); +typedef tuple cornerMinEigenValParams; +typedef TestBaseWithParam cornerMinEigenValFixture; - cornerMinEigenVal(src, dst, blockSize, apertureSize, borderType); +PERF_TEST_P(cornerMinEigenValFixture, cornerMinEigenVal, + ::testing::Combine(OCL_TYPICAL_MAT_SIZES, + cornerMinEigenValMatType::all())) +{ + // getting params + cornerMinEigenValParams params = GetParam(); + const Size srcSize = get<0>(params); + const int type = get<1>(params), borderType = BORDER_REFLECT; + const int blockSize = 7, apertureSize = 1 + 2 * 3; - CPU_ON; - cornerMinEigenVal(src, dst, blockSize, apertureSize, borderType); - CPU_OFF; + const string impl = getSelectedImpl(); - ocl::oclMat d_src(src); + // creating src data + Mat src(srcSize, type), dst(srcSize, CV_32FC1); + declare.in(src, WARMUP_RNG).out(dst) + .time(srcSize == OCL_SIZE_4000 ? 20 : srcSize == OCL_SIZE_2000 ? 5 : 3); - WARMUP_ON; - ocl::cornerMinEigenVal(d_src, d_dst, blockSize, apertureSize, borderType); - WARMUP_OFF; + const int depth = CV_MAT_DEPTH(type); + const ERROR_TYPE errorType = depth == CV_8U ? ERROR_ABSOLUTE : ERROR_RELATIVE; - GPU_ON; - ocl::cornerMinEigenVal(d_src, d_dst, blockSize, apertureSize, borderType); - GPU_OFF; + // select implementation + if (impl == "ocl") + { + ocl::oclMat oclSrc(src), oclDst(srcSize, CV_32FC1); - GPU_FULL_ON; - d_src.upload(src); - ocl::cornerMinEigenVal(d_src, d_dst, blockSize, apertureSize, borderType); - d_dst.download(ocl_dst); - GPU_FULL_OFF; + TEST_CYCLE() cv::ocl::cornerMinEigenVal(oclSrc, oclDst, blockSize, apertureSize, borderType); - TestSystem::instance().ExpectedMatNear(dst, ocl_dst, 1.0); - } + oclDst.download(dst); + SANITY_CHECK(dst, 1e-6, errorType); } -} -///////////// cornerHarris //////////////////////// -PERFTEST(cornerHarris) -{ - Mat src, dst, ocl_dst; - ocl::oclMat d_src, d_dst; - - int all_type[] = {CV_8UC1, CV_32FC1}; - std::string type_name[] = {"CV_8UC1", "CV_32FC1"}; - - for (int size = Min_Size; size <= Max_Size; size *= Multiple) + else if (impl == "plain") { - for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) - { - SUBTEST << size << 'x' << size << "; " << type_name[j] << " ; BORDER_REFLECT"; + TEST_CYCLE() cv::cornerMinEigenVal(src, dst, blockSize, apertureSize, borderType); - gen(src, size, size, all_type[j], 0, 1); + SANITY_CHECK(dst, 1e-6, errorType); + } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); +} - cornerHarris(src, dst, 5, 7, 0.1, BORDER_REFLECT); +///////////// cornerHarris //////////////////////// - CPU_ON; - cornerHarris(src, dst, 5, 7, 0.1, BORDER_REFLECT); - CPU_OFF; +typedef cornerMinEigenValMatType cornerHarrisMatType; +typedef tuple cornerHarrisParams; +typedef TestBaseWithParam cornerHarrisFixture; - d_src.upload(src); +PERF_TEST_P(cornerHarrisFixture, cornerHarris, + ::testing::Combine(OCL_TYPICAL_MAT_SIZES, + cornerHarrisMatType::all())) +{ + // getting params + cornerHarrisParams params = GetParam(); + const Size srcSize = get<0>(params); + const int type = get<1>(params), borderType = BORDER_REFLECT; - WARMUP_ON; - ocl::cornerHarris(d_src, d_dst, 5, 7, 0.1, BORDER_REFLECT); - WARMUP_OFF; + const string impl = getSelectedImpl(); - GPU_ON; - ocl::cornerHarris(d_src, d_dst, 5, 7, 0.1, BORDER_REFLECT); - GPU_OFF; + // creating src data + Mat src(srcSize, type), dst(srcSize, CV_32FC1); + randu(src, 0, 1); + declare.in(src).out(dst) + .time(srcSize == OCL_SIZE_4000 ? 20 : srcSize == OCL_SIZE_2000 ? 5 : 3); - GPU_FULL_ON; - d_src.upload(src); - ocl::cornerHarris(d_src, d_dst, 5, 7, 0.1, BORDER_REFLECT); - d_dst.download(ocl_dst); - GPU_FULL_OFF; + // select implementation + if (impl == "ocl") + { + ocl::oclMat oclSrc(src), oclDst(srcSize, CV_32FC1); - TestSystem::instance().ExpectedMatNear(dst, ocl_dst, 1.0); - } + TEST_CYCLE() cv::ocl::cornerHarris(oclSrc, oclDst, 5, 7, 0.1, borderType); + oclDst.download(dst); + SANITY_CHECK(dst, 3e-5); } -} -///////////// integral //////////////////////// -PERFTEST(integral) -{ - Mat src, sum, ocl_sum; - ocl::oclMat d_src, d_sum, d_buf; - - int all_type[] = {CV_8UC1}; - std::string type_name[] = {"CV_8UC1"}; - - for (int size = Min_Size; size <= Max_Size; size *= Multiple) + else if (impl == "plain") { - for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) - { - SUBTEST << size << 'x' << size << "; " << type_name[j] ; + TEST_CYCLE() cv::cornerHarris(src, dst, 5, 7, 0.1, borderType); - gen(src, size, size, all_type[j], 0, 256); + SANITY_CHECK(dst, 3e-5); + } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); +} - integral(src, sum); +///////////// integral //////////////////////// - CPU_ON; - integral(src, sum); - CPU_OFF; +typedef TestBaseWithParam integralFixture; - d_src.upload(src); +PERF_TEST_P(integralFixture, DISABLED_integral, OCL_TYPICAL_MAT_SIZES) +{ + // getting params + const Size srcSize = GetParam(); + const string impl = getSelectedImpl(); - WARMUP_ON; - ocl::integral(d_src, d_sum); - WARMUP_OFF; + // creating src data + Mat src(srcSize, CV_8UC1), dst; + declare.in(src, WARMUP_RNG); - GPU_ON; - ocl::integral(d_src, d_sum); - GPU_OFF; + // select implementation + if (impl == "ocl") + { + ocl::oclMat oclSrc(src), oclDst; - GPU_FULL_ON; - d_src.upload(src); - ocl::integral(d_src, d_sum); - d_sum.download(ocl_sum); - GPU_FULL_OFF; + TEST_CYCLE() cv::ocl::integral(oclSrc, oclDst); - if(sum.type() == ocl_sum.type()) //we won't test accuracy when cpu function overlow - TestSystem::instance().ExpectedMatNear(sum, ocl_sum, 0.0); + oclDst.download(dst); - } + SANITY_CHECK(dst); + } + else if (impl == "plain") + { + TEST_CYCLE() cv::integral(src, dst); + SANITY_CHECK(dst); } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); } + ///////////// WarpAffine //////////////////////// -PERFTEST(WarpAffine) -{ - Mat src, dst, ocl_dst; - ocl::oclMat d_src, d_dst; +typedef CopyMakeBorderMatType WarpAffineMatType; +typedef tuple WarpAffineParams; +typedef TestBaseWithParam WarpAffineFixture; + +PERF_TEST_P(WarpAffineFixture, WarpAffine, + ::testing::Combine(OCL_TYPICAL_MAT_SIZES, + WarpAffineMatType::all())) +{ static const double coeffs[2][3] = { - {cos(CV_PI / 6), -sin(CV_PI / 6), 100.0}, - {sin(CV_PI / 6), cos(CV_PI / 6), -100.0} + { cos(CV_PI / 6), -sin(CV_PI / 6), 100.0 }, + { sin(CV_PI / 6), cos(CV_PI / 6), -100.0 } }; Mat M(2, 3, CV_64F, (void *)coeffs); - int interpolation = INTER_NEAREST; + const int interpolation = INTER_NEAREST; - int all_type[] = {CV_8UC1, CV_8UC4}; - std::string type_name[] = {"CV_8UC1", "CV_8UC4"}; + // getting params + WarpAffineParams params = GetParam(); + const Size srcSize = get<0>(params); + const int type = get<1>(params); + const string impl = getSelectedImpl(); + // creating src data + Mat src(srcSize, type), dst(srcSize, type); + declare.in(src, WARMUP_RNG).out(dst); - for (int size = Min_Size; size <= Max_Size; size *= Multiple) + // select implementation + if (impl == "ocl") { - for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) - { - SUBTEST << size << 'x' << size << "; " << type_name[j] ; - - gen(src, size, size, all_type[j], 0, 256); - gen(dst, size, size, all_type[j], 0, 256); - Size size1 = Size(size, size); - - warpAffine(src, dst, M, size1, interpolation); - - CPU_ON; - warpAffine(src, dst, M, size1, interpolation); - CPU_OFF; - - d_src.upload(src); + ocl::oclMat oclSrc(src), oclDst(srcSize, type); - WARMUP_ON; - ocl::warpAffine(d_src, d_dst, M, size1, interpolation); - WARMUP_OFF; + TEST_CYCLE() cv::ocl::warpAffine(oclSrc, oclDst, M, srcSize, interpolation); - GPU_ON; - ocl::warpAffine(d_src, d_dst, M, size1, interpolation); - GPU_OFF; + oclDst.download(dst); - GPU_FULL_ON; - d_src.upload(src); - ocl::warpAffine(d_src, d_dst, M, size1, interpolation); - d_dst.download(ocl_dst); - GPU_FULL_OFF; - - TestSystem::instance().ExpectedMatNear(dst, ocl_dst, 1.0); - } + SANITY_CHECK(dst); + } + else if (impl == "plain") + { + TEST_CYCLE() cv::warpAffine(src, dst, M, srcSize, interpolation); + SANITY_CHECK(dst); } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); } + ///////////// WarpPerspective //////////////////////// -PERFTEST(WarpPerspective) -{ - Mat src, dst, ocl_dst; - ocl::oclMat d_src, d_dst; +typedef CopyMakeBorderMatType WarpPerspectiveMatType; +typedef tuple WarpPerspectiveParams; +typedef TestBaseWithParam WarpPerspectiveFixture; + +PERF_TEST_P(WarpPerspectiveFixture, WarpPerspective, + ::testing::Combine(OCL_TYPICAL_MAT_SIZES, + WarpPerspectiveMatType::all())) +{ static const double coeffs[3][3] = { {cos(CV_PI / 6), -sin(CV_PI / 6), 100.0}, @@ -341,199 +345,154 @@ PERFTEST(WarpPerspective) {0.0, 0.0, 1.0} }; Mat M(3, 3, CV_64F, (void *)coeffs); - int interpolation = INTER_LINEAR; - - int all_type[] = {CV_8UC1, CV_8UC4}; - std::string type_name[] = {"CV_8UC1", "CV_8UC4"}; - - for (int size = Min_Size; size <= Max_Size; size *= Multiple) - { - for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) - { - SUBTEST << size << 'x' << size << "; " << type_name[j] ; - - gen(src, size, size, all_type[j], 0, 256); - gen(dst, size, size, all_type[j], 0, 256); - Size size1 = Size(size, size); - - warpPerspective(src, dst, M, size1, interpolation); + const int interpolation = INTER_LINEAR; - CPU_ON; - warpPerspective(src, dst, M, size1, interpolation); - CPU_OFF; + // getting params + WarpPerspectiveParams params = GetParam(); + const Size srcSize = get<0>(params); + const int type = get<1>(params); + const string impl = getSelectedImpl(); - d_src.upload(src); + // creating src data + Mat src(srcSize, type), dst(srcSize, type); + declare.in(src, WARMUP_RNG).out(dst) + .time(srcSize == OCL_SIZE_4000 ? 18 : srcSize == OCL_SIZE_2000 ? 5 : 2); - WARMUP_ON; - ocl::warpPerspective(d_src, d_dst, M, size1, interpolation); - WARMUP_OFF; + // select implementation + if (impl == "ocl") + { + ocl::oclMat oclSrc(src), oclDst(srcSize, type); - GPU_ON; - ocl::warpPerspective(d_src, d_dst, M, size1, interpolation); - GPU_OFF; + TEST_CYCLE() cv::ocl::warpPerspective(oclSrc, oclDst, M, srcSize, interpolation); - GPU_FULL_ON; - d_src.upload(src); - ocl::warpPerspective(d_src, d_dst, M, size1, interpolation); - d_dst.download(ocl_dst); - GPU_FULL_OFF; + oclDst.download(dst); - TestSystem::instance().ExpectedMatNear(dst, ocl_dst, 1.0); - } + SANITY_CHECK(dst); + } + else if (impl == "plain") + { + TEST_CYCLE() cv::warpPerspective(src, dst, M, srcSize, interpolation); + SANITY_CHECK(dst); } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); } ///////////// resize //////////////////////// -PERFTEST(resize) -{ - Mat src, dst, ocl_dst; - ocl::oclMat d_src, d_dst; +CV_ENUM(resizeInterType, INTER_NEAREST, INTER_LINEAR) - int all_type[] = {CV_8UC1, CV_8UC4}; - std::string type_name[] = {"CV_8UC1", "CV_8UC4"}; +typedef CopyMakeBorderMatType resizeMatType; +typedef tuple resizeParams; +typedef TestBaseWithParam resizeFixture; - for (int size = Min_Size; size <= Max_Size; size *= Multiple) +PERF_TEST_P(resizeFixture, resize, + ::testing::Combine(OCL_TYPICAL_MAT_SIZES, + resizeMatType::all(), + resizeInterType::all(), + ::testing::Values(0.5, 2.0))) +{ + // getting params + resizeParams params = GetParam(); + const Size srcSize = get<0>(params); + const int type = get<1>(params), interType = get<2>(params); + double scale = get<3>(params); + const string impl = getSelectedImpl(); + + // creating src data + Mat src(srcSize, type), dst; + const Size dstSize(cvRound(srcSize.width * scale), cvRound(srcSize.height * scale)); + dst.create(dstSize, type); + declare.in(src, WARMUP_RNG).out(dst); + if (interType == INTER_LINEAR && type == CV_8UC4 && OCL_SIZE_4000 == srcSize) + declare.time(11); + + // select implementation + if (impl == "ocl") { - for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) - { - SUBTEST << size << 'x' << size << "; " << type_name[j] << " ; up"; - - gen(src, size, size, all_type[j], 0, 256); + ocl::oclMat oclSrc(src), oclDst(dstSize, type); - resize(src, dst, Size(), 2.0, 2.0); + TEST_CYCLE() cv::ocl::resize(oclSrc, oclDst, Size(), scale, scale, interType); - CPU_ON; - resize(src, dst, Size(), 2.0, 2.0); - CPU_OFF; - - d_src.upload(src); - - WARMUP_ON; - ocl::resize(d_src, d_dst, Size(), 2.0, 2.0); - WARMUP_OFF; - - GPU_ON; - ocl::resize(d_src, d_dst, Size(), 2.0, 2.0); - GPU_OFF; - - GPU_FULL_ON; - d_src.upload(src); - ocl::resize(d_src, d_dst, Size(), 2.0, 2.0); - d_dst.download(ocl_dst); - GPU_FULL_OFF; - - TestSystem::instance().ExpectedMatNear(dst, ocl_dst, 1.0); - } + oclDst.download(dst); + SANITY_CHECK(dst, 1 + DBL_EPSILON); } - - for (int size = Min_Size; size <= Max_Size; size *= Multiple) + else if (impl == "plain") { - for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) - { - SUBTEST << size << 'x' << size << "; " << type_name[j] << " ; down"; - - gen(src, size, size, all_type[j], 0, 256); - - resize(src, dst, Size(), 0.5, 0.5); - - CPU_ON; - resize(src, dst, Size(), 0.5, 0.5); - CPU_OFF; - - d_src.upload(src); - - WARMUP_ON; - ocl::resize(d_src, d_dst, Size(), 0.5, 0.5); - WARMUP_OFF; - - GPU_ON; - ocl::resize(d_src, d_dst, Size(), 0.5, 0.5); - GPU_OFF; - - GPU_FULL_ON; - d_src.upload(src); - ocl::resize(d_src, d_dst, Size(), 0.5, 0.5); - d_dst.download(ocl_dst); - GPU_FULL_OFF; - - TestSystem::instance().ExpectedMatNear(dst, ocl_dst, 1.0); - } + TEST_CYCLE() cv::resize(src, dst, Size(), scale, scale, interType); + SANITY_CHECK(dst, 1 + DBL_EPSILON); } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); } -///////////// threshold//////////////////////// -PERFTEST(threshold) -{ - Mat src, dst, ocl_dst; - ocl::oclMat d_src, d_dst; - - for (int size = Min_Size; size <= Max_Size; size *= Multiple) - { - SUBTEST << size << 'x' << size << "; 8UC1; THRESH_BINARY"; - gen(src, size, size, CV_8U, 0, 100); - - threshold(src, dst, 50.0, 0.0, THRESH_BINARY); +///////////// threshold//////////////////////// - CPU_ON; - threshold(src, dst, 50.0, 0.0, THRESH_BINARY); - CPU_OFF; +CV_ENUM(ThreshType, THRESH_BINARY, THRESH_TRUNC) - d_src.upload(src); +typedef tuple ThreshParams; +typedef TestBaseWithParam ThreshFixture; - WARMUP_ON; - ocl::threshold(d_src, d_dst, 50.0, 0.0, THRESH_BINARY); - WARMUP_OFF; +PERF_TEST_P(ThreshFixture, threshold, + ::testing::Combine(OCL_TYPICAL_MAT_SIZES, + ThreshType::all())) +{ + // getting params + ThreshParams params = GetParam(); + const Size srcSize = get<0>(params); + const int threshType = get<1>(params); + const string impl = getSelectedImpl(); + + // creating src data + Mat src(srcSize, CV_8U), dst(srcSize, CV_8U); + randu(src, 0, 100); + declare.in(src).out(dst); + + // select implementation + if (impl == "ocl") + { + ocl::oclMat oclSrc(src), oclDst(srcSize, CV_8U); - GPU_ON; - ocl::threshold(d_src, d_dst, 50.0, 0.0, THRESH_BINARY); - GPU_OFF; + TEST_CYCLE() cv::ocl::threshold(oclSrc, oclDst, 50.0, 0.0, threshType); - GPU_FULL_ON; - d_src.upload(src); - ocl::threshold(d_src, d_dst, 50.0, 0.0, THRESH_BINARY); - d_dst.download(ocl_dst); - GPU_FULL_OFF; + oclDst.download(dst); - TestSystem::instance().ExpectedMatNear(dst, ocl_dst, 1.0); + SANITY_CHECK(dst); } - - for (int size = Min_Size; size <= Max_Size; size *= Multiple) + else if (impl == "plain") { - SUBTEST << size << 'x' << size << "; 32FC1; THRESH_TRUNC [NPP]"; - - gen(src, size, size, CV_32FC1, 0, 100); - - threshold(src, dst, 50.0, 0.0, THRESH_TRUNC); - - CPU_ON; - threshold(src, dst, 50.0, 0.0, THRESH_TRUNC); - CPU_OFF; - - d_src.upload(src); + TEST_CYCLE() cv::threshold(src, dst, 50.0, 0.0, threshType); - WARMUP_ON; - ocl::threshold(d_src, d_dst, 50.0, 0.0, THRESH_TRUNC); - WARMUP_OFF; - - GPU_ON; - ocl::threshold(d_src, d_dst, 50.0, 0.0, THRESH_TRUNC); - GPU_OFF; - - GPU_FULL_ON; - d_src.upload(src); - ocl::threshold(d_src, d_dst, 50.0, 0.0, THRESH_TRUNC); - d_dst.download(ocl_dst); - GPU_FULL_OFF; - - TestSystem::instance().ExpectedMatNear(dst, ocl_dst, 1.0); + SANITY_CHECK(dst); } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); } + ///////////// meanShiftFiltering//////////////////////// -COOR do_meanShift(int x0, int y0, uchar *sptr, uchar *dptr, int sstep, cv::Size size, int sp, int sr, int maxIter, float eps, int *tab) + +typedef struct +{ + short x; + short y; +} COOR; + +static COOR do_meanShift(int x0, int y0, uchar *sptr, uchar *dptr, int sstep, cv::Size size, int sp, int sr, int maxIter, float eps, int *tab) { int isr2 = sr * sr; @@ -715,48 +674,46 @@ static void meanShiftFiltering_(const Mat &src_roi, Mat &dst_roi, int sp, int sr } } -PERFTEST(meanShiftFiltering) +typedef TestBaseWithParam meanShiftFilteringFixture; + +PERF_TEST_P(meanShiftFilteringFixture, meanShiftFiltering, + OCL_TYPICAL_MAT_SIZES) { - int sp = 5, sr = 6; - Mat src, dst, ocl_dst; + const Size srcSize = GetParam(); + const int sp = 5, sr = 6; + const string impl = getSelectedImpl(); + cv::TermCriteria crit(cv::TermCriteria::COUNT + cv::TermCriteria::EPS, 5, 1); - ocl::oclMat d_src, d_dst; + Mat src(srcSize, CV_8UC4), dst(srcSize, CV_8UC4); + declare.in(src, WARMUP_RNG).out(dst) + .time(srcSize == OCL_SIZE_4000 ? + 56 : srcSize == OCL_SIZE_2000 ? 15 : 3.8); - for (int size = Min_Size; size <= Max_Size; size *= Multiple) + if (impl == "plain") { - SUBTEST << size << 'x' << size << "; 8UC3 vs 8UC4"; - - gen(src, size, size, CV_8UC4, Scalar::all(0), Scalar::all(256)); - - cv::TermCriteria crit(cv::TermCriteria::COUNT + cv::TermCriteria::EPS, 5, 1); - - meanShiftFiltering_(src, dst, sp, sr, crit); + TEST_CYCLE() meanShiftFiltering_(src, dst, sp, sr, crit); - CPU_ON; - meanShiftFiltering_(src, dst, sp, sr, crit); - CPU_OFF; - - d_src.upload(src); - - WARMUP_ON; - ocl::meanShiftFiltering(d_src, d_dst, sp, sr, crit); - WARMUP_OFF; + SANITY_CHECK(dst); + } + else if (impl == "ocl") + { + ocl::oclMat oclSrc(src), oclDst(srcSize, CV_8UC4); - GPU_ON; - ocl::meanShiftFiltering(d_src, d_dst, sp, sr, crit); - GPU_OFF; + TEST_CYCLE() ocl::meanShiftFiltering(oclSrc, oclDst, sp, sr, crit); - GPU_FULL_ON; - d_src.upload(src); - ocl::meanShiftFiltering(d_src, d_dst, sp, sr, crit); - d_dst.download(ocl_dst); - GPU_FULL_OFF; + oclDst.download(dst); - TestSystem::instance().ExpectedMatNear(dst, ocl_dst, 0.0); + SANITY_CHECK(dst); } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); } -void meanShiftProc_(const Mat &src_roi, Mat &dst_roi, Mat &dstCoor_roi, int sp, int sr, cv::TermCriteria crit) +static void meanShiftProc_(const Mat &src_roi, Mat &dst_roi, Mat &dstCoor_roi, int sp, int sr, cv::TermCriteria crit) { if (src_roi.empty()) { @@ -814,200 +771,213 @@ void meanShiftProc_(const Mat &src_roi, Mat &dst_roi, Mat &dstCoor_roi, int sp, } } -PERFTEST(meanShiftProc) -{ - Mat src; - vector dst(2), ocl_dst(2); - ocl::oclMat d_src, d_dst, d_dstCoor; - TermCriteria crit(TermCriteria::COUNT + TermCriteria::EPS, 5, 1); - - for (int size = Min_Size; size <= Max_Size; size *= Multiple) - { - SUBTEST << size << 'x' << size << "; 8UC4 and CV_16SC2 "; - - gen(src, size, size, CV_8UC4, Scalar::all(0), Scalar::all(256)); +typedef TestBaseWithParam meanShiftProcFixture; - meanShiftProc_(src, dst[0], dst[1], 5, 6, crit); +PERF_TEST_P(meanShiftProcFixture, meanShiftProc, + OCL_TYPICAL_MAT_SIZES) +{ + const Size srcSize = GetParam(); + const string impl = getSelectedImpl(); + TermCriteria crit(TermCriteria::COUNT + TermCriteria::EPS, 5, 1); - CPU_ON; - meanShiftProc_(src, dst[0], dst[1], 5, 6, crit); - CPU_OFF; + Mat src(srcSize, CV_8UC4), dst1(srcSize, CV_8UC4), + dst2(srcSize, CV_16SC2); + declare.in(src, WARMUP_RNG).out(dst1, dst2) + .time(srcSize == OCL_SIZE_4000 ? + 56 : srcSize == OCL_SIZE_2000 ? 15 : 3.8);; - d_src.upload(src); + if (impl == "plain") + { + TEST_CYCLE() meanShiftProc_(src, dst1, dst2, 5, 6, crit); - WARMUP_ON; - ocl::meanShiftProc(d_src, d_dst, d_dstCoor, 5, 6, crit); - WARMUP_OFF; + SANITY_CHECK(dst1); + SANITY_CHECK(dst2); + } + else if (impl == "ocl") + { + ocl::oclMat oclSrc(src), oclDst1(srcSize, CV_8UC4), + oclDst2(srcSize, CV_16SC2); - GPU_ON; - ocl::meanShiftProc(d_src, d_dst, d_dstCoor, 5, 6, crit); - GPU_OFF; + TEST_CYCLE() ocl::meanShiftProc(oclSrc, oclDst1, oclDst2, 5, 6, crit); - GPU_FULL_ON; - d_src.upload(src); - ocl::meanShiftProc(d_src, d_dst, d_dstCoor, 5, 6, crit); - d_dst.download(ocl_dst[0]); - d_dstCoor.download(ocl_dst[1]); - GPU_FULL_OFF; + oclDst1.download(dst1); + oclDst2.download(dst2); - vector eps(2, 0.); - TestSystem::instance().ExpectMatsNear(dst, ocl_dst, eps); + SANITY_CHECK(dst1); + SANITY_CHECK(dst2); } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); } ///////////// remap//////////////////////// -PERFTEST(remap) -{ - Mat src, dst, xmap, ymap, ocl_dst; - ocl::oclMat d_src, d_dst, d_xmap, d_ymap; - int all_type[] = {CV_8UC1, CV_8UC4}; - std::string type_name[] = {"CV_8UC1", "CV_8UC4"}; +CV_ENUM(RemapInterType, INTER_NEAREST, INTER_LINEAR) - int interpolation = INTER_LINEAR; - int borderMode = BORDER_CONSTANT; +typedef CopyMakeBorderMatType remapMatType; +typedef tuple remapParams; +typedef TestBaseWithParam remapFixture; - for (int size = Min_Size; size <= Max_Size; size *= Multiple) - { - for (size_t t = 0; t < sizeof(all_type) / sizeof(int); t++) - { - SUBTEST << size << 'x' << size << "; src " << type_name[t] << "; map CV_32FC1"; - - gen(src, size, size, all_type[t], 0, 256); +PERF_TEST_P(remapFixture, remap, + ::testing::Combine(OCL_TYPICAL_MAT_SIZES, + remapMatType::all(), + RemapInterType::all())) +{ + // getting params + remapParams params = GetParam(); + const Size srcSize = get<0>(params); + const int type = get<1>(params), interpolation = get<2>(params); + const string impl = getSelectedImpl(); - xmap.create(size, size, CV_32FC1); - dst.create(size, size, CV_32FC1); - ymap.create(size, size, CV_32FC1); + // creating src data + Mat src(srcSize, type), dst(srcSize, type); + declare.in(src, WARMUP_RNG).out(dst); - for (int i = 0; i < size; ++i) - { - float *xmap_row = xmap.ptr(i); - float *ymap_row = ymap.ptr(i); + if (srcSize == OCL_SIZE_4000 && interpolation == INTER_LINEAR) + declare.time(9); - for (int j = 0; j < size; ++j) - { - xmap_row[j] = (j - size * 0.5f) * 0.75f + size * 0.5f; - ymap_row[j] = (i - size * 0.5f) * 0.75f + size * 0.5f; - } - } + Mat xmap, ymap; + xmap.create(srcSize, CV_32FC1); + ymap.create(srcSize, CV_32FC1); - remap(src, dst, xmap, ymap, interpolation, borderMode); + for (int i = 0; i < srcSize.height; ++i) + { + float * const xmap_row = xmap.ptr(i); + float * const ymap_row = ymap.ptr(i); - CPU_ON; - remap(src, dst, xmap, ymap, interpolation, borderMode); - CPU_OFF; + for (int j = 0; j < srcSize.width; ++j) + { + xmap_row[j] = (j - srcSize.width * 0.5f) * 0.75f + srcSize.width * 0.5f; + ymap_row[j] = (i - srcSize.height * 0.5f) * 0.75f + srcSize.height * 0.5f; + } + } - d_src.upload(src); - d_dst.upload(dst); - d_xmap.upload(xmap); - d_ymap.upload(ymap); + const int borderMode = BORDER_CONSTANT; - WARMUP_ON; - ocl::remap(d_src, d_dst, d_xmap, d_ymap, interpolation, borderMode); - WARMUP_OFF; + // select implementation + if (impl == "ocl") + { + ocl::oclMat oclSrc(src), oclDst(srcSize, type); + ocl::oclMat oclXMap(xmap), oclYMap(ymap); - GPU_ON; - ocl::remap(d_src, d_dst, d_xmap, d_ymap, interpolation, borderMode); - GPU_OFF; + TEST_CYCLE() cv::ocl::remap(oclSrc, oclDst, oclXMap, oclYMap, interpolation, borderMode); - GPU_FULL_ON; - d_src.upload(src); - ocl::remap(d_src, d_dst, d_xmap, d_ymap, interpolation, borderMode); - d_dst.download(ocl_dst); - GPU_FULL_OFF; + oclDst.download(dst); - TestSystem::instance().ExpectedMatNear(dst, ocl_dst, 2.0); - } + SANITY_CHECK(dst, 1 + DBL_EPSILON); + } + else if (impl == "plain") + { + TEST_CYCLE() cv::remap(src, dst, xmap, ymap, interpolation, borderMode); + SANITY_CHECK(dst, 1 + DBL_EPSILON); } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); } -///////////// CLAHE //////////////////////// -PERFTEST(CLAHE) -{ - Mat src, dst, ocl_dst; - cv::ocl::oclMat d_src, d_dst; - int all_type[] = {CV_8UC1}; - std::string type_name[] = {"CV_8UC1"}; - - double clipLimit = 40.0; - cv::Ptr clahe = cv::createCLAHE(clipLimit); - cv::Ptr d_clahe = cv::ocl::createCLAHE(clipLimit); +///////////// CLAHE //////////////////////// - for (int size = Min_Size; size <= Max_Size; size *= Multiple) - { - for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) - { - SUBTEST << size << 'x' << size << "; " << type_name[j] ; +typedef TestBaseWithParam CLAHEFixture; - gen(src, size, size, all_type[j], 0, 256); +PERF_TEST_P(CLAHEFixture, CLAHE, OCL_TYPICAL_MAT_SIZES) +{ + // getting params + const Size srcSize = GetParam(); + const string impl = getSelectedImpl(); - CPU_ON; - clahe->apply(src, dst); - CPU_OFF; + // creating src data + Mat src(srcSize, CV_8UC1), dst; + const double clipLimit = 40.0; + declare.in(src, WARMUP_RNG); - d_src.upload(src); + if (srcSize == OCL_SIZE_4000) + declare.time(11); - WARMUP_ON; - d_clahe->apply(d_src, d_dst); - WARMUP_OFF; + // select implementation + if (impl == "ocl") + { + ocl::oclMat oclSrc(src), oclDst; + cv::Ptr oclClahe = cv::ocl::createCLAHE(clipLimit); - ocl_dst = d_dst; + TEST_CYCLE() oclClahe->apply(oclSrc, oclDst); - TestSystem::instance().ExpectedMatNear(dst, ocl_dst, 1.0); + oclDst.download(dst); - GPU_ON; - d_clahe->apply(d_src, d_dst); - GPU_OFF; + SANITY_CHECK(dst); + } + else if (impl == "plain") + { + cv::Ptr clahe = cv::createCLAHE(clipLimit); + TEST_CYCLE() clahe->apply(src, dst); - GPU_FULL_ON; - d_src.upload(src); - d_clahe->apply(d_src, d_dst); - d_dst.download(dst); - GPU_FULL_OFF; - } + SANITY_CHECK(dst); } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); } ///////////// columnSum//////////////////////// -PERFTEST(columnSum) + +typedef TestBaseWithParam columnSumFixture; + +static void columnSumPerfTest(const Mat & src, Mat & dst) { - Mat src, dst, ocl_dst; - ocl::oclMat d_src, d_dst; + for (int j = 0; j < src.cols; j++) + dst.at(0, j) = src.at(0, j); - for (int size = Min_Size; size <= Max_Size; size *= Multiple) - { - SUBTEST << size << 'x' << size << "; CV_32FC1"; + for (int i = 1; i < src.rows; ++i) + for (int j = 0; j < src.cols; ++j) + dst.at(i, j) = dst.at(i - 1 , j) + src.at(i , j); +} - gen(src, size, size, CV_32FC1, 0, 256); +PERF_TEST_P(columnSumFixture, columnSum, OCL_TYPICAL_MAT_SIZES) +{ + // getting params + const Size srcSize = GetParam(); + const string impl = getSelectedImpl(); - CPU_ON; - dst.create(src.size(), src.type()); - for (int j = 0; j < src.cols; j++) - dst.at(0, j) = src.at(0, j); + // creating src data + Mat src(srcSize, CV_32FC1), dst(srcSize, CV_32FC1); + declare.in(src, WARMUP_RNG).out(dst); - for (int i = 1; i < src.rows; ++i) - for (int j = 0; j < src.cols; ++j) - dst.at(i, j) = dst.at(i - 1 , j) + src.at(i , j); - CPU_OFF; + if (srcSize == OCL_SIZE_4000) + declare.time(5); - d_src.upload(src); + // select implementation + if (impl == "ocl") + { + ocl::oclMat oclSrc(src), oclDst(srcSize, CV_32FC1); - WARMUP_ON; - ocl::columnSum(d_src, d_dst); - WARMUP_OFF; + TEST_CYCLE() cv::ocl::columnSum(oclSrc, oclDst); - GPU_ON; - ocl::columnSum(d_src, d_dst); - GPU_OFF; + oclDst.download(dst); - GPU_FULL_ON; - d_src.upload(src); - ocl::columnSum(d_src, d_dst); - d_dst.download(ocl_dst); - GPU_FULL_OFF; + SANITY_CHECK(dst); + } + else if (impl == "plain") + { + TEST_CYCLE() columnSumPerfTest(src, dst); - TestSystem::instance().ExpectedMatNear(dst, ocl_dst, 5e-1); + SANITY_CHECK(dst); } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); } diff --git a/modules/ocl/perf/perf_match_template.cpp b/modules/ocl/perf/perf_match_template.cpp index 8caf4b4f55..a1c7caf738 100644 --- a/modules/ocl/perf/perf_match_template.cpp +++ b/modules/ocl/perf/perf_match_template.cpp @@ -45,101 +45,97 @@ //M*/ #include "perf_precomp.hpp" -/////////// matchTemplate //////////////////////// -//void InitMatchTemplate() -//{ -// Mat src; gen(src, 500, 500, CV_32F, 0, 1); -// Mat templ; gen(templ, 500, 500, CV_32F, 0, 1); -// ocl::oclMat d_src(src), d_templ(templ), d_dst; -// ocl::matchTemplate(d_src, d_templ, d_dst, CV_TM_CCORR); -//} -PERFTEST(matchTemplate) -{ - //InitMatchTemplate(); - Mat src, templ, dst, ocl_dst; - int templ_size = 5; - - for (int size = Min_Size; size <= Max_Size; size *= Multiple) - { - int all_type[] = {CV_32FC1, CV_32FC4}; - std::string type_name[] = {"CV_32FC1", "CV_32FC4"}; - - for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) - { - for(templ_size = 5; templ_size <= 5; templ_size *= 5) - { - gen(src, size, size, all_type[j], 0, 1); - - SUBTEST << src.cols << 'x' << src.rows << "; " << type_name[j] << "; templ " << templ_size << 'x' << templ_size << "; CCORR"; - - gen(templ, templ_size, templ_size, all_type[j], 0, 1); - - matchTemplate(src, templ, dst, CV_TM_CCORR); - - CPU_ON; - matchTemplate(src, templ, dst, CV_TM_CCORR); - CPU_OFF; - - ocl::oclMat d_src(src), d_templ(templ), d_dst; - - WARMUP_ON; - ocl::matchTemplate(d_src, d_templ, d_dst, CV_TM_CCORR); - WARMUP_OFF; +using namespace perf; +using std::tr1::tuple; +using std::tr1::get; - GPU_ON; - ocl::matchTemplate(d_src, d_templ, d_dst, CV_TM_CCORR); - GPU_OFF; +/////////// matchTemplate //////////////////////// - GPU_FULL_ON; - d_src.upload(src); - d_templ.upload(templ); - ocl::matchTemplate(d_src, d_templ, d_dst, CV_TM_CCORR); - d_dst.download(ocl_dst); - GPU_FULL_OFF; +CV_ENUM(CV_TM_CCORRMatType, CV_32FC1, CV_32FC4) - TestSystem::instance().ExpectedMatNear(dst, ocl_dst, templ.rows * templ.cols * 1e-1); - } - } +typedef tuple CV_TM_CCORRParams; +typedef TestBaseWithParam CV_TM_CCORRFixture; - int all_type_8U[] = {CV_8UC1}; - std::string type_name_8U[] = {"CV_8UC1"}; +PERF_TEST_P(CV_TM_CCORRFixture, matchTemplate, + ::testing::Combine(::testing::Values(OCL_SIZE_1000, OCL_SIZE_2000), + CV_TM_CCORRMatType::all())) +{ + // getting params + CV_TM_CCORRParams params = GetParam(); + const Size srcSize = get<0>(params), templSize(5, 5); + const int type = get<1>(params); + + std::string impl = getSelectedImpl(); + + // creating src data + Mat src(srcSize, type), templ(templSize, type); + const Size dstSize(src.cols - templ.cols + 1, src.rows - templ.rows + 1); + Mat dst(dstSize, CV_32F); + randu(src, 0.0f, 1.0f); + randu(templ, 0.0f, 1.0f); + declare.time(srcSize == OCL_SIZE_2000 ? 20 : 6).in(src, templ).out(dst); + + // select implementation + if (impl == "ocl") + { + ocl::oclMat oclSrc(src), oclTempl(templ), oclDst(dstSize, CV_32F); - for (size_t j = 0; j < sizeof(all_type_8U) / sizeof(int); j++) - { - for(templ_size = 5; templ_size <= 5; templ_size *= 5) - { - SUBTEST << src.cols << 'x' << src.rows << "; " << type_name_8U[j] << "; templ " << templ_size << 'x' << templ_size << "; CCORR_NORMED"; + TEST_CYCLE() cv::ocl::matchTemplate(oclSrc, oclTempl, oclDst, CV_TM_CCORR); - gen(src, size, size, all_type_8U[j], 0, 255); + oclDst.download(dst); - gen(templ, templ_size, templ_size, all_type_8U[j], 0, 255); + SANITY_CHECK(dst, 1e-4); + } + else if (impl == "plain") + { + TEST_CYCLE() cv::matchTemplate(src, templ, dst, CV_TM_CCORR); - matchTemplate(src, templ, dst, CV_TM_CCORR_NORMED); + SANITY_CHECK(dst, 1e-4); + } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); +} - CPU_ON; - matchTemplate(src, templ, dst, CV_TM_CCORR_NORMED); - CPU_OFF; +typedef TestBaseWithParam CV_TM_CCORR_NORMEDFixture; - ocl::oclMat d_src(src); - ocl::oclMat d_templ(templ), d_dst; +PERF_TEST_P(CV_TM_CCORR_NORMEDFixture, matchTemplate, OCL_TYPICAL_MAT_SIZES) +{ + // getting params + const Size srcSize = GetParam(), templSize(5, 5); + const std::string impl = getSelectedImpl(); + + // creating src data + Mat src(srcSize, CV_8UC1), templ(templSize, CV_8UC1), dst; + const Size dstSize(src.cols - templ.cols + 1, src.rows - templ.rows + 1); + dst.create(dstSize, CV_8UC1); + declare.in(src, templ, WARMUP_RNG).out(dst) + .time(srcSize == OCL_SIZE_2000 ? 10 : srcSize == OCL_SIZE_4000 ? 23 : 2); + + // select implementation + if (impl == "ocl") + { + ocl::oclMat oclSrc(src), oclTempl(templ), oclDst(dstSize, CV_8UC1); - WARMUP_ON; - ocl::matchTemplate(d_src, d_templ, d_dst, CV_TM_CCORR_NORMED); - WARMUP_OFF; + TEST_CYCLE() cv::ocl::matchTemplate(oclSrc, oclTempl, oclDst, CV_TM_CCORR_NORMED); - GPU_ON; - ocl::matchTemplate(d_src, d_templ, d_dst, CV_TM_CCORR_NORMED); - GPU_OFF; + oclDst.download(dst); - GPU_FULL_ON; - d_src.upload(src); - d_templ.upload(templ); - ocl::matchTemplate(d_src, d_templ, d_dst, CV_TM_CCORR_NORMED); - d_dst.download(ocl_dst); - GPU_FULL_OFF; + SANITY_CHECK(dst, 2e-2); + } + else if (impl == "plain") + { + TEST_CYCLE() cv::matchTemplate(src, templ, dst, CV_TM_CCORR_NORMED); - TestSystem::instance().ExpectedMatNear(dst, ocl_dst, templ.rows * templ.cols * 1e-1); - } - } + SANITY_CHECK(dst, 2e-2); } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); } diff --git a/modules/ocl/perf/perf_matrix_operation.cpp b/modules/ocl/perf/perf_matrix_operation.cpp index 092e548940..dc3e15495a 100644 --- a/modules/ocl/perf/perf_matrix_operation.cpp +++ b/modules/ocl/perf/perf_matrix_operation.cpp @@ -45,142 +45,147 @@ //M*/ #include "perf_precomp.hpp" -///////////// ConvertTo//////////////////////// -PERFTEST(ConvertTo) -{ - Mat src, dst, ocl_dst; - ocl::oclMat d_src, d_dst; +using namespace perf; +using std::tr1::tuple; +using std::tr1::get; - int all_type[] = {CV_8UC1, CV_8UC4}; - std::string type_name[] = {"CV_8UC1", "CV_8UC4"}; - - for (int size = Min_Size; size <= Max_Size; size *= Multiple) - { - for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) - { - SUBTEST << size << 'x' << size << "; " << type_name[j] << " to 32FC1"; +///////////// ConvertTo//////////////////////// - gen(src, size, size, all_type[j], 0, 256); - //gen(dst, size, size, all_type[j], 0, 256); +CV_ENUM(ConvertToMatType, CV_8UC1, CV_8UC4) - //d_dst.upload(dst); +typedef tuple ConvertToParams; +typedef TestBaseWithParam ConvertToFixture; - src.convertTo(dst, CV_32FC1); +PERF_TEST_P(ConvertToFixture, ConvertTo, + ::testing::Combine(OCL_TYPICAL_MAT_SIZES, + ConvertToMatType::all())) +{ + // getting params + ConvertToParams params = GetParam(); + const Size srcSize = get<0>(params); + const int type = get<1>(params); - CPU_ON; - src.convertTo(dst, CV_32FC1); - CPU_OFF; + std::string impl = getSelectedImpl(); - d_src.upload(src); + // creating src data + Mat src(srcSize, type), dst; + const int dstType = CV_MAKE_TYPE(CV_32F, src.channels()); + dst.create(srcSize, dstType); + declare.in(src, WARMUP_RNG).out(dst); - WARMUP_ON; - d_src.convertTo(d_dst, CV_32FC1); - WARMUP_OFF; + // select implementation + if (impl == "ocl") + { + ocl::oclMat oclSrc(src), oclDst(srcSize, dstType); - GPU_ON; - d_src.convertTo(d_dst, CV_32FC1); - GPU_OFF; + TEST_CYCLE() oclSrc.convertTo(oclDst, dstType); - GPU_FULL_ON; - d_src.upload(src); - d_src.convertTo(d_dst, CV_32FC1); - d_dst.download(ocl_dst); - GPU_FULL_OFF; + oclDst.download(dst); - TestSystem::instance().ExpectedMatNear(dst, ocl_dst, 0.0); - } + SANITY_CHECK(dst); + } + else if (impl == "plain") + { + TEST_CYCLE() src.convertTo(dst, dstType); + SANITY_CHECK(dst); } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); } -///////////// copyTo//////////////////////// -PERFTEST(copyTo) -{ - Mat src, dst, ocl_dst; - ocl::oclMat d_src, d_dst; - - int all_type[] = {CV_8UC1, CV_8UC4}; - std::string type_name[] = {"CV_8UC1", "CV_8UC4"}; - for (int size = Min_Size; size <= Max_Size; size *= Multiple) - { - for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) - { - SUBTEST << size << 'x' << size << "; " << type_name[j] ; - - gen(src, size, size, all_type[j], 0, 256); - //gen(dst, size, size, all_type[j], 0, 256); +///////////// copyTo//////////////////////// - //d_dst.upload(dst); +typedef ConvertToMatType copyToMatType; +typedef tuple copyToParams; +typedef TestBaseWithParam copyToFixture; - src.copyTo(dst); +PERF_TEST_P(copyToFixture, copyTo, + ::testing::Combine(OCL_TYPICAL_MAT_SIZES, + copyToMatType::all())) +{ + // getting params + copyToParams params = GetParam(); + const Size srcSize = get<0>(params); + const int type = get<1>(params); - CPU_ON; - src.copyTo(dst); - CPU_OFF; + std::string impl = getSelectedImpl(); - d_src.upload(src); + // creating src data + Mat src(srcSize, type), dst(srcSize, type); + declare.in(src, WARMUP_RNG).out(dst); - WARMUP_ON; - d_src.copyTo(d_dst); - WARMUP_OFF; + // select implementation + if (impl == "ocl") + { + ocl::oclMat oclSrc(src), oclDst(srcSize, type); - GPU_ON; - d_src.copyTo(d_dst); - GPU_OFF; + TEST_CYCLE() oclSrc.copyTo(oclDst); - GPU_FULL_ON; - d_src.upload(src); - d_src.copyTo(d_dst); - d_dst.download(ocl_dst); - GPU_FULL_OFF; + oclDst.download(dst); - TestSystem::instance().ExpectedMatNear(dst, ocl_dst, 0.0); - } + SANITY_CHECK(dst); + } + else if (impl == "plain") + { + TEST_CYCLE() src.copyTo(dst); + SANITY_CHECK(dst); } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); } -///////////// setTo//////////////////////// -PERFTEST(setTo) -{ - Mat src, ocl_src; - Scalar val(1, 2, 3, 4); - ocl::oclMat d_src; - - int all_type[] = {CV_8UC1, CV_8UC4}; - std::string type_name[] = {"CV_8UC1", "CV_8UC4"}; - for (int size = Min_Size; size <= Max_Size; size *= Multiple) - { - for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) - { - SUBTEST << size << 'x' << size << "; " << type_name[j] ; - - gen(src, size, size, all_type[j], 0, 256); +///////////// setTo//////////////////////// - src.setTo(val); +typedef ConvertToMatType setToMatType; +typedef tuple setToParams; +typedef TestBaseWithParam setToFixture; - CPU_ON; - src.setTo(val); - CPU_OFF; +PERF_TEST_P(setToFixture, setTo, + ::testing::Combine(OCL_TYPICAL_MAT_SIZES, + setToMatType::all())) +{ + // getting params + setToParams params = GetParam(); + const Size srcSize = get<0>(params); + const int type = get<1>(params); + const Scalar val(1, 2, 3, 4); - d_src.upload(src); + std::string impl = getSelectedImpl(); - WARMUP_ON; - d_src.setTo(val); - WARMUP_OFF; + // creating src data + Mat src(srcSize, type); + declare.in(src); - d_src.download(ocl_src); - TestSystem::instance().ExpectedMatNear(src, ocl_src, 1.0); + // select implementation + if (impl == "ocl") + { + ocl::oclMat oclSrc(srcSize, type); - GPU_ON;; - d_src.setTo(val); - GPU_OFF; + TEST_CYCLE() oclSrc.setTo(val); + oclSrc.download(src); - GPU_FULL_ON; - d_src.upload(src); - d_src.setTo(val); - GPU_FULL_OFF; - } + SANITY_CHECK(src); + } + else if (impl == "plain") + { + TEST_CYCLE() src.setTo(val); + SANITY_CHECK(src); } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); } diff --git a/modules/ocl/perf/perf_moments.cpp b/modules/ocl/perf/perf_moments.cpp index a1515b879b..59452d4fb0 100644 --- a/modules/ocl/perf/perf_moments.cpp +++ b/modules/ocl/perf/perf_moments.cpp @@ -43,50 +43,59 @@ // the use of this software, even if advised of the possibility of such damage. // //M*/ + #include "perf_precomp.hpp" -///////////// Moments //////////////////////// -PERFTEST(Moments) -{ - Mat src; - bool binaryImage = 0; - int all_type[] = {CV_8UC1, CV_16SC1, CV_32FC1, CV_64FC1}; - std::string type_name[] = {"CV_8UC1", "CV_16SC1", "CV_32FC1", "CV_64FC1"}; +using namespace perf; +using std::tr1::tuple; +using std::tr1::get; - for (int size = Min_Size; size <= Max_Size; size *= Multiple) - { - for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) - { - SUBTEST << size << 'x' << size << "; " << type_name[j]; +///////////// Moments //////////////////////// - gen(src, size, size, all_type[j], 0, 256); +CV_ENUM(MomentsMatType, CV_8UC1, CV_16SC1, CV_32FC1, CV_64FC1) - cv::Moments CvMom = moments(src, binaryImage); +typedef tuple MomentsParams; +typedef TestBaseWithParam MomentsFixture; - CPU_ON; - moments(src, binaryImage); - CPU_OFF; +PERF_TEST_P(MomentsFixture, DISABLED_Moments, + ::testing::Combine(OCL_TYPICAL_MAT_SIZES, + MomentsMatType::all())) +{ + // getting params + MomentsParams params = GetParam(); + const Size srcSize = get<0>(params); + const int type = get<1>(params); - cv::Moments oclMom; - WARMUP_ON; - oclMom = ocl::ocl_moments(src, binaryImage); - WARMUP_OFF; + std::string impl = getSelectedImpl(); - Mat gpu_dst, cpu_dst; - HuMoments(CvMom, cpu_dst); - HuMoments(oclMom, gpu_dst); + // creating src data + Mat src(srcSize, type), dst(7, 1, CV_64F); + const bool binaryImage = false; + cv::Moments mom; - GPU_ON; - ocl::ocl_moments(src, binaryImage); - GPU_OFF; + declare.in(src, WARMUP_RNG).out(dst); - GPU_FULL_ON; - ocl::ocl_moments(src, binaryImage); - GPU_FULL_OFF; + // select implementation + if (impl == "ocl") + { + ocl::oclMat oclSrc(src); - TestSystem::instance().ExpectedMatNear(gpu_dst, cpu_dst, .5); + TEST_CYCLE() mom = cv::ocl::ocl_moments(oclSrc, binaryImage); + cv::HuMoments(mom, dst); - } + SANITY_CHECK(dst); + } + else if (impl == "plain") + { + TEST_CYCLE() mom = cv::moments(src, binaryImage); + cv::HuMoments(mom, dst); + SANITY_CHECK(dst); } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); } diff --git a/modules/ocl/perf/perf_norm.cpp b/modules/ocl/perf/perf_norm.cpp index a80ab13547..b0e18facdf 100644 --- a/modules/ocl/perf/perf_norm.cpp +++ b/modules/ocl/perf/perf_norm.cpp @@ -45,43 +45,46 @@ //M*/ #include "perf_precomp.hpp" -///////////// norm//////////////////////// -PERFTEST(norm) -{ - Mat src1, src2, ocl_src1; - ocl::oclMat d_src1, d_src2; +using namespace perf; +using std::tr1::tuple; +using std::tr1::get; - for (int size = Min_Size; size <= Max_Size; size *= Multiple) - { - SUBTEST << size << 'x' << size << "; CV_8UC1; NORM_INF"; - - gen(src1, size, size, CV_8UC1, Scalar::all(0), Scalar::all(1)); - gen(src2, size, size, CV_8UC1, Scalar::all(0), Scalar::all(1)); +///////////// norm//////////////////////// - norm(src1, src2, NORM_INF); +typedef TestBaseWithParam normFixture; - CPU_ON; - norm(src1, src2, NORM_INF); - CPU_OFF; +PERF_TEST_P(normFixture, DISABLED_norm, OCL_TYPICAL_MAT_SIZES) +{ + // getting params + const Size srcSize = GetParam(); + const std::string impl = getSelectedImpl(); + double value = 0.0; - d_src1.upload(src1); - d_src2.upload(src2); + // creating src data + Mat src1(srcSize, CV_8UC1), src2(srcSize, CV_8UC1); + declare.in(src1, src2); + randu(src1, 0, 1); + randu(src2, 0, 1); - WARMUP_ON; - ocl::norm(d_src1, d_src2, NORM_INF); - WARMUP_OFF; + // select implementation + if (impl == "ocl") + { + ocl::oclMat oclSrc1(src1), oclSrc2(src2); - d_src1.download(ocl_src1); - TestSystem::instance().ExpectedMatNear(src1, ocl_src1, .5); + TEST_CYCLE() value = cv::ocl::norm(oclSrc1, oclSrc2, NORM_INF); - GPU_ON; - ocl::norm(d_src1, d_src2, NORM_INF); - GPU_OFF; + SANITY_CHECK(value); + } + else if (impl == "plain") + { + TEST_CYCLE() value = cv::norm(src1, src2, NORM_INF); - GPU_FULL_ON; - d_src1.upload(src1); - d_src2.upload(src2); - ocl::norm(d_src1, d_src2, NORM_INF); - GPU_FULL_OFF; + SANITY_CHECK(value); } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); } diff --git a/modules/ocl/perf/perf_opticalflow.cpp b/modules/ocl/perf/perf_opticalflow.cpp index a6724c8123..2f0626750c 100644 --- a/modules/ocl/perf/perf_opticalflow.cpp +++ b/modules/ocl/perf/perf_opticalflow.cpp @@ -46,117 +46,130 @@ #include "perf_precomp.hpp" ///////////// PyrLKOpticalFlow //////////////////////// -PERFTEST(PyrLKOpticalFlow) -{ - std::string images1[] = {"rubberwhale1.png", "aloeL.jpg"}; - std::string images2[] = {"rubberwhale2.png", "aloeR.jpg"}; - - for (size_t i = 0; i < sizeof(images1) / sizeof(std::string); i++) - { - Mat frame0 = imread(abspath(images1[i]), i == 0 ? IMREAD_COLOR : IMREAD_GRAYSCALE); - - if (frame0.empty()) - { - std::string errstr = "can't open " + images1[i]; - throw runtime_error(errstr); - } - - Mat frame1 = imread(abspath(images2[i]), i == 0 ? IMREAD_COLOR : IMREAD_GRAYSCALE); - - if (frame1.empty()) - { - std::string errstr = "can't open " + images2[i]; - throw runtime_error(errstr); - } - - Mat gray_frame; - - if (i == 0) - { - cvtColor(frame0, gray_frame, COLOR_BGR2GRAY); - } - - for (int points = Min_Size; points <= Max_Size; points *= Multiple) - { - if (i == 0) - SUBTEST << frame0.cols << "x" << frame0.rows << "; color; " << points << " points"; - else - SUBTEST << frame0.cols << "x" << frame0.rows << "; gray; " << points << " points"; - Mat ocl_nextPts; - Mat ocl_status; - - vector pts; - goodFeaturesToTrack(i == 0 ? gray_frame : frame0, pts, points, 0.01, 0.0); - - vector nextPts; - vector status; - vector err; +using namespace perf; +using std::tr1::get; +using std::tr1::tuple; +using std::tr1::make_tuple; - calcOpticalFlowPyrLK(frame0, frame1, pts, nextPts, status, err); - - CPU_ON; - calcOpticalFlowPyrLK(frame0, frame1, pts, nextPts, status, err); - CPU_OFF; - - ocl::PyrLKOpticalFlow d_pyrLK; - - ocl::oclMat d_frame0(frame0); - ocl::oclMat d_frame1(frame1); - - ocl::oclMat d_pts; - Mat pts_mat(1, (int)pts.size(), CV_32FC2, (void *)&pts[0]); - d_pts.upload(pts_mat); - - ocl::oclMat d_nextPts; - ocl::oclMat d_status; - ocl::oclMat d_err; +template +static vector & MatToVector(const ocl::oclMat & oclSrc, vector & instance) +{ + Mat src; + oclSrc.download(src); - WARMUP_ON; - d_pyrLK.sparse(d_frame0, d_frame1, d_pts, d_nextPts, d_status, &d_err); - WARMUP_OFF; + for (int i = 0; i < src.cols; ++i) + instance.push_back(src.at(0, i)); - GPU_ON; - d_pyrLK.sparse(d_frame0, d_frame1, d_pts, d_nextPts, d_status, &d_err); - GPU_OFF; + return instance; +} - GPU_FULL_ON; - d_frame0.upload(frame0); - d_frame1.upload(frame1); - d_pts.upload(pts_mat); - d_pyrLK.sparse(d_frame0, d_frame1, d_pts, d_nextPts, d_status, &d_err); +CV_ENUM(LoadMode, IMREAD_GRAYSCALE, IMREAD_COLOR) + +typedef tuple > PyrLKOpticalFlowParamType; +typedef TestBaseWithParam PyrLKOpticalFlowFixture; + +PERF_TEST_P(PyrLKOpticalFlowFixture, + PyrLKOpticalFlow, + ::testing::Combine( + ::testing::Values(1000, 2000, 4000), + ::testing::Values( + make_tuple + ( + string("gpu/opticalflow/rubberwhale1.png"), + string("gpu/opticalflow/rubberwhale1.png"), + LoadMode(IMREAD_COLOR) + ) +// , make_tuple +// ( +// string("gpu/stereobm/aloe-L.png"), +// string("gpu/stereobm/aloe-R.png"), +// LoadMode(IMREAD_GRAYSCALE) +// ) + ) + ) + ) +{ + PyrLKOpticalFlowParamType params = GetParam(); + tuple fileParam = get<1>(params); + const int pointsCount = get<0>(params); + const int openMode = static_cast(get<2>(fileParam)); + const string fileName0 = get<0>(fileParam), fileName1 = get<1>(fileParam); + Mat frame0 = imread(getDataPath(fileName0), openMode); + Mat frame1 = imread(getDataPath(fileName1), openMode); + const string impl = getSelectedImpl(); + + ASSERT_FALSE(frame0.empty()) << "can't load " << fileName0; + ASSERT_FALSE(frame1.empty()) << "can't load " << fileName1; + + Mat grayFrame; + if (openMode == IMREAD_COLOR) + cvtColor(frame0, grayFrame, COLOR_BGR2GRAY); + else + grayFrame = frame0; + + // initialization + vector pts, nextPts; + vector status; + vector err; + goodFeaturesToTrack(grayFrame, pts, pointsCount, 0.01, 0.0); + + // selecting implementation + if (impl == "plain") + { + TEST_CYCLE() + cv::calcOpticalFlowPyrLK(frame0, frame1, pts, nextPts, status, err); - if (!d_nextPts.empty()) - d_nextPts.download(ocl_nextPts); + SANITY_CHECK(nextPts); + SANITY_CHECK(status); + SANITY_CHECK(err); + } + else if (impl == "ocl") + { + ocl::PyrLKOpticalFlow oclPyrLK; + ocl::oclMat oclFrame0(frame0), oclFrame1(frame1); + ocl::oclMat oclPts(1, static_cast(pts.size()), CV_32FC2, (void *)&pts[0]); + ocl::oclMat oclNextPts, oclStatus, oclErr; - if (!d_status.empty()) - d_status.download(ocl_status); - GPU_FULL_OFF; + TEST_CYCLE() + oclPyrLK.sparse(oclFrame0, oclFrame1, oclPts, oclNextPts, oclStatus, &oclErr); - size_t mismatch = 0; - for (int i = 0; i < (int)nextPts.size(); ++i) - { - if(status[i] != ocl_status.at(0, i)) - { - mismatch++; - continue; - } - if(status[i]) - { - Point2f gpu_rst = ocl_nextPts.at(0, i); - Point2f cpu_rst = nextPts[i]; - if(fabs(gpu_rst.x - cpu_rst.x) >= 1. || fabs(gpu_rst.y - cpu_rst.y) >= 1.) - mismatch++; - } - } - double ratio = (double)mismatch / (double)nextPts.size(); - if(ratio < .02) - TestSystem::instance().setAccurate(1, ratio); - else - TestSystem::instance().setAccurate(0, ratio); - } + MatToVector(oclNextPts, nextPts); + MatToVector(oclStatus, status); + MatToVector(oclErr, err); + SANITY_CHECK(nextPts); + SANITY_CHECK(status); + SANITY_CHECK(err); } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); + +// size_t mismatch = 0; +// for (int i = 0; i < (int)nextPts.size(); ++i) +// { +// if(status[i] != ocl_status.at(0, i)) +// { +// mismatch++; +// continue; +// } +// if(status[i]) +// { +// Point2f gpu_rst = ocl_nextPts.at(0, i); +// Point2f cpu_rst = nextPts[i]; +// if(fabs(gpu_rst.x - cpu_rst.x) >= 1. || fabs(gpu_rst.y - cpu_rst.y) >= 1.) +// mismatch++; +// } +// } +// double ratio = (double)mismatch / (double)nextPts.size(); +// if(ratio < .02) +// TestSystem::instance().setAccurate(1, ratio); +// else +// TestSystem::instance().setAccurate(0, ratio); } diff --git a/modules/ocl/perf/perf_precomp.hpp b/modules/ocl/perf/perf_precomp.hpp index 216ebe5c5d..8c13b9e73e 100644 --- a/modules/ocl/perf/perf_precomp.hpp +++ b/modules/ocl/perf/perf_precomp.hpp @@ -40,6 +40,15 @@ // //M*/ +#ifdef __GNUC__ +# pragma GCC diagnostic ignored "-Wmissing-declarations" +# pragma GCC diagnostic ignored "-Wunused-function" +# if defined __clang__ || defined __APPLE__ +# pragma GCC diagnostic ignored "-Wmissing-prototypes" +# pragma GCC diagnostic ignored "-Wextra" +# endif +#endif + #ifndef __OPENCV_PERF_PRECOMP_HPP__ #define __OPENCV_PERF_PRECOMP_HPP__ @@ -50,6 +59,7 @@ #include #include #include + #include "opencv2/core/core.hpp" #include "opencv2/imgproc/imgproc.hpp" #include "opencv2/highgui/highgui.hpp" @@ -59,9 +69,12 @@ #include "opencv2/features2d/features2d.hpp" #include "opencv2/ocl/ocl.hpp" #include "opencv2/ts/ts.hpp" -#include "opencv2/ts/ts_perf.hpp" -#include "opencv2/ts/ts_gtest.h" +#define OCL_SIZE_1000 cv::Size(1000, 1000) +#define OCL_SIZE_2000 cv::Size(2000, 2000) +#define OCL_SIZE_4000 cv::Size(4000, 4000) + +#define OCL_TYPICAL_MAT_SIZES ::testing::Values(OCL_SIZE_1000, OCL_SIZE_2000, OCL_SIZE_4000) #define Min_Size 1000 #define Max_Size 4000 @@ -76,15 +89,15 @@ void gen(Mat &mat, int rows, int cols, int type, int low, int high, int n); string abspath(const string &relpath); int CV_CDECL cvErrorCallback(int, const char *, const char *, const char *, int, void *); -typedef struct -{ - short x; - short y; -} COOR; -COOR do_meanShift(int x0, int y0, uchar *sptr, uchar *dptr, int sstep, - cv::Size size, int sp, int sr, int maxIter, float eps, int *tab); -void meanShiftProc_(const Mat &src_roi, Mat &dst_roi, Mat &dstCoor_roi, - int sp, int sr, cv::TermCriteria crit); +//typedef struct +//{ +// short x; +// short y; +//} COOR; +//COOR do_meanShift(int x0, int y0, uchar *sptr, uchar *dptr, int sstep, +// cv::Size size, int sp, int sr, int maxIter, float eps, int *tab); +//void meanShiftProc_(const Mat &src_roi, Mat &dst_roi, Mat &dstCoor_roi, +// int sp, int sr, cv::TermCriteria crit); template diff --git a/modules/ocl/perf/perf_pyramid.cpp b/modules/ocl/perf/perf_pyramid.cpp index 10262799f1..6b24811a6a 100644 --- a/modules/ocl/perf/perf_pyramid.cpp +++ b/modules/ocl/perf/perf_pyramid.cpp @@ -45,88 +45,103 @@ //M*/ #include "perf_precomp.hpp" +using namespace perf; +using std::tr1::tuple; +using std::tr1::get; + ///////////// pyrDown ////////////////////// -PERFTEST(pyrDown) -{ - Mat src, dst, ocl_dst; - int all_type[] = {CV_8UC1, CV_8UC4}; - std::string type_name[] = {"CV_8UC1", "CV_8UC4"}; - for (int size = Min_Size; size <= Max_Size; size *= Multiple) - { - for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) - { - SUBTEST << size << 'x' << size << "; " << type_name[j] ; +CV_ENUM(pyrDownMatType, CV_8UC1, CV_8UC4) - gen(src, size, size, all_type[j], 0, 256); +typedef tuple pyrDownParams; +typedef TestBaseWithParam pyrDownFixture; - pyrDown(src, dst); +PERF_TEST_P(pyrDownFixture, pyrDown, + ::testing::Combine(OCL_TYPICAL_MAT_SIZES, + pyrDownMatType::all())) +{ + // getting params + pyrDownParams params = GetParam(); + const Size srcSize = get<0>(params); + const int type = get<1>(params); - CPU_ON; - pyrDown(src, dst); - CPU_OFF; + std::string impl = getSelectedImpl(); - ocl::oclMat d_src(src); - ocl::oclMat d_dst; + // creating src data + Mat src(srcSize, type), dst; + Size dstSize((srcSize.height + 1) >> 1, (srcSize.width + 1) >> 1); + dst.create(dstSize, type); + declare.in(src).out(dst); - WARMUP_ON; - ocl::pyrDown(d_src, d_dst); - WARMUP_OFF; + // select implementation + if (impl == "ocl") + { + ocl::oclMat oclSrc(src), oclDst(dstSize, type); + + TEST_CYCLE() cv::ocl::pyrDown(oclSrc, oclDst); - GPU_ON; - ocl::pyrDown(d_src, d_dst); - GPU_OFF; + oclDst.download(dst); - GPU_FULL_ON; - d_src.upload(src); - ocl::pyrDown(d_src, d_dst); - d_dst.download(ocl_dst); - GPU_FULL_OFF; + SANITY_CHECK(dst); + } + else if (impl == "plain") + { + TEST_CYCLE() cv::pyrDown(src, dst); - TestSystem::instance().ExpectedMatNear(dst, ocl_dst, dst.depth() == CV_32F ? 1e-4f : 1.0f); - } + SANITY_CHECK(dst); } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); } ///////////// pyrUp //////////////////////// -PERFTEST(pyrUp) -{ - Mat src, dst, ocl_dst; - int all_type[] = {CV_8UC1, CV_8UC4}; - std::string type_name[] = {"CV_8UC1", "CV_8UC4"}; - for (int size = 500; size <= 2000; size *= 2) - { - for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) - { - SUBTEST << size << 'x' << size << "; " << type_name[j] ; +typedef pyrDownMatType pyrUpMatType; +typedef tuple pyrUpParams; +typedef TestBaseWithParam pyrUpFixture; - gen(src, size, size, all_type[j], 0, 256); +PERF_TEST_P(pyrUpFixture, pyrUp, + ::testing::Combine(OCL_TYPICAL_MAT_SIZES, + pyrUpMatType::all())) +{ + // getting params + pyrUpParams params = GetParam(); + const Size srcSize = get<0>(params); + const int type = get<1>(params); - pyrUp(src, dst); + std::string impl = getSelectedImpl(); - CPU_ON; - pyrUp(src, dst); - CPU_OFF; + // creating src data + Mat src(srcSize, type), dst; + Size dstSize(srcSize.height << 1, srcSize.width << 1); + dst.create(dstSize, type); + declare.in(src).out(dst); - ocl::oclMat d_src(src); - ocl::oclMat d_dst; + // select implementation + if (impl == "ocl") + { + ocl::oclMat oclSrc(src), oclDst(dstSize, type); - WARMUP_ON; - ocl::pyrUp(d_src, d_dst); - WARMUP_OFF; + TEST_CYCLE() cv::ocl::pyrDown(oclSrc, oclDst); - GPU_ON; - ocl::pyrUp(d_src, d_dst); - GPU_OFF; + oclDst.download(dst); - GPU_FULL_ON; - d_src.upload(src); - ocl::pyrUp(d_src, d_dst); - d_dst.download(ocl_dst); - GPU_FULL_OFF; + SANITY_CHECK(dst); + } + else if (impl == "plain") + { + TEST_CYCLE() cv::pyrDown(src, dst); - TestSystem::instance().ExpectedMatNear(dst, ocl_dst, (src.depth() == CV_32F ? 1e-4f : 1.0)); - } + SANITY_CHECK(dst); } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); } diff --git a/modules/ocl/perf/perf_split_merge.cpp b/modules/ocl/perf/perf_split_merge.cpp index 736125ec6c..304d3dd37a 100644 --- a/modules/ocl/perf/perf_split_merge.cpp +++ b/modules/ocl/perf/perf_split_merge.cpp @@ -45,110 +45,120 @@ //M*/ #include "perf_precomp.hpp" +using namespace perf; +using std::tr1::tuple; +using std::tr1::get; + ///////////// Merge//////////////////////// -PERFTEST(Merge) -{ - Mat dst, ocl_dst; - ocl::oclMat d_dst; - int channels = 4; - int all_type[] = {CV_8UC1, CV_32FC1}; - std::string type_name[] = {"CV_8UC1", "CV_32FC1"}; +CV_ENUM(MergeMatType, CV_8U, CV_32F) - for (int size = Min_Size; size <= Max_Size; size *= Multiple) - { - for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) - { - SUBTEST << size << 'x' << size << "; " << type_name[j] ; - Size size1 = Size(size, size); - std::vector src(channels); - - for (int i = 0; i < channels; ++i) - { - src[i] = Mat(size1, all_type[j], cv::Scalar::all(i)); - } - - merge(src, dst); - - CPU_ON; - merge(src, dst); - CPU_OFF; - - std::vector d_src(channels); - - for (int i = 0; i < channels; ++i) - { - d_src[i] = ocl::oclMat(size1, all_type[j], cv::Scalar::all(i)); - } - - WARMUP_ON; - ocl::merge(d_src, d_dst); - WARMUP_OFF; - - GPU_ON; - ocl::merge(d_src, d_dst); - GPU_OFF; - - GPU_FULL_ON; - for (int i = 0; i < channels; ++i) - { - d_src[i] = ocl::oclMat(size1, all_type[j], cv::Scalar::all(i)); - } - ocl::merge(d_src, d_dst); - d_dst.download(ocl_dst); - GPU_FULL_OFF; - - TestSystem::instance().ExpectedMatNear(dst, ocl_dst, 0.0); - } +typedef tuple MergeParams; +typedef TestBaseWithParam MergeFixture; - } -} - -///////////// Split//////////////////////// -PERFTEST(Split) +PERF_TEST_P(MergeFixture, Merge, + ::testing::Combine(::testing::Values(OCL_SIZE_1000, OCL_SIZE_2000), + MergeMatType::all())) { - //int channels = 4; - int all_type[] = {CV_8UC1, CV_32FC1}; - std::string type_name[] = {"CV_8UC1", "CV_32FC1"}; + // getting params + MergeParams params = GetParam(); + const Size srcSize = get<0>(params); + const int depth = get<1>(params), channels = 3; + + std::string impl = getSelectedImpl(); + + // creating src data + const int dstType = CV_MAKE_TYPE(depth, channels); + Mat dst(srcSize, dstType); + vector src(channels); + for (vector::iterator i = src.begin(), end = src.end(); i != end; ++i) + { + i->create(srcSize, CV_MAKE_TYPE(depth, 1)); + declare.in(*i, WARMUP_RNG); + } + declare.out(dst); - for (int size = Min_Size; size <= Max_Size; size *= Multiple) + // select implementation + if (impl == "ocl") { - for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) - { - SUBTEST << size << 'x' << size << "; " << type_name[j]; - Size size1 = Size(size, size); + ocl::oclMat oclDst(srcSize, dstType); + vector oclSrc(src.size()); + for (vector::size_type i = 0, end = src.size(); i < end; ++i) + oclSrc[i] = src[i]; - Mat src(size1, CV_MAKE_TYPE(all_type[j], 4), cv::Scalar(1, 2, 3, 4)); + TEST_CYCLE() cv::ocl::merge(oclSrc, oclDst); - std::vector dst, ocl_dst(4); + oclDst.download(dst); - split(src, dst); + SANITY_CHECK(dst); + } + else if (impl == "plain") + { + TEST_CYCLE() cv::merge(src, dst); - CPU_ON; - split(src, dst); - CPU_OFF; + SANITY_CHECK(dst); + } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); +} - ocl::oclMat d_src(size1, CV_MAKE_TYPE(all_type[j], 4), cv::Scalar(1, 2, 3, 4)); - std::vector d_dst; +///////////// Split//////////////////////// - WARMUP_ON; - ocl::split(d_src, d_dst); - WARMUP_OFF; +typedef MergeMatType SplitMatType; +typedef tuple SplitParams; +typedef TestBaseWithParam SplitFixture; - GPU_ON; - ocl::split(d_src, d_dst); - GPU_OFF; +PERF_TEST_P(SplitFixture, Split, + ::testing::Combine(OCL_TYPICAL_MAT_SIZES, + SplitMatType::all())) +{ + // getting params + MergeParams params = GetParam(); + const Size srcSize = get<0>(params); + const int depth = get<1>(params), channels = 3; - GPU_FULL_ON; - d_src.upload(src); - ocl::split(d_src, d_dst); - for(size_t i = 0; i < dst.size(); i++) - d_dst[i].download(ocl_dst[i]); - GPU_FULL_OFF; + std::string impl = getSelectedImpl(); - vector eps(4, 0.); - TestSystem::instance().ExpectMatsNear(dst, ocl_dst, eps); - } + // creating src data + Mat src(srcSize, CV_MAKE_TYPE(depth, channels)); + declare.in(src, WARMUP_RNG); + // select implementation + if (impl == "ocl") + { + ocl::oclMat oclSrc(src); + vector oclDst(channels, ocl::oclMat(srcSize, CV_MAKE_TYPE(depth, 1))); + + TEST_CYCLE() cv::ocl::split(oclSrc, oclDst); + + AssertEQ(channels, 3); + Mat dst0, dst1, dst2; + oclDst[0].download(dst0); + oclDst[1].download(dst1); + oclDst[2].download(dst2); + SANITY_CHECK(dst0); + SANITY_CHECK(dst1); + SANITY_CHECK(dst2); + } + else if (impl == "plain") + { + vector dst(channels, Mat(srcSize, CV_MAKE_TYPE(depth, 1))); + TEST_CYCLE() cv::split(src, dst); + + AssertEQ(channels, 3); + Mat & dst0 = dst[0], & dst1 = dst[1], & dst2 = dst[2]; + SANITY_CHECK(dst0); + SANITY_CHECK(dst1); + SANITY_CHECK(dst2); } +#ifdef HAVE_OPENCV_GPU + else if (impl == "gpu") + CV_TEST_FAIL_NO_IMPL(); +#endif + else + CV_TEST_FAIL_NO_IMPL(); } From d02ccc95908593a481c7c26ed08f2f6bf49dc11c Mon Sep 17 00:00:00 2001 From: ilya-lavrenov Date: Fri, 23 Aug 2013 18:38:31 +0400 Subject: [PATCH 4/4] the code was refactored and old test system code was removed --- modules/ocl/perf/main.cpp | 159 ++---- modules/ocl/perf/perf_arithm.cpp | 468 +++++------------- modules/ocl/perf/perf_blend.cpp | 14 +- modules/ocl/perf/perf_brute_force_matcher.cpp | 151 +----- modules/ocl/perf/perf_calib3d.cpp | 15 +- modules/ocl/perf/perf_canny.cpp | 17 +- modules/ocl/perf/perf_color.cpp | 13 +- modules/ocl/perf/perf_fft.cpp | 22 +- modules/ocl/perf/perf_filters.cpp | 149 ++---- modules/ocl/perf/perf_gemm.cpp | 14 +- modules/ocl/perf/perf_gftt.cpp | 22 +- modules/ocl/perf/perf_haar.cpp | 12 +- modules/ocl/perf/perf_hog.cpp | 17 +- modules/ocl/perf/perf_imgproc.cpp | 253 +++------- modules/ocl/perf/perf_match_template.cpp | 38 +- modules/ocl/perf/perf_matrix_operation.cpp | 70 +-- modules/ocl/perf/perf_moments.cpp | 26 +- modules/ocl/perf/perf_norm.cpp | 15 +- modules/ocl/perf/perf_opticalflow.cpp | 312 ++++-------- modules/ocl/perf/perf_precomp.cpp | 449 ----------------- modules/ocl/perf/perf_precomp.hpp | 467 +---------------- modules/ocl/perf/perf_pyramid.cpp | 59 +-- modules/ocl/perf/perf_split_merge.cpp | 51 +- 23 files changed, 537 insertions(+), 2276 deletions(-) diff --git a/modules/ocl/perf/main.cpp b/modules/ocl/perf/main.cpp index f67961f87e..e24c2c14e5 100644 --- a/modules/ocl/perf/main.cpp +++ b/modules/ocl/perf/main.cpp @@ -42,153 +42,54 @@ #include "perf_precomp.hpp" -static int old_main(int argc, const char *argv[]) +const char * impls[] = +{ + IMPL_OCL, + IMPL_PLAIN, +#ifdef HAVE_OPENCV_GPU + IMPL_GPU +#endif +}; + +int main(int argc, char ** argv) { - const char *keys = - "{ h | help | false | print help message }" - "{ f | filter | | filter for test }" - "{ w | workdir | | set working directory }" - "{ l | list | false | show all tests }" - "{ d | device | 0 | device id }" - "{ c | cpu_ocl | false | use cpu as ocl device}" - "{ i | iters | 10 | iteration count }" - "{ m | warmup | 1 | gpu warm up iteration count}" - "{ t | xtop | 1.1 | xfactor top boundary}" - "{ b | xbottom | 0.9 | xfactor bottom boundary}" - "{ v | verify | false | only run gpu once to verify if problems occur}"; + const char * keys = + "{ h | help | false | print help message }" + "{ t | type | gpu | set device type:cpu or gpu}" + "{ p | platform | 0 | set platform id }" + "{ d | device | 0 | set device id }"; - redirectError(cvErrorCallback); CommandLineParser cmd(argc, argv, keys); if (cmd.get("help")) { - cout << "Avaible options:" << endl; + cout << "Available options besides google test option:" << endl; cmd.printParams(); return 0; } - // get ocl devices - bool use_cpu = cmd.get("c"); - vector oclinfo; - int num_devices = 0; - if(use_cpu) - num_devices = getDevice(oclinfo, ocl::CVCL_DEVICE_TYPE_CPU); - else - num_devices = getDevice(oclinfo); - if (num_devices < 1) - { - cerr << "no device found\n"; - return -1; - } - - // show device info - int devidx = 0; - for (size_t i = 0; i < oclinfo.size(); i++) - { - for (size_t j = 0; j < oclinfo[i].DeviceName.size(); j++) - { - cout << "device " << devidx++ << ": " << oclinfo[i].DeviceName[j] << endl; - } - } - + string type = cmd.get("type"); + unsigned int pid = cmd.get("platform"); int device = cmd.get("device"); - if (device < 0 || device >= num_devices) - { - cerr << "Invalid device ID" << endl; - return -1; - } - - // set this to overwrite binary cache every time the test starts - ocl::setBinaryDiskCache(ocl::CACHE_UPDATE); - - if (cmd.get("verify")) - { - TestSystem::instance().setNumIters(1); - TestSystem::instance().setGPUWarmupIters(0); - TestSystem::instance().setCPUIters(0); - } - - devidx = 0; - for (size_t i = 0; i < oclinfo.size(); i++) - { - for (size_t j = 0; j < oclinfo[i].DeviceName.size(); j++, devidx++) - { - if (device == devidx) - { - ocl::setDevice(oclinfo[i], (int)j); - TestSystem::instance().setRecordName(oclinfo[i].DeviceName[j]); - cout << "use " << devidx << ": " <("filter"); - string workdir = cmd.get("workdir"); - bool list = cmd.get("list"); - int iters = cmd.get("iters"); - int wu_iters = cmd.get("warmup"); - double x_top = cmd.get("xtop"); - double x_bottom = cmd.get("xbottom"); + int flag = type == "cpu" ? cv::ocl::CVCL_DEVICE_TYPE_CPU : + cv::ocl::CVCL_DEVICE_TYPE_GPU; - TestSystem::instance().setTopThreshold(x_top); - TestSystem::instance().setBottomThreshold(x_bottom); - - if (!filter.empty()) - { - TestSystem::instance().setTestFilter(filter); - } - - if (!workdir.empty()) + std::vector oclinfo; + int devnums = cv::ocl::getDevice(oclinfo, flag); + if (devnums <= device || device < 0) { - if (workdir[workdir.size() - 1] != '/' && workdir[workdir.size() - 1] != '\\') - { - workdir += '/'; - } - - TestSystem::instance().setWorkingDir(workdir); + std::cout << "device invalid\n"; + return -1; } - if (list) + if (pid >= oclinfo.size()) { - TestSystem::instance().setListMode(true); - } - - TestSystem::instance().setNumIters(iters); - TestSystem::instance().setGPUWarmupIters(wu_iters); - - TestSystem::instance().run(); - - return 0; -} - -const char * impls[] = -{ - "ocl", - "plain", -#ifdef HAVE_OPENCV_GPU - "gpu" -#endif -}; - -int main(int argc, char **argv) -{ - // temp solution: if no '--gtest_' and '--perf_' args switch to old behavior - bool useGTest = false; - - for(int i=1; i LUTParams; -typedef TestBaseWithParam LUTFixture; +typedef Size_MatType LUTFixture; PERF_TEST_P(LUTFixture, LUT, ::testing::Combine(OCL_TYPICAL_MAT_SIZES, - LUTMatTypes::all())) + OCL_PERF_ENUM(CV_8UC1, CV_8UC3))) { // getting params - LUTParams params = GetParam(); + const Size_MatType_t params = GetParam(); const Size srcSize = get<0>(params); const int type = get<1>(params); - const std::string impl = getSelectedImpl(); - // creating src data Mat src(srcSize, type), lut(1, 256, CV_8UC1); int dstType = CV_MAKETYPE(lut.depth(), src.channels()); @@ -77,28 +72,23 @@ PERF_TEST_P(LUTFixture, LUT, declare.in(src, WARMUP_RNG).in(lut).out(dst); // select implementation - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclSrc(src), oclLut(lut), oclDst(srcSize, dstType); TEST_CYCLE() cv::ocl::LUT(oclSrc, oclLut, oclDst); - oclDst.download(dst); SANITY_CHECK(dst); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { TEST_CYCLE() cv::LUT(src, lut, dst); SANITY_CHECK(dst); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } ///////////// Exp //////////////////////// @@ -109,8 +99,7 @@ PERF_TEST_P(ExpFixture, Exp, OCL_TYPICAL_MAT_SIZES) { // getting params const Size srcSize = GetParam(); - - const std::string impl = getSelectedImpl(); + const double eps = 3e-1; // creating src data Mat src(srcSize, CV_32FC1), dst(srcSize, CV_32FC1); @@ -118,7 +107,7 @@ PERF_TEST_P(ExpFixture, Exp, OCL_TYPICAL_MAT_SIZES) randu(src, 5, 16); // select implementation - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclSrc(src), oclDst(srcSize, src.type()); @@ -126,20 +115,16 @@ PERF_TEST_P(ExpFixture, Exp, OCL_TYPICAL_MAT_SIZES) oclDst.download(dst); - SANITY_CHECK(dst, 0.3); + SANITY_CHECK(dst, eps); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { TEST_CYCLE() cv::exp(src, dst); - SANITY_CHECK(dst, 0.3); + SANITY_CHECK(dst, eps); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } ///////////// LOG //////////////////////// @@ -150,7 +135,7 @@ PERF_TEST_P(LogFixture, Log, OCL_TYPICAL_MAT_SIZES) { // getting params const Size srcSize = GetParam(); - const std::string impl = getSelectedImpl(); + const double eps = 1e-5; // creating src data Mat src(srcSize, CV_32F), dst(srcSize, src.type()); @@ -161,7 +146,7 @@ PERF_TEST_P(LogFixture, Log, OCL_TYPICAL_MAT_SIZES) declare.time(3.6); // select implementation - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclSrc(src), oclDst(srcSize, src.type()); @@ -169,38 +154,30 @@ PERF_TEST_P(LogFixture, Log, OCL_TYPICAL_MAT_SIZES) oclDst.download(dst); - SANITY_CHECK(dst); + SANITY_CHECK(dst, eps); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { TEST_CYCLE() cv::log(src, dst); - SANITY_CHECK(dst); + SANITY_CHECK(dst, eps); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } ///////////// Add //////////////////////// -CV_ENUM(AddMatTypes, CV_8UC1, CV_32FC1) - -typedef tuple AddParams; -typedef TestBaseWithParam AddFixture; +typedef Size_MatType AddFixture; PERF_TEST_P(AddFixture, Add, ::testing::Combine(OCL_TYPICAL_MAT_SIZES, - AddMatTypes::all())) + OCL_PERF_ENUM(CV_8UC1, CV_32FC1))) { // getting params - AddParams params = GetParam(); + const Size_MatType_t params = GetParam(); const Size srcSize = get<0>(params); const int type = get<1>(params); - const string impl = getSelectedImpl(); // creating src data Mat src1(srcSize, type), src2(srcSize, type), dst(srcSize, type); @@ -209,7 +186,7 @@ PERF_TEST_P(AddFixture, Add, declare.in(src1, src2).out(dst); // select implementation - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclSrc1(src1), oclSrc2(src2), oclDst(srcSize, type); @@ -219,35 +196,27 @@ PERF_TEST_P(AddFixture, Add, SANITY_CHECK(dst); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { TEST_CYCLE() cv::add(src1, src2, dst); SANITY_CHECK(dst); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } ///////////// Mul //////////////////////// -CV_ENUM(MulMatTypes, CV_8UC1, CV_8UC4) - -typedef tuple MulParams; -typedef TestBaseWithParam MulFixture; +typedef Size_MatType MulFixture; PERF_TEST_P(MulFixture, Mul, ::testing::Combine(OCL_TYPICAL_MAT_SIZES, - MulMatTypes::all())) + OCL_PERF_ENUM(CV_8UC1, CV_8UC4))) { // getting params - MulParams params = GetParam(); + const Size_MatType_t params = GetParam(); const Size srcSize = get<0>(params); const int type = get<1>(params); - const string impl = getSelectedImpl(); // creating src data Mat src1(srcSize, type), src2(srcSize, type), dst(srcSize, type); @@ -256,7 +225,7 @@ PERF_TEST_P(MulFixture, Mul, ::testing::Combine(OCL_TYPICAL_MAT_SIZES, declare.in(src1, src2).out(dst); // select implementation - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclSrc1(src1), oclSrc2(src2), oclDst(srcSize, type); @@ -266,34 +235,28 @@ PERF_TEST_P(MulFixture, Mul, ::testing::Combine(OCL_TYPICAL_MAT_SIZES, SANITY_CHECK(dst); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { TEST_CYCLE() cv::multiply(src1, src2, dst); SANITY_CHECK(dst); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } ///////////// Div //////////////////////// -typedef MulMatTypes DivMatTypes; -typedef tuple DivParams; -typedef TestBaseWithParam DivFixture; +typedef Size_MatType DivFixture; -PERF_TEST_P(DivFixture, Div, ::testing::Combine(OCL_TYPICAL_MAT_SIZES, - DivMatTypes::all())) +PERF_TEST_P(DivFixture, Div, + ::testing::Combine(OCL_TYPICAL_MAT_SIZES, + OCL_PERF_ENUM(CV_8UC1, CV_8UC4))) { // getting params - DivParams params = GetParam(); + const Size_MatType_t params = GetParam(); const Size srcSize = get<0>(params); const int type = get<1>(params); - const string impl = getSelectedImpl(); // creating src data Mat src1(srcSize, type), src2(srcSize, type), dst(srcSize, type); @@ -308,7 +271,7 @@ PERF_TEST_P(DivFixture, Div, ::testing::Combine(OCL_TYPICAL_MAT_SIZES, declare.time(16.6); // select implementation - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclSrc1(src1), oclSrc2(src2), oclDst(srcSize, type); @@ -318,43 +281,34 @@ PERF_TEST_P(DivFixture, Div, ::testing::Combine(OCL_TYPICAL_MAT_SIZES, SANITY_CHECK(dst); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { TEST_CYCLE() cv::divide(src1, src2, dst); SANITY_CHECK(dst); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } ///////////// Absdiff //////////////////////// -typedef MulMatTypes AbsDiffMatTypes; -typedef tuple AbsDiffParams; -typedef TestBaseWithParam AbsDiffFixture; +typedef Size_MatType AbsDiffFixture; -PERF_TEST_P(AbsDiffFixture, Absdiff, ::testing::Combine(OCL_TYPICAL_MAT_SIZES, - AbsDiffMatTypes::all())) +PERF_TEST_P(AbsDiffFixture, Absdiff, + ::testing::Combine(OCL_TYPICAL_MAT_SIZES, + OCL_PERF_ENUM(CV_8UC1, CV_8UC4))) { - // getting params - AbsDiffParams params = GetParam(); + const Size_MatType_t params = GetParam(); const Size srcSize = get<0>(params); const int type = get<1>(params); - const string impl = getSelectedImpl(); - // creating src data Mat src1(srcSize, type), src2(srcSize, type), dst(srcSize, type); declare.in(src1, src2).in(dst); randu(src1, 0, 256); randu(src2, 0, 256); - // select implementation - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclSrc1(src1), oclSrc2(src2), oclDst(srcSize, type); @@ -364,18 +318,14 @@ PERF_TEST_P(AbsDiffFixture, Absdiff, ::testing::Combine(OCL_TYPICAL_MAT_SIZES, SANITY_CHECK(dst); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { TEST_CYCLE() cv::absdiff(src1, src2, dst); SANITY_CHECK(dst); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } ///////////// CartToPolar //////////////////////// @@ -384,11 +334,9 @@ typedef TestBaseWithParam CartToPolarFixture; PERF_TEST_P(CartToPolarFixture, CartToPolar, OCL_TYPICAL_MAT_SIZES) { - // getting params const Size srcSize = GetParam(); - const string impl = getSelectedImpl(); + const double eps = 8e-3; - // creating src data Mat src1(srcSize, CV_32FC1), src2(srcSize, CV_32FC1), dst1(srcSize, CV_32FC1), dst2(srcSize, CV_32FC1); declare.in(src1, src2).out(dst1, dst2); @@ -398,8 +346,7 @@ PERF_TEST_P(CartToPolarFixture, CartToPolar, OCL_TYPICAL_MAT_SIZES) if (srcSize == OCL_SIZE_4000) declare.time(3.6); - // select implementation - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclSrc1(src1), oclSrc2(src2), oclDst1(srcSize, src1.type()), oclDst2(srcSize, src1.type()); @@ -409,22 +356,18 @@ PERF_TEST_P(CartToPolarFixture, CartToPolar, OCL_TYPICAL_MAT_SIZES) oclDst1.download(dst1); oclDst2.download(dst2); - SANITY_CHECK(dst1, 5e-3); - SANITY_CHECK(dst2, 5e-3); + SANITY_CHECK(dst1, eps); + SANITY_CHECK(dst2, eps); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { TEST_CYCLE() cv::cartToPolar(src1, src2, dst1, dst2); - SANITY_CHECK(dst1, 5e-3); - SANITY_CHECK(dst2, 5e-3); + SANITY_CHECK(dst1, eps); + SANITY_CHECK(dst2, eps); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } ///////////// PolarToCart //////////////////////// @@ -433,12 +376,9 @@ typedef TestBaseWithParam PolarToCartFixture; PERF_TEST_P(PolarToCartFixture, PolarToCart, OCL_TYPICAL_MAT_SIZES) { - // getting params const Size srcSize = GetParam(); - const string impl = getSelectedImpl(); - // creating src data - Mat src1(srcSize, CV_32FC1), src2(srcSize, CV_32FC1), + Mat src1(srcSize, CV_32FC1), src2(srcSize, CV_32FC1), dst1(srcSize, CV_32FC1), dst2(srcSize, CV_32FC1); declare.in(src1, src2).out(dst1, dst2); randu(src1, 0, 256); @@ -447,8 +387,7 @@ PERF_TEST_P(PolarToCartFixture, PolarToCart, OCL_TYPICAL_MAT_SIZES) if (srcSize == OCL_SIZE_4000) declare.time(5.4); - // select implementation - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclSrc1(src1), oclSrc2(src2), oclDst1(srcSize, src1.type()), oclDst2(srcSize, src1.type()); @@ -461,19 +400,15 @@ PERF_TEST_P(PolarToCartFixture, PolarToCart, OCL_TYPICAL_MAT_SIZES) SANITY_CHECK(dst1, 5e-5); SANITY_CHECK(dst2, 5e-5); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { TEST_CYCLE() cv::polarToCart(src1, src2, dst1, dst2); SANITY_CHECK(dst1, 5e-5); SANITY_CHECK(dst2, 5e-5); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } ///////////// Magnitude //////////////////////// @@ -482,19 +417,15 @@ typedef TestBaseWithParam MagnitudeFixture; PERF_TEST_P(MagnitudeFixture, Magnitude, OCL_TYPICAL_MAT_SIZES) { - // getting params const Size srcSize = GetParam(); - const string impl = getSelectedImpl(); - // creating src data Mat src1(srcSize, CV_32FC1), src2(srcSize, CV_32FC1), dst(srcSize, CV_32FC1); randu(src1, 0, 1); randu(src2, 0, 1); declare.in(src1, src2).out(dst); - // select implementation - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclSrc1(src1), oclSrc2(src2), oclDst(srcSize, src1.type()); @@ -505,42 +436,32 @@ PERF_TEST_P(MagnitudeFixture, Magnitude, OCL_TYPICAL_MAT_SIZES) SANITY_CHECK(dst, 1e-6); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { TEST_CYCLE() cv::magnitude(src1, src2, dst); SANITY_CHECK(dst, 1e-6); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } ///////////// Transpose //////////////////////// -typedef MulMatTypes TransposeMatTypes; -typedef tuple TransposeParams; -typedef TestBaseWithParam TransposeFixture; +typedef Size_MatType TransposeFixture; PERF_TEST_P(TransposeFixture, Transpose, ::testing::Combine(OCL_TYPICAL_MAT_SIZES, - TransposeMatTypes::all())) + OCL_PERF_ENUM(CV_8UC1, CV_8UC4))) { - // getting params - TransposeParams params = GetParam(); + const Size_MatType_t params = GetParam(); const Size srcSize = get<0>(params); const int type = get<1>(params); - const string impl = getSelectedImpl(); - // creating src data Mat src(srcSize, type), dst(srcSize, type); declare.in(src, WARMUP_RNG).out(dst); - // select implementation - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclSrc(src), oclDst(srcSize, type); @@ -550,42 +471,32 @@ PERF_TEST_P(TransposeFixture, Transpose, SANITY_CHECK(dst); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { TEST_CYCLE() cv::transpose(src, dst); SANITY_CHECK(dst); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } ///////////// Flip //////////////////////// -typedef MulMatTypes FlipMatTypes; -typedef tuple FlipParams; -typedef TestBaseWithParam FlipFixture; +typedef Size_MatType FlipFixture; PERF_TEST_P(FlipFixture, Flip, ::testing::Combine(OCL_TYPICAL_MAT_SIZES, - FlipMatTypes::all())) + OCL_PERF_ENUM(CV_8UC1, CV_8UC4))) { - // getting params - TransposeParams params = GetParam(); + const Size_MatType_t params = GetParam(); const Size srcSize = get<0>(params); const int type = get<1>(params); - const string impl = getSelectedImpl(); - // creating src data Mat src(srcSize, type), dst(srcSize, type); declare.in(src, WARMUP_RNG).out(dst); - // select implementation - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclSrc(src), oclDst(srcSize, type); @@ -595,44 +506,35 @@ PERF_TEST_P(FlipFixture, Flip, SANITY_CHECK(dst); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { TEST_CYCLE() cv::flip(src, dst, 0); SANITY_CHECK(dst); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } ///////////// minMax //////////////////////// -typedef AddMatTypes minMaxMatTypes; -typedef tuple minMaxParams; -typedef TestBaseWithParam minMaxFixture; +typedef Size_MatType minMaxFixture; PERF_TEST_P(minMaxFixture, minMax, ::testing::Combine(OCL_TYPICAL_MAT_SIZES, - minMaxMatTypes::all())) + OCL_PERF_ENUM(CV_8UC1, CV_32FC1))) { - // getting params - minMaxParams params = GetParam(); + const Size_MatType_t params = GetParam(); const Size srcSize = get<0>(params); const int type = get<1>(params); - const string impl = getSelectedImpl(); - // creating src data Mat src(srcSize, type); declare.in(src, WARMUP_RNG); - double min_val = 0.0, max_val = 0.0; + double min_val = std::numeric_limits::max(), + max_val = std::numeric_limits::min(); - // select implementation - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclSrc(src); @@ -642,7 +544,7 @@ PERF_TEST_P(minMaxFixture, minMax, SANITY_CHECK(min_val); SANITY_CHECK(max_val); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { Point min_loc, max_loc; @@ -652,31 +554,22 @@ PERF_TEST_P(minMaxFixture, minMax, SANITY_CHECK(min_val); SANITY_CHECK(max_val); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } ///////////// minMaxLoc //////////////////////// -typedef AddMatTypes minMaxLocMatTypes; -typedef tuple minMaxLocParams; -typedef TestBaseWithParam minMaxLocFixture; +typedef Size_MatType minMaxLocFixture; PERF_TEST_P(minMaxLocFixture, minMaxLoc, ::testing::Combine(OCL_TYPICAL_MAT_SIZES, - minMaxLocMatTypes::all())) + OCL_PERF_ENUM(CV_8UC1, CV_32FC1))) { - // getting params - minMaxLocParams params = GetParam(); + const Size_MatType_t params = GetParam(); const Size srcSize = get<0>(params); const int type = get<1>(params); - const string impl = getSelectedImpl(); - // creating src data Mat src(srcSize, type); randu(src, 0, 1); declare.in(src); @@ -684,8 +577,7 @@ PERF_TEST_P(minMaxLocFixture, minMaxLoc, double min_val = 0.0, max_val = 0.0; Point min_loc, max_loc; - // select implementation - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclSrc(src); @@ -695,7 +587,7 @@ PERF_TEST_P(minMaxLocFixture, minMaxLoc, SANITY_CHECK(min_val); SANITY_CHECK(max_val); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { TEST_CYCLE() cv::minMaxLoc(src, &min_val, &max_val, &min_loc, &max_loc); @@ -703,39 +595,28 @@ PERF_TEST_P(minMaxLocFixture, minMaxLoc, SANITY_CHECK(min_val); SANITY_CHECK(max_val); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } ///////////// Sum //////////////////////// -CV_ENUM(SumMatTypes, CV_8UC1, CV_32SC1) - -typedef tuple SumParams; -typedef TestBaseWithParam SumFixture; +typedef Size_MatType SumFixture; PERF_TEST_P(SumFixture, Sum, ::testing::Combine(OCL_TYPICAL_MAT_SIZES, - SumMatTypes::all())) + OCL_PERF_ENUM(CV_8UC1, CV_32SC1))) { - // getting params - SumParams params = GetParam(); + const Size_MatType_t params = GetParam(); const Size srcSize = get<0>(params); const int type = get<1>(params); - const string impl = getSelectedImpl(); - // creating src data - Mat src(srcSize, type); + Mat src(srcSize, type); Scalar result; randu(src, 0, 60); declare.in(src); - // select implementation - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclSrc(src); @@ -743,45 +624,34 @@ PERF_TEST_P(SumFixture, Sum, SANITY_CHECK(result); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { TEST_CYCLE() result = cv::sum(src); SANITY_CHECK(result); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } ///////////// countNonZero //////////////////////// -CV_ENUM(countNonZeroMatTypes, CV_8UC1, CV_32FC1) - -typedef tuple countNonZeroParams; -typedef TestBaseWithParam countNonZeroFixture; +typedef Size_MatType countNonZeroFixture; PERF_TEST_P(countNonZeroFixture, countNonZero, ::testing::Combine(OCL_TYPICAL_MAT_SIZES, - countNonZeroMatTypes::all())) + OCL_PERF_ENUM(CV_8UC1, CV_32FC1))) { - // getting params - countNonZeroParams params = GetParam(); + const Size_MatType_t params = GetParam(); const Size srcSize = get<0>(params); const int type = get<1>(params); - const string impl = getSelectedImpl(); - // creating src data Mat src(srcSize, type); int result = 0; randu(src, 0, 256); declare.in(src); - // select implementation - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclSrc(src); @@ -789,18 +659,14 @@ PERF_TEST_P(countNonZeroFixture, countNonZero, SANITY_CHECK(result); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { TEST_CYCLE() result = cv::countNonZero(src); SANITY_CHECK(result); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } ///////////// Phase //////////////////////// @@ -809,19 +675,15 @@ typedef TestBaseWithParam PhaseFixture; PERF_TEST_P(PhaseFixture, Phase, OCL_TYPICAL_MAT_SIZES) { - // getting params const Size srcSize = GetParam(); - const string impl = getSelectedImpl(); - // creating src data Mat src1(srcSize, CV_32FC1), src2(srcSize, CV_32FC1), dst(srcSize, CV_32FC1); declare.in(src1, src2).out(dst); randu(src1, 0, 256); randu(src2, 0, 256); - // select implementation - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclSrc1(src1), oclSrc2(src2), oclDst(srcSize, src1.type()); @@ -832,44 +694,34 @@ PERF_TEST_P(PhaseFixture, Phase, OCL_TYPICAL_MAT_SIZES) SANITY_CHECK(dst, 1e-2); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { TEST_CYCLE() cv::phase(src1, src2, dst, 1); SANITY_CHECK(dst, 1e-2); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } ///////////// bitwise_and//////////////////////// -typedef SumMatTypes BitwiseAndMatTypes; -typedef tuple BitwiseAndParams; -typedef TestBaseWithParam BitwiseAndFixture; +typedef Size_MatType BitwiseAndFixture; PERF_TEST_P(BitwiseAndFixture, bitwise_and, ::testing::Combine(OCL_TYPICAL_MAT_SIZES, - BitwiseAndMatTypes::all())) + OCL_PERF_ENUM(CV_8UC1, CV_32SC1))) { - // getting params - BitwiseAndParams params = GetParam(); + const Size_MatType_t params = GetParam(); const Size srcSize = get<0>(params); const int type = get<1>(params); - const string impl = getSelectedImpl(); - // creating src data - Mat src1(srcSize, type), src2(srcSize, type), dst(srcSize, type); + Mat src1(srcSize, type), src2(srcSize, type), dst(srcSize, type); declare.in(src1, src2).out(dst); randu(src1, 0, 256); randu(src2, 0, 256); - // select implementation - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclSrc1(src1), oclSrc2(src2), oclDst(srcSize, src1.type()); @@ -879,42 +731,32 @@ PERF_TEST_P(BitwiseAndFixture, bitwise_and, SANITY_CHECK(dst); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { TEST_CYCLE() cv::bitwise_and(src1, src2, dst); SANITY_CHECK(dst); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } ///////////// bitwise_not//////////////////////// -typedef SumMatTypes BitwiseNotMatTypes; -typedef tuple BitwiseNotParams; -typedef TestBaseWithParam BitwiseNotFixture; +typedef Size_MatType BitwiseNotFixture; PERF_TEST_P(BitwiseAndFixture, bitwise_not, ::testing::Combine(OCL_TYPICAL_MAT_SIZES, - BitwiseAndMatTypes::all())) + OCL_PERF_ENUM(CV_8UC1, CV_32SC1))) { - // getting params - BitwiseNotParams params = GetParam(); + const Size_MatType_t params = GetParam(); const Size srcSize = get<0>(params); const int type = get<1>(params); - const string impl = getSelectedImpl(); - // creating src data Mat src(srcSize, type), dst(srcSize, type); declare.in(src, WARMUP_RNG).out(dst); - // select implementation - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclSrc(src), oclDst(srcSize, type); @@ -924,42 +766,32 @@ PERF_TEST_P(BitwiseAndFixture, bitwise_not, SANITY_CHECK(dst); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { TEST_CYCLE() cv::bitwise_not(src, dst); SANITY_CHECK(dst); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } ///////////// compare//////////////////////// -typedef countNonZeroMatTypes CompareMatTypes; -typedef tuple CompareParams; -typedef TestBaseWithParam CompareFixture; +typedef Size_MatType CompareFixture; PERF_TEST_P(CompareFixture, compare, ::testing::Combine(OCL_TYPICAL_MAT_SIZES, - CompareMatTypes::all())) + OCL_PERF_ENUM(CV_8UC1, CV_32FC1))) { - // getting params - CompareParams params = GetParam(); + const Size_MatType_t params = GetParam(); const Size srcSize = get<0>(params); const int type = get<1>(params); - const string impl = getSelectedImpl(); - // creating src data Mat src1(srcSize, type), src2(srcSize, type), dst(srcSize, CV_8UC1); declare.in(src1, src2, WARMUP_RNG).out(dst); - // select implementation - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclSrc1(src1), oclSrc2(src2), oclDst(srcSize, CV_8UC1); @@ -969,18 +801,14 @@ PERF_TEST_P(CompareFixture, compare, SANITY_CHECK(dst); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { TEST_CYCLE() cv::compare(src1, src2, dst, CMP_EQ); SANITY_CHECK(dst); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } ///////////// pow //////////////////////// @@ -989,16 +817,12 @@ typedef TestBaseWithParam PowFixture; PERF_TEST_P(PowFixture, pow, OCL_TYPICAL_MAT_SIZES) { - // getting params const Size srcSize = GetParam(); - const string impl = getSelectedImpl(); - // creating src data - Mat src(srcSize, CV_32F), dst(srcSize, CV_32F); + Mat src(srcSize, CV_32F), dst(srcSize, CV_32F); declare.in(src, WARMUP_RNG).out(dst); - // select implementation - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclSrc(src), oclDst(srcSize, src.type()); @@ -1008,18 +832,14 @@ PERF_TEST_P(PowFixture, pow, OCL_TYPICAL_MAT_SIZES) SANITY_CHECK(dst, 5e-2); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { TEST_CYCLE() cv::pow(src, -2.0, dst); SANITY_CHECK(dst, 5e-2); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } ///////////// MagnitudeSqr//////////////////////// @@ -1028,17 +848,13 @@ typedef TestBaseWithParam MagnitudeSqrFixture; PERF_TEST_P(MagnitudeSqrFixture, MagnitudeSqr, OCL_TYPICAL_MAT_SIZES) { - // getting params const Size srcSize = GetParam(); - const string impl = getSelectedImpl(); - // creating src data Mat src1(srcSize, CV_32FC1), src2(srcSize, CV_32FC1), dst(srcSize, CV_32FC1); declare.in(src1, src2, WARMUP_RNG).out(dst); - // select implementation - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclSrc1(src1), oclSrc2(src2), oclDst(srcSize, src1.type()); @@ -1048,7 +864,7 @@ PERF_TEST_P(MagnitudeSqrFixture, MagnitudeSqr, OCL_TYPICAL_MAT_SIZES) SANITY_CHECK(dst, 1e-6, ERROR_RELATIVE); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { ASSERT_EQ(1, src1.channels()); @@ -1070,37 +886,27 @@ PERF_TEST_P(MagnitudeSqrFixture, MagnitudeSqr, OCL_TYPICAL_MAT_SIZES) SANITY_CHECK(dst, 1e-6, ERROR_RELATIVE); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } ///////////// AddWeighted//////////////////////// -typedef countNonZeroMatTypes AddWeightedMatTypes; -typedef tuple AddWeightedParams; -typedef TestBaseWithParam AddWeightedFixture; +typedef Size_MatType AddWeightedFixture; PERF_TEST_P(AddWeightedFixture, AddWeighted, ::testing::Combine(OCL_TYPICAL_MAT_SIZES, - AddWeightedMatTypes::all())) + OCL_PERF_ENUM(CV_8UC1, CV_32FC1))) { - // getting params - AddWeightedParams params = GetParam(); + const Size_MatType_t params = GetParam(); const Size srcSize = get<0>(params); const int type = get<1>(params); - const string impl = getSelectedImpl(); - // creating src data Mat src1(srcSize, type), src2(srcSize, type), dst(srcSize, type); declare.in(src1, src2, WARMUP_RNG).out(dst); double alpha = 2.0, beta = 1.0, gama = 3.0; - // select implementation - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclSrc1(src1), oclSrc2(src2), oclDst(srcSize, type); @@ -1110,16 +916,12 @@ PERF_TEST_P(AddWeightedFixture, AddWeighted, SANITY_CHECK(dst); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { TEST_CYCLE() cv::addWeighted(src1, alpha, src2, beta, gama, dst); SANITY_CHECK(dst); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } diff --git a/modules/ocl/perf/perf_blend.cpp b/modules/ocl/perf/perf_blend.cpp index c8a7608148..ea53c8a66d 100644 --- a/modules/ocl/perf/perf_blend.cpp +++ b/modules/ocl/perf/perf_blend.cpp @@ -82,12 +82,9 @@ typedef TestBaseWithParam blendLinearFixture; PERF_TEST_P(blendLinearFixture, blendLinear, OCL_TYPICAL_MAT_SIZES) { - // getting params const Size srcSize = GetParam(); const int type = CV_8UC1; - const std::string impl = getSelectedImpl(); - // creating src data Mat src1(srcSize, type), src2(srcSize, CV_8UC1), dst; Mat weights1(srcSize, CV_32FC1), weights2(srcSize, CV_32FC1); @@ -95,8 +92,7 @@ PERF_TEST_P(blendLinearFixture, blendLinear, OCL_TYPICAL_MAT_SIZES) randu(weights1, 0.0f, 1.0f); randu(weights2, 0.0f, 1.0f); - // select implementation - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclSrc1(src1), oclSrc2(src2), oclDst; ocl::oclMat oclWeights1(weights1), oclWeights2(weights2); @@ -107,16 +103,12 @@ PERF_TEST_P(blendLinearFixture, blendLinear, OCL_TYPICAL_MAT_SIZES) SANITY_CHECK(dst); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { TEST_CYCLE() blendLinearGold(src1, src2, weights1, weights2, dst); SANITY_CHECK(dst); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } diff --git a/modules/ocl/perf/perf_brute_force_matcher.cpp b/modules/ocl/perf/perf_brute_force_matcher.cpp index 841fa64185..af93b1b103 100644 --- a/modules/ocl/perf/perf_brute_force_matcher.cpp +++ b/modules/ocl/perf/perf_brute_force_matcher.cpp @@ -53,11 +53,10 @@ using namespace perf; typedef TestBaseWithParam BruteForceMatcherFixture; -PERF_TEST_P(BruteForceMatcherFixture, match, - OCL_BFMATCHER_TYPICAL_MAT_SIZES) +PERF_TEST_P(BruteForceMatcherFixture, DISABLED_match, + OCL_BFMATCHER_TYPICAL_MAT_SIZES) // TODO too big difference between implementations { const Size srcSize = GetParam(); - const string impl = getSelectedImpl(); vector matches; Mat query(srcSize, CV_32F), train(srcSize, CV_32F); @@ -65,16 +64,15 @@ PERF_TEST_P(BruteForceMatcherFixture, match, randu(query, 0.0f, 1.0f); randu(train, 0.0f, 1.0f); - if (impl == "plain") + if (RUN_PLAIN_IMPL) { BFMatcher matcher(NORM_L2); TEST_CYCLE() matcher.match(query, train, matches); SANITY_CHECK_MATCHES(matches); } - else if (impl == "ocl") + else if (RUN_OCL_IMPL) { - // Init GPU matcher ocl::BruteForceMatcher_OCL_base oclMatcher(ocl::BruteForceMatcher_OCL_base::L2Dist); ocl::oclMat oclQuery(query), oclTrain(train); @@ -82,53 +80,14 @@ PERF_TEST_P(BruteForceMatcherFixture, match, SANITY_CHECK_MATCHES(matches); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } -//PERF_TEST_P(BruteForceMatcherFixture, matchSingle, -// OCL_BFMATCHER_TYPICAL_MAT_SIZES) -//{ -// const Size srcSize = GetParam(); -// const string impl = getSelectedImpl(); - -// Mat query(srcSize, CV_32F), train(srcSize, CV_32F); -// Mat trainIdx, distance; - -// randu(query, 0.0f, 1.0f); -// randu(train, 0.0f, 1.0f); - -// if (impl == "plain") -// CV_TEST_FAIL_NO_IMPL(); -// else if (impl == "ocl") -// { -// ocl::oclMat oclQuery(query), oclTrain(train), oclTrainIdx, oclDistance; - -// TEST_CYCLE() oclMatcher->matchSingle(oclQuery, oclTrain, oclTrainIdx, oclDistance); - -// oclTrainIdx.download(trainIdx); -// oclDistance.download(distance); - -// SANITY_CHECK(trainIdx); -// SANITY_CHECK(distance); -// } -//#ifdef HAVE_OPENCV_GPU -// else if (impl == "gpu") -// CV_TEST_FAIL_NO_IMPL(); -//#endif -// else -// CV_TEST_FAIL_NO_IMPL(); -//} - -PERF_TEST_P(BruteForceMatcherFixture, knnMatch, - OCL_BFMATCHER_TYPICAL_MAT_SIZES) +PERF_TEST_P(BruteForceMatcherFixture, DISABLED_knnMatch, + OCL_BFMATCHER_TYPICAL_MAT_SIZES) // TODO too many outliers { const Size srcSize = GetParam(); - const string impl = getSelectedImpl(); vector > matches(2); Mat query(srcSize, CV_32F), train(srcSize, CV_32F); @@ -139,7 +98,7 @@ PERF_TEST_P(BruteForceMatcherFixture, knnMatch, if (srcSize.height == 2000) declare.time(8); - if (impl == "plain") + if (RUN_PLAIN_IMPL) { BFMatcher matcher (NORM_L2); TEST_CYCLE() matcher.knnMatch(query, train, matches, 2); @@ -148,7 +107,7 @@ PERF_TEST_P(BruteForceMatcherFixture, knnMatch, SANITY_CHECK_MATCHES(matches0); SANITY_CHECK_MATCHES(matches1); } - else if (impl == "ocl") + else if (RUN_OCL_IMPL) { ocl::BruteForceMatcher_OCL_base oclMatcher(ocl::BruteForceMatcher_OCL_base::L2Dist); ocl::oclMat oclQuery(query), oclTrain(train); @@ -159,55 +118,14 @@ PERF_TEST_P(BruteForceMatcherFixture, knnMatch, SANITY_CHECK_MATCHES(matches0); SANITY_CHECK_MATCHES(matches1); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } -//PERF_TEST_P(BruteForceMatcherFixture, knnMatchSingle, -// OCL_BFMATCHER_TYPICAL_MAT_SIZES) -//{ -// const Size srcSize = GetParam(); -// const string impl = getSelectedImpl(); - -// Mat query(srcSize, CV_32F), train(srcSize, CV_32F); -// Mat trainIdx, distance, allDist; - -// randu(query, 0.0f, 1.0f); -// randu(train, 0.0f, 1.0f); - -// if (impl == "plain") -// CV_TEST_FAIL_NO_IMPL(); -// else if (impl == "ocl") -// { -// ocl::oclMat oclQuery(query), oclTrain(train), oclTrainIdx, oclDistance, oclAllDist; - -// TEST_CYCLE() oclMatcher->knnMatchSingle(oclQuery, oclTrain, oclTrainIdx, oclDistance, oclAllDist, 2); - -// oclTrainIdx.download(trainIdx); -// oclDistance.download(distance); -// oclAllDist.download(allDist); - -// SANITY_CHECK(trainIdx); -// SANITY_CHECK(distance); -// SANITY_CHECK(allDist); -// } -//#ifdef HAVE_OPENCV_GPU -// else if (impl == "gpu") -// CV_TEST_FAIL_NO_IMPL(); -//#endif -// else -// CV_TEST_FAIL_NO_IMPL(); -//} - PERF_TEST_P(BruteForceMatcherFixture, DISABLED_radiusMatch, - OCL_BFMATCHER_TYPICAL_MAT_SIZES) + OCL_BFMATCHER_TYPICAL_MAT_SIZES) // TODO too many outliers { const Size srcSize = GetParam(); - const string impl = getSelectedImpl(); const float max_distance = 2.0f; vector > matches(2); @@ -218,7 +136,7 @@ PERF_TEST_P(BruteForceMatcherFixture, DISABLED_radiusMatch, randu(query, 0.0f, 1.0f); randu(train, 0.0f, 1.0f); - if (impl == "plain") + if (RUN_PLAIN_IMPL) { BFMatcher matcher (NORM_L2); TEST_CYCLE() matcher.radiusMatch(query, matches, max_distance); @@ -227,7 +145,7 @@ PERF_TEST_P(BruteForceMatcherFixture, DISABLED_radiusMatch, SANITY_CHECK_MATCHES(matches0); SANITY_CHECK_MATCHES(matches1); } - else if (impl == "ocl") + else if (RUN_OCL_IMPL) { ocl::oclMat oclQuery(query), oclTrain(train); ocl::BruteForceMatcher_OCL_base oclMatcher(ocl::BruteForceMatcher_OCL_base::L2Dist); @@ -238,49 +156,8 @@ PERF_TEST_P(BruteForceMatcherFixture, DISABLED_radiusMatch, SANITY_CHECK_MATCHES(matches0); SANITY_CHECK_MATCHES(matches1); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } -//PERF_TEST_P(BruteForceMatcherFixture, radiusMatchSingle, -// OCL_BFMATCHER_TYPICAL_MAT_SIZES) -//{ -// const Size srcSize = GetParam(); -// const string impl = getSelectedImpl(); - -// const float max_distance = 2.0f; -// Mat query(srcSize, CV_32F), train(srcSize, CV_32F); -// Mat trainIdx, distance, nMatches; - -// randu(query, 0.0f, 1.0f); -// randu(train, 0.0f, 1.0f); - -// if (impl == "plain") -// CV_TEST_FAIL_NO_IMPL(); -// else if (impl == "ocl") -// { -// ocl::oclMat oclQuery(query), oclTrain(train), oclTrainIdx, oclDistance, oclNMatches; - -// TEST_CYCLE() oclMatcher->radiusMatchSingle(oclQuery, oclTrain, oclTrainIdx, oclDistance, oclNMatches, max_distance); - -// oclTrainIdx.download(trainIdx); -// oclDistance.download(distance); -// oclNMatches.download(nMatches); - -// SANITY_CHECK(trainIdx); -// SANITY_CHECK(distance); -// SANITY_CHECK(nMatches); -// } -//#ifdef HAVE_OPENCV_GPU -// else if (impl == "gpu") -// CV_TEST_FAIL_NO_IMPL(); -//#endif -// else -// CV_TEST_FAIL_NO_IMPL(); -//} - #undef OCL_BFMATCHER_TYPICAL_MAT_SIZES diff --git a/modules/ocl/perf/perf_calib3d.cpp b/modules/ocl/perf/perf_calib3d.cpp index 7288677bf7..a155fc371a 100644 --- a/modules/ocl/perf/perf_calib3d.cpp +++ b/modules/ocl/perf/perf_calib3d.cpp @@ -48,7 +48,7 @@ ///////////// StereoMatchBM //////////////////////// -PERF_TEST(StereoMatchBMFixture, DISABLED_StereoMatchBM) +PERF_TEST(StereoMatchBMFixture, DISABLED_StereoMatchBM) // TODO doesn't work properly { Mat left_image = imread(getDataPath("gpu/stereobm/aloe-L.png"), cv::IMREAD_GRAYSCALE); Mat right_image = imread(getDataPath("gpu/stereobm/aloe-R.png"), cv::IMREAD_GRAYSCALE); @@ -58,13 +58,12 @@ PERF_TEST(StereoMatchBMFixture, DISABLED_StereoMatchBM) ASSERT_TRUE(right_image.size() == left_image.size()); ASSERT_TRUE(right_image.size() == left_image.size()); - const std::string impl = getSelectedImpl(); const int n_disp = 128, winSize = 19; Mat disp(left_image.size(), CV_16SC1); declare.in(left_image, right_image).out(disp); - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclLeft(left_image), oclRight(right_image), oclDisp(left_image.size(), CV_16SC1); @@ -76,7 +75,7 @@ PERF_TEST(StereoMatchBMFixture, DISABLED_StereoMatchBM) SANITY_CHECK(disp); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { StereoBM bm(0, n_disp, winSize); @@ -84,10 +83,6 @@ PERF_TEST(StereoMatchBMFixture, DISABLED_StereoMatchBM) SANITY_CHECK(disp); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); - #endif - else - CV_TEST_FAIL_NO_IMPL(); + else + OCL_PERF_ELSE } diff --git a/modules/ocl/perf/perf_canny.cpp b/modules/ocl/perf/perf_canny.cpp index 34a38efd8e..3a5c633f56 100644 --- a/modules/ocl/perf/perf_canny.cpp +++ b/modules/ocl/perf/perf_canny.cpp @@ -49,34 +49,29 @@ using namespace perf; ///////////// Canny //////////////////////// -PERF_TEST(CannyFixture, Canny) +PERF_TEST(CannyFixture, DISABLED_Canny) // TODO difference between implmentations { Mat img = imread(getDataPath("gpu/stereobm/aloe-L.png"), cv::IMREAD_GRAYSCALE), edges(img.size(), CV_8UC1); - ASSERT_TRUE(!img.empty()) << "can't open aloeL.jpg"; + ASSERT_TRUE(!img.empty()) << "can't open aloe-L.png"; - const std::string impl = getSelectedImpl(); declare.in(img).out(edges); - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclImg(img), oclEdges(img.size(), CV_8UC1); - TEST_CYCLE() Canny(oclImg, oclEdges, 50.0, 100.0); + TEST_CYCLE() ocl::Canny(oclImg, oclEdges, 50.0, 100.0); oclEdges.download(edges); SANITY_CHECK(edges); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { TEST_CYCLE() Canny(img, edges, 50.0, 100.0); SANITY_CHECK(edges); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } diff --git a/modules/ocl/perf/perf_color.cpp b/modules/ocl/perf/perf_color.cpp index 645b835dfa..703cc36cec 100644 --- a/modules/ocl/perf/perf_color.cpp +++ b/modules/ocl/perf/perf_color.cpp @@ -54,12 +54,11 @@ typedef TestBaseWithParam cvtColorFixture; PERF_TEST_P(cvtColorFixture, cvtColor, OCL_TYPICAL_MAT_SIZES) { const Size srcSize = GetParam(); - const std::string impl = getSelectedImpl(); Mat src(srcSize, CV_8UC4), dst(srcSize, CV_8UC4); - declare.in(src).out(dst); + declare.in(src, WARMUP_RNG).out(dst); - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclSrc(src), oclDst(src.size(), CV_8UC4); @@ -68,16 +67,12 @@ PERF_TEST_P(cvtColorFixture, cvtColor, OCL_TYPICAL_MAT_SIZES) SANITY_CHECK(dst); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { TEST_CYCLE() cv::cvtColor(src, dst, CV_RGBA2GRAY, 4); SANITY_CHECK(dst); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } diff --git a/modules/ocl/perf/perf_fft.cpp b/modules/ocl/perf/perf_fft.cpp index e23450926a..ae0291c3e6 100644 --- a/modules/ocl/perf/perf_fft.cpp +++ b/modules/ocl/perf/perf_fft.cpp @@ -51,37 +51,33 @@ using namespace perf; typedef TestBaseWithParam dftFixture; -PERF_TEST_P(dftFixture, DISABLED_dft, OCL_TYPICAL_MAT_SIZES) +PERF_TEST_P(dftFixture, DISABLED_dft, OCL_TYPICAL_MAT_SIZES) // TODO not implemented { - const std::string impl = getSelectedImpl(); - Size srcSize = GetParam(); + const Size srcSize = GetParam(); Mat src(srcSize, CV_32FC2), dst; randu(src, 0.0f, 1.0f); declare.in(src); - if (impl == "ocl") + if (srcSize == OCL_SIZE_4000) + declare.time(7.4); + + if (RUN_OCL_IMPL) { ocl::oclMat oclSrc(src), oclDst; - EXPECT_NO_THROW({ - TEST_CYCLE() cv::ocl::dft(oclSrc, oclDst); - }); + TEST_CYCLE() cv::ocl::dft(oclSrc, oclDst); oclDst.download(dst); SANITY_CHECK(dst); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { TEST_CYCLE() cv::dft(src, dst); SANITY_CHECK(dst); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } diff --git a/modules/ocl/perf/perf_filters.cpp b/modules/ocl/perf/perf_filters.cpp index 3d9be40aaa..588c0569ea 100644 --- a/modules/ocl/perf/perf_filters.cpp +++ b/modules/ocl/perf/perf_filters.cpp @@ -51,29 +51,23 @@ using std::tr1::tuple; ///////////// Blur//////////////////////// -CV_ENUM(BlurMatType, CV_8UC1, CV_8UC4) - -typedef tuple BlurParams; -typedef TestBaseWithParam BlurFixture; +typedef Size_MatType BlurFixture; PERF_TEST_P(BlurFixture, Blur, ::testing::Combine(OCL_TYPICAL_MAT_SIZES, - BlurMatType::all())) + OCL_PERF_ENUM(CV_8UC1, CV_8UC4))) { - // getting params - BlurParams params = GetParam(); + const Size_MatType_t params = GetParam(); const Size srcSize = get<0>(params), ksize(3, 3); const int type = get<1>(params), bordertype = BORDER_CONSTANT; - const std::string impl = getSelectedImpl(); - Mat src(srcSize, type), dst(srcSize, type); declare.in(src, WARMUP_RNG).out(dst); if (srcSize == OCL_SIZE_4000 && type == CV_8UC4) declare.time(5); - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclSrc(src), oclDst(srcSize, type); @@ -83,44 +77,35 @@ PERF_TEST_P(BlurFixture, Blur, SANITY_CHECK(dst, 1 + DBL_EPSILON); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { TEST_CYCLE() cv::blur(src, dst, ksize, Point(-1, -1), bordertype); SANITY_CHECK(dst, 1 + DBL_EPSILON); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } ///////////// Laplacian//////////////////////// -typedef BlurMatType LaplacianMatType; -typedef tuple LaplacianParams; -typedef TestBaseWithParam LaplacianFixture; +typedef Size_MatType LaplacianFixture; PERF_TEST_P(LaplacianFixture, Laplacian, ::testing::Combine(OCL_TYPICAL_MAT_SIZES, - LaplacianMatType::all())) + OCL_PERF_ENUM(CV_8UC1, CV_8UC4))) { - // getting params - LaplacianParams params = GetParam(); + const Size_MatType_t params = GetParam(); const Size srcSize = get<0>(params); const int type = get<1>(params), ksize = 3; - const std::string impl = getSelectedImpl(); - Mat src(srcSize, type), dst(srcSize, type); declare.in(src, WARMUP_RNG).out(dst); if (srcSize == OCL_SIZE_4000 && type == CV_8UC4) declare.time(6); - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclSrc(src), oclDst(srcSize, type); @@ -130,46 +115,36 @@ PERF_TEST_P(LaplacianFixture, Laplacian, SANITY_CHECK(dst); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { TEST_CYCLE() cv::Laplacian(src, dst, -1, ksize, 1); SANITY_CHECK(dst); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } ///////////// Erode //////////////////// -CV_ENUM(ErodeMatType, CV_8UC1, CV_8UC4, CV_32FC1, CV_32FC4) - -typedef tuple ErodeParams; -typedef TestBaseWithParam ErodeFixture; +typedef Size_MatType ErodeFixture; PERF_TEST_P(ErodeFixture, Erode, ::testing::Combine(OCL_TYPICAL_MAT_SIZES, - ErodeMatType::all())) + OCL_PERF_ENUM(CV_8UC1, CV_8UC4, CV_32FC1, CV_32FC4))) { - // getting params - ErodeParams params = GetParam(); + const Size_MatType_t params = GetParam(); const Size srcSize = get<0>(params); const int type = get<1>(params), ksize = 3; const Mat ker = getStructuringElement(MORPH_RECT, Size(ksize, ksize)); - const std::string impl = getSelectedImpl(); - Mat src(srcSize, type), dst(srcSize, type); declare.in(src, WARMUP_RNG).out(dst).in(ker); if (srcSize == OCL_SIZE_4000 && type == CV_8UC4) declare.time(5); - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclSrc(src), oclDst(srcSize, type), oclKer(ker); @@ -179,37 +154,28 @@ PERF_TEST_P(ErodeFixture, Erode, SANITY_CHECK(dst); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { TEST_CYCLE() cv::erode(src, dst, ker); SANITY_CHECK(dst); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } ///////////// Sobel //////////////////////// -typedef BlurMatType SobelMatType; -typedef tuple SobelMatParams; -typedef TestBaseWithParam SobelFixture; +typedef Size_MatType SobelFixture; PERF_TEST_P(SobelFixture, Sobel, ::testing::Combine(OCL_TYPICAL_MAT_SIZES, - SobelMatType::all())) + OCL_PERF_ENUM(CV_8UC1, CV_8UC4))) { - // getting params - SobelMatParams params = GetParam(); + const Size_MatType_t params = GetParam(); const Size srcSize = get<0>(params); const int type = get<1>(params), dx = 1, dy = 1; - const std::string impl = getSelectedImpl(); - Mat src(srcSize, type), dst(srcSize, type); declare.in(src, WARMUP_RNG).out(dst); @@ -219,7 +185,7 @@ PERF_TEST_P(SobelFixture, Sobel, else if (srcSize == OCL_SIZE_4000 && type == CV_8UC4) declare.time(20); - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclSrc(src), oclDst(srcSize, type); @@ -229,37 +195,28 @@ PERF_TEST_P(SobelFixture, Sobel, SANITY_CHECK(dst); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { TEST_CYCLE() cv::Sobel(src, dst, -1, dx, dy); SANITY_CHECK(dst); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } ///////////// Scharr //////////////////////// -typedef BlurMatType ScharrMatType; -typedef tuple ScharrParams; -typedef TestBaseWithParam ScharrFixture; +typedef Size_MatType ScharrFixture; PERF_TEST_P(ScharrFixture, Scharr, ::testing::Combine(OCL_TYPICAL_MAT_SIZES, - ScharrMatType::all())) + OCL_PERF_ENUM(CV_8UC1, CV_8UC4))) { - // getting params - ScharrParams params = GetParam(); + const Size_MatType_t params = GetParam(); const Size srcSize = get<0>(params); const int type = get<1>(params), dx = 1, dy = 0; - const std::string impl = getSelectedImpl(); - Mat src(srcSize, type), dst(srcSize, type); declare.in(src, WARMUP_RNG).out(dst); @@ -269,7 +226,7 @@ PERF_TEST_P(ScharrFixture, Scharr, else if (srcSize == OCL_SIZE_4000 && type == CV_8UC4) declare.time(21); - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclSrc(src), oclDst(srcSize, type); @@ -279,43 +236,34 @@ PERF_TEST_P(ScharrFixture, Scharr, SANITY_CHECK(dst); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { TEST_CYCLE() cv::Scharr(src, dst, -1, dx, dy); SANITY_CHECK(dst); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } ///////////// GaussianBlur //////////////////////// -typedef ErodeMatType GaussianBlurMatType; -typedef tuple GaussianBlurParams; -typedef TestBaseWithParam GaussianBlurFixture; +typedef Size_MatType GaussianBlurFixture; PERF_TEST_P(GaussianBlurFixture, GaussianBlur, ::testing::Combine(::testing::Values(OCL_SIZE_1000, OCL_SIZE_2000), - GaussianBlurMatType::all())) + OCL_PERF_ENUM(CV_8UC1, CV_8UC4, CV_32FC1, CV_32FC4))) { - // getting params - GaussianBlurParams params = GetParam(); + const Size_MatType_t params = GetParam(); const Size srcSize = get<0>(params); const int type = get<1>(params), ksize = 7; - const std::string impl = getSelectedImpl(); - Mat src(srcSize, type), dst(srcSize, type); declare.in(src, WARMUP_RNG).out(dst); const double eps = src.depth() == CV_8U ? 1 + DBL_EPSILON : 3e-4; - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclSrc(src), oclDst(srcSize, type); @@ -325,37 +273,28 @@ PERF_TEST_P(GaussianBlurFixture, GaussianBlur, SANITY_CHECK(dst, eps); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { TEST_CYCLE() cv::GaussianBlur(src, dst, Size(ksize, ksize), 0); SANITY_CHECK(dst, eps); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } ///////////// filter2D//////////////////////// -typedef BlurMatType filter2DMatType; -typedef tuple filter2DParams; -typedef TestBaseWithParam filter2DFixture; +typedef Size_MatType filter2DFixture; PERF_TEST_P(filter2DFixture, filter2D, ::testing::Combine(OCL_TYPICAL_MAT_SIZES, - filter2DMatType::all())) + OCL_PERF_ENUM(CV_8UC1, CV_8UC4))) { - // getting params - filter2DParams params = GetParam(); + const Size_MatType_t params = GetParam(); const Size srcSize = get<0>(params); const int type = get<1>(params), ksize = 3; - const std::string impl = getSelectedImpl(); - Mat src(srcSize, type), dst(srcSize, type), kernel(ksize, ksize, CV_32SC1); declare.in(src, WARMUP_RNG).in(kernel).out(dst); randu(kernel, -3.0, 3.0); @@ -363,7 +302,7 @@ PERF_TEST_P(filter2DFixture, filter2D, if (srcSize == OCL_SIZE_4000 && type == CV_8UC4) declare.time(8); - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclSrc(src), oclDst(srcSize, type), oclKernel(kernel); @@ -373,16 +312,12 @@ PERF_TEST_P(filter2DFixture, filter2D, SANITY_CHECK(dst); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { TEST_CYCLE() cv::filter2D(src, dst, -1, kernel); SANITY_CHECK(dst); } - #ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } diff --git a/modules/ocl/perf/perf_gemm.cpp b/modules/ocl/perf/perf_gemm.cpp index 1e765e85d9..fb68b92f72 100644 --- a/modules/ocl/perf/perf_gemm.cpp +++ b/modules/ocl/perf/perf_gemm.cpp @@ -51,11 +51,9 @@ using namespace perf; typedef TestBaseWithParam gemmFixture; -PERF_TEST_P(gemmFixture, DISABLED_gemm, OCL_TYPICAL_MAT_SIZES) +PERF_TEST_P(gemmFixture, DISABLED_gemm, OCL_TYPICAL_MAT_SIZES) // TODO not implemented { - // getting params const Size srcSize = GetParam(); - const std::string impl = getSelectedImpl(); Mat src1(srcSize, CV_32FC1), src2(srcSize, CV_32FC1), src3(srcSize, CV_32FC1), dst(srcSize, CV_32FC1); @@ -64,7 +62,7 @@ PERF_TEST_P(gemmFixture, DISABLED_gemm, OCL_TYPICAL_MAT_SIZES) randu(src2, -10.0f, 10.0f); randu(src3, -10.0f, 10.0f); - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclSrc1(src1), oclSrc2(src2), oclSrc3(src3), oclDst(srcSize, CV_32FC1); @@ -75,16 +73,12 @@ PERF_TEST_P(gemmFixture, DISABLED_gemm, OCL_TYPICAL_MAT_SIZES) SANITY_CHECK(dst); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { TEST_CYCLE() cv::gemm(src1, src2, 1.0, src3, 1.0, dst); SANITY_CHECK(dst); } - #ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } diff --git a/modules/ocl/perf/perf_gftt.cpp b/modules/ocl/perf/perf_gftt.cpp index a314fc092a..7fe16c2082 100644 --- a/modules/ocl/perf/perf_gftt.cpp +++ b/modules/ocl/perf/perf_gftt.cpp @@ -60,22 +60,22 @@ PERF_TEST_P(GoodFeaturesToTrackFixture, GoodFeaturesToTrack, string("gpu/stereobm/aloe-L.png")), ::testing::Range(0.0, 4.0, 3.0))) { - std::vector pts_gold; - // getting params - GoodFeaturesToTrackParams param = GetParam(); - const string fileName = getDataPath(get<0>(param)), impl = getSelectedImpl(); + const GoodFeaturesToTrackParams param = GetParam(); + const string fileName = getDataPath(get<0>(param)); const int maxCorners = 2000; const double qualityLevel = 0.01, minDistance = get<1>(param); Mat frame = imread(fileName, IMREAD_GRAYSCALE); - declare.in(frame); ASSERT_TRUE(!frame.empty()) << "no input image"; - if (impl == "ocl") + vector pts_gold; + declare.in(frame); + + if (RUN_OCL_IMPL) { ocl::oclMat oclFrame(frame), pts_oclmat; - cv::ocl::GoodFeaturesToTrackDetector_OCL detector(maxCorners, qualityLevel, minDistance); + ocl::GoodFeaturesToTrackDetector_OCL detector(maxCorners, qualityLevel, minDistance); TEST_CYCLE() detector(oclFrame, pts_oclmat); @@ -83,17 +83,13 @@ PERF_TEST_P(GoodFeaturesToTrackFixture, GoodFeaturesToTrack, SANITY_CHECK(pts_gold); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { TEST_CYCLE() cv::goodFeaturesToTrack(frame, pts_gold, maxCorners, qualityLevel, minDistance); SANITY_CHECK(pts_gold); } - #ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } diff --git a/modules/ocl/perf/perf_haar.cpp b/modules/ocl/perf/perf_haar.cpp index 38917a0704..eac2b516fd 100644 --- a/modules/ocl/perf/perf_haar.cpp +++ b/modules/ocl/perf/perf_haar.cpp @@ -88,14 +88,13 @@ public: PERF_TEST(HaarFixture, Haar) { - const std::string impl = getSelectedImpl(); vector faces; Mat img = imread(getDataPath("gpu/haarcascade/basketball1.png"), CV_LOAD_IMAGE_GRAYSCALE); ASSERT_TRUE(!img.empty()) << "can't open basketball1.png"; declare.in(img); - if (impl == "plain") + if (RUN_PLAIN_IMPL) { CascadeClassifier faceCascade; ASSERT_TRUE(faceCascade.load(getDataPath("gpu/haarcascade/haarcascade_frontalface_alt.xml"))) @@ -106,7 +105,7 @@ PERF_TEST(HaarFixture, Haar) SANITY_CHECK(faces, 4 + 1e-4); } - else if (impl == "ocl") + else if (RUN_OCL_IMPL) { ocl::CascadeClassifier_GPU faceCascade; ocl::oclMat oclImg(img); @@ -119,11 +118,6 @@ PERF_TEST(HaarFixture, Haar) SANITY_CHECK(faces, 4 + 1e-4); } - -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } diff --git a/modules/ocl/perf/perf_hog.cpp b/modules/ocl/perf/perf_hog.cpp index 9f0dab9045..2288215f48 100644 --- a/modules/ocl/perf/perf_hog.cpp +++ b/modules/ocl/perf/perf_hog.cpp @@ -54,22 +54,21 @@ PERF_TEST(HOGFixture, HOG) Mat src = imread(getDataPath("gpu/hog/road.png"), cv::IMREAD_GRAYSCALE); ASSERT_TRUE(!src.empty()) << "can't open input image road.png"; - const std::string impl = getSelectedImpl(); - std::vector found_locations; + vector found_locations; declare.in(src).time(5); - if (impl == "plain") + if (RUN_PLAIN_IMPL) { - cv::HOGDescriptor hog; + HOGDescriptor hog; hog.setSVMDetector(hog.getDefaultPeopleDetector()); TEST_CYCLE() hog.detectMultiScale(src, found_locations); SANITY_CHECK(found_locations, 1 + DBL_EPSILON); } - else if (impl == "ocl") + else if (RUN_OCL_IMPL) { - cv::ocl::HOGDescriptor ocl_hog; + ocl::HOGDescriptor ocl_hog; ocl_hog.setSVMDetector(ocl_hog.getDefaultPeopleDetector()); ocl::oclMat oclSrc(src); @@ -77,10 +76,6 @@ PERF_TEST(HOGFixture, HOG) SANITY_CHECK(found_locations, 1 + DBL_EPSILON); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } diff --git a/modules/ocl/perf/perf_imgproc.cpp b/modules/ocl/perf/perf_imgproc.cpp index b33307818f..f530e2602b 100644 --- a/modules/ocl/perf/perf_imgproc.cpp +++ b/modules/ocl/perf/perf_imgproc.cpp @@ -55,16 +55,12 @@ typedef TestBaseWithParam equalizeHistFixture; PERF_TEST_P(equalizeHistFixture, equalizeHist, OCL_TYPICAL_MAT_SIZES) { - // getting params const Size srcSize = GetParam(); - const string impl = getSelectedImpl(); - // creating src data Mat src(srcSize, CV_8UC1), dst(srcSize, CV_8UC1); declare.in(src, WARMUP_RNG).out(dst); - // select implementation - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclSrc(src), oclDst(srcSize, src.type()); @@ -74,45 +70,34 @@ PERF_TEST_P(equalizeHistFixture, equalizeHist, OCL_TYPICAL_MAT_SIZES) SANITY_CHECK(dst, 1 + DBL_EPSILON); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { TEST_CYCLE() cv::equalizeHist(src, dst); SANITY_CHECK(dst, 1 + DBL_EPSILON); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } /////////// CopyMakeBorder ////////////////////// -CV_ENUM(CopyMakeBorderMatType, CV_8UC1, CV_8UC4) - -typedef tuple CopyMakeBorderParams; -typedef TestBaseWithParam CopyMakeBorderFixture; +typedef Size_MatType CopyMakeBorderFixture; PERF_TEST_P(CopyMakeBorderFixture, CopyMakeBorder, ::testing::Combine(OCL_TYPICAL_MAT_SIZES, - CopyMakeBorderMatType::all())) + OCL_PERF_ENUM(CV_8UC1, CV_8UC4))) { - // getting params - CopyMakeBorderParams params = GetParam(); + const Size_MatType_t params = GetParam(); const Size srcSize = get<0>(params); const int type = get<1>(params), borderType = BORDER_CONSTANT; - const string impl = getSelectedImpl(); - // creating src data Mat src(srcSize, type), dst; const Size dstSize = srcSize + Size(12, 12); dst.create(dstSize, type); declare.in(src, WARMUP_RNG).out(dst); - // select implementation - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclSrc(src), oclDst(dstSize, type); @@ -122,40 +107,29 @@ PERF_TEST_P(CopyMakeBorderFixture, CopyMakeBorder, SANITY_CHECK(dst); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { TEST_CYCLE() cv::copyMakeBorder(src, dst, 7, 5, 5, 7, borderType, cv::Scalar(1.0)); SANITY_CHECK(dst); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } ///////////// cornerMinEigenVal //////////////////////// -CV_ENUM(cornerMinEigenValMatType, CV_8UC1, CV_32FC1) - -typedef tuple cornerMinEigenValParams; -typedef TestBaseWithParam cornerMinEigenValFixture; +typedef Size_MatType cornerMinEigenValFixture; PERF_TEST_P(cornerMinEigenValFixture, cornerMinEigenVal, ::testing::Combine(OCL_TYPICAL_MAT_SIZES, - cornerMinEigenValMatType::all())) + OCL_PERF_ENUM(CV_8UC1, CV_32FC1))) { - // getting params - cornerMinEigenValParams params = GetParam(); + const Size_MatType_t params = GetParam(); const Size srcSize = get<0>(params); const int type = get<1>(params), borderType = BORDER_REFLECT; const int blockSize = 7, apertureSize = 1 + 2 * 3; - const string impl = getSelectedImpl(); - - // creating src data Mat src(srcSize, type), dst(srcSize, CV_32FC1); declare.in(src, WARMUP_RNG).out(dst) .time(srcSize == OCL_SIZE_4000 ? 20 : srcSize == OCL_SIZE_2000 ? 5 : 3); @@ -163,8 +137,7 @@ PERF_TEST_P(cornerMinEigenValFixture, cornerMinEigenVal, const int depth = CV_MAT_DEPTH(type); const ERROR_TYPE errorType = depth == CV_8U ? ERROR_ABSOLUTE : ERROR_RELATIVE; - // select implementation - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclSrc(src), oclDst(srcSize, CV_32FC1); @@ -174,45 +147,34 @@ PERF_TEST_P(cornerMinEigenValFixture, cornerMinEigenVal, SANITY_CHECK(dst, 1e-6, errorType); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { TEST_CYCLE() cv::cornerMinEigenVal(src, dst, blockSize, apertureSize, borderType); SANITY_CHECK(dst, 1e-6, errorType); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } ///////////// cornerHarris //////////////////////// -typedef cornerMinEigenValMatType cornerHarrisMatType; -typedef tuple cornerHarrisParams; -typedef TestBaseWithParam cornerHarrisFixture; +typedef Size_MatType cornerHarrisFixture; PERF_TEST_P(cornerHarrisFixture, cornerHarris, ::testing::Combine(OCL_TYPICAL_MAT_SIZES, - cornerHarrisMatType::all())) + OCL_PERF_ENUM(CV_8UC1, CV_32FC1))) { - // getting params - cornerHarrisParams params = GetParam(); + const Size_MatType_t params = GetParam(); const Size srcSize = get<0>(params); const int type = get<1>(params), borderType = BORDER_REFLECT; - const string impl = getSelectedImpl(); - - // creating src data Mat src(srcSize, type), dst(srcSize, CV_32FC1); randu(src, 0, 1); declare.in(src).out(dst) .time(srcSize == OCL_SIZE_4000 ? 20 : srcSize == OCL_SIZE_2000 ? 5 : 3); - // select implementation - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclSrc(src), oclDst(srcSize, CV_32FC1); @@ -222,36 +184,28 @@ PERF_TEST_P(cornerHarrisFixture, cornerHarris, SANITY_CHECK(dst, 3e-5); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { TEST_CYCLE() cv::cornerHarris(src, dst, 5, 7, 0.1, borderType); SANITY_CHECK(dst, 3e-5); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } ///////////// integral //////////////////////// typedef TestBaseWithParam integralFixture; -PERF_TEST_P(integralFixture, DISABLED_integral, OCL_TYPICAL_MAT_SIZES) +PERF_TEST_P(integralFixture, DISABLED_integral, OCL_TYPICAL_MAT_SIZES) // TODO does not work properly { - // getting params const Size srcSize = GetParam(); - const string impl = getSelectedImpl(); - // creating src data Mat src(srcSize, CV_8UC1), dst; declare.in(src, WARMUP_RNG); - // select implementation - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclSrc(src), oclDst; @@ -261,29 +215,23 @@ PERF_TEST_P(integralFixture, DISABLED_integral, OCL_TYPICAL_MAT_SIZES) SANITY_CHECK(dst); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { TEST_CYCLE() cv::integral(src, dst); SANITY_CHECK(dst); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } ///////////// WarpAffine //////////////////////// -typedef CopyMakeBorderMatType WarpAffineMatType; -typedef tuple WarpAffineParams; -typedef TestBaseWithParam WarpAffineFixture; +typedef Size_MatType WarpAffineFixture; PERF_TEST_P(WarpAffineFixture, WarpAffine, ::testing::Combine(OCL_TYPICAL_MAT_SIZES, - WarpAffineMatType::all())) + OCL_PERF_ENUM(CV_8UC1, CV_8UC4))) { static const double coeffs[2][3] = { @@ -293,18 +241,14 @@ PERF_TEST_P(WarpAffineFixture, WarpAffine, Mat M(2, 3, CV_64F, (void *)coeffs); const int interpolation = INTER_NEAREST; - // getting params - WarpAffineParams params = GetParam(); + const Size_MatType_t params = GetParam(); const Size srcSize = get<0>(params); const int type = get<1>(params); - const string impl = getSelectedImpl(); - // creating src data Mat src(srcSize, type), dst(srcSize, type); declare.in(src, WARMUP_RNG).out(dst); - // select implementation - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclSrc(src), oclDst(srcSize, type); @@ -314,29 +258,23 @@ PERF_TEST_P(WarpAffineFixture, WarpAffine, SANITY_CHECK(dst); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { TEST_CYCLE() cv::warpAffine(src, dst, M, srcSize, interpolation); SANITY_CHECK(dst); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } ///////////// WarpPerspective //////////////////////// -typedef CopyMakeBorderMatType WarpPerspectiveMatType; -typedef tuple WarpPerspectiveParams; -typedef TestBaseWithParam WarpPerspectiveFixture; +typedef Size_MatType WarpPerspectiveFixture; PERF_TEST_P(WarpPerspectiveFixture, WarpPerspective, ::testing::Combine(OCL_TYPICAL_MAT_SIZES, - WarpPerspectiveMatType::all())) + OCL_PERF_ENUM(CV_8UC1, CV_8UC4))) { static const double coeffs[3][3] = { @@ -347,19 +285,15 @@ PERF_TEST_P(WarpPerspectiveFixture, WarpPerspective, Mat M(3, 3, CV_64F, (void *)coeffs); const int interpolation = INTER_LINEAR; - // getting params - WarpPerspectiveParams params = GetParam(); + const Size_MatType_t params = GetParam(); const Size srcSize = get<0>(params); const int type = get<1>(params); - const string impl = getSelectedImpl(); - // creating src data Mat src(srcSize, type), dst(srcSize, type); declare.in(src, WARMUP_RNG).out(dst) .time(srcSize == OCL_SIZE_4000 ? 18 : srcSize == OCL_SIZE_2000 ? 5 : 2); - // select implementation - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclSrc(src), oclDst(srcSize, type); @@ -369,42 +303,34 @@ PERF_TEST_P(WarpPerspectiveFixture, WarpPerspective, SANITY_CHECK(dst); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { TEST_CYCLE() cv::warpPerspective(src, dst, M, srcSize, interpolation); SANITY_CHECK(dst); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } ///////////// resize //////////////////////// CV_ENUM(resizeInterType, INTER_NEAREST, INTER_LINEAR) -typedef CopyMakeBorderMatType resizeMatType; -typedef tuple resizeParams; +typedef tuple resizeParams; typedef TestBaseWithParam resizeFixture; PERF_TEST_P(resizeFixture, resize, ::testing::Combine(OCL_TYPICAL_MAT_SIZES, - resizeMatType::all(), + OCL_PERF_ENUM(CV_8UC1, CV_8UC4), resizeInterType::all(), ::testing::Values(0.5, 2.0))) { - // getting params - resizeParams params = GetParam(); + const resizeParams params = GetParam(); const Size srcSize = get<0>(params); const int type = get<1>(params), interType = get<2>(params); double scale = get<3>(params); - const string impl = getSelectedImpl(); - // creating src data Mat src(srcSize, type), dst; const Size dstSize(cvRound(srcSize.width * scale), cvRound(srcSize.height * scale)); dst.create(dstSize, type); @@ -412,8 +338,7 @@ PERF_TEST_P(resizeFixture, resize, if (interType == INTER_LINEAR && type == CV_8UC4 && OCL_SIZE_4000 == srcSize) declare.time(11); - // select implementation - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclSrc(src), oclDst(dstSize, type); @@ -423,18 +348,14 @@ PERF_TEST_P(resizeFixture, resize, SANITY_CHECK(dst, 1 + DBL_EPSILON); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { TEST_CYCLE() cv::resize(src, dst, Size(), scale, scale, interType); SANITY_CHECK(dst, 1 + DBL_EPSILON); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } ///////////// threshold//////////////////////// @@ -448,19 +369,15 @@ PERF_TEST_P(ThreshFixture, threshold, ::testing::Combine(OCL_TYPICAL_MAT_SIZES, ThreshType::all())) { - // getting params - ThreshParams params = GetParam(); + const ThreshParams params = GetParam(); const Size srcSize = get<0>(params); const int threshType = get<1>(params); - const string impl = getSelectedImpl(); - // creating src data Mat src(srcSize, CV_8U), dst(srcSize, CV_8U); randu(src, 0, 100); declare.in(src).out(dst); - // select implementation - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclSrc(src), oclDst(srcSize, CV_8U); @@ -470,23 +387,19 @@ PERF_TEST_P(ThreshFixture, threshold, SANITY_CHECK(dst); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { TEST_CYCLE() cv::threshold(src, dst, 50.0, 0.0, threshType); SANITY_CHECK(dst); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } ///////////// meanShiftFiltering//////////////////////// -typedef struct +typedef struct _COOR { short x; short y; @@ -681,7 +594,6 @@ PERF_TEST_P(meanShiftFilteringFixture, meanShiftFiltering, { const Size srcSize = GetParam(); const int sp = 5, sr = 6; - const string impl = getSelectedImpl(); cv::TermCriteria crit(cv::TermCriteria::COUNT + cv::TermCriteria::EPS, 5, 1); Mat src(srcSize, CV_8UC4), dst(srcSize, CV_8UC4); @@ -689,13 +601,13 @@ PERF_TEST_P(meanShiftFilteringFixture, meanShiftFiltering, .time(srcSize == OCL_SIZE_4000 ? 56 : srcSize == OCL_SIZE_2000 ? 15 : 3.8); - if (impl == "plain") + if (RUN_PLAIN_IMPL) { TEST_CYCLE() meanShiftFiltering_(src, dst, sp, sr, crit); SANITY_CHECK(dst); } - else if (impl == "ocl") + else if (RUN_OCL_IMPL) { ocl::oclMat oclSrc(src), oclDst(srcSize, CV_8UC4); @@ -705,12 +617,8 @@ PERF_TEST_P(meanShiftFilteringFixture, meanShiftFiltering, SANITY_CHECK(dst); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } static void meanShiftProc_(const Mat &src_roi, Mat &dst_roi, Mat &dstCoor_roi, int sp, int sr, cv::TermCriteria crit) @@ -778,7 +686,6 @@ PERF_TEST_P(meanShiftProcFixture, meanShiftProc, OCL_TYPICAL_MAT_SIZES) { const Size srcSize = GetParam(); - const string impl = getSelectedImpl(); TermCriteria crit(TermCriteria::COUNT + TermCriteria::EPS, 5, 1); Mat src(srcSize, CV_8UC4), dst1(srcSize, CV_8UC4), @@ -787,14 +694,14 @@ PERF_TEST_P(meanShiftProcFixture, meanShiftProc, .time(srcSize == OCL_SIZE_4000 ? 56 : srcSize == OCL_SIZE_2000 ? 15 : 3.8);; - if (impl == "plain") + if (RUN_PLAIN_IMPL) { TEST_CYCLE() meanShiftProc_(src, dst1, dst2, 5, 6, crit); SANITY_CHECK(dst1); SANITY_CHECK(dst2); } - else if (impl == "ocl") + else if (RUN_OCL_IMPL) { ocl::oclMat oclSrc(src), oclDst1(srcSize, CV_8UC4), oclDst2(srcSize, CV_16SC2); @@ -807,34 +714,26 @@ PERF_TEST_P(meanShiftProcFixture, meanShiftProc, SANITY_CHECK(dst1); SANITY_CHECK(dst2); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } ///////////// remap//////////////////////// CV_ENUM(RemapInterType, INTER_NEAREST, INTER_LINEAR) -typedef CopyMakeBorderMatType remapMatType; -typedef tuple remapParams; +typedef tuple remapParams; typedef TestBaseWithParam remapFixture; PERF_TEST_P(remapFixture, remap, ::testing::Combine(OCL_TYPICAL_MAT_SIZES, - remapMatType::all(), + OCL_PERF_ENUM(CV_8UC1, CV_8UC4), RemapInterType::all())) { - // getting params - remapParams params = GetParam(); + const remapParams params = GetParam(); const Size srcSize = get<0>(params); const int type = get<1>(params), interpolation = get<2>(params); - const string impl = getSelectedImpl(); - // creating src data Mat src(srcSize, type), dst(srcSize, type); declare.in(src, WARMUP_RNG).out(dst); @@ -859,8 +758,7 @@ PERF_TEST_P(remapFixture, remap, const int borderMode = BORDER_CONSTANT; - // select implementation - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclSrc(src), oclDst(srcSize, type); ocl::oclMat oclXMap(xmap), oclYMap(ymap); @@ -871,18 +769,14 @@ PERF_TEST_P(remapFixture, remap, SANITY_CHECK(dst, 1 + DBL_EPSILON); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { TEST_CYCLE() cv::remap(src, dst, xmap, ymap, interpolation, borderMode); SANITY_CHECK(dst, 1 + DBL_EPSILON); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } ///////////// CLAHE //////////////////////// @@ -891,11 +785,9 @@ typedef TestBaseWithParam CLAHEFixture; PERF_TEST_P(CLAHEFixture, CLAHE, OCL_TYPICAL_MAT_SIZES) { - // getting params const Size srcSize = GetParam(); const string impl = getSelectedImpl(); - // creating src data Mat src(srcSize, CV_8UC1), dst; const double clipLimit = 40.0; declare.in(src, WARMUP_RNG); @@ -903,8 +795,7 @@ PERF_TEST_P(CLAHEFixture, CLAHE, OCL_TYPICAL_MAT_SIZES) if (srcSize == OCL_SIZE_4000) declare.time(11); - // select implementation - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclSrc(src), oclDst; cv::Ptr oclClahe = cv::ocl::createCLAHE(clipLimit); @@ -915,19 +806,15 @@ PERF_TEST_P(CLAHEFixture, CLAHE, OCL_TYPICAL_MAT_SIZES) SANITY_CHECK(dst); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { cv::Ptr clahe = cv::createCLAHE(clipLimit); TEST_CYCLE() clahe->apply(src, dst); SANITY_CHECK(dst); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } ///////////// columnSum//////////////////////// @@ -946,19 +833,15 @@ static void columnSumPerfTest(const Mat & src, Mat & dst) PERF_TEST_P(columnSumFixture, columnSum, OCL_TYPICAL_MAT_SIZES) { - // getting params const Size srcSize = GetParam(); - const string impl = getSelectedImpl(); - // creating src data Mat src(srcSize, CV_32FC1), dst(srcSize, CV_32FC1); declare.in(src, WARMUP_RNG).out(dst); if (srcSize == OCL_SIZE_4000) declare.time(5); - // select implementation - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclSrc(src), oclDst(srcSize, CV_32FC1); @@ -968,16 +851,12 @@ PERF_TEST_P(columnSumFixture, columnSum, OCL_TYPICAL_MAT_SIZES) SANITY_CHECK(dst); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { TEST_CYCLE() columnSumPerfTest(src, dst); SANITY_CHECK(dst); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } diff --git a/modules/ocl/perf/perf_match_template.cpp b/modules/ocl/perf/perf_match_template.cpp index a1c7caf738..2cf06a4d76 100644 --- a/modules/ocl/perf/perf_match_template.cpp +++ b/modules/ocl/perf/perf_match_template.cpp @@ -51,23 +51,16 @@ using std::tr1::get; /////////// matchTemplate //////////////////////// -CV_ENUM(CV_TM_CCORRMatType, CV_32FC1, CV_32FC4) - -typedef tuple CV_TM_CCORRParams; -typedef TestBaseWithParam CV_TM_CCORRFixture; +typedef Size_MatType CV_TM_CCORRFixture; PERF_TEST_P(CV_TM_CCORRFixture, matchTemplate, ::testing::Combine(::testing::Values(OCL_SIZE_1000, OCL_SIZE_2000), - CV_TM_CCORRMatType::all())) + OCL_PERF_ENUM(CV_32FC1, CV_32FC4))) { - // getting params - CV_TM_CCORRParams params = GetParam(); + const Size_MatType_t params = GetParam(); const Size srcSize = get<0>(params), templSize(5, 5); const int type = get<1>(params); - std::string impl = getSelectedImpl(); - - // creating src data Mat src(srcSize, type), templ(templSize, type); const Size dstSize(src.cols - templ.cols + 1, src.rows - templ.rows + 1); Mat dst(dstSize, CV_32F); @@ -75,8 +68,7 @@ PERF_TEST_P(CV_TM_CCORRFixture, matchTemplate, randu(templ, 0.0f, 1.0f); declare.time(srcSize == OCL_SIZE_2000 ? 20 : 6).in(src, templ).out(dst); - // select implementation - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclSrc(src), oclTempl(templ), oclDst(dstSize, CV_32F); @@ -86,37 +78,29 @@ PERF_TEST_P(CV_TM_CCORRFixture, matchTemplate, SANITY_CHECK(dst, 1e-4); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { TEST_CYCLE() cv::matchTemplate(src, templ, dst, CV_TM_CCORR); SANITY_CHECK(dst, 1e-4); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } typedef TestBaseWithParam CV_TM_CCORR_NORMEDFixture; PERF_TEST_P(CV_TM_CCORR_NORMEDFixture, matchTemplate, OCL_TYPICAL_MAT_SIZES) { - // getting params const Size srcSize = GetParam(), templSize(5, 5); - const std::string impl = getSelectedImpl(); - // creating src data Mat src(srcSize, CV_8UC1), templ(templSize, CV_8UC1), dst; const Size dstSize(src.cols - templ.cols + 1, src.rows - templ.rows + 1); dst.create(dstSize, CV_8UC1); declare.in(src, templ, WARMUP_RNG).out(dst) .time(srcSize == OCL_SIZE_2000 ? 10 : srcSize == OCL_SIZE_4000 ? 23 : 2); - // select implementation - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclSrc(src), oclTempl(templ), oclDst(dstSize, CV_8UC1); @@ -126,16 +110,12 @@ PERF_TEST_P(CV_TM_CCORR_NORMEDFixture, matchTemplate, OCL_TYPICAL_MAT_SIZES) SANITY_CHECK(dst, 2e-2); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { TEST_CYCLE() cv::matchTemplate(src, templ, dst, CV_TM_CCORR_NORMED); SANITY_CHECK(dst, 2e-2); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } diff --git a/modules/ocl/perf/perf_matrix_operation.cpp b/modules/ocl/perf/perf_matrix_operation.cpp index dc3e15495a..1fe4616ac3 100644 --- a/modules/ocl/perf/perf_matrix_operation.cpp +++ b/modules/ocl/perf/perf_matrix_operation.cpp @@ -51,30 +51,22 @@ using std::tr1::get; ///////////// ConvertTo//////////////////////// -CV_ENUM(ConvertToMatType, CV_8UC1, CV_8UC4) - -typedef tuple ConvertToParams; -typedef TestBaseWithParam ConvertToFixture; +typedef Size_MatType ConvertToFixture; PERF_TEST_P(ConvertToFixture, ConvertTo, ::testing::Combine(OCL_TYPICAL_MAT_SIZES, - ConvertToMatType::all())) + OCL_PERF_ENUM(CV_8UC1, CV_8UC4))) { - // getting params - ConvertToParams params = GetParam(); + const Size_MatType_t params = GetParam(); const Size srcSize = get<0>(params); const int type = get<1>(params); - std::string impl = getSelectedImpl(); - - // creating src data Mat src(srcSize, type), dst; const int dstType = CV_MAKE_TYPE(CV_32F, src.channels()); dst.create(srcSize, dstType); declare.in(src, WARMUP_RNG).out(dst); - // select implementation - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclSrc(src), oclDst(srcSize, dstType); @@ -84,43 +76,32 @@ PERF_TEST_P(ConvertToFixture, ConvertTo, SANITY_CHECK(dst); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { TEST_CYCLE() src.convertTo(dst, dstType); SANITY_CHECK(dst); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } ///////////// copyTo//////////////////////// -typedef ConvertToMatType copyToMatType; -typedef tuple copyToParams; -typedef TestBaseWithParam copyToFixture; +typedef Size_MatType copyToFixture; PERF_TEST_P(copyToFixture, copyTo, ::testing::Combine(OCL_TYPICAL_MAT_SIZES, - copyToMatType::all())) + OCL_PERF_ENUM(CV_8UC1, CV_8UC4))) { - // getting params - copyToParams params = GetParam(); + const Size_MatType_t params = GetParam(); const Size srcSize = get<0>(params); const int type = get<1>(params); - std::string impl = getSelectedImpl(); - - // creating src data Mat src(srcSize, type), dst(srcSize, type); declare.in(src, WARMUP_RNG).out(dst); - // select implementation - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclSrc(src), oclDst(srcSize, type); @@ -130,44 +111,33 @@ PERF_TEST_P(copyToFixture, copyTo, SANITY_CHECK(dst); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { TEST_CYCLE() src.copyTo(dst); SANITY_CHECK(dst); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } ///////////// setTo//////////////////////// -typedef ConvertToMatType setToMatType; -typedef tuple setToParams; -typedef TestBaseWithParam setToFixture; +typedef Size_MatType setToFixture; PERF_TEST_P(setToFixture, setTo, ::testing::Combine(OCL_TYPICAL_MAT_SIZES, - setToMatType::all())) + OCL_PERF_ENUM(CV_8UC1, CV_8UC4))) { - // getting params - setToParams params = GetParam(); + const Size_MatType_t params = GetParam(); const Size srcSize = get<0>(params); const int type = get<1>(params); const Scalar val(1, 2, 3, 4); - std::string impl = getSelectedImpl(); - - // creating src data Mat src(srcSize, type); declare.in(src); - // select implementation - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclSrc(srcSize, type); @@ -176,16 +146,12 @@ PERF_TEST_P(setToFixture, setTo, SANITY_CHECK(src); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { TEST_CYCLE() src.setTo(val); SANITY_CHECK(src); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } diff --git a/modules/ocl/perf/perf_moments.cpp b/modules/ocl/perf/perf_moments.cpp index 59452d4fb0..200a27db82 100644 --- a/modules/ocl/perf/perf_moments.cpp +++ b/modules/ocl/perf/perf_moments.cpp @@ -52,50 +52,38 @@ using std::tr1::get; ///////////// Moments //////////////////////// -CV_ENUM(MomentsMatType, CV_8UC1, CV_16SC1, CV_32FC1, CV_64FC1) - -typedef tuple MomentsParams; -typedef TestBaseWithParam MomentsFixture; +typedef Size_MatType MomentsFixture; PERF_TEST_P(MomentsFixture, DISABLED_Moments, ::testing::Combine(OCL_TYPICAL_MAT_SIZES, - MomentsMatType::all())) + OCL_PERF_ENUM(CV_8UC1, CV_16SC1, CV_32FC1, CV_64FC1))) // TODO does not work properly (see below) { - // getting params - MomentsParams params = GetParam(); + const Size_MatType_t params = GetParam(); const Size srcSize = get<0>(params); const int type = get<1>(params); - std::string impl = getSelectedImpl(); - - // creating src data Mat src(srcSize, type), dst(7, 1, CV_64F); const bool binaryImage = false; cv::Moments mom; declare.in(src, WARMUP_RNG).out(dst); - // select implementation - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclSrc(src); - TEST_CYCLE() mom = cv::ocl::ocl_moments(oclSrc, binaryImage); + TEST_CYCLE() mom = cv::ocl::ocl_moments(oclSrc, binaryImage); // TODO Use oclSrc cv::HuMoments(mom, dst); SANITY_CHECK(dst); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { TEST_CYCLE() mom = cv::moments(src, binaryImage); cv::HuMoments(mom, dst); SANITY_CHECK(dst); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } diff --git a/modules/ocl/perf/perf_norm.cpp b/modules/ocl/perf/perf_norm.cpp index b0e18facdf..736645d904 100644 --- a/modules/ocl/perf/perf_norm.cpp +++ b/modules/ocl/perf/perf_norm.cpp @@ -53,21 +53,18 @@ using std::tr1::get; typedef TestBaseWithParam normFixture; -PERF_TEST_P(normFixture, DISABLED_norm, OCL_TYPICAL_MAT_SIZES) +PERF_TEST_P(normFixture, DISABLED_norm, OCL_TYPICAL_MAT_SIZES) // TODO doesn't work properly { - // getting params const Size srcSize = GetParam(); const std::string impl = getSelectedImpl(); double value = 0.0; - // creating src data Mat src1(srcSize, CV_8UC1), src2(srcSize, CV_8UC1); declare.in(src1, src2); randu(src1, 0, 1); randu(src2, 0, 1); - // select implementation - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclSrc1(src1), oclSrc2(src2); @@ -75,16 +72,12 @@ PERF_TEST_P(normFixture, DISABLED_norm, OCL_TYPICAL_MAT_SIZES) SANITY_CHECK(value); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { TEST_CYCLE() value = cv::norm(src1, src2, NORM_INF); SANITY_CHECK(value); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } diff --git a/modules/ocl/perf/perf_opticalflow.cpp b/modules/ocl/perf/perf_opticalflow.cpp index 2f0626750c..34651d1af8 100644 --- a/modules/ocl/perf/perf_opticalflow.cpp +++ b/modules/ocl/perf/perf_opticalflow.cpp @@ -70,25 +70,25 @@ typedef tuple > PyrLKOpticalFlowParamType; typedef TestBaseWithParam PyrLKOpticalFlowFixture; PERF_TEST_P(PyrLKOpticalFlowFixture, - PyrLKOpticalFlow, + DISABLED_PyrLKOpticalFlow, ::testing::Combine( ::testing::Values(1000, 2000, 4000), ::testing::Values( make_tuple ( string("gpu/opticalflow/rubberwhale1.png"), - string("gpu/opticalflow/rubberwhale1.png"), + string("gpu/opticalflow/rubberwhale2.png"), LoadMode(IMREAD_COLOR) ) -// , make_tuple -// ( -// string("gpu/stereobm/aloe-L.png"), -// string("gpu/stereobm/aloe-R.png"), -// LoadMode(IMREAD_GRAYSCALE) -// ) + , make_tuple + ( + string("gpu/stereobm/aloe-L.png"), + string("gpu/stereobm/aloe-R.png"), + LoadMode(IMREAD_GRAYSCALE) + ) ) ) - ) + ) // TODO to big difference between implementations { PyrLKOpticalFlowParamType params = GetParam(); tuple fileParam = get<1>(params); @@ -97,7 +97,6 @@ PERF_TEST_P(PyrLKOpticalFlowFixture, const string fileName0 = get<0>(fileParam), fileName1 = get<1>(fileParam); Mat frame0 = imread(getDataPath(fileName0), openMode); Mat frame1 = imread(getDataPath(fileName1), openMode); - const string impl = getSelectedImpl(); ASSERT_FALSE(frame0.empty()) << "can't load " << fileName0; ASSERT_FALSE(frame1.empty()) << "can't load " << fileName1; @@ -108,14 +107,12 @@ PERF_TEST_P(PyrLKOpticalFlowFixture, else grayFrame = frame0; - // initialization vector pts, nextPts; vector status; vector err; goodFeaturesToTrack(grayFrame, pts, pointsCount, 0.01, 0.0); - // selecting implementation - if (impl == "plain") + if (RUN_PLAIN_IMPL) { TEST_CYCLE() cv::calcOpticalFlowPyrLK(frame0, frame1, pts, nextPts, status, err); @@ -124,7 +121,7 @@ PERF_TEST_P(PyrLKOpticalFlowFixture, SANITY_CHECK(status); SANITY_CHECK(err); } - else if (impl == "ocl") + else if (RUN_OCL_IMPL) { ocl::PyrLKOpticalFlow oclPyrLK; ocl::oclMat oclFrame0(frame0), oclFrame1(frame1); @@ -142,228 +139,135 @@ PERF_TEST_P(PyrLKOpticalFlowFixture, SANITY_CHECK(status); SANITY_CHECK(err); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); - -// size_t mismatch = 0; -// for (int i = 0; i < (int)nextPts.size(); ++i) -// { -// if(status[i] != ocl_status.at(0, i)) -// { -// mismatch++; -// continue; -// } -// if(status[i]) -// { -// Point2f gpu_rst = ocl_nextPts.at(0, i); -// Point2f cpu_rst = nextPts[i]; -// if(fabs(gpu_rst.x - cpu_rst.x) >= 1. || fabs(gpu_rst.y - cpu_rst.y) >= 1.) -// mismatch++; -// } -// } -// double ratio = (double)mismatch / (double)nextPts.size(); -// if(ratio < .02) -// TestSystem::instance().setAccurate(1, ratio); -// else -// TestSystem::instance().setAccurate(0, ratio); + OCL_PERF_ELSE } - -PERFTEST(tvl1flow) +PERF_TEST(tvl1flowFixture, tvl1flow) { - cv::Mat frame0 = imread("rubberwhale1.png", cv::IMREAD_GRAYSCALE); - assert(!frame0.empty()); + Mat frame0 = imread(getDataPath("gpu/opticalflow/rubberwhale1.png"), cv::IMREAD_GRAYSCALE); + ASSERT_FALSE(frame0.empty()) << "can't load rubberwhale1.png"; - cv::Mat frame1 = imread("rubberwhale2.png", cv::IMREAD_GRAYSCALE); - assert(!frame1.empty()); + Mat frame1 = imread(getDataPath("gpu/opticalflow/rubberwhale2.png"), cv::IMREAD_GRAYSCALE); + ASSERT_FALSE(frame1.empty()) << "can't load rubberwhale2.png"; - cv::ocl::OpticalFlowDual_TVL1_OCL d_alg; - cv::ocl::oclMat d_flowx(frame0.size(), CV_32FC1); - cv::ocl::oclMat d_flowy(frame1.size(), CV_32FC1); + const Size srcSize = frame0.size(); + const double eps = 1.2; + Mat flow(srcSize, CV_32FC2), flow1(srcSize, CV_32FC1), flow2(srcSize, CV_32FC1); + declare.in(frame0, frame1).out(flow1, flow2).time(159); - cv::Ptr alg = cv::createOptFlow_DualTVL1(); - cv::Mat flow; + if (RUN_PLAIN_IMPL) + { + Ptr alg = createOptFlow_DualTVL1(); + TEST_CYCLE() alg->calc(frame0, frame1, flow); - SUBTEST << frame0.cols << 'x' << frame0.rows << "; rubberwhale1.png; "<collectGarbage(); + Mat flows[2] = { flow1, flow2 }; + split(flow, flows); - alg->calc(frame0, frame1, flow); + SANITY_CHECK(flow1, eps); + SANITY_CHECK(flow2, eps); + } + else if (RUN_OCL_IMPL) + { + ocl::OpticalFlowDual_TVL1_OCL oclAlg; + ocl::oclMat oclFrame0(frame0), oclFrame1(frame1), oclFlow1(srcSize, CV_32FC1), + oclFlow2(srcSize, CV_32FC1); - CPU_ON; - alg->calc(frame0, frame1, flow); - CPU_OFF; + TEST_CYCLE() oclAlg(oclFrame0, oclFrame1, oclFlow1, oclFlow2); - cv::Mat gold[2]; - cv::split(flow, gold); + oclAlg.collectGarbage(); - cv::ocl::oclMat d0(frame0.size(), CV_32FC1); - d0.upload(frame0); - cv::ocl::oclMat d1(frame1.size(), CV_32FC1); - d1.upload(frame1); + oclFlow1.download(flow1); + oclFlow2.download(flow2); - WARMUP_ON; - d_alg(d0, d1, d_flowx, d_flowy); - WARMUP_OFF; - /* - double diff1 = 0.0, diff2 = 0.0; - if(ExceptedMatSimilar(gold[0], cv::Mat(d_flowx), 3e-3, diff1) == 1 - &&ExceptedMatSimilar(gold[1], cv::Mat(d_flowy), 3e-3, diff2) == 1) - TestSystem::instance().setAccurate(1); - else - TestSystem::instance().setAccurate(0); + SANITY_CHECK(flow1, eps); + SANITY_CHECK(flow2, eps); + } + else + OCL_PERF_ELSE +} - TestSystem::instance().setDiff(diff1); - TestSystem::instance().setDiff(diff2); - */ +///////////// FarnebackOpticalFlow //////////////////////// +CV_ENUM(farneFlagType, 0, OPTFLOW_FARNEBACK_GAUSSIAN) - GPU_ON; - d_alg(d0, d1, d_flowx, d_flowy); - d_alg.collectGarbage(); - GPU_OFF; +typedef tuple, farneFlagType, bool> FarnebackOpticalFlowParams; +typedef TestBaseWithParam FarnebackOpticalFlowFixture; +PERF_TEST_P(FarnebackOpticalFlowFixture, FarnebackOpticalFlow, + ::testing::Combine( + ::testing::Values(make_tuple(5, 1.1), + make_tuple(7, 1.5)), + farneFlagType::all(), + ::testing::Bool())) +{ + Mat frame0 = imread(getDataPath("gpu/opticalflow/rubberwhale1.png"), cv::IMREAD_GRAYSCALE); + ASSERT_FALSE(frame0.empty()) << "can't load rubberwhale1.png"; - cv::Mat flowx, flowy; + Mat frame1 = imread(getDataPath("gpu/opticalflow/rubberwhale2.png"), cv::IMREAD_GRAYSCALE); + ASSERT_FALSE(frame1.empty()) << "can't load rubberwhale2.png"; - GPU_FULL_ON; - d0.upload(frame0); - d1.upload(frame1); - d_alg(d0, d1, d_flowx, d_flowy); - d_alg.collectGarbage(); - d_flowx.download(flowx); - d_flowy.download(flowy); - GPU_FULL_OFF; + const Size srcSize = frame0.size(); - TestSystem::instance().ExceptedMatSimilar(gold[0], flowx, 3e-3); - TestSystem::instance().ExceptedMatSimilar(gold[1], flowy, 3e-3); -} + const FarnebackOpticalFlowParams params = GetParam(); + const tuple polyParams = get<0>(params); + const int polyN = get<0>(polyParams), flags = get<1>(params); + const double polySigma = get<1>(polyParams), pyrScale = 0.5; + const bool useInitFlow = get<2>(params); + const double eps = 1.5; -///////////// FarnebackOpticalFlow //////////////////////// -PERFTEST(FarnebackOpticalFlow) -{ - cv::Mat frame0 = imread("rubberwhale1.png", cv::IMREAD_GRAYSCALE); - ASSERT_FALSE(frame0.empty()); + Mat flowx(srcSize, CV_32FC1), flowy(srcSize, CV_32FC1), flow(srcSize, CV_32FC2); + declare.in(frame0, frame1).out(flowx, flowy); - cv::Mat frame1 = imread("rubberwhale2.png", cv::IMREAD_GRAYSCALE); - ASSERT_FALSE(frame1.empty()); + ocl::FarnebackOpticalFlow farn; + farn.pyrScale = pyrScale; + farn.polyN = polyN; + farn.polySigma = polySigma; + farn.flags = flags; - cv::ocl::oclMat d_frame0(frame0), d_frame1(frame1); + if (RUN_PLAIN_IMPL) + { + if (useInitFlow) + { + calcOpticalFlowFarneback( + frame0, frame1, flow, farn.pyrScale, farn.numLevels, farn.winSize, + farn.numIters, farn.polyN, farn.polySigma, farn.flags); + farn.flags |= OPTFLOW_USE_INITIAL_FLOW; + } - int polyNs[2] = { 5, 7 }; - double polySigmas[2] = { 1.1, 1.5 }; - int farneFlags[2] = { 0, cv::OPTFLOW_FARNEBACK_GAUSSIAN }; - bool UseInitFlows[2] = { false, true }; - double pyrScale = 0.5; + TEST_CYCLE() + calcOpticalFlowFarneback( + frame0, frame1, flow, farn.pyrScale, farn.numLevels, farn.winSize, + farn.numIters, farn.polyN, farn.polySigma, farn.flags); - string farneFlagStrs[2] = { "BoxFilter", "GaussianBlur" }; - string useInitFlowStrs[2] = { "", "UseInitFlow" }; + Mat flowxy[2] = { flowx, flowy }; + split(flow, flowxy); - for ( int i = 0; i < 2; ++i) + SANITY_CHECK(flowx, eps); + SANITY_CHECK(flowy, eps); + } + else if (RUN_OCL_IMPL) { - int polyN = polyNs[i]; - double polySigma = polySigmas[i]; + ocl::oclMat oclFrame0(frame0), oclFrame1(frame1), + oclFlowx(srcSize, CV_32FC1), oclFlowy(srcSize, CV_32FC1); - for ( int j = 0; j < 2; ++j) + if (useInitFlow) { - int flags = farneFlags[j]; - - for ( int k = 0; k < 2; ++k) - { - bool useInitFlow = UseInitFlows[k]; - SUBTEST << "polyN(" << polyN << "); " << farneFlagStrs[j] << "; " << useInitFlowStrs[k]; - - cv::ocl::FarnebackOpticalFlow farn; - farn.pyrScale = pyrScale; - farn.polyN = polyN; - farn.polySigma = polySigma; - farn.flags = flags; - - cv::ocl::oclMat d_flowx, d_flowy; - cv::Mat flow, flowBuf, flowxBuf, flowyBuf; - - WARMUP_ON; - farn(d_frame0, d_frame1, d_flowx, d_flowy); - - if (useInitFlow) - { - cv::Mat flowxy[] = {cv::Mat(d_flowx), cv::Mat(d_flowy)}; - cv::merge(flowxy, 2, flow); - flow.copyTo(flowBuf); - flowxy[0].copyTo(flowxBuf); - flowxy[1].copyTo(flowyBuf); - - farn.flags |= cv::OPTFLOW_USE_INITIAL_FLOW; - farn(d_frame0, d_frame1, d_flowx, d_flowy); - } - WARMUP_OFF; - - cv::calcOpticalFlowFarneback( - frame0, frame1, flow, farn.pyrScale, farn.numLevels, farn.winSize, - farn.numIters, farn.polyN, farn.polySigma, farn.flags); - - std::vector flowxy; - cv::split(flow, flowxy); + farn(oclFrame0, oclFrame1, oclFlowx, oclFlowy); + farn.flags |= OPTFLOW_USE_INITIAL_FLOW; + } - Mat md_flowx = cv::Mat(d_flowx); - Mat md_flowy = cv::Mat(d_flowy); - TestSystem::instance().ExceptedMatSimilar(flowxy[0], md_flowx, 0.1); - TestSystem::instance().ExceptedMatSimilar(flowxy[1], md_flowy, 0.1); + TEST_CYCLE() + farn(oclFrame0, oclFrame1, oclFlowx, oclFlowy); - if (useInitFlow) - { - cv::Mat flowx, flowy; - farn.flags = (flags | cv::OPTFLOW_USE_INITIAL_FLOW); + oclFlowx.download(flowx); + oclFlowy.download(flowy); - CPU_ON; - cv::calcOpticalFlowFarneback( - frame0, frame1, flowBuf, farn.pyrScale, farn.numLevels, farn.winSize, - farn.numIters, farn.polyN, farn.polySigma, farn.flags); - CPU_OFF; - - GPU_ON; - farn(d_frame0, d_frame1, d_flowx, d_flowy); - GPU_OFF; - - GPU_FULL_ON; - d_frame0.upload(frame0); - d_frame1.upload(frame1); - d_flowx.upload(flowxBuf); - d_flowy.upload(flowyBuf); - farn(d_frame0, d_frame1, d_flowx, d_flowy); - d_flowx.download(flowx); - d_flowy.download(flowy); - GPU_FULL_OFF; - } - else - { - cv::Mat flow, flowx, flowy; - cv::ocl::oclMat d_flowx, d_flowy; - - farn.flags = flags; - - CPU_ON; - cv::calcOpticalFlowFarneback( - frame0, frame1, flow, farn.pyrScale, farn.numLevels, farn.winSize, - farn.numIters, farn.polyN, farn.polySigma, farn.flags); - CPU_OFF; - - GPU_ON; - farn(d_frame0, d_frame1, d_flowx, d_flowy); - GPU_OFF; - - GPU_FULL_ON; - d_frame0.upload(frame0); - d_frame1.upload(frame1); - farn(d_frame0, d_frame1, d_flowx, d_flowy); - d_flowx.download(flowx); - d_flowy.download(flowy); - GPU_FULL_OFF; - } - } - } + SANITY_CHECK(flowx, eps); + SANITY_CHECK(flowy, eps); } + else + OCL_PERF_ELSE } diff --git a/modules/ocl/perf/perf_precomp.cpp b/modules/ocl/perf/perf_precomp.cpp index c5679a429f..74f3f0f33c 100644 --- a/modules/ocl/perf/perf_precomp.cpp +++ b/modules/ocl/perf/perf_precomp.cpp @@ -41,452 +41,3 @@ //M*/ #include "perf_precomp.hpp" -#if GTEST_OS_WINDOWS -#ifndef NOMINMAX -#define NOMINMAX -#endif -# include -#endif - -// This program test most of the functions in ocl module and generate data metrix of x-factor in .csv files -// All images needed in this test are in samples/gpu folder. -// For haar template, haarcascade_frontalface_alt.xml shouold be in working directory -void TestSystem::run() -{ - if (is_list_mode_) - { - for (vector::iterator it = tests_.begin(); it != tests_.end(); ++it) - { - cout << (*it)->name() << endl; - } - - return; - } - - // Run test initializers - for (vector::iterator it = inits_.begin(); it != inits_.end(); ++it) - { - if ((*it)->name().find(test_filter_, 0) != string::npos) - { - (*it)->run(); - } - } - - printHeading(); - writeHeading(); - - // Run tests - for (vector::iterator it = tests_.begin(); it != tests_.end(); ++it) - { - try - { - if ((*it)->name().find(test_filter_, 0) != string::npos) - { - cout << endl << (*it)->name() << ":\n"; - - setCurrentTest((*it)->name()); - //fprintf(record_,"%s\n",(*it)->name().c_str()); - - (*it)->run(); - finishCurrentSubtest(); - } - } - catch (const Exception &) - { - // Message is printed via callback - resetCurrentSubtest(); - } - catch (const runtime_error &e) - { - printError(e.what()); - resetCurrentSubtest(); - } - } - - printSummary(); - writeSummary(); -} - - -void TestSystem::finishCurrentSubtest() -{ - if (cur_subtest_is_empty_) - // There is no need to print subtest statistics - { - return; - } - - double cpu_time = cpu_elapsed_ / getTickFrequency() * 1000.0; - double gpu_time = gpu_elapsed_ / getTickFrequency() * 1000.0; - double gpu_full_time = gpu_full_elapsed_ / getTickFrequency() * 1000.0; - - double speedup = static_cast(cpu_elapsed_) / std::max(1.0, gpu_elapsed_); - speedup_total_ += speedup; - - double fullspeedup = static_cast(cpu_elapsed_) / std::max(1.0, gpu_full_elapsed_); - speedup_full_total_ += fullspeedup; - - if (speedup > top_) - { - speedup_faster_count_++; - } - else if (speedup < bottom_) - { - speedup_slower_count_++; - } - else - { - speedup_equal_count_++; - } - - if (fullspeedup > top_) - { - speedup_full_faster_count_++; - } - else if (fullspeedup < bottom_) - { - speedup_full_slower_count_++; - } - else - { - speedup_full_equal_count_++; - } - - // compute min, max and - std::sort(gpu_times_.begin(), gpu_times_.end()); - double gpu_min = gpu_times_.front() / getTickFrequency() * 1000.0; - double gpu_max = gpu_times_.back() / getTickFrequency() * 1000.0; - double deviation = 0; - - if (gpu_times_.size() > 1) - { - double sum = 0; - - for (size_t i = 0; i < gpu_times_.size(); i++) - { - int64 diff = gpu_times_[i] - static_cast(gpu_elapsed_); - double diff_time = diff * 1000 / getTickFrequency(); - sum += diff_time * diff_time; - } - - deviation = std::sqrt(sum / gpu_times_.size()); - } - - printMetrics(is_accurate_, cpu_time, gpu_time, gpu_full_time, speedup, fullspeedup); - writeMetrics(cpu_time, gpu_time, gpu_full_time, speedup, fullspeedup, gpu_min, gpu_max, deviation); - - num_subtests_called_++; - resetCurrentSubtest(); -} - - -double TestSystem::meanTime(const vector &samples) -{ - double sum = accumulate(samples.begin(), samples.end(), 0.); - return sum / samples.size(); -} - - -void TestSystem::printHeading() -{ - cout << endl; - cout<< setiosflags(ios_base::left); - -#if 0 - cout<(0, 0) - 1.f); -} diff --git a/modules/ocl/perf/perf_precomp.hpp b/modules/ocl/perf/perf_precomp.hpp index 8c13b9e73e..5e6cd2266c 100644 --- a/modules/ocl/perf/perf_precomp.hpp +++ b/modules/ocl/perf/perf_precomp.hpp @@ -42,7 +42,6 @@ #ifdef __GNUC__ # pragma GCC diagnostic ignored "-Wmissing-declarations" -# pragma GCC diagnostic ignored "-Wunused-function" # if defined __clang__ || defined __APPLE__ # pragma GCC diagnostic ignored "-Wmissing-prototypes" # pragma GCC diagnostic ignored "-Wextra" @@ -70,457 +69,37 @@ #include "opencv2/ocl/ocl.hpp" #include "opencv2/ts/ts.hpp" -#define OCL_SIZE_1000 cv::Size(1000, 1000) -#define OCL_SIZE_2000 cv::Size(2000, 2000) -#define OCL_SIZE_4000 cv::Size(4000, 4000) - -#define OCL_TYPICAL_MAT_SIZES ::testing::Values(OCL_SIZE_1000, OCL_SIZE_2000, OCL_SIZE_4000) - -#define Min_Size 1000 -#define Max_Size 4000 -#define Multiple 2 -#define TAB " " - using namespace std; using namespace cv; -void gen(Mat &mat, int rows, int cols, int type, Scalar low, Scalar high); -void gen(Mat &mat, int rows, int cols, int type, int low, int high, int n); - -string abspath(const string &relpath); -int CV_CDECL cvErrorCallback(int, const char *, const char *, const char *, int, void *); -//typedef struct -//{ -// short x; -// short y; -//} COOR; -//COOR do_meanShift(int x0, int y0, uchar *sptr, uchar *dptr, int sstep, -// cv::Size size, int sp, int sr, int maxIter, float eps, int *tab); -//void meanShiftProc_(const Mat &src_roi, Mat &dst_roi, Mat &dstCoor_roi, -// int sp, int sr, cv::TermCriteria crit); - - -template -int ExpectedEQ(T1 expected, T2 actual) -{ - if(expected == actual) - return 1; - - return 0; -} - -template -int EeceptDoubleEQ(T1 expected, T1 actual) -{ - testing::internal::Double lhs(expected); - testing::internal::Double rhs(actual); - - if (lhs.AlmostEquals(rhs)) - { - return 1; - } - - return 0; -} - -template -int AssertEQ(T expected, T actual) -{ - if(expected == actual) - { - return 1; - } - return 0; -} - -int ExceptDoubleNear(double val1, double val2, double abs_error); -bool match_rect(cv::Rect r1, cv::Rect r2, int threshold); - -double checkNorm(const cv::Mat &m); -double checkNorm(const cv::Mat &m1, const cv::Mat &m2); -double checkSimilarity(const cv::Mat &m1, const cv::Mat &m2); - -int ExpectedMatNear(cv::Mat dst, cv::Mat cpu_dst, double eps); -int ExceptedMatSimilar(cv::Mat dst, cv::Mat cpu_dst, double eps); - -class Runnable -{ -public: - explicit Runnable(const std::string &runname): name_(runname) {} - virtual ~Runnable() {} - - const std::string &name() const - { - return name_; - } - - virtual void run() = 0; - -private: - std::string name_; -}; - -class TestSystem -{ -public: - static TestSystem &instance() - { - static TestSystem me; - return me; - } - - void setWorkingDir(const std::string &val) - { - working_dir_ = val; - } - const std::string &workingDir() const - { - return working_dir_; - } - - void setTestFilter(const std::string &val) - { - test_filter_ = val; - } - const std::string &testFilter() const - { - return test_filter_; - } - - void setNumIters(int num_iters) - { - num_iters_ = num_iters; - } - void setGPUWarmupIters(int num_iters) - { - gpu_warmup_iters_ = num_iters; - } - void setCPUIters(int num_iters) - { - cpu_num_iters_ = num_iters; - } - - void setTopThreshold(double top) - { - top_ = top; - } - void setBottomThreshold(double bottom) - { - bottom_ = bottom; - } - - void addInit(Runnable *init) - { - inits_.push_back(init); - } - void addTest(Runnable *test) - { - tests_.push_back(test); - } - void run(); - - // It's public because OpenCV callback uses it - void printError(const std::string &msg); - - std::stringstream &startNewSubtest() - { - finishCurrentSubtest(); - return cur_subtest_description_; - } - - bool stop() const - { - return cur_iter_idx_ >= num_iters_; - } - - bool cpu_stop() const - { - return cur_iter_idx_ >= cpu_num_iters_; - } - - int get_cur_iter_idx() - { - return cur_iter_idx_; - } - - int get_cpu_num_iters() - { - return cpu_num_iters_; - } - - bool warmupStop() - { - return cur_warmup_idx_++ >= gpu_warmup_iters_; - } - - void warmupComplete() - { - cur_warmup_idx_ = 0; - } - - void cpuOn() - { - cpu_started_ = cv::getTickCount(); - } - void cpuOff() - { - int64 delta = cv::getTickCount() - cpu_started_; - cpu_times_.push_back(delta); - ++cur_iter_idx_; - } - void cpuComplete() - { - cpu_elapsed_ += meanTime(cpu_times_); - cur_subtest_is_empty_ = false; - cur_iter_idx_ = 0; - } +#define OCL_SIZE_1000 Size(1000, 1000) +#define OCL_SIZE_2000 Size(2000, 2000) +#define OCL_SIZE_4000 Size(4000, 4000) - void gpuOn() - { - gpu_started_ = cv::getTickCount(); - } - void gpuOff() - { - int64 delta = cv::getTickCount() - gpu_started_; - gpu_times_.push_back(delta); - ++cur_iter_idx_; - } - void gpuComplete() - { - gpu_elapsed_ += meanTime(gpu_times_); - cur_subtest_is_empty_ = false; - cur_iter_idx_ = 0; - } - - void gpufullOn() - { - gpu_full_started_ = cv::getTickCount(); - } - void gpufullOff() - { - int64 delta = cv::getTickCount() - gpu_full_started_; - gpu_full_times_.push_back(delta); - ++cur_iter_idx_; - } - void gpufullComplete() - { - gpu_full_elapsed_ += meanTime(gpu_full_times_); - cur_subtest_is_empty_ = false; - cur_iter_idx_ = 0; - } - - bool isListMode() const - { - return is_list_mode_; - } - void setListMode(bool value) - { - is_list_mode_ = value; - } - - void setRecordName(const std::string &name) - { - recordname_ = name; - } - - void setCurrentTest(const std::string &name) - { - itname_ = name; - itname_changed_ = true; - } - - void setAccurate(int accurate, double diff) - { - is_accurate_ = accurate; - accurate_diff_ = diff; - } - - void ExpectMatsNear(vector& dst, vector& cpu_dst, vector& eps) - { - assert(dst.size() == cpu_dst.size()); - assert(cpu_dst.size() == eps.size()); - is_accurate_ = 1; - for(size_t i=0; i eps[i]) - is_accurate_ = 0; - } - } - - void ExpectedMatNear(cv::Mat& dst, cv::Mat& cpu_dst, double eps) - { - assert(dst.type() == cpu_dst.type()); - assert(dst.size() == cpu_dst.size()); - accurate_diff_ = checkNorm(dst, cpu_dst); - if(accurate_diff_ <= eps) - is_accurate_ = 1; - else - is_accurate_ = 0; - } - - void ExceptedMatSimilar(cv::Mat& dst, cv::Mat& cpu_dst, double eps) - { - assert(dst.type() == cpu_dst.type()); - assert(dst.size() == cpu_dst.size()); - accurate_diff_ = checkSimilarity(cpu_dst, dst); - if(accurate_diff_ <= eps) - is_accurate_ = 1; - else - is_accurate_ = 0; - } - - std::stringstream &getCurSubtestDescription() - { - return cur_subtest_description_; - } - -private: - TestSystem(): - cur_subtest_is_empty_(true), cpu_elapsed_(0), - gpu_elapsed_(0), gpu_full_elapsed_(0), speedup_total_(0.0), - num_subtests_called_(0), - speedup_faster_count_(0), speedup_slower_count_(0), speedup_equal_count_(0), - speedup_full_faster_count_(0), speedup_full_slower_count_(0), speedup_full_equal_count_(0), is_list_mode_(false), - num_iters_(10), cpu_num_iters_(2), - gpu_warmup_iters_(1), cur_iter_idx_(0), cur_warmup_idx_(0), - record_(0), recordname_("performance"), itname_changed_(true), - is_accurate_(-1), accurate_diff_(0.) - { - cpu_times_.reserve(num_iters_); - gpu_times_.reserve(num_iters_); - gpu_full_times_.reserve(num_iters_); - } - - void finishCurrentSubtest(); - void resetCurrentSubtest() - { - cpu_elapsed_ = 0; - gpu_elapsed_ = 0; - gpu_full_elapsed_ = 0; - cur_subtest_description_.str(""); - cur_subtest_is_empty_ = true; - cur_iter_idx_ = 0; - cur_warmup_idx_ = 0; - cpu_times_.clear(); - gpu_times_.clear(); - gpu_full_times_.clear(); - is_accurate_ = -1; - accurate_diff_ = 0.; - } - - double meanTime(const std::vector &samples); - - void printHeading(); - void printSummary(); - void printMetrics(int is_accurate, double cpu_time, double gpu_time = 0.0f, double gpu_full_time = 0.0f, double speedup = 0.0f, double fullspeedup = 0.0f); - - void writeHeading(); - void writeSummary(); - void writeMetrics(double cpu_time, double gpu_time = 0.0f, double gpu_full_time = 0.0f, - double speedup = 0.0f, double fullspeedup = 0.0f, - double gpu_min = 0.0f, double gpu_max = 0.0f, double std_dev = 0.0f); - - std::string working_dir_; - std::string test_filter_; - - std::vector inits_; - std::vector tests_; - - std::stringstream cur_subtest_description_; - bool cur_subtest_is_empty_; - - int64 cpu_started_; - int64 gpu_started_; - int64 gpu_full_started_; - double cpu_elapsed_; - double gpu_elapsed_; - double gpu_full_elapsed_; - - double speedup_total_; - double speedup_full_total_; - int num_subtests_called_; - - int speedup_faster_count_; - int speedup_slower_count_; - int speedup_equal_count_; - - int speedup_full_faster_count_; - int speedup_full_slower_count_; - int speedup_full_equal_count_; - - bool is_list_mode_; - - double top_; - double bottom_; - - int num_iters_; - int cpu_num_iters_; //there's no need to set cpu running same times with gpu - int gpu_warmup_iters_; //gpu warm up times, default is 1 - int cur_iter_idx_; - int cur_warmup_idx_; //current gpu warm up times - std::vector cpu_times_; - std::vector gpu_times_; - std::vector gpu_full_times_; - - FILE *record_; - std::string recordname_; - std::string itname_; - bool itname_changed_; - - int is_accurate_; - double accurate_diff_; -}; - - -#define GLOBAL_INIT(name) \ -struct name##_init: Runnable { \ - name##_init(): Runnable(#name) { \ - TestSystem::instance().addInit(this); \ -} \ - void run(); \ -} name##_init_instance; \ - void name##_init::run() - - -#define PERFTEST(name) \ -struct name##_test: Runnable { \ - name##_test(): Runnable(#name) { \ - TestSystem::instance().addTest(this); \ -} \ - void run(); \ -} name##_test_instance; \ - void name##_test::run() +#define OCL_TYPICAL_MAT_SIZES ::testing::Values(OCL_SIZE_1000, OCL_SIZE_2000, OCL_SIZE_4000) -#define SUBTEST TestSystem::instance().startNewSubtest() +#define OCL_PERF_ENUM(type, ...) ::testing::Values(type, ## __VA_ARGS__ ) -#define CPU_ON \ - while (!TestSystem::instance().cpu_stop()) { \ - TestSystem::instance().cpuOn() -#define CPU_OFF \ - TestSystem::instance().cpuOff(); \ - } TestSystem::instance().cpuComplete() +#define IMPL_OCL "ocl" +#define IMPL_GPU "gpu" +#define IMPL_PLAIN "plain" -#define GPU_ON \ - while (!TestSystem::instance().stop()) { \ - TestSystem::instance().gpuOn() -#define GPU_OFF \ - ocl::finish();\ - TestSystem::instance().gpuOff(); \ - } TestSystem::instance().gpuComplete() +#define RUN_OCL_IMPL (IMPL_OCL == getSelectedImpl()) +#define RUN_PLAIN_IMPL (IMPL_PLAIN == getSelectedImpl()) -#define GPU_FULL_ON \ - while (!TestSystem::instance().stop()) { \ - TestSystem::instance().gpufullOn() -#define GPU_FULL_OFF \ - TestSystem::instance().gpufullOff(); \ - } TestSystem::instance().gpufullComplete() +#ifdef HAVE_OPENCV_GPU +# define RUN_GPU_IMPL (IMPL_GPU == getSelectedImpl()) +#endif -#define WARMUP_ON \ - while (!TestSystem::instance().warmupStop()) { -#define WARMUP_OFF \ - ocl::finish();\ - } TestSystem::instance().warmupComplete() +#ifdef HAVE_OPENCV_GPU +#define OCL_PERF_ELSE \ + if (RUN_GPU_IMPL) \ + CV_TEST_FAIL_NO_IMPL(); \ + else \ + CV_TEST_FAIL_NO_IMPL(); +#else +#define OCL_PERF_ELSE \ + CV_TEST_FAIL_NO_IMPL(); +#endif #endif diff --git a/modules/ocl/perf/perf_pyramid.cpp b/modules/ocl/perf/perf_pyramid.cpp index 6b24811a6a..c7f949d2c8 100644 --- a/modules/ocl/perf/perf_pyramid.cpp +++ b/modules/ocl/perf/perf_pyramid.cpp @@ -51,97 +51,74 @@ using std::tr1::get; ///////////// pyrDown ////////////////////// -CV_ENUM(pyrDownMatType, CV_8UC1, CV_8UC4) - -typedef tuple pyrDownParams; -typedef TestBaseWithParam pyrDownFixture; +typedef Size_MatType pyrDownFixture; PERF_TEST_P(pyrDownFixture, pyrDown, ::testing::Combine(OCL_TYPICAL_MAT_SIZES, - pyrDownMatType::all())) + OCL_PERF_ENUM(CV_8UC1, CV_8UC4))) { - // getting params - pyrDownParams params = GetParam(); + const Size_MatType_t params = GetParam(); const Size srcSize = get<0>(params); const int type = get<1>(params); - std::string impl = getSelectedImpl(); - - // creating src data Mat src(srcSize, type), dst; Size dstSize((srcSize.height + 1) >> 1, (srcSize.width + 1) >> 1); dst.create(dstSize, type); - declare.in(src).out(dst); + declare.in(src, WARMUP_RNG).out(dst); - // select implementation - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclSrc(src), oclDst(dstSize, type); - TEST_CYCLE() cv::ocl::pyrDown(oclSrc, oclDst); + TEST_CYCLE() ocl::pyrDown(oclSrc, oclDst); oclDst.download(dst); SANITY_CHECK(dst); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { - TEST_CYCLE() cv::pyrDown(src, dst); + TEST_CYCLE() pyrDown(src, dst); SANITY_CHECK(dst); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } ///////////// pyrUp //////////////////////// -typedef pyrDownMatType pyrUpMatType; -typedef tuple pyrUpParams; -typedef TestBaseWithParam pyrUpFixture; +typedef Size_MatType pyrUpFixture; PERF_TEST_P(pyrUpFixture, pyrUp, ::testing::Combine(OCL_TYPICAL_MAT_SIZES, - pyrUpMatType::all())) + OCL_PERF_ENUM(CV_8UC1, CV_8UC4))) { - // getting params - pyrUpParams params = GetParam(); + const Size_MatType_t params = GetParam(); const Size srcSize = get<0>(params); const int type = get<1>(params); - std::string impl = getSelectedImpl(); - - // creating src data Mat src(srcSize, type), dst; Size dstSize(srcSize.height << 1, srcSize.width << 1); dst.create(dstSize, type); - declare.in(src).out(dst); + declare.in(src, WARMUP_RNG).out(dst); - // select implementation - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclSrc(src), oclDst(dstSize, type); - TEST_CYCLE() cv::ocl::pyrDown(oclSrc, oclDst); + TEST_CYCLE() ocl::pyrDown(oclSrc, oclDst); oclDst.download(dst); SANITY_CHECK(dst); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { - TEST_CYCLE() cv::pyrDown(src, dst); + TEST_CYCLE() pyrDown(src, dst); SANITY_CHECK(dst); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } diff --git a/modules/ocl/perf/perf_split_merge.cpp b/modules/ocl/perf/perf_split_merge.cpp index 304d3dd37a..48d64c100e 100644 --- a/modules/ocl/perf/perf_split_merge.cpp +++ b/modules/ocl/perf/perf_split_merge.cpp @@ -51,23 +51,16 @@ using std::tr1::get; ///////////// Merge//////////////////////// -CV_ENUM(MergeMatType, CV_8U, CV_32F) - -typedef tuple MergeParams; -typedef TestBaseWithParam MergeFixture; +typedef Size_MatType MergeFixture; PERF_TEST_P(MergeFixture, Merge, ::testing::Combine(::testing::Values(OCL_SIZE_1000, OCL_SIZE_2000), - MergeMatType::all())) + OCL_PERF_ENUM(CV_8U, CV_32F))) { - // getting params - MergeParams params = GetParam(); + const Size_MatType_t params = GetParam(); const Size srcSize = get<0>(params); const int depth = get<1>(params), channels = 3; - std::string impl = getSelectedImpl(); - - // creating src data const int dstType = CV_MAKE_TYPE(depth, channels); Mat dst(srcSize, dstType); vector src(channels); @@ -78,8 +71,7 @@ PERF_TEST_P(MergeFixture, Merge, } declare.out(dst); - // select implementation - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclDst(srcSize, dstType); vector oclSrc(src.size()); @@ -92,50 +84,39 @@ PERF_TEST_P(MergeFixture, Merge, SANITY_CHECK(dst); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { TEST_CYCLE() cv::merge(src, dst); SANITY_CHECK(dst); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE } ///////////// Split//////////////////////// -typedef MergeMatType SplitMatType; -typedef tuple SplitParams; -typedef TestBaseWithParam SplitFixture; +typedef Size_MatType SplitFixture; PERF_TEST_P(SplitFixture, Split, ::testing::Combine(OCL_TYPICAL_MAT_SIZES, - SplitMatType::all())) + OCL_PERF_ENUM(CV_8U, CV_32F))) { - // getting params - MergeParams params = GetParam(); + const Size_MatType_t params = GetParam(); const Size srcSize = get<0>(params); const int depth = get<1>(params), channels = 3; - std::string impl = getSelectedImpl(); - - // creating src data Mat src(srcSize, CV_MAKE_TYPE(depth, channels)); declare.in(src, WARMUP_RNG); - // select implementation - if (impl == "ocl") + if (RUN_OCL_IMPL) { ocl::oclMat oclSrc(src); vector oclDst(channels, ocl::oclMat(srcSize, CV_MAKE_TYPE(depth, 1))); TEST_CYCLE() cv::ocl::split(oclSrc, oclDst); - AssertEQ(channels, 3); + ASSERT_EQ(3, channels); Mat dst0, dst1, dst2; oclDst[0].download(dst0); oclDst[1].download(dst1); @@ -144,21 +125,17 @@ PERF_TEST_P(SplitFixture, Split, SANITY_CHECK(dst1); SANITY_CHECK(dst2); } - else if (impl == "plain") + else if (RUN_PLAIN_IMPL) { vector dst(channels, Mat(srcSize, CV_MAKE_TYPE(depth, 1))); TEST_CYCLE() cv::split(src, dst); - AssertEQ(channels, 3); + ASSERT_EQ(3, channels); Mat & dst0 = dst[0], & dst1 = dst[1], & dst2 = dst[2]; SANITY_CHECK(dst0); SANITY_CHECK(dst1); SANITY_CHECK(dst2); } -#ifdef HAVE_OPENCV_GPU - else if (impl == "gpu") - CV_TEST_FAIL_NO_IMPL(); -#endif else - CV_TEST_FAIL_NO_IMPL(); + OCL_PERF_ELSE }