/*M/////////////////////////////////////////////////////////////////////////////////////// // // IMPORTANT: READ BEFORE DOWNLOADING, COPYING, INSTALLING OR USING. // // By downloading, copying, installing or using the software you agree to this license. // If you do not agree to this license, do not download, install, // copy or use the software. // // // License Agreement // For Open Source Computer Vision Library // // Copyright (C) 2010-2012, Multicoreware, Inc., all rights reserved. // Copyright (C) 2010-2012, Advanced Micro Devices, Inc., all rights reserved. // Third party copyrights are property of their respective owners. // // @Authors // Fangfang Bai, fangfang@multicorewareinc.com // Jin Ma, jin@multicorewareinc.com // // Redistribution and use in source and binary forms, with or without modification, // are permitted provided that the following conditions are met: // // * Redistribution's of source code must retain the above copyright notice, // this list of conditions and the following disclaimer. // // * Redistribution's in binary form must reproduce the above copyright notice, // this list of conditions and the following disclaimer in the documentation // and/or other oclMaterials provided with the distribution. // // * The name of the copyright holders may not be used to endorse or promote products // derived from this software without specific prior written permission. // // This software is provided by the copyright holders and contributors as is and // any express or implied warranties, including, but not limited to, the implied // warranties of merchantability and fitness for a particular purpose are disclaimed. // In no event shall the Intel Corporation or contributors be liable for any direct, // indirect, incidental, special, exemplary, or consequential damages // (including, but not limited to, procurement of substitute goods or services; // loss of use, data, or profits; or business interruption) however caused // and on any theory of liability, whether in contract, strict liability, // or tort (including negligence or otherwise) arising in any way out of // the use of this software, even if advised of the possibility of such damage. // //M*/ #include "perf_precomp.hpp" ///////////// Lut //////////////////////// PERFTEST(lut) { Mat src, lut, dst, ocl_dst; ocl::oclMat d_src, d_lut, d_dst; int all_type[] = {CV_8UC1, CV_8UC3}; std::string type_name[] = {"CV_8UC1", "CV_8UC3"}; for (int size = Min_Size; size <= Max_Size; size *= Multiple) { for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) { SUBTEST << size << 'x' << size << "; " << type_name[j]; gen(src, size, size, all_type[j], 0, 256); gen(lut, 1, 256, CV_8UC1, 0, 1); LUT(src, lut, dst); CPU_ON; LUT(src, lut, dst); CPU_OFF; d_src.upload(src); d_lut.upload(lut); WARMUP_ON; ocl::LUT(d_src, d_lut, d_dst); WARMUP_OFF; GPU_ON; ocl::LUT(d_src, d_lut, d_dst); GPU_OFF; GPU_FULL_ON; d_src.upload(src); d_lut.upload(lut); ocl::LUT(d_src, d_lut, d_dst); d_dst.download(ocl_dst); GPU_FULL_OFF; TestSystem::instance().ExpectedMatNear(ocl_dst, dst, 0); } } } ///////////// Exp //////////////////////// PERFTEST(Exp) { Mat src, dst, ocl_dst; ocl::oclMat d_src, d_dst; for (int size = Min_Size; size <= Max_Size; size *= Multiple) { SUBTEST << size << 'x' << size << "; CV_32FC1"; gen(src, size, size, CV_32FC1, 5, 16); exp(src, dst); CPU_ON; exp(src, dst); CPU_OFF; d_src.upload(src); WARMUP_ON; ocl::exp(d_src, d_dst); WARMUP_OFF; GPU_ON; ocl::exp(d_src, d_dst); GPU_OFF; GPU_FULL_ON; d_src.upload(src); ocl::exp(d_src, d_dst); d_dst.download(ocl_dst); GPU_FULL_OFF; TestSystem::instance().ExpectedMatNear(ocl_dst, dst, 2); } } ///////////// LOG //////////////////////// PERFTEST(Log) { Mat src, dst, ocl_dst; ocl::oclMat d_src, d_dst; for (int size = Min_Size; size <= Max_Size; size *= Multiple) { SUBTEST << size << 'x' << size << "; 32F"; gen(src, size, size, CV_32F, 1, 10); log(src, dst); CPU_ON; log(src, dst); CPU_OFF; d_src.upload(src); WARMUP_ON; ocl::log(d_src, d_dst); WARMUP_OFF; GPU_ON; ocl::log(d_src, d_dst); GPU_OFF; GPU_FULL_ON; d_src.upload(src); ocl::log(d_src, d_dst); d_dst.download(ocl_dst); GPU_FULL_OFF; TestSystem::instance().ExpectedMatNear(ocl_dst, dst, 1); } } ///////////// Add //////////////////////// PERFTEST(Add) { Mat src1, src2, dst, ocl_dst; ocl::oclMat d_src1, d_src2, d_dst; int all_type[] = {CV_8UC1, CV_32FC1}; std::string type_name[] = {"CV_8UC1", "CV_32FC1"}; for (int size = Min_Size; size <= Max_Size; size *= Multiple) { for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) { SUBTEST << size << 'x' << size << "; " << type_name[j]; gen(src1, size, size, all_type[j], 0, 1); gen(src2, size, size, all_type[j], 0, 1); add(src1, src2, dst); CPU_ON; add(src1, src2, dst); CPU_OFF; d_src1.upload(src1); d_src2.upload(src2); WARMUP_ON; ocl::add(d_src1, d_src2, d_dst); WARMUP_OFF; GPU_ON; ocl::add(d_src1, d_src2, d_dst); GPU_OFF; GPU_FULL_ON; d_src1.upload(src1); d_src2.upload(src2); ocl::add(d_src1, d_src2, d_dst); d_dst.download(ocl_dst); GPU_FULL_OFF; TestSystem::instance().ExpectedMatNear(ocl_dst, dst, 0.0); } } } ///////////// Mul //////////////////////// PERFTEST(Mul) { Mat src1, src2, dst, ocl_dst; ocl::oclMat d_src1, d_src2, d_dst; int all_type[] = {CV_8UC1, CV_8UC4}; std::string type_name[] = {"CV_8UC1", "CV_8UC4"}; for (int size = Min_Size; size <= Max_Size; size *= Multiple) { for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) { SUBTEST << size << 'x' << size << "; " << type_name[j] ; gen(src1, size, size, all_type[j], 0, 256); gen(src2, size, size, all_type[j], 0, 256); multiply(src1, src2, dst); CPU_ON; multiply(src1, src2, dst); CPU_OFF; d_src1.upload(src1); d_src2.upload(src2); WARMUP_ON; ocl::multiply(d_src1, d_src2, d_dst); WARMUP_OFF; GPU_ON; ocl::multiply(d_src1, d_src2, d_dst); GPU_OFF; GPU_FULL_ON; d_src1.upload(src1); d_src2.upload(src2); ocl::multiply(d_src1, d_src2, d_dst); d_dst.download(ocl_dst); GPU_FULL_OFF; TestSystem::instance().ExpectedMatNear(ocl_dst, dst, 0.0); } } } ///////////// Div //////////////////////// PERFTEST(Div) { Mat src1, src2, dst, ocl_dst; ocl::oclMat d_src1, d_src2, d_dst; int all_type[] = {CV_8UC1, CV_8UC4}; std::string type_name[] = {"CV_8UC1", "CV_8UC4"}; for (int size = Min_Size; size <= Max_Size; size *= Multiple) { for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) { SUBTEST << size << 'x' << size << "; " << type_name[j]; gen(src1, size, size, all_type[j], 0, 256); gen(src2, size, size, all_type[j], 0, 256); divide(src1, src2, dst); CPU_ON; divide(src1, src2, dst); CPU_OFF; d_src1.upload(src1); d_src2.upload(src2); WARMUP_ON; ocl::divide(d_src1, d_src2, d_dst); WARMUP_OFF; GPU_ON; ocl::divide(d_src1, d_src2, d_dst); GPU_OFF; GPU_FULL_ON; d_src1.upload(src1); d_src2.upload(src2); ocl::divide(d_src1, d_src2, d_dst); d_dst.download(ocl_dst); GPU_FULL_OFF; TestSystem::instance().ExpectedMatNear(ocl_dst, dst, 1); } } } ///////////// Absdiff //////////////////////// PERFTEST(Absdiff) { Mat src1, src2, dst, ocl_dst; ocl::oclMat d_src1, d_src2, d_dst; int all_type[] = {CV_8UC1, CV_8UC4}; std::string type_name[] = {"CV_8UC1", "CV_8UC4"}; for (int size = Min_Size; size <= Max_Size; size *= Multiple) { for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) { SUBTEST << size << 'x' << size << "; " << type_name[j] ; gen(src1, size, size, all_type[j], 0, 256); gen(src2, size, size, all_type[j], 0, 256); gen(dst, size, size, all_type[j], 0, 256); absdiff(src1, src2, dst); CPU_ON; absdiff(src1, src2, dst); CPU_OFF; d_src1.upload(src1); d_src2.upload(src2); WARMUP_ON; ocl::absdiff(d_src1, d_src2, d_dst); WARMUP_OFF; GPU_ON; ocl::absdiff(d_src1, d_src2, d_dst); GPU_OFF; GPU_FULL_ON; d_src1.upload(src1); d_src2.upload(src2); ocl::absdiff(d_src1, d_src2, d_dst); d_dst.download(ocl_dst); GPU_FULL_OFF; TestSystem::instance().ExpectedMatNear(ocl_dst, dst, 0.0); } } } ///////////// CartToPolar //////////////////////// PERFTEST(CartToPolar) { Mat src1, src2, dst, dst1, ocl_dst, ocl_dst1; ocl::oclMat d_src1, d_src2, d_dst, d_dst1; int all_type[] = {CV_32FC1}; std::string type_name[] = {"CV_32FC1"}; for (int size = Min_Size; size <= Max_Size; size *= Multiple) { for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) { SUBTEST << size << 'x' << size << "; " << type_name[j]; gen(src1, size, size, all_type[j], 0, 256); gen(src2, size, size, all_type[j], 0, 256); gen(dst, size, size, all_type[j], 0, 256); gen(dst1, size, size, all_type[j], 0, 256); cartToPolar(src1, src2, dst, dst1, 1); CPU_ON; cartToPolar(src1, src2, dst, dst1, 1); CPU_OFF; d_src1.upload(src1); d_src2.upload(src2); WARMUP_ON; ocl::cartToPolar(d_src1, d_src2, d_dst, d_dst1, 1); WARMUP_OFF; GPU_ON; ocl::cartToPolar(d_src1, d_src2, d_dst, d_dst1, 1); GPU_OFF; GPU_FULL_ON; d_src1.upload(src1); d_src2.upload(src2); ocl::cartToPolar(d_src1, d_src2, d_dst, d_dst1, 1); d_dst.download(ocl_dst); d_dst1.download(ocl_dst1); GPU_FULL_OFF; double diff1 = checkNorm(ocl_dst1, dst1); double diff2 = checkNorm(ocl_dst, dst); double max_diff = max(diff1, diff2); TestSystem::instance().setAccurate(max_diff<=.5?1:0, max_diff); } } } ///////////// PolarToCart //////////////////////// PERFTEST(PolarToCart) { Mat src1, src2, dst, dst1, ocl_dst, ocl_dst1; ocl::oclMat d_src1, d_src2, d_dst, d_dst1; int all_type[] = {CV_32FC1}; std::string type_name[] = {"CV_32FC1"}; for (int size = Min_Size; size <= Max_Size; size *= Multiple) { for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) { SUBTEST << size << 'x' << size << "; " << type_name[j] ; gen(src1, size, size, all_type[j], 0, 256); gen(src2, size, size, all_type[j], 0, 256); gen(dst, size, size, all_type[j], 0, 256); gen(dst1, size, size, all_type[j], 0, 256); polarToCart(src1, src2, dst, dst1, 1); CPU_ON; polarToCart(src1, src2, dst, dst1, 1); CPU_OFF; d_src1.upload(src1); d_src2.upload(src2); WARMUP_ON; ocl::polarToCart(d_src1, d_src2, d_dst, d_dst1, 1); WARMUP_OFF; GPU_ON; ocl::polarToCart(d_src1, d_src2, d_dst, d_dst1, 1); GPU_OFF; GPU_FULL_ON; d_src1.upload(src1); d_src2.upload(src2); ocl::polarToCart(d_src1, d_src2, d_dst, d_dst1, 1); d_dst.download(ocl_dst); d_dst1.download(ocl_dst1); GPU_FULL_OFF; double diff1 = checkNorm(ocl_dst1, dst1); double diff2 = checkNorm(ocl_dst, dst); double max_diff = max(diff1, diff2); TestSystem::instance().setAccurate(max_diff<=.5?1:0, max_diff); } } } ///////////// Magnitude //////////////////////// PERFTEST(magnitude) { Mat x, y, mag, ocl_mag; ocl::oclMat d_x, d_y, d_mag; int all_type[] = {CV_32FC1}; std::string type_name[] = {"CV_32FC1"}; for (int size = Min_Size; size <= Max_Size; size *= Multiple) { for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) { SUBTEST << size << 'x' << size << "; " << type_name[j]; gen(x, size, size, all_type[j], 0, 1); gen(y, size, size, all_type[j], 0, 1); magnitude(x, y, mag); CPU_ON; magnitude(x, y, mag); CPU_OFF; d_x.upload(x); d_y.upload(y); WARMUP_ON; ocl::magnitude(d_x, d_y, d_mag); WARMUP_OFF; GPU_ON; ocl::magnitude(d_x, d_y, d_mag); GPU_OFF; GPU_FULL_ON; d_x.upload(x); d_y.upload(y); ocl::magnitude(d_x, d_y, d_mag); d_mag.download(ocl_mag); GPU_FULL_OFF; TestSystem::instance().ExpectedMatNear(ocl_mag, mag, 1e-5); } } } ///////////// Transpose //////////////////////// PERFTEST(Transpose) { Mat src, dst, ocl_dst; ocl::oclMat d_src, d_dst; int all_type[] = {CV_8UC1, CV_8UC4}; std::string type_name[] = {"CV_8UC1", "CV_8UC4"}; for (int size = Min_Size; size <= Max_Size; size *= Multiple) { for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) { SUBTEST << size << 'x' << size << "; " << type_name[j]; gen(src, size, size, all_type[j], 0, 256); gen(dst, size, size, all_type[j], 0, 256); transpose(src, dst); CPU_ON; transpose(src, dst); CPU_OFF; d_src.upload(src); WARMUP_ON; ocl::transpose(d_src, d_dst); WARMUP_OFF; GPU_ON; ocl::transpose(d_src, d_dst); GPU_OFF; GPU_FULL_ON; d_src.upload(src); ocl::transpose(d_src, d_dst); d_dst.download(ocl_dst); GPU_FULL_OFF; TestSystem::instance().ExpectedMatNear(ocl_dst, dst, 1e-5); } } } ///////////// Flip //////////////////////// PERFTEST(Flip) { Mat src, dst, ocl_dst; ocl::oclMat d_src, d_dst; int all_type[] = {CV_8UC1, CV_8UC4}; std::string type_name[] = {"CV_8UC1", "CV_8UC4"}; for (int size = Min_Size; size <= Max_Size; size *= Multiple) { for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) { SUBTEST << size << 'x' << size << "; " << type_name[j] << " ; FLIP_BOTH"; gen(src, size, size, all_type[j], 0, 256); gen(dst, size, size, all_type[j], 0, 256); flip(src, dst, 0); CPU_ON; flip(src, dst, 0); CPU_OFF; d_src.upload(src); WARMUP_ON; ocl::flip(d_src, d_dst, 0); WARMUP_OFF; GPU_ON; ocl::flip(d_src, d_dst, 0); GPU_OFF; GPU_FULL_ON; d_src.upload(src); ocl::flip(d_src, d_dst, 0); d_dst.download(ocl_dst); GPU_FULL_OFF; TestSystem::instance().ExpectedMatNear(ocl_dst, dst, 1e-5); } } } ///////////// minMax //////////////////////// PERFTEST(minMax) { Mat src; ocl::oclMat d_src; double min_val = 0.0, max_val = 0.0; double min_val_ = 0.0, max_val_ = 0.0; Point min_loc, max_loc; int all_type[] = {CV_8UC1, CV_32FC1}; std::string type_name[] = {"CV_8UC1", "CV_32FC1"}; for (int size = Min_Size; size <= Max_Size; size *= Multiple) { for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) { SUBTEST << size << 'x' << size << "; " << type_name[j]; gen(src, size, size, all_type[j], 0, 256); CPU_ON; minMaxLoc(src, &min_val, &max_val, &min_loc, &max_loc); CPU_OFF; d_src.upload(src); WARMUP_ON; ocl::minMax(d_src, &min_val_, &max_val_); WARMUP_OFF; if(EeceptDoubleEQ(max_val_, max_val) && EeceptDoubleEQ(min_val_, min_val)) TestSystem::instance().setAccurate(1, max(fabs(max_val_-max_val), fabs(min_val_-min_val))); else TestSystem::instance().setAccurate(0, max(fabs(max_val_-max_val), fabs(min_val_-min_val))); GPU_ON; ocl::minMax(d_src, &min_val, &max_val); GPU_OFF; GPU_FULL_ON; d_src.upload(src); ocl::minMax(d_src, &min_val, &max_val); GPU_FULL_OFF; } } } ///////////// minMaxLoc //////////////////////// PERFTEST(minMaxLoc) { Mat src; ocl::oclMat d_src; double min_val = 0.0, max_val = 0.0; double min_val_ = 0.0, max_val_ = 0.0; Point min_loc, max_loc; Point min_loc_, max_loc_; int all_type[] = {CV_8UC1, CV_32FC1}; std::string type_name[] = {"CV_8UC1", "CV_32FC1"}; for (int size = Min_Size; size <= Max_Size; size *= Multiple) { for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) { SUBTEST << size << 'x' << size << "; " << type_name[j] ; gen(src, size, size, all_type[j], 0, 1); CPU_ON; minMaxLoc(src, &min_val, &max_val, &min_loc, &max_loc); CPU_OFF; d_src.upload(src); WARMUP_ON; ocl::minMaxLoc(d_src, &min_val_, &max_val_, &min_loc_, &max_loc_); WARMUP_OFF; double error0 = 0., error1 = 0., minlocVal = 0., minlocVal_ = 0., maxlocVal = 0., maxlocVal_ = 0.; if(src.depth() == 0) { minlocVal = src.at(min_loc); minlocVal_ = src.at(min_loc_); maxlocVal = src.at(max_loc); maxlocVal_ = src.at(max_loc_); } if(src.depth() == 1) { minlocVal = src.at(min_loc); minlocVal_ = src.at(min_loc_); maxlocVal = src.at(max_loc); maxlocVal_ = src.at(max_loc_); } if(src.depth() == 2) { minlocVal = src.at(min_loc); minlocVal_ = src.at(min_loc_); maxlocVal = src.at(max_loc); maxlocVal_ = src.at(max_loc_); } if(src.depth() == 3) { minlocVal = src.at(min_loc); minlocVal_ = src.at(min_loc_); maxlocVal = src.at(max_loc); maxlocVal_ = src.at(max_loc_); } if(src.depth() == 4) { minlocVal = src.at(min_loc); minlocVal_ = src.at(min_loc_); maxlocVal = src.at(max_loc); maxlocVal_ = src.at(max_loc_); } if(src.depth() == 5) { minlocVal = src.at(min_loc); minlocVal_ = src.at(min_loc_); maxlocVal = src.at(max_loc); maxlocVal_ = src.at(max_loc_); } if(src.depth() == 6) { minlocVal = src.at(min_loc); minlocVal_ = src.at(min_loc_); maxlocVal = src.at(max_loc); maxlocVal_ = src.at(max_loc_); } error0 = ::abs(minlocVal_ - minlocVal); error1 = ::abs(maxlocVal_ - maxlocVal); if( EeceptDoubleEQ(maxlocVal_, maxlocVal) &&EeceptDoubleEQ(minlocVal_, minlocVal) &&EeceptDoubleEQ(max_val_, max_val) &&EeceptDoubleEQ(min_val_, min_val)) TestSystem::instance().setAccurate(1, 0.); else TestSystem::instance().setAccurate(0, max(error0, error1)); GPU_ON; ocl::minMaxLoc(d_src, &min_val, &max_val, &min_loc, &max_loc); GPU_OFF; GPU_FULL_ON; d_src.upload(src); ocl::minMaxLoc(d_src, &min_val, &max_val, &min_loc, &max_loc); GPU_FULL_OFF; } } } ///////////// Sum //////////////////////// PERFTEST(Sum) { Mat src; Scalar cpures, gpures; ocl::oclMat d_src; int all_type[] = {CV_8UC1, CV_32SC1}; std::string type_name[] = {"CV_8UC1", "CV_32SC1"}; for (int size = Min_Size; size <= Max_Size; size *= Multiple) { for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) { SUBTEST << size << 'x' << size << "; " << type_name[j] ; gen(src, size, size, all_type[j], 0, 60); cpures = sum(src); CPU_ON; cpures = sum(src); CPU_OFF; d_src.upload(src); WARMUP_ON; gpures = ocl::sum(d_src); WARMUP_OFF; vector diffs(4); diffs[3] = fabs(cpures[3] - gpures[3]); diffs[2] = fabs(cpures[2] - gpures[2]); diffs[1] = fabs(cpures[1] - gpures[1]); diffs[0] = fabs(cpures[0] - gpures[0]); double max_diff = *max_element(diffs.begin(), diffs.end()); TestSystem::instance().setAccurate(max_diff<0.1?1:0, max_diff); GPU_ON; gpures = ocl::sum(d_src); GPU_OFF; GPU_FULL_ON; d_src.upload(src); gpures = ocl::sum(d_src); GPU_FULL_OFF; } } } ///////////// countNonZero //////////////////////// PERFTEST(countNonZero) { Mat src; ocl::oclMat d_src; int all_type[] = {CV_8UC1, CV_32FC1}; std::string type_name[] = {"CV_8UC1", "CV_32FC1"}; for (int size = Min_Size; size <= Max_Size; size *= Multiple) { for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) { SUBTEST << size << 'x' << size << "; " << type_name[j] ; gen(src, size, size, all_type[j], 0, 256); countNonZero(src); int cpures = 0, gpures = 0; CPU_ON; cpures = countNonZero(src); CPU_OFF; d_src.upload(src); WARMUP_ON; gpures = ocl::countNonZero(d_src); WARMUP_OFF; int diff = abs(cpures - gpures); if(diff == 0) TestSystem::instance().setAccurate(1, 0); else TestSystem::instance().setAccurate(0, diff); GPU_ON; ocl::countNonZero(d_src); GPU_OFF; GPU_FULL_ON; d_src.upload(src); ocl::countNonZero(d_src); GPU_FULL_OFF; } } } ///////////// Phase //////////////////////// PERFTEST(Phase) { Mat src1, src2, dst, ocl_dst; ocl::oclMat d_src1, d_src2, d_dst; int all_type[] = {CV_32FC1}; std::string type_name[] = {"CV_32FC1"}; for (int size = Min_Size; size <= Max_Size; size *= Multiple) { for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) { SUBTEST << size << 'x' << size << "; " << type_name[j] ; gen(src1, size, size, all_type[j], 0, 256); gen(src2, size, size, all_type[j], 0, 256); gen(dst, size, size, all_type[j], 0, 256); phase(src1, src2, dst, 1); CPU_ON; phase(src1, src2, dst, 1); CPU_OFF; d_src1.upload(src1); d_src2.upload(src2); WARMUP_ON; ocl::phase(d_src1, d_src2, d_dst, 1); WARMUP_OFF; GPU_ON; ocl::phase(d_src1, d_src2, d_dst, 1); GPU_OFF; GPU_FULL_ON; d_src1.upload(src1); d_src2.upload(src2); ocl::phase(d_src1, d_src2, d_dst, 1); d_dst.download(ocl_dst); GPU_FULL_OFF; TestSystem::instance().ExpectedMatNear(ocl_dst, dst, 1e-2); } } } ///////////// bitwise_and//////////////////////// PERFTEST(bitwise_and) { Mat src1, src2, dst, ocl_dst; ocl::oclMat d_src1, d_src2, d_dst; int all_type[] = {CV_8UC1, CV_32SC1}; std::string type_name[] = {"CV_8UC1", "CV_32SC1"}; for (int size = Min_Size; size <= Max_Size; size *= Multiple) { for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) { SUBTEST << size << 'x' << size << "; " << type_name[j] ; gen(src1, size, size, all_type[j], 0, 256); gen(src2, size, size, all_type[j], 0, 256); gen(dst, size, size, all_type[j], 0, 256); bitwise_and(src1, src2, dst); CPU_ON; bitwise_and(src1, src2, dst); CPU_OFF; d_src1.upload(src1); d_src2.upload(src2); WARMUP_ON; ocl::bitwise_and(d_src1, d_src2, d_dst); WARMUP_OFF; GPU_ON; ocl::bitwise_and(d_src1, d_src2, d_dst); GPU_OFF; GPU_FULL_ON; d_src1.upload(src1); d_src2.upload(src2); ocl::bitwise_and(d_src1, d_src2, d_dst); d_dst.download(ocl_dst); GPU_FULL_OFF; TestSystem::instance().ExpectedMatNear(ocl_dst, dst, 0.0); } } } ///////////// bitwise_not//////////////////////// PERFTEST(bitwise_not) { Mat src1, dst, ocl_dst; ocl::oclMat d_src1, d_dst; int all_type[] = {CV_8UC1, CV_32SC1}; std::string type_name[] = {"CV_8UC1", "CV_32SC1"}; for (int size = Min_Size; size <= Max_Size; size *= Multiple) { for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) { SUBTEST << size << 'x' << size << "; " << type_name[j] ; gen(src1, size, size, all_type[j], 0, 256); gen(dst, size, size, all_type[j], 0, 256); bitwise_not(src1, dst); CPU_ON; bitwise_not(src1, dst); CPU_OFF; d_src1.upload(src1); WARMUP_ON; ocl::bitwise_not(d_src1, d_dst); WARMUP_OFF; GPU_ON; ocl::bitwise_not(d_src1, d_dst); GPU_OFF; GPU_FULL_ON; d_src1.upload(src1); ocl::bitwise_not(d_src1, d_dst); d_dst.download(ocl_dst); GPU_FULL_OFF; TestSystem::instance().ExpectedMatNear(ocl_dst, dst, 0.0); } } } ///////////// compare//////////////////////// PERFTEST(compare) { Mat src1, src2, dst, ocl_dst; ocl::oclMat d_src1, d_src2, d_dst; int CMP_EQ = 0; int all_type[] = {CV_8UC1, CV_32FC1}; std::string type_name[] = {"CV_8UC1", "CV_32FC1"}; for (int size = Min_Size; size <= Max_Size; size *= Multiple) { for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) { SUBTEST << size << 'x' << size << "; " << type_name[j] ; gen(src1, size, size, all_type[j], 0, 256); gen(src2, size, size, all_type[j], 0, 256); gen(dst, size, size, all_type[j], 0, 256); compare(src1, src2, dst, CMP_EQ); CPU_ON; compare(src1, src2, dst, CMP_EQ); CPU_OFF; d_src1.upload(src1); d_src2.upload(src2); WARMUP_ON; ocl::compare(d_src1, d_src2, d_dst, CMP_EQ); WARMUP_OFF; GPU_ON; ocl::compare(d_src1, d_src2, d_dst, CMP_EQ); GPU_OFF; GPU_FULL_ON; d_src1.upload(src1); d_src2.upload(src2); ocl::compare(d_src1, d_src2, d_dst, CMP_EQ); d_dst.download(ocl_dst); GPU_FULL_OFF; TestSystem::instance().ExpectedMatNear(ocl_dst, dst, 0.0); } } } ///////////// pow //////////////////////// PERFTEST(pow) { Mat src, dst, ocl_dst; ocl::oclMat d_src, d_dst; int all_type[] = {CV_32FC1}; std::string type_name[] = {"CV_32FC1"}; for (int size = Min_Size; size <= Max_Size; size *= Multiple) { for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) { SUBTEST << size << 'x' << size << "; " << type_name[j] ; gen(src, size, size, all_type[j], 5, 16); pow(src, -2.0, dst); CPU_ON; pow(src, -2.0, dst); CPU_OFF; d_src.upload(src); d_dst.upload(dst); WARMUP_ON; ocl::pow(d_src, -2.0, d_dst); WARMUP_OFF; GPU_ON; ocl::pow(d_src, -2.0, d_dst); GPU_OFF; GPU_FULL_ON; d_src.upload(src); ocl::pow(d_src, -2.0, d_dst); d_dst.download(ocl_dst); GPU_FULL_OFF; TestSystem::instance().ExpectedMatNear(ocl_dst, dst, 1.0); } } } ///////////// MagnitudeSqr//////////////////////// PERFTEST(MagnitudeSqr) { Mat src1, src2, dst, ocl_dst; ocl::oclMat d_src1, d_src2, d_dst; int all_type[] = {CV_32FC1}; std::string type_name[] = {"CV_32FC1"}; for (int size = Min_Size; size <= Max_Size; size *= Multiple) { for (size_t t = 0; t < sizeof(all_type) / sizeof(int); t++) { SUBTEST << size << 'x' << size << "; " << type_name[t]; gen(src1, size, size, all_type[t], 0, 256); gen(src2, size, size, all_type[t], 0, 256); gen(dst, size, size, all_type[t], 0, 256); CPU_ON; for (int i = 0; i < src1.rows; ++i) for (int j = 0; j < src1.cols; ++j) { float val1 = src1.at(i, j); float val2 = src2.at(i, j); ((float *)(dst.data))[i * dst.step / 4 + j] = val1 * val1 + val2 * val2; } CPU_OFF; d_src1.upload(src1); d_src2.upload(src2); WARMUP_ON; ocl::magnitudeSqr(d_src1, d_src2, d_dst); WARMUP_OFF; GPU_ON; ocl::magnitudeSqr(d_src1, d_src2, d_dst); GPU_OFF; GPU_FULL_ON; d_src1.upload(src1); d_src2.upload(src2); ocl::magnitudeSqr(d_src1, d_src2, d_dst); d_dst.download(ocl_dst); GPU_FULL_OFF; TestSystem::instance().ExpectedMatNear(ocl_dst, dst, 1.0); } } } ///////////// AddWeighted//////////////////////// PERFTEST(AddWeighted) { Mat src1, src2, dst, ocl_dst; ocl::oclMat d_src1, d_src2, d_dst; double alpha = 2.0, beta = 1.0, gama = 3.0; int all_type[] = {CV_8UC1, CV_32FC1}; std::string type_name[] = {"CV_8UC1", "CV_32FC1"}; for (int size = Min_Size; size <= Max_Size; size *= Multiple) { for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) { SUBTEST << size << 'x' << size << "; " << type_name[j] ; gen(src1, size, size, all_type[j], 0, 256); gen(src2, size, size, all_type[j], 0, 256); gen(dst, size, size, all_type[j], 0, 256); addWeighted(src1, alpha, src2, beta, gama, dst); CPU_ON; addWeighted(src1, alpha, src2, beta, gama, dst); CPU_OFF; d_src1.upload(src1); d_src2.upload(src2); WARMUP_ON; ocl::addWeighted(d_src1, alpha, d_src2, beta, gama, d_dst); WARMUP_OFF; GPU_ON; ocl::addWeighted(d_src1, alpha, d_src2, beta, gama, d_dst); GPU_OFF; GPU_FULL_ON; d_src1.upload(src1); d_src2.upload(src2); ocl::addWeighted(d_src1, alpha, d_src2, beta, gama, d_dst); d_dst.download(ocl_dst); GPU_FULL_OFF; TestSystem::instance().ExpectedMatNear(ocl_dst, dst, 1e-5); } } }