mirror of https://github.com/opencv/opencv.git
Open Source Computer Vision Library
https://opencv.org/
You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
1197 lines
33 KiB
1197 lines
33 KiB
/*M/////////////////////////////////////////////////////////////////////////////////////// |
|
// |
|
// IMPORTANT: READ BEFORE DOWNLOADING, COPYING, INSTALLING OR USING. |
|
// |
|
// By downloading, copying, installing or using the software you agree to this license. |
|
// If you do not agree to this license, do not download, install, |
|
// copy or use the software. |
|
// |
|
// |
|
// License Agreement |
|
// For Open Source Computer Vision Library |
|
// |
|
// Copyright (C) 2010-2012, Multicoreware, Inc., all rights reserved. |
|
// Copyright (C) 2010-2012, Advanced Micro Devices, Inc., all rights reserved. |
|
// Third party copyrights are property of their respective owners. |
|
// |
|
// @Authors |
|
// Fangfang Bai, fangfang@multicorewareinc.com |
|
// Jin Ma, jin@multicorewareinc.com |
|
// |
|
// Redistribution and use in source and binary forms, with or without modification, |
|
// are permitted provided that the following conditions are met: |
|
// |
|
// * Redistribution's of source code must retain the above copyright notice, |
|
// this list of conditions and the following disclaimer. |
|
// |
|
// * Redistribution's in binary form must reproduce the above copyright notice, |
|
// this list of conditions and the following disclaimer in the documentation |
|
// and/or other materials provided with the distribution. |
|
// |
|
// * The name of the copyright holders may not be used to endorse or promote products |
|
// derived from this software without specific prior written permission. |
|
// |
|
// This software is provided by the copyright holders and contributors as is and |
|
// any express or implied warranties, including, but not limited to, the implied |
|
// warranties of merchantability and fitness for a particular purpose are disclaimed. |
|
// In no event shall the Intel Corporation or contributors be liable for any direct, |
|
// indirect, incidental, special, exemplary, or consequential damages |
|
// (including, but not limited to, procurement of substitute goods or services; |
|
// loss of use, data, or profits; or business interruption) however caused |
|
// and on any theory of liability, whether in contract, strict liability, |
|
// or tort (including negligence or otherwise) arising in any way out of |
|
// the use of this software, even if advised of the possibility of such damage. |
|
// |
|
//M*/ |
|
|
|
#include "perf_precomp.hpp" |
|
///////////// Lut //////////////////////// |
|
// Perf case for LUT: runs the CPU LUT and ocl::LUT on square CV_8UC1 and
// CV_8UC3 inputs for every size from Min_Size to Max_Size, then compares the
// downloaded OpenCL output with the CPU output (tolerance argument 0).
PERFTEST(lut)
{
    Mat host_in, host_table, cpu_out, ocl_out;
    ocl::oclMat dev_in, dev_table, dev_out;

    const int types[] = {CV_8UC1, CV_8UC3};
    const std::string labels[] = {"CV_8UC1", "CV_8UC3"};
    const size_t type_count = sizeof(types) / sizeof(types[0]);

    for (int side = Min_Size; side <= Max_Size; side *= Multiple)
    {
        for (size_t t = 0; t < type_count; ++t)
        {
            SUBTEST << side << 'x' << side << "; " << labels[t];

            gen(host_in, side, side, types[t], 0, 256);
            // NOTE(review): the table is generated with bounds (0, 1) while the
            // source uses (0, 256) - confirm the table is meant to be this narrow.
            gen(host_table, 1, 256, CV_8UC1, 0, 1);

            // One call outside the CPU_ON/CPU_OFF section.
            LUT(host_in, host_table, cpu_out);

            CPU_ON;
            LUT(host_in, host_table, cpu_out);
            CPU_OFF;

            dev_in.upload(host_in);
            dev_table.upload(host_table);

            WARMUP_ON;
            ocl::LUT(dev_in, dev_table, dev_out);
            WARMUP_OFF;

            // Operation only; inputs were uploaded above.
            GPU_ON;
            ocl::LUT(dev_in, dev_table, dev_out);
            GPU_OFF;

            // Uploads, operation and download together.
            GPU_FULL_ON;
            dev_in.upload(host_in);
            dev_table.upload(host_table);
            ocl::LUT(dev_in, dev_table, dev_out);
            dev_out.download(ocl_out);
            GPU_FULL_OFF;

            TestSystem::instance().ExpectedMatNear(ocl_out, cpu_out, 0);
        }
    }
}
|
|
|
///////////// Exp //////////////////////// |
|
// Perf case for exp: CPU exp versus ocl::exp on square CV_32FC1 inputs
// generated with bounds (5, 16); results are compared with tolerance argument 2.
PERFTEST(Exp)
{
    Mat host_in, cpu_out, ocl_out;
    ocl::oclMat dev_in, dev_out;

    for (int side = Min_Size; side <= Max_Size; side *= Multiple)
    {
        SUBTEST << side << 'x' << side << "; CV_32FC1";

        gen(host_in, side, side, CV_32FC1, 5, 16);

        // One call outside the CPU_ON/CPU_OFF section.
        exp(host_in, cpu_out);

        CPU_ON;
        exp(host_in, cpu_out);
        CPU_OFF;

        dev_in.upload(host_in);

        WARMUP_ON;
        ocl::exp(dev_in, dev_out);
        WARMUP_OFF;

        // Operation only; the input was uploaded above.
        GPU_ON;
        ocl::exp(dev_in, dev_out);
        GPU_OFF;

        // Upload, operation and download together.
        GPU_FULL_ON;
        dev_in.upload(host_in);
        ocl::exp(dev_in, dev_out);
        dev_out.download(ocl_out);
        GPU_FULL_OFF;

        TestSystem::instance().ExpectedMatNear(ocl_out, cpu_out, 2);
    }
}
|
|
|
///////////// LOG //////////////////////// |
|
// Perf case for log: CPU log versus ocl::log on square CV_32F inputs
// generated with bounds (1, 10); results are compared with tolerance argument 1.
PERFTEST(Log)
{
    Mat host_in, cpu_out, ocl_out;
    ocl::oclMat dev_in, dev_out;

    for (int side = Min_Size; side <= Max_Size; side *= Multiple)
    {
        SUBTEST << side << 'x' << side << "; 32F";

        gen(host_in, side, side, CV_32F, 1, 10);

        // One call outside the CPU_ON/CPU_OFF section.
        log(host_in, cpu_out);

        CPU_ON;
        log(host_in, cpu_out);
        CPU_OFF;

        dev_in.upload(host_in);

        WARMUP_ON;
        ocl::log(dev_in, dev_out);
        WARMUP_OFF;

        // Operation only; the input was uploaded above.
        GPU_ON;
        ocl::log(dev_in, dev_out);
        GPU_OFF;

        // Upload, operation and download together.
        GPU_FULL_ON;
        dev_in.upload(host_in);
        ocl::log(dev_in, dev_out);
        dev_out.download(ocl_out);
        GPU_FULL_OFF;

        TestSystem::instance().ExpectedMatNear(ocl_out, cpu_out, 1);
    }
}
|
|
|
///////////// Add //////////////////////// |
|
// Perf case for add: CPU add versus ocl::add on square CV_8UC1 and CV_32FC1
// operands; the downloaded OpenCL sum is compared with the CPU sum using a
// tolerance argument of 0.0.
PERFTEST(Add)
{
    Mat host_a, host_b, cpu_out, ocl_out;
    ocl::oclMat dev_a, dev_b, dev_out;

    const int types[] = {CV_8UC1, CV_32FC1};
    const std::string labels[] = {"CV_8UC1", "CV_32FC1"};
    const size_t type_count = sizeof(types) / sizeof(types[0]);

    for (int side = Min_Size; side <= Max_Size; side *= Multiple)
    {
        for (size_t t = 0; t < type_count; ++t)
        {
            SUBTEST << side << 'x' << side << "; " << labels[t];

            gen(host_a, side, side, types[t], 0, 1);
            gen(host_b, side, side, types[t], 0, 1);

            // One call outside the CPU_ON/CPU_OFF section.
            add(host_a, host_b, cpu_out);

            CPU_ON;
            add(host_a, host_b, cpu_out);
            CPU_OFF;

            dev_a.upload(host_a);
            dev_b.upload(host_b);

            WARMUP_ON;
            ocl::add(dev_a, dev_b, dev_out);
            WARMUP_OFF;

            // Operation only; operands were uploaded above.
            GPU_ON;
            ocl::add(dev_a, dev_b, dev_out);
            GPU_OFF;

            // Uploads, operation and download together.
            GPU_FULL_ON;
            dev_a.upload(host_a);
            dev_b.upload(host_b);
            ocl::add(dev_a, dev_b, dev_out);
            dev_out.download(ocl_out);
            GPU_FULL_OFF;

            TestSystem::instance().ExpectedMatNear(ocl_out, cpu_out, 0.0);
        }
    }
}
|
|
|
///////////// Mul //////////////////////// |
|
// Perf case for multiply: CPU multiply versus ocl::multiply on square CV_8UC1
// and CV_8UC4 operands; results are compared with a tolerance argument of 0.0.
PERFTEST(Mul)
{
    Mat host_a, host_b, cpu_out, ocl_out;
    ocl::oclMat dev_a, dev_b, dev_out;

    const int types[] = {CV_8UC1, CV_8UC4};
    const std::string labels[] = {"CV_8UC1", "CV_8UC4"};
    const size_t type_count = sizeof(types) / sizeof(types[0]);

    for (int side = Min_Size; side <= Max_Size; side *= Multiple)
    {
        for (size_t t = 0; t < type_count; ++t)
        {
            SUBTEST << side << 'x' << side << "; " << labels[t];

            gen(host_a, side, side, types[t], 0, 256);
            gen(host_b, side, side, types[t], 0, 256);

            // One call outside the CPU_ON/CPU_OFF section.
            multiply(host_a, host_b, cpu_out);

            CPU_ON;
            multiply(host_a, host_b, cpu_out);
            CPU_OFF;

            dev_a.upload(host_a);
            dev_b.upload(host_b);

            WARMUP_ON;
            ocl::multiply(dev_a, dev_b, dev_out);
            WARMUP_OFF;

            // Operation only; operands were uploaded above.
            GPU_ON;
            ocl::multiply(dev_a, dev_b, dev_out);
            GPU_OFF;

            // Uploads, operation and download together.
            GPU_FULL_ON;
            dev_a.upload(host_a);
            dev_b.upload(host_b);
            ocl::multiply(dev_a, dev_b, dev_out);
            dev_out.download(ocl_out);
            GPU_FULL_OFF;

            TestSystem::instance().ExpectedMatNear(ocl_out, cpu_out, 0.0);
        }
    }
}
|
|
|
///////////// Div //////////////////////// |
|
// Perf case for divide: CPU divide versus ocl::divide on square CV_8UC1 and
// CV_8UC4 operands; results are compared with a tolerance argument of 1.
PERFTEST(Div)
{
    Mat host_a, host_b, cpu_out, ocl_out;
    ocl::oclMat dev_a, dev_b, dev_out;

    const int types[] = {CV_8UC1, CV_8UC4};
    const std::string labels[] = {"CV_8UC1", "CV_8UC4"};
    const size_t type_count = sizeof(types) / sizeof(types[0]);

    for (int side = Min_Size; side <= Max_Size; side *= Multiple)
    {
        for (size_t t = 0; t < type_count; ++t)
        {
            SUBTEST << side << 'x' << side << "; " << labels[t];

            gen(host_a, side, side, types[t], 0, 256);
            gen(host_b, side, side, types[t], 0, 256);

            // One call outside the CPU_ON/CPU_OFF section.
            divide(host_a, host_b, cpu_out);

            CPU_ON;
            divide(host_a, host_b, cpu_out);
            CPU_OFF;

            dev_a.upload(host_a);
            dev_b.upload(host_b);

            WARMUP_ON;
            ocl::divide(dev_a, dev_b, dev_out);
            WARMUP_OFF;

            // Operation only; operands were uploaded above.
            GPU_ON;
            ocl::divide(dev_a, dev_b, dev_out);
            GPU_OFF;

            // Uploads, operation and download together.
            GPU_FULL_ON;
            dev_a.upload(host_a);
            dev_b.upload(host_b);
            ocl::divide(dev_a, dev_b, dev_out);
            dev_out.download(ocl_out);
            GPU_FULL_OFF;

            TestSystem::instance().ExpectedMatNear(ocl_out, cpu_out, 1);
        }
    }
}
|
|
|
///////////// Absdiff //////////////////////// |
|
// Perf case for absdiff: CPU absdiff versus ocl::absdiff on square CV_8UC1
// and CV_8UC4 operands; results are compared with a tolerance argument of 0.0.
PERFTEST(Absdiff)
{
    Mat host_a, host_b, cpu_out, ocl_out;
    ocl::oclMat dev_a, dev_b, dev_out;

    const int types[] = {CV_8UC1, CV_8UC4};
    const std::string labels[] = {"CV_8UC1", "CV_8UC4"};
    const size_t type_count = sizeof(types) / sizeof(types[0]);

    for (int side = Min_Size; side <= Max_Size; side *= Multiple)
    {
        for (size_t t = 0; t < type_count; ++t)
        {
            SUBTEST << side << 'x' << side << "; " << labels[t];

            gen(host_a, side, side, types[t], 0, 256);
            gen(host_b, side, side, types[t], 0, 256);
            // The CPU output matrix is generated too, before absdiff writes it.
            gen(cpu_out, side, side, types[t], 0, 256);

            // One call outside the CPU_ON/CPU_OFF section.
            absdiff(host_a, host_b, cpu_out);

            CPU_ON;
            absdiff(host_a, host_b, cpu_out);
            CPU_OFF;

            dev_a.upload(host_a);
            dev_b.upload(host_b);

            WARMUP_ON;
            ocl::absdiff(dev_a, dev_b, dev_out);
            WARMUP_OFF;

            // Operation only; operands were uploaded above.
            GPU_ON;
            ocl::absdiff(dev_a, dev_b, dev_out);
            GPU_OFF;

            // Uploads, operation and download together.
            GPU_FULL_ON;
            dev_a.upload(host_a);
            dev_b.upload(host_b);
            ocl::absdiff(dev_a, dev_b, dev_out);
            dev_out.download(ocl_out);
            GPU_FULL_OFF;

            TestSystem::instance().ExpectedMatNear(ocl_out, cpu_out, 0.0);
        }
    }
}
|
|
|
///////////// CartToPolar //////////////////////// |
|
// Perf case for cartToPolar: CPU cartToPolar versus ocl::cartToPolar on
// square CV_32FC1 inputs. Both outputs are compared with checkNorm and the
// case is marked accurate when the larger difference is at most 0.5.
PERFTEST(CartToPolar)
{
    Mat host_a, host_b, cpu_out0, cpu_out1, ocl_out0, ocl_out1;
    ocl::oclMat dev_a, dev_b, dev_out0, dev_out1;

    const int types[] = {CV_32FC1};
    const std::string labels[] = {"CV_32FC1"};
    const size_t type_count = sizeof(types) / sizeof(types[0]);

    for (int side = Min_Size; side <= Max_Size; side *= Multiple)
    {
        for (size_t t = 0; t < type_count; ++t)
        {
            SUBTEST << side << 'x' << side << "; " << labels[t];

            gen(host_a, side, side, types[t], 0, 256);
            gen(host_b, side, side, types[t], 0, 256);
            // Both CPU output matrices are generated as well before being written.
            gen(cpu_out0, side, side, types[t], 0, 256);
            gen(cpu_out1, side, side, types[t], 0, 256);

            // One call outside the CPU_ON/CPU_OFF section.
            cartToPolar(host_a, host_b, cpu_out0, cpu_out1, 1);

            CPU_ON;
            cartToPolar(host_a, host_b, cpu_out0, cpu_out1, 1);
            CPU_OFF;

            dev_a.upload(host_a);
            dev_b.upload(host_b);

            WARMUP_ON;
            ocl::cartToPolar(dev_a, dev_b, dev_out0, dev_out1, 1);
            WARMUP_OFF;

            // Operation only; inputs were uploaded above.
            GPU_ON;
            ocl::cartToPolar(dev_a, dev_b, dev_out0, dev_out1, 1);
            GPU_OFF;

            // Uploads, operation and both downloads together.
            GPU_FULL_ON;
            dev_a.upload(host_a);
            dev_b.upload(host_b);
            ocl::cartToPolar(dev_a, dev_b, dev_out0, dev_out1, 1);
            dev_out0.download(ocl_out0);
            dev_out1.download(ocl_out1);
            GPU_FULL_OFF;

            const double second_diff = checkNorm(ocl_out1, cpu_out1);
            const double first_diff = checkNorm(ocl_out0, cpu_out0);
            const double worst_diff = max(second_diff, first_diff);
            const int accurate = (worst_diff <= .5) ? 1 : 0;
            TestSystem::instance().setAccurate(accurate, worst_diff);
        }
    }
}
|
|
|
///////////// PolarToCart //////////////////////// |
|
// Perf case for polarToCart: CPU polarToCart versus ocl::polarToCart on
// square CV_32FC1 inputs. Both outputs are compared with checkNorm and the
// case is marked accurate when the larger difference is at most 0.5.
PERFTEST(PolarToCart)
{
    Mat host_a, host_b, cpu_out0, cpu_out1, ocl_out0, ocl_out1;
    ocl::oclMat dev_a, dev_b, dev_out0, dev_out1;

    const int types[] = {CV_32FC1};
    const std::string labels[] = {"CV_32FC1"};
    const size_t type_count = sizeof(types) / sizeof(types[0]);

    for (int side = Min_Size; side <= Max_Size; side *= Multiple)
    {
        for (size_t t = 0; t < type_count; ++t)
        {
            SUBTEST << side << 'x' << side << "; " << labels[t];

            gen(host_a, side, side, types[t], 0, 256);
            gen(host_b, side, side, types[t], 0, 256);
            // Both CPU output matrices are generated as well before being written.
            gen(cpu_out0, side, side, types[t], 0, 256);
            gen(cpu_out1, side, side, types[t], 0, 256);

            // One call outside the CPU_ON/CPU_OFF section.
            polarToCart(host_a, host_b, cpu_out0, cpu_out1, 1);

            CPU_ON;
            polarToCart(host_a, host_b, cpu_out0, cpu_out1, 1);
            CPU_OFF;

            dev_a.upload(host_a);
            dev_b.upload(host_b);

            WARMUP_ON;
            ocl::polarToCart(dev_a, dev_b, dev_out0, dev_out1, 1);
            WARMUP_OFF;

            // Operation only; inputs were uploaded above.
            GPU_ON;
            ocl::polarToCart(dev_a, dev_b, dev_out0, dev_out1, 1);
            GPU_OFF;

            // Uploads, operation and both downloads together.
            GPU_FULL_ON;
            dev_a.upload(host_a);
            dev_b.upload(host_b);
            ocl::polarToCart(dev_a, dev_b, dev_out0, dev_out1, 1);
            dev_out0.download(ocl_out0);
            dev_out1.download(ocl_out1);
            GPU_FULL_OFF;

            const double second_diff = checkNorm(ocl_out1, cpu_out1);
            const double first_diff = checkNorm(ocl_out0, cpu_out0);
            const double worst_diff = max(second_diff, first_diff);
            const int accurate = (worst_diff <= .5) ? 1 : 0;
            TestSystem::instance().setAccurate(accurate, worst_diff);
        }
    }
}
|
|
|
///////////// Magnitude //////////////////////// |
|
// Perf case for magnitude: CPU magnitude versus ocl::magnitude on square
// CV_32FC1 inputs; results are compared with a tolerance argument of 1e-5.
PERFTEST(magnitude)
{
    Mat host_a, host_b, cpu_out, ocl_out;
    ocl::oclMat dev_a, dev_b, dev_out;

    const int types[] = {CV_32FC1};
    const std::string labels[] = {"CV_32FC1"};
    const size_t type_count = sizeof(types) / sizeof(types[0]);

    for (int side = Min_Size; side <= Max_Size; side *= Multiple)
    {
        for (size_t t = 0; t < type_count; ++t)
        {
            SUBTEST << side << 'x' << side << "; " << labels[t];

            gen(host_a, side, side, types[t], 0, 1);
            gen(host_b, side, side, types[t], 0, 1);

            // One call outside the CPU_ON/CPU_OFF section.
            magnitude(host_a, host_b, cpu_out);

            CPU_ON;
            magnitude(host_a, host_b, cpu_out);
            CPU_OFF;

            dev_a.upload(host_a);
            dev_b.upload(host_b);

            WARMUP_ON;
            ocl::magnitude(dev_a, dev_b, dev_out);
            WARMUP_OFF;

            // Operation only; inputs were uploaded above.
            GPU_ON;
            ocl::magnitude(dev_a, dev_b, dev_out);
            GPU_OFF;

            // Uploads, operation and download together.
            GPU_FULL_ON;
            dev_a.upload(host_a);
            dev_b.upload(host_b);
            ocl::magnitude(dev_a, dev_b, dev_out);
            dev_out.download(ocl_out);
            GPU_FULL_OFF;

            TestSystem::instance().ExpectedMatNear(ocl_out, cpu_out, 1e-5);
        }
    }
}
|
|
|
///////////// Transpose //////////////////////// |
|
// Perf case for transpose: CPU transpose versus ocl::transpose on square
// CV_8UC1 and CV_8UC4 inputs; results are compared with a tolerance argument
// of 1e-5.
PERFTEST(Transpose)
{
    Mat host_in, cpu_out, ocl_out;
    ocl::oclMat dev_in, dev_out;

    const int types[] = {CV_8UC1, CV_8UC4};
    const std::string labels[] = {"CV_8UC1", "CV_8UC4"};
    const size_t type_count = sizeof(types) / sizeof(types[0]);

    for (int side = Min_Size; side <= Max_Size; side *= Multiple)
    {
        for (size_t t = 0; t < type_count; ++t)
        {
            SUBTEST << side << 'x' << side << "; " << labels[t];

            gen(host_in, side, side, types[t], 0, 256);
            // The CPU output matrix is generated too, before transpose writes it.
            gen(cpu_out, side, side, types[t], 0, 256);

            // One call outside the CPU_ON/CPU_OFF section.
            transpose(host_in, cpu_out);

            CPU_ON;
            transpose(host_in, cpu_out);
            CPU_OFF;

            dev_in.upload(host_in);

            WARMUP_ON;
            ocl::transpose(dev_in, dev_out);
            WARMUP_OFF;

            // Operation only; the input was uploaded above.
            GPU_ON;
            ocl::transpose(dev_in, dev_out);
            GPU_OFF;

            // Upload, operation and download together.
            GPU_FULL_ON;
            dev_in.upload(host_in);
            ocl::transpose(dev_in, dev_out);
            dev_out.download(ocl_out);
            GPU_FULL_OFF;

            TestSystem::instance().ExpectedMatNear(ocl_out, cpu_out, 1e-5);
        }
    }
}
|
|
|
///////////// Flip //////////////////////// |
|
// Perf case for flip: CPU flip versus ocl::flip, both called with flip code 0,
// on square CV_8UC1 and CV_8UC4 inputs; results are compared with a tolerance
// argument of 1e-5.
PERFTEST(Flip)
{
    Mat host_in, cpu_out, ocl_out;
    ocl::oclMat dev_in, dev_out;

    const int types[] = {CV_8UC1, CV_8UC4};
    const std::string labels[] = {"CV_8UC1", "CV_8UC4"};
    const size_t type_count = sizeof(types) / sizeof(types[0]);

    for (int side = Min_Size; side <= Max_Size; side *= Multiple)
    {
        for (size_t t = 0; t < type_count; ++t)
        {
            // NOTE(review): the subtest label says FLIP_BOTH while every call
            // below passes flip code 0 - confirm which of the two is intended.
            SUBTEST << side << 'x' << side << "; " << labels[t] << " ; FLIP_BOTH";

            gen(host_in, side, side, types[t], 0, 256);
            // The CPU output matrix is generated too, before flip writes it.
            gen(cpu_out, side, side, types[t], 0, 256);

            // One call outside the CPU_ON/CPU_OFF section.
            flip(host_in, cpu_out, 0);

            CPU_ON;
            flip(host_in, cpu_out, 0);
            CPU_OFF;

            dev_in.upload(host_in);

            WARMUP_ON;
            ocl::flip(dev_in, dev_out, 0);
            WARMUP_OFF;

            // Operation only; the input was uploaded above.
            GPU_ON;
            ocl::flip(dev_in, dev_out, 0);
            GPU_OFF;

            // Upload, operation and download together.
            GPU_FULL_ON;
            dev_in.upload(host_in);
            ocl::flip(dev_in, dev_out, 0);
            dev_out.download(ocl_out);
            GPU_FULL_OFF;

            TestSystem::instance().ExpectedMatNear(ocl_out, cpu_out, 1e-5);
        }
    }
}
|
|
|
///////////// minMax //////////////////////// |
|
// Perf case for minMax: CPU minMaxLoc versus ocl::minMax on square CV_8UC1
// and CV_32FC1 inputs. Accuracy is decided right after the warm-up call by
// comparing the OpenCL extrema with the CPU extrema via EeceptDoubleEQ.
PERFTEST(minMax)
{
    Mat host_in;
    ocl::oclMat dev_in;

    double cpu_min = 0.0, cpu_max = 0.0;
    double ocl_min = 0.0, ocl_max = 0.0;
    Point cpu_min_at, cpu_max_at;

    const int types[] = {CV_8UC1, CV_32FC1};
    const std::string labels[] = {"CV_8UC1", "CV_32FC1"};
    const size_t type_count = sizeof(types) / sizeof(types[0]);

    for (int side = Min_Size; side <= Max_Size; side *= Multiple)
    {
        for (size_t t = 0; t < type_count; ++t)
        {
            SUBTEST << side << 'x' << side << "; " << labels[t];

            gen(host_in, side, side, types[t], 0, 256);

            CPU_ON;
            minMaxLoc(host_in, &cpu_min, &cpu_max, &cpu_min_at, &cpu_max_at);
            CPU_OFF;

            dev_in.upload(host_in);

            WARMUP_ON;
            ocl::minMax(dev_in, &ocl_min, &ocl_max);
            WARMUP_OFF;

            // The reported error is the larger absolute gap in either branch;
            // only the accuracy flag depends on the equality helper.
            const bool extrema_agree = EeceptDoubleEQ<double>(ocl_max, cpu_max)
                                       && EeceptDoubleEQ<double>(ocl_min, cpu_min);
            const double worst_gap = max(fabs(ocl_max - cpu_max), fabs(ocl_min - cpu_min));
            TestSystem::instance().setAccurate(extrema_agree ? 1 : 0, worst_gap);

            // From here on the outputs are not checked; the CPU variables are
            // simply reused as destinations.
            GPU_ON;
            ocl::minMax(dev_in, &cpu_min, &cpu_max);
            GPU_OFF;

            GPU_FULL_ON;
            dev_in.upload(host_in);
            ocl::minMax(dev_in, &cpu_min, &cpu_max);
            GPU_FULL_OFF;
        }
    }
}
|
|
|
///////////// minMaxLoc //////////////////////// |
|
PERFTEST(minMaxLoc) |
|
{ |
|
Mat src; |
|
ocl::oclMat d_src; |
|
|
|
double min_val = 0.0, max_val = 0.0; |
|
double min_val_ = 0.0, max_val_ = 0.0; |
|
Point min_loc, max_loc; |
|
Point min_loc_, max_loc_; |
|
int all_type[] = {CV_8UC1, CV_32FC1}; |
|
std::string type_name[] = {"CV_8UC1", "CV_32FC1"}; |
|
|
|
for (int size = Min_Size; size <= Max_Size; size *= Multiple) |
|
{ |
|
for (size_t j = 0; j < sizeof(all_type) / sizeof(int); j++) |
|
{ |
|
SUBTEST << size << 'x' << size << "; " << type_name[j] ; |
|
|
|
gen(src, size, size, all_type[j], 0, 1); |
|
|
|
CPU_ON; |
|
minMaxLoc(src, &min_val, &max_val, &min_loc, &max_loc); |
|
CPU_OFF; |
|
d_src.upload(src); |
|
|
|
WARMUP_ON; |
|
ocl::minMaxLoc(d_src, &min_val_, &max_val_, &min_loc_, &max_loc_); |
|
WARMUP_OFF; |
|
|
|
double error0 = 0., error1 = 0., minlocVal = 0., minlocVal_ = 0., maxlocVal = 0., maxlocVal_ = 0.; |
|
if(src.depth() == 0) |
|
{ |
|
minlocVal = src.at<unsigned char>(min_loc); |
|
minlocVal_ = src.at<unsigned char>(min_loc_); |
|
maxlocVal = src.at<unsigned char>(max_loc); |
|
maxlocVal_ = src.at<unsigned char>(max_loc_); |
|
} |
|
if(src.depth() == 1) |
|
{ |
|
minlocVal = src.at<signed char>(min_loc); |
|
minlocVal_ = src.at<signed char>(min_loc_); |
|
maxlocVal = src.at<signed char>(max_loc); |
|
maxlocVal_ = src.at<signed char>(max_loc_); |
|
} |
|
if(src.depth() == 2) |
|
{ |
|
minlocVal = src.at<unsigned short>(min_loc); |
|
minlocVal_ = src.at<unsigned short>(min_loc_); |
|
maxlocVal = src.at<unsigned short>(max_loc); |
|
maxlocVal_ = src.at<unsigned short>(max_loc_); |
|
} |
|
if(src.depth() == 3) |
|
{ |
|
minlocVal = src.at<signed short>(min_loc); |
|
minlocVal_ = src.at<signed short>(min_loc_); |
|
maxlocVal = src.at<signed short>(max_loc); |
|
maxlocVal_ = src.at<signed short>(max_loc_); |
|
} |
|
if(src.depth() == 4) |
|
{ |
|
minlocVal = src.at<int>(min_loc); |
|
minlocVal_ = src.at<int>(min_loc_); |
|
maxlocVal = src.at<int>(max_loc); |
|
maxlocVal_ = src.at<int>(max_loc_); |
|
} |
|
if(src.depth() == 5) |
|
{ |
|
minlocVal = src.at<float>(min_loc); |
|
minlocVal_ = src.at<float>(min_loc_); |
|
maxlocVal = src.at<float>(max_loc); |
|
maxlocVal_ = src.at<float>(max_loc_); |
|
} |
|
if(src.depth() == 6) |
|
{ |
|
minlocVal = src.at<double>(min_loc); |
|
minlocVal_ = src.at<double>(min_loc_); |
|
maxlocVal = src.at<double>(max_loc); |
|
maxlocVal_ = src.at<double>(max_loc_); |
|
} |
|
error0 = ::abs(minlocVal_ - minlocVal); |
|
error1 = ::abs(maxlocVal_ - maxlocVal); |
|
if( EeceptDoubleEQ<double>(maxlocVal_, maxlocVal) |
|
&&EeceptDoubleEQ<double>(minlocVal_, minlocVal) |
|
&&EeceptDoubleEQ<double>(max_val_, max_val) |
|
&&EeceptDoubleEQ<double>(min_val_, min_val)) |
|
TestSystem::instance().setAccurate(1, 0.); |
|
else |
|
TestSystem::instance().setAccurate(0, max(error0, error1)); |
|
|
|
GPU_ON; |
|
ocl::minMaxLoc(d_src, &min_val, &max_val, &min_loc, &max_loc); |
|
GPU_OFF; |
|
|
|
GPU_FULL_ON; |
|
d_src.upload(src); |
|
ocl::minMaxLoc(d_src, &min_val, &max_val, &min_loc, &max_loc); |
|
GPU_FULL_OFF; |
|
} |
|
|
|
} |
|
} |
|
|
|
///////////// Sum //////////////////////// |
|
// Perf case for sum: CPU sum versus ocl::sum on square CV_8UC1 and CV_32SC1
// inputs. Accuracy is decided right after the warm-up call: the largest
// absolute per-component difference of the two Scalars must be below 0.1.
PERFTEST(Sum)
{
    Mat host_in;
    Scalar cpu_total, ocl_total;
    ocl::oclMat dev_in;

    const int types[] = {CV_8UC1, CV_32SC1};
    const std::string labels[] = {"CV_8UC1", "CV_32SC1"};
    const size_t type_count = sizeof(types) / sizeof(types[0]);

    for (int side = Min_Size; side <= Max_Size; side *= Multiple)
    {
        for (size_t t = 0; t < type_count; ++t)
        {
            SUBTEST << side << 'x' << side << "; " << labels[t];

            gen(host_in, side, side, types[t], 0, 60);

            // One call outside the CPU_ON/CPU_OFF section.
            cpu_total = sum(host_in);

            CPU_ON;
            cpu_total = sum(host_in);
            CPU_OFF;

            dev_in.upload(host_in);

            WARMUP_ON;
            ocl_total = ocl::sum(dev_in);
            WARMUP_OFF;

            // Running maximum over the four Scalar components.
            double max_diff = fabs(cpu_total[0] - ocl_total[0]);
            for (int c = 1; c < 4; ++c)
            {
                const double component_diff = fabs(cpu_total[c] - ocl_total[c]);
                if (max_diff < component_diff)
                    max_diff = component_diff;
            }
            TestSystem::instance().setAccurate(max_diff < 0.1 ? 1 : 0, max_diff);

            // Operation only; the input was uploaded above.
            GPU_ON;
            ocl_total = ocl::sum(dev_in);
            GPU_OFF;

            // Upload and operation together.
            GPU_FULL_ON;
            dev_in.upload(host_in);
            ocl_total = ocl::sum(dev_in);
            GPU_FULL_OFF;
        }
    }
}
|
|
|
///////////// countNonZero //////////////////////// |
|
// Perf case for countNonZero: CPU countNonZero versus ocl::countNonZero on
// square CV_8UC1 and CV_32FC1 inputs. Accuracy is decided right after the
// warm-up call: the two counts must be equal.
PERFTEST(countNonZero)
{
    Mat host_in;
    ocl::oclMat dev_in;

    const int types[] = {CV_8UC1, CV_32FC1};
    const std::string labels[] = {"CV_8UC1", "CV_32FC1"};
    const size_t type_count = sizeof(types) / sizeof(types[0]);

    for (int side = Min_Size; side <= Max_Size; side *= Multiple)
    {
        for (size_t t = 0; t < type_count; ++t)
        {
            SUBTEST << side << 'x' << side << "; " << labels[t];

            gen(host_in, side, side, types[t], 0, 256);

            // One call outside the CPU_ON/CPU_OFF section; its result is unused.
            countNonZero(host_in);

            int cpu_count = 0;
            int ocl_count = 0;

            CPU_ON;
            cpu_count = countNonZero(host_in);
            CPU_OFF;

            dev_in.upload(host_in);

            WARMUP_ON;
            ocl_count = ocl::countNonZero(dev_in);
            WARMUP_OFF;

            // The reported error is the count gap, which is 0 when accurate.
            const int count_gap = abs(cpu_count - ocl_count);
            TestSystem::instance().setAccurate(count_gap == 0 ? 1 : 0, count_gap);

            // Operation only; the input was uploaded above. Results are dropped.
            GPU_ON;
            ocl::countNonZero(dev_in);
            GPU_OFF;

            // Upload and operation together.
            GPU_FULL_ON;
            dev_in.upload(host_in);
            ocl::countNonZero(dev_in);
            GPU_FULL_OFF;
        }
    }
}
|
|
|
///////////// Phase //////////////////////// |
|
// Perf case for phase: CPU phase versus ocl::phase (both with last argument 1)
// on square CV_32FC1 inputs; results are compared with a tolerance argument
// of 1e-2.
PERFTEST(Phase)
{
    Mat host_a, host_b, cpu_out, ocl_out;
    ocl::oclMat dev_a, dev_b, dev_out;

    const int types[] = {CV_32FC1};
    const std::string labels[] = {"CV_32FC1"};
    const size_t type_count = sizeof(types) / sizeof(types[0]);

    for (int side = Min_Size; side <= Max_Size; side *= Multiple)
    {
        for (size_t t = 0; t < type_count; ++t)
        {
            SUBTEST << side << 'x' << side << "; " << labels[t];

            gen(host_a, side, side, types[t], 0, 256);
            gen(host_b, side, side, types[t], 0, 256);
            // The CPU output matrix is generated too, before phase writes it.
            gen(cpu_out, side, side, types[t], 0, 256);

            // One call outside the CPU_ON/CPU_OFF section.
            phase(host_a, host_b, cpu_out, 1);

            CPU_ON;
            phase(host_a, host_b, cpu_out, 1);
            CPU_OFF;

            dev_a.upload(host_a);
            dev_b.upload(host_b);

            WARMUP_ON;
            ocl::phase(dev_a, dev_b, dev_out, 1);
            WARMUP_OFF;

            // Operation only; inputs were uploaded above.
            GPU_ON;
            ocl::phase(dev_a, dev_b, dev_out, 1);
            GPU_OFF;

            // Uploads, operation and download together.
            GPU_FULL_ON;
            dev_a.upload(host_a);
            dev_b.upload(host_b);
            ocl::phase(dev_a, dev_b, dev_out, 1);
            dev_out.download(ocl_out);
            GPU_FULL_OFF;

            TestSystem::instance().ExpectedMatNear(ocl_out, cpu_out, 1e-2);
        }
    }
}
|
|
|
///////////// bitwise_and//////////////////////// |
|
// Perf case for bitwise_and: CPU bitwise_and versus ocl::bitwise_and on
// square CV_8UC1 and CV_32SC1 operands; results are compared with a tolerance
// argument of 0.0.
PERFTEST(bitwise_and)
{
    Mat host_a, host_b, cpu_out, ocl_out;
    ocl::oclMat dev_a, dev_b, dev_out;

    const int types[] = {CV_8UC1, CV_32SC1};
    const std::string labels[] = {"CV_8UC1", "CV_32SC1"};
    const size_t type_count = sizeof(types) / sizeof(types[0]);

    for (int side = Min_Size; side <= Max_Size; side *= Multiple)
    {
        for (size_t t = 0; t < type_count; ++t)
        {
            SUBTEST << side << 'x' << side << "; " << labels[t];

            gen(host_a, side, side, types[t], 0, 256);
            gen(host_b, side, side, types[t], 0, 256);
            // The CPU output matrix is generated too, before it is overwritten.
            gen(cpu_out, side, side, types[t], 0, 256);

            // One call outside the CPU_ON/CPU_OFF section.
            bitwise_and(host_a, host_b, cpu_out);

            CPU_ON;
            bitwise_and(host_a, host_b, cpu_out);
            CPU_OFF;

            dev_a.upload(host_a);
            dev_b.upload(host_b);

            WARMUP_ON;
            ocl::bitwise_and(dev_a, dev_b, dev_out);
            WARMUP_OFF;

            // Operation only; operands were uploaded above.
            GPU_ON;
            ocl::bitwise_and(dev_a, dev_b, dev_out);
            GPU_OFF;

            // Uploads, operation and download together.
            GPU_FULL_ON;
            dev_a.upload(host_a);
            dev_b.upload(host_b);
            ocl::bitwise_and(dev_a, dev_b, dev_out);
            dev_out.download(ocl_out);
            GPU_FULL_OFF;

            TestSystem::instance().ExpectedMatNear(ocl_out, cpu_out, 0.0);
        }
    }
}
|
|
|
///////////// bitwise_not//////////////////////// |
|
// Perf case for bitwise_not: CPU bitwise_not versus ocl::bitwise_not on
// square CV_8UC1 and CV_32SC1 inputs; results are compared with a tolerance
// argument of 0.0.
PERFTEST(bitwise_not)
{
    Mat host_in, cpu_out, ocl_out;
    ocl::oclMat dev_in, dev_out;

    const int types[] = {CV_8UC1, CV_32SC1};
    const std::string labels[] = {"CV_8UC1", "CV_32SC1"};
    const size_t type_count = sizeof(types) / sizeof(types[0]);

    for (int side = Min_Size; side <= Max_Size; side *= Multiple)
    {
        for (size_t t = 0; t < type_count; ++t)
        {
            SUBTEST << side << 'x' << side << "; " << labels[t];

            gen(host_in, side, side, types[t], 0, 256);
            // The CPU output matrix is generated too, before it is overwritten.
            gen(cpu_out, side, side, types[t], 0, 256);

            // One call outside the CPU_ON/CPU_OFF section.
            bitwise_not(host_in, cpu_out);

            CPU_ON;
            bitwise_not(host_in, cpu_out);
            CPU_OFF;

            dev_in.upload(host_in);

            WARMUP_ON;
            ocl::bitwise_not(dev_in, dev_out);
            WARMUP_OFF;

            // Operation only; the input was uploaded above.
            GPU_ON;
            ocl::bitwise_not(dev_in, dev_out);
            GPU_OFF;

            // Upload, operation and download together.
            GPU_FULL_ON;
            dev_in.upload(host_in);
            ocl::bitwise_not(dev_in, dev_out);
            dev_out.download(ocl_out);
            GPU_FULL_OFF;

            TestSystem::instance().ExpectedMatNear(ocl_out, cpu_out, 0.0);
        }
    }
}
|
|
|
///////////// compare//////////////////////// |
|
// Perf case for compare: CPU compare versus ocl::compare, both called with
// the local comparison code CMP_EQ (0), on square CV_8UC1 and CV_32FC1
// operands; results are compared with a tolerance argument of 0.0.
PERFTEST(compare)
{
    Mat host_a, host_b, cpu_out, ocl_out;
    ocl::oclMat dev_a, dev_b, dev_out;

    // Local definition of the comparison code used by every call below.
    int CMP_EQ = 0;

    const int types[] = {CV_8UC1, CV_32FC1};
    const std::string labels[] = {"CV_8UC1", "CV_32FC1"};
    const size_t type_count = sizeof(types) / sizeof(types[0]);

    for (int side = Min_Size; side <= Max_Size; side *= Multiple)
    {
        for (size_t t = 0; t < type_count; ++t)
        {
            SUBTEST << side << 'x' << side << "; " << labels[t];

            gen(host_a, side, side, types[t], 0, 256);
            gen(host_b, side, side, types[t], 0, 256);
            // The CPU output matrix is generated too, before it is overwritten.
            gen(cpu_out, side, side, types[t], 0, 256);

            // One call outside the CPU_ON/CPU_OFF section.
            compare(host_a, host_b, cpu_out, CMP_EQ);

            CPU_ON;
            compare(host_a, host_b, cpu_out, CMP_EQ);
            CPU_OFF;

            dev_a.upload(host_a);
            dev_b.upload(host_b);

            WARMUP_ON;
            ocl::compare(dev_a, dev_b, dev_out, CMP_EQ);
            WARMUP_OFF;

            // Operation only; operands were uploaded above.
            GPU_ON;
            ocl::compare(dev_a, dev_b, dev_out, CMP_EQ);
            GPU_OFF;

            // Uploads, operation and download together.
            GPU_FULL_ON;
            dev_a.upload(host_a);
            dev_b.upload(host_b);
            ocl::compare(dev_a, dev_b, dev_out, CMP_EQ);
            dev_out.download(ocl_out);
            GPU_FULL_OFF;

            TestSystem::instance().ExpectedMatNear(ocl_out, cpu_out, 0.0);
        }
    }
}
|
|
|
///////////// pow //////////////////////// |
|
// Perf case for pow: CPU pow versus ocl::pow, both with exponent -2.0, on
// square CV_32FC1 inputs generated with bounds (5, 16); results are compared
// with a tolerance argument of 1.0.
PERFTEST(pow)
{
    Mat host_in, cpu_out, ocl_out;
    ocl::oclMat dev_in, dev_out;

    const int types[] = {CV_32FC1};
    const std::string labels[] = {"CV_32FC1"};
    const size_t type_count = sizeof(types) / sizeof(types[0]);

    for (int side = Min_Size; side <= Max_Size; side *= Multiple)
    {
        for (size_t t = 0; t < type_count; ++t)
        {
            SUBTEST << side << 'x' << side << "; " << labels[t];

            gen(host_in, side, side, types[t], 5, 16);

            // One call outside the CPU_ON/CPU_OFF section.
            pow(host_in, -2.0, cpu_out);

            CPU_ON;
            pow(host_in, -2.0, cpu_out);
            CPU_OFF;

            dev_in.upload(host_in);
            // NOTE(review): the CPU result is uploaded into the device output
            // here even though ocl::pow writes that matrix below - confirm
            // whether this upload is needed.
            dev_out.upload(cpu_out);

            WARMUP_ON;
            ocl::pow(dev_in, -2.0, dev_out);
            WARMUP_OFF;

            // Operation only; the input was uploaded above.
            GPU_ON;
            ocl::pow(dev_in, -2.0, dev_out);
            GPU_OFF;

            // Upload, operation and download together.
            GPU_FULL_ON;
            dev_in.upload(host_in);
            ocl::pow(dev_in, -2.0, dev_out);
            dev_out.download(ocl_out);
            GPU_FULL_OFF;

            TestSystem::instance().ExpectedMatNear(ocl_out, cpu_out, 1.0);
        }
    }
}
|
|
|
///////////// MagnitudeSqr//////////////////////// |
|
// Perf case for magnitudeSqr: a hand-written CPU loop computing
// a*a + b*b per element versus ocl::magnitudeSqr on square CV_32FC1 inputs;
// results are compared with a tolerance argument of 1.0.
PERFTEST(MagnitudeSqr)
{
    Mat src1, src2, dst, ocl_dst;
    ocl::oclMat d_src1, d_src2, d_dst;

    const int all_type[] = {CV_32FC1};
    const std::string type_name[] = {"CV_32FC1"};
    const size_t type_count = sizeof(all_type) / sizeof(all_type[0]);

    for (int size = Min_Size; size <= Max_Size; size *= Multiple)
    {
        for (size_t t = 0; t < type_count; t++)
        {
            SUBTEST << size << 'x' << size << "; " << type_name[t];

            gen(src1, size, size, all_type[t], 0, 256);
            gen(src2, size, size, all_type[t], 0, 256);
            // dst is generated here so that it exists with the right size and
            // type before the loop below writes into it element by element.
            gen(dst, size, size, all_type[t], 0, 256);

            // The CPU reference has no library call here; it is computed by hand.
            CPU_ON;
            for (int i = 0; i < src1.rows; ++i)
                for (int j = 0; j < src1.cols; ++j)
                {
                    float val1 = src1.at<float>(i, j);
                    float val2 = src2.at<float>(i, j);
                    // Typed element access instead of a C-style cast with a
                    // hard-coded "step / 4" element stride.
                    dst.at<float>(i, j) = val1 * val1 + val2 * val2;
                }
            CPU_OFF;

            d_src1.upload(src1);
            d_src2.upload(src2);

            WARMUP_ON;
            ocl::magnitudeSqr(d_src1, d_src2, d_dst);
            WARMUP_OFF;

            // Operation only; inputs were uploaded above.
            GPU_ON;
            ocl::magnitudeSqr(d_src1, d_src2, d_dst);
            GPU_OFF;

            // Uploads, operation and download together.
            GPU_FULL_ON;
            d_src1.upload(src1);
            d_src2.upload(src2);
            ocl::magnitudeSqr(d_src1, d_src2, d_dst);
            d_dst.download(ocl_dst);
            GPU_FULL_OFF;

            TestSystem::instance().ExpectedMatNear(ocl_dst, dst, 1.0);
        }
    }
}
|
|
|
///////////// AddWeighted//////////////////////// |
|
// Perf case for addWeighted: CPU addWeighted versus ocl::addWeighted, called
// with the scalar arguments 2.0, 1.0 and 3.0, on square CV_8UC1 and CV_32FC1
// operands; results are compared with a tolerance argument of 1e-5.
PERFTEST(AddWeighted)
{
    Mat host_a, host_b, cpu_out, ocl_out;
    ocl::oclMat dev_a, dev_b, dev_out;

    double alpha = 2.0;
    double beta = 1.0;
    double gamma_val = 3.0;

    const int types[] = {CV_8UC1, CV_32FC1};
    const std::string labels[] = {"CV_8UC1", "CV_32FC1"};
    const size_t type_count = sizeof(types) / sizeof(types[0]);

    for (int side = Min_Size; side <= Max_Size; side *= Multiple)
    {
        for (size_t t = 0; t < type_count; ++t)
        {
            SUBTEST << side << 'x' << side << "; " << labels[t];

            gen(host_a, side, side, types[t], 0, 256);
            gen(host_b, side, side, types[t], 0, 256);
            // The CPU output matrix is generated too, before it is overwritten.
            gen(cpu_out, side, side, types[t], 0, 256);

            // One call outside the CPU_ON/CPU_OFF section.
            addWeighted(host_a, alpha, host_b, beta, gamma_val, cpu_out);

            CPU_ON;
            addWeighted(host_a, alpha, host_b, beta, gamma_val, cpu_out);
            CPU_OFF;

            dev_a.upload(host_a);
            dev_b.upload(host_b);

            WARMUP_ON;
            ocl::addWeighted(dev_a, alpha, dev_b, beta, gamma_val, dev_out);
            WARMUP_OFF;

            // Operation only; operands were uploaded above.
            GPU_ON;
            ocl::addWeighted(dev_a, alpha, dev_b, beta, gamma_val, dev_out);
            GPU_OFF;

            // Uploads, operation and download together.
            GPU_FULL_ON;
            dev_a.upload(host_a);
            dev_b.upload(host_b);
            ocl::addWeighted(dev_a, alpha, dev_b, beta, gamma_val, dev_out);
            dev_out.download(ocl_out);
            GPU_FULL_OFF;

            TestSystem::instance().ExpectedMatNear(ocl_out, cpu_out, 1e-5);
        }
    }
}