Merge pull request #1573 from alalek:perf_simple_strategy

pull/1622/merge
Andrey Pavlenko 11 years ago committed by OpenCV Buildbot
commit 97da1419e1
  1. 2
      modules/ocl/perf/main.cpp
  2. 14
      modules/ts/include/opencv2/ts/ts_perf.hpp
  3. 229
      modules/ts/src/ts_perf.cpp

@ -67,5 +67,7 @@ static const char * impls[] =
int main(int argc, char ** argv) int main(int argc, char ** argv)
{ {
::perf::TestBase::setPerformanceStrategy(::perf::PERF_STRATEGY_SIMPLE);
CV_PERF_TEST_MAIN_INTERNALS(ocl, impls, dumpOpenCLDevice()) CV_PERF_TEST_MAIN_INTERNALS(ocl, impls, dumpOpenCLDevice())
} }

@ -247,9 +247,20 @@ typedef struct CV_EXPORTS performance_metrics
}; };
performance_metrics(); performance_metrics();
void clear();
} performance_metrics; } performance_metrics;
/*****************************************************************************************\
* Strategy for performance measuring *
\*****************************************************************************************/
enum PERF_STRATEGY
{
PERF_STRATEGY_BASE = 0,
PERF_STRATEGY_SIMPLE = 1,
};
/*****************************************************************************************\ /*****************************************************************************************\
* Base fixture for performance tests * * Base fixture for performance tests *
\*****************************************************************************************/ \*****************************************************************************************/
@ -265,6 +276,9 @@ public:
static std::string getDataPath(const std::string& relativePath); static std::string getDataPath(const std::string& relativePath);
static std::string getSelectedImpl(); static std::string getSelectedImpl();
static enum PERF_STRATEGY getPerformanceStrategy();
static enum PERF_STRATEGY setPerformanceStrategy(enum PERF_STRATEGY strategy);
protected: protected:
virtual void PerfTestBody() = 0; virtual void PerfTestBody() = 0;

@ -18,6 +18,9 @@ int64 TestBase::_timeadjustment = 0;
static std::vector<std::string> available_impls; static std::vector<std::string> available_impls;
static std::string param_impl; static std::string param_impl;
static enum PERF_STRATEGY param_strategy = PERF_STRATEGY_BASE;
static double param_max_outliers; static double param_max_outliers;
static double param_max_deviation; static double param_max_deviation;
static unsigned int param_min_samples; static unsigned int param_min_samples;
@ -152,7 +155,7 @@ void Regression::init(const std::string& testSuitName, const std::string& ext)
{ {
if (!storageInPath.empty()) if (!storageInPath.empty())
{ {
LOGE("Subsequent initialisation of Regression utility is not allowed."); LOGE("Subsequent initialization of Regression utility is not allowed.");
return; return;
} }
@ -598,6 +601,11 @@ Regression& Regression::operator() (const std::string& name, cv::InputArray arra
* ::perf::performance_metrics * ::perf::performance_metrics
\*****************************************************************************************/ \*****************************************************************************************/
performance_metrics::performance_metrics() performance_metrics::performance_metrics()
{
clear();
}
void performance_metrics::clear()
{ {
bytesIn = 0; bytesIn = 0;
bytesOut = 0; bytesOut = 0;
@ -643,6 +651,7 @@ void TestBase::Init(const std::vector<std::string> & availableImpls,
"|the implementation variant of functions under test}" "|the implementation variant of functions under test}"
"{ |perf_list_impls |false |list available implementation variants and exit}" "{ |perf_list_impls |false |list available implementation variants and exit}"
"{ |perf_run_cpu |false |deprecated, equivalent to --perf_impl=plain}" "{ |perf_run_cpu |false |deprecated, equivalent to --perf_impl=plain}"
"{ |perf_strategy |default |specifies performance measuring strategy: default, base or simple (weak restrictions)}"
#ifdef ANDROID #ifdef ANDROID
"{ |perf_time_limit |6.0 |default time limit for a single test (in seconds)}" "{ |perf_time_limit |6.0 |default time limit for a single test (in seconds)}"
"{ |perf_affinity_mask |0 |set affinity mask for the main thread}" "{ |perf_affinity_mask |0 |set affinity mask for the main thread}"
@ -669,6 +678,24 @@ void TestBase::Init(const std::vector<std::string> & availableImpls,
::testing::AddGlobalTestEnvironment(new PerfEnvironment); ::testing::AddGlobalTestEnvironment(new PerfEnvironment);
param_impl = args.get<bool>("perf_run_cpu") ? "plain" : args.get<std::string>("perf_impl"); param_impl = args.get<bool>("perf_run_cpu") ? "plain" : args.get<std::string>("perf_impl");
std::string perf_strategy = args.get<std::string>("perf_strategy");
if (perf_strategy == "default")
{
// nothing
}
else if (perf_strategy == "base")
{
param_strategy = PERF_STRATEGY_BASE;
}
else if (perf_strategy == "simple")
{
param_strategy = PERF_STRATEGY_SIMPLE;
}
else
{
printf("No such strategy: %s\n", perf_strategy.c_str());
exit(1);
}
param_max_outliers = std::min(100., std::max(0., args.get<double>("perf_max_outliers"))); param_max_outliers = std::min(100., std::max(0., args.get<double>("perf_max_outliers")));
param_min_samples = std::max(1u, args.get<unsigned int>("perf_min_samples")); param_min_samples = std::max(1u, args.get<unsigned int>("perf_min_samples"));
param_max_deviation = std::max(0., args.get<double>("perf_max_deviation")); param_max_deviation = std::max(0., args.get<double>("perf_max_deviation"));
@ -762,6 +789,18 @@ std::string TestBase::getSelectedImpl()
return param_impl; return param_impl;
} }
enum PERF_STRATEGY TestBase::getPerformanceStrategy()
{
return param_strategy;
}
enum PERF_STRATEGY TestBase::setPerformanceStrategy(enum PERF_STRATEGY strategy)
{
enum PERF_STRATEGY ret = param_strategy;
param_strategy = strategy;
return ret;
}
int64 TestBase::_calibrate() int64 TestBase::_calibrate()
{ {
@ -792,6 +831,11 @@ int64 TestBase::_calibrate()
_helper h; _helper h;
h.PerfTestBody(); h.PerfTestBody();
double compensation = h.getMetrics().min; double compensation = h.getMetrics().min;
if (param_strategy == PERF_STRATEGY_SIMPLE)
{
CV_Assert(compensation < 0.01 * cv::getTickFrequency());
compensation = 0.0f; // simple strategy doesn't require any compensation
}
LOGD("Time compensation is %.0f", compensation); LOGD("Time compensation is %.0f", compensation);
return (int64)compensation; return (int64)compensation;
} }
@ -855,8 +899,64 @@ cv::Size TestBase::getSize(cv::InputArray a)
bool TestBase::next() bool TestBase::next()
{ {
bool has_next = ++currentIter < nIters && totalTime < timeLimit; static int64 lastActivityPrintTime = 0;
if (currentIter != (unsigned int)-1)
{
if (currentIter + 1 != times.size())
ADD_FAILURE() << " next() is called before stopTimer()";
}
else
{
lastActivityPrintTime = 0;
metrics.clear();
}
cv::theRNG().state = param_seed; //this rng should generate same numbers for each run cv::theRNG().state = param_seed; //this rng should generate same numbers for each run
++currentIter;
bool has_next = false;
do {
assert(currentIter == times.size());
if (currentIter == 0)
{
has_next = true;
break;
}
if (param_strategy == PERF_STRATEGY_BASE)
{
has_next = currentIter < nIters && totalTime < timeLimit;
}
else
{
assert(param_strategy == PERF_STRATEGY_SIMPLE);
if (totalTime - lastActivityPrintTime >= cv::getTickFrequency() * 10)
{
std::cout << '.' << std::endl;
lastActivityPrintTime = totalTime;
}
if (currentIter >= nIters)
{
has_next = false;
break;
}
if (currentIter < param_min_samples)
{
has_next = true;
break;
}
calcMetrics();
double criteria = 0.03; // 3%
if (fabs(metrics.mean) > 1e-6)
has_next = metrics.stddev > criteria * fabs(metrics.mean);
else
has_next = true;
}
} while (false);
#ifdef ANDROID #ifdef ANDROID
if (log_power_checkpoints) if (log_power_checkpoints)
@ -869,6 +969,9 @@ bool TestBase::next()
if (!has_next) RecordProperty("test_complete", cv::format("%llu",t1).c_str()); if (!has_next) RecordProperty("test_complete", cv::format("%llu",t1).c_str());
} }
#endif #endif
if (has_next)
startTimer(); // really we should measure activity from this moment, so reset start time
return has_next; return has_next;
} }
@ -915,7 +1018,7 @@ void TestBase::stopTimer()
{ {
int64 time = cv::getTickCount(); int64 time = cv::getTickCount();
if (lastTime == 0) if (lastTime == 0)
ADD_FAILURE() << " stopTimer() is called before startTimer()"; ADD_FAILURE() << " stopTimer() is called before startTimer()/next()";
lastTime = time - lastTime; lastTime = time - lastTime;
totalTime += lastTime; totalTime += lastTime;
lastTime -= _timeadjustment; lastTime -= _timeadjustment;
@ -926,6 +1029,7 @@ void TestBase::stopTimer()
performance_metrics& TestBase::calcMetrics() performance_metrics& TestBase::calcMetrics()
{ {
CV_Assert(metrics.samples <= (unsigned int)currentIter);
if ((metrics.samples == (unsigned int)currentIter) || times.size() == 0) if ((metrics.samples == (unsigned int)currentIter) || times.size() == 0)
return metrics; return metrics;
@ -947,47 +1051,61 @@ performance_metrics& TestBase::calcMetrics()
std::sort(times.begin(), times.end()); std::sort(times.begin(), times.end());
//estimate mean and stddev for log(time) TimeVector::const_iterator start = times.begin();
double gmean = 0; TimeVector::const_iterator end = times.end();
double gstddev = 0;
int n = 0;
for(TimeVector::const_iterator i = times.begin(); i != times.end(); ++i)
{
double x = static_cast<double>(*i)/runsPerIteration;
if (x < DBL_EPSILON) continue;
double lx = log(x);
++n; if (param_strategy == PERF_STRATEGY_BASE)
double delta = lx - gmean; {
gmean += delta / n; //estimate mean and stddev for log(time)
gstddev += delta * (lx - gmean); double gmean = 0;
} double gstddev = 0;
int n = 0;
for(TimeVector::const_iterator i = times.begin(); i != times.end(); ++i)
{
double x = static_cast<double>(*i)/runsPerIteration;
if (x < DBL_EPSILON) continue;
double lx = log(x);
gstddev = n > 1 ? sqrt(gstddev / (n - 1)) : 0; ++n;
double delta = lx - gmean;
gmean += delta / n;
gstddev += delta * (lx - gmean);
}
TimeVector::const_iterator start = times.begin(); gstddev = n > 1 ? sqrt(gstddev / (n - 1)) : 0;
TimeVector::const_iterator end = times.end();
//filter outliers assuming log-normal distribution //filter outliers assuming log-normal distribution
//http://stackoverflow.com/questions/1867426/modeling-distribution-of-performance-measurements //http://stackoverflow.com/questions/1867426/modeling-distribution-of-performance-measurements
int offset = 0; if (gstddev > DBL_EPSILON)
if (gstddev > DBL_EPSILON) {
double minout = exp(gmean - 3 * gstddev) * runsPerIteration;
double maxout = exp(gmean + 3 * gstddev) * runsPerIteration;
while(*start < minout) ++start, ++metrics.outliers;
do --end, ++metrics.outliers; while(*end > maxout);
++end, --metrics.outliers;
}
}
else if (param_strategy == PERF_STRATEGY_SIMPLE)
{
metrics.outliers = static_cast<int>(times.size() * param_max_outliers / 100);
for (unsigned int i = 0; i < metrics.outliers; i++)
--end;
}
else
{ {
double minout = exp(gmean - 3 * gstddev) * runsPerIteration; assert(false);
double maxout = exp(gmean + 3 * gstddev) * runsPerIteration;
while(*start < minout) ++start, ++metrics.outliers, ++offset;
do --end, ++metrics.outliers; while(*end > maxout);
++end, --metrics.outliers;
} }
int offset = static_cast<int>(start - times.begin());
metrics.min = static_cast<double>(*start)/runsPerIteration; metrics.min = static_cast<double>(*start)/runsPerIteration;
//calc final metrics //calc final metrics
n = 0; unsigned int n = 0;
gmean = 0; double gmean = 0;
gstddev = 0; double gstddev = 0;
double mean = 0; double mean = 0;
double stddev = 0; double stddev = 0;
int m = 0; unsigned int m = 0;
for(; start != end; ++start) for(; start != end; ++start)
{ {
double x = static_cast<double>(*start)/runsPerIteration; double x = static_cast<double>(*start)/runsPerIteration;
@ -1009,11 +1127,10 @@ performance_metrics& TestBase::calcMetrics()
metrics.gmean = exp(gmean); metrics.gmean = exp(gmean);
metrics.gstddev = m > 1 ? sqrt(gstddev / (m - 1)) : 0; metrics.gstddev = m > 1 ? sqrt(gstddev / (m - 1)) : 0;
metrics.stddev = n > 1 ? sqrt(stddev / (n - 1)) : 0; metrics.stddev = n > 1 ? sqrt(stddev / (n - 1)) : 0;
metrics.median = n % 2 metrics.median = (n % 2
? (double)times[offset + n / 2] ? (double)times[offset + n / 2]
: 0.5 * (times[offset + n / 2] + times[offset + n / 2 - 1]); : 0.5 * (times[offset + n / 2] + times[offset + n / 2 - 1])
) / runsPerIteration;
metrics.median /= runsPerIteration;
return metrics; return metrics;
} }
@ -1027,17 +1144,31 @@ void TestBase::validateMetrics()
ASSERT_GE(m.samples, 1u) ASSERT_GE(m.samples, 1u)
<< " No time measurements was performed.\nstartTimer() and stopTimer() commands are required for performance tests."; << " No time measurements was performed.\nstartTimer() and stopTimer() commands are required for performance tests.";
EXPECT_GE(m.samples, param_min_samples) if (param_strategy == PERF_STRATEGY_BASE)
<< " Only a few samples are collected.\nPlease increase number of iterations or/and time limit to get reliable performance measurements."; {
EXPECT_GE(m.samples, param_min_samples)
<< " Only a few samples are collected.\nPlease increase number of iterations or/and time limit to get reliable performance measurements.";
if (m.gstddev > DBL_EPSILON)
{
EXPECT_GT(/*m.gmean * */1., /*m.gmean * */ 2 * sinh(m.gstddev * param_max_deviation))
<< " Test results are not reliable ((mean-sigma,mean+sigma) deviation interval is greater than measured time interval).";
}
if (m.gstddev > DBL_EPSILON) EXPECT_LE(m.outliers, std::max((unsigned int)cvCeil(m.samples * param_max_outliers / 100.), 1u))
<< " Test results are not reliable (too many outliers).";
}
else if (param_strategy == PERF_STRATEGY_SIMPLE)
{ {
EXPECT_GT(/*m.gmean * */1., /*m.gmean * */ 2 * sinh(m.gstddev * param_max_deviation)) double mean = metrics.mean * 1000.0f / metrics.frequency;
<< " Test results are not reliable ((mean-sigma,mean+sigma) deviation interval is greater than measured time interval)."; double stddev = metrics.stddev * 1000.0f / metrics.frequency;
double percents = stddev / mean * 100.f;
printf(" samples = %d, mean = %.2f, stddev = %.2f (%.1f%%)\n", (int)metrics.samples, mean, stddev, percents);
}
else
{
assert(false);
} }
EXPECT_LE(m.outliers, std::max((unsigned int)cvCeil(m.samples * param_max_outliers / 100.), 1u))
<< " Test results are not reliable (too many outliers).";
} }
void TestBase::reportMetrics(bool toJUnitXML) void TestBase::reportMetrics(bool toJUnitXML)
@ -1200,12 +1331,12 @@ void TestBase::RunPerfTestBody()
{ {
this->PerfTestBody(); this->PerfTestBody();
} }
catch(PerfEarlyExitException) catch(PerfEarlyExitException&)
{ {
metrics.terminationReason = performance_metrics::TERM_INTERRUPT; metrics.terminationReason = performance_metrics::TERM_INTERRUPT;
return;//no additional failure logging return;//no additional failure logging
} }
catch(cv::Exception e) catch(cv::Exception& e)
{ {
metrics.terminationReason = performance_metrics::TERM_EXCEPTION; metrics.terminationReason = performance_metrics::TERM_EXCEPTION;
#ifdef HAVE_CUDA #ifdef HAVE_CUDA
@ -1214,7 +1345,7 @@ void TestBase::RunPerfTestBody()
#endif #endif
FAIL() << "Expected: PerfTestBody() doesn't throw an exception.\n Actual: it throws cv::Exception:\n " << e.what(); FAIL() << "Expected: PerfTestBody() doesn't throw an exception.\n Actual: it throws cv::Exception:\n " << e.what();
} }
catch(std::exception e) catch(std::exception& e)
{ {
metrics.terminationReason = performance_metrics::TERM_EXCEPTION; metrics.terminationReason = performance_metrics::TERM_EXCEPTION;
FAIL() << "Expected: PerfTestBody() doesn't throw an exception.\n Actual: it throws std::exception:\n " << e.what(); FAIL() << "Expected: PerfTestBody() doesn't throw an exception.\n Actual: it throws std::exception:\n " << e.what();
@ -1235,6 +1366,7 @@ TestBase::_declareHelper& TestBase::_declareHelper::iterations(unsigned int n)
test->times.reserve(n); test->times.reserve(n);
test->nIters = std::min(n, TestBase::iterationsLimitDefault); test->nIters = std::min(n, TestBase::iterationsLimitDefault);
test->currentIter = (unsigned int)-1; test->currentIter = (unsigned int)-1;
test->metrics.clear();
return *this; return *this;
} }
@ -1243,6 +1375,7 @@ TestBase::_declareHelper& TestBase::_declareHelper::time(double timeLimitSecs)
test->times.clear(); test->times.clear();
test->currentIter = (unsigned int)-1; test->currentIter = (unsigned int)-1;
test->timeLimit = (int64)(timeLimitSecs * cv::getTickFrequency()); test->timeLimit = (int64)(timeLimitSecs * cv::getTickFrequency());
test->metrics.clear();
return *this; return *this;
} }

Loading…
Cancel
Save