updated performance sample
This commit is contained in:
parent
a618b774f2
commit
f883b31cfd
@ -60,8 +60,11 @@ void TestSystem::finishCurrentSubtest()
|
|||||||
// There is no need to print subtest statistics
|
// There is no need to print subtest statistics
|
||||||
return;
|
return;
|
||||||
|
|
||||||
int cpu_time = static_cast<int>(cpu_elapsed_ / getTickFrequency() * 1000.0);
|
//int cpu_time = static_cast<int>(cpu_elapsed_ / getTickFrequency() * 1000.0);
|
||||||
int gpu_time = static_cast<int>(gpu_elapsed_ / getTickFrequency() * 1000.0);
|
//int gpu_time = static_cast<int>(gpu_elapsed_ / getTickFrequency() * 1000.0);
|
||||||
|
|
||||||
|
double cpu_time = cpu_elapsed_ / getTickFrequency() * 1000.0;
|
||||||
|
double gpu_time = gpu_elapsed_ / getTickFrequency() * 1000.0;
|
||||||
|
|
||||||
double speedup = static_cast<double>(cpu_elapsed_) /
|
double speedup = static_cast<double>(cpu_elapsed_) /
|
||||||
std::max((int64)1, gpu_elapsed_);
|
std::max((int64)1, gpu_elapsed_);
|
||||||
@ -161,7 +164,8 @@ int main(int argc, const char* argv[])
|
|||||||
"{ f | filter | | filter for test }"
|
"{ f | filter | | filter for test }"
|
||||||
"{ w | workdir | | set working directory }"
|
"{ w | workdir | | set working directory }"
|
||||||
"{ l | list | false | show all tests }"
|
"{ l | list | false | show all tests }"
|
||||||
"{ d | device | 0 | device id }";
|
"{ d | device | 0 | device id }"
|
||||||
|
"{ i | iters | 10 | iteration count }";
|
||||||
|
|
||||||
CommandLineParser cmd(argc, argv, keys);
|
CommandLineParser cmd(argc, argv, keys);
|
||||||
|
|
||||||
@ -190,6 +194,7 @@ int main(int argc, const char* argv[])
|
|||||||
string filter = cmd.get<string>("filter");
|
string filter = cmd.get<string>("filter");
|
||||||
string workdir = cmd.get<string>("workdir");
|
string workdir = cmd.get<string>("workdir");
|
||||||
bool list = cmd.get<bool>("list");
|
bool list = cmd.get<bool>("list");
|
||||||
|
int iters = cmd.get<int>("iters");
|
||||||
|
|
||||||
if (!filter.empty())
|
if (!filter.empty())
|
||||||
TestSystem::instance().setTestFilter(filter);
|
TestSystem::instance().setTestFilter(filter);
|
||||||
@ -205,6 +210,8 @@ int main(int argc, const char* argv[])
|
|||||||
if (list)
|
if (list)
|
||||||
TestSystem::instance().setListMode(true);
|
TestSystem::instance().setListMode(true);
|
||||||
|
|
||||||
|
TestSystem::instance().setIters(iters);
|
||||||
|
|
||||||
TestSystem::instance().run();
|
TestSystem::instance().run();
|
||||||
|
|
||||||
return 0;
|
return 0;
|
||||||
|
@ -4,6 +4,7 @@
|
|||||||
#include <iostream>
|
#include <iostream>
|
||||||
#include <cstdio>
|
#include <cstdio>
|
||||||
#include <vector>
|
#include <vector>
|
||||||
|
#include <numeric>
|
||||||
#include <string>
|
#include <string>
|
||||||
#include "opencv2/core/core.hpp"
|
#include "opencv2/core/core.hpp"
|
||||||
#include "opencv2/gpu/gpu.hpp"
|
#include "opencv2/gpu/gpu.hpp"
|
||||||
@ -40,6 +41,8 @@ public:
|
|||||||
void setTestFilter(const std::string& val) { test_filter_ = val; }
|
void setTestFilter(const std::string& val) { test_filter_ = val; }
|
||||||
const std::string& testFilter() const { return test_filter_; }
|
const std::string& testFilter() const { return test_filter_; }
|
||||||
|
|
||||||
|
// Sets how many times each timed CPU/GPU section is repeated.
// Non-positive counts are clamped to 1: with iters_ <= 0, stop() is true
// immediately (it_ starts at 0), so the timed body would never execute, and
// cpuComplete()/gpuComplete() would divide by iters_ when averaging.
void setIters(int iters) { iters_ = iters > 0 ? iters : 1; }
|
||||||
|
|
||||||
void addInit(Runnable* init) { inits_.push_back(init); }
|
void addInit(Runnable* init) { inits_.push_back(init); }
|
||||||
void addTest(Runnable* test) { tests_.push_back(test); }
|
void addTest(Runnable* test) { tests_.push_back(test); }
|
||||||
void run();
|
void run();
|
||||||
@ -53,20 +56,36 @@ public:
|
|||||||
return cur_subtest_description_;
|
return cur_subtest_description_;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
// Returns true once the iteration counter it_ has reached iters_.
// Used as the exit condition of the loops opened by the CPU_ON / GPU_ON macros;
// it_ is advanced by cpuOff()/gpuOff() and reset by cpuComplete()/gpuComplete().
bool stop() const { return it_ >= iters_; }
|
||||||
|
|
||||||
void cpuOn() { cpu_started_ = cv::getTickCount(); }
|
void cpuOn() { cpu_started_ = cv::getTickCount(); }
|
||||||
void cpuOff()
|
void cpuOff()
|
||||||
{
|
{
|
||||||
int64 delta = cv::getTickCount() - cpu_started_;
|
int64 delta = cv::getTickCount() - cpu_started_;
|
||||||
cpu_elapsed_ += delta;
|
cpu_times_.push_back(delta);
|
||||||
|
++it_;
|
||||||
|
}
|
||||||
|
void cpuComplete()
|
||||||
|
{
|
||||||
|
double delta_mean = std::accumulate(cpu_times_.begin(), cpu_times_.end(), 0.0) / iters_;
|
||||||
|
cpu_elapsed_ += delta_mean;
|
||||||
cur_subtest_is_empty_ = false;
|
cur_subtest_is_empty_ = false;
|
||||||
}
|
it_ = 0;
|
||||||
|
}
|
||||||
|
|
||||||
void gpuOn() { gpu_started_ = cv::getTickCount(); }
|
void gpuOn() { gpu_started_ = cv::getTickCount(); }
|
||||||
void gpuOff()
|
void gpuOff()
|
||||||
{
|
{
|
||||||
int64 delta = cv::getTickCount() - gpu_started_;
|
int64 delta = cv::getTickCount() - gpu_started_;
|
||||||
gpu_elapsed_ += delta;
|
gpu_times_.push_back(delta);
|
||||||
|
++it_;
|
||||||
|
}
|
||||||
|
void gpuComplete()
|
||||||
|
{
|
||||||
|
double delta_mean = std::accumulate(gpu_times_.begin(), gpu_times_.end(), 0.0) / iters_;
|
||||||
|
gpu_elapsed_ += delta_mean;
|
||||||
cur_subtest_is_empty_ = false;
|
cur_subtest_is_empty_ = false;
|
||||||
|
it_ = 0;
|
||||||
}
|
}
|
||||||
|
|
||||||
bool isListMode() const { return is_list_mode_; }
|
bool isListMode() const { return is_list_mode_; }
|
||||||
@ -76,7 +95,13 @@ private:
|
|||||||
TestSystem(): cur_subtest_is_empty_(true), cpu_elapsed_(0),
|
TestSystem(): cur_subtest_is_empty_(true), cpu_elapsed_(0),
|
||||||
gpu_elapsed_(0), speedup_total_(0.0),
|
gpu_elapsed_(0), speedup_total_(0.0),
|
||||||
num_subtests_called_(0),
|
num_subtests_called_(0),
|
||||||
is_list_mode_(false) {}
|
is_list_mode_(false)
|
||||||
|
{
|
||||||
|
iters_ = 10;
|
||||||
|
it_ = 0;
|
||||||
|
cpu_times_.reserve(iters_);
|
||||||
|
gpu_times_.reserve(iters_);
|
||||||
|
}
|
||||||
|
|
||||||
void finishCurrentSubtest();
|
void finishCurrentSubtest();
|
||||||
void resetCurrentSubtest()
|
void resetCurrentSubtest()
|
||||||
@ -85,6 +110,9 @@ private:
|
|||||||
gpu_elapsed_ = 0;
|
gpu_elapsed_ = 0;
|
||||||
cur_subtest_description_.str("");
|
cur_subtest_description_.str("");
|
||||||
cur_subtest_is_empty_ = true;
|
cur_subtest_is_empty_ = true;
|
||||||
|
it_ = 0;
|
||||||
|
cpu_times_.clear();
|
||||||
|
gpu_times_.clear();
|
||||||
}
|
}
|
||||||
|
|
||||||
void printHeading();
|
void printHeading();
|
||||||
@ -107,6 +135,11 @@ private:
|
|||||||
int num_subtests_called_;
|
int num_subtests_called_;
|
||||||
|
|
||||||
bool is_list_mode_;
|
bool is_list_mode_;
|
||||||
|
|
||||||
|
int iters_;
|
||||||
|
int it_;
|
||||||
|
std::vector<int64> cpu_times_;
|
||||||
|
std::vector<int64> gpu_times_;
|
||||||
};
|
};
|
||||||
|
|
||||||
|
|
||||||
@ -130,10 +163,12 @@ private:
|
|||||||
void name##_test::run()
|
void name##_test::run()
|
||||||
|
|
||||||
#define SUBTEST TestSystem::instance().startNewSubtest()
|
#define SUBTEST TestSystem::instance().startNewSubtest()
|
||||||
#define CPU_ON TestSystem::instance().cpuOn()
|
|
||||||
#define GPU_ON TestSystem::instance().gpuOn()
|
// Opens a loop that repeats the statements following the macro until
// TestSystem::stop() returns true, calling cpuOn() at the start of each pass.
// The '{' opened here is closed by CPU_OFF, so the two must be used as a pair.
#define CPU_ON while (!TestSystem::instance().stop()) { TestSystem::instance().cpuOn()
|
||||||
#define CPU_OFF TestSystem::instance().cpuOff()
|
// Ends one pass of the loop opened by CPU_ON: calls cpuOff(), closes the loop
// body with '}', then calls cpuComplete() once after the loop has finished.
// Must follow a matching CPU_ON in the same scope.
#define CPU_OFF TestSystem::instance().cpuOff(); } TestSystem::instance().cpuComplete()
|
||||||
#define GPU_OFF TestSystem::instance().gpuOff()
|
|
||||||
|
// Opens a loop that repeats the statements following the macro until
// TestSystem::stop() returns true, calling gpuOn() at the start of each pass.
// The '{' opened here is closed by GPU_OFF, so the two must be used as a pair.
#define GPU_ON while (!TestSystem::instance().stop()) { TestSystem::instance().gpuOn()
|
||||||
|
// Ends one pass of the loop opened by GPU_ON: calls gpuOff(), closes the loop
// body with '}', then calls gpuComplete() once after the loop has finished.
// Must follow a matching GPU_ON in the same scope.
#define GPU_OFF TestSystem::instance().gpuOff(); } TestSystem::instance().gpuComplete()
|
||||||
|
|
||||||
// Generates matrix
|
// Generates matrix
|
||||||
void gen(cv::Mat& mat, int rows, int cols, int type, cv::Scalar low,
|
void gen(cv::Mat& mat, int rows, int cols, int type, cv::Scalar low,
|
||||||
|
@ -767,6 +767,27 @@ TEST(threshold)
|
|||||||
gpu::threshold(d_src, d_dst, 50.0, 0.0, THRESH_BINARY);
|
gpu::threshold(d_src, d_dst, 50.0, 0.0, THRESH_BINARY);
|
||||||
GPU_OFF;
|
GPU_OFF;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
for (int size = 2000; size <= 4000; size += 1000)
|
||||||
|
{
|
||||||
|
SUBTEST << size << 'x' << size << ", 32FC1, THRESH_TRUNC [NPP]";
|
||||||
|
|
||||||
|
gen(src, size, size, CV_32FC1, 0, 100);
|
||||||
|
|
||||||
|
threshold(src, dst, 50.0, 0.0, THRESH_TRUNC);
|
||||||
|
|
||||||
|
CPU_ON;
|
||||||
|
threshold(src, dst, 50.0, 0.0, THRESH_TRUNC);
|
||||||
|
CPU_OFF;
|
||||||
|
|
||||||
|
d_src.upload(src);
|
||||||
|
|
||||||
|
gpu::threshold(d_src, d_dst, 50.0, 0.0, THRESH_TRUNC);
|
||||||
|
|
||||||
|
GPU_ON;
|
||||||
|
gpu::threshold(d_src, d_dst, 50.0, 0.0, THRESH_TRUNC);
|
||||||
|
GPU_OFF;
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
TEST(pow)
|
TEST(pow)
|
||||||
|
Loading…
x
Reference in New Issue
Block a user