Skip to content
Projects
Groups
Snippets
Help
Loading...
Sign in / Register
Toggle navigation
O
opencv
Project
Project
Details
Activity
Cycle Analytics
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Charts
Issues
0
Issues
0
List
Board
Labels
Milestones
Merge Requests
0
Merge Requests
0
CI / CD
CI / CD
Pipelines
Jobs
Schedules
Charts
Packages
Packages
Wiki
Wiki
Snippets
Snippets
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Charts
Create a new issue
Jobs
Commits
Issue Boards
Open sidebar
submodule
opencv
Commits
79ba160c
Commit
79ba160c
authored
Jan 26, 2011
by
Alexey Spizhevoy
Browse files
Options
Browse Files
Download
Email Patches
Plain Diff
added more GPU perf. tests, refactored
parent
11579324
Hide whitespace changes
Inline
Side-by-side
Showing
3 changed files
with
99 additions
and
71 deletions
+99
-71
performance.cpp
samples/gpu/performance/performance.cpp
+17
-21
performance.h
samples/gpu/performance/performance.h
+21
-22
tests.cpp
samples/gpu/performance/tests.cpp
+61
-28
No files found.
samples/gpu/performance/performance.cpp
View file @
79ba160c
...
...
@@ -9,11 +9,14 @@ void TestSystem::run()
// Run initializers
vector
<
Runnable
*>::
iterator
it
=
inits_
.
begin
();
for
(;
it
!=
inits_
.
end
();
++
it
)
{
(
*
it
)
->
run
();
}
cout
<<
setiosflags
(
ios_base
::
left
);
cout
<<
TAB
<<
setw
(
10
)
<<
"CPU, ms"
<<
setw
(
10
)
<<
"GPU, ms"
<<
setw
(
10
)
<<
"SPEEDUP"
<<
"DESCRIPTION
\n
"
;
<<
setw
(
10
)
<<
"SPEEDUP"
<<
"DESCRIPTION
\n
"
;
cout
<<
resetiosflags
(
ios_base
::
left
);
// Run tests
...
...
@@ -24,30 +27,23 @@ void TestSystem::run()
try
{
(
*
it
)
->
run
();
flush
_subtest_d
ata
();
flush
SubtestD
ata
();
}
catch
(
const
cv
::
Exception
&
e
)
catch
(
const
cv
::
Exception
&
)
{
cout
<<
TAB
<<
"error"
;
switch
(
e
.
code
)
{
case
CV_StsNoMem
:
cout
<<
": out of memory"
;
break
;
}
if
(
!
description_
.
str
().
empty
())
cout
<<
" ["
<<
description_
.
str
()
<<
"]"
;
cout
<<
endl
;
reset_subtest_data
();
resetSubtestData
();
}
}
cout
<<
setiosflags
(
ios_base
::
fixed
|
ios_base
::
left
);
cout
<<
"
\n
average GPU speedup: x"
<<
setprecision
(
3
)
<<
speedup_total_
/
num_subtests_called_
<<
endl
;
cout
<<
resetiosflags
(
ios_base
::
fixed
|
ios_base
::
left
);
cout
<<
setiosflags
(
ios_base
::
fixed
);
cout
<<
"
\n
average GPU speedup: x"
<<
setprecision
(
3
)
<<
speedup_total_
/
num_subtests_called_
<<
endl
;
cout
<<
resetiosflags
(
ios_base
::
fixed
);
}
void
TestSystem
::
flush
_subtest_d
ata
()
void
TestSystem
::
flush
SubtestD
ata
()
{
if
(
!
can_flush_
)
return
;
...
...
@@ -58,9 +54,10 @@ void TestSystem::flush_subtest_data()
double
speedup
=
static_cast
<
double
>
(
cpu_time
)
/
std
::
max
(
1
,
gpu_time
);
speedup_total_
+=
speedup
;
cout
<<
TAB
<<
setiosflags
(
ios_base
::
fixed
|
ios_base
::
left
);
cout
<<
TAB
<<
setiosflags
(
ios_base
::
left
);
stringstream
stream
;
stream
<<
cpu_time
;
cout
<<
setw
(
10
)
<<
stream
.
str
();
...
...
@@ -73,11 +70,10 @@ void TestSystem::flush_subtest_data()
cout
<<
setw
(
10
)
<<
stream
.
str
();
cout
<<
description_
.
str
();
cout
<<
resetiosflags
(
ios_base
::
fixed
|
ios_base
::
left
)
<<
endl
;
cout
<<
resetiosflags
(
ios_base
::
left
)
<<
endl
;
num_subtests_called_
++
;
reset
_subtest_d
ata
();
reset
SubtestD
ata
();
}
...
...
samples/gpu/performance/performance.h
View file @
79ba160c
...
...
@@ -38,6 +38,13 @@ public:
void
run
();
// Ends current subtest and starts new one
std
::
stringstream
&
subtest
()
{
flushSubtestData
();
return
description_
;
}
void
cpuOn
()
{
cpu_started_
=
cv
::
getTickCount
();
}
void
cpuOff
()
...
...
@@ -56,20 +63,13 @@ public:
can_flush_
=
true
;
}
// Ends current subtest and starts new one
std
::
stringstream
&
subtest
()
{
flush_subtest_data
();
return
description_
;
}
private
:
TestSystem
()
:
can_flush_
(
false
),
cpu_elapsed_
(
0
),
gpu_elapsed_
(
0
),
speedup_total_
(
0
.
0
),
num_subtests_called_
(
0
)
{};
void
flush
_subtest_d
ata
();
void
flush
SubtestD
ata
();
void
reset
_subtest_d
ata
()
void
reset
SubtestD
ata
()
{
cpu_elapsed_
=
0
;
gpu_elapsed_
=
0
;
...
...
@@ -93,17 +93,6 @@ private:
};
#define TEST(name) \
struct
name
##
_test
:
Runnable
\
{
\
name
##
_test
()
:
Runnable
(
#
name
)
{
\
TestSystem
::
instance
()
->
addTest
(
this
);
\
}
\
void
run
();
\
}
name
##
_test_instance
;
\
void
name
##
_test
::
run
()
#define INIT(name) \
struct
name
##
_init
:
Runnable
\
{
\
...
...
@@ -115,12 +104,22 @@ private:
void
name
##
_init
::
run
()
#define TEST(name) \
struct
name
##
_test
:
Runnable
\
{
\
name
##
_test
()
:
Runnable
(
#
name
)
{
\
TestSystem
::
instance
()
->
addTest
(
this
);
\
}
\
void
run
();
\
}
name
##
_test_instance
;
\
void
name
##
_test
::
run
()
#define SUBTEST TestSystem::instance()->subtest()
#define DESCRIPTION TestSystem::instance()->subtest()
#define CPU_ON TestSystem::instance()->cpuOn()
#define GPU_ON TestSystem::instance()->gpuOn()
#define CPU_OFF TestSystem::instance()->cpuOff()
#define GPU_OFF TestSystem::instance()->gpuOff()
#define SUBTEST TestSystem::instance()->subtest()
#define DESCRIPTION TestSystem::instance()->subtest()
void
gen
(
cv
::
Mat
&
mat
,
int
rows
,
int
cols
,
int
type
,
cv
::
Scalar
low
,
cv
::
Scalar
high
);
...
...
samples/gpu/performance/tests.cpp
View file @
79ba160c
...
...
@@ -6,42 +6,40 @@
using
namespace
std
;
using
namespace
cv
;
// This code calls CUFFT DFT and initializes that lib
INIT
(
CUFFT_library
)
INIT
(
matchTemplate
)
{
Mat
src
,
templ
;
gen
(
src
,
500
,
500
,
CV_32F
,
0
,
1
);
gen
(
templ
,
500
,
500
,
CV_32F
,
0
,
1
);
Mat
src
;
gen
(
src
,
500
,
500
,
CV_32F
,
0
,
1
);
Mat
templ
;
gen
(
templ
,
500
,
500
,
CV_32F
,
0
,
1
);
gpu
::
GpuMat
d_src
(
src
);
gpu
::
GpuMat
d_templ
(
templ
);
gpu
::
GpuMat
d_result
;
gpu
::
GpuMat
d_src
(
src
),
d_templ
(
templ
),
d_dst
;
gpu
::
matchTemplate
(
d_src
,
d_templ
,
d_
resul
t
,
CV_TM_CCORR
);
gpu
::
matchTemplate
(
d_src
,
d_templ
,
d_
ds
t
,
CV_TM_CCORR
);
}
TEST
(
matchTemplate
)
{
Mat
src
,
templ
,
resul
t
;
Mat
src
,
templ
,
ds
t
;
gen
(
src
,
3000
,
3000
,
CV_32F
,
0
,
1
);
gpu
::
GpuMat
d_
image
(
src
),
d_templ
,
d_resul
t
;
gpu
::
GpuMat
d_
src
(
src
),
d_templ
,
d_ds
t
;
for
(
int
templ_size
=
5
;
templ_size
<
=
1000
;
templ_size
*=
2
)
for
(
int
templ_size
=
5
;
templ_size
<
200
;
templ_size
*=
5
)
{
SUBTEST
<<
"src "
<<
src
.
rows
<<
", templ "
<<
templ_size
<<
", 32F, CCORR"
;
gen
(
templ
,
templ_size
,
templ_size
,
CV_32F
,
0
,
1
);
dst
.
create
(
src
.
rows
-
templ
.
rows
+
1
,
src
.
cols
-
templ
.
cols
+
1
,
CV_32F
);
CPU_ON
;
matchTemplate
(
src
,
templ
,
resul
t
,
CV_TM_CCORR
);
matchTemplate
(
src
,
templ
,
ds
t
,
CV_TM_CCORR
);
CPU_OFF
;
d_templ
=
templ
;
d_dst
.
create
(
d_src
.
rows
-
d_templ
.
rows
+
1
,
d_src
.
cols
-
d_templ
.
cols
+
1
,
CV_32F
);
GPU_ON
;
gpu
::
matchTemplate
(
d_
image
,
d_templ
,
d_resul
t
,
CV_TM_CCORR
);
gpu
::
matchTemplate
(
d_
src
,
d_templ
,
d_ds
t
,
CV_TM_CCORR
);
GPU_OFF
;
}
}
...
...
@@ -86,6 +84,7 @@ TEST(remap)
gen
(
src
,
size
,
size
,
CV_8UC1
,
0
,
256
);
gen
(
xmap
,
size
,
size
,
CV_32F
,
0
,
size
);
gen
(
ymap
,
size
,
size
,
CV_32F
,
0
,
size
);
dst
.
create
(
xmap
.
size
(),
src
.
type
());
CPU_ON
;
remap
(
src
,
dst
,
xmap
,
ymap
,
INTER_LINEAR
);
...
...
@@ -94,6 +93,7 @@ TEST(remap)
d_src
=
src
;
d_xmap
=
xmap
;
d_ymap
=
ymap
;
d_dst
.
create
(
d_xmap
.
size
(),
d_src
.
type
());
GPU_ON
;
gpu
::
remap
(
d_src
,
d_dst
,
d_xmap
,
d_ymap
);
...
...
@@ -107,17 +107,19 @@ TEST(dft)
Mat
src
,
dst
;
gpu
::
GpuMat
d_src
,
d_dst
;
for
(
int
size
=
1000
;
size
<=
8
000
;
size
*=
2
)
for
(
int
size
=
1000
;
size
<=
4
000
;
size
*=
2
)
{
SUBTEST
<<
"size "
<<
size
<<
", 32FC2, complex-to-complex"
;
gen
(
src
,
size
,
size
,
CV_32FC2
,
Scalar
::
all
(
0
),
Scalar
::
all
(
1
));
dst
.
create
(
src
.
size
(),
src
.
type
());
CPU_ON
;
dft
(
src
,
dst
);
CPU_OFF
;
d_src
=
src
;
d_dst
.
create
(
d_src
.
size
(),
d_src
.
type
());
GPU_ON
;
gpu
::
dft
(
d_src
,
d_dst
,
Size
(
size
,
size
));
...
...
@@ -136,12 +138,14 @@ TEST(cornerHarris)
SUBTEST
<<
"size "
<<
size
<<
", 32FC1"
;
gen
(
src
,
size
,
size
,
CV_32F
,
0
,
1
);
dst
.
create
(
src
.
size
(),
src
.
type
());
CPU_ON
;
cornerHarris
(
src
,
dst
,
5
,
7
,
0.1
,
BORDER_REFLECT101
);
CPU_OFF
;
d_src
=
src
;
d_dst
.
create
(
src
.
size
(),
src
.
type
());
GPU_ON
;
gpu
::
cornerHarris
(
d_src
,
d_dst
,
5
,
7
,
0.1
);
...
...
@@ -150,22 +154,51 @@ TEST(cornerHarris)
}
TEST
(
memoryAllocation
)
TEST
(
integral
)
{
Mat
mat
;
gpu
::
GpuMat
d_mat
;
Mat
src
,
sum
;
gpu
::
GpuMat
d_src
,
d_sum
;
for
(
int
size
=
1000
;
size
<=
8000
;
size
*=
2
)
{
SUBTEST
<<
"size "
<<
size
<<
", 8U"
;
int
begin
=
100
,
end
=
8000
,
step
=
100
;
gen
(
src
,
size
,
size
,
CV_8U
,
0
,
256
);
sum
.
create
(
size
+
1
,
size
+
1
,
CV_32S
);
DESCRIPTION
<<
"32F matrices from "
<<
begin
<<
" to "
<<
end
;
CPU_ON
;
integral
(
src
,
sum
);
CPU_OFF
;
CPU_ON
;
for
(
int
size
=
begin
;
size
<=
end
;
size
+=
step
)
mat
.
create
(
size
,
size
,
CV_32FC1
);
CPU_OFF
;
d_src
=
src
;
d_sum
.
create
(
size
+
1
,
size
+
1
,
CV_32S
);
GPU_ON
;
for
(
int
size
=
begin
;
size
<=
end
;
size
+=
step
)
d_mat
.
create
(
size
,
size
,
CV_32FC1
);
GPU_OFF
;
GPU_ON
;
gpu
::
integral
(
d_src
,
d_sum
);
GPU_OFF
;
}
}
TEST
(
norm
)
{
Mat
src
;
gpu
::
GpuMat
d_src
;
for
(
int
size
=
1000
;
size
<=
8000
;
size
*=
2
)
{
SUBTEST
<<
"size "
<<
size
<<
", 8U"
;
gen
(
src
,
size
,
size
,
CV_8U
,
0
,
256
);
CPU_ON
;
norm
(
src
);
CPU_OFF
;
d_src
=
src
;
GPU_ON
;
gpu
::
norm
(
d_src
);
GPU_OFF
;
}
}
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment