Skip to content
Projects
Groups
Snippets
Help
Loading...
Sign in / Register
Toggle navigation
N
ngraph
Project
Project
Details
Activity
Cycle Analytics
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Charts
Issues
0
Issues
0
List
Board
Labels
Milestones
Merge Requests
0
Merge Requests
0
CI / CD
CI / CD
Pipelines
Jobs
Schedules
Charts
Packages
Packages
Wiki
Wiki
Snippets
Snippets
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Charts
Create a new issue
Jobs
Commits
Issue Boards
Open sidebar
submodule
ngraph
Commits
31eb5c46
Commit
31eb5c46
authored
Oct 31, 2017
by
Jaikrishnan Menon
Browse files
Options
Browse Files
Download
Email Patches
Plain Diff
CPU: Use transpose kernel from MKL in 2D Reshape
Also, add more codegen options
parent
0df3792f
Hide whitespace changes
Inline
Side-by-side
Showing
3 changed files
with
52 additions
and
12 deletions
+52
-12
compiler.cpp
src/ngraph/codegen/compiler.cpp
+11
-2
cpu_kernels.hpp
src/ngraph/runtime/cpu/cpu_kernels.hpp
+12
-0
emitter.cpp
src/ngraph/runtime/cpu/emitter.cpp
+29
-10
No files found.
src/ngraph/codegen/compiler.cpp
View file @
31eb5c46
...
@@ -143,10 +143,17 @@ std::unique_ptr<llvm::Module> execution_state::compile(const string& source, con
...
@@ -143,10 +143,17 @@ std::unique_ptr<llvm::Module> execution_state::compile(const string& source, con
LO
->
OpenMP
=
1
;
LO
->
OpenMP
=
1
;
LO
->
OpenMPUseTLS
=
1
;
LO
->
OpenMPUseTLS
=
1
;
// CodeGen options
auto
&
CGO
=
Clang
->
getInvocation
().
getCodeGenOpts
();
CGO
.
OptimizationLevel
=
3
;
CGO
.
RelocationModel
=
"static"
;
CGO
.
ThreadModel
=
"posix"
;
CGO
.
OmitLeafFramePointer
=
1
;
CGO
.
VectorizeLoop
=
1
;
CGO
.
VectorizeSLP
=
1
;
if
(
debuginfo_enabled
)
if
(
debuginfo_enabled
)
{
{
// CodeGen options
auto
&
CGO
=
Clang
->
getInvocation
().
getCodeGenOpts
();
CGO
.
setDebugInfo
(
codegenoptions
::
FullDebugInfo
);
CGO
.
setDebugInfo
(
codegenoptions
::
FullDebugInfo
);
}
}
...
@@ -161,6 +168,8 @@ std::unique_ptr<llvm::Module> execution_state::compile(const string& source, con
...
@@ -161,6 +168,8 @@ std::unique_ptr<llvm::Module> execution_state::compile(const string& source, con
// Enable various target features
// Enable various target features
// Most of these are for Eigen
// Most of these are for Eigen
auto
&
TO
=
Clang
->
getInvocation
().
getTargetOpts
();
auto
&
TO
=
Clang
->
getInvocation
().
getTargetOpts
();
// TODO: This needs to be configurable and selected carefully
TO
.
CPU
=
"broadwell"
;
TO
.
FeaturesAsWritten
.
emplace_back
(
"+sse4.1"
);
TO
.
FeaturesAsWritten
.
emplace_back
(
"+sse4.1"
);
TO
.
FeaturesAsWritten
.
emplace_back
(
"+sse4.2"
);
TO
.
FeaturesAsWritten
.
emplace_back
(
"+sse4.2"
);
TO
.
FeaturesAsWritten
.
emplace_back
(
"+avx"
);
TO
.
FeaturesAsWritten
.
emplace_back
(
"+avx"
);
...
...
src/ngraph/runtime/cpu/cpu_kernels.hpp
View file @
31eb5c46
...
@@ -86,3 +86,15 @@ namespace cblas
...
@@ -86,3 +86,15 @@ namespace cblas
const
ngraph
::
element
::
Int64
::
type
ldc
);
const
ngraph
::
element
::
Int64
::
type
ldc
);
}
}
}
}
namespace mkl
{
    // Declaration of the single-precision out-of-place matrix copy/transpose
    // routine exported by Intel MKL, given C linkage so generated code can call
    // it as mkl::MKL_Somatcopy without including the MKL headers.
    //
    // Parameter meanings below follow the Intel MKL reference for
    // mkl_?omatcopy; confirm against the MKL version actually linked.
    //   ordering - storage order of the matrices ('R' row-major, 'C' column-major)
    //   trans    - operation applied to A ('N' copy, 'T' transpose, ...)
    //   rows     - number of rows of the source matrix A
    //   cols     - number of columns of the source matrix A
    //   alpha    - scale factor applied to every element written to B
    //   A        - source matrix (read-only)
    //   lda      - leading dimension of A
    //   B        - destination matrix
    //   ldb      - leading dimension of B
    extern "C" void MKL_Somatcopy(char ordering,
                                  char trans,
                                  size_t rows,
                                  size_t cols,
                                  const ngraph::element::Float32::type alpha,
                                  const ngraph::element::Float32::type* A,
                                  size_t lda,
                                  ngraph::element::Float32::type* B,
                                  size_t ldb);
}
src/ngraph/runtime/cpu/emitter.cpp
View file @
31eb5c46
...
@@ -979,16 +979,35 @@ void Emitter::EMITTER_DECL(EmitReshape)
...
@@ -979,16 +979,35 @@ void Emitter::EMITTER_DECL(EmitReshape)
auto
arg0_layout
=
inputs
[
0
].
get_layout
<
DenseTensorViewLayout
>
();
auto
arg0_layout
=
inputs
[
0
].
get_layout
<
DenseTensorViewLayout
>
();
auto
out_layout
=
outputs
[
0
].
get_layout
<
DenseTensorViewLayout
>
();
auto
out_layout
=
outputs
[
0
].
get_layout
<
DenseTensorViewLayout
>
();
TU
+=
" {
\n
"
// Emit an MKL transpose call if possible
" auto arg0 = call_frame->get_tensor_view_data<"
+
element_type_names
[
TI
(
result_element_type
)]
+
if
(
result_element_type
==
ngraph
::
element
::
Float32
::
element_type
())
">("
+
to_string
(
inputs
[
0
].
get_index
())
+
");
\n
"
{
" auto out = call_frame->get_tensor_view_data<"
+
element_type_names
[
TI
(
result_element_type
)]
+
TU
+=
">("
+
to_string
(
outputs
[
0
].
get_index
())
+
");
\n
"
" {
\n
"
" EigenMatrix<"
+
element_type_names
[
TI
(
result_element_type
)]
+
">(out, "
+
" auto arg0 = call_frame->get_tensor_view_data<"
+
element_type_names
[
TI
(
result_element_type
)]
+
EIGEN_MATRIX_FORMAT
(
out_layout
->
get_shape
(),
out_layout
->
get_strides
())
+
") =
\n
"
">("
+
to_string
(
inputs
[
0
].
get_index
())
+
");
\n
"
" EigenMatrix<"
+
element_type_names
[
TI
(
result_element_type
)]
+
">(arg0, "
+
" auto out = call_frame->get_tensor_view_data<"
+
element_type_names
[
TI
(
result_element_type
)]
+
EIGEN_MATRIX_FORMAT
(
arg0_layout
->
get_shape
(),
arg0_layout
->
get_strides
())
+
").transpose();
\n
"
">("
+
to_string
(
outputs
[
0
].
get_index
())
+
");
\n
"
" }
\n
"
;
" mkl::MKL_Somatcopy('R', 'T', "
+
to_string
(
arg_shape
[
0
])
+
",
\n
"
" "
+
to_string
(
arg_shape
[
1
])
+
", 1.0f,
\n
"
" arg0, "
+
to_string
(
arg_shape
[
1
])
+
",
\n
"
" out, "
+
to_string
(
arg_shape
[
0
])
+
");
\n
"
" }
\n
"
;
}
else
{
TU
+=
" {
\n
"
" auto arg0 = call_frame->get_tensor_view_data<"
+
element_type_names
[
TI
(
result_element_type
)]
+
">("
+
to_string
(
inputs
[
0
].
get_index
())
+
");
\n
"
" auto out = call_frame->get_tensor_view_data<"
+
element_type_names
[
TI
(
result_element_type
)]
+
">("
+
to_string
(
outputs
[
0
].
get_index
())
+
");
\n
"
" EigenMatrix<"
+
element_type_names
[
TI
(
result_element_type
)]
+
">(out, "
+
EIGEN_MATRIX_FORMAT
(
out_layout
->
get_shape
(),
out_layout
->
get_strides
())
+
") =
\n
"
" EigenMatrix<"
+
element_type_names
[
TI
(
result_element_type
)]
+
">(arg0, "
+
EIGEN_MATRIX_FORMAT
(
arg0_layout
->
get_shape
(),
arg0_layout
->
get_strides
())
+
").transpose();
\n
"
" }
\n
"
;
}
}
}
// Other cases (reordering of axes for tensors with rank>2) are not handled yet.
// Other cases (reordering of axes for tensors with rank>2) are not handled yet.
else
else
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment