Skip to content
Projects
Groups
Snippets
Help
Loading...
Sign in / Register
Toggle navigation
N
ngraph
Project
Project
Details
Activity
Cycle Analytics
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Charts
Issues
0
Issues
0
List
Board
Labels
Milestones
Merge Requests
0
Merge Requests
0
CI / CD
CI / CD
Pipelines
Jobs
Schedules
Charts
Packages
Packages
Wiki
Wiki
Snippets
Snippets
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Charts
Create a new issue
Jobs
Commits
Issue Boards
Open sidebar
submodule
ngraph
Commits
c775f01b
Commit
c775f01b
authored
Nov 12, 2017
by
Robert Kimball
Browse files
Options
Browse Files
Download
Email Patches
Plain Diff
add unit test to check if output is set correctly
parent
431f245c
Hide whitespace changes
Inline
Side-by-side
Showing
21 changed files
with
592 additions
and
403 deletions
+592
-403
CMakeLists.txt
src/ngraph/CMakeLists.txt
+1
-1
tensor.hpp
src/ngraph/descriptor/tensor.hpp
+1
-1
file_util.cpp
src/ngraph/file_util.cpp
+290
-0
file_util.hpp
src/ngraph/file_util.hpp
+52
-0
function.cpp
src/ngraph/function.cpp
+1
-0
node.cpp
src/ngraph/node.cpp
+4
-0
collect_functions.cpp
src/ngraph/pass/collect_functions.cpp
+0
-50
collect_functions.hpp
src/ngraph/pass/collect_functions.hpp
+0
-33
dump_sorted.cpp
src/ngraph/pass/dump_sorted.cpp
+6
-0
manager.cpp
src/ngraph/pass/manager.cpp
+31
-36
manager_state.cpp
src/ngraph/pass/manager_state.cpp
+1
-1
manager_state.hpp
src/ngraph/pass/manager_state.hpp
+1
-1
call_frame.cpp
src/ngraph/runtime/cpu/call_frame.cpp
+6
-20
call_frame.hpp
src/ngraph/runtime/cpu/call_frame.hpp
+3
-13
emitter.cpp
src/ngraph/runtime/cpu/emitter.cpp
+69
-107
emitter.hpp
src/ngraph/runtime/cpu/emitter.hpp
+0
-1
external_function.cpp
src/ngraph/runtime/cpu/external_function.cpp
+99
-127
external_function.hpp
src/ngraph/runtime/cpu/external_function.hpp
+2
-7
backend_test.in.cpp
test/backend_test.in.cpp
+3
-3
tensor.cpp
test/tensor.cpp
+21
-0
topological_sort.cpp
test/topological_sort.cpp
+1
-2
No files found.
src/ngraph/CMakeLists.txt
View file @
c775f01b
...
...
@@ -21,6 +21,7 @@ set (SRC
descriptor/tensor.cpp
descriptor/tensor_view.cpp
descriptor/tuple.cpp
file_util.cpp
function.cpp
log.cpp
node.cpp
...
...
@@ -53,7 +54,6 @@ set (SRC
ops/tuple.cpp
ops/unary_elementwise_arithmetic.cpp
ops/unary_elementwise.cpp
pass/collect_functions.cpp
pass/dump_sorted.cpp
pass/liveness.cpp
pass/manager.cpp
...
...
src/ngraph/descriptor/tensor.hpp
View file @
c775f01b
...
...
@@ -61,7 +61,7 @@ public:
size_t
get_pool_offset
()
const
;
const
element
::
Type
&
get_element_type
()
const
{
return
m_element_type
;
}
static
std
::
string
make_tensor_name
(
const
Node
*
node
,
size_t
value_index
);
void
set_is_output
()
{
m_is_output
=
true
;
}
protected
:
const
element
::
Type
&
m_element_type
;
PrimaryTensorView
*
m_primary_tensor_view
;
...
...
src/ngraph/file_util.cpp
0 → 100644
View file @
c775f01b
/*
Copyright 2016 Nervana Systems Inc.
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
http://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
*/
#include <cassert>
#include <dirent.h>
#include <fcntl.h>
#include <fstream>
#include <ftw.h>
#include <iostream>
#include <sstream>
#include <stdexcept>
#include <string.h>
#include <sys/file.h>
#include <sys/stat.h>
#include <sys/time.h>
#include <sys/types.h>
#include <unistd.h>
#include <vector>
#include "file_util.hpp"
using
namespace
std
;
string
ngraph
::
file_util
::
path_join
(
const
string
&
s1
,
const
string
&
s2
)
{
string
rc
;
if
(
s2
.
size
()
>
0
)
{
if
(
s2
[
0
]
==
'/'
)
{
rc
=
s2
;
}
else
if
(
s1
.
size
()
>
0
)
{
rc
=
s1
;
if
(
rc
[
rc
.
size
()
-
1
]
!=
'/'
)
{
rc
+=
"/"
;
}
rc
+=
s2
;
}
else
{
rc
=
s2
;
}
}
else
{
rc
=
s1
;
}
return
rc
;
}
size_t
ngraph
::
file_util
::
get_file_size
(
const
string
&
filename
)
{
// ensure that filename exists and get its size
struct
stat
stats
;
if
(
stat
(
filename
.
c_str
(),
&
stats
)
==
-
1
)
{
throw
std
::
runtime_error
(
"Could not find file:
\"
"
+
filename
+
"
\"
"
);
}
return
stats
.
st_size
;
}
void
ngraph
::
file_util
::
remove_directory
(
const
string
&
dir
)
{
file_util
::
iterate_files
(
dir
,
[](
const
string
&
file
,
bool
is_dir
)
{
if
(
is_dir
)
rmdir
(
file
.
c_str
());
else
remove
(
file
.
c_str
());
},
true
);
rmdir
(
dir
.
c_str
());
}
void
ngraph
::
file_util
::
remove_file
(
const
string
&
file
)
{
remove
(
file
.
c_str
());
}
bool
ngraph
::
file_util
::
make_directory
(
const
string
&
dir
)
{
if
(
mkdir
(
dir
.
c_str
(),
S_IRWXU
|
S_IRWXG
|
S_IROTH
|
S_IXOTH
))
{
if
(
errno
==
EEXIST
)
{
// not really an error, the directory already exists
return
false
;
}
throw
std
::
runtime_error
(
"error making directory "
+
dir
+
" "
+
strerror
(
errno
));
}
return
true
;
}
string
ngraph
::
file_util
::
make_temp_directory
(
const
string
&
path
)
{
string
fname
=
path
.
empty
()
?
file_util
::
get_temp_directory
()
:
path
;
string
tmp_template
=
file_util
::
path_join
(
fname
,
"aeonXXXXXX"
);
char
*
tmpname
=
strdup
(
tmp_template
.
c_str
());
mkdtemp
(
tmpname
);
string
rc
=
tmpname
;
free
(
tmpname
);
return
rc
;
}
std
::
string
ngraph
::
file_util
::
get_temp_directory
()
{
const
vector
<
string
>
potential_tmps
=
{
"NERVANA_AEON_TMP"
,
"TMPDIR"
,
"TMP"
,
"TEMP"
,
"TEMPDIR"
};
const
char
*
path
=
nullptr
;
for
(
const
string
&
var
:
potential_tmps
)
{
path
=
getenv
(
var
.
c_str
());
if
(
path
!=
nullptr
)
{
break
;
}
}
if
(
path
==
nullptr
)
{
path
=
"/tmp"
;
}
return
path
;
}
vector
<
char
>
ngraph
::
file_util
::
read_file_contents
(
const
string
&
path
)
{
size_t
file_size
=
get_file_size
(
path
);
vector
<
char
>
data
;
data
.
reserve
(
file_size
);
data
.
resize
(
file_size
);
FILE
*
f
=
fopen
(
path
.
c_str
(),
"rb"
);
if
(
f
)
{
char
*
p
=
data
.
data
();
size_t
remainder
=
file_size
;
size_t
offset
=
0
;
while
(
remainder
>
0
)
{
size_t
rc
=
fread
(
&
p
[
offset
],
1
,
remainder
,
f
);
offset
+=
rc
;
remainder
-=
rc
;
}
fclose
(
f
);
}
else
{
throw
std
::
runtime_error
(
"error opening file '"
+
path
+
"'"
);
}
return
data
;
}
std
::
string
ngraph
::
file_util
::
read_file_to_string
(
const
std
::
string
&
path
)
{
std
::
ifstream
f
(
path
);
std
::
stringstream
ss
;
ss
<<
f
.
rdbuf
();
return
ss
.
str
();
}
void
ngraph
::
file_util
::
iterate_files
(
const
string
&
path
,
std
::
function
<
void
(
const
string
&
file
,
bool
is_dir
)
>
func
,
bool
recurse
)
{
vector
<
string
>
files
;
vector
<
string
>
dirs
;
file_util
::
iterate_files_worker
(
path
,
[
&
files
,
&
dirs
](
const
string
&
file
,
bool
is_dir
)
{
if
(
is_dir
)
dirs
.
push_back
(
file
);
else
files
.
push_back
(
file
);
},
true
);
for
(
auto
f
:
files
)
func
(
f
,
false
);
for
(
auto
f
:
dirs
)
func
(
f
,
true
);
}
void
ngraph
::
file_util
::
iterate_files_worker
(
const
string
&
path
,
std
::
function
<
void
(
const
string
&
file
,
bool
is_dir
)
>
func
,
bool
recurse
)
{
DIR
*
dir
;
struct
dirent
*
ent
;
if
((
dir
=
opendir
(
path
.
c_str
()))
!=
nullptr
)
{
while
((
ent
=
readdir
(
dir
))
!=
nullptr
)
{
string
name
=
ent
->
d_name
;
switch
(
ent
->
d_type
)
{
case
DT_DIR
:
if
(
recurse
&&
name
!=
"."
&&
name
!=
".."
)
{
string
dir_path
=
file_util
::
path_join
(
path
,
name
);
iterate_files
(
dir_path
,
func
,
recurse
);
func
(
dir_path
,
true
);
}
break
;
case
DT_LNK
:
break
;
case
DT_REG
:
name
=
file_util
::
path_join
(
path
,
name
);
func
(
name
,
false
);
break
;
default
:
break
;
}
}
closedir
(
dir
);
}
else
{
throw
std
::
runtime_error
(
"error enumerating file "
+
path
);
}
}
string
ngraph
::
file_util
::
tmp_filename
(
const
string
&
extension
)
{
string
tmp_template
=
file_util
::
path_join
(
file_util
::
get_temp_directory
(),
"ngraph_XXXXXX"
+
extension
);
char
*
tmpname
=
strdup
(
tmp_template
.
c_str
());
// mkstemp opens the file with open() so we need to close it
close
(
mkstemps
(
tmpname
,
static_cast
<
int
>
(
extension
.
size
())));
string
rc
=
tmpname
;
free
(
tmpname
);
return
rc
;
}
void
ngraph
::
file_util
::
touch
(
const
std
::
string
&
filename
)
{
// inspired by http://chris-sharpe.blogspot.com/2013/05/better-than-systemtouch.html
int
fd
=
open
(
filename
.
c_str
(),
O_WRONLY
|
O_CREAT
|
O_NOCTTY
|
O_NONBLOCK
,
0666
);
assert
(
fd
>=
0
);
close
(
fd
);
// update timestamp for filename
int
rc
=
utimes
(
filename
.
c_str
(),
nullptr
);
assert
(
!
rc
);
}
bool
ngraph
::
file_util
::
exists
(
const
std
::
string
&
filename
)
{
struct
stat
buffer
;
return
(
stat
(
filename
.
c_str
(),
&
buffer
)
==
0
);
}
int
ngraph
::
file_util
::
try_get_lock
(
const
std
::
string
&
filename
)
{
mode_t
m
=
umask
(
0
);
int
fd
=
open
(
filename
.
c_str
(),
O_RDWR
|
O_CREAT
,
0666
);
umask
(
m
);
if
(
fd
>=
0
&&
flock
(
fd
,
LOCK_EX
|
LOCK_NB
)
<
0
)
{
close
(
fd
);
fd
=
-
1
;
}
return
fd
;
}
void
ngraph
::
file_util
::
release_lock
(
int
fd
,
const
std
::
string
&
filename
)
{
if
(
fd
>=
0
)
{
remove_file
(
filename
);
close
(
fd
);
}
}
src/ngraph/file_util.hpp
0 → 100644
View file @
c775f01b
/*
Copyright 2016 Nervana Systems Inc.
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
http://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
*/
#pragma once
#include <functional>
#include <string>
#include <vector>
namespace
ngraph
{
class
file_util
;
}
class
ngraph
::
file_util
{
public
:
static
std
::
string
path_join
(
const
std
::
string
&
s1
,
const
std
::
string
&
s2
);
static
size_t
get_file_size
(
const
std
::
string
&
filename
);
static
void
remove_directory
(
const
std
::
string
&
dir
);
static
bool
make_directory
(
const
std
::
string
&
dir
);
static
std
::
string
make_temp_directory
(
const
std
::
string
&
path
=
""
);
static
std
::
string
get_temp_directory
();
static
void
remove_file
(
const
std
::
string
&
file
);
static
std
::
vector
<
char
>
read_file_contents
(
const
std
::
string
&
path
);
static
std
::
string
read_file_to_string
(
const
std
::
string
&
path
);
static
void
iterate_files
(
const
std
::
string
&
path
,
std
::
function
<
void
(
const
std
::
string
&
file
,
bool
is_dir
)
>
func
,
bool
recurse
=
false
);
static
std
::
string
tmp_filename
(
const
std
::
string
&
extension
=
""
);
static
void
touch
(
const
std
::
string
&
filename
);
static
bool
exists
(
const
std
::
string
&
filename
);
static
int
try_get_lock
(
const
std
::
string
&
filename
);
static
void
release_lock
(
int
fd
,
const
std
::
string
&
filename
);
private
:
static
void
iterate_files_worker
(
const
std
::
string
&
path
,
std
::
function
<
void
(
const
std
::
string
&
file
,
bool
is_dir
)
>
func
,
bool
recurse
=
false
);
};
src/ngraph/function.cpp
View file @
c775f01b
...
...
@@ -33,6 +33,7 @@ Function::Function(const std::shared_ptr<Node>& result,
,
m_ordered_ops_valid
(
false
)
,
m_instance_id
(
m_next_instance_id
.
fetch_add
(
1
))
{
m_result
->
set_is_output
();
traverse_nodes
(
this
,
[
&
](
shared_ptr
<
Node
>
node
)
{
m_ops
.
push_back
(
node
);
});
}
...
...
src/ngraph/node.cpp
View file @
c775f01b
...
...
@@ -118,6 +118,10 @@ bool Node::is_output() const
void
Node
::
set_is_output
()
{
m_is_output
=
true
;
for
(
descriptor
::
Output
&
output
:
get_outputs
())
{
output
.
get_tensor
().
set_is_output
();
}
}
std
::
string
Node
::
get_node_id
()
const
...
...
src/ngraph/pass/collect_functions.cpp
deleted
100644 → 0
View file @
431f245c
// ----------------------------------------------------------------------------
// Copyright 2017 Nervana Systems Inc.
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// ----------------------------------------------------------------------------
#include "ngraph/pass/collect_functions.hpp"
#include "ngraph/function.hpp"
#include "ngraph/log.hpp"
#include "ngraph/node.hpp"
#include "ngraph/ops/function_call.hpp"
#include "ngraph/ops/op.hpp"
#include "ngraph/util.hpp"
using
namespace
std
;
using
namespace
ngraph
;
using
namespace
ngraph
::
pass
;
bool
CollectFunctions
::
run_on_function
(
shared_ptr
<
ngraph
::
Function
>
func
)
{
set
<
shared_ptr
<
ngraph
::
Function
>>
functions
;
deque
<
shared_ptr
<
ngraph
::
Function
>>
stack
;
stack
.
push_back
(
func
);
while
(
stack
.
empty
()
==
false
)
{
shared_ptr
<
ngraph
::
Function
>
f
=
stack
.
front
();
stack
.
pop_front
();
functions
.
insert
(
f
);
traverse_nodes
(
f
,
[
&
](
shared_ptr
<
Node
>
node
)
{
shared_ptr
<
op
::
FunctionCall
>
fc
=
dynamic_pointer_cast
<
op
::
FunctionCall
>
(
node
);
if
(
fc
)
{
stack
.
push_back
(
fc
->
get_function
());
}
});
}
get_state
().
set_functions
(
functions
);
return
false
;
}
src/ngraph/pass/collect_functions.hpp
deleted
100644 → 0
View file @
431f245c
// ----------------------------------------------------------------------------
// Copyright 2017 Nervana Systems Inc.
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// ----------------------------------------------------------------------------
#pragma once
#include "ngraph/pass/pass.hpp"
namespace
ngraph
{
namespace
pass
{
class
CollectFunctions
;
}
}
class
ngraph
::
pass
::
CollectFunctions
:
public
FunctionPass
{
public
:
bool
run_on_function
(
std
::
shared_ptr
<
ngraph
::
Function
>
)
override
;
private
:
};
src/ngraph/pass/dump_sorted.cpp
View file @
c775f01b
...
...
@@ -35,6 +35,9 @@ bool pass::DumpSorted::run_on_module(vector<shared_ptr<ngraph::Function>>& funct
{
for
(
shared_ptr
<
Function
>
f
:
functions
)
{
out
<<
"=====================================================================
\n
"
;
out
<<
f
->
get_name
()
<<
" start
\n
"
;
out
<<
"=====================================================================
\n
"
;
for
(
const
shared_ptr
<
Node
>&
node
:
f
->
get_ordered_ops
())
{
out
<<
node
->
get_name
()
<<
"("
;
...
...
@@ -67,6 +70,9 @@ bool pass::DumpSorted::run_on_module(vector<shared_ptr<ngraph::Function>>& funct
out
<<
" F "
<<
tensor
->
get_name
()
<<
"
\n
"
;
}
}
out
<<
"=====================================================================
\n
"
;
out
<<
f
->
get_name
()
<<
" end
\n
"
;
out
<<
"=====================================================================
\n
"
;
}
}
...
...
src/ngraph/pass/manager.cpp
View file @
c775f01b
...
...
@@ -18,6 +18,8 @@
#include "ngraph/function.hpp"
#include "ngraph/log.hpp"
#include "ngraph/node.hpp"
#include "ngraph/ops/function_call.hpp"
#include "ngraph/ops/reduce.hpp"
#include "ngraph/pass/manager.hpp"
#include "ngraph/pass/pass.hpp"
...
...
@@ -36,10 +38,37 @@ void ngraph::pass::Manager::initialize_default_passes()
{
}
static
void
find_functions
(
shared_ptr
<
Function
>
f
,
set
<
shared_ptr
<
Function
>>&
funcs
)
{
funcs
.
insert
(
f
);
for
(
shared_ptr
<
Node
>
node
:
f
->
get_ops
())
{
shared_ptr
<
op
::
FunctionCall
>
fc
=
dynamic_pointer_cast
<
op
::
FunctionCall
>
(
node
);
if
(
fc
)
{
find_functions
(
fc
->
get_function
(),
funcs
);
}
shared_ptr
<
op
::
Reduce
>
reduce
=
dynamic_pointer_cast
<
op
::
Reduce
>
(
node
);
if
(
reduce
)
{
find_functions
(
reduce
->
get_reduction_function
(),
funcs
);
}
}
}
void
ngraph
::
pass
::
Manager
::
run_passes
(
shared_ptr
<
Function
>
func
)
{
vector
<
shared_ptr
<
Function
>>
fs
=
{
func
};
get_state
().
set_functions
(
fs
);
// find all functions
set
<
shared_ptr
<
Function
>>
tfs
;
find_functions
(
func
,
tfs
);
get_state
().
set_functions
(
tfs
);
vector
<
shared_ptr
<
Function
>>
fs
;
for
(
shared_ptr
<
Function
>
f
:
get_state
().
get_functions
())
{
fs
.
push_back
(
f
);
}
for
(
shared_ptr
<
PassBase
>
pass
:
m_pass_list
)
{
...
...
@@ -77,40 +106,6 @@ void ngraph::pass::Manager::run_passes(shared_ptr<Function> func)
}
}
}
// for (shared_ptr<ModulePass>& p : m_module_passes)
// {
// p->set_state(get_state());
// p->run_on_module(fs);
// }
// for (Function* f : fs)
// {
// for (shared_ptr<FunctionPass> p : m_function_passes)
// {
// p->set_state(get_state());
// p->run_on_function(f);
// }
// }
// for (Function* f : fs)
// {
// NGRAPH_INFO;
// for (shared_ptr<NodePass> p : m_node_passes)
// {
// for (Node* node : f->get_ops())
// {
// NGRAPH_INFO;
// p->set_state(get_state());
// p->run_on_node(node);
// }
// }
// }
// for (shared_ptr<CallGraphPass>& p : m_call_graph_passes)
// {
// p->set_state(get_state());
// p->run_on_call_graph(func->get_ordered_ops());
// }
}
ngraph
::
pass
::
ManagerState
&
ngraph
::
pass
::
Manager
::
get_state
()
...
...
src/ngraph/pass/manager_state.cpp
View file @
c775f01b
...
...
@@ -23,7 +23,7 @@
using
namespace
std
;
using
namespace
ngraph
;
vector
<
shared_ptr
<
Function
>>&
ngraph
::
pass
::
ManagerState
::
get_functions
()
const
vector
<
shared_ptr
<
Function
>>&
ngraph
::
pass
::
ManagerState
::
get_functions
()
{
return
m_function_list
;
}
...
...
src/ngraph/pass/manager_state.hpp
View file @
c775f01b
...
...
@@ -30,7 +30,7 @@ namespace ngraph
class
ngraph
::
pass
::
ManagerState
{
public
:
std
::
vector
<
std
::
shared_ptr
<
Function
>>&
get_functions
();
const
std
::
vector
<
std
::
shared_ptr
<
Function
>>&
get_functions
();
template
<
typename
T
>
void
set_functions
(
const
T
&
collection
)
...
...
src/ngraph/runtime/cpu/call_frame.cpp
View file @
c775f01b
...
...
@@ -20,10 +20,8 @@
using
namespace
std
;
using
namespace
ngraph
::
runtime
::
cpu
;
CallFrame
::
CallFrame
(
EntryPoint
compiled_function
,
const
std
::
vector
<
std
::
shared_ptr
<
CallFrame
>>&
callees
)
CallFrame
::
CallFrame
(
EntryPoint
compiled_function
)
:
m_compiled_function
(
compiled_function
)
,
m_callees
(
callees
)
{
}
...
...
@@ -31,23 +29,23 @@ void CallFrame::tensor_call(
const
std
::
vector
<
std
::
shared_ptr
<
ngraph
::
runtime
::
TensorView
>>&
input_tvs
,
const
std
::
vector
<
std
::
shared_ptr
<
ngraph
::
runtime
::
TensorView
>>&
output_tvs
)
{
m_inputs
.
clear
()
;
m_outputs
.
clear
()
;
vector
<
void
*>
inputs
;
vector
<
void
*>
outputs
;
for
(
size_t
i
=
0
;
i
<
input_tvs
.
size
();
i
++
)
{
shared_ptr
<
runtime
::
cpu
::
CPUTensorView
>
tv
=
static_pointer_cast
<
runtime
::
cpu
::
CPUTensorView
>
(
input_tvs
[
i
]);
m_
inputs
.
push_back
(
tv
->
get_data_ptr
());
inputs
.
push_back
(
tv
->
get_data_ptr
());
}
for
(
size_t
i
=
0
;
i
<
output_tvs
.
size
();
i
++
)
{
shared_ptr
<
runtime
::
cpu
::
CPUTensorView
>
tv
=
static_pointer_cast
<
runtime
::
cpu
::
CPUTensorView
>
(
output_tvs
[
i
]);
m_
outputs
.
push_back
(
tv
->
get_data_ptr
());
outputs
.
push_back
(
tv
->
get_data_ptr
());
}
// Invoke compiled computation
m_compiled_function
(
thi
s
);
m_compiled_function
(
inputs
,
output
s
);
}
void
CallFrame
::
operator
()(
const
std
::
vector
<
std
::
shared_ptr
<
ngraph
::
runtime
::
Value
>>&
arguments
,
...
...
@@ -68,15 +66,3 @@ void CallFrame::operator()(const std::vector<std::shared_ptr<ngraph::runtime::Va
tensor_call
(
inputs
,
outputs
);
}
void
*
CallFrame
::
get_input_data
(
size_t
index
)
{
void
*
rc
=
m_inputs
.
at
(
index
);
return
rc
;
}
void
*
CallFrame
::
get_output_data
(
size_t
index
)
{
void
*
rc
=
m_outputs
.
at
(
index
);
return
rc
;
}
src/ngraph/runtime/cpu/call_frame.hpp
View file @
c775f01b
...
...
@@ -32,7 +32,8 @@ namespace ngraph
{
class
CallFrame
;
using
EntryPoint_t
=
void
(
ngraph
::
runtime
::
cpu
::
CallFrame
*
call_frame
);
using
EntryPoint_t
=
void
(
const
std
::
vector
<
void
*>&
inputs
,
const
std
::
vector
<
void
*>&
outputs
);
using
EntryPoint
=
std
::
function
<
EntryPoint_t
>
;
...
...
@@ -40,8 +41,7 @@ namespace ngraph
class
CallFrame
:
public
ngraph
::
runtime
::
CallFrame
{
public
:
CallFrame
(
EntryPoint
compiled_function
,
const
std
::
vector
<
std
::
shared_ptr
<
CallFrame
>>&
callees
);
CallFrame
(
EntryPoint
compiled_function
);
/// @brief Invoke the function with values matching the signature of the function.
///
...
...
@@ -56,19 +56,9 @@ namespace ngraph
const
std
::
vector
<
std
::
shared_ptr
<
TensorView
>>&
outputs
);
void
set_return
()
{
m_return
=
true
;
}
// const std::vector<std::shared_ptr<ngraph::runtime::Value>>& get_inputs();
// const std::vector<std::shared_ptr<ngraph::runtime::Value>>& get_outputs();
void
*
get_input_data
(
size_t
index
);
void
*
get_output_data
(
size_t
index
);
protected
:
bool
m_return
;
EntryPoint
m_compiled_function
;
std
::
vector
<
std
::
shared_ptr
<
CallFrame
>>
m_callees
;
std
::
vector
<
void
*>
m_inputs
;
std
::
vector
<
void
*>
m_outputs
;
};
}
}
...
...
src/ngraph/runtime/cpu/emitter.cpp
View file @
c775f01b
...
...
@@ -935,48 +935,25 @@ void Emitter::EMITTER_DECL(EmitReshape)
void
Emitter
::
EMITTER_DECL
(
EmitFunctionCall
)
{
auto
function_call
=
static_cast
<
const
op
::
FunctionCall
*>
(
n
);
auto
function
=
function_call
->
get_function
();
shared_ptr
<
Function
>
function
=
function_call
->
get_function
();
std
::
shared_ptr
<
ExternalFunction
>
external
;
try
{
external
=
function_map
.
at
(
function
);
}
catch
(
const
std
::
out_of_range
)
{
external
=
make_shared
<
ExternalFunction
>
(
function
);
function_map
.
insert
({
function
,
external
});
}
std
::
shared_ptr
<
CallFrame
>
cf
=
std
::
dynamic_pointer_cast
<
CallFrame
>
(
external
->
make_call_frame
());
ef
->
get_callees
().
emplace_back
(
cf
);
TU
<<
"{ // "
<<
n
->
get_name
()
<<
"
\n
"
;
TU
+=
" {
\n
"
" auto cf = callees.at("
+
to_string
(
ef
->
get_callees
().
size
()
-
1
)
+
");
\n
"
" std::vector<std::shared_ptr<ngraph::runtime::Value>> inputs;
\n
"
" std::vector<std::shared_ptr<ngraph::runtime::Value>> outputs;
\n
"
;
for
(
const
auto
&
in
:
inputs
)
TU
<<
"{ // Call "
<<
function
->
get_name
()
<<
"
\n
"
;
TU
.
indent
++
;
TU
<<
"std::vector<void*> inputs;
\n
"
;
for
(
const
TensorViewInfo
&
input
:
inputs
)
{
TU
+=
" inputs.emplace_back(call_frame->get_tensor_view("
+
to_string
(
in
.
get_index
())
+
"));
\n
"
;
TU
<<
"inputs.push_back("
<<
input
.
get_tensor
().
get_name
()
<<
");
\n
"
;
}
for
(
const
auto
&
out
:
outputs
)
TU
<<
"
\n
"
;
TU
<<
"std::vector<void*> outputs;
\n
"
;
for
(
const
TensorViewInfo
&
output
:
outputs
)
{
TU
+=
" outputs.emplace_back(call_frame->get_tensor_view("
+
to_string
(
out
.
get_index
())
+
"));
\n
"
;
TU
<<
"outputs.push_back("
<<
output
.
get_tensor
().
get_name
()
<<
");
\n
"
;
}
TU
+=
" (*cf)(inputs, outputs);
\n
"
"
}
\n
"
;
TU
<<
"
\n
"
;
TU
<<
function
->
get_name
()
<<
"(inputs, outputs);
\n
"
;
TU
.
indent
--
;
TU
<<
"
}
\n
"
;
}
// TODO: This and other ops include comments/notes that
...
...
@@ -990,17 +967,17 @@ void Emitter::EMITTER_DECL(EmitReduce)
auto
reduce
=
static_cast
<
const
op
::
Reduce
*>
(
n
);
auto
reduction_function
=
reduce
->
get_reduction_function
();
std
::
shared_ptr
<
ExternalFunction
>
external
;
//
std::shared_ptr<ExternalFunction> external;
try
{
external
=
function_map
.
at
(
reduction_function
);
}
catch
(
const
std
::
out_of_range
)
{
external
=
make_shared
<
ExternalFunction
>
(
reduction_function
);
function_map
.
insert
({
reduction_function
,
external
});
}
//
try
//
{
//
external = function_map.at(reduction_function);
//
}
//
catch (const std::out_of_range)
//
{
//
external = make_shared<ExternalFunction>(reduction_function);
//
function_map.insert({reduction_function, external});
//
}
auto
reductee_type
=
reduce
->
get_arguments
().
at
(
0
)
->
get_value_type
();
auto
reductee_tensor_view_type
=
dynamic_pointer_cast
<
const
TensorViewType
>
(
reductee_type
);
...
...
@@ -1026,14 +1003,6 @@ void Emitter::EMITTER_DECL(EmitReduce)
{
TU
<<
"{ // "
<<
n
->
get_name
()
<<
" 1
\n
"
;
TU
.
indent
++
;
TU
<<
"// call_frame->get_parameterized_tensor_view<"
<<
f_result_element_type
.
c_type_string
()
<<
">("
<<
to_string
(
outputs
.
at
(
0
).
get_index
())
<<
")->get_vector() =
\n
"
<<
"// call_frame->get_parameterized_tensor_view<"
<<
f_result_element_type
.
c_type_string
()
<<
">("
<<
to_string
(
inputs
.
at
(
0
).
get_index
())
<<
")->get_vector();
\n
"
;
TU
<<
"memcpy("
<<
outputs
[
0
].
get_tensor
().
get_name
()
<<
", "
<<
inputs
[
0
].
get_tensor
().
get_name
()
<<
", "
<<
outputs
[
0
].
get_tensor_view_layout
()
->
get_size
()
*
...
...
@@ -1084,25 +1053,22 @@ void Emitter::EMITTER_DECL(EmitReduce)
}
else
{
std
::
shared_ptr
<
CallFrame
>
cf
=
std
::
dynamic_pointer_cast
<
CallFrame
>
(
external
->
make_call_frame
());
ef
->
get_callees
().
emplace_back
(
cf
);
TU
<<
"{ // "
<<
n
->
get_name
()
<<
" 3
\n
"
;
TU
.
indent
++
;
string
type
=
f_result_element_type
.
c_type_string
();
TU
<<
"using ET = "
<<
f_result_element_type
.
c_type_string
()
<<
";
\n
"
<<
"auto cf = callees.at("
<<
to_string
(
ef
->
get_callees
().
size
()
-
1
)
<<
");
\n
"
<<
"auto f = [cf]("
<<
type
<<
" x, "
<<
type
<<
" y) -> "
<<
type
<<
" {
\n
"
<<
" auto tx = ngraph::runtime::make_tensor<ET>(ngraph::Shape{});
\n
"
<<
" *tx = std::vector<"
<<
type
<<
">({x});
\n
"
<<
" auto ty = ngraph::runtime::make_tensor<ET>(ngraph::Shape{});
\n
"
<<
" *ty = std::vector<"
<<
type
<<
">({y});
\n
"
<<
" auto tr = ngraph::runtime::make_tensor<ET>(ngraph::Shape{});
\n
"
<<
" (*cf)({tx, ty}, {tr});
\n
"
<<
" return tr->get_vector()[0];
\n
"
<<
"};
\n
"
<<
"EigenArray1d<"
<<
f_result_element_type
.
c_type_string
()
<<
">("
TU
<<
"auto f = []("
<<
type
<<
" x, "
<<
type
<<
" y) -> "
<<
type
<<
" {
\n
"
;
TU
.
indent
++
;
TU
<<
"std::vector<void*> inputs;
\n
"
;
TU
<<
"inputs.push_back(&x);
\n
"
;
TU
<<
"inputs.push_back(&y);
\n\n
"
;
TU
<<
type
<<
" result;
\n
"
;
TU
<<
"std::vector<void*> outputs;
\n
"
;
TU
<<
"outputs.push_back(&result);
\n
"
;
TU
<<
reduction_function
->
get_name
()
<<
"(inputs, outputs);
\n
"
;
TU
<<
"return result;
\n
"
;
TU
.
indent
--
;
TU
<<
"};
\n
"
;
TU
<<
"EigenArray1d<"
<<
f_result_element_type
.
c_type_string
()
<<
">("
<<
outputs
[
0
].
get_tensor
().
get_name
()
<<
", "
<<
eigen_vector_format
(
outputs
[
0
])
<<
") =
\n
"
<<
" EigenArray1d<"
<<
f_result_element_type
.
c_type_string
()
<<
">("
...
...
@@ -1129,26 +1095,26 @@ void Emitter::EMITTER_DECL(EmitReduce)
}
else
{
std
::
shared_ptr
<
CallFrame
>
cf
=
std
::
dynamic_pointer_cast
<
CallFrame
>
(
external
->
make_call_frame
());
ef
->
get_callees
().
emplace_back
(
cf
);
//
std::shared_ptr<CallFrame> cf =
//
std::dynamic_pointer_cast<CallFrame>(external->make_call_frame());
//
ef->get_callees().emplace_back(cf);
TU
<<
"{ // "
<<
n
->
get_name
()
<<
" 5
\n
"
;
TU
.
indent
++
;
TU
<<
"using ET = "
<<
f_result_element_type
.
c_type_string
()
<<
";
\n
"
<<
" auto cf = callees.at("
<<
to_string
(
ef
->
get_callees
().
size
()
-
1
)
<<
");
\n
"
<<
" auto f = [cf](typename ET::type x, typename ET::type y) -> typename "
<<
"ET::type {
\n
"
<<
" auto tx = ngraph::runtime::make_tensor<ET>(ngraph::Shape{});
\n
"
<<
" *tx = std::vector<typename ET::type>({x});
\n
"
<<
" auto ty = ngraph::runtime::make_tensor<ET>(ngraph::Shape{});
\n
"
<<
" *ty = std::vector<typename ET::type>({y});
\n
"
<<
" auto tr = ngraph::runtime::make_tensor<ET>(ngraph::Shape{});
\n
"
<<
" (*cf)({tx, ty}, {tr});
\n
"
<<
" return tr->get_vector()[0];
\n
"
<<
" };
\n
"
<<
"EigenVector<"
<<
f_result_element_type
.
c_type_string
()
<<
">("
string
type
=
f_result_element_type
.
c_type_string
();
TU
<<
"auto f = []("
<<
type
<<
" x, "
<<
type
<<
" y) -> "
<<
type
<<
" {
\n
"
;
TU
.
indent
++
;
TU
<<
"std::vector<void*> inputs;
\n
"
;
TU
<<
"inputs.push_back(&x);
\n
"
;
TU
<<
"inputs.push_back(&y);
\n\n
"
;
TU
<<
type
<<
" result;
\n
"
;
TU
<<
"std::vector<void*> outputs;
\n
"
;
TU
<<
"outputs.push_back(&result);
\n
"
;
TU
<<
reduction_function
->
get_name
()
<<
"(inputs, outputs);
\n
"
;
TU
<<
"return result;
\n
"
;
TU
.
indent
--
;
TU
<<
"};
\n
"
;
TU
<<
"EigenVector<"
<<
f_result_element_type
.
c_type_string
()
<<
">("
<<
outputs
[
0
].
get_tensor
().
get_name
()
<<
", "
<<
eigen_vector_format
(
outputs
[
0
])
<<
") =
\n
"
<<
" EigenMatrix<"
<<
f_result_element_type
.
c_type_string
()
<<
">("
...
...
@@ -1176,29 +1142,25 @@ void Emitter::EMITTER_DECL(EmitReduce)
}
else
{
std
::
shared_ptr
<
CallFrame
>
cf
=
std
::
dynamic_pointer_cast
<
CallFrame
>
(
external
->
make_call_frame
());
ef
->
get_callees
().
emplace_back
(
cf
);
TU
<<
"{ // "
<<
n
->
get_name
()
<<
" 7
\n
"
;
TU
.
indent
++
;
TU
<<
" using ET = "
<<
f_result_element_type
.
c_type_string
()
<<
";
\n
"
<<
" auto cf = callees.at("
<<
to_string
(
ef
->
get_callees
().
size
()
-
1
)
<<
");
\n
"
<<
" auto f = [cf](typename ET::type x, typename ET::type y) -> typename "
<<
"ET::type {
\n
"
<<
" auto tx = ngraph::runtime::make_tensor<ET>(ngraph::Shape{});
\n
"
<<
" *tx = std::vector<typename ET::type>({x});
\n
"
<<
" auto ty = ngraph::runtime::make_tensor<ET>(ngraph::Shape{});
\n
"
<<
" *ty = std::vector<typename ET::type>({y});
\n
"
<<
" auto tr = ngraph::runtime::make_tensor<ET>(ngraph::Shape{});
\n
"
<<
" (*cf)({tx, ty}, {tr});
\n
"
<<
" return tr->get_vector()[0];
\n
"
<<
" };
\n
"
<<
"
EigenVector<"
<<
f_result_element_type
.
c_type_string
()
<<
">("
string
type
=
f_result_element_type
.
c_type_string
();
TU
<<
"auto f = []("
<<
type
<<
" x, "
<<
type
<<
" y) -> "
<<
type
<<
" {
\n
"
;
TU
.
indent
++
;
TU
<<
"std::vector<void*> inputs;
\n
"
;
TU
<<
"inputs.push_back(&x);
\n
"
;
TU
<<
"inputs.push_back(&y);
\n\n
"
;
TU
<<
type
<<
" result;
\n
"
;
TU
<<
"std::vector<void*> outputs;
\n
"
;
TU
<<
"outputs.push_back(&result);
\n
"
;
TU
<<
reduction_function
->
get_name
()
<<
"(inputs, outputs);
\n
"
;
TU
<<
"return result;
\n
"
;
TU
.
indent
--
;
TU
<<
"};
\n
"
;
TU
<<
"
EigenVector<"
<<
f_result_element_type
.
c_type_string
()
<<
">("
<<
outputs
[
0
].
get_tensor
().
get_name
()
<<
", "
<<
eigen_vector_format
(
outputs
[
0
])
<<
") =
\n
"
<<
"
EigenMatrix<"
<<
f_result_element_type
.
c_type_string
()
<<
">("
<<
" EigenMatrix<"
<<
f_result_element_type
.
c_type_string
()
<<
">("
<<
inputs
[
0
].
get_tensor
().
get_name
()
<<
", "
<<
eigen_matrix_format
(
arg0_layout
->
get_shape
(),
arg0_layout
->
get_strides
())
<<
").colwise().redux(f);
\n
"
;
...
...
src/ngraph/runtime/cpu/emitter.hpp
View file @
c775f01b
...
...
@@ -25,7 +25,6 @@
#define EMITTER_DECL(E) \
E(const ngraph::Node* n, \
ExternalFunction* ef, \
FunctionMap& function_map, \
const std::vector<TensorViewInfo>& inputs, \
const std::vector<TensorViewInfo>& outputs)
...
...
src/ngraph/runtime/cpu/external_function.cpp
View file @
c775f01b
...
...
@@ -25,6 +25,7 @@
#include "ngraph/descriptor/input.hpp"
#include "ngraph/descriptor/layout/dense_tensor_view_layout.hpp"
#include "ngraph/descriptor/output.hpp"
#include "ngraph/file_util.hpp"
#include "ngraph/function.hpp"
#include "ngraph/node.hpp"
#include "ngraph/ops/abs.hpp"
...
...
@@ -67,10 +68,10 @@
#include "ngraph/ops/tanh.hpp"
#include "ngraph/ops/tuple.hpp"
#include "ngraph/pass/assign_layout.hpp"
#include "ngraph/pass/dump_sorted.hpp"
#include "ngraph/pass/liveness.hpp"
#include "ngraph/pass/manager.hpp"
#include "ngraph/pass/memory_layout.hpp"
#include "ngraph/pass/propagate_types.hpp"
#include "ngraph/pass/topological_sort.hpp"
#include "ngraph/runtime/cpu/call_frame.hpp"
#include "ngraph/runtime/cpu/emitter.hpp"
...
...
@@ -86,7 +87,7 @@ extern "C" void
allocate_aligned_buffer
(
size_t
size
,
size_t
alignment
,
char
**
allocated
,
char
**
aligned_ptr
)
{
size_t
allocation_size
=
size
+
alignment
;
*
allocated
=
new
char
[
allocation_size
]
;
*
allocated
=
static_cast
<
char
*>
(
malloc
(
allocation_size
))
;
*
aligned_ptr
=
*
allocated
;
size_t
mod
=
size_t
(
*
aligned_ptr
)
%
alignment
;
...
...
@@ -162,16 +163,6 @@ static const OpMap dispatcher{
{
TI
(
ngraph
::
op
::
Atan
),
&
Emitter
::
EmitAtan
},
};
static
unordered_map
<
type_index
,
string
>
element_type_names
=
{
{
TI
(
ngraph
::
element
::
Bool
),
"Bool"
},
{
TI
(
ngraph
::
element
::
Float32
),
"Float32"
},
{
TI
(
ngraph
::
element
::
Int8
),
"Int8"
},
{
TI
(
ngraph
::
element
::
Int32
),
"Int32"
},
{
TI
(
ngraph
::
element
::
Int64
),
"Int64"
},
{
TI
(
ngraph
::
element
::
UInt8
),
"UInt8"
},
{
TI
(
ngraph
::
element
::
UInt32
),
"UInt32"
},
{
TI
(
ngraph
::
element
::
UInt64
),
"UInt64"
}};
ExternalFunction
::
ExternalFunction
(
const
std
::
shared_ptr
<
ngraph
::
Function
>&
function
,
bool
release_function
)
:
ngraph
::
runtime
::
ExternalFunction
(
function
,
release_function
)
...
...
@@ -179,7 +170,7 @@ ExternalFunction::ExternalFunction(const std::shared_ptr<ngraph::Function>& func
{
}
void
ExternalFunction
::
compile
(
FunctionMap
&
function_map
)
void
ExternalFunction
::
compile
()
{
if
(
m_is_compiled
)
{
...
...
@@ -192,51 +183,12 @@ void ExternalFunction::compile(FunctionMap& function_map)
pass_manager
.
register_pass
<
pass
::
AssignLayout
<
DenseTensorViewLayout
>>
();
pass_manager
.
register_pass
<
pass
::
Liveness
>
();
pass_manager
.
register_pass
<
pass
::
MemoryLayout
>
(
64
);
pass_manager
.
register_pass
<
pass
::
DumpSorted
>
(
"sorted_ops.txt"
);
pass_manager
.
run_passes
(
m_function
);
// Determine tensor requirements for the call frame
unordered_map
<
shared_ptr
<
ngraph
::
descriptor
::
TensorView
>
,
size_t
>
tensor_index
;
// First come the function outputs
for
(
const
descriptor
::
Output
&
output
:
m_function
->
get_result
()
->
get_outputs
())
{
auto
tv
=
output
.
get_tensor_view
();
size_t
index
=
tensor_index
.
size
();
tensor_index
[
tv
]
=
index
;
}
m_n_outputs
=
tensor_index
.
size
();
// Next are the function inputs
for
(
auto
param
:
m_function
->
get_parameters
())
{
for
(
const
descriptor
::
Output
&
output
:
param
->
get_outputs
())
{
auto
tv
=
output
.
get_tensor_view
();
size_t
index
=
tensor_index
.
size
();
tensor_index
[
tv
]
=
index
;
}
}
m_n_inputs
=
tensor_index
.
size
()
-
m_n_outputs
;
// All remaining tensor views
for
(
shared_ptr
<
Node
>
node
:
m_function
->
get_ordered_ops
())
{
for
(
const
descriptor
::
Output
&
output
:
node
->
get_outputs
())
{
auto
tv
=
output
.
get_tensor_view
();
if
(
0
==
tensor_index
.
count
(
tv
))
{
size_t
index
=
tensor_index
.
size
();
tensor_index
[
tv
]
=
index
;
m_temp_views
.
push_back
(
tv
);
}
}
}
// Now we build the TU
Emitter
emitter
;
codegen
::
CodeWriter
&
TU
=
emitter
.
get_code_writer
();
string
function_name
=
m_function
->
get_name
()
+
"_entrypoint"
;
TU
+=
R"(// Generated by the NGraph CPU backend
...
...
@@ -267,95 +219,117 @@ extern "C" void free_aligned_buffer(void* allocated);
)"
;
TU
<<
"extern
\"
C
\"
void "
<<
function_name
<<
"(
\n
"
;
TU
<<
" ngraph::runtime::cpu::CallFrame * call_frame)
\n
"
;
TU
<<
"{
\n
"
;
TU
.
indent
++
;
TU
<<
"// Allocate the memory pool
\n
"
;
size_t
temp_pool_size
=
pass_manager
.
get_state
().
get_temporary_pool_size
();
TU
<<
"char* allocated_buffer_pool;
\n
"
;
TU
<<
"char* aligned_buffer_pool;
\n
"
;
TU
<<
"allocate_aligned_buffer("
<<
temp_pool_size
<<
", 64"
<<
", &allocated_buffer_pool, &aligned_buffer_pool);
\n
"
;
TU
<<
"
\n
"
;
TU
<<
"// Define temporary tensors
\n
"
;
for
(
shared_ptr
<
Node
>
node
:
m_function
->
get_ordered_ops
())
TU
<<
"// Declare any functions that are not main
\n
"
;
for
(
shared_ptr
<
Function
>
f
:
pass_manager
.
get_state
().
get_functions
())
{
for
(
descriptor
::
Tensor
*
tensor
:
node
->
liveness_new_list
)
if
(
f
!=
m_function
)
{
TU
<<
tensor
->
get_element_type
()
<<
"* "
<<
tensor
->
get_name
()
<<
" = ("
<<
tensor
->
get_element_type
()
<<
"*)(aligned_buffer_pool + "
<<
tensor
->
get_pool_offset
()
<<
"
);
\n
"
;
TU
<<
"extern
\"
C
\"
void "
<<
f
->
get_name
()
<<
"(
\n
"
;
TU
<<
" const std::vector<void*>& inputs,
\n
"
;
TU
<<
" const std::vector<void*>& outputs
);
\n
"
;
}
}
TU
<<
"
\n
"
;
TU
<<
"// Define inputs
\n
"
;
size_t
arg_index
=
0
;
for
(
shared_ptr
<
op
::
Parameter
>
param
:
m_function
->
get_parameters
())
for
(
shared_ptr
<
Function
>
current_function
:
pass_manager
.
get_state
().
get_functions
())
{
for
(
const
descriptor
::
Output
&
output
:
param
->
get_outputs
())
TU
<<
"extern
\"
C
\"
void "
<<
current_function
->
get_name
()
<<
"(
\n
"
;
TU
<<
" const std::vector<void*>& inputs,
\n
"
;
TU
<<
" const std::vector<void*>& outputs)
\n
"
;
TU
<<
"{
\n
"
;
TU
.
indent
++
;
TU
<<
"// Allocate the memory pool
\n
"
;
size_t
temp_pool_size
=
pass_manager
.
get_state
().
get_temporary_pool_size
();
TU
<<
"char* allocated_buffer_pool;
\n
"
;
TU
<<
"char* aligned_buffer_pool;
\n
"
;
TU
<<
"allocate_aligned_buffer("
<<
temp_pool_size
<<
", 64"
<<
", &allocated_buffer_pool, &aligned_buffer_pool);
\n
"
;
TU
<<
"
\n
"
;
TU
<<
"// Define temporary tensors
\n
"
;
for
(
shared_ptr
<
Node
>
node
:
current_function
->
get_ordered_ops
())
{
shared_ptr
<
descriptor
::
TensorView
>
tv
=
output
.
get_tensor_view
();
const
element
::
Type
&
et
=
tv
->
get_tensor_view_type
()
->
get_element_type
();
string
type
=
et
.
c_type_string
();
TU
<<
""
<<
type
<<
"* "
<<
tv
->
get_tensor
().
get_name
()
<<
" = static_cast<"
<<
type
<<
"*>(call_frame->get_input_data("
<<
arg_index
<<
")
);
\n
"
;
arg_index
++
;
for
(
descriptor
::
Tensor
*
tensor
:
node
->
liveness_new_list
)
{
TU
<<
tensor
->
get_element_type
()
<<
"* "
<<
tensor
->
get_name
()
<<
" = ("
<<
tensor
->
get_element_type
()
<<
"*)(aligned_buffer_pool + "
<<
tensor
->
get_pool_offset
()
<<
"
);
\n
"
;
}
}
}
TU
<<
"
\n
"
;
TU
<<
"
\n
"
;
TU
<<
"// Define outputs
\n
"
;
size_t
output_index
=
0
;
for
(
const
descriptor
::
Output
&
output
:
m_function
->
get_result
()
->
get_outputs
())
{
shared_ptr
<
descriptor
::
TensorView
>
tv
=
output
.
get_tensor_view
();
const
element
::
Type
&
et
=
tv
->
get_tensor_view_type
()
->
get_element_type
();
string
type
=
et
.
c_type_string
();
TU
<<
type
<<
"* "
<<
tv
->
get_tensor
().
get_name
()
<<
" = static_cast<"
<<
type
<<
"*>(call_frame->get_output_data("
<<
output_index
<<
"));
\n
"
;
output_index
++
;
}
TU
<<
"
\n
"
;
TU
<<
"// Define tensor views
\n
"
;
TU
<<
"
\n
"
;
for
(
shared_ptr
<
Node
>
node
:
m_function
->
get_ordered_ops
())
{
auto
&
n
=
*
node
;
// Work around a compiler warning (*node inside typeid may have effects
// with shared pointers, which is fine here but clang doesn't like it.)
auto
handler
=
dispatcher
.
find
(
type_index
(
typeid
(
n
)));
if
(
handler
==
dispatcher
.
end
())
TU
<<
"// Define inputs
\n
"
;
size_t
arg_index
=
0
;
for
(
shared_ptr
<
op
::
Parameter
>
param
:
current_function
->
get_parameters
())
{
throw
ngraph_error
(
"Unhandled op during code generation : "
+
node
->
description
());
for
(
const
descriptor
::
Output
&
output
:
param
->
get_outputs
())
{
shared_ptr
<
descriptor
::
TensorView
>
tv
=
output
.
get_tensor_view
();
const
element
::
Type
&
et
=
tv
->
get_tensor_view_type
()
->
get_element_type
();
string
type
=
et
.
c_type_string
();
TU
<<
""
<<
type
<<
"* "
<<
tv
->
get_tensor
().
get_name
()
<<
" = static_cast<"
<<
type
<<
"*>(inputs["
<<
arg_index
<<
"]);
\n
"
;
arg_index
++
;
}
}
std
::
vector
<
TensorViewInfo
>
in
;
for
(
const
descriptor
::
Input
&
input
:
node
->
get_inputs
())
TU
<<
"
\n
"
;
TU
<<
"// Define outputs
\n
"
;
size_t
output_index
=
0
;
for
(
const
descriptor
::
Output
&
output
:
current_function
->
get_result
()
->
get_outputs
())
{
const
descriptor
::
Output
&
output
=
input
.
get_output
();
auto
tv
=
output
.
get_tensor_view
();
in
.
push_back
({
tensor_index
.
at
(
tv
),
tv
});
shared_ptr
<
descriptor
::
TensorView
>
tv
=
output
.
get_tensor_view
();
const
element
::
Type
&
et
=
tv
->
get_tensor_view_type
()
->
get_element_type
();
string
type
=
et
.
c_type_string
();
TU
<<
type
<<
"* "
<<
tv
->
get_tensor
().
get_name
()
<<
" = static_cast<"
<<
type
<<
"*>(outputs["
<<
output_index
<<
"]);
\n
"
;
output_index
++
;
}
std
::
vector
<
TensorViewInfo
>
out
;
for
(
const
descriptor
::
Output
&
output
:
node
->
get_outputs
())
TU
<<
"
\n
"
;
TU
<<
"// Define tensor views
\n
"
;
TU
<<
"
\n
"
;
for
(
shared_ptr
<
Node
>
node
:
current_function
->
get_ordered_ops
())
{
auto
tv
=
output
.
get_tensor_view
();
out
.
push_back
({
tensor_index
.
at
(
tv
),
tv
});
auto
&
n
=
*
node
;
// Work around a compiler warning (*node inside typeid may have effects
// with shared pointers, which is fine here but clang doesn't like it.)
auto
handler
=
dispatcher
.
find
(
type_index
(
typeid
(
n
)));
if
(
handler
==
dispatcher
.
end
())
{
throw
ngraph_error
(
"Unhandled op during code generation : "
+
node
->
description
());
}
std
::
vector
<
TensorViewInfo
>
in
;
for
(
const
descriptor
::
Input
&
input
:
node
->
get_inputs
())
{
const
descriptor
::
Output
&
output
=
input
.
get_output
();
auto
tv
=
output
.
get_tensor_view
();
in
.
push_back
({
0
,
tv
});
}
std
::
vector
<
TensorViewInfo
>
out
;
for
(
const
descriptor
::
Output
&
output
:
node
->
get_outputs
())
{
auto
tv
=
output
.
get_tensor_view
();
out
.
push_back
({
0
,
tv
});
}
handler
->
second
(
&
emitter
,
node
.
get
(),
this
,
in
,
out
);
}
handler
->
second
(
&
emitter
,
node
.
get
(),
this
,
function_map
,
in
,
out
);
}
TU
.
indent
--
;
TU
.
indent
--
;
// End TU
TU
+=
"}
\n
"
;
// End TU
TU
+=
"}
\n\n
"
;
}
// TODO: Cleanup and make this a utility function
ofstream
out
(
"__ngcpu_codegen.cpp"
);
string
output_dir
=
"cpu_codegen"
;
string
function_name
=
m_function
->
get_name
();
// file_util::remove_directory(output_dir);
file_util
::
make_directory
(
output_dir
);
string
filename
=
file_util
::
path_join
(
output_dir
,
function_name
+
"_codegen.cpp"
);
ofstream
out
(
filename
);
string
code
=
TU
.
get_code
();
out
<<
code
;
out
.
close
();
...
...
@@ -370,7 +344,7 @@ extern "C" void free_aligned_buffer(void* allocated);
estate
.
set_debuginfo_enabled
(
true
);
#endif
auto
llvm_module
=
estate
.
compile
(
code
,
"__ngcpu
_codegen.cpp"
);
auto
llvm_module
=
estate
.
compile
(
code
,
function_name
+
"
_codegen.cpp"
);
if
(
llvm_module
==
nullptr
)
{
throw
runtime_error
(
"function failed to compile"
);
...
...
@@ -389,12 +363,10 @@ extern "C" void free_aligned_buffer(void* allocated);
shared_ptr
<
ngraph
::
runtime
::
CallFrame
>
ExternalFunction
::
make_call_frame
()
{
FunctionMap
function_map
;
if
(
!
m_is_compiled
)
{
compile
(
function_map
);
compile
();
}
return
make_shared
<
ngraph
::
runtime
::
cpu
::
CallFrame
>
(
m_compiled_function
,
callees
);
return
make_shared
<
ngraph
::
runtime
::
cpu
::
CallFrame
>
(
m_compiled_function
);
}
src/ngraph/runtime/cpu/external_function.hpp
View file @
c775f01b
...
...
@@ -42,7 +42,6 @@ namespace ngraph
using
OpFunction
=
std
::
function
<
void
(
Emitter
*
,
const
ngraph
::
Node
*
,
ExternalFunction
*
,
FunctionMap
&
,
const
std
::
vector
<
TensorViewInfo
>&
inputs
,
const
std
::
vector
<
TensorViewInfo
>&
outputs
)
>
;
...
...
@@ -54,15 +53,11 @@ namespace ngraph
ExternalFunction
(
const
std
::
shared_ptr
<
ngraph
::
Function
>&
function
,
bool
release_function
=
true
);
std
::
shared_ptr
<
ngraph
::
runtime
::
CallFrame
>
make_call_frame
();
std
::
vector
<
std
::
shared_ptr
<
CallFrame
>>&
get_callees
()
{
return
callees
;
}
protected
:
void
compile
(
FunctionMap
&
function_map
);
void
compile
();
size_t
m_n_inputs
;
size_t
m_n_outputs
;
ngraph
::
descriptor
::
TensorViewPtrs
m_temp_views
;
EntryPoint
m_compiled_function
;
std
::
vector
<
std
::
shared_ptr
<
CallFrame
>>
callees
;
};
}
}
...
...
test/backend_test.in.cpp
View file @
c775f01b
...
...
@@ -1422,10 +1422,10 @@ TEST(${BACKEND_NAME}, reduce_trivial)
auto
cf
=
backend
->
make_call_frame
(
external
);
// Create some tensors for input/output
auto
a
=
runtime
::
make_tensor
<
element
::
Float32
>
(
shape
);
auto
a
=
backend
->
make_primary_tensor_view
(
element
::
Float32
::
element_type
(),
shape
);
copy_data
(
a
,
vector
<
float
>
{
1
,
2
,
3
,
4
});
auto
b
=
runtime
::
make_tensor
<
element
::
Float32
>
(
shape
);
copy_data
(
b
,
vector
<
float
>
{
0
});
auto
b
=
backend
->
make_primary_tensor_view
(
element
::
Float32
::
element_type
(),
shape
);
copy_data
(
b
,
vector
<
float
>
{
0
,
0
,
0
,
0
});
auto
result
=
backend
->
make_primary_tensor_view
(
element
::
Float32
::
element_type
(),
shape
);
(
*
cf
)({
a
,
b
},
{
result
});
...
...
test/tensor.cpp
View file @
c775f01b
...
...
@@ -113,3 +113,24 @@ TEST(tensor, read_write)
test_read_write
<
element
::
Float32
>
({
1.0
,
3.0
,
5.0
});
test_read_write
<
element
::
Int64
>
({
-
1
,
2
,
4
});
}
TEST
(
tensor
,
output_flag
)
{
pass
::
Manager
pass_manager
;
pass_manager
.
register_pass
<
pass
::
TopologicalSort
>
();
pass_manager
.
register_pass
<
pass
::
Liveness
>
();
auto
arg0
=
make_shared
<
op
::
Parameter
>
(
element
::
Float32
::
element_type
(),
Shape
{
1
});
auto
add
=
make_shared
<
op
::
Add
>
(
arg0
,
arg0
);
auto
rt
=
make_shared
<
TensorViewType
>
(
element
::
Float32
::
element_type
(),
Shape
{
1
});
auto
f0
=
make_shared
<
Function
>
(
add
,
rt
,
op
::
Parameters
{
arg0
});
pass_manager
.
run_passes
(
f0
);
EXPECT_TRUE
(
f0
->
get_result
()
->
is_output
());
for
(
descriptor
::
Output
&
output
:
f0
->
get_result
()
->
get_outputs
())
{
const
Tensor
&
t
=
output
.
get_tensor
();
EXPECT_TRUE
(
t
.
is_output
());
}
}
test/topological_sort.cpp
View file @
c775f01b
...
...
@@ -21,7 +21,6 @@
#include "ngraph/log.hpp"
#include "ngraph/ngraph.hpp"
#include "ngraph/pass/collect_functions.hpp"
#include "ngraph/pass/dump_sorted.hpp"
#include "ngraph/pass/manager.hpp"
#include "ngraph/pass/topological_sort.hpp"
...
...
@@ -172,11 +171,11 @@ TEST(topological_sort, collect_functions)
"h"
);
pass
::
Manager
pass_manager
;
pass_manager
.
register_pass
<
pass
::
CollectFunctions
>
();
pass_manager
.
run_passes
(
h
);
set
<
string
>
expected
=
{
"f"
,
"g"
,
"h"
};
auto
functions
=
pass_manager
.
get_state
().
get_functions
();
vector
<
string
>
fnames
;
for
(
shared_ptr
<
Function
>
func
:
functions
)
{
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment