Skip to content
Projects
Groups
Snippets
Help
Loading...
Sign in / Register
Toggle navigation
N
ngraph
Project
Project
Details
Activity
Cycle Analytics
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Charts
Issues
0
Issues
0
List
Board
Labels
Milestones
Merge Requests
0
Merge Requests
0
CI / CD
CI / CD
Pipelines
Jobs
Schedules
Charts
Packages
Packages
Wiki
Wiki
Snippets
Snippets
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Charts
Create a new issue
Jobs
Commits
Issue Boards
Open sidebar
submodule
ngraph
Commits
ffcf2760
Unverified
Commit
ffcf2760
authored
Feb 08, 2019
by
Robert Kimball
Committed by
GitHub
Feb 08, 2019
Browse files
Options
Browse Files
Download
Plain Diff
Merge branch 'master' into master
parents
21205070
e327fe57
Show whitespace changes
Inline
Side-by-side
Showing
4 changed files
with
50 additions
and
57 deletions
+50
-57
intelgpu_op_broadcast.cpp
src/ngraph/runtime/intelgpu/intelgpu_op_broadcast.cpp
+9
-6
intelgpu_op_custom_kernels.cpp
src/ngraph/runtime/intelgpu/intelgpu_op_custom_kernels.cpp
+29
-25
intelgpu_op_custom_kernels.hpp
src/ngraph/runtime/intelgpu/intelgpu_op_custom_kernels.hpp
+2
-0
unit_test.manifest
src/ngraph/runtime/intelgpu/unit_test.manifest
+10
-26
No files found.
src/ngraph/runtime/intelgpu/intelgpu_op_broadcast.cpp
View file @
ffcf2760
...
@@ -191,13 +191,16 @@ void runtime::intelgpu::do_max_min_operation(cldnn::topology& topology,
...
@@ -191,13 +191,16 @@ void runtime::intelgpu::do_max_min_operation(cldnn::topology& topology,
{
{
const
string
function_name
=
"min_max_"
+
output_name
;
const
string
function_name
=
"min_max_"
+
output_name
;
const
size_t
input_size
=
shape_size
<
Shape
>
(
input_shape
);
const
size_t
input_size
=
shape_size
<
Shape
>
(
input_shape
);
const
string
&
init_value
=
is_min
?
"INFINITY"
:
"-INFINITY"
;
const
string
&
init_value
=
get_opencl_type_min_max_value
(
output_type
,
!
is_min
)
;
const
string
&
operation
=
is_min
?
" < "
:
" > "
;
const
string
&
operation
=
is_min
?
" < "
:
" > "
;
codegen
::
CodeWriter
writer
;
codegen
::
CodeWriter
writer
;
writer
<<
"__kernel void "
<<
function_name
<<
"(const __global float input"
runtime
::
intelgpu
::
gen_func_def
(
writer
,
<<
array_dims
(
input_shape
)
<<
", __global float output"
<<
array_dims
(
output_shape
)
function_name
,
<<
")
\n
"
;
{
get_opencl_type_name
(
output_type
)},
{
input_shape
},
get_opencl_type_name
(
output_type
),
output_shape
);
writer
.
block_begin
();
writer
.
block_begin
();
{
{
...
@@ -231,11 +234,11 @@ void runtime::intelgpu::do_max_min_operation(cldnn::topology& topology,
...
@@ -231,11 +234,11 @@ void runtime::intelgpu::do_max_min_operation(cldnn::topology& topology,
++
var_idx
;
++
var_idx
;
}
}
writer
<<
"if (input"
<<
access_dims
(
input_shape
)
<<
operation
<<
"output"
writer
<<
"if (input
0
"
<<
access_dims
(
input_shape
)
<<
operation
<<
"output"
<<
access_dims
(
input_shape
,
"i"
,
axis
)
<<
")
\n
"
;
<<
access_dims
(
input_shape
,
"i"
,
axis
)
<<
")
\n
"
;
writer
.
block_begin
();
writer
.
block_begin
();
{
{
writer
<<
"output"
<<
access_dims
(
input_shape
,
"i"
,
axis
)
<<
" = input"
writer
<<
"output"
<<
access_dims
(
input_shape
,
"i"
,
axis
)
<<
" = input
0
"
<<
access_dims
(
input_shape
)
<<
";
\n
"
;
<<
access_dims
(
input_shape
)
<<
";
\n
"
;
}
}
writer
.
block_end
();
writer
.
block_end
();
...
...
src/ngraph/runtime/intelgpu/intelgpu_op_custom_kernels.cpp
View file @
ffcf2760
...
@@ -28,34 +28,38 @@ using namespace ngraph;
...
@@ -28,34 +28,38 @@ using namespace ngraph;
string
runtime
::
intelgpu
::
get_opencl_type_name
(
const
element
::
Type
&
ngraph_type
)
string
runtime
::
intelgpu
::
get_opencl_type_name
(
const
element
::
Type
&
ngraph_type
)
{
{
if
(
ngraph_type
==
ngraph
::
element
::
i64
)
switch
(
ngraph_type
.
get_type_enum
()
)
{
{
return
"long"
;
case
element
:
:
Type_t
::
i64
:
return
"long"
;
case
element
:
:
Type_t
::
i32
:
return
"int"
;
case
element
:
:
Type_t
::
i16
:
return
"short"
;
case
element
:
:
Type_t
::
u16
:
return
"ushort"
;
case
element
:
:
Type_t
::
i8
:
return
"char"
;
case
element
:
:
Type_t
::
u8
:
return
"uchar"
;
}
}
else
if
(
ngraph_type
==
ngraph
::
element
::
i32
)
{
return
"int"
;
}
else
if
(
ngraph_type
==
ngraph
::
element
::
i16
)
{
return
"short"
;
}
else
if
(
ngraph_type
==
ngraph
::
element
::
u16
)
{
return
"ushort"
;
}
else
if
(
ngraph_type
==
ngraph
::
element
::
i8
)
{
return
"char"
;
}
else
if
(
ngraph_type
==
ngraph
::
element
::
u8
)
{
return
"uchar"
;
}
else
{
return
ngraph_type
.
c_type_string
();
return
ngraph_type
.
c_type_string
();
}
}
string
runtime
::
intelgpu
::
get_opencl_type_min_max_value
(
const
element
::
Type
&
ngraph_type
,
bool
is_min
)
{
switch
(
ngraph_type
.
get_type_enum
())
{
case
element
:
:
Type_t
::
f32
:
return
is_min
?
"-INFINITY"
:
"INFINITY"
;
case
element
:
:
Type_t
::
f64
:
return
is_min
?
"-INFINITY"
:
"INFINITY"
;
case
element
:
:
Type_t
::
i64
:
return
is_min
?
"LONG_MIN"
:
"LONG_MAX"
;
case
element
:
:
Type_t
::
u64
:
return
is_min
?
"0"
:
"ULONG_MAX"
;
case
element
:
:
Type_t
::
i32
:
return
is_min
?
"INT_MIN"
:
"INT_MAX"
;
case
element
:
:
Type_t
::
u32
:
return
is_min
?
"0"
:
"UINT_MAX"
;
case
element
:
:
Type_t
::
i16
:
return
is_min
?
"SHRT_MIN"
:
"SHRT_MAX"
;
case
element
:
:
Type_t
::
u16
:
return
is_min
?
"0"
:
"USHRT_MAX"
;
case
element
:
:
Type_t
::
i8
:
return
is_min
?
"CHAR_MIN"
:
"CHAR_MAX"
;
case
element
:
:
Type_t
::
u8
:
return
is_min
?
"0"
:
"UCHAR_MAX"
;
}
throw
ngraph_error
(
"Unsupported type '"
+
ngraph_type
.
c_type_string
()
+
"' in runtime::intelgpu::get_opencl_type_min_max_value()"
);
}
}
vector
<
cldnn_arg
>
runtime
::
intelgpu
::
get_kernel_args
(
size_t
input
,
size_t
output
)
vector
<
cldnn_arg
>
runtime
::
intelgpu
::
get_kernel_args
(
size_t
input
,
size_t
output
)
...
...
src/ngraph/runtime/intelgpu/intelgpu_op_custom_kernels.hpp
View file @
ffcf2760
...
@@ -197,6 +197,8 @@ namespace ngraph
...
@@ -197,6 +197,8 @@ namespace ngraph
// Helper functions used in cldnn::custom_gpu_primitive kernels
// Helper functions used in cldnn::custom_gpu_primitive kernels
std
::
string
get_opencl_type_name
(
const
element
::
Type
&
ngraph_type
);
std
::
string
get_opencl_type_name
(
const
element
::
Type
&
ngraph_type
);
std
::
string
get_opencl_type_min_max_value
(
const
element
::
Type
&
ngraph_type
,
bool
is_min
);
std
::
vector
<
cldnn_arg
>
get_kernel_args
(
size_t
input
,
size_t
output
);
std
::
vector
<
cldnn_arg
>
get_kernel_args
(
size_t
input
,
size_t
output
);
std
::
string
array_dims
(
const
Shape
&
dimentions
,
const
AxisSet
&
axis
=
{});
std
::
string
array_dims
(
const
Shape
&
dimentions
,
const
AxisSet
&
axis
=
{});
std
::
string
access_dims
(
const
Shape
&
dimentions
,
std
::
string
access_dims
(
const
Shape
&
dimentions
,
...
...
src/ngraph/runtime/intelgpu/unit_test.manifest
View file @
ffcf2760
all_2x2x3_eliminate_dims_0_1
argmax_4D_axis_3_i64_in_i32
argmin_trivial_in_double
argmin_trivial_in_i32
avg_pool_2d_2channel_2image_padded_only_above_do_not_include_in_computation
avg_pool_2d_2channel_2image_padded_only_above_do_not_include_in_computation
avg_pool_2d_2channel_2image_padded_only_above_include_in_computation
avg_pool_2d_2channel_2image_padded_only_above_include_in_computation
avg_pool_3d_uneven_strided_padded
avg_pool_3d_uneven_strided_padded
backwards_batch_norm_three_outputs
backwards_batch_norm_training
backwards_batch_norm_training
backwards_dot_scalar_tensor
backwards_dot_scalar_tensor
backwards_dot_tensor3_tensor3
backwards_dot_tensor_scalar
backwards_dot_tensor_scalar
backwards_dot_tensor_vector
backwards_dot_tensor_vector
backwards_exp
backwards_maxpool_n2_c1_hw5_3x3_str2_max
backwards_maxpool_n2_c1_hw5_3x3_str2_max
backwards_maxpool_n4_c1_hw4_2x2_max
backwards_maxpool_n4_c1_hw4_2x2_max
backwards_replace_slice
backwards_replace_slice
backwards_reverse_sequence_n3_c2_h3
backwards_reverse_sequence_n3_c2_h3
backwards_reverse_sequence_n4d2c3h2w2
backwards_reverse_sequence_n4d2c3h2w2
backwards_slice
backwards_slice
ba
ckwards_tanh
ba
tch_norm_bprop_n4c3h2w2
batch_norm_inference_0eps_f64
batch_norm_inference_0eps_f64
batch_norm_inference_f64
batch_norm_inference_f64
batch_norm_training_0eps_f64
batch_norm_training_0eps_f64
batch_norm_one_output
batch_norm_three_outputs
batch_norm_bprop_n4c3h2w2
dequantize
dequantize
dequantize_axes
dequantize_axes
dequantize_dynamic_offset
dequantize_dynamic_offset
...
@@ -30,10 +28,11 @@ dequantize_int8
...
@@ -30,10 +28,11 @@ dequantize_int8
dequantize_int8_zero_offset
dequantize_int8_zero_offset
dequantize_zero_offset
dequantize_zero_offset
divide_by_zero_int32
divide_by_zero_int32
embedding_lookup_4x5_reverse
embedding_lookup_10x1_arbitrary
embedding_lookup_10x1_arbitrary
embedding_lookup_10x1_arbitrary_index_type_int
embedding_lookup_10x1_arbitrary_index_type_int
embedding_lookup_4x5_reverse
generate_mask
generate_mask
max_3d_to_scalar_double
max_pool_3d
max_pool_3d
numeric_double_inf
numeric_double_inf
numeric_double_nan
numeric_double_nan
...
@@ -74,6 +73,9 @@ shape_of_scalar
...
@@ -74,6 +73,9 @@ shape_of_scalar
shape_of_vector
shape_of_vector
softmax_axis_3d_double
softmax_axis_3d_double
sum_stable_acc
sum_stable_acc
sum_stable_acc_double
sum_stable_simple_double
sum_trivial_in_double
topk_1d_max_all
topk_1d_max_all
topk_1d_max_one
topk_1d_max_one
topk_1d_max_partial
topk_1d_max_partial
...
@@ -127,21 +129,3 @@ zero_sized_sqrt
...
@@ -127,21 +129,3 @@ zero_sized_sqrt
zero_sized_subtract
zero_sized_subtract
zero_sized_tan
zero_sized_tan
zero_sized_tanh
zero_sized_tanh
shape_of_scalar
shape_of_vector
shape_of_matrix
shape_of_5d
sum_stable_acc
sum_stable_acc_double
sum_stable_simple_double
sum_trivial_in_double
max_matrix_rows_zero_int32
max_to_scalar_int8
min_to_scalar_int8
max_3d_to_scalar_double
argmin_trivial_in_i32
argmax_4D_axis_3_i64_in_i32
argmin_trivial_in_double
all_2x2x3_eliminate_dim_1
all_2x2x3_eliminate_dim_2
all_2x2x3_eliminate_dims_0_1
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment