IntelGPU backend. Use clDNN broadcast and fix compilation (#1648)

74a3a354 · shssf · Robert Kimball · 2c03914e · 74a3a354
Commit 74a3a354 authored Sep 21, 2018 by shssf; committed by Robert Kimball Sep 21, 2018
Hide whitespace changes
Inline Side-by-side

Showing with 10 additions and 5 deletions

intelgpu_backend.cpp src/ngraph/runtime/intelgpu/intelgpu_backend.cpp +10 -5

No files found.
--- a/src/ngraph/runtime/intelgpu/intelgpu_backend.cpp
+++ b/src/ngraph/runtime/intelgpu/intelgpu_backend.cpp
@@ -17,6 +17,7 @@
 #include <CPP/activation.hpp>
 #include <CPP/activation_grad.hpp>
 #include <CPP/batch_norm.hpp>
+#include <CPP/broadcast.hpp>
 #include <CPP/concatenation.hpp>
 #include <CPP/convolution.hpp>
 #include <CPP/data.hpp>
@@ -592,6 +593,15 @@ bool runtime::intelgpu::IntelGPUBackend::compile(shared_ptr<Function> func)
            {
                do_equal_propagation(topology, get_input_name(op), get_output_name(op));
            }
+            else if (get_input_shape(op).empty() ||
+                     (get_input_shape(op).size() == 1 && get_input_shape(op).at(0) == 1))
+            {
+                const cldnn::tensor output_tensor_size =
+                    runtime::intelgpu::IntelGPULayout::create_cldnn_tensor(get_output_shape(op));
+                const cldnn::broadcast cldnn_broadcast(
+                    get_output_name(op), get_input_name(op), output_tensor_size);
+                topology.add(cldnn_broadcast);
+            }
            else
            {
                do_bcast_sum_operation(topology,
@@ -1197,9 +1207,6 @@ bool runtime::intelgpu::IntelGPUBackend::compile(shared_ptr<Function> func)
        case OP_TYPEID::AllReduce:
        case OP_TYPEID::ArgMax:
        case OP_TYPEID::ArgMin:
-        case OP_TYPEID::Atan:
-        case OP_TYPEID::Ceiling:
-        case OP_TYPEID::Floor:
        case OP_TYPEID::FunctionCall:
        case OP_TYPEID::LRN:
        case OP_TYPEID::Reduce:
@@ -1207,9 +1214,7 @@ bool runtime::intelgpu::IntelGPUBackend::compile(shared_ptr<Function> func)
        case OP_TYPEID::ReplaceSlice:
        case OP_TYPEID::ReverseSequence:
        case OP_TYPEID::SelectAndScatter:
-        case OP_TYPEID::Sign:
        case OP_TYPEID::StopGradient:
-        case OP_TYPEID::Tan:
        case OP_TYPEID::TopK:
        {
            throw unsupported_op("Unsupported op '" + op->description() +