Unverified Commit 3d9004c0 authored by Chris Sullivan's avatar Chris Sullivan Committed by GitHub

Bring NVIDIA GPU backend up to date with nGraph master. (#4306)

Co-authored-by: 's avatarRobert Kimball <robert.kimball@intel.com>
parent 670c74af
...@@ -20,12 +20,17 @@ ...@@ -20,12 +20,17 @@
#include <vector> #include <vector>
#include "ngraph/log.hpp" #include "ngraph/log.hpp"
#include "ngraph/op/convolution.hpp"
#include "ngraph/op/max.hpp"
#include "ngraph/op/max_pool.hpp"
#include "ngraph/op/min.hpp"
#include "ngraph/runtime/gpu/cudnn_emitter.hpp" #include "ngraph/runtime/gpu/cudnn_emitter.hpp"
#include "ngraph/runtime/gpu/gpu_emitter.hpp" #include "ngraph/runtime/gpu/gpu_emitter.hpp"
#include "ngraph/runtime/gpu/gpu_invoke.hpp" #include "ngraph/runtime/gpu/gpu_invoke.hpp"
#include "ngraph/runtime/gpu/gpu_primitive_emitter.hpp" #include "ngraph/runtime/gpu/gpu_primitive_emitter.hpp"
#include "ngraph/runtime/gpu/gpu_runtime_context.hpp" #include "ngraph/runtime/gpu/gpu_runtime_context.hpp"
#include "ngraph/runtime/gpu/gpu_util.hpp" #include "ngraph/runtime/gpu/gpu_util.hpp"
#include "ngraph/runtime/gpu/op/rnn.hpp"
#include "ngraph/runtime/gpu/type_info.hpp" #include "ngraph/runtime/gpu/type_info.hpp"
#include "ngraph/util.hpp" #include "ngraph/util.hpp"
......
...@@ -31,14 +31,21 @@ ...@@ -31,14 +31,21 @@
#include "ngraph/runtime/gpu/gpu_runtime_context.hpp" #include "ngraph/runtime/gpu/gpu_runtime_context.hpp"
#include "ngraph/shape.hpp" #include "ngraph/shape.hpp"
#include "ngraph/op/convolution.hpp"
#include "ngraph/op/max.hpp"
#include "ngraph/op/max_pool.hpp"
#include "ngraph/op/min.hpp"
#include "ngraph/runtime/gpu/op/rnn.hpp"
namespace ngraph namespace ngraph
{ {
namespace op
{
class Convolution;
class ConvolutionBackpropData;
class ConvolutionBackpropFilters;
class MaxPool;
class Max;
class Min;
namespace gpu
{
class Rnn;
}
}
namespace runtime namespace runtime
{ {
namespace gpu namespace gpu
......
...@@ -33,20 +33,11 @@ ...@@ -33,20 +33,11 @@
using namespace ngraph; using namespace ngraph;
using namespace std; using namespace std;
extern "C" runtime::BackendConstructor* get_backend_constructor_pointer() extern "C" GPU_BACKEND_API void ngraph_register_gpu_backend()
{ {
class LocalBackendConstructor : public runtime::BackendConstructor runtime::BackendManager::register_backend("GPU", [](const std::string& /* config */) {
{ return make_shared<runtime::gpu::GPU_Backend>();
public: });
std::shared_ptr<runtime::Backend> create(const std::string& config) override
{
return std::make_shared<runtime::gpu::GPU_Backend>();
}
};
static unique_ptr<runtime::BackendConstructor> s_backend_constructor(
new LocalBackendConstructor());
return s_backend_constructor.get();
} }
runtime::gpu::GPU_Backend::GPU_Backend() runtime::gpu::GPU_Backend::GPU_Backend()
......
...@@ -19,7 +19,9 @@ ...@@ -19,7 +19,9 @@
#include <map> #include <map>
#include <memory> #include <memory>
#include "gpu_backend_visibility.hpp"
#include "ngraph/runtime/backend.hpp" #include "ngraph/runtime/backend.hpp"
#include "ngraph/runtime/backend_manager.hpp"
namespace ngraph namespace ngraph
{ {
...@@ -37,6 +39,7 @@ namespace ngraph ...@@ -37,6 +39,7 @@ namespace ngraph
using EntryPoint_t = void(void** inputs, void** outputs, GPURuntimeContext* ctx); using EntryPoint_t = void(void** inputs, void** outputs, GPURuntimeContext* ctx);
using EntryPoint = std::function<EntryPoint_t>; using EntryPoint = std::function<EntryPoint_t>;
BackendConstructor GPU_BACKEND_API get_backend_constructor_pointer();
class GPU_Backend : public Backend class GPU_Backend : public Backend
{ {
public: public:
......
...@@ -100,7 +100,7 @@ namespace ngraph ...@@ -100,7 +100,7 @@ namespace ngraph
const std::string& output_name) = 0; const std::string& output_name) = 0;
std::shared_ptr<ngraph::Function> m_function; std::shared_ptr<ngraph::Function> m_function;
std::unordered_map<std::shared_ptr<Function>, std::list<std::shared_ptr<Node>>> std::unordered_map<std::shared_ptr<Function>, std::vector<std::shared_ptr<Node>>>
m_function_ordered_ops; m_function_ordered_ops;
bool m_emit_timing; bool m_emit_timing;
......
This diff is collapsed.
...@@ -37,7 +37,7 @@ namespace ngraph ...@@ -37,7 +37,7 @@ namespace ngraph
// This defines a collection of function declarations like this // This defines a collection of function declarations like this
// static std::string emit_Abs(EMIT_ARGS); // static std::string emit_Abs(EMIT_ARGS);
// static std::string emit_Acos(EMIT_ARGS); // static std::string emit_Acos(EMIT_ARGS);
#define NGRAPH_OP(a, b) static std::string emit_##a(EMIT_ARGS); #define NGRAPH_OP(a, b, VERS) static std::string emit_v##VERS##_##a(EMIT_ARGS);
#include "ngraph/runtime/gpu/op/op_tbl.hpp" #include "ngraph/runtime/gpu/op/op_tbl.hpp"
#undef NGRAPH_OP #undef NGRAPH_OP
......
...@@ -39,8 +39,8 @@ namespace ngraph ...@@ -39,8 +39,8 @@ namespace ngraph
public: public:
using op_runtime_t = using op_runtime_t =
std::function<void(GPUCallFrame& call_frame, GPURuntimeContext* ctx)>; std::function<void(GPUCallFrame& call_frame, GPURuntimeContext* ctx)>;
using op_order_t = using op_order_t = std::unordered_map<std::shared_ptr<Function>,
std::unordered_map<std::shared_ptr<Function>, std::list<std::shared_ptr<Node>>>; std::vector<std::shared_ptr<Node>>>;
GPURuntimeConstructor(const op_order_t& ordered_ops); GPURuntimeConstructor(const op_order_t& ordered_ops);
void add(const std::string& name, const op_runtime_t& step); void add(const std::string& name, const op_runtime_t& step);
......
...@@ -15,8 +15,11 @@ ...@@ -15,8 +15,11 @@
//***************************************************************************** //*****************************************************************************
#include "ngraph/runtime/gpu/op/batch_norm.hpp" #include "ngraph/runtime/gpu/op/batch_norm.hpp"
#include "ngraph/node.hpp"
#include "ngraph/validation_util.hpp" #include "ngraph/validation_util.hpp"
constexpr ngraph::NodeTypeInfo ngraph::op::gpu::BatchNormTrainingWithStats::type_info;
ngraph::op::gpu::BatchNormTrainingWithStats::BatchNormTrainingWithStats( ngraph::op::gpu::BatchNormTrainingWithStats::BatchNormTrainingWithStats(
double eps, double eps,
std::shared_ptr<ngraph::Node> gamma, std::shared_ptr<ngraph::Node> gamma,
......
...@@ -40,6 +40,8 @@ namespace ngraph ...@@ -40,6 +40,8 @@ namespace ngraph
void validate_and_infer_types() override; void validate_and_infer_types() override;
static constexpr NodeTypeInfo type_info{"BatchNormTrainingWithStats", 0};
const NodeTypeInfo& get_type_info() const override { return type_info; }
protected: protected:
virtual std::shared_ptr<Node> virtual std::shared_ptr<Node>
copy_with_new_args(const NodeVector& new_args) const override; copy_with_new_args(const NodeVector& new_args) const override;
......
...@@ -14,8 +14,8 @@ ...@@ -14,8 +14,8 @@
// limitations under the License. // limitations under the License.
//***************************************************************************** //*****************************************************************************
#include "ngraph/op/op_tbl.hpp" #include "ngraph/op/op_version_tbl.hpp"
#if CUDNN_VERSION >= 7200 #if CUDNN_VERSION >= 7200
NGRAPH_OP(Rnn, ngraph::op::gpu) NGRAPH_OP(Rnn, ngraph::op::gpu, 0)
#endif #endif
NGRAPH_OP(BatchNormTrainingWithStats, ngraph::op::gpu) NGRAPH_OP(BatchNormTrainingWithStats, ngraph::op::gpu, 0)
...@@ -16,11 +16,14 @@ ...@@ -16,11 +16,14 @@
#include "ngraph/runtime/gpu/op/rnn.hpp" #include "ngraph/runtime/gpu/op/rnn.hpp"
#include "ngraph/log.hpp" #include "ngraph/log.hpp"
#include "ngraph/node.hpp"
#include "ngraph/util.hpp" #include "ngraph/util.hpp"
using namespace std; using namespace std;
using namespace ngraph; using namespace ngraph;
constexpr NodeTypeInfo op::gpu::Rnn::type_info;
shared_ptr<Node> op::gpu::Rnn::copy_with_new_args(const NodeVector& new_args) const shared_ptr<Node> op::gpu::Rnn::copy_with_new_args(const NodeVector& new_args) const
{ {
NGRAPH_CHECK(new_args.size() == 4, "Incorrect number of new arguments"); NGRAPH_CHECK(new_args.size() == 4, "Incorrect number of new arguments");
......
...@@ -65,6 +65,8 @@ namespace ngraph ...@@ -65,6 +65,8 @@ namespace ngraph
const int src_iter_feature_size, const int src_iter_feature_size,
const int direction, const int direction,
const int num_fused_layers); const int num_fused_layers);
static constexpr NodeTypeInfo type_info{"Rnn", 0};
const NodeTypeInfo& get_type_info() const override { return type_info; }
virtual std::shared_ptr<Node> virtual std::shared_ptr<Node>
copy_with_new_args(const NodeVector& new_args) const override; copy_with_new_args(const NodeVector& new_args) const override;
int get_num_timesteps() const { return m_num_timesteps; } int get_num_timesteps() const { return m_num_timesteps; }
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment