Commit ea5056fe authored by Sergey Shalnov's avatar Sergey Shalnov

IntelGPU backend: PR2378 backend stability fixed

parent 6a777636
...@@ -55,8 +55,8 @@ public: ...@@ -55,8 +55,8 @@ public:
bool is_supported_property(const Property prop) const override; bool is_supported_property(const Property prop) const override;
private: private:
std::shared_ptr<cldnn::engine> ocl_engine; std::shared_ptr<cldnn::engine> cldnn_engine;
std::map<std::shared_ptr<Function>, std::shared_ptr<runtime::Executable>> ocl_networks; std::map<std::shared_ptr<Function>, std::shared_ptr<runtime::Executable>> cldnn_networks;
bool m_profile_enable = false; bool m_profile_enable = false;
long m_profile_lines_limit_count = 10; long m_profile_lines_limit_count = 10;
...@@ -66,38 +66,32 @@ private: ...@@ -66,38 +66,32 @@ private:
bool m_function_cache_disabled = false; bool m_function_cache_disabled = false;
bool m_disable_backend_optimizations = false; bool m_disable_backend_optimizations = false;
std::string m_cldnn_dump_dir = std::string("intelgpu_codegen"); std::string m_cldnn_dump_dir = std::string("intelgpu_codegen");
std::string delim = std::string(":");
}; };
class ngraph::runtime::intelgpu::IntelGPUExecutable : public runtime::Executable class ngraph::runtime::intelgpu::IntelGPUExecutable : public runtime::Executable
{ {
public: public:
IntelGPUExecutable(std::shared_ptr<Function> func, bool enable_timing); IntelGPUExecutable(std::shared_ptr<Function> func,
std::shared_ptr<cldnn::network> network,
bool enable_timing,
bool enable_profile,
double compilation_time,
double consumed_memory,
size_t profile_lines_limit_count);
bool call(const std::vector<std::shared_ptr<runtime::Tensor>>& outputs, bool call(const std::vector<std::shared_ptr<runtime::Tensor>>& outputs,
const std::vector<std::shared_ptr<runtime::Tensor>>& inputs) override; const std::vector<std::shared_ptr<runtime::Tensor>>& inputs) override;
std::vector<PerformanceCounter> get_performance_data() const override; std::vector<PerformanceCounter> get_performance_data() const override;
private: private:
class FunctionInstance std::shared_ptr<Function> m_function;
{ std::shared_ptr<cldnn::network> m_cldnn_network = nullptr;
public: bool m_performance_counters_enabled = false;
std::shared_ptr<cldnn::network> ocl_network = nullptr;
bool m_performance_counters_enabled = false;
double m_compilation_time = 0.0;
double m_consumed_memory = 0.0;
std::shared_ptr<Function> m_function;
} m_function_instance;
bool m_profile_enable = false; bool m_profile_enable = false;
double m_compilation_time = 0.0;
double m_consumed_memory = 0.0;
long m_profile_lines_limit_count = 10; long m_profile_lines_limit_count = 10;
bool m_dump_graph_enable = false;
bool m_cldnn_graph_optimize = true;
bool m_cldnn_dump_enable = false;
bool m_function_cache_disabled = false;
bool m_disable_backend_optimizations = false;
std::shared_ptr<cldnn::engine> ocl_engine;
std::string m_cldnn_dump_dir = std::string("intelgpu_codegen");
std::string delim = std::string(":"); std::string delim = std::string(":");
// Statistic related things // Statistic related things
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment