Commit 1bc3b21a authored by Adam Rogowiec

Workaround for nested fused op: run FusedOpDecomposition twice.

parent 94649220
...@@ -172,6 +172,7 @@ void runtime::gpu::GPUCompiledFunction::compile() ...@@ -172,6 +172,7 @@ void runtime::gpu::GPUCompiledFunction::compile()
pass_manager.register_pass<runtime::gpu::pass::BatchNormCache>(); pass_manager.register_pass<runtime::gpu::pass::BatchNormCache>();
pass_manager.register_pass<ngraph::pass::LikeReplacement>(); pass_manager.register_pass<ngraph::pass::LikeReplacement>();
pass_manager.register_pass<ngraph::pass::FusedOpDecomposition>(); pass_manager.register_pass<ngraph::pass::FusedOpDecomposition>();
pass_manager.register_pass<ngraph::pass::FusedOpDecomposition>();
pass_manager.register_pass<runtime::gpu::pass::GPULayout>(this); pass_manager.register_pass<runtime::gpu::pass::GPULayout>(this);
pass_manager.register_pass<ngraph::pass::AssignLayout<descriptor::layout::DenseTensorLayout>>(); pass_manager.register_pass<ngraph::pass::AssignLayout<descriptor::layout::DenseTensorLayout>>();
pass_manager.register_pass<ngraph::pass::GetOutputElementElimination>(); pass_manager.register_pass<ngraph::pass::GetOutputElementElimination>();
......
...@@ -425,6 +425,8 @@ shared_ptr<runtime::Executable> ...@@ -425,6 +425,8 @@ shared_ptr<runtime::Executable>
{ {
pass_manager.register_pass<ngraph::pass::FusedOpDecomposition>( pass_manager.register_pass<ngraph::pass::FusedOpDecomposition>(
IntelGPUBackend::is_supported_impl); IntelGPUBackend::is_supported_impl);
pass_manager.register_pass<ngraph::pass::FusedOpDecomposition>(
IntelGPUBackend::is_supported_impl);
} }
if (m_disable_backend_optimizations < 1) if (m_disable_backend_optimizations < 1)
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment