Commit f143bb13 authored by Nagy Mostafa, committed by Scott Cyphers

[MLIR] MLIR Compiler refactoring (#3786)

* Re-organize files. Create MLIR backend classes

* WIP

* Refactored. Code compiles

* Moved context to Runtime class to outlive compilation and execution

* style-apply

* Add a base Runtime class and a few other modifications

* Minor fixes

* Fixed Runtime::run() to take type-erased pointer

* renamed core compiler

* rename backend compiler

* rename runtime compiler

* PR feedback

* Fix build failures
parent bb9b5be6
@@ -14,13 +14,97 @@
# limitations under the License.
# ******************************************************************************
# Common MLIR/LLVM setup for the sub-directories below
include_directories(
${NGRAPH_INCLUDE_PATH}
${MLIR_LLVM_INCLUDE_PATH}
${MLIR_INCLUDE_PATHS}
)
add_subdirectory(compiler)
add_subdirectory(tools/ngraph-opt)
set(SRC
backend/cpu/cpu_backend.cpp
backend/pass/affine_lowerer.cpp
backend/pass/memory_optimization.cpp
core/compiler.cpp
core/ngraph_dialect/dialect.cpp
core/ngraph_dialect/type.cpp
core/ngraph_dialect/ops.cpp
core/pass/mlir_subgraph_extraction.cpp
core/pass/mlir_subgraph_extraction.hpp
runtime/cpu/memory_manager.cpp
runtime/cpu/cpu_runtime.cpp
utils.cpp
)
add_library(mlir_backend SHARED ${SRC})
llvm_map_components_to_libnames(llvm_libs support core irreader)
# Link MLIR libs
target_link_libraries(
mlir_backend PRIVATE
MLIRAnalysis
MLIREDSC
MLIRExecutionEngine
MLIRIR
MLIRLLVMIR
MLIRStandardToLLVM
MLIRParser
MLIRPass
MLIRTargetLLVMIR
MLIRTransforms
MLIRSupport
)
# some libs need whole archive linkage because of Globals static initialization
function(whole_archive_link target)
if("${CMAKE_SYSTEM_NAME}" STREQUAL "Darwin")
set(link_flags "-Llib -Wl,-all_load ")
FOREACH(LIB ${ARGN})
string(CONCAT link_flags ${link_flags} "${LIB}")
ENDFOREACH(LIB)
else()
set(link_flags "-Llib -Wl,--whole-archive,")
FOREACH(LIB ${ARGN})
string(CONCAT link_flags ${link_flags} "${LIB},")
ENDFOREACH(LIB)
string(CONCAT link_flags ${link_flags} "--no-whole-archive")
endif()
message(STATUS "MLIR Ops link flag: ${link_flags}" )
set_target_properties(${target} PROPERTIES LINK_FLAGS ${link_flags})
endfunction(whole_archive_link)
whole_archive_link(mlir_backend
${LLVM_BUILD_LIBRARY_DIR}/libMLIRAffineOps.a
${LLVM_BUILD_LIBRARY_DIR}/libMLIRStandardOps.a
)
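The whole-archive flags above are needed because dialect libraries such as MLIRAffineOps register themselves through global constructors; in a normal static link the linker drops object files whose symbols are never referenced, so registration would silently never run. A minimal illustration of the pattern (a hedged sketch, not nGraph code):

// registrar.cpp, compiled into a static library.
struct DialectRegistrar
{
    // Registers the dialect in a global registry as a side effect.
    DialectRegistrar() { /* registry.insert(...) */ }
};
// Nothing else references this symbol, so without -Wl,--whole-archive
// (or -Wl,-all_load on Darwin) the linker discards the object file and
// the constructor never executes.
static DialectRegistrar registrar;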
# Link LLVM libs
target_link_libraries(
mlir_backend PRIVATE
${llvm_libs}
)
# Link ngraph
target_link_libraries(mlir_backend PUBLIC ngraph)
# table-gen dialect ops
# include table-gen helpers
include(${LLVM_DIR}/TableGen.cmake)
function(ngraph_tablegen ofn)
tablegen(MLIR ${ARGV} "-I${MLIR_SRC_INCLUDE_PATH}" "-I${MLIR_BIN_INCLUDE_PATH}")
set(TABLEGEN_OUTPUT ${TABLEGEN_OUTPUT} ${CMAKE_CURRENT_BINARY_DIR}/${ofn} PARENT_SCOPE)
endfunction()
set(MLIR_TABLEGEN_EXE mlir-tblgen)
set(LLVM_TARGET_DEFINITIONS core/ngraph_dialect/ops.td)
ngraph_tablegen(ops.h.inc -gen-op-decls)
ngraph_tablegen(ops.cpp.inc -gen-op-defs)
add_public_tablegen_target(ngraph_ops_gen)
add_dependencies(mlir_backend ngraph_ops_gen)
target_include_directories(mlir_backend PRIVATE ${CMAKE_CURRENT_BINARY_DIR})
install(TARGETS mlir_backend DESTINATION ${NGRAPH_INSTALL_LIB})
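The generated ops.h.inc and ops.cpp.inc are meant to be spliced into the dialect sources through MLIR's guarded-include convention. A sketch of the usual consumption pattern (assumed here; the dialect sources are not shown in this diff):

// In core/ngraph_dialect/ops.hpp: pull in the tablegen'd op declarations.
#define GET_OP_CLASSES
#include "ops.h.inc"

// In core/ngraph_dialect/ops.cpp: pull in the matching definitions.
#define GET_OP_CLASSES
#include "ops.cpp.inc"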
//*****************************************************************************
// Copyright 2017-2019 Intel Corporation
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
//*****************************************************************************
// NOTE: This file follows nGraph format style.
// Follows nGraph naming convention for public APIs only, else MLIR naming convention.
#pragma once
#include <memory>
#include <mlir/IR/Module.h>
namespace ngraph
{
namespace runtime
{
namespace ngmlir
{
class MLIRBackend
{
public:
MLIRBackend(mlir::OwningModuleRef& module, mlir::MLIRContext& context)
: m_module(std::move(module))
, m_context(context)
{
}
MLIRBackend(mlir::ModuleOp& moduleOp, mlir::MLIRContext& context)
: m_module(moduleOp)
, m_context(context)
{
}
/// Generate code for the module
virtual void codegen() = 0;
mlir::OwningModuleRef& get_module() { return m_module; }
protected:
mlir::OwningModuleRef m_module;
mlir::MLIRContext& m_context;
};
}
}
}
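Any further backend derives from this class, reuses the module/context ownership, and implements codegen(). A hedged sketch, where MyBackend and its lowering are hypothetical:

class MyBackend : public ngraph::runtime::ngmlir::MLIRBackend
{
public:
    MyBackend(mlir::OwningModuleRef& module, mlir::MLIRContext& context)
        : MLIRBackend(module, context)
    {
    }
    void codegen() override
    {
        // Lower m_module from nGraph dialect to the target's dialect here.
    }
};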
//*****************************************************************************
// Copyright 2017-2019 Intel Corporation
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
//*****************************************************************************
// NOTE: This file follows nGraph format style.
// Follows nGraph naming convention for public APIs only, else MLIR naming convention.
#pragma once
#include <memory>
#include "contrib/mlir/backend/backend.hpp"
#include "llvm/Support/CodeGen.h"
#include "ngraph/check.hpp"
namespace llvm
{
class TargetMachine;
}
namespace ngraph
{
namespace runtime
{
namespace ngmlir
{
class MLIRCPUBackend : public MLIRBackend
{
public:
/// Global Initialization for all CPU backends
static void init();
MLIRCPUBackend(mlir::OwningModuleRef& module, mlir::MLIRContext& context)
: MLIRBackend(module, context)
{
NGRAPH_CHECK(initialized,
"Cannot instantiate CPU MLIR backend without initialization");
}
MLIRCPUBackend(mlir::ModuleOp& moduleOp, mlir::MLIRContext& context)
: MLIRBackend(moduleOp, context)
{
NGRAPH_CHECK(initialized,
"Cannot instantiate CPU MLIR backend without initialization");
}
// Codegen LLVM dialect from nGraph dialect, applying CPU backend optimization passes
void codegen() override;
private:
// Apply CPU specific optimizations at nGraph dialect level
void optimizeNgDialect();
// Lowers nGraph dialect all the way to LLVM module.
void lowerNgDialect();
// Apply affine dialect optimizations
void optimizeAffineDialect();
public:
// JIT optimization level
static llvm::CodeGenOpt::Level mlirOptLevel;
// LLVM target machine to be used by this MLIR compiler instance to retrieve
// information about target features.
// TODO: Note that, unfortunately, the MLIR/OrcJIT execution engine creates its own
// target machine for compilation internally. This target machine is for non-JIT
// related stuff. We should change the OrcJIT API so that we can pass an external target
// machine or configuration flags.
// TODO: Move target machine to external nGraph backend when multiple backends start
// to use MLIR.
static std::unique_ptr<llvm::TargetMachine> targetMachine;
// Global initialization done for CPU backend
static bool initialized;
};
}
}
}
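The NGRAPH_CHECKs above enforce one-time global initialization before any backend object is constructed. The expected startup order, mirroring the cpu_backend.cpp change later in this commit:

// One-time global setup before any compiler or backend instance is created:
ngraph::runtime::ngmlir::MLIRCompiler::init();   // MLIR/LLVM environment
ngraph::runtime::ngmlir::MLIRCPUBackend::init(); // target machine, opt level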
@@ -17,10 +17,10 @@
// NOTE: This file follows nGraph format style and MLIR naming convention since it does
// not expose public API to the rest of nGraph codebase and heavily depends on MLIR API.
#include "lowerer.hpp"
#include "affine_lowerer.hpp"
#include "dialect/ops.hpp"
#include "dialect/type.hpp"
#include "contrib/mlir/core/ngraph_dialect/ops.hpp"
#include "contrib/mlir/core/ngraph_dialect/type.hpp"
#include "ngraph/assertion.hpp"
#include <llvm/ADT/DenseSet.h>
@@ -19,7 +19,7 @@
#pragma once
#include "contrib/mlir/compiler/compiler.hpp"
#include "contrib/mlir/core/compiler.hpp"
#include <mlir/Pass/Pass.h>
@@ -17,9 +17,9 @@
// NOTE: This file follows nGraph format style and MLIR naming convention since it does
// not expose public API to the rest of nGraph codebase and heavily depends on MLIR API.
#include "contrib/mlir/compiler/compiler.hpp"
#include "contrib/mlir/compiler/dialect/ops.hpp"
#include "contrib/mlir/compiler/dialect/type.hpp"
#include "contrib/mlir/core/compiler.hpp"
#include "contrib/mlir/core/ngraph_dialect/ops.hpp"
#include "contrib/mlir/core/ngraph_dialect/type.hpp"
#include "ngraph/assertion.hpp"
@@ -53,7 +53,7 @@ namespace
{
m_inplaceOps = {
#define MLIR_OP(OP, INPLACE) {OP::getOperationName().str(), INPLACE},
#include "contrib/mlir/compiler/op_lowerers.inc"
#include "contrib/mlir/backend/pass/op_lowerers.inc"
};
}
void runOnFunction() override;
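// For reference, entries in op_lowerers.inc follow this X-macro shape
// (a hedged illustration; the actual file is not part of this diff):
//   MLIR_OP(NGAddOp, true /*in-place*/)
//   MLIR_OP(NGDotOp, false)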
# ******************************************************************************
# Copyright 2017-2019 Intel Corporation
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# ******************************************************************************
set(SRC
dialect/dialect.cpp
dialect/type.cpp
dialect/ops.cpp
compiler.cpp
lowerer.cpp
memory_manager.cpp
pass/mlir_subgraph_extraction.cpp
pass/mlir_subgraph_extraction.hpp
pass/memory_optimization.cpp
tools.cpp
)
add_library(mlir_backend SHARED ${SRC})
llvm_map_components_to_libnames(llvm_libs support core irreader)
# Link MLIR libs
target_link_libraries(
mlir_backend PRIVATE
MLIRAnalysis
MLIREDSC
MLIRExecutionEngine
MLIRIR
MLIRLLVMIR
MLIRStandardToLLVM
MLIRParser
MLIRPass
MLIRTargetLLVMIR
MLIRTransforms
MLIRSupport
)
# some libs need whole archive linkage because of Globals static initialization
function(whole_archive_link target)
if("${CMAKE_SYSTEM_NAME}" STREQUAL "Darwin")
set(link_flags "-Llib -Wl,-all_load ")
FOREACH(LIB ${ARGN})
string(CONCAT link_flags ${link_flags} "${LIB}")
ENDFOREACH(LIB)
else()
set(link_flags "-Llib -Wl,--whole-archive,")
FOREACH(LIB ${ARGN})
string(CONCAT link_flags ${link_flags} "${LIB},")
ENDFOREACH(LIB)
string(CONCAT link_flags ${link_flags} "--no-whole-archive")
endif()
message(STATUS "MLIR Ops link flag: ${link_flags}" )
set_target_properties(${target} PROPERTIES LINK_FLAGS ${link_flags})
endfunction(whole_archive_link)
whole_archive_link(mlir_backend
${LLVM_BUILD_LIBRARY_DIR}/libMLIRAffineOps.a
${LLVM_BUILD_LIBRARY_DIR}/libMLIRStandardOps.a
)
# Link LLVM libs
target_link_libraries(
mlir_backend PRIVATE
${llvm_libs}
)
# Link ngraph
target_link_libraries(mlir_backend PUBLIC ngraph)
# table-gen dialect ops
# include table-gen helpers
include(${LLVM_DIR}/TableGen.cmake)
function(ngraph_tablegen ofn)
tablegen(MLIR ${ARGV} "-I${MLIR_SRC_INCLUDE_PATH}" "-I${MLIR_BIN_INCLUDE_PATH}")
set(TABLEGEN_OUTPUT ${TABLEGEN_OUTPUT} ${CMAKE_CURRENT_BINARY_DIR}/${ofn} PARENT_SCOPE)
endfunction()
set(MLIR_TABLEGEN_EXE mlir-tblgen)
set(LLVM_TARGET_DEFINITIONS dialect/ops.td)
ngraph_tablegen(ops.h.inc -gen-op-decls)
ngraph_tablegen(ops.cpp.inc -gen-op-defs)
add_public_tablegen_target(ngraph_ops_gen)
add_dependencies(mlir_backend ngraph_ops_gen)
target_include_directories(mlir_backend PRIVATE ${CMAKE_CURRENT_BINARY_DIR})
install(TARGETS mlir_backend DESTINATION ${NGRAPH_INSTALL_LIB})
@@ -19,10 +19,11 @@
#pragma once
#include "memory_manager.hpp"
#include "contrib/mlir/runtime/cpu/memory_manager.hpp"
#include "ngraph/check.hpp"
#include "ngraph/descriptor/tensor.hpp"
#include "ngraph/node.hpp"
#include <mlir/ExecutionEngine/ExecutionEngine.h>
#include <mlir/ExecutionEngine/MemRefUtils.h>
#include <mlir/IR/Builders.h>
#include <mlir/IR/Module.h>
@@ -32,11 +32,6 @@
#include <unordered_map>
#include <vector>
namespace llvm
{
class TargetMachine;
}
namespace ngraph
{
namespace descriptor
@@ -55,30 +51,34 @@ namespace ngraph
{
namespace ngmlir
{
/// This class is the entry point to MLIR from nGraph. It drives the conversion of
/// nGraph sub-graphs, represented with CompiledKernel nodes, to MLIR nGraph dialect
/// and its lowering, optimization and execution using LLVM-based MLIR execution engine.
/// MLIR Compiler. Given an nGraph sub-graph, represented as a CompiledKernel node, it
/// translates the graph down to the nGraph dialect and applies core optimizations.
///
/// The compiler owns the MLIR module until compilation is done. After that,
/// the module can be grabbed and plugged into MLIR backends.
class MLIRCompiler
{
public:
/// Initializes MLIR environment. It must be called only once per execution.
static void init_mlir();
/// Initializes MLIR environment. It must be called only once.
static void init();
public:
using TensorList = std::vector<descriptor::Tensor*>;
using TypeList = llvm::SmallVector<mlir::Type, 4>;
MLIRCompiler(const ngraph::op::CompiledKernel* compiled_kernel)
MLIRCompiler(const ngraph::op::CompiledKernel* compiled_kernel,
mlir::MLIRContext& context)
: m_compiledKernel(compiled_kernel)
, m_context(context)
{
NGRAPH_CHECK(initialized,
"Cannot instantiate a compiler without initializing MLIR");
}
/// Compiles a subgraph with MLIR
void compile();
/// Executes a pre-compiled subgraph
void run(std::vector<void*>& externalTensors);
mlir::OwningModuleRef& get_module() { return m_module; }
private:
struct TensorInfo
{
@@ -87,13 +87,11 @@
};
private:
// Converts an nGraph sub-graph to MLIR nGraph dialect.
void buildNgDialectModule();
void lowerNgDialect();
void optimizeNgDialect();
void optimize();
void bindArguments(std::vector<void*>& externalTensors);
void execute();
void cleanup();
void buildNgDialect();
// Applies any nGraph dialect optimizations
void optimizeNgDialect() { /* TODO: Add core nGraph dialect optimizations */ }
mlir::Type getMlirType(const descriptor::Tensor* tensor);
mlir::Type getMlirType(const element::Type& type);
@@ -102,8 +100,6 @@
TensorInfo getTensorValue(descriptor::Tensor* tensor);
void updateTensorValue(descriptor::Tensor* tensor, mlir::Value* value);
void buildNgDialect();
template <typename Op>
static mlir::Operation* createOp(MLIRCompiler& compiler, const ngraph::Node* ngNode)
{
@@ -121,15 +117,6 @@
void createReturn();
/// Helper to create memref arguments for MLIR function signature
llvm::SmallVector<void*, 8> allocateMemrefArgs();
/// Helper to allocate a mem ref object. Handles static shapes only for now.
mlir::StaticFloatMemRef* allocateMemrefDescriptor();
/// Helper to dump MLIR module into llvm::dbgs prepended by the message \p msg.
void dumpMlirModule(const std::string msg);
/// Converts nGraph shape-like types \p ng_shape to MLIR shape \p mlir_shape.
template <typename T>
void getMlirShape(T ngShape, llvm::SmallVectorImpl<int64_t>& mlirShape);
@@ -142,19 +129,12 @@
// Sub-graph to be compiled and executed with MLIR.
const ngraph::op::CompiledKernel* m_compiledKernel;
// Pointers to externally allocated memory for sub-graph's input and output tensors.
std::vector<void*>* m_externalTensors;
// Arguments for the MLIR function generated for the nGraph sub-graph.
llvm::SmallVector<void*, 8> m_invokeArgs;
// MLIR context that holds all the MLIR information related to the sub-graph
// compilation.
mlir::MLIRContext m_context;
mlir::MLIRContext& m_context;
mlir::OwningModuleRef m_module;
std::unique_ptr<mlir::OpBuilder> m_builder;
std::unique_ptr<mlir::ExecutionEngine> m_engine;
using TensorToInfo = std::pair<descriptor::Tensor*, TensorInfo>;
using TensorToInfoMap = std::unordered_map<descriptor::Tensor*, TensorInfo>;
@@ -166,26 +146,8 @@
// use for MLIR dialect gen
TensorToInfoMap m_tensorToValueMap;
static const MLIRCompOpMap opDispatcher;
// Optimization level used by MLIR and LLVM compilers. It's based on LLVM CG
// optimization levels:
// enum Level {
// None, // -O0
// Less, // -O1
// Default, // -O2, -Os
// Aggressive // -O3
// };
static llvm::CodeGenOpt::Level mlirOptLevel;
// LLVM target machine to be used by this MLIR compiler instance to retrieve
// information about target features.
// TODO: Note that, unfortunately, the MLIR/OrcJIT execution engine creates its own
// target machine for compilation internally. This target machine is for non-JIT
// related stuff. We should change the OrcJIT API so that we can pass an external target
// machine or configuration flags.
// TODO: Move target machine to external nGraph backend when multiple backends start
// to use MLIR.
static std::unique_ptr<llvm::TargetMachine> targetMachine;
// Global initialization for MLIR compiler
static bool initialized;
};
}
}
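Taken together, compilation is now a hand-off between compiler, backend, and runtime. A hedged sketch of the flow this header implies (the real call site is in the cpu_builder.cpp change below; compiledKernel is a placeholder):

mlir::MLIRContext context;                      // must outlive compile and run
MLIRCompiler compiler(compiledKernel, context); // compiledKernel: CompiledKernel*
compiler.compile();                             // sub-graph -> nGraph dialect
MLIRCPUBackend backend(compiler.get_module(), context); // takes over the module
backend.codegen();                              // nGraph dialect -> LLVM dialect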
@@ -549,5 +549,5 @@ void MLIRSubgraphExtractionPass::clean_up()
const std::set<std::type_index> MLIRSubgraphExtractionPass::m_supported_ops{
#define MLIR_OP(OP) TI(ngraph::op::OP),
#include "contrib/mlir/compiler/ops_supported.inc"
#include "contrib/mlir/core/ops_supported.inc"
};
//*****************************************************************************
// Copyright 2017-2019 Intel Corporation
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
//*****************************************************************************
// NOTE: This file follows nGraph format style.
// Follows nGraph naming convention for public APIs only, else MLIR naming convention.
#include "cpu_runtime.hpp"
#include "contrib/mlir/backend/cpu/cpu_backend.hpp"
#include "ngraph/check.hpp"
#include <llvm/ADT/STLExtras.h>
#include <llvm/Analysis/TargetTransformInfo.h>
#include <llvm/ExecutionEngine/Orc/JITTargetMachineBuilder.h>
#include <llvm/IR/Module.h>
#include <llvm/Support/ErrorOr.h>
#include <llvm/Support/MemoryBuffer.h>
#include <llvm/Support/SourceMgr.h>
#include <llvm/Support/TargetSelect.h>
#include <llvm/Target/TargetMachine.h>
#include <mlir/ExecutionEngine/ExecutionEngine.h>
#include <mlir/ExecutionEngine/MemRefUtils.h>
#include <mlir/ExecutionEngine/OptUtils.h>
#include <mlir/IR/Function.h>
using llvm::SmallVector;
using llvm::StringRef;
using llvm::ArrayRef;
using namespace ngraph;
using namespace ngraph::runtime::ngmlir;
#define DEBUG_TYPE "mlir-cpu-runtime"
static llvm::cl::opt<bool>
clDumpObjectFile("ngraph-dump-mlir-object-file",
llvm::cl::desc("Dump MLIR JITted-compiled object to file specified with "
"-object-filename (<input file>.o by default)."));
static llvm::cl::opt<std::string>
clObjectFilename("ngraph-mlir-object-filename",
llvm::cl::desc("Dump MLIR JITted-compiled object to file jitted_mlir.o"));
void MLIRCPURuntime::run(void* args)
{
run_internal(*reinterpret_cast<std::vector<void*>*>(args));
}
void MLIRCPURuntime::run_internal(std::vector<void*>& externalTensors)
{
// Create an MLIR execution engine. We use a null MLIR pass manager for now to make sure we
// don't run MLIR passes that were already run. We also pass a default transformer created with
// the default or user-provided optimization level.
auto llvmTransformer = mlir::makeOptimizingTransformer(
MLIRCPUBackend::mlirOptLevel, /*sizeLevel=*/0, MLIRCPUBackend::targetMachine.get());
auto maybeEngine = mlir::ExecutionEngine::create(
m_module.get(), llvmTransformer, MLIRCPUBackend::mlirOptLevel);
NGRAPH_CHECK(maybeEngine, "failed to construct an execution engine");
m_engine = std::move(maybeEngine.get());
bindArguments(externalTensors);
execute();
cleanup();
}
// Binds MLIR function arguments to the proper values. This includes the externally
// allocated tensor helpers used inside the function.
void MLIRCPURuntime::bindArguments(std::vector<void*>& externalTensors)
{
NGRAPH_CHECK(m_module, "MLIR module is not ready.");
mlir::FuncOp func = m_module->lookupSymbol<mlir::FuncOp>("main");
NGRAPH_CHECK(func && !func.getBlocks().empty(), "Function not found");
// Set external arguments
m_externalTensors = &externalTensors;
// Create a list with a type-erased double pointer for each invocation argument.
// We currently use 'allocateMemrefArgs', which creates the argument list per the call ABI (see
// the comment below).
// StaticFloatMemRef is just a struct with the actual pointer to the data.
auto expectedArguments = allocateMemrefArgs();
NGRAPH_CHECK(expectedArguments.size(), "Arguments can't be created");
m_invokeArgs = std::move(expectedArguments);
NGRAPH_CHECK(m_invokeArgs.size() == m_externalTensors->size(),
"Number of external tensors doesn't match number of function arguments");
// Assign external tensor pointers to invocation arguments.
for (size_t i = 0, numArgs = m_invokeArgs.size(); i < numArgs; ++i)
{
auto* memRefArg = *(reinterpret_cast<mlir::StaticFloatMemRef**>(m_invokeArgs[i]));
memRefArg->data = reinterpret_cast<float*>((*m_externalTensors)[i]);
}
}
// Lowers standard dialect to LLVM dialect and uses the MLIR execution engine to execute the code.
void MLIRCPURuntime::execute()
{
// Invoke the JIT-compiled function with the arguments. Note that, for API
// uniformity reasons, it takes a list of type-erased pointers to arguments.
// Note that the 'invoke' method is overloaded with a parameter-pack version.
// Make sure the MutableArrayRef version is invoked.
auto invocationResult = m_engine->invoke("main", llvm::MutableArrayRef<void*>(m_invokeArgs));
if (clDumpObjectFile)
{
m_engine->dumpToObjectFile(clObjectFilename.empty() ? "jitted_mlir.o"
: clObjectFilename.getValue());
}
NGRAPH_CHECK(!invocationResult, "JIT invocation of 'main' failed\n");
}
void MLIRCPURuntime::cleanup()
{
// Free void double pointer arguments without freeing external tensor data.
for (auto* arg : m_invokeArgs)
{
auto* memRefArg = *(reinterpret_cast<mlir::StaticFloatMemRef**>(arg));
free(memRefArg);
free(arg);
}
}
// The current call ABI takes a single arg pointer (argPtr) pointing to a list of args.
// Each arg is a pointer to a StaticFloatMemRef which contains a data pointer
//
// The args are laid out as follows
// argPtr-> arg[0]-> StaticFloatMemRef -> <data>
// arg[1]-> StaticFloatMemRef -> <data>
// ...
SmallVector<void*, 8> MLIRCPURuntime::allocateMemrefArgs()
{
SmallVector<void*, 8> args;
for (size_t i = 0; i < m_externalTensors->size(); i++)
{
auto descriptor = allocateMemrefDescriptor();
mlir::StaticFloatMemRef** arg =
reinterpret_cast<mlir::StaticFloatMemRef**>(malloc(sizeof(mlir::StaticFloatMemRef*)));
*arg = descriptor;
args.push_back(arg);
}
return args;
}
mlir::StaticFloatMemRef* MLIRCPURuntime::allocateMemrefDescriptor()
{
// We only use StaticFloatMemRef because that's what MLIR currently offers.
// We should expand this with different types and dynamic MemRefs
auto* descriptor =
reinterpret_cast<mlir::StaticFloatMemRef*>(malloc(sizeof(mlir::StaticFloatMemRef)));
NGRAPH_CHECK(descriptor != nullptr, "NULL MemRef descriptor");
descriptor->data = nullptr;
return descriptor;
}
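For completeness, a hedged usage sketch of the runtime above; the backend object and tensor pointers are placeholders:

std::vector<void*> tensors{inputPtr, outputPtr}; // externally allocated buffers
MLIRCPURuntime runtime;
runtime.set_module(backend.get_module());        // module already in LLVM dialect
runtime.run(&tensors);                           // type-erased; see run_internal()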
//*****************************************************************************
// Copyright 2017-2019 Intel Corporation
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
//*****************************************************************************
// NOTE: This file follows nGraph format style.
// Follows nGraph naming convention for public APIs only, else MLIR naming convention.
#pragma once
#include <memory>
#include <mlir/ExecutionEngine/ExecutionEngine.h>
#include <mlir/ExecutionEngine/MemRefUtils.h>
#include <mlir/IR/Builders.h>
#include <mlir/IR/Module.h>
#include <mlir/IR/Types.h>
#include "contrib/mlir/backend/backend.hpp"
#include "contrib/mlir/runtime/runtime.hpp"
namespace ngraph
{
namespace runtime
{
namespace ngmlir
{
/// A CPU runtime is an MLIR runtime that owns an MLIR context and a module.
/// The module should be in LLVM dialect, ready to be JIT-compiled and executed
/// via an MLIR ExecutionEngine. The runtime owns the context and must outlive
/// any MLIR compilation and execution.
class MLIRCPURuntime : public MLIRRuntime
{
public:
/// Executes a pre-compiled subgraph
void run(void* args) override;
private:
void run_internal(std::vector<void*>& externalTensors);
// Bind external tensors to MLIR module entry point
void bindArguments(std::vector<void*>& externalTensors);
// Invokes an MLIR module entry point with bound arguments
void execute();
// Cleans up allocated args
void cleanup();
/// Helper to create memref arguments for MLIR function signature
llvm::SmallVector<void*, 8> allocateMemrefArgs();
/// Helper to allocate a mem ref object. Handles static shapes only for now.
mlir::StaticFloatMemRef* allocateMemrefDescriptor();
private:
// Pointers to externally allocated memory for sub-graph's input and output tensors.
std::vector<void*>* m_externalTensors;
// Arguments for the MLIR function generated for the nGraph sub-graph.
llvm::SmallVector<void*, 8> m_invokeArgs;
std::unique_ptr<mlir::ExecutionEngine> m_engine;
};
}
}
}
//*****************************************************************************
// Copyright 2017-2019 Intel Corporation
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
//*****************************************************************************
// NOTE: This file follows nGraph format style.
// Follows nGraph naming convention for public APIs only, else MLIR naming convention.
#pragma once
#include "contrib/mlir/backend/backend.hpp"
#include <memory>
#include <mlir/ExecutionEngine/ExecutionEngine.h>
#include <mlir/ExecutionEngine/MemRefUtils.h>
#include <mlir/IR/Builders.h>
#include <mlir/IR/Module.h>
#include <mlir/IR/Types.h>
namespace ngraph
{
namespace runtime
{
namespace ngmlir
{
/// Base class for an MLIR runtime. An MLIR runtime owns the MLIR context and the
/// final compiled module. It supports invoking the module with specific arguments.
class MLIRRuntime
{
public:
/// Sets the MLIR module that this runtime will own
void set_module(mlir::OwningModuleRef& module) { m_module = std::move(module); }
/// Overload with module op
void set_module(mlir::ModuleOp& module) { m_module = module; }
/// Executes a pre-compiled subgraph
virtual void run(void* args) = 0;
/// Get the MLIR module that this runtime owns
mlir::OwningModuleRef& get_module() { return m_module; }
mlir::MLIRContext& get_context() { return m_context; }
protected:
mlir::OwningModuleRef m_module;
mlir::MLIRContext m_context;
};
}
}
}
\ No newline at end of file
@@ -24,7 +24,7 @@
/// small sequence of passes without running the whole compiler pipeline. Please refer to
/// ngraph_repo_path/tests/mlir/ for examples.
#include "contrib/mlir/compiler/tools.hpp"
#include "contrib/mlir/utils.hpp"
#include "ngraph/check.hpp"
#include <llvm/Support/CommandLine.h>
@@ -17,13 +17,32 @@
// NOTE: This file follows nGraph format style and MLIR naming convention since it does
// not expose public API to the rest of nGraph codebase and heavily depends on MLIR API.
#include "tools.hpp"
#include "utils.hpp"
#include "dialect/dialect.hpp"
#include "contrib/mlir/core/ngraph_dialect/dialect.hpp"
#include <llvm/Support/CommandLine.h>
#include <llvm/Support/Debug.h>
#include <mlir/IR/Dialect.h>
static llvm::cl::opt<bool> clPrintIRAfterAll(
"ngraph-print-ir-after-all",
llvm::cl::init(false),
llvm::cl::desc(
"Print IR after transformation that are not implemented as passes in the MLIRCompiler. It "
"complements MLIR -print-ir-after-all and LLVM -print-after-all flags"));
void ngraph::runtime::ngmlir::initializeNGraphMLIR()
{
mlir::registerDialect<mlir::NGraphOpsDialect>();
}
void ngraph::runtime::ngmlir::dumpMlirModule(const std::string msg, mlir::ModuleOp module)
{
if (clPrintIRAfterAll)
{
llvm::dbgs() << "*** IR Dump After " << msg << " ***\n";
module.dump();
llvm::dbgs() << "\n\n";
}
}
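A hypothetical call site for the helper above, after a transformation that is not an MLIR pass:

// Prints to llvm::dbgs() only when -ngraph-print-ir-after-all is set.
dumpMlirModule("nGraph dialect construction", module.get());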
@@ -16,9 +16,10 @@
// NOTE: This file follows nGraph format style and MLIR naming convention since it does
// not expose public API to the rest of nGraph codebase and heavily depends on MLIR API.
#pragma once
#include <mlir/IR/Module.h>
namespace ngraph
{
namespace runtime
@@ -29,6 +30,8 @@ namespace ngraph
/// require nGraph dialect initialization.
void initializeNGraphMLIR();
/// Helper to dump MLIR module into llvm::dbgs prepended by the message \p msg.
void dumpMlirModule(const std::string msg, mlir::ModuleOp module);
} // namespace ngmlir
} // namespace runtime
} // namespace ngraph
@@ -272,7 +272,7 @@ if (NGRAPH_CPU_ENABLE)
# TODO: can we get away without the LLVM/MLIR include path?
# Currently the MLIR backend's compiler.hpp includes LLVM/MLIR files
get_directory_property(MLIR_LLVM_INCLUDEPATH
DIRECTORY ${NGRAPH_MLIR_SOURCE_DIR}/compiler
DIRECTORY ${NGRAPH_MLIR_SOURCE_DIR}
DEFINITION MLIR_LLVM_INCLUDEPATH)
message(STATUS "Building CPU backend with MLIR")
@@ -16,7 +16,9 @@
#include "ngraph/runtime/cpu/cpu_builder.hpp"
#include "contrib/mlir/compiler/compiler.hpp"
#include "contrib/mlir/backend/cpu/cpu_backend.hpp"
#include "contrib/mlir/core/compiler.hpp"
#include "contrib/mlir/runtime/cpu/cpu_runtime.hpp"
#include "ngraph/op/experimental/compiled_kernel.hpp"
#include "ngraph/runtime/cpu/cpu_runtime_context.hpp"
@@ -68,22 +70,41 @@ namespace ngraph
// Compile nodes within the CompiledKernel op.
CompiledKernel* compiled_kernel =
static_cast<CompiledKernel*>(const_cast<Node*>(node));
bool is_module_ready = true;
auto it = ctx->mlir_compilers.find(compiled_kernel);
if (it == ctx->mlir_compilers.end())
{
// create a new compiler for the CK
ctx->mlir_compilers.emplace(compiled_kernel, compiled_kernel);
is_module_ready = false;
}
auto it = ctx->mlir_runtimes.find(compiled_kernel);
MLIRCompiler& mlir_compiler = ctx->mlir_compilers.find(compiled_kernel)->second;
if (!is_module_ready)
if (it == ctx->mlir_runtimes.end())
{
// Compile the sub-graph and create a new runtime.
// We must create an MLIRContext that outlives the compilation/execution;
// the runtime contains the context and gets stored in the CK cache.
// The runtime must be constructed in-place, since MLIR contexts cannot be copied.
ctx->mlir_runtimes.emplace(std::piecewise_construct,
std::make_tuple(compiled_kernel),
std::make_tuple());
MLIRCPURuntime& mlir_runtime =
ctx->mlir_runtimes.find(compiled_kernel)->second;
// Grab the context and initialize a core compiler
mlir::MLIRContext& context = mlir_runtime.get_context();
MLIRCompiler mlir_compiler(compiled_kernel, context);
// Compile to NG dialect
mlir_compiler.compile();
// Grab a context and initialize a CPU backend using the same context
MLIRCPUBackend mlir_backend(mlir_compiler.get_module(), context);
// Codegen to LLVM dialect
mlir_backend.codegen();
// Store module into runtime, and invoke.
mlir_runtime.set_module(mlir_backend.get_module());
mlir_runtime.run(&ptr_args);
}
else
{
// We have found a cached runtime, just invoke.
MLIRCPURuntime& mlir_runtime = it->second;
mlir_runtime.run(&ptr_args);
}
mlir_compiler.run(ptr_args);
};
functors.emplace_back(functor);
@@ -32,7 +32,8 @@
#include "ngraph/util.hpp"
#ifdef NGRAPH_MLIR_ENABLE
#include "contrib/mlir/compiler/compiler.hpp"
#include "contrib/mlir/backend/cpu/cpu_backend.hpp"
#include "contrib/mlir/core/compiler.hpp"
#endif
using namespace ngraph;
@@ -95,7 +96,9 @@ shared_ptr<runtime::Executable>
if (std::getenv("NGRAPH_MLIR") != nullptr)
{
// Initialize MLIR compiler
ngmlir::MLIRCompiler::init_mlir();
ngmlir::MLIRCompiler::init();
// Initialize MLIR backend
ngmlir::MLIRCPUBackend::init();
}
#endif
@@ -112,7 +112,7 @@
#include "ngraph/util.hpp"
#ifdef NGRAPH_MLIR_ENABLE
#include "contrib/mlir/compiler/compiler.hpp"
#include "contrib/mlir/core/compiler.hpp"
#endif
using namespace std;
@@ -36,7 +36,7 @@
#endif
#ifdef NGRAPH_MLIR_ENABLE
#include "contrib/mlir/compiler/pass/mlir_subgraph_extraction.hpp"
#include "contrib/mlir/core/pass/mlir_subgraph_extraction.hpp"
#endif
#include "ngraph/descriptor/input.hpp"
@@ -31,7 +31,7 @@
#include "ngraph/op/experimental/compiled_kernel.hpp"
#ifdef NGRAPH_MLIR_ENABLE
#include "contrib/mlir/compiler/compiler.hpp"
#include "contrib/mlir/runtime/cpu/cpu_runtime.hpp"
#endif
namespace mkldnn
@@ -84,8 +84,8 @@ namespace ngraph
/// The MLIR compiler caches the compiled code on the first invocation,
/// and may in the future support re-compilation
std::unordered_map<ngraph::op::CompiledKernel*,
ngraph::runtime::ngmlir::MLIRCompiler>
mlir_compilers;
ngraph::runtime::ngmlir::MLIRCPURuntime>
mlir_runtimes;
#endif
};
}