Commit 6fbed3b9 authored by Pruthvi, committed by Scott Cyphers

[MLIR] Graph pass to lower ngraph to ngraph dialect (#3835)

*  WIP graph pass to lower ngraph to ngraph dialect

* resolved compiler errors

* - refactor ngraph-dialect to graph pass

* - fix compilation issue
- unit test passes

*  - style fix

* Addressed PR comments

* - move NgDialectConversionPass to anonymous namespace

* - use getModule() to access module inside the graph pass
- address PR comments

*  - fix failing unit test case for negative padding
- make builder an object instead of a pointer to an object

* Address PR Comments
parent c06c9405
@@ -32,6 +32,8 @@ set(SRC
core/ngraph_dialect/ops.cpp
core/pass/mlir_subgraph_extraction.cpp
core/pass/mlir_subgraph_extraction.hpp
core/pass/ng_dialect_builder.cpp
core/pass/ng_dialect_builder.hpp
runtime/cpu/memory_manager.cpp
runtime/cpu/cpu_runtime.cpp
utils.cpp
@@ -22,6 +22,7 @@
#include "ngraph_dialect/dialect.hpp"
#include "ngraph_dialect/ops.hpp"
#include "ngraph_dialect/type.hpp"
#include "pass/ng_dialect_builder.hpp"
#include "ngraph/check.hpp"
#include "ngraph/descriptor/tensor.hpp"
@@ -83,9 +84,6 @@ using llvm::ArrayRef;
using namespace ngraph;
using namespace ngraph::runtime::ngmlir;
#define COMPILE_OP_DECL(op_name) \
createOp<op_name>(MLIRCompiler & compiler, const ngraph::Node* ngNode)
bool MLIRCompiler::initialized = false;
void MLIRCompiler::init()
@@ -112,11 +110,6 @@ void MLIRCompiler::init()
void MLIRCompiler::compile()
{
buildNgDialectModule();
// Free MLIR function builder.
if (m_builder)
{
m_builder.reset(nullptr);
}
}
// Creates an MLIR module and function with nGraph dialect ops from the input CompiledKernel.
@@ -125,42 +118,17 @@ void MLIRCompiler::buildNgDialectModule()
// initialize an empty module
m_module = mlir::ModuleOp::create(mlir::UnknownLoc::get(&m_context));
TypeList argsTypeList, resultTypeList;
// Retrieve input and output tensors.
const auto& kernelInputs = m_compiledKernel->get_arguments();
const auto& kernelOutput = m_compiledKernel->get_kernel_outputs();
NGRAPH_CHECK(kernelInputs.size() != 0, "Cannot have empty inputs list");
NGRAPH_CHECK(kernelOutput.size() != 0, "Cannot have empty outputs list");
for (auto input : kernelInputs)
{
argsTypeList.push_back(getMlirType(input.get()));
}
for (auto output : kernelOutput)
{
resultTypeList.push_back(getMlirType(output.get()));
}
mlir::PassManager pm(&m_context);
pm.addPass(ngraph::pass::createNgDialectConversionPass(m_compiledKernel, &m_context));
auto funcType = mlir::FunctionType::get(argsTypeList, resultTypeList, &m_context);
auto function = mlir::FuncOp::create(mlir::UnknownLoc::get(&m_context), "main", funcType);
function.addEntryBlock();
// Apply any generic pass manager command line options.
mlir::applyPassManagerCLOptions(pm);
// populate Tensor->Value maps
int i = 0;
for (auto input : kernelInputs)
if (failed(pm.run(m_module.get())))
{
mlir::Value* arg = function.getArgument(i);
TensorInfo tensorInfo{arg};
m_tensorToValueMap.insert(TensorToInfo(input->get_output_tensor_ptr().get(), tensorInfo));
i++;
NGRAPH_CHECK(false, "MLIR pass manager failed");
}
// create builder
m_builder = std::unique_ptr<mlir::OpBuilder>(new mlir::OpBuilder(function.getBody()));
buildNgDialect();
m_module->push_back(function);
if (failed(m_module->verify()))
{
NGRAPH_CHECK(false, "Invalid module after lowering to NG dialect");
@@ -168,313 +136,3 @@ void MLIRCompiler::buildNgDialectModule()
dumpMlirModule("nGraph Dialect Construction", m_module.get());
}
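Since the diff view interleaves removed and added lines, the new flow is easier to read pieced together. A sketch of buildNgDialectModule as it now stands, reconstructed from the hunks above (elided context may differ slightly):

void MLIRCompiler::buildNgDialectModule()
{
    // Start from an empty module; the conversion pass fills it in.
    m_module = mlir::ModuleOp::create(mlir::UnknownLoc::get(&m_context));
    // The nGraph-to-dialect lowering now runs as a proper MLIR module pass.
    mlir::PassManager pm(&m_context);
    pm.addPass(ngraph::pass::createNgDialectConversionPass(m_compiledKernel, &m_context));
    // Apply any generic pass manager command line options.
    mlir::applyPassManagerCLOptions(pm);
    if (failed(pm.run(m_module.get())))
    {
        NGRAPH_CHECK(false, "MLIR pass manager failed");
    }
    if (failed(m_module->verify()))
    {
        NGRAPH_CHECK(false, "Invalid module after lowering to NG dialect");
    }
    dumpMlirModule("nGraph Dialect Construction", m_module.get());
}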
template <typename T>
void MLIRCompiler::getMlirShape(T ngShape, llvm::SmallVectorImpl<int64_t>& mlirShape)
{
for (auto dim : ngShape)
{
mlirShape.push_back(dim);
}
}
template <typename T>
mlir::ArrayAttr MLIRCompiler::getShapeAsAttr(T ngShape)
{
SmallVector<int64_t, 4> mlirShape;
getMlirShape(ngShape, mlirShape);
return m_builder->getI64ArrayAttr(mlirShape);
}
// Converts an nGraph Tensor into an MLIR tensor type, including the conversion of the Tensor's
// element type.
mlir::Type MLIRCompiler::getMlirType(const descriptor::Tensor* tensor)
{
llvm::SmallVector<int64_t, 4> mlirShape;
getMlirShape(tensor->get_shape(), mlirShape);
return mlir::NGTensorType::get(&m_context, getMlirType(tensor->get_element_type()), mlirShape);
}
// Converts an nGraph element type into an MLIR type.
mlir::Type MLIRCompiler::getMlirType(const element::Type& type)
{
#if defined(__GNUC__) && !(__GNUC__ == 4 && __GNUC_MINOR__ == 8)
#pragma GCC diagnostic push
#pragma GCC diagnostic error "-Wswitch"
#pragma GCC diagnostic error "-Wswitch-enum"
#endif
switch (type)
{
case ngraph::element::Type_t::undefined:
case ngraph::element::Type_t::dynamic:
default: NGRAPH_CHECK(false, "MLIR: Unsupported NGraph types"); break;
case ngraph::element::Type_t::bf16: return mlir::NGFloatType::getBF16(&m_context);
case ngraph::element::Type_t::f16: return mlir::NGFloatType::getF16(&m_context);
case ngraph::element::Type_t::f32: return mlir::NGFloatType::getF32(&m_context);
case ngraph::element::Type_t::f64: return mlir::NGFloatType::getF64(&m_context);
case ngraph::element::Type_t::i8: return mlir::NGIntegerType::getInt8(&m_context);
case ngraph::element::Type_t::u8:
case ngraph::element::Type_t::boolean: return mlir::NGIntegerType::getUInt8(&m_context);
case ngraph::element::Type_t::i16: return mlir::NGIntegerType::getInt16(&m_context);
case ngraph::element::Type_t::u16: return mlir::NGIntegerType::getUInt16(&m_context);
case ngraph::element::Type_t::i32: return mlir::NGIntegerType::getInt32(&m_context);
case ngraph::element::Type_t::u32: return mlir::NGIntegerType::getUInt32(&m_context);
case ngraph::element::Type_t::i64: return mlir::NGIntegerType::getInt64(&m_context);
case ngraph::element::Type_t::u64: return mlir::NGIntegerType::getUInt64(&m_context);
}
NGRAPH_CHECK(false, "Unreachable");
return mlir::Type();
#if defined(__GNUC__) && !(__GNUC__ == 4 && __GNUC_MINOR__ == 8)
#pragma GCC diagnostic pop
#endif
}
mlir::Type MLIRCompiler::getMlirType(const ngraph::Node* node)
{
descriptor::Tensor* outTensor = node->get_output_tensor_ptr().get();
return getMlirType(outTensor);
}
void MLIRCompiler::updateTensorValue(descriptor::Tensor* tensor, mlir::Value* value)
{
NGRAPH_CHECK(m_tensorToValueMap.find(tensor) == m_tensorToValueMap.end(),
"tensor value already defined");
TensorInfo tensorInfo{value};
m_tensorToValueMap.insert(TensorToInfo(tensor, tensorInfo));
}
MLIRCompiler::TensorInfo MLIRCompiler::getTensorValue(descriptor::Tensor* tensor)
{
auto it = m_tensorToValueMap.find(tensor);
NGRAPH_CHECK(it != m_tensorToValueMap.end(), "Undefined tensor");
return it->second;
}
// MLIR builders
#define TI(x) std::type_index(typeid(x))
void MLIRCompiler::buildNgDialect()
{
const NodeVector& subGraph = m_compiledKernel->get_node_list();
for (auto np : subGraph)
{
auto it = opDispatcher.find(TI(*np));
if (it == opDispatcher.end())
{
throw unsupported_op{std::string{"The MLIR backend doesn't currently implement the '"} +
np->description() + "' operation"};
}
mlir::Operation* op = it->second(*this, np.get());
// This assumes a simple 1:1 mapping between output edges and generated MLIR op results.
// If the mapping is more complex, the create_op helper can return a null operation
// and handle populating the value map itself.
if (op)
{
for (auto i = 0; i < op->getNumResults(); i++)
{
mlir::Value* result = op->getResult(i);
if (result)
{
updateTensorValue(np->get_output_tensor_ptr(i).get(), result);
}
}
}
}
createReturn();
}
namespace ngraph
{
namespace runtime
{
namespace ngmlir
{
template <>
mlir::Operation* MLIRCompiler::COMPILE_OP_DECL(ngraph::op::Add)
{
return compiler.createGenericOp<mlir::NGAddOp>(ngNode);
}
template <>
mlir::Operation* MLIRCompiler::COMPILE_OP_DECL(ngraph::op::Subtract)
{
return compiler.createGenericOp<mlir::NGSubOp>(ngNode);
}
template <>
mlir::Operation* MLIRCompiler::COMPILE_OP_DECL(ngraph::op::Multiply)
{
return compiler.createGenericOp<mlir::NGMulOp>(ngNode);
}
template <>
mlir::Operation* MLIRCompiler::COMPILE_OP_DECL(ngraph::op::Divide)
{
return compiler.createGenericOp<mlir::NGDivOp>(ngNode);
}
template <>
mlir::Operation* MLIRCompiler::COMPILE_OP_DECL(ngraph::op::Greater)
{
return compiler.createGenericOp<mlir::NGGreaterOp>(ngNode);
}
template <>
mlir::Operation* MLIRCompiler::COMPILE_OP_DECL(ngraph::op::Less)
{
return compiler.createGenericOp<mlir::NGLessOp>(ngNode);
}
template <>
mlir::Operation* MLIRCompiler::COMPILE_OP_DECL(ngraph::op::Maximum)
{
return compiler.createGenericOp<mlir::NGMaxOp>(ngNode);
}
template <>
mlir::Operation* MLIRCompiler::COMPILE_OP_DECL(ngraph::op::Minimum)
{
return compiler.createGenericOp<mlir::NGMinOp>(ngNode);
}
template <>
mlir::Operation* MLIRCompiler::COMPILE_OP_DECL(ngraph::op::ArgMax)
{
return compiler.createIndexReduction<mlir::NGArgMaxRedOp>(ngNode);
}
template <>
mlir::Operation* MLIRCompiler::COMPILE_OP_DECL(ngraph::op::ArgMin)
{
return compiler.createIndexReduction<mlir::NGArgMinRedOp>(ngNode);
}
template <>
mlir::Operation* MLIRCompiler::COMPILE_OP_DECL(ngraph::op::Dot)
{
return compiler.createGenericOp<mlir::NGDotOp>(ngNode);
}
template <>
mlir::Operation* MLIRCompiler::COMPILE_OP_DECL(ngraph::op::Concat)
{
auto concat = static_cast<const ngraph::op::Concat*>(ngNode);
auto op = compiler.createGenericOp<mlir::NGConcatOp>(ngNode);
op->setAttr(
"concatenation_axis",
compiler.m_builder->getI64IntegerAttr(concat->get_concatenation_axis()));
return op;
}
template <>
mlir::Operation* MLIRCompiler::COMPILE_OP_DECL(ngraph::op::Gather)
{
auto gather = static_cast<const ngraph::op::Gather*>(ngNode);
auto op = compiler.createGenericOp<mlir::NGGatherOp>(ngNode);
op->setAttr("axis", compiler.m_builder->getI64IntegerAttr(gather->get_axis()));
return op;
}
template <>
mlir::Operation* MLIRCompiler::COMPILE_OP_DECL(ngraph::op::Relu)
{
return compiler.createGenericOp<mlir::NGReluOp>(ngNode);
}
template <>
mlir::Operation* MLIRCompiler::COMPILE_OP_DECL(ngraph::op::Negative)
{
return compiler.createGenericOp<mlir::NGNegOp>(ngNode);
}
template <>
mlir::Operation* MLIRCompiler::COMPILE_OP_DECL(ngraph::op::Convolution)
{
mlir::Operation* op = compiler.createGenericOp<mlir::NGConvolutionOp>(ngNode);
auto convNode = static_cast<const ngraph::op::Convolution*>(ngNode);
auto convOp = llvm::cast<mlir::NGConvolutionOp>(op);
mlir::ArrayAttr attr =
compiler.getShapeAsAttr(convNode->get_window_movement_strides());
convOp.setStrides(attr);
attr = compiler.getShapeAsAttr(convNode->get_padding_below());
convOp.setPadBelow(attr);
attr = compiler.getShapeAsAttr(convNode->get_padding_above());
convOp.setPadAbove(attr);
return op;
}
}
}
}
template <typename Op>
mlir::Operation* MLIRCompiler::createGenericOp(const ngraph::Node* ngNode)
{
std::vector<mlir::Value*> argValues;
std::vector<mlir::Type> resTypes;
auto inputMap = m_compiledKernel->get_input_map();
std::shared_ptr<descriptor::Tensor> argTensor;
for (auto& argOutput : ngNode->input_values())
{
auto argOutputNode = argOutput.get_node();
if (as_type<op::Parameter>(argOutputNode))
{
auto it = inputMap.find(argOutputNode->shared_from_this());
NGRAPH_CHECK(it != inputMap.end(), "Parameter not in CK input map");
argTensor = m_compiledKernel->input_values().at(it->second).get_tensor_ptr();
}
else
{
argTensor = argOutput.get_tensor_ptr();
}
auto argV = getTensorValue(argTensor.get()).m_value;
argValues.push_back(argV);
}
for (auto& output : ngNode->outputs())
{
resTypes.push_back(getMlirType(output.get_tensor_ptr().get()));
}
return (m_builder->create<Op,
ArrayRef<mlir::Type>,
ArrayRef<mlir::Value*>,
ArrayRef<mlir::NamedAttribute>>(
mlir::UnknownLoc::get(&m_context), resTypes, argValues, {/* no attrs */}))
.getOperation();
}
const MLIRCompiler::MLIRCompOpMap MLIRCompiler::opDispatcher{
#define MLIR_OP(OP) {TI(ngraph::op::OP), &MLIRCompiler::createOp<ngraph::op::OP>},
#include "ops_supported.inc"
};
void MLIRCompiler::createReturn()
{
std::vector<mlir::Value*> valueList;
for (auto output : m_compiledKernel->get_kernel_outputs())
{
valueList.push_back(getTensorValue(output->get_output_tensor_ptr().get()).m_value);
}
m_builder->create<mlir::NGReturnOp>(mlir::UnknownLoc::get(&m_context), valueList);
}
template <typename RedOp>
mlir::Operation* MLIRCompiler::createIndexReduction(const ngraph::Node* ngNode)
{
auto* idxRed = static_cast<const ngraph::op::util::IndexReduction*>(ngNode);
auto op = createGenericOp<RedOp>(ngNode);
mlir::ArrayAttr redAxesAttr =
m_builder->getI64ArrayAttr({(int64_t)idxRed->get_reduction_axis()});
op->setAttr("axes", redAxesAttr);
return op;
}
@@ -63,9 +63,6 @@ namespace ngraph
static void init();
public:
using TensorList = std::vector<descriptor::Tensor*>;
using TypeList = llvm::SmallVector<mlir::Type, 4>;
MLIRCompiler(const ngraph::op::CompiledKernel* compiled_kernel,
mlir::MLIRContext& context)
: m_compiledKernel(compiled_kernel)
@@ -79,52 +76,12 @@
void compile();
mlir::OwningModuleRef& get_module() { return m_module; }
private:
struct TensorInfo
{
// MLIR value this tensor maps to.
mlir::Value* m_value;
};
private:
// Converts an nGraph sub-graph to MLIR nGraph dialect.
void buildNgDialectModule();
void buildNgDialect();
// Applies any nGraph dialect optimizations
void optimizeNgDialect() { /*TODO: Add Core NG dialect optimizations */}
mlir::Type getMlirType(const descriptor::Tensor* tensor);
mlir::Type getMlirType(const element::Type& type);
mlir::Type getMlirType(const ngraph::Node* node);
TensorInfo getTensorValue(descriptor::Tensor* tensor);
void updateTensorValue(descriptor::Tensor* tensor, mlir::Value* value);
template <typename Op>
static mlir::Operation* createOp(MLIRCompiler& compiler, const ngraph::Node* ngNode)
{
throw std::runtime_error("Unimplemented op '" + ngNode->description() +
"' in MLIR Compiler");
}
// Generic op lowerer to ng dialect.
// Simply maps ngraph tensors to values and generates an op. No op-specific logic.
template <typename Op>
mlir::Operation* createGenericOp(const ngraph::Node* ngNode);
template <typename RedOp>
mlir::Operation* createIndexReduction(const ngraph::Node* ngNode);
void createReturn();
/// Converts nGraph shape-like types \p ngShape to MLIR shape \p mlirShape.
template <typename T>
void getMlirShape(T ngShape, llvm::SmallVectorImpl<int64_t>& mlirShape);
/// Converts an ngraph shape to an I64 array attribute
template <typename T>
mlir::ArrayAttr getShapeAsAttr(T ngShape);
private:
// Sub-graph to be compiled and executed with MLIR.
const ngraph::op::CompiledKernel* m_compiledKernel;
@@ -132,20 +89,8 @@ namespace ngraph
// MLIR context that holds all the MLIR information related to the sub-graph
// compilation.
mlir::MLIRContext& m_context;
mlir::OwningModuleRef m_module;
std::unique_ptr<mlir::OpBuilder> m_builder;
using TensorToInfo = std::pair<descriptor::Tensor*, TensorInfo>;
using TensorToInfoMap = std::unordered_map<descriptor::Tensor*, TensorInfo>;
using MLIRCompOpFunction =
std::function<mlir::Operation*(MLIRCompiler& compiler, const ngraph::Node*)>;
using MLIRCompOpMap = std::unordered_map<std::type_index, MLIRCompOpFunction>;
// Maps a tensor to the value it represents in the IR;
// used for MLIR dialect gen
TensorToInfoMap m_tensorToValueMap;
static const MLIRCompOpMap opDispatcher;
// Global initialization for MLIR compiler
static bool initialized;
};
@@ -277,14 +277,11 @@ mlir::LogicalResult verifyOp(NGConvolutionOp* op)
auto s = std::get<0>(attrs).cast<IntegerAttr>().getInt();
auto pb = std::get<1>(attrs).cast<IntegerAttr>().getInt();
auto pa = std::get<2>(attrs).cast<IntegerAttr>().getInt();
if (s <= 0)
{
return op->emitOpError("Window stride must be positive");
}
if (pb < 0 || pa < 0)
{
return op->emitOpError("Paddings must be non-negative");
}
stridesVal.push_back(s);
padBelowVal.push_back(pb);
padAboveVal.push_back(pa);
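For concreteness, hypothetical attribute values and the verifier's response under the checks above (illustrative, not taken from the test suite):

// strides {1, 1}, pads_below {0, 0}, pads_above {0, 0} -> verifies
// strides {0, 1}                                       -> "Window stride must be positive"
// pads_below {-1, 0}                                   -> "Paddings must be non-negative"
// The last case is the negative-padding scenario that the unit-test fix in
// this commit's message refers to.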
//*****************************************************************************
// Copyright 2017-2019 Intel Corporation
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
//*****************************************************************************
// NOTE: This file follows nGraph format style.
// Follows nGraph naming convention for public APIs only, else MLIR naming convention.
#include "ng_dialect_builder.hpp"
#include "contrib/mlir/core/ngraph_dialect/dialect.hpp"
#include "contrib/mlir/core/ngraph_dialect/ops.hpp"
#include "contrib/mlir/core/ngraph_dialect/type.hpp"
#include "ngraph/check.hpp"
#include "ngraph/descriptor/tensor.hpp"
#include "ngraph/graph_util.hpp"
#include "ngraph/node.hpp"
#include "ngraph/op/add.hpp"
#include "ngraph/op/argmax.hpp"
#include "ngraph/op/argmin.hpp"
#include "ngraph/op/concat.hpp"
#include "ngraph/op/convolution.hpp"
#include "ngraph/op/divide.hpp"
#include "ngraph/op/dot.hpp"
#include "ngraph/op/experimental/compiled_kernel.hpp"
#include "ngraph/op/gather.hpp"
#include "ngraph/op/greater.hpp"
#include "ngraph/op/less.hpp"
#include "ngraph/op/maximum.hpp"
#include "ngraph/op/minimum.hpp"
#include "ngraph/op/multiply.hpp"
#include "ngraph/op/negative.hpp"
#include "ngraph/op/relu.hpp"
#include "ngraph/op/subtract.hpp"
#include "ngraph/op/util/index_reduction.hpp"
#include "ngraph/type/element_type.hpp"
#include "contrib/mlir/utils.hpp"
#include <llvm/ADT/STLExtras.h>
#include <llvm/Analysis/TargetTransformInfo.h>
#include <llvm/ExecutionEngine/Orc/JITTargetMachineBuilder.h>
#include <llvm/IR/Module.h>
#include <llvm/Support/ErrorOr.h>
#include <llvm/Support/MemoryBuffer.h>
#include <llvm/Support/SourceMgr.h>
#include <llvm/Support/TargetSelect.h>
#include <llvm/Target/TargetMachine.h>
#include <mlir/Conversion/LoopToStandard/ConvertLoopToStandard.h>
#include <mlir/Conversion/StandardToLLVM/ConvertStandardToLLVM.h>
#include <mlir/Conversion/StandardToLLVM/ConvertStandardToLLVMPass.h>
#include <mlir/Dialect/LLVMIR/LLVMDialect.h>
#include <mlir/ExecutionEngine/ExecutionEngine.h>
#include <mlir/ExecutionEngine/MemRefUtils.h>
#include <mlir/ExecutionEngine/OptUtils.h>
#include <mlir/Pass/PassManager.h>
#include <mlir/Target/LLVMIR.h>
#include <mlir/Transforms/DialectConversion.h>
#include <mlir/Transforms/Passes.h>
#include <memory>
#include <mutex>
// Defines a new LLVM debug type for this file to be used by LLVM_DEBUG macro.
#define DEBUG_TYPE "mlir-compiler"
using llvm::SmallVector;
using llvm::StringRef;
using llvm::ArrayRef;
using namespace ngraph;
using namespace ngraph::runtime::ngmlir;
#define COMPILE_OP_DECL(op_name) \
createOp<op_name>(NgDialectConversionPass & NgDialectObj, const ngraph::Node* ngNode)
namespace
{
/// NgDialectConversionPass is an MLIR ModulePass. Given an nGraph sub-graph, represented as a
/// CompiledKernel node, it translates the graph down to the nGraph dialect.
class NgDialectConversionPass : public mlir::ModulePass<NgDialectConversionPass>
{
public:
using TensorList = std::vector<descriptor::Tensor*>;
using TypeList = llvm::SmallVector<mlir::Type, 4>;
NgDialectConversionPass(const ngraph::op::CompiledKernel* compiled_kernel,
mlir::MLIRContext* context)
: m_compiledKernel(compiled_kernel)
, m_context(context)
, m_builder(context)
{
}
NgDialectConversionPass(const NgDialectConversionPass& obj);
private:
struct TensorInfo
{
// MLIR value this tensor maps to.
mlir::Value* m_value;
};
private:
// Converts an nGraph sub-graph to MLIR nGraph dialect.
void buildNgDialectModule();
void buildNgDialect(mlir::FuncOp function);
void runOnModule() override;
// Applies any nGraph dialect optimizations
void optimizeNgDialect() { /*TODO: Add Core NG dialect optimizations */}
mlir::Type getMlirType(const descriptor::Tensor* tensor);
mlir::Type getMlirType(const element::Type& type);
mlir::Type getMlirType(const ngraph::Node* node);
TensorInfo getTensorValue(descriptor::Tensor* tensor);
void updateTensorValue(descriptor::Tensor* tensor, mlir::Value* value);
template <typename Op>
static mlir::Operation* createOp(NgDialectConversionPass& NgDialectObj,
const ngraph::Node* ngNode)
{
throw std::runtime_error("Unimplemented op '" + ngNode->description() +
"' in MLIR Compiler");
}
// Generic op lowerer to ng dialect.
// Simply maps ngraph tensors to values and generates an op. No op-specific logic.
template <typename Op>
mlir::Operation* createGenericOp(const ngraph::Node* ngNode);
template <typename RedOp>
mlir::Operation* createIndexReduction(const ngraph::Node* ngNode);
void createReturn();
/// Converts nGraph shape-like types \p ngShape to MLIR shape \p mlirShape.
template <typename T>
void getMlirShape(T ngShape, llvm::SmallVectorImpl<int64_t>& mlirShape);
/// Converts an ngraph shape to an I64 array attribute
template <typename T>
mlir::ArrayAttr getShapeAsAttr(T ngShape);
private:
// Sub-graph to be compiled and executed with MLIR.
const ngraph::op::CompiledKernel* m_compiledKernel;
// MLIR context that holds all the MLIR information related to the sub-graph
// compilation.
mlir::MLIRContext* m_context;
mlir::OpBuilder m_builder;
using TensorToInfo = std::pair<descriptor::Tensor*, TensorInfo>;
using TensorToInfoMap = std::unordered_map<descriptor::Tensor*, TensorInfo>;
using MLIRCompOpFunction = std::function<mlir::Operation*(
NgDialectConversionPass& NgDialectObj, const ngraph::Node*)>;
using MLIRCompOpMap = std::unordered_map<std::type_index, MLIRCompOpFunction>;
// Maps a tensor to the value it represents in the IR;
// used for MLIR dialect gen
TensorToInfoMap m_tensorToValueMap;
static const MLIRCompOpMap opDispatcher;
};
} // end of namespace
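// Note: an MLIR pass manager may clone pass instances, which requires passes
// to be copyable; that is presumably why an explicit copy constructor is
// defined below, sharing the same kernel, context, and tensor-value map.
// (Rationale inferred, not stated in the commit.)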
NgDialectConversionPass::NgDialectConversionPass(const NgDialectConversionPass& obj)
: m_compiledKernel(obj.m_compiledKernel)
, m_context(obj.m_context)
, m_builder(obj.m_builder)
, m_tensorToValueMap(obj.m_tensorToValueMap)
{
}
void NgDialectConversionPass::runOnModule()
{
TypeList argsTypeList, resultTypeList;
mlir::ModuleOp module = getModule();
// Retrieve input and output tensors.
const auto& kernelInputs = m_compiledKernel->get_arguments();
const auto& kernelOutput = m_compiledKernel->get_kernel_outputs();
NGRAPH_CHECK(kernelInputs.size() != 0, "Cannot have empty inputs list");
NGRAPH_CHECK(kernelOutput.size() != 0, "Cannot have empty outputs list");
for (auto input : kernelInputs)
{
argsTypeList.push_back(getMlirType(input.get()));
}
for (auto output : kernelOutput)
{
resultTypeList.push_back(getMlirType(output.get()));
}
auto funcType = mlir::FunctionType::get(argsTypeList, resultTypeList, m_context);
auto function = mlir::FuncOp::create(mlir::UnknownLoc::get(m_context), "main", funcType);
function.addEntryBlock();
// populate Tensor->Value maps
int i = 0;
for (auto input : kernelInputs)
{
mlir::Value* arg = function.getArgument(i);
TensorInfo tensorInfo{arg};
m_tensorToValueMap.insert(TensorToInfo(input->get_output_tensor_ptr().get(), tensorInfo));
i++;
}
// create builder
buildNgDialect(function);
module.push_back(function);
}
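The function built here has one argument per kernel input and one result per kernel output, all typed in the nGraph dialect. A rough sketch of the emitted module for a hypothetical two-input element-wise kernel (illustrative only; the dialect's actual printed syntax may differ):

module {
  func @main(%arg0: !ng.tensor<2x3xf32>, %arg1: !ng.tensor<2x3xf32>) -> !ng.tensor<2x3xf32> {
    %0 = "ng.add"(%arg0, %arg1) : (!ng.tensor<2x3xf32>, !ng.tensor<2x3xf32>) -> !ng.tensor<2x3xf32>
    "ng.return"(%0) : (!ng.tensor<2x3xf32>) -> ()
  }
}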
template <typename T>
void NgDialectConversionPass::getMlirShape(T ngShape, llvm::SmallVectorImpl<int64_t>& mlirShape)
{
for (auto dim : ngShape)
{
mlirShape.push_back(dim);
}
}
template <typename T>
mlir::ArrayAttr NgDialectConversionPass::getShapeAsAttr(T ngShape)
{
SmallVector<int64_t, 4> mlirShape;
getMlirShape(ngShape, mlirShape);
return m_builder.getI64ArrayAttr(mlirShape);
}
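As a small worked example (hypothetical usage, assuming an in-scope pass instance), an nGraph shape {2, 3, 4} round-trips into an I64 array attribute:

ngraph::Shape shape{2, 3, 4};
// getMlirShape copies each dimension into a SmallVector<int64_t>;
// getShapeAsAttr wraps that vector as an i64 array attribute [2, 3, 4].
mlir::ArrayAttr attr = getShapeAsAttr(shape);

The same templates serve Strides and the CoordinateDiff padding types, which is why both are generic over T (see the Convolution lowering below).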
// Converts an nGraph Tensor into an MLIR tensor type, including the conversion of the Tensor's
// element type.
mlir::Type NgDialectConversionPass::getMlirType(const descriptor::Tensor* tensor)
{
llvm::SmallVector<int64_t, 4> mlirShape;
getMlirShape(tensor->get_shape(), mlirShape);
return mlir::NGTensorType::get(m_context, getMlirType(tensor->get_element_type()), mlirShape);
}
// Converts an nGraph element type into an MLIR type.
mlir::Type NgDialectConversionPass::getMlirType(const element::Type& type)
{
#if defined(__GNUC__) && !(__GNUC__ == 4 && __GNUC_MINOR__ == 8)
#pragma GCC diagnostic push
#pragma GCC diagnostic error "-Wswitch"
#pragma GCC diagnostic error "-Wswitch-enum"
#endif
switch (type)
{
case ngraph::element::Type_t::undefined:
case ngraph::element::Type_t::dynamic:
default: NGRAPH_CHECK(false, "MLIR: Unsupported NGraph types"); break;
case ngraph::element::Type_t::bf16: return mlir::NGFloatType::getBF16(m_context);
case ngraph::element::Type_t::f16: return mlir::NGFloatType::getF16(m_context);
case ngraph::element::Type_t::f32: return mlir::NGFloatType::getF32(m_context);
case ngraph::element::Type_t::f64: return mlir::NGFloatType::getF64(m_context);
case ngraph::element::Type_t::i8: return mlir::NGIntegerType::getInt8(m_context);
case ngraph::element::Type_t::u8:
case ngraph::element::Type_t::boolean: return mlir::NGIntegerType::getUInt8(m_context);
case ngraph::element::Type_t::i16: return mlir::NGIntegerType::getInt16(m_context);
case ngraph::element::Type_t::u16: return mlir::NGIntegerType::getUInt16(m_context);
case ngraph::element::Type_t::i32: return mlir::NGIntegerType::getInt32(m_context);
case ngraph::element::Type_t::u32: return mlir::NGIntegerType::getUInt32(m_context);
case ngraph::element::Type_t::i64: return mlir::NGIntegerType::getInt64(m_context);
case ngraph::element::Type_t::u64: return mlir::NGIntegerType::getUInt64(m_context);
}
NGRAPH_CHECK(false, "Unreachable");
return mlir::Type();
#if defined(__GNUC__) && !(__GNUC__ == 4 && __GNUC_MINOR__ == 8)
#pragma GCC diagnostic pop
#endif
}
mlir::Type NgDialectConversionPass::getMlirType(const ngraph::Node* node)
{
descriptor::Tensor* outTensor = node->get_output_tensor_ptr().get();
return getMlirType(outTensor);
}
void NgDialectConversionPass::updateTensorValue(descriptor::Tensor* tensor, mlir::Value* value)
{
NGRAPH_CHECK(m_tensorToValueMap.find(tensor) == m_tensorToValueMap.end(),
"tensor value already defined");
TensorInfo tensorInfo{value};
m_tensorToValueMap.insert(TensorToInfo(tensor, tensorInfo));
}
NgDialectConversionPass::TensorInfo
NgDialectConversionPass::getTensorValue(descriptor::Tensor* tensor)
{
auto it = m_tensorToValueMap.find(tensor);
NGRAPH_CHECK(it != m_tensorToValueMap.end(), "Undefined tensor");
return it->second;
}
// MLIR builders
#define TI(x) std::type_index(typeid(x))
void NgDialectConversionPass::buildNgDialect(mlir::FuncOp function)
{
auto& region = function.getBody();
m_builder.setInsertionPoint(&region.front(), region.front().begin());
const NodeVector& subGraph = m_compiledKernel->get_node_list();
for (auto np : subGraph)
{
auto it = opDispatcher.find(TI(*np));
if (it == opDispatcher.end())
{
throw unsupported_op{std::string{"The MLIR backend doesn't currently implement the '"} +
np->description() + "' operation"};
}
mlir::Operation* op = it->second(*this, np.get());
// This assumes a simple 1:1 mapping between output edges and generated MLIR op results.
// If the mapping is more complex, the create_op helper can return a null operation
// and handle populating the value map itself.
if (op)
{
for (auto i = 0; i < op->getNumResults(); i++)
{
mlir::Value* result = op->getResult(i);
if (result)
{
updateTensorValue(np->get_output_tensor_ptr(i).get(), result);
}
}
}
}
createReturn();
}
template <>
mlir::Operation* NgDialectConversionPass::COMPILE_OP_DECL(ngraph::op::Add)
{
return NgDialectObj.createGenericOp<mlir::NGAddOp>(ngNode);
}
template <>
mlir::Operation* NgDialectConversionPass::COMPILE_OP_DECL(ngraph::op::Subtract)
{
return NgDialectObj.createGenericOp<mlir::NGSubOp>(ngNode);
}
template <>
mlir::Operation* NgDialectConversionPass::COMPILE_OP_DECL(ngraph::op::Multiply)
{
return NgDialectObj.createGenericOp<mlir::NGMulOp>(ngNode);
}
template <>
mlir::Operation* NgDialectConversionPass::COMPILE_OP_DECL(ngraph::op::Divide)
{
return NgDialectObj.createGenericOp<mlir::NGDivOp>(ngNode);
}
template <>
mlir::Operation* NgDialectConversionPass::COMPILE_OP_DECL(ngraph::op::Greater)
{
return NgDialectObj.createGenericOp<mlir::NGGreaterOp>(ngNode);
}
template <>
mlir::Operation* NgDialectConversionPass::COMPILE_OP_DECL(ngraph::op::Less)
{
return NgDialectObj.createGenericOp<mlir::NGLessOp>(ngNode);
}
template <>
mlir::Operation* NgDialectConversionPass::COMPILE_OP_DECL(ngraph::op::Maximum)
{
return NgDialectObj.createGenericOp<mlir::NGMaxOp>(ngNode);
}
template <>
mlir::Operation* NgDialectConversionPass::COMPILE_OP_DECL(ngraph::op::Minimum)
{
return NgDialectObj.createGenericOp<mlir::NGMinOp>(ngNode);
}
template <>
mlir::Operation* NgDialectConversionPass::COMPILE_OP_DECL(ngraph::op::ArgMax)
{
return NgDialectObj.createIndexReduction<mlir::NGArgMaxRedOp>(ngNode);
}
template <>
mlir::Operation* NgDialectConversionPass::COMPILE_OP_DECL(ngraph::op::ArgMin)
{
return NgDialectObj.createIndexReduction<mlir::NGArgMinRedOp>(ngNode);
}
template <>
mlir::Operation* NgDialectConversionPass::COMPILE_OP_DECL(ngraph::op::Dot)
{
return NgDialectObj.createGenericOp<mlir::NGDotOp>(ngNode);
}
template <>
mlir::Operation* NgDialectConversionPass::COMPILE_OP_DECL(ngraph::op::Concat)
{
auto concat = static_cast<const ngraph::op::Concat*>(ngNode);
auto op = NgDialectObj.createGenericOp<mlir::NGConcatOp>(ngNode);
op->setAttr("concatenation_axis",
NgDialectObj.m_builder.getI64IntegerAttr(concat->get_concatenation_axis()));
return op;
}
template <>
mlir::Operation* NgDialectConversionPass::COMPILE_OP_DECL(ngraph::op::Gather)
{
auto gather = static_cast<const ngraph::op::Gather*>(ngNode);
auto op = NgDialectObj.createGenericOp<mlir::NGGatherOp>(ngNode);
op->setAttr("axis", NgDialectObj.m_builder.getI64IntegerAttr(gather->get_axis()));
return op;
}
template <>
mlir::Operation* NgDialectConversionPass::COMPILE_OP_DECL(ngraph::op::Relu)
{
return NgDialectObj.createGenericOp<mlir::NGReluOp>(ngNode);
}
template <>
mlir::Operation* NgDialectConversionPass::COMPILE_OP_DECL(ngraph::op::Negative)
{
return NgDialectObj.createGenericOp<mlir::NGNegOp>(ngNode);
}
template <>
mlir::Operation* NgDialectConversionPass::COMPILE_OP_DECL(ngraph::op::Convolution)
{
mlir::Operation* op = NgDialectObj.createGenericOp<mlir::NGConvolutionOp>(ngNode);
auto convNode = static_cast<const ngraph::op::Convolution*>(ngNode);
auto convOp = llvm::cast<mlir::NGConvolutionOp>(op);
mlir::ArrayAttr attr = NgDialectObj.getShapeAsAttr(convNode->get_window_movement_strides());
convOp.setStrides(attr);
attr = NgDialectObj.getShapeAsAttr(convNode->get_padding_below());
convOp.setPadBelow(attr);
attr = NgDialectObj.getShapeAsAttr(convNode->get_padding_above());
convOp.setPadAbove(attr);
return op;
}
template <typename Op>
mlir::Operation* NgDialectConversionPass::createGenericOp(const ngraph::Node* ngNode)
{
std::vector<mlir::Value*> argValues;
std::vector<mlir::Type> resTypes;
auto inputMap = m_compiledKernel->get_input_map();
std::shared_ptr<descriptor::Tensor> argTensor;
for (auto& argOutput : ngNode->input_values())
{
auto argOutputNode = argOutput.get_node();
if (as_type<op::Parameter>(argOutputNode))
{
auto it = inputMap.find(argOutputNode->shared_from_this());
NGRAPH_CHECK(it != inputMap.end(), "Parameter not in CK input map");
argTensor = m_compiledKernel->input_values().at(it->second).get_tensor_ptr();
}
else
{
argTensor = argOutput.get_tensor_ptr();
}
auto argV = getTensorValue(argTensor.get()).m_value;
argValues.push_back(argV);
}
for (auto& output : ngNode->outputs())
{
resTypes.push_back(getMlirType(output.get_tensor_ptr().get()));
}
return (m_builder.create<Op,
ArrayRef<mlir::Type>,
ArrayRef<mlir::Value*>,
ArrayRef<mlir::NamedAttribute>>(
mlir::UnknownLoc::get(m_context), resTypes, argValues, {/* no attrs */}))
.getOperation();
}
const NgDialectConversionPass::MLIRCompOpMap NgDialectConversionPass::opDispatcher{
#define MLIR_OP(OP) {TI(ngraph::op::OP), &NgDialectConversionPass::createOp<ngraph::op::OP>},
#include "contrib/mlir/core/ops_supported.inc"
};
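The dispatcher is populated by an X-macro: each MLIR_OP(OP) entry in ops_supported.inc expands to one map entry keyed by the op's type_index. Assuming the .inc lists the ops specialized above (its exact contents are not shown in this diff), the include expands along these lines:

// Hypothetical expansion for the first two entries:
// MLIR_OP(Add) MLIR_OP(Subtract) ...
//   {TI(ngraph::op::Add), &NgDialectConversionPass::createOp<ngraph::op::Add>},
//   {TI(ngraph::op::Subtract), &NgDialectConversionPass::createOp<ngraph::op::Subtract>},

For ops with an explicit createOp specialization, dispatch lands there; anything else resolves to the primary template, which throws the unimplemented-op error.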
void NgDialectConversionPass::createReturn()
{
std::vector<mlir::Value*> valueList;
for (auto output : m_compiledKernel->get_kernel_outputs())
{
valueList.push_back(getTensorValue(output->get_output_tensor_ptr().get()).m_value);
}
m_builder.create<mlir::NGReturnOp>(mlir::UnknownLoc::get(m_context), valueList);
}
template <typename RedOp>
mlir::Operation* NgDialectConversionPass::createIndexReduction(const ngraph::Node* ngNode)
{
auto* idxRed = static_cast<const ngraph::op::util::IndexReduction*>(ngNode);
auto op = createGenericOp<RedOp>(ngNode);
mlir::ArrayAttr redAxesAttr =
m_builder.getI64ArrayAttr({(int64_t)idxRed->get_reduction_axis()});
op->setAttr("axes", redAxesAttr);
return op;
}
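Traced through a hypothetical ngraph::op::ArgMax reducing over axis 1: the dispatcher calls createOp<ngraph::op::ArgMax>, which forwards to createIndexReduction<mlir::NGArgMaxRedOp>; that builds the generic op and then attaches the reduction axis:

// createGenericOp<mlir::NGArgMaxRedOp>(ngNode) builds the op with mapped
// operands and result types, then the axis is recorded as an attribute:
// op->setAttr("axes", m_builder.getI64ArrayAttr({1}));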
std::unique_ptr<mlir::Pass>
ngraph::pass::createNgDialectConversionPass(const ngraph::op::CompiledKernel* compiledKernel,
mlir::MLIRContext* context)
{
return std::make_unique<NgDialectConversionPass>(compiledKernel, context);
}
//*****************************************************************************
// Copyright 2017-2019 Intel Corporation
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
//*****************************************************************************
// NOTE: This file follows nGraph format style.
// Follows nGraph naming convention for public APIs only, else MLIR naming convention.
#pragma once
#include "contrib/mlir/core/compiler.hpp"
#include "contrib/mlir/runtime/cpu/memory_manager.hpp"
#include "ngraph/check.hpp"
#include "ngraph/descriptor/tensor.hpp"
#include "ngraph/node.hpp"
#include <mlir/ExecutionEngine/MemRefUtils.h>
#include <mlir/IR/Builders.h>
#include <mlir/IR/Module.h>
#include <mlir/IR/Types.h>
#include <mlir/Pass/Pass.h>
#include <typeindex>
#include <unordered_map>
#include <vector>
using namespace ngraph::runtime::ngmlir;
namespace ngraph
{
namespace pass
{
std::unique_ptr<mlir::Pass>
createNgDialectConversionPass(const ngraph::op::CompiledKernel* compiledKernel,
mlir::MLIRContext* context);
}
}