Commit 388f449b authored by Amy Zhuang's avatar Amy Zhuang Committed by Scott Cyphers

Add constant folding for v1 reduce ops. (#3791)

* Add constant folding for v1 reduce ops.

* Add reference/mean.hpp.

* Remove extra semicolon.

* Address PR feedback.
parent 1ad0d723
......@@ -181,6 +181,7 @@ namespace ngraph
#include "ngraph/op/quantized_convolution.hpp"
#include "ngraph/op/quantized_dot.hpp"
#include "ngraph/op/recv.hpp"
#include "ngraph/op/reduce_mean.hpp"
#include "ngraph/op/reduce_prod.hpp"
#include "ngraph/op/reduce_sum.hpp"
#include "ngraph/op/relu.hpp"
......
......@@ -19,8 +19,12 @@
#include "ngraph/op/max.hpp"
#include "ngraph/op/min.hpp"
#include "ngraph/op/product.hpp"
#include "ngraph/op/reduce_mean.hpp"
#include "ngraph/op/reduce_prod.hpp"
#include "ngraph/op/reduce_sum.hpp"
#include "ngraph/op/sum.hpp"
#include "ngraph/runtime/reference/max.hpp"
#include "ngraph/runtime/reference/mean.hpp"
#include "ngraph/runtime/reference/min.hpp"
#include "ngraph/runtime/reference/product.hpp"
#include "ngraph/runtime/reference/sum.hpp"
......@@ -43,6 +47,24 @@ static shared_ptr<op::Constant>
reduction_node->get_shape(),
max->get_reduction_axes());
}
else if (auto reduce_max = as_type_ptr<op::v1::ReduceMax>(reduction_node))
{
auto reduction_axes = reduce_max->get_reduction_axes();
auto input_shape = reduce_max->get_input_shape(0);
Shape shape_no_keep_dims;
for (size_t i = 0; i < input_shape.size(); i++)
{
if (reduction_axes.count(i) == 0)
{
shape_no_keep_dims.push_back(input_shape[i]);
}
}
runtime::reference::max<T>(constant->get_vector<T>().data(),
out_vec.data(),
constant->get_output_shape(0),
shape_no_keep_dims,
reduce_max->get_reduction_axes());
}
else if (auto min = as_type_ptr<op::Min>(reduction_node))
{
runtime::reference::min<T>(constant->get_vector<T>().data(),
......@@ -51,6 +73,24 @@ static shared_ptr<op::Constant>
reduction_node->get_shape(),
min->get_reduction_axes());
}
else if (auto reduce_min = as_type_ptr<op::v1::ReduceMin>(reduction_node))
{
auto reduction_axes = reduce_min->get_reduction_axes();
auto input_shape = reduce_min->get_input_shape(0);
Shape shape_no_keep_dims;
for (size_t i = 0; i < input_shape.size(); i++)
{
if (reduction_axes.count(i) == 0)
{
shape_no_keep_dims.push_back(input_shape[i]);
}
}
runtime::reference::min<T>(constant->get_vector<T>().data(),
out_vec.data(),
constant->get_output_shape(0),
shape_no_keep_dims,
reduce_min->get_reduction_axes());
}
else if (auto prod = as_type_ptr<op::Product>(reduction_node))
{
runtime::reference::product<T>(constant->get_vector<T>().data(),
......@@ -59,6 +99,24 @@ static shared_ptr<op::Constant>
reduction_node->get_shape(),
prod->get_reduction_axes());
}
else if (auto reduce_prod = as_type_ptr<op::v1::ReduceProd>(reduction_node))
{
auto reduction_axes = reduce_prod->get_reduction_axes();
auto input_shape = reduce_prod->get_input_shape(0);
Shape shape_no_keep_dims;
for (size_t i = 0; i < input_shape.size(); i++)
{
if (reduction_axes.count(i) == 0)
{
shape_no_keep_dims.push_back(input_shape[i]);
}
}
runtime::reference::product<T>(constant->get_vector<T>().data(),
out_vec.data(),
constant->get_output_shape(0),
shape_no_keep_dims,
reduce_prod->get_reduction_axes());
}
else if (auto sum = as_type_ptr<op::Sum>(reduction_node))
{
runtime::reference::sum<T>(constant->get_vector<T>().data(),
......@@ -67,6 +125,42 @@ static shared_ptr<op::Constant>
reduction_node->get_shape(),
sum->get_reduction_axes());
}
else if (auto reduce_sum = as_type_ptr<op::v1::ReduceSum>(reduction_node))
{
auto reduction_axes = reduce_sum->get_reduction_axes();
auto input_shape = reduce_sum->get_input_shape(0);
Shape shape_no_keep_dims;
for (size_t i = 0; i < input_shape.size(); i++)
{
if (reduction_axes.count(i) == 0)
{
shape_no_keep_dims.push_back(input_shape[i]);
}
}
runtime::reference::sum<T>(constant->get_vector<T>().data(),
out_vec.data(),
constant->get_output_shape(0),
shape_no_keep_dims,
reduce_sum->get_reduction_axes());
}
else if (auto reduce_mean = as_type_ptr<op::v1::ReduceMean>(reduction_node))
{
auto reduction_axes = reduce_mean->get_reduction_axes();
auto input_shape = reduce_mean->get_input_shape(0);
Shape shape_no_keep_dims;
for (size_t i = 0; i < input_shape.size(); i++)
{
if (reduction_axes.count(i) == 0)
{
shape_no_keep_dims.push_back(input_shape[i]);
}
}
runtime::reference::mean<T>(constant->get_vector<T>().data(),
out_vec.data(),
constant->get_output_shape(0),
shape_no_keep_dims,
reduce_mean->get_reduction_axes());
}
else
{
NGRAPH_CHECK(false,
......@@ -134,7 +228,12 @@ void pass::ConstantFolding::construct_constant_arithmetic_reduction()
make_shared<pattern::op::Label>(element::i64, Shape{2}, pattern::has_class<op::Constant>());
auto is_supported_reduction = [](std::shared_ptr<Node> n) {
return (pattern::has_class<op::Max>()(n) || pattern::has_class<op::Min>()(n) ||
pattern::has_class<op::Product>()(n) || pattern::has_class<op::Sum>()(n));
pattern::has_class<op::Product>()(n) || pattern::has_class<op::Sum>()(n) ||
pattern::has_class<op::v1::ReduceMax>()(n) ||
pattern::has_class<op::v1::ReduceMin>()(n) ||
pattern::has_class<op::v1::ReduceProd>()(n) ||
pattern::has_class<op::v1::ReduceSum>()(n) ||
pattern::has_class<op::v1::ReduceMean>()(n));
};
auto reduction =
std::make_shared<pattern::op::Any>(element::i32,
......
//*****************************************************************************
// Copyright 2017-2019 Intel Corporation
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
//*****************************************************************************
#pragma once
#include <cmath>
#include "ngraph/coordinate_transform.hpp"
#include "ngraph/runtime/reference/sum.hpp"
#include "ngraph/shape_util.hpp"
#include "ngraph/type/bfloat16.hpp"
#include "ngraph/type/float16.hpp"
namespace ngraph
{
namespace runtime
{
namespace reference
{
template <typename T>
void mean(const T* arg,
T* out,
const Shape& in_shape,
const Shape& out_shape,
const AxisSet& reduction_axes)
{
CoordinateTransform output_transform(out_shape);
std::vector<T> cs(shape_size(out_shape));
for (const Coordinate& output_coord : output_transform)
{
out[output_transform.index(output_coord)] = 0;
cs[output_transform.index(output_coord)] = 0;
}
CoordinateTransform input_transform(in_shape);
std::map<size_t, int> index_to_count_map;
for (const Coordinate& input_coord : input_transform)
{
Coordinate output_coord = reduce(input_coord, reduction_axes);
T x = arg[input_transform.index(input_coord)];
T& z = out[output_transform.index(output_coord)];
auto index = output_transform.index(output_coord);
if (index_to_count_map.find(index) == index_to_count_map.end())
{
index_to_count_map[index] = 1;
}
else
{
index_to_count_map[index]++;
}
if (is_finite(x) && is_finite(z))
{
T& c = cs[output_transform.index(output_coord)];
T t = z + (x - c);
c = (t - z) - (x - c);
z = t;
}
else
{
z = z + x;
}
}
for (const Coordinate& output_coord : output_transform)
{
auto count = index_to_count_map[output_transform.index(output_coord)];
out[output_transform.index(output_coord)] =
out[output_transform.index(output_coord)] / count;
}
}
}
}
}
......@@ -563,6 +563,68 @@ TEST(constant_folding, const_product)
ASSERT_EQ(values_expected, values_out);
}
// Folding a v1::ReduceProd over axis 1 of a 3x3 constant must yield a single
// Constant holding the per-row products.
TEST(constant_folding, const_reduceprod)
{
    Shape input_shape{3, 3};
    Shape output_shape{3};

    vector<int32_t> values_in{1, 2, 3, 4, 5, 6, 7, 8, 9};
    auto constant = op::Constant::create(element::i32, input_shape, values_in);
    Shape axes_shape{1};
    vector<int32_t> values_axes{1};
    auto constant_axes = op::Constant::create(element::i64, axes_shape, values_axes);
    // Renamed from "convert" (copy-paste leftover): this node is a ReduceProd.
    auto reduce = make_shared<op::v1::ReduceProd>(constant, constant_axes);
    auto f = make_shared<Function>(reduce, ParameterVector{});

    pass::Manager pass_manager;
    pass_manager.register_pass<pass::ConstantFolding>();
    pass_manager.run_passes(f);

    ASSERT_EQ(count_ops_of_type<op::v1::ReduceProd>(f), 0);
    ASSERT_EQ(count_ops_of_type<op::Constant>(f), 1);

    auto new_const = as_type_ptr<op::Constant>(f->get_results().at(0)->get_argument(0));
    ASSERT_TRUE(new_const);
    ASSERT_EQ(new_const->get_shape(), output_shape);

    auto values_out = new_const->get_vector<int32_t>();
    vector<int32_t> values_expected{6, 120, 504};
    ASSERT_EQ(values_expected, values_out);
}
// Same as const_reduceprod but with keep_dims=true: output keeps the reduced
// axis as size 1 (shape {3, 1}).
TEST(constant_folding, const_reduceprod_keepdims)
{
    Shape input_shape{3, 3};
    Shape output_shape{3, 1};

    vector<int32_t> values_in{1, 2, 3, 4, 5, 6, 7, 8, 9};
    auto constant = op::Constant::create(element::i32, input_shape, values_in);
    Shape axes_shape{1};
    vector<int32_t> values_axes{1};
    auto constant_axes = op::Constant::create(element::i64, axes_shape, values_axes);
    // Renamed from "convert" (copy-paste leftover): this node is a ReduceProd.
    auto reduce = make_shared<op::v1::ReduceProd>(constant, constant_axes, true);
    auto f = make_shared<Function>(reduce, ParameterVector{});

    pass::Manager pass_manager;
    pass_manager.register_pass<pass::ConstantFolding>();
    pass_manager.run_passes(f);

    ASSERT_EQ(count_ops_of_type<op::v1::ReduceProd>(f), 0);
    ASSERT_EQ(count_ops_of_type<op::Constant>(f), 1);

    auto new_const = as_type_ptr<op::Constant>(f->get_results().at(0)->get_argument(0));
    ASSERT_TRUE(new_const);
    ASSERT_EQ(new_const->get_shape(), output_shape);

    auto values_out = new_const->get_vector<int32_t>();
    vector<int32_t> values_expected{6, 120, 504};
    ASSERT_EQ(values_expected, values_out);
}
TEST(constant_folding, const_sum)
{
Shape input_shape{3, 3};
......@@ -588,6 +650,68 @@ TEST(constant_folding, const_sum)
ASSERT_EQ(values_expected, values_out);
}
// Folding a v1::ReduceSum over axis 1 of a 3x3 constant must yield a single
// Constant holding the per-row sums.
TEST(constant_folding, const_reducesum)
{
    Shape input_shape{3, 3};
    Shape output_shape{3};

    vector<int32_t> values_in{1, 2, 3, 4, 5, 6, 7, 8, 9};
    auto constant = op::Constant::create(element::i32, input_shape, values_in);
    Shape axes_shape{1};
    vector<int32_t> values_axes{1};
    auto constant_axes = op::Constant::create(element::i64, axes_shape, values_axes);
    // Renamed from "convert" (copy-paste leftover): this node is a ReduceSum.
    auto reduce = make_shared<op::v1::ReduceSum>(constant, constant_axes);
    auto f = make_shared<Function>(reduce, ParameterVector{});

    pass::Manager pass_manager;
    pass_manager.register_pass<pass::ConstantFolding>();
    pass_manager.run_passes(f);

    ASSERT_EQ(count_ops_of_type<op::v1::ReduceSum>(f), 0);
    ASSERT_EQ(count_ops_of_type<op::Constant>(f), 1);

    auto new_const = as_type_ptr<op::Constant>(f->get_results().at(0)->get_argument(0));
    ASSERT_TRUE(new_const);
    ASSERT_EQ(new_const->get_shape(), output_shape);

    auto values_out = new_const->get_vector<int32_t>();
    vector<int32_t> values_expected{6, 15, 24};
    ASSERT_EQ(values_expected, values_out);
}
// Same as const_reducesum but with keep_dims=true: output keeps the reduced
// axis as size 1 (shape {3, 1}).
TEST(constant_folding, const_reducesum_keepdims)
{
    Shape input_shape{3, 3};
    Shape output_shape{3, 1};

    vector<int32_t> values_in{1, 2, 3, 4, 5, 6, 7, 8, 9};
    auto constant = op::Constant::create(element::i32, input_shape, values_in);
    Shape axes_shape{1};
    vector<int32_t> values_axes{1};
    auto constant_axes = op::Constant::create(element::i64, axes_shape, values_axes);
    // Renamed from "convert" (copy-paste leftover): this node is a ReduceSum.
    auto reduce = make_shared<op::v1::ReduceSum>(constant, constant_axes, true);
    auto f = make_shared<Function>(reduce, ParameterVector{});

    pass::Manager pass_manager;
    pass_manager.register_pass<pass::ConstantFolding>();
    pass_manager.run_passes(f);

    ASSERT_EQ(count_ops_of_type<op::v1::ReduceSum>(f), 0);
    ASSERT_EQ(count_ops_of_type<op::Constant>(f), 1);

    auto new_const = as_type_ptr<op::Constant>(f->get_results().at(0)->get_argument(0));
    ASSERT_TRUE(new_const);
    ASSERT_EQ(new_const->get_shape(), output_shape);

    auto values_out = new_const->get_vector<int32_t>();
    vector<int32_t> values_expected{6, 15, 24};
    ASSERT_EQ(values_expected, values_out);
}
TEST(constant_folding, const_max)
{
Shape input_shape{3, 3};
......@@ -613,6 +737,68 @@ TEST(constant_folding, const_max)
ASSERT_EQ(values_expected, values_out);
}
// Folding a v1::ReduceMax over axis 1 of a 3x2 constant must yield a single
// Constant holding the per-row maxima.
TEST(constant_folding, const_reducemax)
{
    Shape input_shape{3, 2};
    Shape output_shape{3};

    vector<int32_t> values_in{1, 2, 3, 4, 5, 6};
    auto constant = op::Constant::create(element::i32, input_shape, values_in);
    Shape axes_shape{1};
    vector<int32_t> values_axes{1};
    auto constant_axes = op::Constant::create(element::i64, axes_shape, values_axes);
    // Renamed from "convert" (copy-paste leftover): this node is a ReduceMax.
    auto reduce = make_shared<op::v1::ReduceMax>(constant, constant_axes);
    auto f = make_shared<Function>(reduce, ParameterVector{});

    pass::Manager pass_manager;
    pass_manager.register_pass<pass::ConstantFolding>();
    pass_manager.run_passes(f);

    ASSERT_EQ(count_ops_of_type<op::v1::ReduceMax>(f), 0);
    ASSERT_EQ(count_ops_of_type<op::Constant>(f), 1);

    auto new_const = as_type_ptr<op::Constant>(f->get_results().at(0)->get_argument(0));
    ASSERT_TRUE(new_const);
    ASSERT_EQ(new_const->get_shape(), output_shape);

    auto values_out = new_const->get_vector<int32_t>();
    vector<int32_t> values_expected{2, 4, 6};
    ASSERT_EQ(values_expected, values_out);
}
// Same as const_reducemax but with keep_dims=true: output keeps the reduced
// axis as size 1 (shape {3, 1}).
TEST(constant_folding, const_reducemax_keepdims)
{
    Shape input_shape{3, 2};
    Shape output_shape{3, 1};

    vector<int32_t> values_in{1, 2, 3, 4, 5, 6};
    auto constant = op::Constant::create(element::i32, input_shape, values_in);
    Shape axes_shape{1};
    vector<int32_t> values_axes{1};
    auto constant_axes = op::Constant::create(element::i64, axes_shape, values_axes);
    // Renamed from "convert" (copy-paste leftover): this node is a ReduceMax.
    auto reduce = make_shared<op::v1::ReduceMax>(constant, constant_axes, true);
    auto f = make_shared<Function>(reduce, ParameterVector{});

    pass::Manager pass_manager;
    pass_manager.register_pass<pass::ConstantFolding>();
    pass_manager.run_passes(f);

    ASSERT_EQ(count_ops_of_type<op::v1::ReduceMax>(f), 0);
    ASSERT_EQ(count_ops_of_type<op::Constant>(f), 1);

    auto new_const = as_type_ptr<op::Constant>(f->get_results().at(0)->get_argument(0));
    ASSERT_TRUE(new_const);
    ASSERT_EQ(new_const->get_shape(), output_shape);

    auto values_out = new_const->get_vector<int32_t>();
    vector<int32_t> values_expected{2, 4, 6};
    ASSERT_EQ(values_expected, values_out);
}
TEST(constant_folding, const_min)
{
Shape input_shape{3, 3};
......@@ -638,6 +824,130 @@ TEST(constant_folding, const_min)
ASSERT_EQ(values_expected, values_out);
}
// Folding a v1::ReduceMin over axis 1 of a 3x2 constant must yield a single
// Constant holding the per-row minima.
TEST(constant_folding, const_reducemin)
{
    Shape input_shape{3, 2};
    Shape output_shape{3};

    vector<int32_t> values_in{1, 2, 3, 4, 5, 6};
    auto constant = op::Constant::create(element::i32, input_shape, values_in);
    Shape axes_shape{1};
    vector<int32_t> values_axes{1};
    auto constant_axes = op::Constant::create(element::i64, axes_shape, values_axes);
    // Renamed from "convert" (copy-paste leftover): this node is a ReduceMin.
    auto reduce = make_shared<op::v1::ReduceMin>(constant, constant_axes);
    auto f = make_shared<Function>(reduce, ParameterVector{});

    pass::Manager pass_manager;
    pass_manager.register_pass<pass::ConstantFolding>();
    pass_manager.run_passes(f);

    ASSERT_EQ(count_ops_of_type<op::v1::ReduceMin>(f), 0);
    ASSERT_EQ(count_ops_of_type<op::Constant>(f), 1);

    auto new_const = as_type_ptr<op::Constant>(f->get_results().at(0)->get_argument(0));
    ASSERT_TRUE(new_const);
    ASSERT_EQ(new_const->get_shape(), output_shape);

    auto values_out = new_const->get_vector<int32_t>();
    vector<int32_t> values_expected{1, 3, 5};
    ASSERT_EQ(values_expected, values_out);
}
// Same as const_reducemin but with keep_dims=true: output keeps the reduced
// axis as size 1 (shape {3, 1}).
TEST(constant_folding, const_reducemin_keepdims)
{
    Shape input_shape{3, 2};
    Shape output_shape{3, 1};

    vector<int32_t> values_in{1, 2, 3, 4, 5, 6};
    auto constant = op::Constant::create(element::i32, input_shape, values_in);
    Shape axes_shape{1};
    vector<int32_t> values_axes{1};
    auto constant_axes = op::Constant::create(element::i64, axes_shape, values_axes);
    // Renamed from "convert" (copy-paste leftover): this node is a ReduceMin.
    auto reduce = make_shared<op::v1::ReduceMin>(constant, constant_axes, true);
    auto f = make_shared<Function>(reduce, ParameterVector{});

    pass::Manager pass_manager;
    pass_manager.register_pass<pass::ConstantFolding>();
    pass_manager.run_passes(f);

    ASSERT_EQ(count_ops_of_type<op::v1::ReduceMin>(f), 0);
    ASSERT_EQ(count_ops_of_type<op::Constant>(f), 1);

    auto new_const = as_type_ptr<op::Constant>(f->get_results().at(0)->get_argument(0));
    ASSERT_TRUE(new_const);
    ASSERT_EQ(new_const->get_shape(), output_shape);

    auto values_out = new_const->get_vector<int32_t>();
    vector<int32_t> values_expected{1, 3, 5};
    ASSERT_EQ(values_expected, values_out);
}
// Folding a v1::ReduceMean over axis 1 of a 3x3 constant must yield a single
// Constant holding the per-row means (integer division for i32).
TEST(constant_folding, const_reducemean)
{
    Shape input_shape{3, 3};
    Shape output_shape{3};

    vector<int32_t> values_in{1, 2, 3, 4, 5, 6, 7, 8, 9};
    auto constant = op::Constant::create(element::i32, input_shape, values_in);
    Shape axes_shape{1};
    vector<int32_t> values_axes{1};
    auto constant_axes = op::Constant::create(element::i64, axes_shape, values_axes);
    // Renamed from "convert" (copy-paste leftover): this node is a ReduceMean.
    auto reduce = make_shared<op::v1::ReduceMean>(constant, constant_axes);
    auto f = make_shared<Function>(reduce, ParameterVector{});

    pass::Manager pass_manager;
    pass_manager.register_pass<pass::ConstantFolding>();
    pass_manager.run_passes(f);

    ASSERT_EQ(count_ops_of_type<op::v1::ReduceMean>(f), 0);
    ASSERT_EQ(count_ops_of_type<op::Constant>(f), 1);

    auto new_const = as_type_ptr<op::Constant>(f->get_results().at(0)->get_argument(0));
    ASSERT_TRUE(new_const);
    ASSERT_EQ(new_const->get_shape(), output_shape);

    auto values_out = new_const->get_vector<int32_t>();
    vector<int32_t> values_expected{2, 5, 8};
    ASSERT_EQ(values_expected, values_out);
}
// Same as const_reducemean but with keep_dims=true: output keeps the reduced
// axis as size 1 (shape {3, 1}).
TEST(constant_folding, const_reducemean_keepdims)
{
    Shape input_shape{3, 3};
    Shape output_shape{3, 1};

    vector<int32_t> values_in{1, 2, 3, 4, 5, 6, 7, 8, 9};
    auto constant = op::Constant::create(element::i32, input_shape, values_in);
    Shape axes_shape{1};
    vector<int32_t> values_axes{1};
    auto constant_axes = op::Constant::create(element::i64, axes_shape, values_axes);
    // Renamed from "convert" (copy-paste leftover): this node is a ReduceMean.
    auto reduce = make_shared<op::v1::ReduceMean>(constant, constant_axes, true);
    auto f = make_shared<Function>(reduce, ParameterVector{});

    pass::Manager pass_manager;
    pass_manager.register_pass<pass::ConstantFolding>();
    pass_manager.run_passes(f);

    ASSERT_EQ(count_ops_of_type<op::v1::ReduceMean>(f), 0);
    ASSERT_EQ(count_ops_of_type<op::Constant>(f), 1);

    auto new_const = as_type_ptr<op::Constant>(f->get_results().at(0)->get_argument(0));
    ASSERT_TRUE(new_const);
    ASSERT_EQ(new_const->get_shape(), output_shape);

    auto values_out = new_const->get_vector<int32_t>();
    vector<int32_t> values_expected{2, 5, 8};
    ASSERT_EQ(values_expected, values_out);
}
TEST(constant_folding, const_all)
{
Shape input_shape{3, 3};
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment