Unverified Commit ffe3a631 authored by Robert Kimball's avatar Robert Kimball Committed by GitHub

Cache functions so the backend does not need to recompile (#1209)

* Cache some generated functions in backwards tests to speed performance

* more caching
parent 9fecc560
This diff is collapsed.
......@@ -17,6 +17,7 @@
#pragma once
#include <memory>
#include <unordered_map>
#include "ngraph/autodiff/adjoints.hpp"
#include "ngraph/graph_util.hpp"
......@@ -31,6 +32,10 @@ namespace ngraph
class Node;
class Function;
// Memoization caches keyed by the forward Function:
//   s_df_map        — generated derivative function df/dX*
//   s_clone_fwd_map — cloned forward graph (y, cached) = f(x)
//   s_clone_bwd_map — cloned backward graph f'(c, cached)
// These let repeated autodiff runs over the same Function skip regeneration
// and recompilation (the stated purpose of this commit).
// NOTE(review): `static` at namespace scope in a header (`#pragma once` above)
// gives every translation unit that includes it its OWN copy of these maps,
// so the cache is per-TU, and entries are never evicted for the process
// lifetime. Consider C++17 `inline` variables or moving the maps into a
// single .cpp — TODO confirm the intended usage and language standard.
static std::unordered_map<std::shared_ptr<Function>, std::shared_ptr<Function>> s_df_map;
static std::unordered_map<std::shared_ptr<Function>, std::shared_ptr<Function>> s_clone_fwd_map;
static std::unordered_map<std::shared_ptr<Function>, std::shared_ptr<Function>> s_clone_bwd_map;
namespace runtime
{
class Backend;
......@@ -145,7 +150,6 @@ namespace ngraph
for (auto x : indep_params)
{
// add df/dx to df/dX*
auto x_shape = x->get_shape();
df_output_params.push_back(adjoints.backprop_node(x));
}
......@@ -154,7 +158,11 @@ namespace ngraph
df_input_params.insert(df_input_params.begin(), c_param);
// df/dX* = f'(c, X)
auto df = std::make_shared<Function>(df_output_params, df_input_params);
if (!s_df_map[f])
{
s_df_map[f] = std::make_shared<Function>(df_output_params, df_input_params);
}
auto df = s_df_map[f];
// (c, X) arguments
std::vector<std::shared_ptr<runtime::TensorView>> df_input_args = f_input_args;
......@@ -184,11 +192,20 @@ namespace ngraph
}
// compile and run modified (y, cached) = f(x)
auto clone_fwd = clone_function(*fprop_cache.fprop);
if (!s_clone_fwd_map[f])
{
s_clone_fwd_map[f] = clone_function(*fprop_cache.fprop);
}
auto clone_fwd = s_clone_fwd_map[f];
backend->call(clone_fwd, mod_f_output_args, f_input_args);
// call modified f'(c, cached) to get df/dX*
auto clone_bwd = clone_function(*fprop_cache.bprop);
if (!s_clone_bwd_map[f])
{
s_clone_bwd_map[f] = clone_function(*fprop_cache.bprop);
}
auto clone_bwd = s_clone_bwd_map[f];
auto cache_dfdx = get_autodiff<T>(backend, clone_bwd, mod_df_input_args, indep_params);
const auto numpy_atol = 1e-5f;
......
......@@ -26,7 +26,8 @@
// TODO: Always compute the numerical derivatives in double
template <typename T>
bool autodiff_numeric_compare(const std::shared_ptr<ngraph::runtime::Backend>& backend,
std::function<std::shared_ptr<ngraph::Function>()> make_graph,
std::shared_ptr<ngraph::Function> f,
std::shared_ptr<ngraph::Function> g,
const std::vector<std::shared_ptr<ngraph::runtime::TensorView>>& args,
T rtol,
T atol)
......@@ -35,7 +36,6 @@ bool autodiff_numeric_compare(const std::shared_ptr<ngraph::runtime::Backend>& b
// Use INTERPRETER to compute numerical derivatives
auto interpreter_backend = ngraph::runtime::Backend::create("INTERPRETER");
auto f = make_graph();
std::vector<std::shared_ptr<ngraph::runtime::TensorView>> interpreter_args;
for (auto arg : args)
......@@ -58,7 +58,6 @@ bool autodiff_numeric_compare(const std::shared_ptr<ngraph::runtime::Backend>& b
interpreter_backend, f, interpreter_args, delta, f->get_parameters());
// Use the backend being tested to compute symbolic derivatives
auto g = make_graph();
auto results_sym =
ngraph::autodiff::backprop_derivative<T>(backend, g, args, g->get_parameters());
......@@ -75,10 +74,21 @@ bool autodiff_numeric_compare(const std::shared_ptr<ngraph::runtime::Backend>& b
return ngraph::test::all_close(results_num, interpreter_results_sym, rtol, atol);
}
/// @brief Convenience overload of autodiff_numeric_compare.
///
/// Instantiates the graph factory twice and forwards both Function instances
/// to the (f, g) overload — presumably two independent copies are needed so
/// the numeric (INTERPRETER) and symbolic (tested backend) paths each get
/// their own graph; verify against that overload.
///
/// @param backend    backend under test
/// @param make_graph factory producing a fresh ngraph::Function per call
/// @param args       input tensor views for the function's parameters
/// @param rtol       relative tolerance for the comparison
/// @param atol       absolute tolerance for the comparison
/// @return true when numeric and symbolic derivatives are all close
template <typename T>
bool autodiff_numeric_compare(const std::shared_ptr<ngraph::runtime::Backend>& backend,
                              std::function<std::shared_ptr<ngraph::Function>()> make_graph,
                              const std::vector<std::shared_ptr<ngraph::runtime::TensorView>>& args,
                              T rtol,
                              T atol)
{
    // Build one graph instance per derivative path, then delegate.
    auto numeric_graph = make_graph();
    auto symbolic_graph = make_graph();
    return autodiff_numeric_compare(backend, numeric_graph, symbolic_graph, args, rtol, atol);
}
template <typename T>
bool autodiff_numeric_compare_selective(
const std::shared_ptr<ngraph::runtime::Backend>& backend,
std::function<std::shared_ptr<ngraph::Function>()> make_graph,
std::shared_ptr<ngraph::Function> f,
std::shared_ptr<ngraph::Function> g,
const std::vector<std::shared_ptr<ngraph::runtime::TensorView>>& args,
T rtol,
T atol,
......@@ -86,7 +96,6 @@ bool autodiff_numeric_compare_selective(
{
// Use INTERPRETER to compute numerical derivatives
std::vector<std::shared_ptr<ngraph::op::Parameter>> f_indep_params;
auto f = make_graph();
size_t i = 0;
......@@ -123,7 +132,6 @@ bool autodiff_numeric_compare_selective(
// Use the backend being tested to compute symbolic derivatives
std::vector<std::shared_ptr<ngraph::op::Parameter>> g_indep_params;
auto g = make_graph();
i = 0;
......@@ -150,3 +158,16 @@ bool autodiff_numeric_compare_selective(
return ngraph::test::all_close(results_num, interpreter_results_sym, rtol, atol);
}
/// @brief Convenience overload of autodiff_numeric_compare_selective.
///
/// Calls the graph factory twice and hands both fresh Function instances to
/// the (f, g) overload, together with the mask selecting which parameters are
/// treated as independent. Two instances are presumably required so the
/// numeric and symbolic derivative computations do not share a graph; verify
/// against that overload.
///
/// @param backend          backend under test
/// @param make_graph       factory producing a fresh ngraph::Function per call
/// @param args             input tensor views for the function's parameters
/// @param rtol             relative tolerance for the comparison
/// @param atol             absolute tolerance for the comparison
/// @param indep_param_mask per-parameter flags: differentiate w.r.t. parameter i iff mask[i]
/// @return true when numeric and symbolic derivatives are all close
template <typename T>
bool autodiff_numeric_compare_selective(
    const std::shared_ptr<ngraph::runtime::Backend>& backend,
    std::function<std::shared_ptr<ngraph::Function>()> make_graph,
    const std::vector<std::shared_ptr<ngraph::runtime::TensorView>>& args,
    T rtol,
    T atol,
    const std::vector<bool>& indep_param_mask)
{
    // One graph per derivative path, then delegate to the (f, g) overload.
    auto numeric_graph = make_graph();
    auto symbolic_graph = make_graph();
    return autodiff_numeric_compare_selective(
        backend, numeric_graph, symbolic_graph, args, rtol, atol, indep_param_mask);
}
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment