CPU: Work around Eigen tanh miscompilation for now

This will be revisited if a performant tanh is needed

CPU: Work around Eigen tanh miscompilation for now
This will be revisited if a performant tanh is needed
85f42f42 · Jaikrishnan Menon · 67109304 · 85f42f42 · 85f42f42
Commit 85f42f42 authored Nov 04, 2017 by Jaikrishnan Menon
Hide whitespace changes
Inline Side-by-side

Showing with 12 additions and 8 deletions

emitter.cpp src/ngraph/runtime/cpu/emitter.cpp +10 -8

external_function.cpp src/ngraph/runtime/cpu/external_function.cpp +2 -0

No files found.
--- a/src/ngraph/runtime/cpu/emitter.cpp
+++ b/src/ngraph/runtime/cpu/emitter.cpp
@@ -1620,16 +1620,18 @@ void Emitter::EMITTER_DECL(EmitTanh)
        (dynamic_pointer_cast<const TensorViewType>(n->get_arguments().at(0)->get_value_type()))
        ->get_element_type();
+    // Eigen's generic_fast_tanh_float<float> is currently miscompiled by Clang/LLVM,
+    // so we fall back to std::tanh.
+    // TODO: Implement our own internal fast/approximate tanh if this actually gets used
+    // by models.
    TU +=
        "    {\n"
-        "        auto arg0 = call_frame->get_tensor_view_data<" + element_type_names[TI(et)] + ">(" +
+        "        auto& arg0 = call_frame->get_parameterized_tensor_view<" + element_type_names[TI(et)] + ">(" +
-        to_string(inputs[0].get_index()) + ");\n"
+        to_string(inputs[0].get_index()) + ")->get_vector();\n"
-        "        auto out  = call_frame->get_tensor_view_data<" + element_type_names[TI(et)] + ">(" +
+        "        auto& out  = call_frame->get_parameterized_tensor_view<" + element_type_names[TI(et)] + ">(" +
-        to_string(outputs[0].get_index()) + ");\n"
+        to_string(outputs[0].get_index()) + ")->get_vector();\n"
-        "        EigenArray1d<" + element_type_names[TI(et)] + ">(out, "
+        "        std::transform(arg0.begin(), arg0.end(), out.begin(), [](" + element_type_names[TI(et)] +
-        EIGEN_VECTOR_FORMAT(outputs[0].get_layout<DenseTensorViewLayout>()->get_size()) ") =\n"
+        "::type x) -> " + element_type_names[TI(et)] + "::type { return std::tanh(x); });\n"
-        "        EigenArray1d<" + element_type_names[TI(et)] + ">(arg0, "
-        EIGEN_VECTOR_FORMAT(inputs[0].get_layout<DenseTensorViewLayout>()->get_size()) ").tanh();\n"
        "    }\n";
 }

--- a/src/ngraph/runtime/cpu/external_function.cpp
+++ b/src/ngraph/runtime/cpu/external_function.cpp
@@ -210,6 +210,8 @@ void ExternalFunction::compile(FunctionMap& function_map)
    TU += R"(// Generated by the NGraph CPU backend
 #include <memory>
 #include <vector>
+#include <algorithm>
+#include <cmath>
 #include <Eigen/Dense>