Merge branch 'tfl/gpu_add_nvrtc' of github.com:NervanaSystems/private-ngraph-cpp…

Merge branch 'tfl/gpu_add_nvrtc' of github.com:NervanaSystems/private-ngraph-cpp into tfl/gpu_add_nvrtc

Merge branch 'tfl/gpu_add_nvrtc' of github.com:NervanaSystems/private-ngraph-cpp…
Merge branch 'tfl/gpu_add_nvrtc' of github.com:NervanaSystems/private-ngraph-cpp into tfl/gpu_add_nvrtc
a574bdaf · Fenglei Tian · 8e78e24c · 21d1070c · a574bdaf
Commit a574bdaf authored Feb 26, 2018 by Fenglei Tian
Hide whitespace changes
Inline Side-by-side

Showing with 11 additions and 12 deletions

gpu_cuda_kernel_emitters.cpp src/ngraph/runtime/gpu/gpu_cuda_kernel_emitters.cpp +11 -12

No files found.
--- a/src/ngraph/runtime/gpu/gpu_cuda_kernel_emitters.cpp
+++ b/src/ngraph/runtime/gpu/gpu_cuda_kernel_emitters.cpp
@@ -52,18 +52,17 @@ namespace ngraph
                        d_ptr_out = (CUdeviceptr)out;

                        void* args_list[] = {&d_ptr_in, &d_ptr_out, &count};
-                        CUDA_SAFE_CALL(
-                            cuLaunchKernel(*CudaFunctionPool::instance().get(name).get(),
-                                           count,
-                                           1,
-                                           1, // grid dim
-                                           1,
-                                           1,
-                                           1, // block dim
-                                           0,
-                                           NULL, // shared mem and stream
-                                           args_list,
-                                           0));             // arguments
+                        CUDA_SAFE_CALL(cuLaunchKernel(*CudaFunctionPool::instance().get(name).get(),
+                                                      count,
+                                                      1,
+                                                      1, // grid dim
+                                                      1,
+                                                      1,
+                                                      1, // block dim
+                                                      0,
+                                                      NULL, // shared mem and stream
+                                                      args_list,
+                                                      0));  // arguments
                        CUDA_SAFE_CALL(cuCtxSynchronize()); // Retrieve and print output.
                    }
                }