Commit a574bdaf authored by Fenglei Tian

Merge branch 'tfl/gpu_add_nvrtc' of github.com:NervanaSystems/private-ngraph-cpp…

Merge branch 'tfl/gpu_add_nvrtc' of github.com:NervanaSystems/private-ngraph-cpp into tfl/gpu_add_nvrtc
parents 8e78e24c 21d1070c
......@@ -52,18 +52,17 @@ namespace ngraph
d_ptr_out = (CUdeviceptr)out;
void* args_list[] = {&d_ptr_in, &d_ptr_out, &count};
CUDA_SAFE_CALL(
cuLaunchKernel(*CudaFunctionPool::instance().get(name).get(),
count,
1,
1, // grid dim
1,
1,
1, // block dim
0,
NULL, // shared mem and stream
args_list,
0)); // arguments
CUDA_SAFE_CALL(cuLaunchKernel(*CudaFunctionPool::instance().get(name).get(),
count,
1,
1, // grid dim
1,
1,
1, // block dim
0,
NULL, // shared mem and stream
args_list,
0)); // arguments
CUDA_SAFE_CALL(cuCtxSynchronize()); // Retrieve and print output.
}
}
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment