Commit df697f65 authored by Yan Wang

Optimize runLBPClassifierStumpSimple by using the built-in mad24.

Signed-off-by: Yan Wang <yan.wang@linux.intel.com>
parent 4949f708
......@@ -397,8 +397,8 @@ __kernel void runLBPClassifierStumpSimple(
for( tileIdx = groupIdx; tileIdx < totalTiles; tileIdx += ngroups )
{
int iy = ((tileIdx / ntiles.x)*local_size_y + ly)*ystep;
int ix = ((tileIdx % ntiles.x)*local_size_x + lx)*ystep;
int iy = mad24((tileIdx / ntiles.x), local_size_y, ly) * ystep;
int ix = mad24((tileIdx % ntiles.x), local_size_x, lx) * ystep;
if( ix < worksize.x && iy < worksize.y )
{
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment