Merge pull request #2749 from jet47:fix-bug-3678

cafcfc4d · Roman Donchenko · OpenCV Buildbot · f13e05cd · f1e44fa5 · cafcfc4d
Commit cafcfc4d, authored May 14, 2014 by Roman Donchenko; committed by OpenCV Buildbot on May 14, 2014.
Show whitespace changes
Inline Side-by-side

Showing 2 changed files with 7 additions and 6 deletions

test_reductions.cpp modules/cudaarithm/test/test_reductions.cpp +1 -1

integral.hpp modules/cudev/include/opencv2/cudev/grid/detail/integral.hpp +6 -5

No files found.
--- a/modules/cudaarithm/test/test_reductions.cpp
+++ b/modules/cudaarithm/test/test_reductions.cpp
@@ -850,7 +850,7 @@ CUDA_TEST_P(Integral, Accuracy)
 INSTANTIATE_TEST_CASE_P(CUDA_Arithm, Integral, testing::Combine(
    ALL_DEVICES,
-    DIFFERENT_SIZES,
+    testing::Values(cv::Size(128, 128), cv::Size(113, 113), cv::Size(768, 1066)),
    WHOLE_SUBMAT));
 ///////////////////////////////////////////////////////////////////////////////////////////////////////

--- a/modules/cudev/include/opencv2/cudev/grid/detail/integral.hpp
+++ b/modules/cudev/include/opencv2/cudev/grid/detail/integral.hpp
@@ -439,8 +439,6 @@ namespace integral_detail
            T sum = (tidx < cols) && (y < rows) ? *p : 0;
-            y += blockDim.y;
            sums[threadIdx.x][threadIdx.y] = sum;
            __syncthreads();
@@ -467,14 +465,17 @@ namespace integral_detail
            if (threadIdx.y > 0)
                sum += sums[threadIdx.x][threadIdx.y - 1];
-            if (tidx < cols)
-            {
            sum += stepSum;
            stepSum += sums[threadIdx.x][blockDim.y - 1];
+            __syncthreads();
+            if ((tidx < cols) && (y < rows))
+            {
                *p = sum;
            }
-            __syncthreads();
+            y += blockDim.y;
        }
    #else
        __shared__ T smem[32][32];