cudalegacy: Use safe block scan function

This commit is contained in:
Namgoo Lee
2019-02-12 08:24:57 +00:00
committed by Namgoo Lee
parent b17c1c6721
commit 21eb60f88b
3 changed files with 9 additions and 202 deletions
@@ -98,7 +98,7 @@ __device__ T warpScanInclusive(T data, volatile T* smem, uint tid)
#pragma unroll
for (int i = 1; i <= (WARP_SIZE / 2); i *= 2)
{
const T val = shfl_up(data, i);
const T val = __shfl_up(data, i, WARP_SIZE);
if (laneId >= i)
data += val;
}