Fix the reordering kernel in CUDA
This commit is contained in:
parent
93cba3c3ab
commit
e4f326e394
@ -28,7 +28,7 @@ namespace atrip {
|
|||||||
#if defined(HAVE_CUDA)
|
#if defined(HAVE_CUDA)
|
||||||
#define FOR_K() \
|
#define FOR_K() \
|
||||||
const size_t k = blockIdx.x * blockDim.x + threadIdx.x; \
|
const size_t k = blockIdx.x * blockDim.x + threadIdx.x; \
|
||||||
size_t idx = 0;
|
size_t idx = k*size*size;
|
||||||
#else
|
#else
|
||||||
#define FOR_K() for (size_t k=0, idx=0; k < size; k++)
|
#define FOR_K() for (size_t k=0, idx=0; k < size; k++)
|
||||||
#endif
|
#endif
|
||||||
|
|||||||
Loading…
Reference in New Issue
Block a user