Fix the reordering kernel in cuda
This commit is contained in:
parent
93cba3c3ab
commit
e4f326e394
@@ -28,7 +28,7 @@ namespace atrip {
|
||||
#if defined(HAVE_CUDA)
|
||||
#define FOR_K() \
|
||||
const size_t k = blockIdx.x * blockDim.x + threadIdx.x; \
|
||||
- size_t idx = 0;
|
||||
+ size_t idx = k*size*size;
|
||||
#else
|
||||
#define FOR_K() for (size_t k=0, idx=0; k < size; k++)
|
||||
#endif
|
||||
|
||||
Loading…
Reference in New Issue
Block a user