diff --git a/include/atrip/SliceUnion.hpp b/include/atrip/SliceUnion.hpp index 008c926..6ecaf9a 100644 --- a/include/atrip/SliceUnion.hpp +++ b/include/atrip/SliceUnion.hpp @@ -465,30 +465,30 @@ template #if defined(HAVE_CUDA) LOG(1,"Atrip") << "warming communication up " << slices.size() << "\n"; - WITH_CHRONO("cuda:warmup", - int nRanks=Atrip::np, requestCount=0; - int nSends=sliceBuffers.size()*nRanks; - MPI_Request *requests = (MPI_Request*) malloc(nSends*2 * sizeof(MPI_Request)); - MPI_Status *statuses = (MPI_Status*) malloc(nSends*2 * sizeof(MPI_Status)); - for (int sliceId=0; sliceId(), - rankId, - 100, - universe, - &requests[requestCount++]); - MPI_Irecv((void*)sliceBuffers[sliceId], - sliceSize, - traits::mpi::datatypeOf(), - rankId, - 100, - universe, - &requests[requestCount++]); - } - } - MPI_Waitall(nSends*2, requests, statuses); + WITH_CHRONO("cuda:warmup", + int nRanks=Atrip::np, requestCount=0; + int nSends=sliceBuffers.size()*nRanks; + MPI_Request *requests = (MPI_Request*) malloc(nSends*2 * sizeof(MPI_Request)); + MPI_Status *statuses = (MPI_Status*) malloc(nSends*2 * sizeof(MPI_Status)); + for (int sliceId=0; sliceId(), + rankId, + 100, + universe, + &requests[requestCount++]); + MPI_Irecv((void*)sliceBuffers[sliceId], + sliceSize, + traits::mpi::datatypeOf(), + rankId, + 100, + universe, + &requests[requestCount++]); + } + } + MPI_Waitall(nSends*2, requests, statuses); ) #endif