Add a chrono for the MPI memcpy in CUDA
This commit is contained in:
parent
00a28c990c
commit
49ff3b377c
@@ -457,7 +457,8 @@ void unwrapAndMarkReady() {
|
|||||||
|
|
||||||
#if defined(HAVE_CUDA)
|
#if defined(HAVE_CUDA)
|
||||||
// copy the retrieved mpi data to the device
|
// copy the retrieved mpi data to the device
|
||||||
cuMemcpyHtoD(data, (void*)mpi_data, sizeof(F) * size);
|
WITH_CHRONO("cuda:memcpy",
|
||||||
|
cuMemcpyHtoD(data, (void*)mpi_data, sizeof(F) * size);)
|
||||||
std::free(mpi_data);
|
std::free(mpi_data);
|
||||||
#endif
|
#endif
|
||||||
|
|
||||||
|
|||||||
Loading…
Reference in New Issue
Block a user