From 5783917a751f6cd3cf93a716cb2a6e8a7844aed7 Mon Sep 17 00:00:00 2001 From: Gilbert Lee Date: Fri, 20 Dec 2019 17:08:39 -0800 Subject: [PATCH] Changing single sync mode to time all iterations instead of just last [ROCm/rccl commit: e5074ce94de0df40c460ab611df1ee11eca6344f] --- projects/rccl/tools/TransferBench/TransferBench.cpp | 13 ++++++++----- 1 file changed, 8 insertions(+), 5 deletions(-) diff --git a/projects/rccl/tools/TransferBench/TransferBench.cpp b/projects/rccl/tools/TransferBench/TransferBench.cpp index 016ff80ed4..5bdccdf807 100644 --- a/projects/rccl/tools/TransferBench/TransferBench.cpp +++ b/projects/rccl/tools/TransferBench/TransferBench.cpp @@ -28,7 +28,9 @@ THE SOFTWARE. #include #include #include - +#include +#include +#include #include #include "copy_kernel.h" #include "TransferBench.hpp" @@ -272,7 +274,8 @@ int main(int argc, char **argv) { HIP_CALL(hipSetDevice(links[i].srcGpu)); - HIP_CALL(hipEventRecord(startEvents[i], streams[i])); + if (!useSingleSync || iteration == 0) + HIP_CALL(hipEventRecord(startEvents[i], streams[i])); if (useHipCall) { @@ -308,7 +311,8 @@ int main(int argc, char **argv) gpuBlockParams[i]); } } - HIP_CALL(hipEventRecord(stopEvents[i], streams[i])); + if (!useSingleSync || iteration == numIterations - 1) + HIP_CALL(hipEventRecord(stopEvents[i], streams[i])); } // Synchronize per iteration, unless in single sync mode, in which case @@ -378,8 +382,7 @@ int main(int argc, char **argv) } else { - if (!useSingleSync) - totalGpuTime[i] /= (1.0 * numIterations); + totalGpuTime[i] /= (1.0 * numIterations); printf("%8.3f", (linkCount[i] * numBytesPerLink / 1.0E9) / totalGpuTime[i]); } }