Set flags when calling hipExtLaunchMultiKernelMultiDevice in hip-clang

This commit is contained in:
Wenkai Du
2020-05-08 15:53:51 +00:00
parent 33c23fdcda
commit 24ea2ef6dd
+4
View File
@@ -74,7 +74,11 @@ ncclResult_t ncclLaunchCooperativeKernelMultiDevice(hipLaunchParams *paramsList,
if (cgMode & 0x01) {
CUDACHECK(hipExtLaunchMultiKernelMultiDevice(paramsList, numDevices,
// These flags reduce the latency of this API call; they are passed only when building with hip-clang (__HIP__), otherwise 0 is passed
#if __HIP__
hipCooperativeLaunchMultiDeviceNoPreSync|hipCooperativeLaunchMultiDeviceNoPostSync));
#else
0));
#endif
return ncclSuccess;
}
int savedDev;