diff --git a/src/graph/paths.cc b/src/graph/paths.cc index a1f8d96896..de78d804d8 100644 --- a/src/graph/paths.cc +++ b/src/graph/paths.cc @@ -458,6 +458,7 @@ ncclResult_t ncclTopoNeedFlush(struct ncclTopoSystem* system, int64_t busId, int NCCLCHECK(ncclTopoIdToIndex(system, GPU, busId, &g)); struct ncclTopoNode* gpu = system->nodes[GPU].nodes+g; #if defined(__HIP_PLATFORM_AMD__) || defined(__HIPCC__) + *flush = 1; #else // Flush is required on Ampere and earlier *flush = gpu->gpu.cudaCompCap < 90 ? 1 : ncclParamNetForceFlush();