diff --git a/src/graph/tuning.cc b/src/graph/tuning.cc index 3faf2cd73a..e858888ffc 100644 --- a/src/graph/tuning.cc +++ b/src/graph/tuning.cc @@ -736,7 +736,7 @@ ncclResult_t ncclTopoTuneModel(struct ncclComm* comm, int minCompCap, int maxCom for (int c=0; ctopo->nodes[GPU].nodes[0].gpu.gcn, "gfx12")) ? 0 : protoEnable[c*NCCL_NUM_PROTOCOLS+p]; - if (p == NCCL_PROTO_LL128) { + if (pEnable != 0 && p == NCCL_PROTO_LL128) { #if defined(__HIP_PLATFORM_AMD__) || defined(__HIPCC__) #if defined(ENABLE_LL128) // Enable LL128 by default only on gfx90a with available tuning table