diff --git a/projects/rccl/src/clique/AllReduceCliqueKernel.h b/projects/rccl/src/clique/AllReduceCliqueKernel.h index 67a306d3c7..9889e9a9d5 100644 --- a/projects/rccl/src/clique/AllReduceCliqueKernel.h +++ b/projects/rccl/src/clique/AllReduceCliqueKernel.h @@ -67,7 +67,7 @@ __device__ void AllReduceCliqueSplitKernel(struct CollectiveArgs* args) } // Perform the reduction - #define ALL_REDUCE_CLIQUE_UNROLL 2 + #define ALL_REDUCE_CLIQUE_UNROLL 1 ReduceOrCopyMulti( threadIdx.x, blockDim.x, NUM_RANKS, srcs, NUM_RANKS, dsts, blockN); }