diff --git a/projects/rccl/src/device/all_reduce.h b/projects/rccl/src/device/all_reduce.h index 39e7d3d62b..1d431bce23 100644 --- a/projects/rccl/src/device/all_reduce.h +++ b/projects/rccl/src/device/all_reduce.h @@ -59,14 +59,6 @@ namespace { } #endif - int minChunkSize; - if (Proto::Id == NCCL_PROTO_LL) - minChunkSize = nthreads*(Proto::calcBytePerGrain()/sizeof(T)); - if (Proto::Id == NCCL_PROTO_LL128) { - // We should not need the final /2 but it makes performance much, much smoother. Might be a bug somewhere. - minChunkSize = nthreads*(Proto::calcBytePerGrain()/sizeof(T))/2; - } - Primitives, 0, Proto, 0> prims (tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); @@ -1030,4 +1022,4 @@ struct RunWorkElement(args); //LAUNCH_CLIQUE_KERNEL(AllReduceCliqueSplitKernel, RedOp, T, args); } -}; \ No newline at end of file +};