diff --git a/projects/rccl/src/device/common_kernel.h b/projects/rccl/src/device/common_kernel.h index 98113702fc..31dd2b05d3 100644 --- a/projects/rccl/src/device/common_kernel.h +++ b/projects/rccl/src/device/common_kernel.h @@ -32,11 +32,7 @@ template -#if defined(__gfx942__) || defined(__gfx950__) __device__ __forceinline__ void reduceCopyPacks( -#else -__device__ __attribute__((noinline)) void reduceCopyPacks( -#endif int nThreads, int &thread, uint64_t redArg, uint64_t *preOpArgs, bool postOp, int nSrcs, SrcPtrFn const &srcPtrFn, int nDsts, DstPtrFn const &dstPtrFn, @@ -428,11 +424,7 @@ template -#if defined(__gfx942__) || defined(__gfx950__) __device__ __forceinline__ void reduceCopyPacksWithBias( -#else -__device__ __attribute__((noinline)) void reduceCopyPacksWithBias( -#endif int nThreads, int &thread, uint64_t redArg, uint64_t *preOpArgs, bool postOp, int nSrcs, SrcPtrFn const &srcPtrFn, int nDsts, DstPtrFn const &dstPtrFn,