f8bd2d0cfa
[ROCm/rccl commit: 3a919c1f49]
63 line
1.4 KiB
C
63 line
1.4 KiB
C
/*************************************************************************
|
|
* Copyright (c) 2019-2021, NVIDIA CORPORATION. All rights reserved.
|
|
* Modifications Copyright (c) 2019-2021 Advanced Micro Devices, Inc. All rights reserved.
|
|
*
|
|
* See LICENSE.txt for license information
|
|
************************************************************************/
|
|
|
|
#ifndef NCCL_INFO_H_
|
|
#define NCCL_INFO_H_
|
|
|
|
#include "nccl.h"
|
|
#include "devcomm.h"
|
|
#include "collectives.h"
|
|
|
|
typedef enum {
|
|
ncclPatternRing,
|
|
ncclPatternRingTwice,
|
|
ncclPatternPipelineFrom,
|
|
ncclPatternPipelineTo,
|
|
ncclPatternTreeUp,
|
|
ncclPatternTreeDown,
|
|
ncclPatternTreeUpDown,
|
|
ncclPatternCollTreeUpDown
|
|
} ncclPattern_t;
|
|
|
|
// Used to pass NCCL call information between functions
|
|
struct ncclInfo {
|
|
ncclFunc_t coll;
|
|
const char* opName;
|
|
// NCCL Coll Args
|
|
const void* sendbuff;
|
|
void* recvbuff;
|
|
size_t count;
|
|
ncclDataType_t datatype;
|
|
ncclRedOp_t op;
|
|
int root;
|
|
ncclComm_t comm;
|
|
hipStream_t stream;
|
|
// Algorithm details
|
|
int chunkSteps;
|
|
int sliceSteps;
|
|
// Computed later
|
|
ncclDevRedOpFull opFull;
|
|
int algorithm;
|
|
int protocol;
|
|
ncclPattern_t pattern;
|
|
int nChannels;
|
|
int nThreads;
|
|
size_t nBytes;
|
|
int nstepsPerLoop;
|
|
int nchunksPerLoop;
|
|
ssize_t sendbytes;
|
|
ssize_t recvbytes;
|
|
int recvChunkSize;
|
|
int sendChunkSize;
|
|
uint32_t delta;
|
|
int channelId;
|
|
uint16_t sendIdx;
|
|
uint16_t recvIdx;
|
|
};
|
|
|
|
#endif
|