Replace the NCCL/CUDA-related parts of api_trace.h with RCCL/HIP (#1326)

Co-authored-by: Marzieh Berenjkoub <mberenjk@amd.com>
Этот коммит содержится в:
mberenjk
2024-09-10 11:05:14 -05:00
коммит произвёл GitHub
родитель 289a80c4e9
Коммит 4ceb672179
+7 -7
Просмотреть файл
@@ -22,7 +22,7 @@
#pragma once
#include "nccl.h"
#include <rccl/rccl.h>
#include <stddef.h>
#include <stdint.h>
@@ -60,7 +60,7 @@ typedef ncclResult_t (*ncclAllGather_fn_t)(const void* sendbuff, void* recvbuff,
/* ncclAllReduce_fn_t: pointer to a function returning ncclResult_t and taking
 * (sendbuff, recvbuff, count, datatype, op, comm, stream).
 * Diff view: the two `stream` lines below are a before/after pair. Per the
 * commit title, the cudaStream_t line is the removed one and the hipStream_t
 * line is its replacement.
 * NOTE(review): comm is spelled `struct ncclComm*` here, while neighbouring
 * typedefs use `ncclComm_t` -- presumably the same type; confirm. */
typedef ncclResult_t (*ncclAllReduce_fn_t)(const void* sendbuff, void* recvbuff,
size_t count, ncclDataType_t datatype,
ncclRedOp_t op, struct ncclComm* comm,
cudaStream_t stream);
hipStream_t stream);
/* ncclAllToAll_fn_t: pointer to a function returning ncclResult_t and taking
 * (sendbuff, recvbuff, count, datatype, comm, stream), where sendbuff is
 * const-qualified and stream is a hipStream_t. */
typedef ncclResult_t (*ncclAllToAll_fn_t)(const void* sendbuff, void* recvbuff,
size_t count, ncclDataType_t datatype,
ncclComm_t comm, hipStream_t stream);
@@ -71,27 +71,27 @@ typedef ncclResult_t (*ncclAllToAllv_fn_t)(
/* ncclBroadcast_fn_t: pointer to a function returning ncclResult_t and taking
 * (sendbuff, recvbuff, count, datatype, root, comm, stream).
 * Diff view: the two `stream` lines below are a before/after pair. Per the
 * commit title, cudaStream_t is the removed line and hipStream_t replaces it. */
typedef ncclResult_t (*ncclBroadcast_fn_t)(const void* sendbuff, void* recvbuff,
size_t count, ncclDataType_t datatype,
int root, ncclComm_t comm,
cudaStream_t stream);
hipStream_t stream);
/* ncclGather_fn_t: pointer to a function returning ncclResult_t and taking
 * (sendbuff, recvbuff, sendcount, datatype, root, comm, stream), where
 * sendbuff is const-qualified and stream is a hipStream_t. */
typedef ncclResult_t (*ncclGather_fn_t)(const void* sendbuff, void* recvbuff,
size_t sendcount, ncclDataType_t datatype,
int root, ncclComm_t comm, hipStream_t stream);
/* ncclReduce_fn_t: pointer to a function returning ncclResult_t and taking
 * (sendbuff, recvbuff, count, datatype, op, root, comm, stream).
 * Diff view: the two `stream` lines below are a before/after pair. Per the
 * commit title, cudaStream_t is the removed line and hipStream_t replaces it. */
typedef ncclResult_t (*ncclReduce_fn_t)(const void* sendbuff, void* recvbuff,
size_t count, ncclDataType_t datatype,
ncclRedOp_t op, int root, ncclComm_t comm,
cudaStream_t stream);
hipStream_t stream);
/* ncclReduceScatter_fn_t: pointer to a function returning ncclResult_t and
 * taking (sendbuff, recvbuff, recvcount, datatype, op, comm, stream).
 * Diff view: the two `stream` lines below are a before/after pair. Per the
 * commit title, cudaStream_t is the removed line and hipStream_t replaces it.
 * NOTE(review): comm is spelled `struct ncclComm*` here, while neighbouring
 * typedefs use `ncclComm_t` -- presumably the same type; confirm. */
typedef ncclResult_t (*ncclReduceScatter_fn_t)(const void* sendbuff, void* recvbuff,
size_t recvcount, ncclDataType_t datatype,
ncclRedOp_t op, struct ncclComm* comm,
cudaStream_t stream);
hipStream_t stream);
/* ncclScatter_fn_t: pointer to a function returning ncclResult_t and taking
 * (sendbuff, recvbuff, recvcount, datatype, root, comm, stream), where
 * sendbuff is const-qualified and stream is a hipStream_t. */
typedef ncclResult_t (*ncclScatter_fn_t)(const void* sendbuff, void* recvbuff,
size_t recvcount, ncclDataType_t datatype,
int root, ncclComm_t comm, hipStream_t stream);
/* ncclSend_fn_t: pointer to a function returning ncclResult_t and taking
 * (sendbuff, count, datatype, peer, comm, stream); sendbuff is const-qualified.
 * Diff view: the two `stream` lines below are a before/after pair. Per the
 * commit title, cudaStream_t is the removed line and hipStream_t replaces it. */
typedef ncclResult_t (*ncclSend_fn_t)(const void* sendbuff, size_t count,
ncclDataType_t datatype, int peer, ncclComm_t comm,
cudaStream_t stream);
hipStream_t stream);
/* ncclRecv_fn_t: pointer to a function returning ncclResult_t and taking
 * (recvbuff, count, datatype, peer, comm, stream); recvbuff is non-const.
 * Diff view: the two `stream` lines below are a before/after pair. Per the
 * commit title, cudaStream_t is the removed line and hipStream_t replaces it. */
typedef ncclResult_t (*ncclRecv_fn_t)(void* recvbuff, size_t count,
ncclDataType_t datatype, int peer, ncclComm_t comm,
cudaStream_t stream);
hipStream_t stream);
typedef ncclResult_t (*ncclRedOpCreatePreMulSum_fn_t)(ncclRedOp_t* op, void* scalar,
ncclDataType_t datatype,
ncclScalarResidence_t residence,