Files

Ignoring revisions in .git-blame-ignore-revs. Click here to bypass and see the normal blame view.

208 rader
9.1 KiB
C++
Permalänk Normal vy Historik

2022-03-02 15:50:16 -05:00
/*************************************************************************
2023-04-06 12:28:53 -06:00
* Copyright (c) 2022-2023 Advanced Micro Devices, Inc. All rights reserved.
2022-03-02 15:50:16 -05:00
*
* See LICENSE.txt for license information
************************************************************************/
#include "TestBed.hpp"
namespace RcclUnitTesting
{
TEST(SendRecv, SinglePairs)
{
TestBed testBed;
// Configuration
std::vector<ncclDataType_t> const& testDataTypes = {ncclInt32, ncclFloat16, ncclFloat64};
2023-08-29 09:14:18 -06:00
std::vector<int> const numElements = {1048576, 53327, 1024, 0};
2022-03-02 15:50:16 -05:00
bool const inPlace = false;
bool const useManagedMem = false;
OptionalColArgs options;
std::vector<ncclDataType_t> dataTypes;
testBed.GetSupportedDataTypes(dataTypes, testDataTypes);
if (dataTypes.empty()) {
GTEST_SKIP() << "Skipping... test datatypes excluded by UT_DATATYPES.";
}
2022-03-02 15:50:16 -05:00
bool isCorrect = true;
int numGpus = testBed.ev.maxGpus;
for (int rpg=0; rpg < 2 && isCorrect; ++rpg)
2022-03-02 15:50:16 -05:00
for (int isMultiProcess = 0; isMultiProcess <= 1 && isCorrect; ++isMultiProcess)
{
if (!(testBed.ev.processMask & (1 << isMultiProcess))) continue;
int ranksPerGpu = rpg == 0 ? 1 : testBed.ev.maxRanksPerGpu;
int totalRanks = numGpus * ranksPerGpu;
int const numProcesses = isMultiProcess ? numGpus : 1;
const std::vector<int>& gpuPriorityOrder = testBed.ev.GetGpuPriorityOrder();
testBed.InitComms(TestBed::GetDeviceIdsList(numProcesses, numGpus, ranksPerGpu, gpuPriorityOrder),
2024-10-30 15:13:53 -04:00
{1,2}, //two group, second group sendrecv to self, has 2 coll
testBed.GetNumStreamsPerGroup(1,2),
2);
2022-03-02 15:50:16 -05:00
for (int dataIdx = 0; dataIdx < dataTypes.size() && isCorrect; ++dataIdx)
for (int numIdx = 0; numIdx < numElements.size() && isCorrect; ++numIdx)
for (int sendRank = 0; sendRank < totalRanks; ++sendRank)
{
for (int recvRank = 0; recvRank < totalRanks; ++recvRank)
{
options.root = recvRank;
2024-10-30 15:13:53 -04:00
int groupCallId = sendRank == recvRank; //self sendrecv group has two coll
int recvId = sendRank == recvRank; //where recv will be second coll
2022-03-02 15:50:16 -05:00
testBed.SetCollectiveArgs(ncclCollSend,
dataTypes[dataIdx],
numElements[numIdx],
numElements[numIdx],
options,
2022-03-02 15:50:16 -05:00
0,
groupCallId,
2022-03-02 15:50:16 -05:00
sendRank);
if (recvRank == 0)
{
2024-10-30 15:13:53 -04:00
//set up the collArg slot to make sure AllocateMem is called once and correctly
testBed.SetCollectiveArgs(ncclCollSend,
2022-03-02 15:50:16 -05:00
dataTypes[dataIdx],
numElements[numIdx],
numElements[numIdx],
options,
2022-03-02 15:50:16 -05:00
0,
2024-10-30 15:13:53 -04:00
!groupCallId,
sendRank);
testBed.AllocateMem(inPlace, useManagedMem, 0, 0, sendRank);
testBed.PrepareData(0, 0, sendRank);
testBed.AllocateMem(inPlace, useManagedMem, 1, 0, sendRank);
testBed.PrepareData(1, 0, sendRank);
2022-03-02 15:50:16 -05:00
}
2024-10-30 15:13:53 -04:00
if (testBed.ev.showNames) // Show test names
INFO("%s Datatype: %s SendReceive test Rank %d -> Rank %d for %d Elements\n",
isMultiProcess ? "MP" : "SP",
ncclDataTypeNames[dataTypes[dataIdx]],
sendRank,
recvRank,
numElements[numIdx]);
options.root = sendRank;
testBed.SetCollectiveArgs(ncclCollRecv,
dataTypes[dataIdx],
numElements[numIdx],
numElements[numIdx],
options,
recvId,
groupCallId,
recvRank);
testBed.AllocateMem(inPlace, useManagedMem, groupCallId, recvId, recvRank);
testBed.PrepareData(groupCallId, recvId, recvRank);
testBed.ExecuteCollectives({sendRank, recvRank}, groupCallId);
testBed.ValidateResults(isCorrect, groupCallId, recvId, recvRank);
testBed.DeallocateMem(groupCallId, recvId, recvRank);
2022-03-02 15:50:16 -05:00
}
2024-10-30 15:13:53 -04:00
testBed.DeallocateMem(0, 0, sendRank);
testBed.DeallocateMem(1, 0, sendRank);
2022-03-02 15:50:16 -05:00
}
testBed.DestroyComms();
}
testBed.Finalize();
}
TEST(SendRecv, UserBufferRegister)
{
setenv("RCCL_ENABLE_INTRANET", "1", 1);
TestBed testBed;
// Configuration
std::vector<ncclDataType_t> const& testDataTypes = {ncclInt32, ncclFloat16, ncclFloat64};
2024-09-24 18:16:51 -04:00
std::vector<int> const numElements = {1048576, 53327, 1024};
bool const inPlace = false;
bool const useManagedMem = false;
bool const userRegistered = true;
OptionalColArgs options;
std::vector<ncclDataType_t> dataTypes;
testBed.GetSupportedDataTypes(dataTypes, testDataTypes);
if (dataTypes.empty()) {
GTEST_SKIP() << "Skipping... test datatypes excluded by UT_DATATYPES.";
}
bool isCorrect = true;
int numGpus = testBed.ev.maxGpus;
for (int rpg=0; rpg < 2 && isCorrect; ++rpg)
for (int isMultiProcess = 0; isMultiProcess <= 1 && isCorrect; ++isMultiProcess)
{
if (!(testBed.ev.processMask & (1 << isMultiProcess))) continue;
int ranksPerGpu = rpg == 0 ? 1 : testBed.ev.maxRanksPerGpu;
int totalRanks = numGpus * ranksPerGpu;
int const numProcesses = isMultiProcess ? numGpus : 1;
const std::vector<int>& gpuPriorityOrder = testBed.ev.GetGpuPriorityOrder();
testBed.InitComms(TestBed::GetDeviceIdsList(numProcesses, numGpus, ranksPerGpu, gpuPriorityOrder),
2024-10-30 15:13:53 -04:00
{1,2}, //two group, second group sendrecv to self, has 2 coll
testBed.GetNumStreamsPerGroup(1,2),
2);
for (int dataIdx = 0; dataIdx < dataTypes.size() && isCorrect; ++dataIdx)
for (int numIdx = 0; numIdx < numElements.size() && isCorrect; ++numIdx)
for (int sendRank = 0; sendRank < totalRanks; ++sendRank)
{
for (int recvRank = 0; recvRank < totalRanks; ++recvRank)
{
options.root = recvRank;
2024-10-30 15:13:53 -04:00
int groupCallId = sendRank == recvRank;
int recvId = sendRank == recvRank;
testBed.SetCollectiveArgs(ncclCollSend,
dataTypes[dataIdx],
numElements[numIdx],
numElements[numIdx],
options,
0,
groupCallId,
sendRank);
if (recvRank == 0)
{
2024-10-30 15:13:53 -04:00
testBed.SetCollectiveArgs(ncclCollSend,
dataTypes[dataIdx],
numElements[numIdx],
numElements[numIdx],
options,
0,
2024-10-30 15:13:53 -04:00
!groupCallId,
sendRank);
testBed.AllocateMem(inPlace, useManagedMem, 0, 0, sendRank, userRegistered);
testBed.PrepareData(0, 0, sendRank);
testBed.AllocateMem(inPlace, useManagedMem, 1, 0, sendRank, userRegistered);
testBed.PrepareData(1, 0, sendRank);
}
2024-10-30 15:13:53 -04:00
if (testBed.ev.showNames) // Show test names
INFO("%s Datatype: %s SendReceive test Rank %d -> Rank %d for %d Elements\n",
isMultiProcess ? "MP" : "SP",
ncclDataTypeNames[dataTypes[dataIdx]],
sendRank,
recvRank,
numElements[numIdx]);
options.root = sendRank;
testBed.SetCollectiveArgs(ncclCollRecv,
dataTypes[dataIdx],
numElements[numIdx],
numElements[numIdx],
options,
recvId,
groupCallId,
recvRank);
testBed.AllocateMem(inPlace, useManagedMem, groupCallId, recvId, recvRank, userRegistered);
testBed.PrepareData(groupCallId, recvId, recvRank);
testBed.ExecuteCollectives({sendRank, recvRank}, groupCallId);
testBed.ValidateResults(isCorrect, groupCallId, recvId, recvRank);
testBed.DeallocateMem(groupCallId, recvId, recvRank);
}
2024-10-30 15:13:53 -04:00
testBed.DeallocateMem(0, 0, sendRank);
testBed.DeallocateMem(1, 0, sendRank);
}
testBed.DestroyComms();
}
testBed.Finalize();
unsetenv("RCCL_ENABLE_INTRANET");
}
}