/************************************************************************* * Copyright (c) 2019-2021 Advanced Micro Devices, Inc. All rights reserved. * * See LICENSE.txt for license information ************************************************************************/ #include "test_CombinedCallsMultiProcess.hpp" namespace CorrectnessTests { TEST_P(CombinedCallsMultiProcessCorrectnessTest, Correctness) { // Important: Make sure the order of ncclFunc_t's here match the order of ncclFunc_ts // as they appear in TestCombinedCalls() std::vector ncclFuncs; ncclFuncs.push_back(ncclCollAllGather); ncclFuncs.push_back(ncclCollAllReduce); ncclFuncs.push_back(ncclCollBroadcast); ncclFuncs.push_back(ncclCollReduce); ncclFuncs.push_back(ncclCollReduceScatter); // Create multiple datasets for combined operation std::vector datasets(ncclFuncs.size()); for (int i = 0; i < datasets.size(); i++) { datasets[i] = (Dataset*)mmap(NULL, sizeof(Dataset), PROT_READ|PROT_WRITE, MAP_SHARED|MAP_ANONYMOUS, -1, 0); datasets[i]->InitializeRootProcess(numDevices, numElements, dataType, inPlace, ncclFuncs[i]); } std::vector pids(numDevices); int gpu = -1; for (int i = 0; i < numDevices; i++) { gpu++; int pid = fork(); if (pid == 0) { bool pass; TestCombinedCalls(gpu, datasets, ncclFuncs, pass); TerminateChildProcess(pass); } else { pids[gpu] = pid; } } ValidateProcesses(pids); for (int i = 0; i < datasets.size(); i++) { munmap(datasets[i], sizeof(Dataset)); } } INSTANTIATE_TEST_SUITE_P(CombinedCallsMultiProcessCorrectnessSweep, CombinedCallsMultiProcessCorrectnessTest, testing::Combine( // Reduction operator (not used) testing::Values(ncclSum), // Data types testing::Values(ncclInt8, ncclUint8, ncclInt32, ncclUint32, ncclInt64, ncclUint64, //ncclFloat16, ncclFloat32, ncclFloat64, ncclBfloat16), // Number of elements testing::Values(3072, 3145728), // Number of devices testing::Values(2,3,4,8), // In-place or not testing::Values(false, true), testing::Values("")), CorrectnessTest::PrintToStringParamName()); } // namespace