Files
rocm-systems/src/team.cpp
T
Edgar Gabriel e4c427a736 Remove MPI compile-time dependency (#264)
* use dlsym for MPI functions

to allow compiling without MPI support, convert the usage of MPI functions and symbols to be based on a dlopen/dlsym based mechanism. Turns out this cannot be done entirely vendor neutral, slightly different solutions might be required for Open MPI, MPICH and the new MPI ABI.

* checkpoint

more work to be done.

* checkpoint 2

* checkpoint 3

* checkpoint 4

examples compile and link correctly

* checkpoitn 5 (I think)

* Checkpoitn 6

* dyld-mpi: adapt GDA

* dyldmpi: tests that depend on MPI need to link with it themselves

* do not ../mpi_instance.h

* dyldmpi: make the symetricHeapTestFixture compile

* dyldmpi: Change cmakery, compiles and run gda w/o external MPI

* Make it also compile in external MPI mode

* dyldmpi: ipc unit tests compile but do not link

* dyldmpi: new approach, if external mpi required, link with mpi,
otherwise use ompi5 abi

* C-style comments in cmakelist..

* dyldmpi: examples: do not fail compiling if MPI not found at build time,
instead do not compile the MPI required examples

* more updates to CMake logic

* convert RO backend

and a few other cleanups

* update some unit tests

to work with the dlopen MPI environment correctly.

---------

Co-authored-by: Aurelien Bouteiller <abouteil@amd.com>
2025-10-01 08:06:56 -05:00

125 lines
3.9 KiB
C++

/******************************************************************************
* Copyright (c) Advanced Micro Devices, Inc. All rights reserved.
*
* SPDX-License-Identifier: MIT
*
* Permission is hereby granted, free of charge, to any person obtaining a copy
* of this software and associated documentation files (the "Software"), to
* deal in the Software without restriction, including without limitation the
* rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
* sell copies of the Software, and to permit persons to whom the Software is
* furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
* AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
* IN THE SOFTWARE.
*****************************************************************************/
#include "team.hpp"
#include <cmath>
#include "rocshmem/rocshmem.hpp"
#include "backend_bc.hpp"
#include "util.hpp"
#include "mpi_instance.hpp"
namespace rocshmem {
rocshmem_team_t ROCSHMEM_TEAM_WORLD;
__host__ __device__ Team* get_internal_team(rocshmem_team_t team) {
return reinterpret_cast<Team*>(team);
}
ROTeam* get_internal_ro_team(rocshmem_team_t team) {
return reinterpret_cast<ROTeam*>(team);
}
IPCTeam* get_internal_ipc_team(rocshmem_team_t team) {
return reinterpret_cast<IPCTeam*>(team);
}
GDATeam* get_internal_gda_team(rocshmem_team_t team) {
return reinterpret_cast<GDATeam*>(team);
}
__host__ __device__ int team_translate_pe(rocshmem_team_t src_team, int src_pe,
rocshmem_team_t dst_team) {
if (src_team == ROCSHMEM_TEAM_INVALID ||
dst_team == ROCSHMEM_TEAM_INVALID) {
return -1;
}
Team* src_team_obj{get_internal_team(src_team)};
Team* dst_team_obj{get_internal_team(dst_team)};
int src_pe_in_world{src_team_obj->get_pe_in_world(src_pe)};
int dst_pe{dst_team_obj->get_pe_in_my_team(src_pe_in_world)};
return dst_pe;
}
__host__ __device__ TeamInfo::TeamInfo(Team* _parent_team, int _pe_start,
int _stride, int _size)
: parent_team(_parent_team),
pe_start(_pe_start),
stride(_stride),
size(_size) {
log_stride = log2(stride);
}
__host__ Team::Team(Backend* handle, TeamInfo* team_info_wrt_parent,
TeamInfo* team_info_wrt_world, int _num_pes, int _my_pe,
MPI_Comm _mpi_comm)
: world_size(handle->getNumPEs()),
my_pe_in_world(handle->getMyPE()),
tinfo_wrt_parent(team_info_wrt_parent),
tinfo_wrt_world(team_info_wrt_world),
num_pes(_num_pes),
my_pe(_my_pe) {
if (_mpi_comm != MPI_COMM_NULL) {
mpilib_ftable_.Comm_dup (_mpi_comm, &mpi_comm);
}
}
__host__ __device__ int Team::get_pe_in_world(int pe) {
int pe_start{tinfo_wrt_world->pe_start};
int stride{tinfo_wrt_world->stride};
return pe_start + stride * pe;
}
__host__ __device__ int Team::get_pe_in_my_team(int pe_in_world) {
int pe_start{tinfo_wrt_world->pe_start};
int stride{tinfo_wrt_world->stride};
if (pe_in_world < pe_start) {
return -1; // Outside the start of the range
}
if ((pe_in_world - pe_start) % stride) {
return -1; // Not a multiple of stride
}
int pe_in_my_team{(pe_in_world - pe_start) / stride};
if (pe_in_my_team >= num_pes) {
return -1; // Outside the end of the range
}
return pe_in_my_team;
}
__host__ Team::~Team() {
if (mpi_comm != MPI_COMM_NULL)
mpilib_ftable_.Comm_free (&mpi_comm);
}
} // namespace rocshmem