// MIT License // // Copyright (c) 2020, The Regents of the University of California, // through Lawrence Berkeley National Laboratory (subject to receipt of any // required approvals from the U.S. Dept. of Energy). All rights reserved. // // Permission is hereby granted, free of charge, to any person obtaining a copy // of this software and associated documentation files (the "Software"), to deal // in the Software without restriction, including without limitation the rights // to use, copy, modify, merge, publish, distribute, sublicense, and/or sell // copies of the Software, and to permit persons to whom the Software is // furnished to do so, subject to the following conditions: // // The above copyright notice and this permission notice shall be included in all // copies or substantial portions of the Software. // // THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR // IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, // FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE // AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER // LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, // OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE // SOFTWARE. 
#include "core/common.hpp"
#include "core/components/fwd.hpp"
#include "core/defines.hpp"
#include "core/timemory.hpp"
#include "library/components/category_region.hpp"

// NOTE(review): the bare `#include` directives in this file carry no header name
// in the reviewed text; they are reproduced verbatim -- restore the targets from
// version control before building.
#include
#include
#include
#include
#include
#include

#if defined(ROCPROFSYS_USE_MPI)
#    include
#endif

#include
#include
#include
#include
#include
#include

// NOTE(review): `data_tracker`, `base`, `auto_tuple` and `invoke` below appear
// without template argument lists in the reviewed text -- confirm against the
// repository copy.
ROCPROFSYS_COMPONENT_ALIAS(comm_data_tracker_t, ::tim::component::data_tracker)

namespace rocprofsys
{
namespace component
{
using gotcha_data = ::tim::component::gotcha_data;

/// Component exposing `audit` overloads for wrapped MPI and UCX entry points.
///
/// Only the declarations are visible in this header, so what each overload
/// records is defined elsewhere (presumably the communicated data volume --
/// verify against the definitions). The private `add` helpers accumulate a
/// `data_type` value into a `tracker_t`.
struct comm_data : base
{
    using value_type = void;
    using this_type  = comm_data;
    using base_type  = base;
    using tracker_t  = tim::auto_tuple;
    using data_type  = float;

    // Tag types: each provides a `value` string and a `label` string.
    struct mpi_recv
    {
        static constexpr auto value = "comm_data";
        static constexpr auto label = "MPI Comm Recv";
    };

    struct mpi_send
    {
        static constexpr auto value = "comm_data";
        static constexpr auto label = "MPI Comm Send";
    };

    struct ucx_recv
    {
        static constexpr auto value = "comm_data";
        static constexpr auto label = "UCX Comm Recv";
    };

    struct ucx_send
    {
        static constexpr auto value = "comm_data";
        static constexpr auto label = "UCX Comm Send";
    };

    ROCPROFSYS_DEFAULT_OBJECT(comm_data)

    // Static hooks; all but stop() are defined outside this header.
    static void preinit();
    static void configure();
    static void global_finalize();
    static void start();
    // Intentionally empty: there is nothing to do on stop.
    static void stop() {}

#if defined(ROCPROFSYS_USE_MPI)
    /// Query the size of @p _datatype through PMPI_Type_size.
    ///
    /// The status code returned by PMPI_Type_size is not inspected; if the call
    /// does not write to the output argument, the initial value 0 is returned.
    static int mpi_type_size(MPI_Datatype _datatype)
    {
        int _nbytes = 0;
        PMPI_Type_size(_datatype, &_nbytes);
        return _nbytes;
    }

    // --- MPI point-to-point -------------------------------------------------

    // MPI_Send
    static void audit(const gotcha_data& _data, audit::incoming, const void*, int count,
                      MPI_Datatype datatype, int dst, int tag, MPI_Comm);

    // MPI_Recv
    // NOTE(review): the rank parameter is named `dst`, although for MPI_Recv this
    // positional argument is the source rank.
    static void audit(const gotcha_data& _data, audit::incoming, void*, int count,
                      MPI_Datatype datatype, int dst, int tag, MPI_Comm, MPI_Status*);

    // MPI_Isend
    static void audit(const gotcha_data& _data, audit::incoming, const void*, int count,
                      MPI_Datatype datatype, int dst, int tag, MPI_Comm, MPI_Request*);

    // MPI_Irecv
    // NOTE(review): as with MPI_Recv, `dst` sits in the source-rank position.
    static void audit(const gotcha_data& _data, audit::incoming, void*, int count,
                      MPI_Datatype datatype, int dst, int tag, MPI_Comm, MPI_Request*);

    // --- MPI collectives ----------------------------------------------------

    // MPI_Bcast
    static void audit(const gotcha_data& _data, audit::incoming, void*, int count,
                      MPI_Datatype datatype, int root, MPI_Comm);

    // MPI_Allreduce
    static void audit(const gotcha_data& _data, audit::incoming, const void*, void*,
                      int count, MPI_Datatype datatype, MPI_Op, MPI_Comm);

    // MPI_Sendrecv
    static void audit(const gotcha_data& _data, audit::incoming, const void*,
                      int sendcount, MPI_Datatype sendtype, int, int sendtag, void*,
                      int recvcount, MPI_Datatype recvtype, int, int recvtag, MPI_Comm,
                      MPI_Status*);

    // MPI_Gather
    // MPI_Scatter
    // (both share this parameter list, so a single overload serves both)
    static void audit(const gotcha_data& _data, audit::incoming, const void*,
                      int sendcount, MPI_Datatype sendtype, void*, int recvcount,
                      MPI_Datatype recvtype, int root, MPI_Comm);

    // MPI_Alltoall
    static void audit(const gotcha_data& _data, audit::incoming, const void*,
                      int sendcount, MPI_Datatype sendtype, void*, int recvcount,
                      MPI_Datatype recvtype, MPI_Comm);
#endif

    // --- UCX communication tracking -----------------------------------------

    // ucp_tag_send_nbx - send with tag matching
    // (5 params: ep, buffer, count, tag, param)
    static void audit(const gotcha_data& _data, audit::incoming, void*, const void*,
                      size_t count, uint64_t tag, const void*);

    // ucp_tag_recv_nbx - receive with tag matching
    // (6 params: worker, buffer, count, tag, tag_mask, param)
    static void audit(const gotcha_data& _data, audit::incoming, void*, void*,
                      size_t count, uint64_t tag, uint64_t tag_mask, const void*);

    // ucp_put_nbx - RMA put operation
    // (6 params: ep, buffer, count, remote_addr, rkey, param)
    static void audit(const gotcha_data& _data, audit::incoming, void*, const void*,
                      size_t count, uint64_t remote_addr, void* rkey, const void*);

    // ucp_get_nbx - RMA get operation
    // (6 params: ep, buffer, count, remote_addr, rkey, param)
    static void audit(const gotcha_data& _data, audit::incoming, void*, void*,
                      size_t count, uint64_t remote_addr, void* rkey, const void*);

    // ucp_am_send_nbx - active message send
    // (7 params: ep, id, header, header_length, buffer, count, param)
    static void audit(const gotcha_data& _data, audit::incoming, void*, unsigned id,
                      const void* header, size_t header_length, const void* buffer,
                      size_t count, const void*);

    // ucp_stream_send_nbx - stream send
    // (4 params: ep, buffer, count, param)
    static void audit(const gotcha_data& _data, audit::incoming, void*, const void*,
                      size_t count, const void*);

    // ucp_stream_recv_nbx - stream receive
    // (5 params: ep, buffer, count, length, param)
    static void audit(const gotcha_data& _data, audit::incoming, void*, void*,
                      size_t count, size_t* length, const void*);

    // --- Legacy UCX functions (kept for compatibility) ------------------------

    // ucp_tag_send_nb/nbx - send with tag matching
    static void audit(const gotcha_data& _data, audit::incoming, void*, size_t count,
                      void*, void*, void*);

    // ucp_tag_recv_nb/nbx - receive with tag matching
    static void audit(const gotcha_data& _data, audit::incoming, void*, size_t count,
                      void*, void*, void*, void*, void*);

    // ucp_put/get operations - RMA (legacy)
    static void audit(const gotcha_data& _data, audit::incoming, void*, size_t length,
                      uint64_t, void*, void*);

    // ucp_am_send_nb/nbx - active message send (legacy)
    static void audit(const gotcha_data& _data, audit::incoming, void*, unsigned, void*,
                      size_t, void*, size_t, unsigned, void*);

    // ucp_stream_send/recv operations (legacy)
    static void audit(const gotcha_data& _data, audit::incoming, void*, void*,
                      size_t count, void*, unsigned, void*);

private:
    /// Accumulate @p value into @p _t and hand the same tracker back.
    ///
    /// When the rocprofsys state is Active the value is stored using std::plus;
    /// in any other state nothing is stored and `_t.invoke(true)` is called
    /// instead.
    static auto& add(tracker_t& _t, data_type value)
    {
        const bool _is_active =
            (rocprofsys::get_state() == rocprofsys::State::Active);
        if(_is_active)
        {
            _t.store(std::plus{}, value);
        }
        else
        {
            _t.invoke(true);
        }
        return _t;
    }

    /// Build a tracker named after `_data.tool_id` and accumulate @p value into it.
    static auto add(const gotcha_data& _data, data_type value)
    {
        tracker_t _tracker{ std::string_view{ _data.tool_id.c_str() } };
        return add(_tracker, value);
    }

    /// Build a tracker from @p _name and accumulate @p value into it.
    static auto add(std::string&& _name, data_type value)
    {
        tracker_t _tracker{ _name };
        return add(_tracker, value);
    }

    /// Build a tracker from the string view @p _name and accumulate @p value into it.
    static auto add(std::string_view _name, data_type value)
    {
        tracker_t _tracker{ _name };
        return add(_tracker, value);
    }
};
}  // namespace component
}  // namespace rocprofsys

// Extern component declarations: active when ROCPROFSYS_EXTERN_COMPONENTS is
// undefined or defined to a value greater than zero.
#if !defined(ROCPROFSYS_EXTERN_COMPONENTS) ||                                            \
    (defined(ROCPROFSYS_EXTERN_COMPONENTS) && ROCPROFSYS_EXTERN_COMPONENTS > 0)

#    include
#    include
#    include

ROCPROFSYS_DECLARE_EXTERN_COMPONENT(
    TIMEMORY_ESC(data_tracker), true, float)

ROCPROFSYS_DECLARE_EXTERN_COMPONENT(comm_data, false, void)

#endif