956a73c4c8
## Motivation With the introduction of the new logging system base on `spdlog` library, opportunity shows to replace `timemory` dependent JOIN implementation with `fmt` library `format` and `join` APIs, which are shipped as a part of `spdlog` lib ## Technical Details Use `fmt` provided APIs to properly format and package strings.
281 rinda
10 KiB
C++
281 rinda
10 KiB
C++
// MIT License
|
|
//
|
|
// Copyright (c) 2025 Advanced Micro Devices, Inc. All Rights Reserved.
|
|
//
|
|
// Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
// of this software and associated documentation files (the "Software"), to deal
|
|
// in the Software without restriction, including without limitation the rights
|
|
// to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
// copies of the Software, and to permit persons to whom the Software is
|
|
// furnished to do so, subject to the following conditions:
|
|
//
|
|
// The above copyright notice and this permission notice shall be included in all
|
|
// copies or substantial portions of the Software.
|
|
//
|
|
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
|
// AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
// OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
|
|
// SOFTWARE.
|
|
|
|
#include "library/rocprofiler-sdk/fwd.hpp"
|
|
#include "core/state.hpp"
|
|
|
|
#include "logger/debug.hpp"
|
|
|
|
#include <exception>
|
|
#include <rocprofiler-sdk/agent.h>
|
|
#include <rocprofiler-sdk/cxx/name_info.hpp>
|
|
#include <rocprofiler-sdk/fwd.h>
|
|
#include <rocprofiler-sdk/rocprofiler.h>
|
|
|
|
#include <spdlog/fmt/ranges.h>
|
|
|
|
#include <algorithm>
|
|
#include <utility>
|
|
|
|
namespace rocprofsys
|
|
{
|
|
namespace rocprofiler_sdk
|
|
{
|
|
namespace
|
|
{
|
|
using tool_agent_vec_t = std::vector<tool_agent>;
|
|
|
|
rocprofiler_status_t
|
|
dimensions_info_callback(rocprofiler_counter_id_t /*id*/,
|
|
const rocprofiler_record_dimension_info_t* dim_info,
|
|
long unsigned int num_dims, void* user_data)
|
|
{
|
|
auto* dimensions_info =
|
|
static_cast<std::vector<rocprofiler_record_dimension_info_t>*>(user_data);
|
|
dimensions_info->reserve(num_dims);
|
|
for(size_t j = 0; j < num_dims; j++)
|
|
dimensions_info->emplace_back(dim_info[j]);
|
|
|
|
return ROCPROFILER_STATUS_SUCCESS;
|
|
}
|
|
|
|
rocprofiler_status_t
|
|
counters_supported_callback(rocprofiler_agent_id_t agent_id,
|
|
rocprofiler_counter_id_t* counters, size_t num_counters,
|
|
void* user_data)
|
|
{
|
|
using value_type = typename agent_counter_info_map_t::mapped_type;
|
|
|
|
auto* data_v = static_cast<agent_counter_info_map_t*>(user_data);
|
|
data_v->emplace(agent_id, value_type{});
|
|
for(size_t i = 0; i < num_counters; ++i)
|
|
{
|
|
auto _info = rocprofiler_counter_info_v0_t{};
|
|
auto _dim_info = std::vector<rocprofiler_record_dimension_info_t>{};
|
|
|
|
ROCPROFILER_CALL(rocprofiler_query_counter_info(
|
|
counters[i], ROCPROFILER_COUNTER_INFO_VERSION_0, &_info));
|
|
|
|
// populate local vector
|
|
ROCPROFILER_CALL(rocprofiler_iterate_counter_dimensions(
|
|
counters[i], dimensions_info_callback, &_dim_info));
|
|
|
|
if(!_info.is_constant)
|
|
data_v->at(agent_id).emplace_back(agent_id, _info, std::move(_dim_info));
|
|
}
|
|
return ROCPROFILER_STATUS_SUCCESS;
|
|
}
|
|
|
|
agent_counter_info_map_t
|
|
get_agent_counter_info(const tool_agent_vec_t& _agents)
|
|
{
|
|
auto _data = agent_counter_info_map_t{};
|
|
|
|
for(auto itr : _agents)
|
|
{
|
|
const auto& _agent_id = rocprofiler_agent_id_t{ itr.agent->handle };
|
|
|
|
auto status = rocprofiler_iterate_agent_supported_counters(
|
|
_agent_id, counters_supported_callback, &_data);
|
|
|
|
if(status != ROCPROFILER_STATUS_SUCCESS)
|
|
{
|
|
LOG_WARNING(
|
|
"rocprofiler_iterate_agent_supported_counters failed for agent {} "
|
|
"with status {} (Agent HW architecture may not be supported)",
|
|
_agent_id.handle, static_cast<int>(status));
|
|
// Skip processing for this agent if it's not supported
|
|
continue;
|
|
}
|
|
|
|
// Only process if the agent was successfully added to the map
|
|
auto agent_it = _data.find(_agent_id);
|
|
if(agent_it != _data.end())
|
|
{
|
|
std::sort(agent_it->second.begin(), agent_it->second.end(),
|
|
[](const auto& lhs, const auto& rhs) {
|
|
return (lhs.id.handle < rhs.id.handle);
|
|
});
|
|
|
|
for(auto& citr : agent_it->second)
|
|
{
|
|
std::sort(
|
|
citr.dimension_info.begin(), citr.dimension_info.end(),
|
|
[](const auto& lhs, const auto& rhs) { return (lhs.id < rhs.id); });
|
|
}
|
|
}
|
|
}
|
|
|
|
return _data;
|
|
}
|
|
} // namespace
|
|
|
|
rocprofiler_tool_counter_info_t::rocprofiler_tool_counter_info_t(
|
|
rocprofiler_agent_id_t _agent_id, parent_type _info, dimension_info_vec_t&& _dim_info)
|
|
: parent_type{ _info }
|
|
, agent_id{ _agent_id }
|
|
, dimension_info{ std::move(_dim_info) }
|
|
{}
|
|
|
|
void
|
|
client_data::initialize()
|
|
{
|
|
buffered_tracing_info = rocprofiler::sdk::get_buffer_tracing_names();
|
|
callback_tracing_info = rocprofiler::sdk::get_callback_tracing_names();
|
|
|
|
set_agents();
|
|
}
|
|
|
|
void
|
|
client_data::initialize_event_info()
|
|
{
|
|
auto& agent_mngr = get_agent_manager_instance();
|
|
|
|
if(agent_mngr.get_agents().empty())
|
|
{
|
|
initialize();
|
|
}
|
|
else if(gpu_agents.empty() && cpu_agents.empty())
|
|
{
|
|
set_agents();
|
|
}
|
|
|
|
if(agent_counter_info.size() != gpu_agents.size())
|
|
agent_counter_info = get_agent_counter_info(gpu_agents);
|
|
|
|
try
|
|
{
|
|
using qualifier_t = tim::hardware_counters::qualifier;
|
|
using qualifier_vec_t = std::vector<qualifier_t>;
|
|
|
|
for(const auto& aitr : gpu_agents)
|
|
{
|
|
auto _dev_index = aitr.device_id;
|
|
const auto& _agent_id = rocprofiler_agent_id_t{ aitr.agent->handle };
|
|
auto _device_qualifier_sym = fmt::format(":device={}", _dev_index);
|
|
auto _device_qualifier =
|
|
tim::hardware_counters::qualifier{ true, static_cast<int>(_dev_index),
|
|
_device_qualifier_sym,
|
|
fmt::format("Device {}", _dev_index) };
|
|
|
|
// Check if agent info is available ( i.e., counters are supported)
|
|
auto agent_info_it = agent_counter_info.find(_agent_id);
|
|
if(agent_info_it == agent_counter_info.end())
|
|
{
|
|
LOG_WARNING("Skipping GPU device {} ({}, handle=0x{:X}) due to "
|
|
"counter not found for the specified architecture",
|
|
_dev_index, aitr.agent->name, aitr.agent->handle);
|
|
continue;
|
|
}
|
|
|
|
auto _counter_info = agent_info_it->second;
|
|
std::sort(_counter_info.begin(), _counter_info.end(),
|
|
[](const rocprofiler_tool_counter_info_t& lhs,
|
|
const rocprofiler_tool_counter_info_t& rhs) {
|
|
if(lhs.is_constant && rhs.is_constant)
|
|
return lhs.id < rhs.id;
|
|
else if(lhs.is_constant)
|
|
return true;
|
|
else if(rhs.is_constant)
|
|
return false;
|
|
|
|
if(!lhs.is_derived && !rhs.is_derived)
|
|
return lhs.id < rhs.id;
|
|
else if(!lhs.is_derived)
|
|
return true;
|
|
else if(!rhs.is_derived)
|
|
return false;
|
|
|
|
return lhs.id < rhs.id;
|
|
});
|
|
|
|
for(const auto& ditr : _counter_info)
|
|
{
|
|
auto _long_desc = std::string{ ditr.description };
|
|
auto _units = std::string{};
|
|
auto _pysym = std::string{};
|
|
if(ditr.is_constant)
|
|
{
|
|
continue;
|
|
}
|
|
else if(ditr.is_derived)
|
|
{
|
|
auto _sym = fmt::format("{}:device={}", ditr.name, _dev_index);
|
|
auto _short_desc =
|
|
fmt::format("Derived counter: {}", ditr.expression);
|
|
events_info.emplace_back(hardware_counter_info(
|
|
true, tim::hardware_counters::api::rocm, events_info.size(), 0,
|
|
_sym, _pysym, _short_desc, _long_desc, _units,
|
|
qualifier_vec_t{ _device_qualifier }));
|
|
}
|
|
else
|
|
{
|
|
auto _dim_info = std::vector<std::string>{};
|
|
|
|
for(const auto& itr : ditr.dimension_info)
|
|
{
|
|
auto _info =
|
|
(itr.instance_size > 1)
|
|
? fmt::format("{}[0:{}]", itr.name, itr.instance_size - 1)
|
|
: std::string{};
|
|
if(!_info.empty()) _dim_info.emplace_back(_info);
|
|
}
|
|
|
|
auto _sym = fmt::format("{}:device={}", ditr.name, _dev_index);
|
|
auto _short_desc =
|
|
fmt::format("{} on device {}", ditr.name, _dev_index);
|
|
if(!_dim_info.empty())
|
|
{
|
|
_short_desc += fmt::format("{}", fmt::join(_dim_info, ". "));
|
|
}
|
|
events_info.emplace_back(hardware_counter_info(
|
|
true, tim::hardware_counters::api::rocm, events_info.size(), 0,
|
|
_sym, _pysym, _short_desc, _long_desc, _units,
|
|
qualifier_vec_t{ _device_qualifier }));
|
|
}
|
|
}
|
|
}
|
|
} catch(std::exception& _e)
|
|
{
|
|
LOG_WARNING("Constructing ROCm event info failed: {}", _e.what());
|
|
}
|
|
}
|
|
|
|
void
|
|
client_data::set_agents()
|
|
{
|
|
auto& agent_mngr = get_agent_manager_instance();
|
|
|
|
auto fill_agents = [&](agent_type type, std::vector<tool_agent>& out) {
|
|
const auto& _agents = agent_mngr.get_agents_by_type(type);
|
|
for(const auto& agent : _agents)
|
|
{
|
|
out.emplace_back(tool_agent{ agent->device_type_index, agent.get() });
|
|
}
|
|
};
|
|
|
|
fill_agents(agent_type::GPU, gpu_agents);
|
|
fill_agents(agent_type::CPU, cpu_agents);
|
|
}
|
|
} // namespace rocprofiler_sdk
|
|
} // namespace rocprofsys
|