88aa2d3cbe
- Rename the CMake option "ROCPROFSYS_USE_HIP" to "ROCPROFSYS_USE_ROCM". - Remove the "ROCPROFSYS_USE_ROCM_SMI" option; it is now controlled by the "ROCPROFSYS_USE_ROCM" option instead. - The runtime configuration can still toggle ROCPROFSYS_USE_ROCM_SMI to disable the sampling. - Rename the ROCPROFSYS_HIP_VERSION macro to ROCPROFSYS_ROCM_VERSION and remove blocks for `ROCPROFSYS_ROCM_VERSION < 60000`. - Remove ROCPROFSYS_USE_ROCTRACER and ROCPROFSYS_USE_ROCPROFILER. - Update test cases. - Update docker files and workflows to install cmake 3.21, which is required for the rocprofiler-sdk findPackage script. - Remove rocm-6.2 from workflows due to a rocprofiler-sdk API change.
136 라인
4.9 KiB
C++
136 라인
4.9 KiB
C++
// MIT License
|
|
//
|
|
// Copyright (c) 2024 Advanced Micro Devices, Inc. All Rights Reserved.
|
|
//
|
|
// Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
// of this software and associated documentation files (the "Software"), to deal
|
|
// in the Software without restriction, including without limitation the rights
|
|
// to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
// copies of the Software, and to permit persons to whom the Software is
|
|
// furnished to do so, subject to the following conditions:
|
|
//
|
|
// The above copyright notice and this permission notice shall be included in all
|
|
// copies or substantial portions of the Software.
|
|
//
|
|
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
|
// AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
// OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
|
|
// SOFTWARE.
|
|
|
|
#include "library/rocprofiler-sdk/counters.hpp"
|
|
#include "common/synchronized.hpp"
|
|
#include "core/debug.hpp"
|
|
#include "core/timemory.hpp"
|
|
#include "library/rocprofiler-sdk/fwd.hpp"
|
|
|
|
#include <timemory/utility/types.hpp>
|
|
|
|
#include <rocprofiler-sdk/agent.h>
|
|
#include <rocprofiler-sdk/buffer_tracing.h>
|
|
#include <rocprofiler-sdk/callback_tracing.h>
|
|
#include <rocprofiler-sdk/cxx/hash.hpp>
|
|
#include <rocprofiler-sdk/cxx/name_info.hpp>
|
|
#include <rocprofiler-sdk/cxx/operators.hpp>
|
|
#include <rocprofiler-sdk/dispatch_counting_service.h>
|
|
#include <rocprofiler-sdk/fwd.h>
|
|
#include <rocprofiler-sdk/registration.h>
|
|
|
|
#include <memory>
|
|
#include <unordered_map>
|
|
#include <vector>
|
|
|
|
namespace rocprofsys
|
|
{
|
|
namespace rocprofiler_sdk
|
|
{
|
|
namespace
|
|
{
|
|
std::string
|
|
get_counter_description(const client_data* tool_data, std::string_view _v)
|
|
{
|
|
const auto& _info = tool_data->events_info;
|
|
for(const auto& itr : _info)
|
|
{
|
|
if(itr.symbol().find(_v) == 0 || itr.short_description().find(_v) == 0)
|
|
{
|
|
return itr.long_description();
|
|
}
|
|
}
|
|
return std::string{};
|
|
}
|
|
} // namespace
|
|
|
|
void
|
|
counter_event::operator()(const client_data* tool_data, ::perfetto::CounterTrack* _track,
|
|
timing_interval _timing, scope::config _scope) const
|
|
{
|
|
if(!record.dispatch_data) return;
|
|
|
|
const auto& _dispatch_info = record.dispatch_data->dispatch_info;
|
|
const auto* _kern_sym_data =
|
|
tool_data->get_kernel_symbol_info(_dispatch_info.kernel_id);
|
|
|
|
auto _bundle = counter_bundle_t{ tim::demangle(_kern_sym_data->kernel_name), _scope };
|
|
|
|
_bundle.push(_dispatch_info.queue_id.handle)
|
|
.start()
|
|
.store(record.record_counter.counter_value);
|
|
|
|
_bundle.stop().pop(_dispatch_info.queue_id.handle);
|
|
|
|
if(_track && _timing.start > 0 && _timing.end > _timing.start)
|
|
{
|
|
TRACE_COUNTER(trait::name<category::rocm_counter_collection>::value, *_track,
|
|
_timing.start, record.record_counter.counter_value);
|
|
TRACE_COUNTER(trait::name<category::rocm_counter_collection>::value, *_track,
|
|
_timing.end, 0);
|
|
}
|
|
}
|
|
|
|
counter_storage::counter_storage(const client_data* _tool_data, uint64_t _devid,
|
|
size_t _idx, std::string_view _name)
|
|
: tool_data{ _tool_data }
|
|
, device_id{ _devid }
|
|
, index{ static_cast<int64_t>(_idx) }
|
|
, metric_name{ _name }
|
|
, metric_description{ get_counter_description(_tool_data, metric_name) }
|
|
{
|
|
auto _metric_name = std::string{ _name };
|
|
_metric_name =
|
|
std::regex_replace(_metric_name, std::regex{ "(.*)\\[([0-9]+)\\]" }, "$1_$2");
|
|
storage_name = JOIN('-', "rocprof", "device", device_id, _metric_name);
|
|
storage = std::make_unique<counter_storage_type>(tim::standalone_storage{}, index,
|
|
storage_name);
|
|
{
|
|
constexpr auto _unit = ::perfetto::CounterTrack::Unit::UNIT_COUNT;
|
|
track_name = JOIN(" ", "GPU", _metric_name, JOIN("", '[', device_id, ']'));
|
|
track = std::make_unique<counter_track_type>(
|
|
::perfetto::StaticString(track_name.c_str()));
|
|
track->set_is_incremental(false);
|
|
track->set_unit(_unit);
|
|
track->set_unit_multiplier(1);
|
|
}
|
|
}
|
|
|
|
void
|
|
counter_storage::operator()(const counter_event& _event, timing_interval _timing,
|
|
scope::config _scope) const
|
|
{
|
|
operation::set_storage<counter_data_tracker>{}(storage.get());
|
|
_event(tool_data, track.get(), _timing, _scope);
|
|
}
|
|
|
|
void
|
|
counter_storage::write() const
|
|
{
|
|
operation::set_storage<counter_data_tracker>{}(storage.get());
|
|
counter_data_tracker::label() = metric_name;
|
|
counter_data_tracker::description() = metric_description;
|
|
storage->write();
|
|
}
|
|
} // namespace rocprofiler_sdk
|
|
} // namespace rocprofsys
|