69b8a43dc6
* Added first ATT API * Finalizing thread trace API * Fixing more rebase conflicts * Added codeobj disassembly sample * Fixing merge issues with rebase [2] * Adding ATT packets * Implemented thread trace intercept * Moved codeobj parser to same repo as rocprofiler * Moved thread trace to new API * Fixing merge conflicts * Fixing more merge conflicts * Adding thread trace packet reuse * Merged aql_profile_v2 headers * Linked ATT sample to aqlprofile * Updated decoder to include non-loaded codeobjs * Implemented ISA decoder into ATT sample * Added marker_id to vaddr * Updating aql_profile_v2 API to memcpy * Updating thread trace API to include 64bit markers. Using the result of ISA matching. * Added instruction type and cycles summary * Updated sample with selection of kernel by kernel_object * Added option to copy from memory kernels * Moved tool_data in thread_trace to dynamic alloc * Restoring hsa.cpp * Fixed ATT sample crash. General improvements. * Moved codeobj library to outside src/ * Updated license header * Moved codeobj_capture to camelcase * Solving some more merge conflicts * Update samples/advanced_thread_trace/CMakeLists.txt Co-authored-by: github-actions[bot] <41898282+github-actions[bot]@users.noreply.github.com> * Update samples/advanced_thread_trace/CMakeLists.txt Co-authored-by: github-actions[bot] <41898282+github-actions[bot]@users.noreply.github.com> * Update samples/code_object_isa_decode/CMakeLists.txt Co-authored-by: github-actions[bot] <41898282+github-actions[bot]@users.noreply.github.com> * Update source/lib/rocprofiler-sdk/thread_trace/CMakeLists.txt * Removing unused parameter check * Adding const to isEmpty * Removing unused warning * Adding libdw-dev to requirements * Running clang-format * Commenting out new aql calls * Clang format * Unused variable fix * Adding codeobj-decoder coverage * Commenting out threadtrace * Update samples/CMakeLists.txt Co-authored-by: github-actions[bot] <41898282+github-actions[bot]@users.noreply.github.com> * P * WOverloaded * Addressing clang-tidy * Virtual destructor on ttracer class * Corr id * Fixing code source format * Update CMakeLists.txt * Build fixes * Update source/lib/rocprofiler-sdk-codeobj/code_object_track.cpp Co-authored-by: github-actions[bot] <41898282+github-actions[bot]@users.noreply.github.com> * Fix shadowing * Update CMakeLists.txt * Update samples/CMakeLists.txt Co-authored-by: github-actions[bot] <41898282+github-actions[bot]@users.noreply.github.com> --------- Co-authored-by: github-actions[bot] <41898282+github-actions[bot]@users.noreply.github.com> Co-authored-by: Ammar ELWazir <ammar.elwazir@amd.com> Co-authored-by: Ammar ELWazir <aelwazir@amd.com> Co-authored-by: Benjamin Welton <bewelton@amd.com>
141 行
5.1 KiB
C++
141 行
5.1 KiB
C++
// MIT License
|
|
//
|
|
// Copyright (c) 2023 Advanced Micro Devices, Inc. All rights reserved.
|
|
//
|
|
// Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
// of this software and associated documentation files (the "Software"), to deal
|
|
// in the Software without restriction, including without limitation the rights
|
|
// to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
// copies of the Software, and to permit persons to whom the Software is
|
|
// furnished to do so, subject to the following conditions:
|
|
//
|
|
// The above copyright notice and this permission notice shall be included in all
|
|
// copies or substantial portions of the Software.
|
|
//
|
|
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
|
// AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
// OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
|
|
// SOFTWARE.
|
|
|
|
#include "dimensions.hpp"
|
|
|
|
#include <cstdint>
|
|
#include <memory>
|
|
#include <unordered_map>
|
|
#include <vector>
|
|
|
|
#include <fmt/core.h>
|
|
|
|
#include "lib/common/static_object.hpp"
|
|
#include "lib/common/synchronized.hpp"
|
|
#include "lib/common/utility.hpp"
|
|
#include "lib/rocprofiler-sdk/aql/helpers.hpp"
|
|
#include "lib/rocprofiler-sdk/aql/packet_construct.hpp"
|
|
#include "lib/rocprofiler-sdk/counters/evaluate_ast.hpp"
|
|
#include "lib/rocprofiler-sdk/hsa/queue_controller.hpp"
|
|
|
|
namespace rocprofiler
|
|
{
|
|
namespace counters
|
|
{
|
|
std::vector<MetricDimension>
|
|
getBlockDimensions(std::string_view agent, const Metric& metric)
|
|
{
|
|
if(!metric.special().empty())
|
|
{
|
|
// Special non-hardware counters without dimension data
|
|
return std::vector<MetricDimension>{{dimension_map().at(ROCPROFILER_DIMENSION_INSTANCE),
|
|
1,
|
|
ROCPROFILER_DIMENSION_INSTANCE}};
|
|
}
|
|
|
|
std::unordered_map<rocprofiler_profile_counter_instance_types, uint64_t> count;
|
|
|
|
std::vector<MetricDimension> ret;
|
|
|
|
for(const auto& [_, maybe_agent] :
|
|
CHECK_NOTNULL(hsa::get_queue_controller())->get_supported_agents())
|
|
{
|
|
if(maybe_agent.name() == agent)
|
|
{
|
|
aql::CounterPacketConstruct pkt_gen(maybe_agent, {metric});
|
|
const auto& events = pkt_gen.get_counter_events(metric);
|
|
|
|
for(const auto& event : events)
|
|
{
|
|
std::map<int, uint64_t> dims;
|
|
auto status = aql::get_dim_info(maybe_agent.get_hsa_agent(), event, 0, dims);
|
|
CHECK_EQ(status, ROCPROFILER_STATUS_SUCCESS)
|
|
<< rocprofiler_get_status_string(status);
|
|
|
|
for(const auto& [id, extent] : dims)
|
|
{
|
|
if(const auto* inst_type =
|
|
rocprofiler::common::get_val(aqlprofile_id_to_rocprof_instance(), id))
|
|
{
|
|
count.emplace(*inst_type, 0).first->second = extent;
|
|
}
|
|
else
|
|
{
|
|
ROCP_ERROR << "Unknown AQL Profiler Dimension " << id << " " << extent;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
ret.reserve(count.size());
|
|
for(const auto& [dim, size] : count)
|
|
{
|
|
ret.emplace_back(dimension_map().at(dim), size, dim);
|
|
}
|
|
|
|
return ret;
|
|
}
|
|
|
|
const std::unordered_map<uint64_t, std::vector<MetricDimension>>&
|
|
get_dimension_cache()
|
|
{
|
|
static auto*& cache =
|
|
common::static_object<std::unordered_map<uint64_t, std::vector<MetricDimension>>>::
|
|
construct([]() -> std::unordered_map<uint64_t, std::vector<MetricDimension>> {
|
|
std::unordered_map<uint64_t, std::vector<MetricDimension>> dims;
|
|
/**
|
|
* Fails if HSA is not loaded by retruning nothing. This should not remain after
|
|
* AQL is transistioned away from HSA.
|
|
*/
|
|
if(CHECK_NOTNULL(rocprofiler::hsa::get_queue_controller())
|
|
->get_supported_agents()
|
|
.empty())
|
|
{
|
|
return {};
|
|
}
|
|
|
|
const auto& asts = counters::get_ast_map();
|
|
for(const auto& [gfx, metrics] : asts)
|
|
{
|
|
for(const auto& [metric, ast] : metrics)
|
|
{
|
|
auto ast_copy = ast;
|
|
try
|
|
{
|
|
dims.emplace(ast.out_id().handle, ast_copy.set_dimensions());
|
|
} catch(std::runtime_error& e)
|
|
{
|
|
ROCP_ERROR << metric << " has improper dimensions"
|
|
<< " " << e.what();
|
|
throw;
|
|
}
|
|
}
|
|
}
|
|
return dims;
|
|
}());
|
|
return *cache;
|
|
}
|
|
|
|
} // namespace counters
|
|
} // namespace rocprofiler
|