69b8a43dc6
* Added first ATT API * Finalizing thread trace API * Fixing more rebase conflicts * Added codeobj disassembly sample * Fixing merge issues with rebase [2] * Adding ATT packets * Implemented thread trace intercept * Moved codeobj parser to same repo as rocprofiler * Moved thread trace to new API * Fixing merge conflicts * Fixing more merge conflicts * Adding thread trace packet reuse * Merged aql_profile_v2 headers * Linked ATT sample to aqlprofile * Updated decoder to include non-loaded codeobjs * Implemented ISA decoder into ATT sample * Added marker_id to vaddr * Updating aql_profile_v2 API to memcpy * Updating thread trace API to include 64bit markers. Using the result of ISA matching. * Added instruction type and cycles summary * Updated sample with selection of kernel by kernel_object * Added option to copy from memory kernels * Moved tool_data in thread_trace to dynamic alloc * Restoring hsa.cpp * Fixed ATT sample crash. General improvements. * Moved codeobj library to outside src/ * Updated license header * Moved codeobj_capture to camelcase * Solving some more merge conflicts * Update samples/advanced_thread_trace/CMakeLists.txt Co-authored-by: github-actions[bot] <41898282+github-actions[bot]@users.noreply.github.com> * Update samples/advanced_thread_trace/CMakeLists.txt Co-authored-by: github-actions[bot] <41898282+github-actions[bot]@users.noreply.github.com> * Update samples/code_object_isa_decode/CMakeLists.txt Co-authored-by: github-actions[bot] <41898282+github-actions[bot]@users.noreply.github.com> * Update source/lib/rocprofiler-sdk/thread_trace/CMakeLists.txt * Removing unused parameter check * Adding const to isEmpty * Removing unused warning * Adding libdw-dev to requirements * Running clang-format * Commenting out new aql calls * Clang format * Unused variable fix * Adding codeobj-decoder coverage * Commenting out threadtrace * Update samples/CMakeLists.txt Co-authored-by: github-actions[bot] <41898282+github-actions[bot]@users.noreply.github.com> * P * WOverloaded * Addressing clang-tidy * Virtual destructor on ttracer class * Corr id * Fixing code source format * Update CMakeLists.txt * Build fixes * Update source/lib/rocprofiler-sdk-codeobj/code_object_track.cpp Co-authored-by: github-actions[bot] <41898282+github-actions[bot]@users.noreply.github.com> * Fix shadowing * Update CMakeLists.txt * Update samples/CMakeLists.txt Co-authored-by: github-actions[bot] <41898282+github-actions[bot]@users.noreply.github.com> --------- Co-authored-by: github-actions[bot] <41898282+github-actions[bot]@users.noreply.github.com> Co-authored-by: Ammar ELWazir <ammar.elwazir@amd.com> Co-authored-by: Ammar ELWazir <aelwazir@amd.com> Co-authored-by: Benjamin Welton <bewelton@amd.com>
82 linhas
3.8 KiB
C++
82 linhas
3.8 KiB
C++
// MIT License
|
|
//
|
|
// Copyright (c) 2024 Advanced Micro Devices, Inc. All rights reserved.
|
|
//
|
|
// Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
// of this software and associated documentation files (the "Software"), to deal
|
|
// in the Software without restriction, including without limitation the rights
|
|
// to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
// copies of the Software, and to permit persons to whom the Software is
|
|
// furnished to do so, subject to the following conditions:
|
|
//
|
|
// The above copyright notice and this permission notice shall be included in all
|
|
// copies or substantial portions of the Software.
|
|
//
|
|
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
|
// AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
// OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
|
|
// SOFTWARE.
|
|
|
|
#include <rocprofiler-sdk/rocprofiler.h>
|
|
|
|
#include "lib/rocprofiler-sdk/aql/helpers.hpp"
|
|
#include "lib/rocprofiler-sdk/context/context.hpp"
|
|
#include "lib/rocprofiler-sdk/hsa/agent_cache.hpp"
|
|
|
|
extern "C" {
|
|
/**
|
|
* @brief Configure buffered dispatch profile Counting Service.
|
|
* Collects the counters in dispatch packets and stores them
|
|
* in buffer_id. The buffer may contain packets from more than
|
|
* one dispatch (denoted by correlation id). Will trigger the
|
|
* callback based on the parameters setup in buffer_id_t.
|
|
*
|
|
* @param [in] context_id context id
|
|
* @param [in] buffer_id id of the buffer to use for the counting service
|
|
* @param [in] profile profile config to use for dispatch
|
|
* @return ::rocprofiler_status_t
|
|
*/
|
|
rocprofiler_status_t ROCPROFILER_API
|
|
rocprofiler_configure_thread_trace_service(rocprofiler_context_id_t context_id,
|
|
rocprofiler_att_parameters_t parameters,
|
|
rocprofiler_att_dispatch_callback_t dispatch_callback,
|
|
rocprofiler_att_shader_data_callback_t shader_callback,
|
|
void* callback_userdata)
|
|
{
|
|
auto* ctx = rocprofiler::context::get_mutable_registered_context(context_id);
|
|
if(!ctx) return ROCPROFILER_STATUS_ERROR_CONTEXT_NOT_STARTED;
|
|
if(ctx->thread_trace) return ROCPROFILER_STATUS_ERROR_SERVICE_ALREADY_CONFIGURED;
|
|
if(parameters.flags.raw != 0) return ROCPROFILER_STATUS_ERROR_NOT_IMPLEMENTED;
|
|
|
|
auto thread_tracer = std::make_shared<rocprofiler::thread_trace_parameters>();
|
|
|
|
thread_tracer->context_id = context_id;
|
|
thread_tracer->dispatch_cb_fn = dispatch_callback;
|
|
thread_tracer->shader_cb_fn = shader_callback;
|
|
thread_tracer->callback_userdata = callback_userdata;
|
|
|
|
thread_tracer->flags = parameters.flags;
|
|
thread_tracer->buffer_size = parameters.buffer_size;
|
|
thread_tracer->target_cu = parameters.target_cu;
|
|
thread_tracer->simd_select = parameters.simd_select;
|
|
thread_tracer->vmid_mask = parameters.vmid_mask;
|
|
|
|
thread_tracer->perfcounter_mask = parameters.perfcounter_mask;
|
|
thread_tracer->perfcounter_ctrl = parameters.perfcounter_ctrl;
|
|
|
|
for(int i = 0; i < parameters.perfcounter_num; i++)
|
|
thread_tracer->perfcounters.emplace_back(parameters.perfcounter[i]);
|
|
|
|
thread_tracer->shader_engine_mask = 0;
|
|
for(int i = 0; i < parameters.shader_num; i++)
|
|
thread_tracer->shader_engine_mask |= 1ul << parameters.shader_ids[i];
|
|
|
|
ctx->thread_trace = std::make_shared<rocprofiler::ThreadTracer>(thread_tracer);
|
|
|
|
return ROCPROFILER_STATUS_SUCCESS;
|
|
}
|
|
}
|