69b8a43dc6
* Added first ATT API * Finalizing thread trace API * Fixing more rebase conflicts * Added codeobj disassembly sample * Fixing merge issues with rebase [2] * Adding ATT packets * Implemented thread trace intercept * Moved codeobj parser to same repo as rocprofiler * Moved thread trace to new API * Fixing merge conflicts * Fixing more merge conflicts * Adding thread trace packet reuse * Merged aql_profile_v2 headers * Linked ATT sample to aqlprofile * Updated decoder to include non-loaded codeobjs * Implemented ISA decoder into ATT sample * Added marker_id to vaddr * Updating aql_profile_v2 API to memcpy * Updating thread trace API to include 64bit markers. Using the result of ISA matching. * Added instruction type and cycles summary * Updated sample with selection of kernel by kernel_object * Added option to copy from memory kernels * Moved tool_data in thread_trace to dynamic alloc * Restoring hsa.cpp * Fixed ATT sample crash. General improvements. * Moved codeobj library to outside src/ * Updated license header * Moved codeobj_capture to camelcase * Solving some more merge conflicts * Update samples/advanced_thread_trace/CMakeLists.txt Co-authored-by: github-actions[bot] <41898282+github-actions[bot]@users.noreply.github.com> * Update samples/advanced_thread_trace/CMakeLists.txt Co-authored-by: github-actions[bot] <41898282+github-actions[bot]@users.noreply.github.com> * Update samples/code_object_isa_decode/CMakeLists.txt Co-authored-by: github-actions[bot] <41898282+github-actions[bot]@users.noreply.github.com> * Update source/lib/rocprofiler-sdk/thread_trace/CMakeLists.txt * Removing unused parameter check * Adding const to isEmpty * Removing unused warning * Adding libdw-dev to requirements * Running clang-format * Commenting out new aql calls * Clang format * Unused variable fix * Adding codeobj-decoder coverage * Commenting out threadtrace * Update samples/CMakeLists.txt Co-authored-by: github-actions[bot] 
<41898282+github-actions[bot]@users.noreply.github.com> * P * WOverloaded * Addressing clang-tidy * Virtual destructor on ttracer class * Corr id * Fixing code source format * Update CMakeLists.txt * Build fixes * Update source/lib/rocprofiler-sdk-codeobj/code_object_track.cpp Co-authored-by: github-actions[bot] <41898282+github-actions[bot]@users.noreply.github.com> * Fix shadowing * Update CMakeLists.txt * Update samples/CMakeLists.txt Co-authored-by: github-actions[bot] <41898282+github-actions[bot]@users.noreply.github.com> --------- Co-authored-by: github-actions[bot] <41898282+github-actions[bot]@users.noreply.github.com> Co-authored-by: Ammar ELWazir <ammar.elwazir@amd.com> Co-authored-by: Ammar ELWazir <aelwazir@amd.com> Co-authored-by: Benjamin Welton <bewelton@amd.com>
118 خطوط
3.8 KiB
C++
118 خطوط
3.8 KiB
C++
// MIT License
|
|
//
|
|
// Copyright (c) 2023 Advanced Micro Devices, Inc. All rights reserved.
|
|
//
|
|
// Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
// of this software and associated documentation files (the "Software"), to deal
|
|
// in the Software without restriction, including without limitation the rights
|
|
// to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
// copies of the Software, and to permit persons to whom the Software is
|
|
// furnished to do so, subject to the following conditions:
|
|
//
|
|
// The above copyright notice and this permission notice shall be included in
|
|
// all copies or substantial portions of the Software.
|
|
//
|
|
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
|
// AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
// OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
|
|
// THE SOFTWARE.
|
|
|
|
#include "lib/rocprofiler-sdk/hsa/aql_packet.hpp"
|
|
#include <cstdlib>
|
|
#include <iostream>
|
|
#include <string>
|
|
|
|
/**
 * Evaluates `fn` and, when the result is not HSA_STATUS_SUCCESS, writes
 * "<file>:<line> <message>" to std::cerr and terminates the process with exit code 1.
 *
 * The body is wrapped in do { ... } while(0) so that `CHECK_HSA(...);` expands to exactly
 * one statement. This keeps the macro safe inside unbraced if/else bodies.
 */
#define CHECK_HSA(fn, message)                                                                     \
    do                                                                                             \
    {                                                                                              \
        if((fn) != HSA_STATUS_SUCCESS)                                                             \
        {                                                                                          \
            std::cerr << __FILE__ << ':' << __LINE__ << ' ' << message;                            \
            exit(1);                                                                               \
        }                                                                                          \
    } while(0)
|
|
|
|
namespace rocprofiler
|
|
{
|
|
namespace hsa
|
|
{
|
|
/**
 * Releases the command and output buffers referenced by `profile`.
 *
 * For each buffer: a null pointer means there is nothing to release. Otherwise the buffer is
 * released with ::free when its "malloced" flag is set, and through `free_func` when it is
 * not. A failing `free_func` call is reported via CHECK_HSA, which ends the process.
 */
CounterAQLPacket::~CounterAQLPacket()
{
    // Command buffer.
    if(profile.command_buffer.ptr)
    {
        if(command_buf_mallocd)
        {
            ::free(profile.command_buffer.ptr);
        }
        else
        {
            CHECK_HSA(free_func(profile.command_buffer.ptr), "freeing memory");
        }
    }

    // Output buffer.
    if(profile.output_buffer.ptr)
    {
        if(output_buffer_malloced)
        {
            ::free(profile.output_buffer.ptr);
        }
        else
        {
            CHECK_HSA(free_func(profile.output_buffer.ptr), "freeing memory");
        }
    }
}
|
|
|
|
// Defaulted destructor: no explicit cleanup is performed here. The commented-out variant
// that follows would instead call aqlprofile_att_delete_packets(this->handle).
// NOTE(review): presumably disabled until that aqlprofile call is available - confirm.
TraceAQLPacket::~TraceAQLPacket() = default;
|
|
/*
|
|
TraceAQLPacket::~TraceAQLPacket()
|
|
{
|
|
aqlprofile_att_delete_packets(this->handle);
|
|
}
|
|
*/
|
|
|
|
/**
 * Allocation callback that serves memory from the TraceMemoryPool of a TraceAQLPacket.
 *
 * @param ptr   Receives the address of the allocated buffer; must not be null.
 * @param size  Number of bytes to allocate.
 * @param flags When `host_access` is set the buffer comes from the pool's `cpu_pool_`;
 *              if `device_access` is also set, `gpu_agent` is additionally granted access.
 *              Without `host_access` the buffer comes from the pool's `gpu_pool_`.
 * @param data  Opaque user pointer; must point to the owning TraceAQLPacket.
 * @return HSA_STATUS_ERROR when an argument, the pool, or one of its required function
 *         pointers is missing; otherwise the status reported by the pool functions.
 */
hsa_status_t
TraceAQLPacket::Alloc(void** ptr, size_t size, aqlprofile_buffer_desc_flags_t flags, void* data)
{
    if(!ptr || !data) return HSA_STATUS_ERROR;

    auto* self = static_cast<TraceAQLPacket*>(data);
    if(!self->tracepool) return HSA_STATUS_ERROR;

    auto& pool = *self->tracepool;
    if(!pool.allocate_fn || !pool.free_fn || !pool.allow_access_fn) return HSA_STATUS_ERROR;

    // Device-only buffer: allocate straight from the GPU pool.
    if(!flags.host_access) return pool.allocate_fn(pool.gpu_pool_, size, 0, ptr);

    hsa_status_t status = pool.allocate_fn(pool.cpu_pool_, size, 0, ptr);
    if(status != HSA_STATUS_SUCCESS || !flags.device_access) return status;

    status = pool.allow_access_fn(1, &pool.gpu_agent, nullptr, *ptr);
    if(status != HSA_STATUS_SUCCESS)
    {
        // The caller only sees the error status, so release the buffer here rather than
        // leaking it, and do not hand back a pointer to freed memory.
        pool.free_fn(*ptr);
        *ptr = nullptr;
    }
    return status;
}
|
|
|
|
void
|
|
TraceAQLPacket::Free(void* ptr, void* data)
|
|
{
|
|
auto* pool = reinterpret_cast<TraceAQLPacket*>(data)->tracepool.get();
|
|
if(!pool || !pool->free_fn) return;
|
|
|
|
pool->free_fn(ptr);
|
|
}
|
|
|
|
/**
 * Copy callback: copies `size` bytes from `src` to `dst` through the `api_copy_fn` of the
 * packet's memory pool.
 *
 * @param dst  Destination address, forwarded to `api_copy_fn`.
 * @param src  Source address, forwarded to `api_copy_fn`.
 * @param size Number of bytes to copy.
 * @param data Opaque user pointer; expected to point to the owning TraceAQLPacket.
 * @return HSA_STATUS_ERROR when `data` is null, the packet has no pool, or the pool has no
 *         `api_copy_fn`; otherwise the status returned by `api_copy_fn`.
 */
hsa_status_t
TraceAQLPacket::Copy(void* dst, const void* src, size_t size, void* data)
{
    // Alloc() rejects a null `data`; apply the same guard here instead of dereferencing it.
    if(!data) return HSA_STATUS_ERROR;

    auto* pool = static_cast<TraceAQLPacket*>(data)->tracepool.get();
    if(!pool || !pool->api_copy_fn) return HSA_STATUS_ERROR;

    return pool->api_copy_fn(dst, src, size);
}
|
|
|
|
/**
 * Builds a trace packet that shares ownership of the given memory pool.
 *
 * @param _tracepool Pool stored in `tracepool`; the Alloc/Free/Copy callbacks read it.
 */
TraceAQLPacket::TraceAQLPacket(std::shared_ptr<TraceMemoryPool>& _tracepool)
: tracepool(_tracepool)
{}
|
|
|
|
} // namespace hsa
|
|
} // namespace rocprofiler
|