7b6d3c70bd
* Moved tests/apps to tests/bin * Renamed cmake project in tests/bin * Update samples - Use ROCPROFILER_DEFAULT_FAIL_REGEX - tweaks to stdout messages * Update tests - Use ROCPROFILER_DEFAULT_FAIL_REGEX * Add tests/lib - libraries with HIP code * Update PTL submodule - remove atexit delete of thread_id_map * Update cmake/rocprofiler_options.cmake - Set ROCPROFILER_DEFAULT_FAIL_REGEX * Update common lib: env + logging - improved customization of logging settings - default to disabling logging to files - install failure handler for rocprofv3 - set_env support in environment.* * Add lib/rocprofiler-sdk/shared_library.cpp - shared library constructor * Update lib/rocprofiler-sdk-tool/tool.cpp - destructor thread safety - convert callback_name_info and buffered_name_info to pointers - install failure handler for logging * Add tests/bin/hip-in-libraries - hip-in-libraries is an exe which uses two shared libraries where each shared library contains HIP kernels - used for testing deadlocking within __hipRegisterFatBinary * Update bin/rocprofv3 - reorganized the env variables - use exec to launch command - set ROCPROFILER_LIBRARY_CTOR=1 * Add tests/rocprofv3/tracing-hip-in-libraries - uses hip-in-libraries exe for exe which uses shared libraries to launch HIP kernels * Update bin/rocprofv3 - fix counter collection (no exec) * Update lib/rocprofiler-sdk-tool/tool.cpp - replace "Kernel-Name" with "Kernel_Name" * Update lib/rocprofiler-sdk/registration.cpp Use RTLD_LOCAL instead of RTLD_GLOBAL for env libraries * Update tests/rocprofv3 - replace "Kernel-Name" with "Kernel_Name" * Update tests - vector-ops (bin) stream syncs + runs with 4 queues per device - improve counter-collection/input1 validation - rocprofv3/tracing-hip-in-libraries does not do sys-trace - improved validation script for tracing-hip-in-libraries - updated dispatch_callback in json-tool.cpp following reworking of prototypes for counter collection * Update samples/counter_collection - updated dispatch_callback(s) and record_callback(s) following reworking of prototypes * Update bin/rocprofv3 - reorganized help menu - added options for sub-HSA tables - added --hip-runtime-trace - changed --hip-trace to include --hip-compiler-trace * Update lib/rocprofiler-sdk-tool - improved kernel filtering - removed arch_vgpr, accum_vgpr, sgpr code (in rocprofiler-sdk) - fixed issue with counter-collection w/o tracing - added support for fine grained HSA API tracing - removed directly linking to HSA-runtime * Update lib/rocprofiler-sdk/agent.cpp - rocp_agents != hsa_agents is non-fatal when ROCPROFILER_BUILD_CI=OFF (CMake option) * GPR (vector and scalar) info in kernel symbol data - rocprofiler_callback_tracing_code_object_kernel_symbol_register_data_t contains general purpose register info * Header include order fix - Include repo headers first - Third party library headers next - standard library headers last * Update dispatch profiling public API - introduce rocprofiler_profile_counting_dispatch_data_t - change signature of rocprofiler_profile_counting_dispatch_callback_t and rocprofiler_profile_counting_record_callback_t - provide rocprofiler_user_data_t pointer in dispatch callback - provide rocprofiler_user_data_t value (from dispatch cb) in record callback * Update tests/bin/CMakeLists.txt - fix add_subdirectory(hip-in-libraries) order * Update VERSION - bump to 0.2.0 in prep for AFAR
150 line
7.4 KiB
C
150 line
7.4 KiB
C
// MIT License
|
|
//
|
|
// Copyright (c) 2023 Advanced Micro Devices, Inc. All rights reserved.
|
|
//
|
|
// Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
// of this software and associated documentation files (the "Software"), to deal
|
|
// in the Software without restriction, including without limitation the rights
|
|
// to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
// copies of the Software, and to permit persons to whom the Software is
|
|
// furnished to do so, subject to the following conditions:
|
|
//
|
|
// The above copyright notice and this permission notice shall be included in all
|
|
// copies or substantial portions of the Software.
|
|
//
|
|
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
|
// AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
// OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
|
|
// SOFTWARE.
|
|
|
|
#pragma once
|
|
|
|
#include <rocprofiler-sdk/agent.h>
|
|
#include <rocprofiler-sdk/defines.h>
|
|
#include <rocprofiler-sdk/fwd.h>
|
|
#include <rocprofiler-sdk/hsa.h>
|
|
#include <rocprofiler-sdk/profile_config.h>
|
|
|
|
ROCPROFILER_EXTERN_C_INIT
|
|
|
|
/**
|
|
* @defgroup DISPATCH_PROFILE_COUNTING_SERVICE Dispatch Profile Counting Service
|
|
* @brief Per-dispatch hardware counter collection service
|
|
*
|
|
* @{
|
|
*/
|
|
|
|
/**
|
|
* @brief Kernel dispatch data for profile counting callbacks
|
|
*
|
|
*/
|
|
typedef struct rocprofiler_profile_counting_dispatch_data_t
|
|
{
|
|
uint64_t size; ///< Size of this struct
|
|
rocprofiler_kernel_id_t kernel_id; ///< Kernel identifier
|
|
rocprofiler_agent_id_t agent_id; ///< Agent ID where kernel is launched
|
|
rocprofiler_queue_id_t queue_id; ///< Queue ID where kernel packet is enqueued
|
|
rocprofiler_correlation_id_t correlation_id; ///< Correlation ID for this dispatch
|
|
uint32_t private_segment_size; /// runtime private memory segment size
|
|
uint32_t group_segment_size; /// runtime group memory segment size
|
|
rocprofiler_dim3_t workgroup_size; /// runtime workgroup size (grid * threads)
|
|
rocprofiler_dim3_t grid_size; /// runtime grid size
|
|
} rocprofiler_profile_counting_dispatch_data_t;
|
|
|
|
/**
|
|
* @brief Kernel Dispatch Callback. This is a callback that is invoked before the kernel
|
|
* is enqueued into the HSA queue. What counters to collect for a kernel are set
|
|
* via passing back a profile config (config) in this callback. These counters
|
|
* will be collected and emplaced in the buffer with @ref rocprofiler_buffer_id_t used when
|
|
* setting up this callback.
|
|
*
|
|
* @param [in] dispatch_data @see ::rocprofiler_profile_counting_dispatch_data_t
|
|
* @param [out] config Profile config detailing the counters to collect for this kernel
|
|
* @param [out] user_data User data unique to this dispatch. Returned in record callback
|
|
* @param [in] callback_data_args Callback supplied via buffered_dispatch_profile_counting_service
|
|
*/
|
|
typedef void (*rocprofiler_profile_counting_dispatch_callback_t)(
|
|
rocprofiler_profile_counting_dispatch_data_t dispatch_data,
|
|
rocprofiler_profile_config_id_t* config,
|
|
rocprofiler_user_data_t* user_data,
|
|
void* callback_data_args);
|
|
|
|
/**
|
|
* @brief Counting record callback. This is a callback is invoked when the kernel
|
|
* execution is complete and contains the counter profile data requested in
|
|
* @ref rocprofiler_profile_counting_dispatch_callback_t. Only used with
|
|
* @ref rocprofiler_configure_callback_dispatch_profile_counting_service.
|
|
*
|
|
* @param [in] dispatch_data @see ::rocprofiler_profile_counting_dispatch_data_t
|
|
* @param [in] record_data Counter record data.
|
|
* @param [in] record_count Number of counter records.
|
|
* @param [in] user_data User data instance from dispatch callback
|
|
* @param [in] callback_data_args Callback supplied via buffered_dispatch_profile_counting_service
|
|
*/
|
|
typedef void (*rocprofiler_profile_counting_record_callback_t)(
|
|
rocprofiler_profile_counting_dispatch_data_t dispatch_data,
|
|
rocprofiler_record_counter_t* record_data,
|
|
size_t record_count,
|
|
rocprofiler_user_data_t user_data,
|
|
void* callback_data_args);
|
|
|
|
/**
|
|
* @brief Configure buffered dispatch profile Counting Service.
|
|
* Collects the counters in dispatch packets and stores them
|
|
* in a buffer with @p buffer_id. The buffer may contain packets from more than
|
|
* one dispatch (denoted by correlation id). Will trigger the
|
|
* callback based on the parameters setup in buffer_id_t.
|
|
*
|
|
* NOTE: Interface is up for comment as to whether restrictions
|
|
* on agent should be made here (limiting the CB based on agent)
|
|
* or if the restriction should be performed by the tool in
|
|
* @ref rocprofiler_profile_counting_dispatch_callback_t (i.e.
|
|
* tool code checking the agent param to see if they want to profile
|
|
* it).
|
|
*
|
|
* Interface is up for comment as to whether restrictions
|
|
* on agent should be made here (limiting the CB based on agent)
|
|
* or if the restriction should be performed by the tool in
|
|
* @ref rocprofiler_profile_counting_dispatch_callback_t (i.e.
|
|
* tool code checking the agent param to see if they want to profile
|
|
* it).
|
|
*
|
|
* @param [in] context_id context id
|
|
* @param [in] buffer_id id of the buffer to use for the counting service
|
|
* @param [in] callback callback to perform when dispatch is enqueued
|
|
* @param [in] callback_data_args callback data
|
|
* @return ::rocprofiler_status_t
|
|
*/
|
|
rocprofiler_status_t ROCPROFILER_API
|
|
rocprofiler_configure_buffered_dispatch_profile_counting_service(
|
|
rocprofiler_context_id_t context_id,
|
|
rocprofiler_buffer_id_t buffer_id,
|
|
rocprofiler_profile_counting_dispatch_callback_t callback,
|
|
void* callback_data_args);
|
|
|
|
/**
|
|
* @brief Configure buffered dispatch profile Counting Service.
|
|
* Collects the counters in dispatch packets and calls a callback
|
|
* with the counters collected during that dispatch.
|
|
*
|
|
* @param [in] context_id context id
|
|
* @param [in] dispatch_callback callback to perform when dispatch is enqueued
|
|
* @param [in] dispatch_callback_args callback data for dispatch callback
|
|
* @param [in] record_callback Record callback for completed profile data
|
|
* @param [in] record_callback_args Callback args for record callback
|
|
* @return ::rocprofiler_status_t
|
|
*/
|
|
rocprofiler_status_t ROCPROFILER_API
|
|
rocprofiler_configure_callback_dispatch_profile_counting_service(
|
|
rocprofiler_context_id_t context_id,
|
|
rocprofiler_profile_counting_dispatch_callback_t dispatch_callback,
|
|
void* dispatch_callback_args,
|
|
rocprofiler_profile_counting_record_callback_t record_callback,
|
|
void* record_callback_args);
|
|
/** @} */
|
|
|
|
ROCPROFILER_EXTERN_C_FINI
|