55f2dabbb3
- include/rocprofiler/agent.h
- move rocprofiler_dim3_t
- include/rocprofiler/buffer_tracing.h
- size fields
- update kernel dispatch record
- include/rocprofiler/callback_tracing.h
- remove rocprofiler_callback_tracing_code_object_unload_data_t
- remove rocprofiler_callback_tracing_code_object_register_host_kernel_symbol_data_t
- include/rocprofiler/fwd.h
- added ROCPROFILER_STATUS_ERROR_CONTEXT_CONFLICT
- remove ROCPROFILER_CALLBACK_TRACING_CODE_OBJECT_UNLOAD
- remove ROCPROFILER_CALLBACK_TRACING_CODE_OBJECT_DEVICE_KERNEL_SYMBOL_UNREGISTER
- add rocprofiler_kernel_id_t typedef
- add rocprofiler_dim3_t (moved from agent.h)
- lib/common/synchronized.hpp
- rlock/wlock return decltype(auto)
- separate prototype from definition
- lib/common/utility.{hpp,cpp}
- timestamp functions replicating HSA implementation(s)
- init_public_api_struct for setting size field and ensuring certain type traits
- simplified static_cleanup_wrapper
- separate prototype from definition in active_capacity_gate
- lib/rocprofiler/agent.cpp
- tweak get_rocprofiler_agent impl
- lib/rocprofiler/buffer.cpp
- fix buffer message log level
- lib/rocprofiler/context.cpp
- use new paradigm for getting active contexts
- lib/rocprofiler/internal_threading.hpp
- update to simplified static_cleanup_wrapper implementation
- lib/rocprofiler/registration.cpp
- fix deactivating contexts
- lib/rocprofiler/rocprofiler.cpp
- status string for context conflict
- lib/rocprofiler/context/context.*
- correlation_id struct
- new get_active_contexts paradigm
- lib/rocprofiler/counters/core.*
- rocprofiler_packet union
- tweak start/stop context to accept pointer instead of handle
- lib/rocprofiler/counters/dimensions.cpp
- update to new get_rocp_agent() return type
- lib/rocprofiler/hsa/hsa.*
- update to new get_active_contexts paradigm
- update to new correlation id implementation
- guard against hsa.def.cpp direct compilation
- lib/rocprofiler/hsa/queue_controller.*
- update to change in get_rocp_agent return type
- consistent aliases
- lookup function for getting queue pointer from hsa queue id
- lib/rocprofiler/hsa/queue.*
- rocprofiler_packet
- extend queue_info_session_t
- lib/rocprofiler/tests/registration.cpp
- improve diagnostic on perf check for rocprofiler_lib.callback_registration_lambda_with_result
84 lines
3.2 KiB
C++
84 lines
3.2 KiB
C++
// Copyright (c) 2018-2023 Advanced Micro Devices, Inc.
|
|
//
|
|
// Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
// of this software and associated documentation files (the "Software"), to deal
|
|
// in the Software without restriction, including without limitation the rights
|
|
// to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
// copies of the Software, and to permit persons to whom the Software is
|
|
// furnished to do so, subject to the following conditions:
|
|
//
|
|
// The above copyright notice and this permission notice shall be included in
|
|
// all copies or substantial portions of the Software.
|
|
//
|
|
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
|
// AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
// OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
|
|
// THE SOFTWARE.
|
|
|
|
#pragma once
|
|
|
|
#include <rocprofiler/rocprofiler.h>
|
|
|
|
#include "lib/rocprofiler/hsa/queue.hpp"
|
|
|
|
#include <cstdint>
|
|
#include <unordered_map>
|
|
#include <vector>
|
|
|
|
namespace rocprofiler
|
|
{
|
|
namespace hsa
|
|
{
|
|
// Tracks and manages HSA queues
|
|
class QueueController
|
|
{
|
|
public:
|
|
QueueController() = default;
|
|
// Initializes the QueueInterceptor. This must be delayed until
|
|
// HSA has been inited.
|
|
void init(CoreApiTable& core_table, AmdExtTable& ext_table);
|
|
|
|
// Called to add a queue that was created by the user program
|
|
void add_queue(hsa_queue_t*, std::unique_ptr<Queue>);
|
|
void destory_queue(hsa_queue_t*);
|
|
|
|
// Add callback to queues associated with the agent. Returns a client
|
|
// id that can be used by callers to remove the callback.
|
|
ClientID add_callback(const rocprofiler_agent_t&, Queue::queue_cb_t, Queue::completed_cb_t);
|
|
void remove_callback(ClientID);
|
|
|
|
const CoreApiTable& get_core_table() const { return _core_table; }
|
|
const AmdExtTable& get_ext_table() const { return _ext_table; }
|
|
|
|
// Gets the list of supported HSA agents that can be intercepted
|
|
const auto& get_supported_agents() const { return _supported_agents; }
|
|
auto& get_supported_agents() { return _supported_agents; }
|
|
|
|
const Queue* get_queue(const hsa_queue_t&) const;
|
|
|
|
private:
|
|
using agent_callback_tuple_t =
|
|
std::tuple<rocprofiler_agent_t, Queue::queue_cb_t, Queue::completed_cb_t>;
|
|
using queue_map_t = std::unordered_map<hsa_queue_t*, std::unique_ptr<Queue>>;
|
|
using client_id_map_t = std::unordered_map<ClientID, agent_callback_tuple_t>;
|
|
using agent_cache_map_t = std::unordered_map<uint32_t, AgentCache>;
|
|
|
|
CoreApiTable _core_table = {};
|
|
AmdExtTable _ext_table = {};
|
|
common::Synchronized<queue_map_t> _queues = {};
|
|
common::Synchronized<client_id_map_t> _callback_cache = {};
|
|
agent_cache_map_t _supported_agents = {};
|
|
};
|
|
|
|
// Accessor for the QueueController; hands back a mutable reference.
// NOTE(review): presumably a single process-wide instance -- confirm against
// the definition, which is not part of this header.
QueueController&
get_queue_controller();
|
|
|
|
void
|
|
queue_controller_init(HsaApiTable* table);
|
|
|
|
} // namespace hsa
|
|
} // namespace rocprofiler
|