2023-11-14 10:58:33 -06:00
|
|
|
// MIT License
|
|
|
|
|
//
|
2025-01-23 06:41:20 +05:30
|
|
|
// Copyright (c) 2023-2025 Advanced Micro Devices, Inc. All rights reserved.
|
2023-10-18 23:15:56 -05:00
|
|
|
//
|
|
|
|
|
// Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
|
|
|
// of this software and associated documentation files (the "Software"), to deal
|
|
|
|
|
// in the Software without restriction, including without limitation the rights
|
|
|
|
|
// to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
|
|
|
// copies of the Software, and to permit persons to whom the Software is
|
|
|
|
|
// furnished to do so, subject to the following conditions:
|
|
|
|
|
//
|
|
|
|
|
// The above copyright notice and this permission notice shall be included in
|
|
|
|
|
// all copies or substantial portions of the Software.
|
|
|
|
|
//
|
|
|
|
|
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
|
|
|
// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
|
|
|
// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
|
|
|
|
// AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
|
|
|
// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
|
|
|
// OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
|
|
|
|
|
// THE SOFTWARE.
|
|
|
|
|
|
|
|
|
|
#pragma once
|
|
|
|
|
|
2023-11-29 20:43:18 -06:00
|
|
|
#include <rocprofiler-sdk/rocprofiler.h>
|
2024-10-25 13:13:36 -07:00
|
|
|
#include <rocprofiler-sdk/cxx/hash.hpp>
|
2023-10-18 23:15:56 -05:00
|
|
|
|
2024-03-08 07:02:43 -08:00
|
|
|
#include "lib/rocprofiler-sdk/hsa/profile_serializer.hpp"
|
2023-11-29 20:43:18 -06:00
|
|
|
#include "lib/rocprofiler-sdk/hsa/queue.hpp"
|
2023-10-18 23:15:56 -05:00
|
|
|
|
|
|
|
|
#include <cstdint>
|
2024-01-24 16:32:54 -06:00
|
|
|
#include <functional>
|
2023-11-17 01:49:51 -08:00
|
|
|
#include <optional>
|
2023-10-18 23:15:56 -05:00
|
|
|
#include <unordered_map>
|
|
|
|
|
#include <vector>
|
|
|
|
|
|
|
|
|
|
namespace rocprofiler
|
|
|
|
|
{
|
|
|
|
|
namespace hsa
|
|
|
|
|
{
|
|
|
|
|
// Tracks and manages HSA queues
|
|
|
|
|
class QueueController
|
|
|
|
|
{
|
|
|
|
|
public:
|
2024-02-07 20:03:21 -08:00
|
|
|
using agent_callback_tuple_t =
|
|
|
|
|
std::tuple<rocprofiler_agent_t, Queue::queue_cb_t, Queue::completed_cb_t>;
|
|
|
|
|
using queue_iterator_cb_t = std::function<void(const Queue*)>;
|
|
|
|
|
using callback_iterator_cb_t = std::function<void(ClientID, const agent_callback_tuple_t&)>;
|
2024-03-08 07:02:43 -08:00
|
|
|
using queue_map_t = std::unordered_map<hsa_queue_t*, std::unique_ptr<Queue>>;
|
2024-10-21 10:41:29 -07:00
|
|
|
using agent_cache_map_t = std::unordered_map<uint32_t, AgentCache>;
|
2024-01-24 16:32:54 -06:00
|
|
|
|
2024-10-24 20:37:05 -03:00
|
|
|
QueueController() = default;
|
|
|
|
|
~QueueController() = default;
|
2023-10-18 23:15:56 -05:00
|
|
|
// Initializes the QueueInterceptor. This must be delayed until
|
|
|
|
|
// HSA has been inited.
|
|
|
|
|
void init(CoreApiTable& core_table, AmdExtTable& ext_table);
|
|
|
|
|
|
|
|
|
|
// Called to add a queue that was created by the user program
|
|
|
|
|
void add_queue(hsa_queue_t*, std::unique_ptr<Queue>);
|
2024-03-01 01:46:07 -06:00
|
|
|
void destroy_queue(hsa_queue_t*);
|
2023-10-18 23:15:56 -05:00
|
|
|
|
|
|
|
|
// Add callback to queues associated with the agent. Returns a client
|
2023-11-17 01:49:51 -08:00
|
|
|
// id that can be used by callers to remove the callback. If no agent
|
|
|
|
|
// is specified, callback will be applied to all agents.
|
|
|
|
|
ClientID add_callback(std::optional<rocprofiler_agent_t>,
|
|
|
|
|
Queue::queue_cb_t,
|
|
|
|
|
Queue::completed_cb_t);
|
2023-10-18 23:15:56 -05:00
|
|
|
void remove_callback(ClientID);
|
|
|
|
|
|
|
|
|
|
const CoreApiTable& get_core_table() const { return _core_table; }
|
|
|
|
|
const AmdExtTable& get_ext_table() const { return _ext_table; }
|
|
|
|
|
|
2024-03-08 07:02:43 -08:00
|
|
|
// Gets the list of supported HSA agents that can be Pintercepted
|
2024-10-21 10:41:29 -07:00
|
|
|
const agent_cache_map_t& get_supported_agents() const;
|
|
|
|
|
|
|
|
|
|
agent_cache_map_t& get_supported_agents();
|
2023-10-18 23:15:56 -05:00
|
|
|
|
2023-11-06 21:59:31 -06:00
|
|
|
const Queue* get_queue(const hsa_queue_t&) const;
|
|
|
|
|
|
2024-01-24 16:32:54 -06:00
|
|
|
void iterate_queues(const queue_iterator_cb_t&) const;
|
2024-02-05 12:42:59 -06:00
|
|
|
void set_queue_state(queue_state state, hsa_queue_t* hsa_queue);
|
2024-03-08 07:02:43 -08:00
|
|
|
|
2024-02-05 12:42:59 -06:00
|
|
|
void add_dispatch_ready(const Queue* queue);
|
2024-01-24 16:32:54 -06:00
|
|
|
|
2024-02-07 20:03:21 -08:00
|
|
|
void iterate_callbacks(const callback_iterator_cb_t&) const;
|
|
|
|
|
|
2024-10-25 13:13:36 -07:00
|
|
|
common::Synchronized<hsa::profiler_serializer>& serializer(const Queue*);
|
2024-03-08 07:02:43 -08:00
|
|
|
|
2024-02-07 20:03:21 -08:00
|
|
|
/**
|
|
|
|
|
* Disable serialization for QueueController, has no effect if counter collection
|
|
|
|
|
* is not in use (which defaults to no serialization mechanism). Should only be used for
|
|
|
|
|
* testing.
|
|
|
|
|
*/
|
2024-03-08 07:02:43 -08:00
|
|
|
void enable_serialization();
|
2024-02-07 20:03:21 -08:00
|
|
|
void disable_serialization();
|
|
|
|
|
|
2024-03-08 07:02:43 -08:00
|
|
|
// Prints current state of signals for queues, used for debugging. Only prints
|
|
|
|
|
// serialization related signals if not compiled in debug mode.
|
|
|
|
|
void print_debug_signals() const;
|
|
|
|
|
|
|
|
|
|
#if !defined(NDEBUG)
|
|
|
|
|
// Tracks the creation of all signals in queues, used for debugging and disabled
|
|
|
|
|
// in release mode (adds locking around signal creation).
|
|
|
|
|
common::Synchronized<std::unordered_map<uint64_t, hsa_signal_t>> _debug_signals;
|
|
|
|
|
#endif
|
|
|
|
|
|
2023-10-18 23:15:56 -05:00
|
|
|
private:
|
2024-10-21 10:41:29 -07:00
|
|
|
using client_id_map_t = std::unordered_map<ClientID, agent_callback_tuple_t>;
|
|
|
|
|
using resource_alloc_t = void(const AgentCache&, const CoreApiTable&, const AmdExtTable&);
|
2023-10-18 23:15:56 -05:00
|
|
|
|
2024-10-25 13:13:36 -07:00
|
|
|
CoreApiTable _core_table = {};
|
|
|
|
|
AmdExtTable _ext_table = {};
|
|
|
|
|
common::Synchronized<queue_map_t> _queues = {};
|
|
|
|
|
common::Synchronized<client_id_map_t> _callback_cache = {};
|
|
|
|
|
agent_cache_map_t _supported_agents = {};
|
|
|
|
|
std::atomic<bool> _serialized_enabled = {false};
|
|
|
|
|
common::Synchronized<
|
|
|
|
|
std::unordered_map<rocprofiler_agent_id_t,
|
|
|
|
|
std::shared_ptr<common::Synchronized<hsa::profiler_serializer>>>>
|
|
|
|
|
_profiler_serializer;
|
2023-10-18 23:15:56 -05:00
|
|
|
};
|
|
|
|
|
|
2024-03-21 17:52:15 -05:00
|
|
|
QueueController*
|
2023-10-18 23:15:56 -05:00
|
|
|
get_queue_controller();
|
|
|
|
|
|
|
|
|
|
void
|
|
|
|
|
queue_controller_init(HsaApiTable* table);
|
|
|
|
|
|
2024-01-24 16:32:54 -06:00
|
|
|
void
|
|
|
|
|
queue_controller_fini();
|
2024-02-05 12:42:59 -06:00
|
|
|
|
2024-06-24 20:38:34 -05:00
|
|
|
void
|
|
|
|
|
queue_controller_sync();
|
|
|
|
|
|
2024-02-05 12:42:59 -06:00
|
|
|
void
|
|
|
|
|
profiler_serializer_kernel_completion_signal(hsa_signal_t queue_block_signal);
|
|
|
|
|
|
2023-10-18 23:15:56 -05:00
|
|
|
} // namespace hsa
|
|
|
|
|
} // namespace rocprofiler
|