55f2dabbb3
- include/rocprofiler/agent.h
- move rocprofiler_dim3_t
- include/rocprofiler/buffer_tracing.h
- size fields
- update kernel dispatch record
- include/rocprofiler/callback_tracing.h
- remove rocprofiler_callback_tracing_code_object_unload_data_t
- remove rocprofiler_callback_tracing_code_object_register_host_kernel_symbol_data_t
- include/rocprofiler/fwd.h
- added ROCPROFILER_STATUS_ERROR_CONTEXT_CONFLICT
- remove ROCPROFILER_CALLBACK_TRACING_CODE_OBJECT_UNLOAD
- remove ROCPROFILER_CALLBACK_TRACING_CODE_OBJECT_DEVICE_KERNEL_SYMBOL_UNREGISTER
- add rocprofiler_kernel_id_t typedef
- add rocprofiler_dim3_t (moved from agent.h)
- lib/common/synchronized.hpp
- rlock/wlock return decltype(auto)
- separate prototype from definition
- lib/common/utility.{hpp,cpp}
- timestamp functions replicating HSA implementation(s)
- init_public_api_struct for setting size field and ensuring certain type traits
- simplified static_cleanup_wrapper
- separate prototype from definition in active_capacity_gate
- lib/rocprofiler/agent.cpp
- tweak get_rocprofiler_agent impl
- lib/rocprofiler/buffer.cpp
- fix buffer message log level
- lib/rocprofiler/context.cpp
- use new paradigm for getting active contexts
- lib/rocprofiler/internal_threading.hpp
- update to simplified static_cleanup_wrapper implementation
- lib/rocprofiler/registration.cpp
- fix deactivating contexts
- lib/rocprofiler/rocprofiler.cpp
- status string for context conflict
- lib/rocprofiler/context/context.*
- correlation_id struct
- new get_active_contexts paradigm
- lib/rocprofiler/counters/core.*
- rocprofiler_packet union
- tweak start/stop context to accept pointer instead of handle
- lib/rocprofiler/counters/dimensions.cpp
- update to new get_rocp_agent() return type
- lib/rocprofiler/hsa/hsa.*
- update to new get_active_contexts paradigm
- update to new correlation id implementation
- guard against hsa.def.cpp direct compilation
- lib/rocprofiler/hsa/queue_controller.*
- update to change in get_rocp_agent return type
- consistent aliases
- lookup function for getting queue pointer from hsa queue id
- lib/rocprofiler/hsa/queue.*
- rocprofiler_packet
- extend queue_info_session_t
- lib/rocprofiler/tests/registration.cpp
- improve diagnostic on perf check for rocprofiler_lib.callback_registration_lambda_with_result
112 строки
4.0 KiB
C++
112 строки
4.0 KiB
C++
// Copyright (c) 2018-2023 Advanced Micro Devices, Inc.
//
// Permission is hereby granted, free of charge, to any person obtaining a copy
// of this software and associated documentation files (the "Software"), to deal
// in the Software without restriction, including without limitation the rights
// to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
// copies of the Software, and to permit persons to whom the Software is
// furnished to do so, subject to the following conditions:
//
// The above copyright notice and this permission notice shall be included in
// all copies or substantial portions of the Software.
//
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
// AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
// OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
// THE SOFTWARE.
|
|
|
|
#pragma once
|
|
|
|
#include <hsa/hsa.h>
|
|
#include <hsa/hsa_api_trace.h>
|
|
#include <hsa/hsa_ext_amd.h>
|
|
|
|
#include "fmt/core.h"
|
|
#include "fmt/ranges.h"
|
|
|
|
#include <string>
|
|
#include <string_view>
|
|
#include <unordered_map>
|
|
#include <vector>
|
|
|
|
#include <rocprofiler/agent.h>
|
|
#include "lib/common/utility.hpp"
|
|
|
|
// Generates a matched pair of member accessors named NAME that both return the
// expression VAL by reference:
//   - a non-const overload returning `RTYPE&`
//   - a const overload returning `const RTYPE&`
//
// Parameters:
//   RTYPE - referenced type, written without const or reference qualifiers
//   NAME  - identifier given to both overloads
//   VAL   - expression (typically a data member) returned by both overloads
//
// Must be expanded inside a class body. The expansion ends with a complete
// function definition, so a trailing semicolon at the call site is optional.
// Every continued line must end in a backslash with nothing after it,
// otherwise the second accessor falls outside the macro.
#define CONST_NONCONST_ACCESSOR(RTYPE, NAME, VAL)                                                  \
    RTYPE&       NAME() { return VAL; }                                                            \
    const RTYPE& NAME() const { return VAL; }
|
|
|
|
namespace rocprofiler
|
|
{
|
|
namespace hsa
|
|
{
|
|
// LDS block size constant: 128 * 4 = 512.
// NOTE(review): the unit is not stated in this header -- presumably bytes; confirm.
// Declared `inline constexpr` so that every translation unit including this
// header shares a single compile-time definition instead of a per-TU copy.
inline constexpr uint32_t LDS_BLOCK_SIZE = 128 * 4;
|
|
|
|
// Stores per-agent HSA information such as GPU and Kernel pools
|
|
// along with nearest CPU agent and its pool. Links rocprofiler_agent_t
|
|
// to its HSA agent. Note this class is only valid when HSA is
|
|
// init'd
|
|
class AgentCache
|
|
{
|
|
public:
|
|
AgentCache(const rocprofiler_agent_t* rocp_agent,
|
|
hsa_agent_t hsa_agent,
|
|
size_t index,
|
|
hsa_agent_t nearest_cpu,
|
|
const AmdExtTable& ext_table);
|
|
~AgentCache() = default;
|
|
AgentCache(const AgentCache&) = default;
|
|
AgentCache(AgentCache&&) noexcept = default;
|
|
|
|
AgentCache& operator=(const AgentCache&) = default;
|
|
AgentCache& operator=(AgentCache&&) noexcept = default;
|
|
|
|
// Provides const and a non-const accessor functions.
|
|
CONST_NONCONST_ACCESSOR(hsa_amd_memory_pool_t, cpu_pool, m_cpu_pool);
|
|
CONST_NONCONST_ACCESSOR(hsa_amd_memory_pool_t, kernarg_pool, m_kernarg_pool);
|
|
CONST_NONCONST_ACCESSOR(hsa_amd_memory_pool_t, gpu_pool, m_gpu_pool);
|
|
CONST_NONCONST_ACCESSOR(hsa_agent_t, get_hsa_agent, m_hsa_agent);
|
|
CONST_NONCONST_ACCESSOR(hsa_agent_t, near_cpu, m_nearest_cpu);
|
|
|
|
const rocprofiler_agent_t* get_rocp_agent() const { return m_rocp_agent; }
|
|
std::string_view name() const { return m_name; }
|
|
size_t index() const { return m_index; }
|
|
|
|
bool operator==(const rocprofiler_agent_t*) const;
|
|
bool operator==(hsa_agent_t) const;
|
|
|
|
private:
|
|
// Agent info
|
|
const rocprofiler_agent_t* m_rocp_agent = nullptr;
|
|
size_t m_index{0}; // rocprofiler_agent index
|
|
|
|
// GPU Agent
|
|
hsa_agent_t m_hsa_agent{.handle = 0};
|
|
hsa_agent_t m_nearest_cpu{.handle = 0};
|
|
|
|
// memory pools
|
|
hsa_amd_memory_pool_t m_cpu_pool{.handle = 0};
|
|
hsa_amd_memory_pool_t m_kernarg_pool{.handle = 0};
|
|
hsa_amd_memory_pool_t m_gpu_pool{.handle = 0};
|
|
|
|
std::string_view m_name = {};
|
|
};
|
|
|
|
inline bool
|
|
AgentCache::operator==(const rocprofiler_agent_t* agent) const
|
|
{
|
|
return (agent == m_rocp_agent);
|
|
}
|
|
|
|
inline bool
|
|
AgentCache::operator==(hsa_agent_t agent) const
|
|
{
|
|
return (agent.handle == m_hsa_agent.handle);
|
|
}
|
|
} // namespace hsa
|
|
} // namespace rocprofiler
|