7166b1ab58
* [rocprofv3] Add rocpd output support (part 1: prelude) - git submodules for sqlite3, GOTCHA, and pybind11 - HIP stream data - rocprofiler_query_intercept_table_name(...) - serialization load - rocprofiler::sdk::get_perfetto_category(KindT) - rocprofiler::sdk::parse::strip - common library updates - md5sum - hasher - simple_timer - static_tl_object - get_process_start_time_ns(pid_t) - output library updates - node_info - file_generator (generator is now virtual base class) - stream info updates * Added submodules * Code review updates * Minor unused-but-set-X warning fixes * Update CI - install libsqlite3-dev package * Update CI - install libsqlite3-dev package * Fix static thread-local object memory leak - also fix signal handler chaining * Remove URL from comment * Remove page migration exception * Enable ROCPROFILER_BUILD_SQLITE3 by default - try find_package(SQLite3) first and then build when ROCPROFILER_BUILD_SQLITE3=ON * Fix gotcha installation - make install of target optional * Validate tracing + counter collection dispatch data - i.e. correlation ids, thread ids, timestamps * Make find_package(SQLite3) optional - ROCm CI does not have SQLite3 dev package installed and cannot build from source (missing tclsh) * Fixes to tracing + counter collection test * get_process_start_time_ns update - original implementation did not work * Fix pytest-packages test_perfetto_data for counter collection - erroneous failure when used with same PMC + multiple agents * cmake policy: option() honors normal variables - for GOTCHA submodule * Improve samples/api_buffered_tracing stability - reduce likelihood of sporadic exception throw * Update gotcha submodule --------- Co-authored-by: Jonathan R. Madsen <jonathanrmadsen@gmail.com>
121 خطوط
4.3 KiB
C++
121 خطوط
4.3 KiB
C++
// MIT License
|
|
//
|
|
// Copyright (c) 2023-2025 Advanced Micro Devices, Inc.
|
|
//
|
|
// Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
// of this software and associated documentation files (the "Software"), to deal
|
|
// in the Software without restriction, including without limitation the rights
|
|
// to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
// copies of the Software, and to permit persons to whom the Software is
|
|
// furnished to do so, subject to the following conditions:
|
|
//
|
|
// The above copyright notice and this permission notice shall be included in
|
|
// all copies or substantial portions of the Software.
|
|
//
|
|
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
|
// AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
// OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
|
|
// THE SOFTWARE.
|
|
|
|
#pragma once
|
|
|
|
#include "lib/common/defines.hpp"
|
|
#include "lib/common/logging.hpp"
|
|
#include "lib/common/static_object.hpp"
|
|
|
|
#include <array>
|
|
#include <cstddef>
|
|
#include <functional>
|
|
#include <mutex>
|
|
#include <type_traits>
|
|
|
|
namespace rocprofiler
|
|
{
|
|
namespace common
|
|
{
|
|
/**
 * @brief Tear-down entry point for objects created through static_tl_object.
 *
 * Only declared in this header; the definition lives elsewhere.
 * NOTE(review): presumably this runs the callbacks handed to register_static_tl_dtor() -- confirm
 * against the implementation (including which thread(s) it is expected to be called on).
 */
void
destroy_static_tl_objects();
|
|
|
|
void
|
|
register_static_tl_dtor(static_dtor_func_t&&);
|
|
|
|
/**
|
|
* @brief This struct is used to create static singleton objects which have the properties of a
|
|
* heap-allocated static object without a memory leak.
|
|
*
|
|
* @tparam Tp Data type of singleton
|
|
* @tparam ContextT Use to differentiate singletons in different translation units (if using default
|
|
* parameter) or ensure the singleton can be accessed in different translation units (not
|
|
* recommended) as long as this type is not in an anonymous namespace
|
|
*
|
|
* This template works by creating a buffer of at least `sizeof(Tp)` bytes in the binary and does a
|
|
* placement new into that buffer. The object created is NOT heap allocated, the address of the
|
|
* object is an address in between the library load address and the load address + size of library.
|
|
*/
|
|
template <typename Tp, typename ContextT = anonymous>
|
|
struct static_tl_object
|
|
{
|
|
static_tl_object() = delete;
|
|
~static_tl_object() = delete;
|
|
static_tl_object(const static_tl_object&) = delete;
|
|
static_tl_object(static_tl_object&&) noexcept = delete;
|
|
static_tl_object& operator=(const static_tl_object&) = delete;
|
|
static_tl_object& operator=(static_tl_object&&) noexcept = delete;
|
|
|
|
template <typename... Args>
|
|
static Tp*& construct(Args&&... args);
|
|
|
|
static Tp* get() { return m_object; }
|
|
|
|
static constexpr bool is_trivial_standard_layout();
|
|
|
|
private:
|
|
static thread_local Tp* m_object;
|
|
static thread_local std::array<std::byte, static_buffer_size<Tp>()> m_buffer;
|
|
};
|
|
|
|
template <typename Tp, typename ContextT>
|
|
thread_local Tp* static_tl_object<Tp, ContextT>::m_object = nullptr;
|
|
|
|
template <typename Tp, typename ContextT>
|
|
thread_local std::array<std::byte, static_buffer_size<Tp>()>
|
|
static_tl_object<Tp, ContextT>::m_buffer = {};
|
|
|
|
template <typename Tp, typename ContextT>
|
|
constexpr bool
|
|
static_tl_object<Tp, ContextT>::is_trivial_standard_layout()
|
|
{
|
|
return (std::is_standard_layout<Tp>::value && std::is_trivially_destructible<Tp>::value);
|
|
}
|
|
|
|
template <typename Tp, typename ContextT>
|
|
template <typename... Args>
|
|
Tp*&
|
|
static_tl_object<Tp, ContextT>::construct(Args&&... args)
|
|
{
|
|
if constexpr(!is_trivial_standard_layout())
|
|
{
|
|
static thread_local auto _once = std::once_flag{};
|
|
std::call_once(_once, []() {
|
|
register_static_tl_dtor([]() {
|
|
if(static_tl_object<Tp, ContextT>::m_object)
|
|
{
|
|
static_tl_object<Tp, ContextT>::m_object->~Tp();
|
|
static_tl_object<Tp, ContextT>::m_object = nullptr;
|
|
}
|
|
});
|
|
});
|
|
}
|
|
|
|
ROCP_FATAL_IF(m_object)
|
|
<< "reconstructing static object. Use get() function to retrieve pointer";
|
|
|
|
m_object = new(m_buffer.data()) Tp{std::forward<Args>(args)...};
|
|
return m_object;
|
|
}
|
|
} // namespace common
|
|
} // namespace rocprofiler
|