b097e276a9
* [rocprofv3] Add rocpd output support (part 1: prelude)
- git submodules for sqlite3, GOTCHA, and pybind11
- HIP stream data
- rocprofiler_query_intercept_table_name(...)
- serialization load
- rocprofiler::sdk::get_perfetto_category(KindT)
- rocprofiler::sdk::parse::strip
- common library updates
- md5sum
- hasher
- simple_timer
- static_tl_object
- get_process_start_time_ns(pid_t)
- output library updates
- node_info
- file_generator (generator is now virtual base class)
- stream info updates
* Added submodules
* Code review updates
* Minor unused-but-set-X warning fixes
* Update CI
- install libsqlite3-dev package
* Update CI
- install libsqlite3-dev package
* Fix static thread-local object memory leak
- also fix signal handler chaining
* Remove URL from comment
* Remove page migration exception
* Enable ROCPROFILER_BUILD_SQLITE3 by default
- try find_package(SQLite3) first and then build when ROCPROFILER_BUILD_SQLITE3=ON
* Fix gotcha installation
- make install of target optional
* Validate tracing + counter collection dispatch data
- i.e. correlation ids, thread ids, timestamps
* Make find_package(SQLite3) optional
- ROCm CI does not have SQLite3 dev package installed and cannot build from source (missing tclsh)
* Fixes to tracing + counter collection test
* get_process_start_time_ns update
- original implementation did not work
* Fix pytest-packages test_perfetto_data for counter collection
- erroneous failure when used with same PMC + multiple agents
* cmake policy: option() honors normal variables
- for GOTCHA submodule
* Improve samples/api_buffered_tracing stability
- reduce likelihood of sporadic exception throw
* Update gotcha submodule
---------
Co-authored-by: Jonathan R. Madsen <jonathanrmadsen@gmail.com>
[ROCm/rocprofiler-sdk commit: 7166b1ab58]
121 řádky
4.3 KiB
C++
121 řádky
4.3 KiB
C++
// MIT License
|
|
//
|
|
// Copyright (c) 2023-2025 Advanced Micro Devices, Inc.
|
|
//
|
|
// Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
// of this software and associated documentation files (the "Software"), to deal
|
|
// in the Software without restriction, including without limitation the rights
|
|
// to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
// copies of the Software, and to permit persons to whom the Software is
|
|
// furnished to do so, subject to the following conditions:
|
|
//
|
|
// The above copyright notice and this permission notice shall be included in
|
|
// all copies or substantial portions of the Software.
|
|
//
|
|
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
|
// AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
// OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
|
|
// THE SOFTWARE.
|
|
|
|
#pragma once
|
|
|
|
#include "lib/common/defines.hpp"
|
|
#include "lib/common/logging.hpp"
|
|
#include "lib/common/static_object.hpp"
|
|
|
|
#include <array>
|
|
#include <cstddef>
|
|
#include <functional>
|
|
#include <mutex>
|
|
#include <type_traits>
|
|
|
|
namespace rocprofiler
|
|
{
|
|
namespace common
|
|
{
|
|
/// Declared here; the definition lives outside this header.
/// NOTE(review): presumably invokes the callbacks handed to register_static_tl_dtor() --
/// confirm against the implementation.
void destroy_static_tl_objects();
|
|
|
|
void
|
|
register_static_tl_dtor(static_dtor_func_t&&);
|
|
|
|
/**
|
|
* @brief This struct is used to create static singleton objects which have the properties of a
|
|
* heap-allocated static object without a memory leak.
|
|
*
|
|
* @tparam Tp Data type of singleton
|
|
* @tparam ContextT Use to differentiate singletons in different translation units (if using default
|
|
* parameter) or ensure the singleton can be accessed in different translation units (not
|
|
* recommended) as long as this type is not in an anonymous namespace
|
|
*
|
|
* This template works by creating a buffer of at least `sizeof(Tp)` bytes in the binary and does a
|
|
* placement new into that buffer. The object created is NOT heap allocated, the address of the
|
|
* object is an address in between the library load address and the load address + size of library.
|
|
*/
|
|
template <typename Tp, typename ContextT = anonymous>
|
|
struct static_tl_object
|
|
{
|
|
static_tl_object() = delete;
|
|
~static_tl_object() = delete;
|
|
static_tl_object(const static_tl_object&) = delete;
|
|
static_tl_object(static_tl_object&&) noexcept = delete;
|
|
static_tl_object& operator=(const static_tl_object&) = delete;
|
|
static_tl_object& operator=(static_tl_object&&) noexcept = delete;
|
|
|
|
template <typename... Args>
|
|
static Tp*& construct(Args&&... args);
|
|
|
|
static Tp* get() { return m_object; }
|
|
|
|
static constexpr bool is_trivial_standard_layout();
|
|
|
|
private:
|
|
static thread_local Tp* m_object;
|
|
static thread_local std::array<std::byte, static_buffer_size<Tp>()> m_buffer;
|
|
};
|
|
|
|
template <typename Tp, typename ContextT>
|
|
thread_local Tp* static_tl_object<Tp, ContextT>::m_object = nullptr;
|
|
|
|
template <typename Tp, typename ContextT>
|
|
thread_local std::array<std::byte, static_buffer_size<Tp>()>
|
|
static_tl_object<Tp, ContextT>::m_buffer = {};
|
|
|
|
template <typename Tp, typename ContextT>
|
|
constexpr bool
|
|
static_tl_object<Tp, ContextT>::is_trivial_standard_layout()
|
|
{
|
|
return (std::is_standard_layout<Tp>::value && std::is_trivially_destructible<Tp>::value);
|
|
}
|
|
|
|
template <typename Tp, typename ContextT>
|
|
template <typename... Args>
|
|
Tp*&
|
|
static_tl_object<Tp, ContextT>::construct(Args&&... args)
|
|
{
|
|
if constexpr(!is_trivial_standard_layout())
|
|
{
|
|
static thread_local auto _once = std::once_flag{};
|
|
std::call_once(_once, []() {
|
|
register_static_tl_dtor([]() {
|
|
if(static_tl_object<Tp, ContextT>::m_object)
|
|
{
|
|
static_tl_object<Tp, ContextT>::m_object->~Tp();
|
|
static_tl_object<Tp, ContextT>::m_object = nullptr;
|
|
}
|
|
});
|
|
});
|
|
}
|
|
|
|
ROCP_FATAL_IF(m_object)
|
|
<< "reconstructing static object. Use get() function to retrieve pointer";
|
|
|
|
m_object = new(m_buffer.data()) Tp{std::forward<Args>(args)...};
|
|
return m_object;
|
|
}
|
|
} // namespace common
|
|
} // namespace rocprofiler
|