// MIT License // // Copyright (c) 2022-2025 Advanced Micro Devices, Inc. All Rights Reserved. // // Permission is hereby granted, free of charge, to any person obtaining a copy // of this software and associated documentation files (the "Software"), to deal // in the Software without restriction, including without limitation the rights // to use, copy, modify, merge, publish, distribute, sublicense, and/or sell // copies of the Software, and to permit persons to whom the Software is // furnished to do so, subject to the following conditions: // // The above copyright notice and this permission notice shall be included in all // copies or substantial portions of the Software. // // THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR // IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, // FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE // AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER // LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, // OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE // SOFTWARE. #pragma once #include "concepts.hpp" #include #include #include #include #include #include #include #include #include #include #include namespace rocprofsys { namespace utility { /// provides an alternative thread index for when using threading::get_id() is not /// desirable inline auto get_thread_index() { static std::atomic _c{ 0 }; static thread_local int64_t _v = _c++; return _v; } /// fills any array with the result of the functor template inline auto get_filled_array(FuncT&& _func) { using Tp = std::decay_t; std::array _v{}; for(auto& itr : _v) itr = std::move(_func()); return _v; } /// returns a vector with a preallocated buffer template inline auto get_reserved_vector(size_t _n) { std::vector _v{}; _v.reserve(_n); return _v; } /// returns a vector with a preallocated buffer template inline decltype(auto) get_reserved_vector(std::vector&& _v, size_t _n) { _v.reserve(_n); return std::forward>(_v); } template struct offset_index_sequence; template struct offset_index_value { static constexpr size_t value = Idx + Offset; }; template struct offset_index_sequence, Offset> { using type = std::integer_sequence::value...>; }; template using make_offset_index_sequence = offset_index_sequence, OffsetN>; template using make_index_sequence_range = typename offset_index_sequence, StartN>::type; template struct generate { using type = Tp; template auto operator()(Args&&... _args) const { if constexpr(concepts::is_unique_pointer::value) { using value_type = typename type::element_type; if constexpr(use_placement_new_when_generating_unique_ptr::value) { // create a thread-local buffer for placement-new static thread_local auto _buffer = std::array{}; if constexpr(std::is_constructible::value) { return type{ new(_buffer.data()) value_type{ std::forward(_args)... } }; } else { return type{ new(_buffer.data()) value_type{ invoke(std::forward(_args))... } }; } } else { if constexpr(std::is_constructible::value) { return type{ new value_type{ std::forward(_args)... } }; } else { return type{ new value_type{ invoke(std::forward(_args))... } }; } } } else { if constexpr(std::is_constructible::value) { return type{ std::forward(_args)... }; } else { return type{ invoke(std::forward(_args))... }; } } } private: template static auto invoke(Up&& _v, int, std::enable_if_t::value, int> = 0) -> decltype(std::forward(_v)()) { return std::forward(_v)(); } template static auto&& invoke(Up&& _v, long) { return std::forward(_v); } template static decltype(auto) invoke(Up&& _v) { return invoke(std::forward(_v), 0); } }; template