// MIT License // // Copyright (c) 2023-2025 Advanced Micro Devices, Inc. All rights reserved. // // Permission is hereby granted, free of charge, to any person obtaining a copy // of this software and associated documentation files (the "Software"), to deal // in the Software without restriction, including without limitation the rights // to use, copy, modify, merge, publish, distribute, sublicense, and/or sell // copies of the Software, and to permit persons to whom the Software is // furnished to do so, subject to the following conditions: // // The above copyright notice and this permission notice shall be included in all // copies or substantial portions of the Software. // // THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR // IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, // FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE // AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER // LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, // OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE // SOFTWARE. #pragma once #include "counter_info.hpp" #include "generator.hpp" #include "pc_sample_transform.hpp" #include "statistics.hpp" #include "stream_info.hpp" #include "tmp_file_buffer.hpp" #include "lib/common/container/ring_buffer.hpp" #include "lib/common/logging.hpp" #include #include namespace rocprofiler { namespace tool { using float_type = double; using stats_data_t = statistics; template struct buffered_output { using type = Tp; static constexpr auto buffer_type_v = DomainT; explicit buffered_output(bool _enabled); ~buffered_output() = default; buffered_output(const buffered_output&) = delete; buffered_output(buffered_output&&) noexcept = delete; buffered_output& operator=(const buffered_output&) = delete; buffered_output& operator=(buffered_output&&) noexcept = delete; operator bool() const { return enabled; } void flush(); void read(); void clear(); void reset(); void destroy(); uint64_t get_num_bytes() const; file_generator get_generator() const; std::deque load_all(); stats_entry_t stats = {}; private: bool enabled = false; }; template buffered_output::buffered_output(bool _enabled) : enabled{_enabled} {} template void buffered_output::flush() { if(!enabled) return; flush_tmp_buffer(buffer_type_v); } template void buffered_output::read() { if(!enabled) return; flush(); read_tmp_file(buffer_type_v); } template file_generator buffered_output::get_generator() const { return file_generator{get_tmp_file_buffer(DomainT)}; } template std::deque buffered_output::load_all() { auto data = std::deque{}; if(enabled) { auto gen = get_generator(); for(auto ditr : gen) { for(auto itr : gen.get(ditr)) { data.emplace_back(itr); } } } return data; } template void buffered_output::clear() { if(!enabled) return; } template void buffered_output::reset() { if(!enabled) return; if(auto*& filebuf = get_tmp_file_buffer(buffer_type_v); filebuf) { filebuf->reset(); } } template void buffered_output::destroy() { if(!enabled) return; clear(); auto*& filebuf = get_tmp_file_buffer(buffer_type_v); if(filebuf) { file_buffer* tmp = nullptr; std::swap(filebuf, tmp); tmp->buffer.destroy(); if(tmp->file) { tmp->file.close(); tmp->file.remove(); } delete tmp; } } template uint64_t buffered_output::get_num_bytes() const { if(auto*& filebuf = get_tmp_file_buffer(buffer_type_v); filebuf) return filebuf->nbytes; return 0; } using hip_buffered_output_t = buffered_output; using hsa_buffered_output_t = buffered_output; using marker_buffered_output_t = buffered_output; using rccl_buffered_output_t = buffered_output; using counter_collection_buffered_output_t = buffered_output; using scratch_memory_buffered_output_t = buffered_output; using memory_allocation_buffered_output_t = buffered_output; using counter_records_buffered_output_t = ::rocprofiler::tool::buffered_output; using pc_sampling_host_trap_buffered_output_t = buffered_output; using rocdecode_buffered_output_t = buffered_output; using rocjpeg_buffered_output_t = buffered_output; using kernel_dispatch_buffered_output_ext_t = buffered_output; using memory_copy_buffered_output_ext_t = buffered_output; using pc_sampling_stochastic_buffered_output_t = buffered_output; } // namespace tool } // namespace rocprofiler