2022-04-21 21:36:07 -05:00
|
|
|
// MIT License
|
|
|
|
|
//
|
2025-01-15 13:06:12 -05:00
|
|
|
// Copyright (c) 2022-2025 Advanced Micro Devices, Inc. All Rights Reserved.
|
2022-04-21 21:36:07 -05:00
|
|
|
//
|
|
|
|
|
// Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
|
|
|
// of this software and associated documentation files (the "Software"), to deal
|
|
|
|
|
// in the Software without restriction, including without limitation the rights
|
|
|
|
|
// to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
|
|
|
// copies of the Software, and to permit persons to whom the Software is
|
|
|
|
|
// furnished to do so, subject to the following conditions:
|
|
|
|
|
//
|
|
|
|
|
// The above copyright notice and this permission notice shall be included in all
|
|
|
|
|
// copies or substantial portions of the Software.
|
|
|
|
|
//
|
|
|
|
|
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
|
|
|
// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
|
|
|
// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
|
|
|
|
// AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
|
|
|
// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
|
|
|
// OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
|
|
|
|
|
// SOFTWARE.
|
|
|
|
|
|
|
|
|
|
#pragma once
|
|
|
|
|
|
2022-08-31 01:24:31 -05:00
|
|
|
#include "api.hpp"
|
2023-02-04 10:59:50 -06:00
|
|
|
#include "core/common.hpp"
|
|
|
|
|
#include "core/defines.hpp"
|
|
|
|
|
#include "core/state.hpp"
|
|
|
|
|
#include "core/timemory.hpp"
|
2023-01-24 18:53:23 -06:00
|
|
|
#include "library/causal/components/causal_gotcha.hpp"
|
2022-07-24 22:09:32 -05:00
|
|
|
#include "library/components/exit_gotcha.hpp"
|
2022-04-21 21:36:07 -05:00
|
|
|
#include "library/components/fork_gotcha.hpp"
|
2025-12-23 03:17:57 +01:00
|
|
|
#include "library/components/kill_gotcha.hpp"
|
2022-04-21 21:36:07 -05:00
|
|
|
#include "library/components/mpi_gotcha.hpp"
|
2022-09-12 17:44:27 -05:00
|
|
|
#include "library/components/numa_gotcha.hpp"
|
2022-04-21 21:36:07 -05:00
|
|
|
#include "library/components/pthread_gotcha.hpp"
|
2025-02-11 13:08:23 -05:00
|
|
|
#include "library/components/vaapi_gotcha.hpp"
|
2022-04-25 17:00:52 -05:00
|
|
|
#include "library/thread_data.hpp"
|
2022-04-21 21:36:07 -05:00
|
|
|
|
|
|
|
|
#include <timemory/backends/threading.hpp>
|
|
|
|
|
#include <timemory/macros/language.hpp>
|
|
|
|
|
|
2022-07-24 22:09:32 -05:00
|
|
|
#include <memory>
|
|
|
|
|
#include <set>
|
2022-04-21 21:36:07 -05:00
|
|
|
#include <string>
|
|
|
|
|
#include <string_view>
|
|
|
|
|
#include <unordered_set>
|
|
|
|
|
|
2024-10-15 11:20:40 -04:00
|
|
|
namespace rocprofsys
|
2022-04-21 21:36:07 -05:00
|
|
|
{
|
2022-08-31 11:33:45 -05:00
|
|
|
// Components started during the preinit phase.
// The bundle is a tim::lightweight_tuple holding the exit, fork, MPI and kill
// gotcha component types.
|
|
|
|
|
using preinit_bundle_t =
|
2025-12-23 03:17:57 +01:00
|
|
|
tim::lightweight_tuple<exit_gotcha_t, fork_gotcha_t, mpi_gotcha_t, kill_gotcha_t>;
|
2022-08-31 11:33:45 -05:00
|
|
|
|
|
|
|
|
// Components started during the init phase.
// The bundle is a tim::lightweight_tuple holding the causal gotcha, the pthread
// gotcha and the NUMA gotcha component types.
|
2023-01-24 18:53:23 -06:00
|
|
|
using init_bundle_t = tim::lightweight_tuple<causal::component::causal_gotcha,
|
|
|
|
|
pthread_gotcha, component::numa_gotcha>;
|
2022-08-31 11:33:45 -05:00
|
|
|
|
2024-10-15 11:20:40 -04:00
|
|
|
// Bundle of components around rocprofsys_init and rocprofsys_finalize.
// Holds the process-level measurement component types: wall clock, peak RSS,
// page RSS, CPU clock and CPU utilization.
|
2022-04-21 21:36:07 -05:00
|
|
|
using main_bundle_t =
|
2022-08-31 01:24:31 -05:00
|
|
|
tim::lightweight_tuple<comp::wall_clock, comp::peak_rss, comp::page_rss,
|
2022-08-31 11:33:45 -05:00
|
|
|
comp::cpu_clock, comp::cpu_util>;
|
2022-04-21 21:36:07 -05:00
|
|
|
|
|
|
|
|
// Bundle of components around each thread.
// Both variants hold wall clock, thread CPU clock and thread CPU utilization;
// comp::peak_rss is added only when TIMEMORY_RUSAGE_THREAD is defined and > 0.
// NOTE(review): presumably that macro signals per-thread rusage support in
// timemory — confirm against the timemory headers.
|
|
|
|
|
#if defined(TIMEMORY_RUSAGE_THREAD) && TIMEMORY_RUSAGE_THREAD > 0
|
2022-08-31 11:33:45 -05:00
|
|
|
using thread_bundle_t = tim::lightweight_tuple<comp::wall_clock, comp::thread_cpu_clock,
|
|
|
|
|
comp::thread_cpu_util, comp::peak_rss>;
|
2022-04-21 21:36:07 -05:00
|
|
|
#else
|
2022-08-31 11:33:45 -05:00
|
|
|
using thread_bundle_t = tim::lightweight_tuple<comp::wall_clock, comp::thread_cpu_clock,
|
|
|
|
|
comp::thread_cpu_util>;
|
2022-04-21 21:36:07 -05:00
|
|
|
#endif
|
|
|
|
|
|
|
|
|
|
// Accessor for the main bundle: returns a mutable reference to the
// std::unique_ptr that holds the main_bundle_t instance.
// NOTE(review): whether the pointer can be null at call time is not visible
// from this declaration — check the definition before dereferencing.
std::unique_ptr<main_bundle_t>&
|
|
|
|
|
get_main_bundle();
|
|
|
|
|
|
2022-08-31 11:33:45 -05:00
|
|
|
// Accessor for the init bundle: returns a mutable reference to the
// std::unique_ptr that holds the init_bundle_t instance.
// NOTE(review): whether the pointer can be null at call time is not visible
// from this declaration — check the definition before dereferencing.
std::unique_ptr<init_bundle_t>&
|
|
|
|
|
get_init_bundle();
|
|
|
|
|
|
|
|
|
|
// Accessor for the preinit bundle: returns a mutable reference to the
// std::unique_ptr that holds the preinit_bundle_t instance.
// NOTE(review): whether the pointer can be null at call time is not visible
// from this declaration — check the definition before dereferencing.
std::unique_ptr<preinit_bundle_t>&
|
|
|
|
|
get_preinit_bundle();
|
2022-04-21 21:36:07 -05:00
|
|
|
|
|
|
|
|
// Returns a reference to a std::atomic<uint64_t>.
// NOTE(review): judging by the name, this looks like the counter that CPU-side
// correlation ids ("cid") are drawn from — confirm against the definition.
// NOTE(review): TIMEMORY_HOT is defined by timemory; presumably a hot-path
// attribute — confirm in timemory's macro headers.
std::atomic<uint64_t>&
|
2022-06-20 00:44:31 -05:00
|
|
|
get_cpu_cid() TIMEMORY_HOT;
|
2022-04-21 21:36:07 -05:00
|
|
|
|
2022-04-25 17:00:52 -05:00
|
|
|
// Returns a reference to the unique_ptr_t owning a std::vector<uint64_t> for
// the given thread id.
//   _tid    : thread id; defaults to threading::get_id(), evaluated at each
//             call that omits the argument.
//   _parent : defaults to 0.
// NOTE(review): presumably the vector is the per-thread stack of active cids
// and _parent is the thread id the stack is seeded from — neither is visible
// in this declaration; confirm against the definition.
unique_ptr_t<std::vector<uint64_t>>&
|
2022-06-20 00:44:31 -05:00
|
|
|
get_cpu_cid_stack(int64_t _tid = threading::get_id(), int64_t _parent = 0) TIMEMORY_HOT;
|
2022-04-21 21:36:07 -05:00
|
|
|
|
2022-05-24 19:25:54 -05:00
|
|
|
// Three-field record returned by create_cpu_cid_entry().
// NOTE(review): presumably (cid, parent cid, depth) — TODO confirm field order
// against the definition of create_cpu_cid_entry().
using cpu_cid_data_t = std::tuple<uint64_t, uint64_t, uint32_t>;
|
|
|
|
|
// Two-field record returned by get_cpu_cid_entry() and used as the mapped type
// of cpu_cid_parent_map_t.
// NOTE(review): presumably (parent cid, depth) — TODO confirm.
using cpu_cid_pair_t = std::tuple<uint64_t, uint32_t>;
|
2022-04-21 21:36:07 -05:00
|
|
|
// Map from a uint64_t key to its cpu_cid_pair_t.
// NOTE(review): the key is presumably the cid — TODO confirm.
using cpu_cid_parent_map_t = std::unordered_map<uint64_t, cpu_cid_pair_t>;
|
|
|
|
|
|
2022-04-25 17:00:52 -05:00
|
|
|
// Returns a reference to the unique_ptr_t owning the cpu_cid_parent_map_t for
// the given thread id.
//   _tid : thread id; defaults to threading::get_id(), evaluated at each call
//          that omits the argument.
unique_ptr_t<cpu_cid_parent_map_t>&
|
2022-06-20 00:44:31 -05:00
|
|
|
get_cpu_cid_parents(int64_t _tid = threading::get_id()) TIMEMORY_HOT;
|
2022-04-21 21:36:07 -05:00
|
|
|
|
|
|
|
|
// Returns a cpu_cid_data_t (a tuple of uint64_t, uint64_t, uint32_t) by value
// for the given thread id.
//   _tid : thread id; defaults to threading::get_id(), evaluated at each call
//          that omits the argument.
// NOTE(review): by its name this allocates a new cid and records its parent —
// the side effects are not visible here; confirm against the definition.
cpu_cid_data_t
|
2022-06-20 00:44:31 -05:00
|
|
|
create_cpu_cid_entry(int64_t _tid = threading::get_id()) TIMEMORY_HOT;
|
2022-04-21 21:36:07 -05:00
|
|
|
|
|
|
|
|
// Returns the cpu_cid_pair_t (a tuple of uint64_t, uint32_t) associated with
// _cid for the given thread id.
//   _cid : id to look up.
//   _tid : thread id; defaults to threading::get_id(), evaluated at each call
//          that omits the argument.
// NOTE(review): behavior for an unknown _cid is not visible from this
// declaration — confirm against the definition.
cpu_cid_pair_t
|
2022-06-20 00:44:31 -05:00
|
|
|
get_cpu_cid_entry(uint64_t _cid, int64_t _tid = threading::get_id()) TIMEMORY_HOT;
|
2022-04-21 21:36:07 -05:00
|
|
|
|
2022-04-27 16:56:38 -05:00
|
|
|
// Returns a reference to a tim::mutex_t for the given thread id.
//   _tid : thread id; defaults to threading::get_id(), evaluated at each call
//          that omits the argument.
// NOTE(review): by its name this mutex guards that thread's cid stack — which
// accesses must hold it is not visible here; confirm against the callers.
tim::mutex_t&
|
2022-06-20 00:44:31 -05:00
|
|
|
get_cpu_cid_stack_lock(int64_t _tid = threading::get_id()) TIMEMORY_HOT;
|
2022-04-27 16:56:38 -05:00
|
|
|
|
2022-08-31 06:29:19 -05:00
|
|
|
// Query the current value of the "sampling enabled on child threads" setting.
|
|
|
|
|
bool
|
|
|
|
|
sampling_enabled_on_child_threads();
|
|
|
|
|
|
|
|
|
|
// Use this to disable (or enable) sampling on child threads for a region,
// e.g. right before thread creation; _v is the value to apply.
// NOTE(review): the meaning of the returned bool is not visible from this
// declaration (presumably the value now in effect) — confirm against the
// definition.
|
|
|
|
|
bool
|
|
|
|
|
push_enable_sampling_on_child_threads(bool _v);
|
|
|
|
|
|
|
|
|
|
// Use this to restore the previous setting.
// NOTE(review): the meaning of the returned bool is not visible from this
// declaration (presumably the restored value) — confirm against the
// definition.
|
|
|
|
|
bool
|
|
|
|
|
pop_enable_sampling_on_child_threads();
|
|
|
|
|
|
|
|
|
|
// Make sure every newly created thread starts with this value (_v).
|
|
|
|
|
void
|
|
|
|
|
set_sampling_on_all_future_threads(bool _v);
|
|
|
|
|
|
|
|
|
|
struct scoped_child_sampling
|
|
|
|
|
{
|
|
|
|
|
scoped_child_sampling(bool _v) { push_enable_sampling_on_child_threads(_v); }
|
|
|
|
|
~scoped_child_sampling() { pop_enable_sampling_on_child_threads(); }
|
|
|
|
|
};
|
2023-02-08 01:31:38 -06:00
|
|
|
|
|
|
|
|
// Returns the process id (pid_t) of the root process.
// NOTE(review): how the "root" process is determined (e.g. the first process
// that loaded the library vs. forked children) is not visible from this
// declaration — confirm against the definition.
pid_t
|
|
|
|
|
get_root_process_id();
|
|
|
|
|
|
|
|
|
|
// Returns whether the calling process is the root process.
// NOTE(review): presumably compares the current pid against
// get_root_process_id() — confirm against the definition.
bool
|
|
|
|
|
is_root_process();
|
|
|
|
|
|
|
|
|
|
// Returns whether the calling process is a child process.
// NOTE(review): presumably the negation of is_root_process() — confirm against
// the definition.
bool
|
|
|
|
|
is_child_process();
|
2024-10-15 11:20:40 -04:00
|
|
|
} // namespace rocprofsys
|
2022-05-08 04:40:10 -05:00
|
|
|
|
2024-10-15 11:20:40 -04:00
|
|
|
// Declares a ::rocprofsys::scoped_child_sampling object brace-initialized with
// VALUE. The variable name is produced by
// ROCPROFSYS_VARIABLE(_scoped_child_sampling_, __LINE__).
// NOTE(review): ROCPROFSYS_VARIABLE is defined elsewhere; presumably it pastes
// the line number onto the prefix so several guards can share a scope —
// confirm against its definition.
#define ROCPROFSYS_SCOPED_SAMPLING_ON_CHILD_THREADS(VALUE)                               \
    ::rocprofsys::scoped_child_sampling ROCPROFSYS_VARIABLE(                             \
        _scoped_child_sampling_, __LINE__)                                               \
    {                                                                                    \
        VALUE                                                                            \
    }
|