Files
rocm-systems/source/lib/omnitrace/library/components/fork_gotcha.cpp
T
Jonathan R. Madsen 3e2fa69a14 CI timeout + line-info in releases (#279)
* Update perfetto args.gn.in

- remove enable_perfetto_tools_trace_to_text (unused)

* core timeout implementation

- requires OMNITRACE_CI=ON
- requires OMNITRACE_CI_TIMEOUT=<sec>
- adds pthread_self and std::this_thread::get_id to thread info
- pthread_create_gotcha stores native handles (pthread_self)

* Testing updates

- improve detection of segfault/failures with PASS_REGEX exists
- add OMNITRACE_CI_TIMEOUT env variable to all tests

* Line-info in releases

- e.g. -g1 + more options to minimize size of debug info

* Fix typo in config exit action message

* OMNITRACE_UNLIKELY around debug/verbose messages

* format fixes

* Overflow tests + capability check

* transpose example update

- link to threads library

* roctracer/rocprofiler update

- in ROCm 5.5.0, cannot include rocprofiler.h and roctracer.h in same file due to conflicting enum defs
- Moved HSA tracing setup/shutdown to component::roctracer

* roctracer update

- fix definition of roctracer::setup when disabled

* Update fork example

- detach threads on main PID
- flush io outputs when printing info

* Update overflow tests

- pass regular expressions
- overflow on PERF_COUNT_SW_CPU_CLOCK event

* fork gotcha update

- use getpid() instead of getppid()

* update fork example

- wait on threads calling fork

* timeout update

- wait on timeout thread to launch before proceeding
2023-06-14 11:55:22 -05:00

179 lines
5.3 KiB
C++

// MIT License
//
// Copyright (c) 2022 Advanced Micro Devices, Inc. All Rights Reserved.
//
// Permission is hereby granted, free of charge, to any person obtaining a copy
// of this software and associated documentation files (the "Software"), to deal
// in the Software without restriction, including without limitation the rights
// to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
// copies of the Software, and to permit persons to whom the Software is
// furnished to do so, subject to the following conditions:
//
// The above copyright notice and this permission notice shall be included in all
// copies or substantial portions of the Software.
//
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
// AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
// OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
// SOFTWARE.
#include "api.hpp"
#include "core/config.hpp"
#include "core/debug.hpp"
#include "core/perfetto.hpp"
#include "core/perfetto_fwd.hpp"
#include "core/state.hpp"
#include "library/components/fork_gotcha.hpp"
#include "library/runtime.hpp"
#include "library/sampling.hpp"
#include <timemory/backends/process.hpp>
#include <timemory/backends/threading.hpp>
#include <timemory/mpl/types.hpp>
#include <timemory/process/process.hpp>
#include <cerrno>
#include <cstdlib>
#include <memory>
#include <pthread.h>
#include <unistd.h>
namespace omnitrace
{
namespace component
{
namespace
{
// Re-entrancy guards for the fork handlers. Each handler can be reached both
// through pthread_atfork and through the fork gotcha wrapper, so a flag marks a
// handler as "already executed" until the complementary handler clears it.
bool prefork_lock{ false };
bool postfork_parent_lock{ false };
bool postfork_child_lock{ false };
// Exit handler used by forked child processes: terminates via std::quick_exit
// (i.e. without the regular cleanup) because perfetto has a tendency to access
// memory it shouldn't during cleanup. The second argument is ignored; it is only
// present so the function matches the on_exit() callback signature.
void
child_exit(int _exit_code, void* /*unused*/)
{
    std::quick_exit(_exit_code);
}
// Pre-fork handler. Registered with pthread_atfork as the "prepare" callback and
// also invoked directly by the fork gotcha wrapper, hence the re-entry guard.
// It makes sure the library is initialized, updates the environment, logs the
// fork, and then blocks sampling / disables the enabled categories; the
// post-fork parent handler re-enables the categories and unblocks sampling.
void
prefork_setup()
{
// already executed for the current fork: nothing to do until a post-fork
// handler clears the flag
if(prefork_lock) return;
// NOTE(review): presumably these two macros create scoped objects which mark
// this thread as internal and turn off sampling on child threads for the
// duration of this function -- confirm against the macro definitions
OMNITRACE_SCOPED_THREAD_STATE(ThreadState::Internal);
OMNITRACE_SCOPED_SAMPLING_ON_CHILD_THREADS(false);
// initialize the library if it is not active yet and no settings were configured
if(get_state() < State::Active && !config::settings_are_configured())
omnitrace_init_library_hidden();
// NOTE(review): the last argument of tim::set_env is presumably the overwrite
// flag, i.e. OMNITRACE_PRELOAD is forced to "0" whereas OMNITRACE_ROOT_PROCESS
// is only set when not already defined -- confirm against timemory
tim::set_env("OMNITRACE_PRELOAD", "0", 1);
tim::set_env("OMNITRACE_ROOT_PROCESS", process::get_id(), 0);
omnitrace_reset_preload_hidden();
OMNITRACE_BASIC_VERBOSE(0, "fork() called on PID %i (rank: %i), TID %li\n",
process::get_id(), dmp::rank(), threading::get_id());
OMNITRACE_BASIC_DEBUG(
"Warning! Calling fork() within an OpenMPI application using libfabric "
"may result is segmentation fault\n");
// backtrace of the fork() call site, conditional on get_debug_env()
TIMEMORY_CONDITIONAL_DEMANGLED_BACKTRACE(get_debug_env(), 16);
// suspend data collection across the fork
if(config::get_use_sampling()) sampling::block_samples();
omnitrace::categories::disable_categories(config::get_enabled_categories());
// prevent re-entry until post-fork routines have been called
prefork_lock = true;
// allow both post-fork handlers to run (once) for this fork
postfork_parent_lock = false;
postfork_child_lock = false;
}
// Post-fork handler for the parent process: re-enables the configured
// categories and, when sampling is in use, unblocks the samples that the
// pre-fork handler blocked. Executes at most once per fork.
void
postfork_parent()
{
    if(!postfork_parent_lock)
    {
        omnitrace::categories::enable_categories(config::get_enabled_categories());

        if(config::get_use_sampling())
        {
            sampling::unblock_samples();
        }

        // the next fork may run prefork_setup() again, whereas this handler
        // stays locked until prefork_setup() has been called
        prefork_lock         = false;
        postfork_parent_lock = true;
    }
}
// Post-fork handler for the child process: verifies that the process really is
// a child, switches the library off in the child (settings, sampling,
// categories, thread state), releases the perfetto session looked up via the
// parent PID, and installs exit handlers which quick-exit instead of running
// the regular cleanup. Executes at most once per fork.
void
postfork_child()
{
    if(!postfork_child_lock)
    {
        OMNITRACE_REQUIRE(is_child_process())
            << "Error! child process " << process::get_id()
            << " believes it is the root process " << get_root_process_id() << "\n";

        // disable the library and silence its output in the child
        settings::enabled() = false;
        settings::verbose() = -127;
        settings::debug()   = false;

        // stop data collection in the child
        omnitrace::sampling::shutdown();
        omnitrace::categories::shutdown();
        set_thread_state(::omnitrace::ThreadState::Disabled);

        omnitrace::get_perfetto_session(process::get_parent_id()).release();

        // exit handlers which bypass resource cleanup (see child_exit)
        on_exit(&child_exit, nullptr);
        std::atexit([]() { child_exit(EXIT_SUCCESS, nullptr); });

        // the next fork may run prefork_setup() again, whereas this handler
        // stays locked until prefork_setup() has been called
        prefork_lock        = false;
        postfork_child_lock = true;
    }
}
} // namespace
void
fork_gotcha::configure()
{
fork_gotcha_t::get_initializer() = []() {
TIMEMORY_C_GOTCHA(fork_gotcha_t, 0, fork);
};
// registering the pthread_atfork and gotcha means that we might execute twice
// handlers twice, hence the locks
pthread_atfork(&prefork_setup, &postfork_parent, &postfork_child);
}
// Wrapper executed in place of fork(): runs the pre-fork handler, invokes the
// real fork(), and then runs the post-fork handler matching the process we
// ended up in.
//
// @param _real_fork  pointer to the wrapped (real) fork function
// @return            the value returned by the real fork(): the child PID in the
//                    parent, 0 in the child, or a negative value on failure (in
//                    which case errno is left as set by the real fork())
pid_t
fork_gotcha::operator()(const gotcha_data_t&, pid_t (*_real_fork)()) const
{
    prefork_setup();

    const auto _pid = (*_real_fork)();

    // capture errno immediately: the logging and handlers below may overwrite it
    const bool _failed     = (_pid < 0);
    const int  _fork_errno = (_failed) ? errno : 0;

    if(_pid == 0)
    {
        postfork_child();
    }
    else
    {
        if(_failed)
        {
            // no child process was created; do not report a bogus child PID
            OMNITRACE_BASIC_VERBOSE(0, "fork() called on PID %i failed (errno: %i)\n",
                                    getpid(), _fork_errno);
        }
        else
        {
            OMNITRACE_BASIC_VERBOSE(0, "fork() called on PID %i created PID %i\n",
                                    getpid(), _pid);
        }
        // also executed on failure so that whatever prefork_setup() suspended
        // gets resumed in the calling process
        postfork_parent();
    }

    if(!settings::use_output_suffix())
    {
        OMNITRACE_BASIC_VERBOSE(
            0, "Application which make calls to fork() should enable using an process "
               "identifier output suffix (i.e. set OMNITRACE_USE_PID=ON)\n");
    }

    // hand the caller the error reported by the real fork()
    if(_failed) errno = _fork_errno;

    return _pid;
}
} // namespace component
} // namespace omnitrace