// MIT License
//
// Copyright (c) 2022-2025 Advanced Micro Devices, Inc. All Rights Reserved.
//
// Permission is hereby granted, free of charge, to any person obtaining a copy
// of this software and associated documentation files (the "Software"), to deal
// in the Software without restriction, including without limitation the rights
// to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
// copies of the Software, and to permit persons to whom the Software is
// furnished to do so, subject to the following conditions:
//
// The above copyright notice and this permission notice shall be included in all
// copies or substantial portions of the Software.
//
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
// AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
// OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
// SOFTWARE.
#include "library/ptl.hpp"
#include "core/config.hpp"
#include "core/defines.hpp"
#include "core/state.hpp"
2022-05-08 04:40:10 -05:00
#include "library/runtime.hpp"
2022-02-08 17:42:17 -06:00
#include "library/sampling.hpp"
2022-08-31 01:24:31 -05:00
#include "library/thread_data.hpp"
#include "library/thread_info.hpp"
#include <PTL/ThreadPool.hh>
#include <PTL/UserTaskQueue.hh>
2022-05-08 04:40:10 -05:00
#include "logger/debug.hpp"
2022-08-08 08:37:37 -05:00
#include <timemory/backends/threading.hpp>
#include <timemory/utility/declaration.hpp>
namespace rocprofsys
{
namespace tasking
{
namespace
{
auto _thread_pool_cfg = []() {
2022-08-31 01:24:31 -05:00
int64_t _nthreads = 0;
if(config::settings_are_configured())
{
_nthreads = config::get_thread_pool_size();
}
else
{
const int64_t _max_threads = std::thread::hardware_concurrency() / 2;
const int64_t _min_threads = 1;
_nthreads = get_env<int64_t>("ROCPROFSYS_THREAD_POOL_SIZE", -1, false);
2022-08-31 01:24:31 -05:00
if(_nthreads == -1)
{
_nthreads = 4;
if(_nthreads > _max_threads) _nthreads = _max_threads;
if(_nthreads < _min_threads) _nthreads = _min_threads;
tim::set_env("ROCPROFSYS_THREAD_POOL_SIZE", _nthreads, 0);
2022-08-31 01:24:31 -05:00
}
}
static char buffer[sizeof(PTL::UserTaskQueue)];
static auto* _task_queue = new((void*) buffer) PTL::UserTaskQueue(_nthreads);
PTL::ThreadPool::Config _v{};
_v.init = true;
_v.use_affinity = false;
_v.use_tbb = false;
2022-03-22 15:51:57 -05:00
_v.verbose = -1;
2022-02-08 17:42:17 -06:00
_v.initializer = []() {
rocprofsys::thread_info::init(true);
tim::threading::set_thread_name(
fmt::format("ptl.{}", PTL::Threading::GetThreadId()).c_str());
rocprofsys::set_thread_state(rocprofsys::ThreadState::Disabled);
rocprofsys::sampling::block_signals();
2022-02-08 17:42:17 -06:00
};
_v.finalizer = []() {};
_v.priority = 5;
_v.pool_size = _nthreads;
_v.task_queue = _task_queue;
2022-08-31 01:24:31 -05:00
return _v;
};
// Lifecycle state of the rocprof-sys thread pool. Starts as State::PreInit and is
// handed out by reference so that callers can both inspect and update it.
auto&
get_thread_pool_state()
{
    static auto _pool_state = State::PreInit;
    return _pool_state;
}
// Returns the process-wide PTL thread pool, creating it on first use.
// The pool state is switched to State::Active immediately before the pool is
// constructed. The pool is heap-allocated and never deleted here.
PTL::ThreadPool&
get_thread_pool()
{
    static auto  _pool_config = _thread_pool_cfg();
    static auto* _pool        = []() {
        get_thread_pool_state() = State::Active;
        return new PTL::ThreadPool{ _pool_config };
    }();
    return *_pool;
}
2022-08-31 01:24:31 -05:00
} // namespace
2023-01-24 18:53:23 -06:00
namespace general
{
namespace
{
// Lifecycle state associated with the "general" task groups. Starts as
// State::PreInit and is handed out by reference so callers can read and modify it.
auto&
get_thread_pool_state()
{
    static auto _general_state = State::PreInit;
    return _general_state;
}
} // namespace
} // namespace general
2022-04-26 22:08:51 -05:00
void
setup()
2022-09-26 07:52:14 -05:00
{
ROCPROFSYS_SCOPED_THREAD_STATE(ThreadState::Internal);
ROCPROFSYS_SCOPED_SAMPLING_ON_CHILD_THREADS(false);
2022-09-26 07:52:14 -05:00
(void) get_thread_pool();
}
2022-04-26 22:08:51 -05:00
void
join()
{
2023-01-24 18:53:23 -06:00
if(general::get_thread_pool_state() == State::Active)
{
LOG_DEBUG("waiting for all general tasks to complete...");
2023-10-16 18:04:47 -05:00
for(size_t i = 0; i < thread_info::get_peak_num_threads(); ++i)
2023-01-24 18:53:23 -06:00
general::get_task_group(i).join();
}
2022-04-26 22:08:51 -05:00
}
void
shutdown()
{
2023-01-24 18:53:23 -06:00
if(general::get_thread_pool_state() == State::Active)
{
LOG_DEBUG("Waiting on completion of general tasks...");
2023-10-16 18:04:47 -05:00
for(size_t i = 0; i < thread_info::get_peak_num_threads(); ++i)
2023-01-24 18:53:23 -06:00
{
general::get_task_group(i).join();
general::get_task_group(i).clear();
general::get_task_group(i).set_pool(nullptr);
}
general::get_thread_pool_state() = State::Finalized;
}
2022-08-31 01:24:31 -05:00
if(get_thread_pool_state() == State::Active)
{
LOG_DEBUG("Destroying the rocprof-sys thread pool...");
2022-08-31 01:24:31 -05:00
get_thread_pool().destroy_threadpool();
get_thread_pool_state() = State::Finalized;
}
2022-10-31 15:39:45 -05:00
else
{
LOG_DEBUG("thread-pool is not active...");
2022-10-31 15:39:45 -05:00
}
}
2022-08-31 01:24:31 -05:00
size_t
initialize_threadpool(size_t _v)
{
2022-08-31 01:24:31 -05:00
return get_thread_pool().initialize_threadpool(_v);
}
2023-01-24 18:53:23 -06:00
// Returns the calling thread's "general" task group, which is bound to the
// rocprof-sys thread pool.
//
// @param _tid  thread index forwarded to construct_on_thread when the task group is
//              first requested on the calling thread.
// @return      reference to the task group cached for the calling thread.
//
// NOTE: the result is cached in a `static thread_local` reference, so `_tid` is only
// consulted by the first call made on a given thread; later calls on that thread
// return the same task group regardless of the value passed.
PTL::TaskGroup<void>&
general::get_task_group(int64_t _tid)
{
    struct local
    {};
    using thread_data_t = thread_data<PTL::TaskGroup<void>, local>;

    static thread_local auto& _v =
        thread_data_t::instance(construct_on_thread{ _tid }, &tasking::get_thread_pool());

    // Record that general task groups exist. Without this the general state never
    // leaves State::PreInit, so the State::Active checks in join() and shutdown()
    // never pass and the groups are not joined/cleared before the pool is destroyed.
    // A function-local static is used (as in get_thread_pool()) so the assignment
    // happens exactly once and the state is not re-activated after shutdown().
    static const bool _activated =
        (general::get_thread_pool_state() = State::Active, true);
    (void) _activated;

    return *_v;
}
} // namespace tasking
} // namespace rocprofsys