55f2dabbb3
- include/rocprofiler/agent.h
- move rocprofiler_dim3_t
- include/rocprofiler/buffer_tracing.h
- size fields
- update kernel dispatch record
- include/rocprofiler/callback_tracing.h
- remove rocprofiler_callback_tracing_code_object_unload_data_t
- remove rocprofiler_callback_tracing_code_object_register_host_kernel_symbol_data_t
- include/rocprofiler/fwd.h
- added ROCPROFILER_STATUS_ERROR_CONTEXT_CONFLICT
- remove ROCPROFILER_CALLBACK_TRACING_CODE_OBJECT_UNLOAD
- remove ROCPROFILER_CALLBACK_TRACING_CODE_OBJECT_DEVICE_KERNEL_SYMBOL_UNREGISTER
- add rocprofiler_kernel_id_t typedef
- add rocprofiler_dim3_t (moved from agent.h)
- lib/common/synchronized.hpp
- rlock/wlock return decltype(auto)
- separate prototype from definition
- lib/common/utility.{hpp,cpp}
- timestamp functions replicating HSA implementation(s)
- init_public_api_struct for setting size field and ensuring certain type traits
- simplified static_cleanup_wrapper
- separate prototype from definition in active_capacity_gate
- lib/rocprofiler/agent.cpp
- tweak get_rocprofiler_agent impl
- lib/rocprofiler/buffer.cpp
- fix buffer message log level
- lib/rocprofiler/context.cpp
- use new paradigm for getting active contexts
- lib/rocprofiler/internal_threading.hpp
- update to simplified static_cleanup_wrapper implementation
- lib/rocprofiler/registration.cpp
- fix deactivating contexts
- lib/rocprofiler/rocprofiler.cpp
- status string for context conflict
- lib/rocprofiler/context/context.*
- correlation_id struct
- new get_active_contexts paradigm
- lib/rocprofiler/counters/core.*
- rocprofiler_packet union
- tweak start/stop context to accept pointer instead of handle
- lib/rocprofiler/counters/dimensions.cpp
- update to new get_rocp_agent() return type
- lib/rocprofiler/hsa/hsa.*
- update to new get_active_contexts paradigm
- update to new correlation id implementation
- guard against hsa.def.cpp direct compilation
- lib/rocprofiler/hsa/queue_controller.*
- update to change in get_rocp_agent return type
- consistent aliases
- lookup function for getting queue pointer from hsa queue id
- lib/rocprofiler/hsa/queue.*
- rocprofiler_packet
- extend queue_info_session_t
- lib/rocprofiler/tests/registration.cpp
- improve diagnostic on perf check for rocprofiler_lib.callback_registration_lambda_with_result
152 خطوط
4.5 KiB
C++
152 خطوط
4.5 KiB
C++
// Copyright (c) 2023 Advanced Micro Devices, Inc.
|
|
//
|
|
// Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
// of this software and associated documentation files (the "Software"), to deal
|
|
// in the Software without restriction, including without limitation the rights
|
|
// to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
// copies of the Software, and to permit persons to whom the Software is
|
|
// furnished to do so, subject to the following conditions:
|
|
//
|
|
// The above copyright notice and this permission notice shall be included in
|
|
// all copies or substantial portions of the Software.
|
|
//
|
|
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
|
// AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
// OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
|
|
// THE SOFTWARE.
|
|
//
|
|
|
|
#include "lib/common/utility.hpp"
|
|
|
|
#include <glog/logging.h>
|
|
|
|
#include <unistd.h>
|
|
#include <cerrno>
|
|
#include <cstring>
|
|
#include <ctime>
|
|
#include <fstream>
|
|
#include <sstream>
|
|
#include <string>
|
|
#include <vector>
|
|
#include "lib/common/defines.hpp"
|
|
|
|
namespace rocprofiler
|
|
{
|
|
namespace common
|
|
{
|
|
namespace
|
|
{
|
|
// Translates a clock identifier into the spelling of the macro that names it.
//
// _id: clock identifier, e.g. CLOCK_MONOTONIC
//
// Returns the macro name as text (e.g. "CLOCK_MONOTONIC") for the identifiers listed in the
// switch below, and "CLOCK_UNKNOWN" for any other value.
std::string_view
get_clock_name(clockid_t _id)
{
// The case label and the returned string are generated from the same token so that the two
// can never drift apart.
#define CLOCK_NAME_CASE_STATEMENT(NAME)                                                            \
    case NAME: return #NAME;

    switch(_id)
    {
        CLOCK_NAME_CASE_STATEMENT(CLOCK_REALTIME)
        CLOCK_NAME_CASE_STATEMENT(CLOCK_MONOTONIC)
        CLOCK_NAME_CASE_STATEMENT(CLOCK_PROCESS_CPUTIME_ID)
        CLOCK_NAME_CASE_STATEMENT(CLOCK_THREAD_CPUTIME_ID)
        CLOCK_NAME_CASE_STATEMENT(CLOCK_MONOTONIC_RAW)
        CLOCK_NAME_CASE_STATEMENT(CLOCK_REALTIME_COARSE)
        CLOCK_NAME_CASE_STATEMENT(CLOCK_MONOTONIC_COARSE)
        CLOCK_NAME_CASE_STATEMENT(CLOCK_BOOTTIME)
        CLOCK_NAME_CASE_STATEMENT(CLOCK_REALTIME_ALARM)
        CLOCK_NAME_CASE_STATEMENT(CLOCK_BOOTTIME_ALARM)
        CLOCK_NAME_CASE_STATEMENT(CLOCK_TAI)
        default: break;
    }

// The helper is only meaningful inside this switch; do not let it leak into the rest of the
// translation unit.
#undef CLOCK_NAME_CASE_STATEMENT

    return "CLOCK_UNKNOWN";
}
|
|
} // namespace
|
|
|
|
// Selects a clock id based on the release string reported by uname().
//
// Returns CLOCK_MONOTONIC_RAW when uname() succeeds and the release string parses as
// "<major><separator><minor>..." with a version of 4.4 or newer. Returns CLOCK_MONOTONIC
// in every other case: uname() failed, the release string could not be parsed, or the
// version is older than 4.4.
clockid_t
get_accurate_clock_id_impl()
{
    utsname sys_info;
    if(uname(&sys_info) != 0) return CLOCK_MONOTONIC;

    try
    {
        const std::string release(sys_info.release);

        // major_len receives the number of characters consumed by the major version
        size_t    major_len = 0;
        const int major_ver = std::stoi(release, &major_len);
        // skip the single separator character that follows the major version
        const int minor_ver = std::stoi(release.substr(major_len + 1));

        const bool is_4_4_or_newer = (major_ver > 4) || (major_ver == 4 && minor_ver >= 4);
        if(is_4_4_or_newer) return CLOCK_MONOTONIC_RAW;
    } catch(...)
    {
        // The release string does not follow the expected pattern (std::stoi or substr
        // threw); deliberately fall through to the "safe" (non-RAW) clock.
    }

    return CLOCK_MONOTONIC;
}
|
|
|
|
uint64_t
|
|
get_clock_freq_ns_impl(clockid_t _clk_id)
|
|
{
|
|
constexpr auto nanosec = std::nano::den;
|
|
|
|
struct timespec ts;
|
|
auto ret = clock_getres(_clk_id, &ts);
|
|
|
|
if(ROCPROFILER_UNLIKELY(ret != 0))
|
|
{
|
|
auto _err = errno;
|
|
LOG(FATAL) << "error getting clock resolution for " << get_clock_name(_clk_id) << ": "
|
|
<< strerror(_err);
|
|
}
|
|
else if(ROCPROFILER_UNLIKELY(ts.tv_sec != 0 ||
|
|
ts.tv_nsec >= std::numeric_limits<uint32_t>::max()))
|
|
{
|
|
LOG(FATAL) << "clock_getres(" << get_clock_name(_clk_id)
|
|
<< ") returned very low frequency (<1Hz)";
|
|
}
|
|
|
|
auto&& _period =
|
|
(static_cast<uint64_t>(ts.tv_sec) * nanosec) + static_cast<uint64_t>(ts.tv_nsec);
|
|
return nanosec / _period;
|
|
}
|
|
|
|
// Reads the command line of a process from /proc/<pid>/cmdline.
//
// _pid: id of the process whose command line is requested
//
// Returns one string per NUL-delimited entry of the file, in file order. The result is empty
// when the file cannot be opened or contains no data.
//
// Entries are extracted verbatim: whitespace inside an argument is preserved, and a final
// entry that is not followed by a NUL byte is still returned.
std::vector<std::string>
read_command_line(pid_t _pid)
{
    auto _cmdline = std::vector<std::string>{};

    const auto _path = std::string("/proc/") + std::to_string(_pid) + "/cmdline";
    auto       ifs   = std::ifstream{_path};
    if(!ifs) return _cmdline;

    // std::getline with an explicit delimiter is an unformatted read, so no characters are
    // skipped. (Extracting single chars with operator>> would drop every space, tab, and
    // newline contained in an argument.)
    for(std::string _arg; std::getline(ifs, _arg, '\0');)
    {
        _cmdline.push_back(_arg);
    }

    return _cmdline;
}
|
|
} // namespace common
|
|
} // namespace rocprofiler
|