7bc50f5a0a
* Fix roctracer_flush_activity
- invoke roctracer_flush_activity() before disabling domains
* create comp::roctracer::flush()
- real issue was the global state when roctracer_flush_activity() was called
* formatting
* Update lib/omnitrace/library/components/roctracer.hpp
- provide definition of comp::roctracer::flush when OMNITRACE_USE_ROCTRACER is not defined
* omnitrace.cfg -> perfetto.cfg
- rename provided perfetto config file (omnitrace.cfg) to perfetto.cfg to avoid confusion
* Update lib/core
- gpu.hpp: defines for OMNITRACE_USE_{HIP,ROCTRACER,ROCPROFILER,ROCM_SMI}
- gpu.cpp
- include core/hip_runtime.hpp
- fix serialization of hipDeviceProp_t
- add hip_runtime.hpp
- ensure proper inclusion of hip_runtime.h
- add rccl.hpp
- ensure proper inclusion of rccl.h
* Update lib/omnitrace/library
- rcclp.cpp
- update includes for rccl
- roctracer.hpp
- update includes for hip_runtime
- components/comm_data.hpp
- update includes for rccl
- components/rcclp.hpp
- update includes for rccl
* Update bin/omnitrace-avail/avail.cpp
- update includes for hip_runtime
* Update examples/rccl/CMakeLists.txt
- fix find_package for rccl when CI enabled
* Update CMakeLists.txt
- set cmake policy CMP0135 to NEW for cmake >= 3.24
- Enable DOWNLOAD_EXTRACT_TIMESTAMP with ExternalProject_Add + URL download method
* Update timemory submodule
* Update pybind11 submodule
* Update pybind11 submodule
* Update lib/core/rccl.hpp
- include rccl.h only if OMNITRACE_USE_RCCL > 0
* Update lib/core/{gpu,hip_runtime}.hpp
* Update lib/core/gpu.cpp
- reintroduce some ppdefs
* Update lib/core/gpu.cpp
- fix ifdef on OMNITRACE_HIP_VERSION
* Update lib/core/gpu.cpp
- fix static assert for OMNITRACE_HIP_VERSION_MINOR when the HIP version is 4.x or older (minor versions are unreliable)
* Update lib/core/gpu.cpp
- fix ifdef on OMNITRACE_HIP_VERSION
* Update lib/core/config.cpp
- disable OMNITRACE_PERFETTO_COMBINE_TRACES by default
* Update lib/core/perfetto.cpp
- if unable to open the perfetto temp file, return the result of ReadTraceBlocking()
* Update lib/core/config.*
- flush tmpfile before closing
90 γραμμές
3.2 KiB
C++
90 γραμμές
3.2 KiB
C++
// MIT License
|
|
//
|
|
// Copyright (c) 2022 Advanced Micro Devices, Inc. All Rights Reserved.
|
|
//
|
|
// Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
// of this software and associated documentation files (the "Software"), to deal
|
|
// in the Software without restriction, including without limitation the rights
|
|
// to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
// copies of the Software, and to permit persons to whom the Software is
|
|
// furnished to do so, subject to the following conditions:
|
|
//
|
|
// The above copyright notice and this permission notice shall be included in all
|
|
// copies or substantial portions of the Software.
|
|
//
|
|
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
|
// AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
// OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
|
|
// SOFTWARE.
|
|
|
|
#pragma once
|
|
|
|
#include "core/config.hpp"
|
|
#include "core/debug.hpp"
|
|
#include "core/hip_runtime.hpp"
|
|
#include "core/perfetto.hpp"
|
|
#include "library/components/roctracer.hpp"
|
|
#include "library/ptl.hpp"
|
|
|
|
#include <iostream>
|
|
#include <memory>
|
|
|
|
// Macro to check the status of a ROC-tracer call.
//
// The stringified call is first handed to OMNITRACE_DEBUG_F, then `call` is
// evaluated exactly once. If it yields a non-zero status, the text returned by
// roctracer_error_string() is printed together with the call text through
// OMNITRACE_PRINT_F. The status is not propagated to the caller: execution
// simply continues after the message has been printed.
//
// The body is wrapped in do { ... } while(0) so the macro expands to a single
// statement and is safe inside an unbraced if/else; always invoke it with a
// trailing semicolon. The local status variable has a macro-specific name so it
// cannot shadow an identifier (e.g. `err`) that appears inside `call`.
#define OMNITRACE_ROCTRACER_CALL(call)                                                   \
    do                                                                                   \
    {                                                                                    \
        OMNITRACE_DEBUG_F(#call);                                                        \
        const int omnitrace_roctracer_call_status_ = (call);                             \
        if(omnitrace_roctracer_call_status_ != 0)                                        \
        {                                                                                \
            OMNITRACE_PRINT_F("%s in: %s\n", roctracer_error_string(), #call);           \
        }                                                                                \
    } while(0)
|
|
|
|
namespace omnitrace
|
|
{
|
|
using roctracer_hip_bundle_t =
|
|
tim::component_bundle<category::rocm_hip, comp::roctracer_data, comp::wall_clock>;
|
|
using roctracer_hsa_bundle_t =
|
|
tim::component_bundle<category::rocm_hsa, comp::roctracer_data>;
|
|
using roctracer_functions_t = std::vector<std::pair<std::string, std::function<void()>>>;
|
|
|
|
// HSA API callback function
|
|
void
|
|
hsa_api_callback(uint32_t domain, uint32_t cid, const void* callback_data, void* arg);
|
|
|
|
void
|
|
hsa_activity_callback(uint32_t op, const void* record, void* arg);
|
|
|
|
void
|
|
hip_exec_activity_callbacks(int64_t _tid);
|
|
|
|
// HIP API callback function
|
|
void
|
|
hip_api_callback(uint32_t domain, uint32_t cid, const void* callback_data, void* arg);
|
|
|
|
void
|
|
roctx_api_callback(uint32_t domain, uint32_t cid, const void* callback_data, void* arg);
|
|
|
|
// Activity tracing callback
|
|
void
|
|
hip_activity_callback(const char* begin, const char* end, void*);
|
|
|
|
bool&
|
|
roctracer_is_init();
|
|
|
|
bool&
|
|
roctracer_is_setup();
|
|
|
|
int64_t
|
|
get_clock_skew();
|
|
|
|
roctracer_functions_t&
|
|
roctracer_setup_routines();
|
|
|
|
roctracer_functions_t&
|
|
roctracer_shutdown_routines();
|
|
} // namespace omnitrace
|