// MIT License // // Copyright (c) 2022 Advanced Micro Devices, Inc. All Rights Reserved. // // Permission is hereby granted, free of charge, to any person obtaining a copy // of this software and associated documentation files (the "Software"), to deal // in the Software without restriction, including without limitation the rights // to use, copy, modify, merge, publish, distribute, sublicense, and/or sell // copies of the Software, and to permit persons to whom the Software is // furnished to do so, subject to the following conditions: // // The above copyright notice and this permission notice shall be included in all // copies or substantial portions of the Software. // // THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR // IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, // FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE // AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER // LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, // OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE // SOFTWARE. #include "libpyomnitrace.hpp" #include "dl.hpp" #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include namespace pyomnitrace { namespace pyprofile { py::module generate(py::module& _pymod); } } // namespace pyomnitrace PYBIND11_MODULE(libpyomnitrace, omni) { using namespace pyomnitrace; static bool _is_initialized = false; static bool _is_finalized = false; static auto _get_use_mpi = []() { bool _use_mpi = false; try { py::module::import("mpi4py"); _use_mpi = true; } catch(py::error_already_set& _exc) { if(!_exc.matches(PyExc_ImportError)) throw; } return _use_mpi; }; omni.def( "is_initialized", []() { return _is_initialized; }, "Initialization state"); omni.def( "is_finalized", []() { return _is_finalized; }, "Finalization state"); omni.def( "initialize", [](const std::string& _v) { if(_is_initialized) throw std::runtime_error("Error! omnitrace is already initialized"); _is_initialized = true; omnitrace_set_mpi(_get_use_mpi(), false); omnitrace_init("trace", false, _v.c_str()); }, "Initialize omnitrace"); omni.def( "initialize", [](const py::list& _v) { if(_is_initialized) throw std::runtime_error("Error! omnitrace is already initialized"); _is_initialized = true; omnitrace_set_mpi(_get_use_mpi(), false); std::string _cmd = {}; std::string _cmd_line = {}; for(auto&& itr : _v) { if(_cmd.empty()) _cmd = itr.cast(); _cmd_line += " " + itr.cast(); } if(!_cmd_line.empty()) { _cmd_line.substr(_cmd_line.find_first_not_of(' ')); tim::set_env("OMNITRACE_COMMAND_LINE", _cmd_line, 0); } omnitrace_init("trace", false, _cmd.c_str()); }, "Initialize omnitrace"); omni.def( "initialize", [](const std::string& _v) { if(_is_initialized) throw std::runtime_error("Error! omnitrace is already initialized"); _is_initialized = true; bool _use_mpi = false; try { py::module::import("mpi4py"); _use_mpi = true; } catch(py::error_already_set& _exc) { if(!_exc.matches(PyExc_ImportError)) throw; } omnitrace_set_mpi(_use_mpi, false); omnitrace_init("trace", false, _v.c_str()); }, "Initialize omnitrace"); omni.def( "finalize", []() { if(_is_finalized) throw std::runtime_error("Error! omnitrace is already finalized"); _is_finalized = true; omnitrace_finalize(); }, "Initialize omnitrace"); py::doc("omnitrace profiler for python"); pyprofile::generate(omni); } //======================================================================================// // namespace pyomnitrace { namespace pyprofile { // using profiler_t = std::function; using profiler_vec_t = std::vector; using profiler_label_map_t = std::unordered_map; using profiler_index_map_t = std::unordered_map; using strset_t = std::unordered_set; // namespace { strset_t default_exclude_functions = { "^<.*>$" }; strset_t default_exclude_filenames = { "(encoder|decoder|threading).py$", "^<.*>$" }; } // namespace // struct config { bool is_running = false; bool trace_c = false; bool include_internal = false; bool include_args = false; bool include_line = false; bool include_filename = false; bool full_filepath = false; int32_t ignore_stack_depth = 0; int32_t base_stack_depth = -1; int32_t verbose = 0; int64_t depth_tracker = 0; std::string base_module_path = {}; strset_t restrict_functions = {}; strset_t restrict_filenames = {}; strset_t include_functions = {}; strset_t include_filenames = {}; strset_t exclude_functions = default_exclude_functions; strset_t exclude_filenames = default_exclude_filenames; std::vector records = {}; }; // inline config& get_config() { static auto* _instance = new config{}; static thread_local auto* _tl_instance = []() { static std::atomic _count{ 0 }; auto _cnt = _count++; if(_cnt == 0) return _instance; auto* _tmp = new config{}; _tmp->is_running = _instance->is_running; _tmp->trace_c = _instance->trace_c; _tmp->include_internal = _instance->include_internal; _tmp->include_args = _instance->include_args; _tmp->include_line = _instance->include_line; _tmp->include_filename = _instance->include_filename; _tmp->full_filepath = _instance->full_filepath; _tmp->base_module_path = _instance->base_module_path; _tmp->restrict_functions = _instance->restrict_functions; _tmp->restrict_filenames = _instance->restrict_filenames; _tmp->include_functions = _instance->include_functions; _tmp->include_filenames = _instance->include_filenames; _tmp->exclude_functions = _instance->exclude_functions; _tmp->exclude_filenames = _instance->exclude_filenames; _tmp->verbose = _instance->verbose; // if full filepath is specified, include filename is implied if(_tmp->full_filepath && !_tmp->include_filename) _tmp->include_filename = true; return _tmp; }(); return *_tl_instance; } // int32_t get_depth(PyFrameObject* frame) { return (frame->f_back) ? (get_depth(frame->f_back) + 1) : 0; } // void profiler_function(py::object pframe, const char* swhat, py::object arg) { static thread_local auto& _config = get_config(); static thread_local auto _disable = false; if(_disable) return; _disable = true; tim::scope::destructor _dtor{ []() { _disable= false; } }; (void) _dtor; if(pframe.is_none() || pframe.ptr() == nullptr) return; static auto _omnitrace_path = _config.base_module_path; auto* frame = reinterpret_cast(pframe.ptr()); int what = (strcmp(swhat, "call") == 0) ? PyTrace_CALL : (strcmp(swhat, "c_call") == 0) ? PyTrace_C_CALL : (strcmp(swhat, "return") == 0) ? PyTrace_RETURN : (strcmp(swhat, "c_return") == 0) ? PyTrace_C_RETURN : -1; // only support PyTrace_{CALL,C_CALL,RETURN,C_RETURN} if(what < 0) { if(_config.verbose > 2) TIMEMORY_PRINT_HERE("%s :: %s", "Ignoring what != {CALL,C_CALL,RETURN,C_RETURN}", swhat); return; } auto _update_ignore_stack_depth = [what]() { switch(what) { case PyTrace_CALL: ++_config.ignore_stack_depth; break; case PyTrace_RETURN: --_config.ignore_stack_depth; break; default: break; } }; if(_config.ignore_stack_depth > 0) { if(_config.verbose > 2) TIMEMORY_PRINT_HERE("%s :: %s :: %u", "Ignoring call/return", swhat, _config.ignore_stack_depth); _update_ignore_stack_depth(); return; } else if(_config.ignore_stack_depth < 0) { TIMEMORY_PRINT_HERE("WARNING! ignore_stack_depth is < 0 :: ", _config.ignore_stack_depth); } // if PyTrace_C_{CALL,RETURN} is not enabled if(!_config.trace_c && (what == PyTrace_C_CALL || what == PyTrace_C_RETURN)) { if(_config.verbose > 2) TIMEMORY_PRINT_HERE("%s :: %s", "Ignoring C call/return", swhat); return; } // get the arguments auto _get_args = [&]() { auto inspect = py::module::import("inspect"); try { return py::cast( inspect.attr("formatargvalues")(*inspect.attr("getargvalues")(pframe))); } catch(py::error_already_set& _exc) { TIMEMORY_CONDITIONAL_PRINT_HERE(_config.verbose > 1, "Error! %s", _exc.what()); if(!_exc.matches(PyExc_AttributeError)) throw; } return std::string{}; }; // get the final label auto _get_label = [&](auto& _func, auto& _filename, auto& _fullpath) { auto _bracket = _config.include_filename; if(_bracket) _func.insert(0, "["); // append the arguments if(_config.include_args) _func.append(_get_args()); if(_bracket) _func.append("]"); // append the filename if(_config.include_filename) { if(_config.full_filepath) _func.append(TIMEMORY_JOIN("", '[', std::move(_fullpath))); else _func.append(TIMEMORY_JOIN("", '[', std::move(_filename))); } // append the line number if(_config.include_line && _config.include_filename) _func.append(TIMEMORY_JOIN("", ':', frame->f_lineno, ']')); else if(_config.include_line) _func.append(TIMEMORY_JOIN("", ':', frame->f_lineno)); else if(_config.include_filename) _func += "]"; return _func; }; auto _find_matching = [](const strset_t& _expr, const std::string& _name) { const auto _rconstants = std::regex_constants::egrep | std::regex_constants::optimize; for(const auto& itr : _expr) // NOLINT { if(std::regex_search(_name, std::regex(itr, _rconstants))) return true; } return false; }; bool _force = false; auto& _only_funcs = _config.restrict_functions; auto& _incl_funcs = _config.include_functions; auto& _skip_funcs = _config.exclude_functions; auto _func = py::cast(frame->f_code->co_name); if(!_only_funcs.empty()) { _force = _find_matching(_only_funcs, _func); if(!_force) { if(_config.verbose > 2) TIMEMORY_PRINT_HERE("Skipping non-restricted function: %s", _func.c_str()); return; } } if(!_force) { if(_find_matching(_incl_funcs, _func)) { _force = true; } else if(_find_matching(_skip_funcs, _func)) { if(_config.verbose > 1) TIMEMORY_PRINT_HERE("Skipping designated function: '%s'", _func.c_str()); if(!_find_matching(default_exclude_functions, _func)) _update_ignore_stack_depth(); return; } } auto& _only_files = _config.restrict_filenames; auto& _incl_files = _config.include_filenames; auto& _skip_files = _config.exclude_filenames; auto _full = py::cast(frame->f_code->co_filename); auto _file = (_full.find('/') != std::string::npos) ? _full.substr(_full.find_last_of('/') + 1) : _full; if(!_config.include_internal && strncmp(_full.c_str(), _omnitrace_path.c_str(), _omnitrace_path.length()) == 0) { if(_config.verbose > 2) TIMEMORY_PRINT_HERE("Skipping internal function: %s", _func.c_str()); return; } if(!_force && !_only_files.empty()) { _force = _find_matching(_only_files, _full); if(!_force) { if(_config.verbose > 2) TIMEMORY_PRINT_HERE("Skipping non-restricted file: %s", _full.c_str()); return; } } if(!_force) { if(_find_matching(_incl_files, _full)) { _force = true; } else if(_find_matching(_skip_files, _full)) { if(_config.verbose > 2) TIMEMORY_PRINT_HERE("Skipping non-included file: %s", _full.c_str()); return; } } TIMEMORY_CONDITIONAL_PRINT_HERE(_config.verbose > 3, "%8s | %s%s | %s | %s", swhat, _func.c_str(), _get_args().c_str(), _file.c_str(), _full.c_str()); auto _label = _get_label(_func, _file, _full); if(_label.empty()) return; static thread_local strset_t _labels{}; const auto& _label_ref = *_labels.emplace(_label).first; // start function auto _profiler_call = [&]() { _config.records.emplace_back( [&_label_ref]() { omnitrace_pop_region(_label_ref.c_str()); }); omnitrace_push_region(_label_ref.c_str()); }; // stop function auto _profiler_return = [&]() { _config.records.back()(); _config.records.pop_back(); }; // process what switch(what) { case PyTrace_CALL: case PyTrace_C_CALL: _profiler_call(); break; case PyTrace_RETURN: case PyTrace_C_RETURN: _profiler_return(); break; default: break; } // don't do anything with arg tim::consume_parameters(arg); } // py::module generate(py::module& _pymod) { py::module _prof = _pymod.def_submodule("profiler", "Profiling functions"); auto _init = []() { try { auto _file = py::module::import("omnitrace").attr("__file__").cast(); if(_file.find('/') != std::string::npos) _file = _file.substr(0, _file.find_last_of('/')); get_config().base_module_path = _file; } catch(py::cast_error& e) { std::cerr << "[profiler_init]> " << e.what() << std::endl; } if(get_config().is_running) return; get_config().records.clear(); get_config().base_stack_depth = -1; get_config().is_running = true; }; auto _fini = []() { if(!get_config().is_running) return; get_config().is_running = false; get_config().base_stack_depth = -1; get_config().records.clear(); }; _prof.def("profiler_function", &profiler_function, "Profiling function"); _prof.def("profiler_init", _init, "Initialize the profiler"); _prof.def("profiler_finalize", _fini, "Finalize the profiler"); py::class_ _pyconfig(_prof, "config", "Profiler configuration"); #define CONFIGURATION_PROPERTY(NAME, TYPE, DOC, ...) \ _pyconfig.def_property_static( \ NAME, [](py::object&&) { return __VA_ARGS__; }, \ [](py::object&&, TYPE val) { __VA_ARGS__ = val; }, DOC); CONFIGURATION_PROPERTY("_is_running", bool, "Profiler is currently running", get_config().is_running) CONFIGURATION_PROPERTY("trace_c", bool, "Enable tracing C functions", get_config().trace_c) CONFIGURATION_PROPERTY("include_internal", bool, "Include functions within timemory", get_config().include_internal) CONFIGURATION_PROPERTY("include_args", bool, "Encode the function arguments", get_config().include_args) CONFIGURATION_PROPERTY("include_line", bool, "Encode the function line number", get_config().include_line) CONFIGURATION_PROPERTY("include_filename", bool, "Encode the function filename (see also: full_filepath)", get_config().include_filename) CONFIGURATION_PROPERTY("full_filepath", bool, "Display the full filepath (instead of file basename)", get_config().full_filepath) CONFIGURATION_PROPERTY("verbosity", int32_t, "Verbosity of the logging", get_config().verbose) static auto _get_strset = [](const strset_t& _targ) { auto _out = py::list{}; for(auto itr : _targ) _out.append(itr); return _out; }; static auto _set_strset = [](const py::list& _inp, strset_t& _targ) { for(const auto& itr : _inp) _targ.insert(itr.cast()); }; #define CONFIGURATION_PROPERTY_LAMBDA(NAME, DOC, GET, SET) \ _pyconfig.def_property_static(NAME, GET, SET, DOC); #define CONFIGURATION_STRSET(NAME, DOC, ...) \ { \ auto GET = [](py::object&&) { return _get_strset(__VA_ARGS__); }; \ auto SET = [](py::object&&, const py::list& val) { \ _set_strset(val, __VA_ARGS__); \ }; \ CONFIGURATION_PROPERTY_LAMBDA(NAME, DOC, GET, SET) \ } CONFIGURATION_STRSET("restrict_functions", "Function regexes to collect exclusively", get_config().restrict_functions) CONFIGURATION_STRSET("restrict_modules", "Filename regexes to collect exclusively", get_config().restrict_filenames) CONFIGURATION_STRSET("include_functions", "Function regexes to always include in collection", get_config().include_functions) CONFIGURATION_STRSET("include_modules", "Filename regexes to always include in collection", get_config().include_filenames) CONFIGURATION_STRSET("exclude_functions", "Function regexes to filter out of collection", get_config().exclude_functions) CONFIGURATION_STRSET("exclude_modules", "Filename regexes to filter out of collection", get_config().exclude_filenames) return _prof; } } // namespace pyprofile } // namespace pyomnitrace // //======================================================================================//