rocprofv3: rocprofv3-avail tool (#15)

* support avail tool

Updating avail library and script

Listing on Std output incase the output folder is not given

Extending list metrics test

misc fix

misc fix

fixing memory leak

changing list-metrics to list-avail

fixing formatting issue

Fixing CMakeLists

Add test for list avil with trace

Fix test fail

clang tidy errors fixed

Removing build commands for rocprofv3-trigger-list

Addressing review changes

addressing review comment

moving avail to libexec

merge fix

Fix test failures

updating doc

Fix doc error

* updating legacy doc

* fix formatting issue

* Addressing review comments
This commit is contained in:
Nagaraj, Sriraksha
2024-12-04 18:34:10 -06:00
zatwierdzone przez GitHub
rodzic 50b185b9ac
commit c42bdc3128
16 zmienionych plików z 933 dodań i 257 usunięć
+3 -2
Wyświetl plik
@@ -100,8 +100,9 @@ Full documentation for ROCprofiler-SDK is available at [rocm.docs.amd.com/projec
- `Dispatch_Id`
- CSV column for counter collection
## ROCprofiler-SDK 0.5.0 for ROCm release 6.3 (AFAR VII)
### Additions
--List supported PC Sampling Configurations
### Changes
### Added
+10
Wyświetl plik
@@ -14,3 +14,13 @@ install(
PERMISSIONS OWNER_READ OWNER_WRITE OWNER_EXECUTE GROUP_READ GROUP_EXECUTE WORLD_READ
WORLD_EXECUTE
COMPONENT tools)
configure_file(rocprofv3_avail.py
${PROJECT_BINARY_DIR}/${CMAKE_INSTALL_BINDIR}/rocprofv3_avail COPYONLY)
install(
FILES ${PROJECT_BINARY_DIR}/${CMAKE_INSTALL_BINDIR}/rocprofv3_avail
DESTINATION ${CMAKE_INSTALL_BINDIR}
PERMISSIONS OWNER_READ OWNER_WRITE OWNER_EXECUTE GROUP_READ GROUP_EXECUTE WORLD_READ
WORLD_EXECUTE
COMPONENT tools)
+18 -8
Wyświetl plik
@@ -412,8 +412,8 @@ For MPI applications (or other job launchers such as SLURM), place rocprofv3 ins
add_parser_bool_argument(
display_options,
"-L",
"--list-metrics",
help="List metrics for counter collection. Backed by a valid YAML file. In earlier rocprof versions, this was known as --list-basic, --list-derived and --list-counters",
"--list-avail",
help="List available PC sampling configurations and metrics for counter collection. Backed by a valid YAML file. In earlier rocprof versions, this was known as --list-basic, --list-derived and --list-counters",
)
advanced_options = parser.add_argument_group("Advanced options")
@@ -678,9 +678,14 @@ def run(app_args, args, **kwargs):
ROCPROF_KOKKOSP_LIBRARY = (
f"{ROCM_DIR}/lib/rocprofiler-sdk/librocprofiler-sdk-tool-kokkosp.so"
)
ROCPROF_LIST_AVAIL_TOOL_LIBRARY = f"{ROCM_DIR}/libexec/librocprofv3-list-avail.so"
prepend_preload = [itr for itr in args.preload if itr]
append_preload = [ROCPROF_TOOL_LIBRARY, ROCPROF_SDK_LIBRARY]
append_preload = [
ROCPROF_TOOL_LIBRARY,
ROCPROF_LIST_AVAIL_TOOL_LIBRARY,
ROCPROF_SDK_LIBRARY,
]
update_env("LD_PRELOAD", ":".join(prepend_preload), prepend=True)
update_env("LD_PRELOAD", ":".join(append_preload), append=True)
@@ -709,7 +714,7 @@ def run(app_args, args, **kwargs):
)
if args.output_file is not None or args.output_directory is not None:
update_env("ROCPROF_OUTPUT_LIST_METRICS_FILE", True)
update_env("ROCPROF_OUTPUT_LIST_AVAIL_FILE", True)
if not args.output_format:
args.output_format = ["csv"]
@@ -841,8 +846,8 @@ def run(app_args, args, **kwargs):
overwrite_if_true=True,
)
update_env(
"ROCPROF_LIST_METRICS",
args.list_metrics,
"ROCPROF_LIST_AVAIL",
args.list_avail,
overwrite_if_true=True,
)
@@ -891,8 +896,13 @@ def run(app_args, args, **kwargs):
sys.stderr.write("\n")
sys.stderr.flush()
if args.list_metrics:
app_args = [f"{ROCM_DIR}/libexec/rocprofv3-trigger-list-metrics"]
if args.list_avail:
update_env("ROCPROFILER_PC_SAMPLING_BETA_ENABLED", "on")
path = os.path.join(f"{ROCM_DIR}", "bin/rocprofv3_avail")
if app_args:
exit_code = subprocess.check_call(["python3", path], env=app_env)
else:
app_args = ["python3", path]
elif not app_args:
log_config(app_env)
+419
Wyświetl plik
@@ -0,0 +1,419 @@
#!/usr/bin/env python3
import ctypes
import pathlib
import os
import io
import csv
import socket
class derived_counter:
def __init__(
self, counter_name, counter_description, counter_expression, counter_dimensions
):
self.name = counter_name
self.description = counter_description
self.expression = counter_expression
self.dimensions = counter_dimensions
class basic_counter:
def __init__(
self, counter_name, counter_description, counter_block, counter_dimensions
):
self.name = counter_name
self.description = counter_description
self.block = counter_block
self.dimensions = counter_dimensions
class pc_config:
def __init__(self, config_method, config_unit, min_interval, max_interval):
self.method = config_method
self.unit = config_unit
self.min_interval = min_interval
self.max_interval = max_interval
MAX_STR = 256
libname = os.environ.get("ROCPROF_LIST_AVAIL_TOOL_LIBRARY")
c_lib = ctypes.CDLL(libname)
c_lib.get_number_of_counters.restype = ctypes.c_ulong
c_lib.get_number_of_pc_sample_configs.restype = ctypes.c_ulong
c_lib.get_number_of_dimensions.restype = ctypes.c_ulong
c_lib.get_number_of_counters.argtypes = [ctypes.c_int]
c_lib.get_number_of_pc_sample_configs.argtypes = [ctypes.c_int]
c_lib.get_number_of_dimensions.argtypes = [ctypes.c_int]
c_lib.get_pc_sample_config.argtypes = [
ctypes.c_ulong,
ctypes.c_ulong,
ctypes.POINTER(ctypes.POINTER(ctypes.c_char * MAX_STR)),
ctypes.POINTER(ctypes.POINTER(ctypes.c_char * MAX_STR)),
ctypes.POINTER(ctypes.c_ulong),
ctypes.POINTER(ctypes.c_ulong),
]
c_lib.get_counters_info.argtypes = [
ctypes.c_ulong,
ctypes.c_int,
ctypes.POINTER(ctypes.c_ulong),
ctypes.POINTER(ctypes.POINTER(ctypes.c_char * MAX_STR)),
ctypes.POINTER(ctypes.POINTER(ctypes.c_char * MAX_STR)),
ctypes.POINTER(ctypes.c_int),
]
c_lib.get_counter_expression.argtypes = [
ctypes.c_ulong,
ctypes.c_int,
ctypes.POINTER(ctypes.POINTER(ctypes.c_char * MAX_STR)),
]
c_lib.get_counter_dimension.argtypes = [
ctypes.c_ulong,
ctypes.c_ulong,
ctypes.POINTER(ctypes.c_ulong),
ctypes.POINTER(ctypes.POINTER(ctypes.c_char * MAX_STR)),
ctypes.POINTER(ctypes.c_ulong),
]
c_lib.get_counter_block.argtypes = [
ctypes.c_ulong,
ctypes.c_ulong,
ctypes.POINTER(ctypes.POINTER(ctypes.c_char * MAX_STR)),
]
c_lib.get_number_of_agents.restype = ctypes.c_size_t
c_lib.get_agent_node_id.restype = ctypes.c_ulong
c_lib.get_agent_node_id.argtypes = [ctypes.c_int]
agent_derived_counter_map = dict()
agent_basic_counter_map = dict()
agent_pc_sample_config_map = dict()
def get_counters(node_id):
no_of_counters = c_lib.get_number_of_counters(node_id)
basic_counters = []
derived_counters = []
for counter_idx in range(0, no_of_counters):
name_args = ctypes.POINTER(ctypes.c_char * MAX_STR)()
description_args = ctypes.POINTER(ctypes.c_char * MAX_STR)()
block_args = ctypes.POINTER(ctypes.c_char * MAX_STR)()
is_derived_args = ctypes.c_int()
counter_id_args = ctypes.c_ulong()
c_lib.get_counters_info(
node_id,
counter_idx,
ctypes.byref(counter_id_args),
name_args,
description_args,
ctypes.byref(is_derived_args),
)
is_derived = is_derived_args.value
counter_id = counter_id_args.value
no_of_dimensions = c_lib.get_number_of_dimensions(counter_id)
name = ctypes.cast(name_args, ctypes.c_char_p).value.decode("utf-8")
description = ctypes.cast(description_args, ctypes.c_char_p).value.decode("utf-8")
dimensions_stream = io.StringIO()
for dim in range(0, no_of_dimensions):
dim_name_args = ctypes.POINTER(ctypes.c_char * MAX_STR)()
dim_instance_args = ctypes.c_ulong()
dimension_id_args = ctypes.c_ulong()
c_lib.get_counter_dimension(
counter_id,
dim,
ctypes.byref(dimension_id_args),
dim_name_args,
ctypes.byref(dim_instance_args),
)
dim_name = ctypes.cast(dim_name_args, ctypes.c_char_p).value.decode("utf-8")
dim_instance = dim_instance_args.value
dimensions_stream.write(dim_name)
dimensions_stream.write("[0:")
dimensions_stream.write(str(dim_instance - 1))
dimensions_stream.write("]")
if dim != no_of_dimensions - 1:
dimensions_stream.write("\t")
if is_derived:
expression_args = ctypes.POINTER(ctypes.c_char * MAX_STR)()
c_lib.get_counter_expression(node_id, counter_idx, expression_args)
counter_expression = ctypes.cast(
expression_args, ctypes.c_char_p
).value.decode("utf-8")
derived_counters.append(
derived_counter(
name, description, counter_expression, dimensions_stream.getvalue()
)
)
else:
block_args = ctypes.POINTER(ctypes.c_char * MAX_STR)()
c_lib.get_counter_block(node_id, counter_idx, block_args)
block = ctypes.cast(block_args, ctypes.c_char_p).value.decode("utf-8")
basic_counters.append(
basic_counter(name, description, block, dimensions_stream.getvalue())
)
dimensions_stream.close()
agent_derived_counter_map[node_id] = derived_counters
agent_basic_counter_map[node_id] = basic_counters
def get_pc_sample_configs(node_id):
no_of_pc_sample_configs = c_lib.get_number_of_pc_sample_configs(node_id)
pc_sample_configs = []
if no_of_pc_sample_configs:
for config_idx in range(0, no_of_pc_sample_configs):
method_args = ctypes.POINTER(ctypes.c_char * MAX_STR)()
unit_args = ctypes.POINTER(ctypes.c_char * MAX_STR)()
min_interval = ctypes.c_ulong()
max_interval = ctypes.c_ulong()
c_lib.get_pc_sample_config(
node_id,
config_idx,
method_args,
unit_args,
ctypes.byref(min_interval),
ctypes.byref(max_interval),
)
method = ctypes.cast(method_args, ctypes.c_char_p).value.decode("utf-8")
unit = ctypes.cast(unit_args, ctypes.c_char_p).value.decode("utf-8")
pc_sample_configs.append(
pc_config(method, unit, min_interval.value, max_interval.value)
)
agent_pc_sample_config_map[node_id] = pc_sample_configs
def process_filename(file_path, file_type):
filename = os.environ.get(
"ROCPROF_OUTPUT_FILE_NAME", socket.gethostname() + "/" + str(os.getpid())
)
if os.path.exists(file_path) and os.path.isfile(file_path):
fatal_error("ROCPROFILER_OUTPUT_PATH already exists and is not a directory")
elif not os.path.exists(file_path):
os.makedirs(file_path)
output_filename = ""
if file_type == "derived":
output_filename = filename + "_" + "derived_metrics" + ".csv"
elif file_type == "basic":
output_filename = filename + "_" + "basic_metrics" + ".csv"
elif file_type == "pc_sample_config":
output_filename = filename + "_" + "pc_sample_config" + ".csv"
output_path = os.path.join(file_path, output_filename)
output_path_parent = os.path.dirname(output_path)
if not os.path.exists(output_path_parent):
os.makedirs(output_path_parent)
elif os.path.exists(output_path_parent) and os.path.isfile(output_path_parent):
fatal_error("ROCPROFILER_OUTPUT_PATH already exists and is not a directory")
return output_path
def generate_output(agent_ids):
list_avail_file = os.environ.get("ROCPROF_OUTPUT_LIST_AVAIL_FILE")
if list_avail_file:
file_path = os.environ.get("ROCPROF_OUTPUT_PATH")
derived_output_file = process_filename(file_path, "derived")
basic_output_file = process_filename(file_path, "basic")
pc_sample_config_file = process_filename(file_path, "pc_sample_config")
with open(derived_output_file, "w") as csvfile:
print(f"Opened result file: {derived_output_file}")
fieldnames = ["Agent_Id", "Name", "Description", "Expression", "Dimensions"]
writer = csv.DictWriter(csvfile, fieldnames=fieldnames)
writer.writeheader()
for node_id, counters in agent_derived_counter_map.items():
for counter in counters:
writer.writerow(
{
"Agent_Id": node_id,
"Name": counter.name,
"Description": counter.description,
"Expression": counter.expression,
"Dimensions": counter.dimensions,
}
)
with open(basic_output_file, "w") as csvfile:
print(f"Opened result file: {basic_output_file}")
fieldnames = ["Agent_Id", "Name", "Description", "Block", "Dimensions"]
writer = csv.DictWriter(csvfile, fieldnames=fieldnames)
writer.writeheader()
for node_id, counters in agent_basic_counter_map.items():
for counter in counters:
if counter.block:
writer.writerow(
{
"Agent_Id": node_id,
"Name": counter.name,
"Description": counter.description,
"Block": counter.block,
"Dimensions": counter.dimensions,
}
)
with open(pc_sample_config_file, "w") as csvfile:
print(f"Opened result file: {pc_sample_config_file}")
fieldnames = [
"Agent_Id",
"Method",
"Unit",
"Minimum_Interval",
"Maximum_Interval",
]
writer = csv.DictWriter(csvfile, fieldnames=fieldnames)
writer.writeheader()
for node_id, configs in agent_pc_sample_config_map.items():
for config in configs:
writer.writerow(
{
"Agent_Id": node_id,
"Method": config.method,
"Unit": config.unit,
"Minimum_Interval": config.min_interval,
"Maximum_Interval": config.max_interval,
}
)
else:
for node_id in agent_ids:
print(f"gpu-agent:{node_id}\n")
if node_id in agent_basic_counter_map.keys():
basic_counters_stream = io.StringIO()
counters = agent_basic_counter_map[node_id]
for counter in counters:
if counter.block:
basic_counters_stream.write("Name:")
basic_counters_stream.write("\t")
basic_counters_stream.write(str(counter.name))
basic_counters_stream.write("\n")
basic_counters_stream.write("Description:")
basic_counters_stream.write("\t")
basic_counters_stream.write(str(counter.description))
basic_counters_stream.write("\n")
basic_counters_stream.write("Block:")
basic_counters_stream.write("\t")
basic_counters_stream.write(str(counter.block))
basic_counters_stream.write("\n")
basic_counters_stream.write("Dimensions:")
basic_counters_stream.write("\t")
basic_counters_stream.write(str(counter.dimensions))
basic_counters_stream.write("\n")
basic_counters = basic_counters_stream.getvalue()
print("List Metrics Basic\n")
print(basic_counters)
print("\n")
basic_counters_stream.close()
if node_id in agent_derived_counter_map.keys():
derived_counters_stream = io.StringIO()
counters = agent_derived_counter_map[node_id]
for counter in counters:
derived_counters_stream.write("Name:")
derived_counters_stream.write("\t")
derived_counters_stream.write(str(counter.name))
derived_counters_stream.write("\n")
derived_counters_stream.write("Description:")
derived_counters_stream.write("\t")
derived_counters_stream.write(str(counter.description))
derived_counters_stream.write("\n")
derived_counters_stream.write("Expression:")
derived_counters_stream.write("\t")
derived_counters_stream.write(str(counter.expression))
derived_counters_stream.write("\n")
derived_counters_stream.write("Dimensions:")
derived_counters_stream.write("\t")
derived_counters_stream.write(str(counter.dimensions))
derived_counters_stream.write("\n")
derived_counters = derived_counters_stream.getvalue()
print("List Metrics Derived\n")
print(derived_counters)
print("\n")
derived_counters_stream.close()
if node_id in agent_pc_sample_config_map.keys():
pc_sample_config_stream = io.StringIO()
configs = agent_pc_sample_config_map[node_id]
for config in configs:
pc_sample_config_stream.write("Method:")
pc_sample_config_stream.write("\t")
pc_sample_config_stream.write(str(config.method))
pc_sample_config_stream.write("\n")
pc_sample_config_stream.write("Unit:")
pc_sample_config_stream.write("\t")
pc_sample_config_stream.write(str(config.unit))
pc_sample_config_stream.write("\n")
pc_sample_config_stream.write("Minimum_Interval:")
pc_sample_config_stream.write("\t")
pc_sample_config_stream.write(str(config.min_interval))
pc_sample_config_stream.write("\n")
pc_sample_config_stream.write("Maximum_Interval:")
pc_sample_config_stream.write("\t")
pc_sample_config_stream.write(str(config.max_interval))
pc_sample_config_stream.write("\n")
pc_sample = pc_sample_config_stream.getvalue()
print(
"List available PC Sample Configurations for node_id\t"
+ str(node_id)
+ "\n"
)
print(pc_sample)
print("\n")
pc_sample_config_stream.close()
else:
print("PC Sampling not supported on node_id\t" + str(node_id) + "\n")
if __name__ == "__main__":
# Load the shared library into ctypes
c_lib.avail_tool_init()
no_of_agents = c_lib.get_number_of_agents()
agent_ids = []
for idx in range(0, no_of_agents):
node_id = c_lib.get_agent_node_id(idx)
agent_ids.append(node_id)
get_counters(node_id)
get_pc_sample_configs(node_id)
generate_output(agent_ids)
@@ -214,10 +214,10 @@ ROCprofiler-SDK introduces a new command-line tool, `rocprofv3`, which is a more
- New option to output summary in desired time units {sec,msec,usec,nsec}
-
* - Display options
- List Metrics
- List available basic and derived metrics and PC sampling configurations
- `--list-basic`, `--list-derived`
- `--list-counters`
- `-L`, `--list-metrics`
- `-L`, `--list-avail`
- A valid YAML is supported for this option now
-
* - Perfetto-specific options
+3 -3
Wyświetl plik
@@ -122,9 +122,9 @@ Here is the sample of commonly used ``rocprofv3`` command-line options. Some opt
- Iteration range for each kernel that match the filter [start-stop].
- Kernel Dispatch Counter Collection
* - ``-L`` \| ``--list-metrics``
- List metrics for counter collection.
- Kernel Dispatch Counter Collection
* - ``-L`` \| ``--list-avail``
- List metrics for counter collection
- List supported PC sampling configurations.
* - ``-E`` \| ``--extra_counters``
- Specifies the path to a YAML file containing extra counter definitions.
@@ -121,30 +121,6 @@ add_destructor(Tp*& ptr)
std::call_once(_once, []() { add_destructor(PTR); }); \
}
tool::csv_output_file*&
get_list_basic_metrics_file()
{
static auto* _v =
new tool::csv_output_file{tool::get_config(),
"basic_metrics",
tool::csv::list_basic_metrics_csv_encoder{},
{"Agent_Id", "Name", "Description", "Block", "Dimensions"}};
ADD_DESTRUCTOR(_v);
return _v;
}
tool::csv_output_file*&
get_list_derived_metrics_file()
{
static auto* _v =
new tool::csv_output_file{tool::get_config(),
"derived_metrics",
tool::csv::list_derived_metrics_csv_encoder{},
{"Agent_Id", "Name", "Description", "Expression", "Dimensions"}};
ADD_DESTRUCTOR(_v);
return _v;
}
#undef ADD_DESTRUCTOR
struct buffer_ids
@@ -686,25 +662,6 @@ using counter_vec_t = std::vector<rocprofiler_counter_id_t>;
using agent_counter_map_t =
std::unordered_map<rocprofiler_agent_id_t, std::optional<rocprofiler_profile_config_id_t>>;
rocprofiler_status_t
dimensions_info_callback(rocprofiler_counter_id_t /*id*/,
const rocprofiler_record_dimension_info_t* dim_info,
long unsigned int num_dims,
void* user_data)
{
ROCP_FATAL_IF(user_data == nullptr) << "dimensions_info_callback invoked without user data";
if(user_data)
{
auto* _data = static_cast<std::vector<rocprofiler_record_dimension_info_t>*>(user_data);
_data->reserve(num_dims);
for(size_t j = 0; j < num_dims; j++)
_data->emplace_back(dim_info[j]);
}
return ROCPROFILER_STATUS_SUCCESS;
}
auto
get_gpu_agents()
{
@@ -921,116 +878,6 @@ counter_record_callback(rocprofiler_dispatch_counting_service_data_t dispatch_da
tool::write_ring_buffer(counter_record, domain_type::COUNTER_COLLECTION);
}
rocprofiler_status_t
list_metrics_iterate_agents(rocprofiler_agent_version_t,
const void** agents,
size_t num_agents,
void*)
{
for(size_t idx = 0; idx < num_agents; idx++)
{
const auto* agent = static_cast<const rocprofiler_agent_v0_t*>(agents[idx]);
auto counters_v = counter_vec_t{};
// TODO(aelwazir): To be changed back to use node id once ROCR fixes
// the hsa_agents to use the real node id
uint32_t node_id = agent->logical_node_id;
if(agent->type != ROCPROFILER_AGENT_TYPE_GPU) continue;
auto status = rocprofiler_iterate_agent_supported_counters(
agent->id,
[](rocprofiler_agent_id_t,
rocprofiler_counter_id_t* counters,
size_t num_counters,
void* user_data) {
auto* agent_node_id = static_cast<uint32_t*>(user_data);
for(size_t i = 0; i < num_counters; i++)
{
auto counter_info = rocprofiler_counter_info_v0_t{};
auto dimensions = std::vector<rocprofiler_record_dimension_info_t>{};
ROCPROFILER_CALL(rocprofiler_iterate_counter_dimensions(
counters[i], dimensions_info_callback, &dimensions),
"iterate_dimension_info");
ROCPROFILER_CALL(
rocprofiler_query_counter_info(counters[i],
ROCPROFILER_COUNTER_INFO_VERSION_0,
static_cast<void*>(&counter_info)),
"Could not query counter_id");
auto dimensions_info = std::stringstream{};
for(size_t j = 0; j != dimensions.size(); j++)
{
dimensions_info << dimensions[j].name
<< "[0:" << dimensions[j].instance_size - 1 << "]";
if(j != dimensions.size() - 1) dimensions_info << "\t";
}
if(!counter_info.is_derived && tool::get_config().list_metrics &&
!std::string(counter_info.block).empty())
{
auto counter_info_ss = std::stringstream{};
if(tool::get_config().list_metrics_output_file)
{
tool::csv::list_basic_metrics_csv_encoder::write_row(
counter_info_ss,
*agent_node_id,
counter_info.name,
counter_info.description,
counter_info.block,
dimensions_info.str());
get_dereference(get_list_basic_metrics_file()) << counter_info_ss.str();
}
else
{
counter_info_ss << "gpu-agent" << *agent_node_id << ":"
<< "\t" << counter_info.name << "\n";
counter_info_ss << "Description:"
<< "\t" << counter_info.description << "\n";
counter_info_ss << "Block:"
<< "\t" << counter_info.block << "\n";
counter_info_ss << "Dimensions:"
<< "\t" << dimensions_info.str() << "\n";
counter_info_ss << "\n";
std::cout << counter_info_ss.str();
}
}
else if(counter_info.is_derived && tool::get_config().list_metrics)
{
auto counter_info_ss = std::stringstream{};
if(tool::get_config().list_metrics_output_file)
{
tool::csv::list_derived_metrics_csv_encoder::write_row(
counter_info_ss,
*agent_node_id,
counter_info.name,
counter_info.description,
counter_info.expression,
dimensions_info.str());
get_dereference(get_list_derived_metrics_file())
<< counter_info_ss.str();
}
else
{
counter_info_ss << "gpu-agent" << *agent_node_id << ":"
<< "\t" << counter_info.name << "\n"
<< "Description: " << counter_info.description << "\n";
counter_info_ss << "Expression: " << counter_info.expression << "\n";
counter_info_ss << "Dimensions: " << dimensions_info.str() << "\n";
counter_info_ss << "\n";
std::cout << counter_info_ss.str();
}
}
}
return ROCPROFILER_STATUS_SUCCESS;
},
reinterpret_cast<void*>(&node_id));
ROCP_ERROR_IF(status != ROCPROFILER_STATUS_SUCCESS)
<< "Failed to iterate counters for agent " << node_id << " (" << agent->name << ")";
}
return ROCPROFILER_STATUS_SUCCESS;
}
rocprofiler_client_finalize_t client_finalizer = nullptr;
rocprofiler_client_id_t* client_identifier = nullptr;
@@ -1418,21 +1265,6 @@ tool_init(rocprofiler_client_finalize_t fini_func, void* tool_data)
return 0;
}
void
api_registration_callback(rocprofiler_intercept_table_t,
uint64_t,
uint64_t,
void**,
uint64_t,
void*)
{
ROCPROFILER_CALL(rocprofiler_query_available_agents(ROCPROFILER_AGENT_INFO_VERSION_0,
list_metrics_iterate_agents,
sizeof(rocprofiler_agent_t),
nullptr),
"Iterate rocporfiler agents")
}
using stats_data_t = tool::stats_data_t;
using stats_entry_t = tool::stats_entry_t;
using domain_stats_vec_t = tool::domain_stats_vec_t;
@@ -1727,15 +1559,6 @@ rocprofiler_configure(uint32_t version,
"Loading extra counters");
}
if(tool::get_config().list_metrics)
{
tool_metadata->init(tool::metadata::inprocess{});
ROCPROFILER_CALL(rocprofiler_at_intercept_table_registration(
api_registration_callback, ROCPROFILER_HSA_TABLE, nullptr),
"api registration");
return nullptr;
}
ROCP_INFO << id->name << " is using rocprofiler-sdk v" << major << "." << minor << "." << patch
<< " (" << runtime_version << ")";
+1 -1
Wyświetl plik
@@ -2,4 +2,4 @@
#
#
add_subdirectory(rocprofv3-trigger-list-metrics)
add_subdirectory(rocprofiler-avail)
@@ -0,0 +1,26 @@
rocprofiler_activate_clang_tidy()
add_library(rocprofv3-list-avail SHARED)
target_sources(rocprofv3-list-avail PRIVATE rocprofv3_avail.cpp)
target_link_libraries(
rocprofv3-list-avail
PRIVATE rocprofiler-sdk::rocprofiler-sdk-shared-library
rocprofiler-sdk::rocprofiler-sdk-headers
rocprofiler-sdk::rocprofiler-sdk-build-flags
rocprofiler-sdk::rocprofiler-sdk-common-library
rocprofiler-sdk::rocprofiler-sdk-cereal)
set_target_properties(
rocprofv3-list-avail
PROPERTIES LIBRARY_OUTPUT_DIRECTORY ${PROJECT_BINARY_DIR}/${CMAKE_INSTALL_LIBEXECDIR}
SOVERSION ${PROJECT_VERSION_MAJOR}
VERSION ${PROJECT_VERSION}
BUILD_RPATH "\$ORIGIN:\$ORIGIN/.."
INSTALL_RPATH "\$ORIGIN:\$ORIGIN/..")
install(
TARGETS rocprofv3-list-avail
DESTINATION ${CMAKE_INSTALL_LIBEXECDIR}
COMPONENT tools
EXPORT rocprofiler-sdk-tool-targets)
@@ -0,0 +1,399 @@
// MIT License
//
// Copyright (c) 2023 Advanced Micro Devices, Inc. All rights reserved.
//
// Permission is hereby granted, free of charge, to any person obtaining a copy
// of this software and associated documentation files (the "Software"), to deal
// in the Software without restriction, including without limitation the rights
// to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
// copies of the Software, and to permit persons to whom the Software is
// furnished to do so, subject to the following conditions:
//
// The above copyright notice and this permission notice shall be included in all
// copies or substantial portions of the Software.
//
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
// AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
// OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
// SOFTWARE.
#include "lib/common/environment.hpp"
#include "lib/common/filesystem.hpp"
#include "lib/common/logging.hpp"
#include "lib/common/scope_destructor.hpp"
#include "lib/common/string_entry.hpp"
#include "lib/common/synchronized.hpp"
#include "lib/common/units.hpp"
#include "lib/common/utility.hpp"
#include <rocprofiler-sdk/agent.h>
#include <rocprofiler-sdk/callback_tracing.h>
#include <rocprofiler-sdk/defines.h>
#include <rocprofiler-sdk/fwd.h>
#include <rocprofiler-sdk/registration.h>
#include <rocprofiler-sdk/rocprofiler.h>
#include <fmt/core.h>
#include <unistd.h>
#include <algorithm>
#include <cstring>
#include <fstream>
#include <mutex>
#include <unordered_map>
#include <unordered_set>
#include <vector>
auto destructors = new std::vector<std::function<void()>>{};
namespace common = ::rocprofiler::common;
namespace
{
auto pc_sampling_method = std::deque<std::string>{
"ROCPROFILER_PC_SAMPLING_METHOD_NONE",
"ROCPROFILER_PC_SAMPLING_METHOD_STOCHASTIC",
"ROCPROFILER_PC_SAMPLING_METHOD_HOST_TRAP",
"ROCPROFILER_PC_SAMPLING_METHOD_LAST",
};
auto pc_sampling_unit = std::deque<std::string>{
"ROCPROFILER_PC_SAMPLING_UNIT_NONE",
"ROCPROFILER_PC_SAMPLING_UNIT_INSTRUCTIONS",
"ROCPROFILER_PC_SAMPLING_UNIT_CYCLES",
"ROCPROFILER_PC_SAMPLING_UNIT_TIME",
"ROCPROFILER_PC_SAMPLING_UNIT_LAST",
};
} // namespace
using counter_info_t = std::vector<std::vector<std::string>>;
using pc_sample_info_t = std::vector<std::vector<std::string>>;
auto agent_counter_info = std::unordered_map<uint64_t, counter_info_t>{};
auto agent_pc_sample_info = std::unordered_map<uint64_t, pc_sample_info_t>{};
// auto agent_configs_info = std::unordered_map<uint64_t, config_info_t>{};
using counter_dimension_info_t =
std::unordered_map<uint64_t, std::vector<std::vector<std::string>>>;
auto counter_dim_info = counter_dimension_info_t{};
std::vector<uint64_t> agent_node_ids;
constexpr size_t pc_config_fields = 4, method_idx = 0, unit_idx = 1, min_interval_idx = 2,
max_interval_idx = 3;
constexpr size_t dimensions_fields = 3, dim_id_idx = 0, dim_name_idx = 1, size_idx = 2;
constexpr size_t counter_fields = 5, counter_id_idx = 0, name_idx = 1, description_idx = 2,
is_derived_idx = 3, block_idx = 4, expression_idx = 4;
#define ROCPROFILER_CALL(result, msg) \
{ \
rocprofiler_status_t ROCPROFILER_VARIABLE(CHECKSTATUS, __LINE__) = result; \
if(ROCPROFILER_VARIABLE(CHECKSTATUS, __LINE__) != ROCPROFILER_STATUS_SUCCESS) \
{ \
std::string status_msg = \
rocprofiler_get_status_string(ROCPROFILER_VARIABLE(CHECKSTATUS, __LINE__)); \
std::cerr << "[" #result "][" << __FILE__ << ":" << __LINE__ << "] " << msg \
<< " failed with error code " << ROCPROFILER_VARIABLE(CHECKSTATUS, __LINE__) \
<< ": " << status_msg << "\n" \
<< std::flush; \
std::stringstream errmsg{}; \
errmsg << "[" #result "][" << __FILE__ << ":" << __LINE__ << "] " << msg " failure (" \
<< status_msg << ")"; \
throw std::runtime_error(errmsg.str()); \
} \
}
using counter_vec_t = std::vector<rocprofiler_counter_id_t>;
ROCPROFILER_EXTERN_C_INIT
void
avail_tool_init() ROCPROFILER_EXPORT;
size_t
get_number_of_agents() ROCPROFILER_EXPORT;
uint64_t
get_agent_node_id(int idx) ROCPROFILER_EXPORT;
int
get_number_of_counters(uint64_t node_id) ROCPROFILER_EXPORT;
void
get_counters_info(uint64_t node_id,
int idx,
uint64_t* counter_id,
const char** counter_name,
const char** counter_description,
uint8_t* is_derived) ROCPROFILER_EXPORT;
void
get_counter_expression(uint64_t node_id, int idx, const char** counter_expr) ROCPROFILER_EXPORT;
void
get_counter_block(uint64_t node_id, int idx, const char** counter_block) ROCPROFILER_EXPORT;
int
get_number_of_dimensions(int counter_id) ROCPROFILER_EXPORT;
void
get_counter_dimension(uint64_t counter_id,
uint64_t dimension_idx,
uint64_t* dimension_id,
const char** dimension_name,
uint64_t* dimension_instance) ROCPROFILER_EXPORT;
int
get_number_of_pc_sample_configs(uint64_t node_id) ROCPROFILER_EXPORT;
void
get_pc_sample_config(uint64_t node_id,
int idx,
const char** method,
const char** unit,
uint64_t* min_interval,
uint64_t* max_interval) ROCPROFILER_EXPORT;
ROCPROFILER_EXTERN_C_FINI
void
initialize_logging()
{
auto logging_cfg = rocprofiler::common::logging_config{.install_failure_handler = true};
common::init_logging("ROCPROF", logging_cfg);
FLAGS_colorlogtostderr = true;
}
rocprofiler_status_t
pc_configuration_callback(const rocprofiler_pc_sampling_configuration_t* configs,
long unsigned int num_config,
void* user_data)
{
auto* avail_configs = static_cast<std::vector<std::vector<std::string>>*>(user_data);
for(size_t i = 0; i < num_config; i++)
{
auto config = std::vector<std::string>{};
config.reserve(pc_config_fields);
auto it = config.begin();
config.insert(it + method_idx, pc_sampling_method.at(configs[i].method));
config.insert(it + unit_idx, pc_sampling_unit.at(configs[i].unit));
config.insert(it + min_interval_idx, std::to_string(configs[i].min_interval));
config.insert(it + max_interval_idx, std::to_string(configs[i].max_interval));
avail_configs->push_back(config);
}
return ROCPROFILER_STATUS_SUCCESS;
}
rocprofiler_status_t
dimensions_info_callback(rocprofiler_counter_id_t /*id*/,
const rocprofiler_record_dimension_info_t* dim_info,
long unsigned int num_dims,
void* user_data)
{
auto* dimensions_info =
static_cast<std::vector<rocprofiler_record_dimension_info_t>*>(user_data);
dimensions_info->reserve(num_dims);
for(size_t j = 0; j < num_dims; j++)
dimensions_info->emplace_back(dim_info[j]);
return ROCPROFILER_STATUS_SUCCESS;
}
rocprofiler_status_t
iterate_agent_counters_callback(rocprofiler_agent_id_t,
rocprofiler_counter_id_t* counters,
size_t num_counters,
void* user_data)
{
auto* _counters_info = reinterpret_cast<std::vector<std::vector<std::string>>*>(user_data);
auto dimensions_data = std::vector<rocprofiler_record_dimension_info_t>{};
for(size_t i = 0; i < num_counters; i++)
{
rocprofiler_counter_info_v0_t _info;
ROCPROFILER_CALL(
rocprofiler_iterate_counter_dimensions(
counters[i], dimensions_info_callback, static_cast<void*>(&dimensions_data)),
"iterate_dimension_info");
auto dimensions_info = std::vector<std::vector<std::string>>{};
dimensions_info.reserve(dimensions_data.size());
for(auto& dim : dimensions_data)
{
auto dimensions = std::vector<std::string>{};
dimensions.reserve(dimensions_fields);
auto it = dimensions.begin();
dimensions.insert(it + dim_id_idx, std::to_string(dim.id));
dimensions.insert(it + dim_name_idx, std::string(dim.name));
dimensions.insert(it + size_idx, std::to_string(dim.instance_size - 1));
dimensions_info.emplace_back(dimensions);
}
counter_dim_info.emplace(counters[i].handle, dimensions_info);
ROCPROFILER_CALL(
rocprofiler_query_counter_info(
counters[i], ROCPROFILER_COUNTER_INFO_VERSION_0, static_cast<void*>(&_info)),
"Could not query counter_id");
auto counter = std::vector<std::string>{};
if(_info.is_derived)
{
counter.reserve(counter_fields);
auto it = counter.begin();
counter.insert(it + counter_id_idx, std::to_string(_info.id.handle));
counter.insert(it + name_idx, std::string(_info.name));
counter.insert(it + description_idx, std::string(_info.description));
counter.insert(it + is_derived_idx, std::to_string(_info.is_derived));
counter.insert(it + expression_idx, std::string(_info.expression));
}
else
{
counter.reserve(counter_fields);
auto it = counter.begin();
counter.insert(it + counter_id_idx, std::to_string(_info.id.handle));
counter.insert(it + name_idx, std::string(_info.name));
counter.insert(it + description_idx, std::string(_info.description));
counter.insert(it + is_derived_idx, std::to_string(_info.is_derived));
counter.insert(it + block_idx, std::string(_info.block));
}
_counters_info->emplace_back(counter);
}
return ROCPROFILER_STATUS_SUCCESS;
}
rocprofiler_status_t
list_avail_configs(rocprofiler_agent_version_t, const void** agents, size_t num_agents, void*)
{
for(size_t idx = 0; idx < num_agents; idx++)
{
const auto* agent = static_cast<const rocprofiler_agent_v0_t*>(agents[idx]);
if(agent->type == ROCPROFILER_AGENT_TYPE_GPU)
{
auto counters_v = counter_vec_t{};
// TODO(aelwazir): To be changed back to use node id once ROCR fixes
// the hsa_agents to use the real node id
uint32_t node_id = agent->node_id;
std::vector<std::vector<std::string>> configs = {};
std::vector<std::vector<std::string>> _counter_dim_info = {};
agent_node_ids.emplace_back(node_id);
rocprofiler_query_pc_sampling_agent_configurations(
agent->id, pc_configuration_callback, &configs);
ROCPROFILER_CALL(
rocprofiler_iterate_agent_supported_counters(
agent->id, iterate_agent_counters_callback, (void*) (&_counter_dim_info)),
"Iterate rocprofiler counters");
if(!_counter_dim_info.empty()) agent_counter_info.emplace(node_id, _counter_dim_info);
if(!configs.empty())
{
agent_pc_sample_info.emplace(node_id, configs);
}
}
}
return ROCPROFILER_STATUS_SUCCESS;
}
ROCPROFILER_EXTERN_C_INIT
void
avail_tool_init()
{
initialize_logging();
ROCPROFILER_CALL(rocprofiler_query_available_agents(ROCPROFILER_AGENT_INFO_VERSION_0,
list_avail_configs,
sizeof(rocprofiler_agent_t),
nullptr),
"Iterate rocporfiler agents");
}
size_t
get_number_of_agents()
{
return agent_node_ids.size();
}
uint64_t
get_agent_node_id(int idx)
{
return agent_node_ids.at(idx);
}
int
get_number_of_counters(uint64_t node_id)
{
if(agent_counter_info.find(node_id) != agent_counter_info.end())
return agent_counter_info.at(node_id).size();
else
return 0;
}
void
get_counters_info(uint64_t node_id,
int counter_idx,
uint64_t* counter_id,
const char** counter_name,
const char** counter_description,
uint8_t* is_derived)
{
if(agent_counter_info.find(node_id) == agent_counter_info.end()) return;
*counter_id =
std::stoull(agent_counter_info.at(node_id).at(counter_idx).at(0).c_str(), nullptr, 10);
*counter_name = agent_counter_info.at(node_id).at(counter_idx).at(1).c_str();
*counter_description = agent_counter_info.at(node_id).at(counter_idx).at(2).c_str();
*is_derived = std::stoi(agent_counter_info.at(node_id).at(counter_idx).at(3).c_str());
}
void
get_counter_block(uint64_t node_id, int counter_idx, const char** counter_block)
{
if(agent_counter_info.find(node_id) == agent_counter_info.end()) return;
*counter_block = agent_counter_info.at(node_id).at(counter_idx).at(4).c_str();
}
void
get_counter_expression(uint64_t node_id, int idx, const char** counter_expr)
{
if(agent_counter_info.find(node_id) == agent_counter_info.end()) return;
*counter_expr = agent_counter_info.at(node_id).at(idx).at(4).c_str();
}
int
get_number_of_dimensions(int counter_id)
{
if(counter_dim_info.find(counter_id) == counter_dim_info.end()) return 0;
return counter_dim_info.at(counter_id).size();
}
void
get_counter_dimension(uint64_t counter_id,
uint64_t dimension_idx,
uint64_t* dimension_id,
const char** dimension_name,
uint64_t* dimension_instance)
{
if(counter_dim_info.find(counter_id) == counter_dim_info.end()) return;
*dimension_id =
std::stoull(counter_dim_info.at(counter_id).at(dimension_idx).at(0).c_str(), nullptr, 10);
*dimension_name = counter_dim_info.at(counter_id).at(dimension_idx).at(1).c_str();
*dimension_instance =
std::stoull(counter_dim_info.at(counter_id).at(dimension_idx).at(2).c_str(), nullptr, 10);
}
int
get_number_of_pc_sample_configs(uint64_t node_id)
{
if(agent_pc_sample_info.find(node_id) == agent_pc_sample_info.end()) return 0;
return agent_pc_sample_info.at(node_id).size();
}
void
get_pc_sample_config(uint64_t node_id,
int config_idx,
const char** method,
const char** unit,
uint64_t* min_interval,
uint64_t* max_interval)
{
if(agent_pc_sample_info.find(node_id) == agent_pc_sample_info.end()) return;
*method = agent_pc_sample_info.at(node_id).at(config_idx).at(0).c_str();
*unit = agent_pc_sample_info.at(node_id).at(config_idx).at(1).c_str();
*min_interval =
std::stoull(agent_pc_sample_info.at(node_id).at(config_idx).at(2).c_str(), nullptr, 10);
*max_interval =
std::stoull(agent_pc_sample_info.at(node_id).at(config_idx).at(3).c_str(), nullptr, 10);
}
ROCPROFILER_EXTERN_C_FINI
@@ -1,21 +0,0 @@
#
#
#
set(CMAKE_INSTALL_DEFAULT_COMPONENT_NAME "tools")
add_executable(rocprofv3-trigger-list-metrics)
target_sources(rocprofv3-trigger-list-metrics PRIVATE rocprofv3_trigger_list_metrics.cpp)
target_link_libraries(rocprofv3-trigger-list-metrics
PRIVATE rocprofiler-sdk::rocprofiler-sdk-hsa-runtime)
set_target_properties(
rocprofv3-trigger-list-metrics
PROPERTIES RUNTIME_OUTPUT_DIRECTORY ${PROJECT_BINARY_DIR}/${CMAKE_INSTALL_LIBEXECDIR}
BUILD_RPATH "\$ORIGIN:\$ORIGIN/../${CMAKE_INSTALL_LIBDIR}"
INSTALL_RPATH "\$ORIGIN:\$ORIGIN/../${CMAKE_INSTALL_LIBDIR}")
install(
TARGETS rocprofv3-trigger-list-metrics
DESTINATION ${CMAKE_INSTALL_LIBEXECDIR}
COMPONENT tools
EXPORT rocprofiler-sdk-tool-targets)
@@ -1,30 +0,0 @@
// MIT License
//
// Copyright (c) 2023 Advanced Micro Devices, Inc. All rights reserved.
//
// Permission is hereby granted, free of charge, to any person obtaining a copy
// of this software and associated documentation files (the "Software"), to deal
// in the Software without restriction, including without limitation the rights
// to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
// copies of the Software, and to permit persons to whom the Software is
// furnished to do so, subject to the following conditions:
//
// The above copyright notice and this permission notice shall be included in all
// copies or substantial portions of the Software.
//
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
// AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
// OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
// SOFTWARE.
#include <hsa/hsa.h>
int
main()
{
hsa_init();
return 0;
}
@@ -15,28 +15,35 @@ rocprofiler_configure_pytest_files(CONFIG pytest.ini COPY validate.py conftest.p
# basic-metrics
add_test(
NAME rocprofv3-test-list-metrics-execute
COMMAND
$<TARGET_FILE:rocprofiler-sdk::rocprofv3> -d
${CMAKE_CURRENT_BINARY_DIR}/out_counter_collection_2 -o metrics --list-metrics)
NAME rocprofv3-test-list-avail-execute
COMMAND $<TARGET_FILE:rocprofiler-sdk::rocprofv3> -d
${CMAKE_CURRENT_BINARY_DIR}/out_counter_collection_2 -o metrics --list-avail)
# list-metrics-stdout
add_test(NAME rocprofv3-test-list-metrics-std-out-execute
add_test(NAME rocprofv3-test-list-avail-std-out-execute
COMMAND $<TARGET_FILE:rocprofiler-sdk::rocprofv3> -i
${CMAKE_CURRENT_BINARY_DIR}/input.json)
# list-metrics with tracing
add_test(
NAME rocprofv3-test-list-avail-trace-execute
COMMAND
$<TARGET_FILE:rocprofiler-sdk::rocprofv3> -d
${CMAKE_CURRENT_BINARY_DIR}/out_counter_collection_2 -o metrics --list-avail
--sys-trace -- $<TARGET_FILE:transpose>)
string(REPLACE "LD_PRELOAD=" "ROCPROF_PRELOAD=" PRELOAD_ENV
"${ROCPROFILER_MEMCHECK_PRELOAD_ENV}")
set(cc-env-list-metrics "${PRELOAD_ENV}")
set_tests_properties(
rocprofv3-test-list-metrics-execute
rocprofv3-test-list-avail-execute
PROPERTIES TIMEOUT 45 LABELS "integration-tests" ENVIRONMENT "${cc-env-list-metrics}"
FAIL_REGULAR_EXPRESSION "${ROCPROFILER_DEFAULT_FAIL_REGEX}")
set_tests_properties(
rocprofv3-test-list-metrics-std-out-execute
rocprofv3-test-list-avail-std-out-execute
PROPERTIES
TIMEOUT
45
@@ -45,23 +52,32 @@ set_tests_properties(
ENVIRONMENT
"${cc-env-list-metrics}"
PASS_REGULAR_EXPRESSION
"gpu-agent[0-9]*:[a-zA-Z_]*\\n;Description:(.*)\\n*;Expression:(.)*\\n*;Block:[a-zA-Z]*\\n*;Dimensions:([A-Z_]*\\[[0-9]*:[0-9]*\\])*\\n*;"
"gpu-agent:[0-9]*\\n*; Name:\t[a-zA-Z_]*\\n;Description:\t(.*)\\n*;Expression:\t(.)*\\n*;Block:\t[a-zA-Z]*\\n*;Dimensions:\t([A-Z_]*\\[[0-9]*:[0-9]*\\];Method:\t(.*);Unit:\t(.*);Minimum_Interval:\t[0-9]*;Maximum_Interval:\t[0-9]*)*\\n*;"
)
set_tests_properties(
rocprofv3-test-list-avail-trace-execute
PROPERTIES TIMEOUT 45 LABELS "integration-tests" ENVIRONMENT "${cc-env-list-metrics}"
FAIL_REGULAR_EXPRESSION "${ROCPROFILER_DEFAULT_FAIL_REGEX}")
set(VALIDATION_FILES
${CMAKE_CURRENT_BINARY_DIR}/out_counter_collection_2/metrics_basic_metrics.csv
${CMAKE_CURRENT_BINARY_DIR}/out_counter_collection_2/metrics_derived_metrics.csv)
${CMAKE_CURRENT_BINARY_DIR}/out_counter_collection_2/metrics_derived_metrics.csv
${CMAKE_CURRENT_BINARY_DIR}/out_counter_collection_2/metrics_pc_sample_config.csv)
add_test(
NAME rocprofv3-test-list-metrics-validate
NAME rocprofv3-test-list-avail-validate
COMMAND
${Python3_EXECUTABLE} ${CMAKE_CURRENT_BINARY_DIR}/validate.py
--derived-metrics-input
${CMAKE_CURRENT_BINARY_DIR}/out_counter_collection_2/metrics_derived_metrics.csv
--basic-metrics-input
${CMAKE_CURRENT_BINARY_DIR}/out_counter_collection_2/metrics_basic_metrics.csv)
${CMAKE_CURRENT_BINARY_DIR}/out_counter_collection_2/metrics_basic_metrics.csv
--pc-sample-config-input
${CMAKE_CURRENT_BINARY_DIR}/out_counter_collection_2/metrics_pc_sample_config.csv)
set_tests_properties(
rocprofv3-test-list-metrics-validate
rocprofv3-test-list-avail-validate
PROPERTIES TIMEOUT
45
LABELS
@@ -7,6 +7,7 @@ import pytest
def pytest_addoption(parser):
parser.addoption("--basic-metrics-input", action="store", help="Path to csv file.")
parser.addoption("--derived-metrics-input", action="store", help="Path to csv file.")
parser.addoption("--pc-sample-config-input", action="store", help="Path to csv file.")
@pytest.fixture
@@ -33,3 +34,16 @@ def basic_metrics_input_data(request):
data.append(row)
return data
@pytest.fixture
def pc_sample_config_input_data(request):
filename = request.config.getoption("--pc-sample-config-input")
data = []
if filename:
with open(filename, "r") as inp:
reader = csv.DictReader(inp)
for row in reader:
data.append(row)
return data
@@ -1,7 +1,7 @@
{
"jobs": [
{
"list_metrics": true
"list_avail": true
}
]
}
@@ -29,6 +29,15 @@ def test_validate_list_derived_metrics(derived_metrics_input_data):
row["Expression"] == "reduce(TA_TA_BUSY,min)"
def test_validate_list_pc_sample_config(pc_sample_config_input_data):
for row in pc_sample_config_input_data:
assert row["Agent_Id"].isdigit() == True
assert row["Method"] != ""
assert row["Unit"] != ""
assert row["Minimum_Interval"].isdigit() == True
assert row["Maximum_Interval"].isdigit() == True
if __name__ == "__main__":
exit_code = pytest.main(["-x", __file__] + sys.argv[1:])
sys.exit(exit_code)