Files
rocm-systems/tests/test_utils.py
T
vedithal-amd 55cf0e237e Analysis report block based filtering for profiling (#566)
* Analysis report block based filtering for profiling

* Profiling mode changes

- `-b` option now additionally accepts metric id(s), similar to `-b` option in analyze mode (e.g. 6, 6.2, 6.23)
    - Only counters mentioned in the selected analysis report blocks will be collected
        - Add parsing logic to identify hardware counters from analysis report blocks
        - Add filtering logic to only write filtered counters in perfmon files
        - Log counters that were not collected on a single line
- `--list-metrics` option added in profile mode to list possible metric id(s) similar to analyze mode
- Write arguments provided during profiling in profiling_configuration.yaml file

* Analysis mode changes

- During analysis mode, only show report blocks selected during profiling
    - If `-b` option is provided in analysis mode, then follow provided filters
- Do not show empty tables in analysis report

* Miscellaneous changes

- Update CHANGELOG
- Add test cases
    - Instruction mix report block filter
    - Instruction mix and Memory chart report block filter
    - Instruction mix report block filter and CPC hardware block filter
    - TA hardware block filter
    - --list-metrics in profile mode should work
- Move binary handler fixtures to conftest.py to avoid importing
  fixtures
- cmake file in tests directory has been updated to compile sample/vmem.hip for testing

* Public documentation changes

- Use the term "Hardware report block" instead of "Hardware block"
- Add documentation for "--list-metrics" option in profile mode
- Add example of filtering by hardware report block such as instruction
  mix and wavefront launch statistics
- Add deprecation warning for hardware component (sq, tcc) based filtering
2025-03-10 14:42:56 -04:00

136 lines
4.8 KiB
Python

##############################################################################bl
# MIT License
#
# Copyright (c) 2021 - 2025 Advanced Micro Devices, Inc. All Rights Reserved.
#
# Permission is hereby granted, free of charge, to any person obtaining a copy
# of this software and associated documentation files (the "Software"), to deal
# in the Software without restriction, including without limitation the rights
# to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
# copies of the Software, and to permit persons to whom the Software is
# furnished to do so, subject to the following conditions:
#
# The above copyright notice and this permission notice shall be included in all
# copies or substantial portions of the Software.
#
# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
# SOFTWARE.
##############################################################################el
# Common helper routines for testing collateral
import inspect
import os
import re
import shutil
from pathlib import Path
import pandas as pd
def check_resource_allocation():
    """Check if CTEST resource allocation is enabled for parallel testing and set
    HIP_VISIBLE_DEVICES variable accordingly with assigned gpu index.

    Nothing happens unless ``CTEST_RESOURCE_GROUP_COUNT`` is present in the
    environment. When it is, ``CTEST_RESOURCE_GROUP_0_GPUS`` is scanned and the
    value of its first ``id:<value>`` entry is written to
    ``HIP_VISIBLE_DEVICES``. Entries that are not of the form ``key:value``
    are ignored instead of raising.
    """
    if "CTEST_RESOURCE_GROUP_COUNT" not in os.environ:
        return

    resource = os.environ.get("CTEST_RESOURCE_GROUP_0_GPUS")
    if resource is None:
        return

    # extract assigned gpu id from env var: example format -> 'id:0,slots:1'
    for item in resource.split(","):
        # partition() never raises; an entry without ':' yields an empty
        # separator and is skipped rather than aborting the test session.
        key, separator, value = item.partition(":")
        if separator and key == "id":
            os.environ["HIP_VISIBLE_DEVICES"] = value
            return
def check_file_pattern(pattern, file_path):
    """Check if the given pattern exists in the file.

    Args:
        pattern (str or compiled pattern): regular expression to look for
        file_path (str or path-like): file whose whole content is searched

    Returns:
        bool: True when the pattern matches somewhere in the file content
    """
    with open(file_path) as f:
        content = f.read()
    # Only existence matters, so stop at the first match instead of
    # collecting every match with findall().
    return re.search(pattern, content) is not None
def get_output_dir(suffix="_output", clean_existing=True):
    """Build an output directory name from the calling function's name.

    Args:
        suffix (str, optional): text appended to the caller's function name.
            Defaults to "_output".
        clean_existing (bool, optional): when True, a path that already exists
            under the resulting name is removed with shutil.rmtree. Defaults
            to True.

    Returns:
        str: caller's function name followed by suffix. The directory itself
        is not created here.
    """
    # Entry 0 of the stack is this helper; entry 1 is whoever called it.
    caller_name = inspect.stack()[1].function
    target = caller_name + suffix
    if clean_existing and Path(target).exists():
        shutil.rmtree(target)
    return target
def setup_workload_dir(input_dir, suffix="_tmp", clean_existing=True):
    """Provides a unique input workload directory with contents of input_dir
    based on the name of the calling test function.

    Setup is a NOOP when tests run serially, i.e. when
    PYTEST_XDIST_WORKER_COUNT is not set in the environment.

    Args:
        input_dir (str): directory whose contents are copied
        suffix (str, optional): text appended to the caller's function name to
            form the copy's name. Defaults to "_tmp".
        clean_existing (bool, optional): Whether to remove an existing copy
            first. When False, input_dir is copied over whatever is already
            there. Defaults to True.

    Returns:
        str: input_dir itself when running serially, otherwise the name of the
        per-test copy.
    """
    if "PYTEST_XDIST_WORKER_COUNT" not in os.environ:
        return input_dir

    # Entry 1 of the stack is the function that called this helper.
    output_dir = inspect.stack()[1].function + suffix
    if clean_existing and Path(output_dir).exists():
        shutil.rmtree(output_dir)
    # dirs_exist_ok lets clean_existing=False reuse a directory left behind by
    # an earlier run instead of failing with FileExistsError.
    shutil.copytree(input_dir, output_dir, dirs_exist_ok=True)
    return output_dir
def clean_output_dir(cleanup, output_dir):
    """Remove output directory generated from rocprofiler-compute execution.

    Removal is best effort: an OSError raised by shutil.rmtree is reported as
    a printed warning and not propagated.

    Args:
        cleanup (boolean): flag to enable/disable directory cleanup
        output_dir (string): name of directory to remove
    """
    if not cleanup or not Path(output_dir).exists():
        return
    try:
        shutil.rmtree(output_dir)
    except OSError as e:
        # Report the real failure; rmtree handles non-empty directories, so
        # the cause is something else (permissions, not a directory, ...).
        print(f"WARNING: unable to remove {output_dir}: {e}")
def check_csv_files(output_dir, num_devices, num_kernels):
    """Check profiling output csv files for expected number of entries (based on kernel invocations)

    Args:
        output_dir (string or path-like): output directory containing csv files
        num_devices (int): minimum number of rows required in every csv file
            whose name contains "roofline"
        num_kernels (int): number of kernels expected to have been profiled;
            minimum number of rows required in every other csv file whose name
            does not contain "sysinfo"

    Returns:
        dict: dictionary housing file contents as pandas dataframe, keyed by
        file name; files ending in ".pdf" map to the string "pdf"

    Raises:
        AssertionError: if a checked csv file has fewer rows than required
    """
    file_dict = {}
    for file in os.listdir(output_dir):
        if file.endswith(".csv"):
            # os.path.join accepts both str and path-like directories
            frame = pd.read_csv(os.path.join(output_dir, file))
            file_dict[file] = frame
            rows = len(frame.index)
            if "roofline" in file:
                assert (
                    rows >= num_devices
                ), f"{file}: expected at least {num_devices} rows, found {rows}"
            elif "sysinfo" not in file:
                assert (
                    rows >= num_kernels
                ), f"{file}: expected at least {num_kernels} rows, found {rows}"
        elif file.endswith(".pdf"):
            # pdf content is not parsed, only its presence is recorded
            file_dict[file] = "pdf"
    return file_dict