55cf0e237e
* Analysis report block based filtering for profiling
* Profiling mode changes
- The `-b` option now additionally accepts metric id(s), similar to the `-b` option in analyze mode (e.g. 6, 6.2, 6.23)
- Only counters mentioned in the selected analysis report blocks will be collected
- Add parsing logic to identify hardware counters from analysis report blocks
- Add filtering logic to only write filtered counters in perfmon files
- Log the counters that were not collected on a single line
- `--list-metrics` option added in profile mode to list possible metric id(s) similar to analyze mode
- Write arguments provided during profiling in profiling_configuration.yaml file
* Analysis mode changes
- During analysis mode, only show report blocks selected during profiling
- If `-b` option is provided in analysis mode, then follow provided filters
- Do not show empty tables in analysis report
* Miscellaneous changes
- Update CHANGELOG
- Add test cases
- Instruction mix report block filter
- Instruction mix and Memory chart report block filter
- Instruction mix report block filter and CPC hardware block filter
- TA hardware block filter
- --list-metrics in profile mode should work
- Move binary handler fixtures to conftest.py to avoid importing
fixtures
- cmake file in tests directory has been updated to compile sample/vmem.hip for testing
* Public documentation changes
- Use the term "Hardware report block" instead of "Hardware block"
- Add documentation for "--list-metrics" option in profile mode
- Add example of filtering by hardware report block such as instruction
mix and wavefront launch statistics
- Add deprecation warning for hardware component (sq, tcc) based filtering
74 خطوط
979 B
TOML
74 خطوط
979 B
TOML
[project]
name = "rocprof_compute"
# NOTE(review): PEP 621 expects `version` to be set here or listed under
# `dynamic`; neither key appears in this table -- confirm how the version
# is supplied.
requires-python = ">=3.8"
|
|
|
|
[project.optional-dependencies]
# Formatting and lint tooling used by contributors; configured by the
# [tool.black] and [tool.isort] tables in this file.
developer = [
    "black>=22.6.0",
    "isort>=5.12.0",
    "pre-commit",
]
|
|
|
|
[tool.black]
line-length = 90
include = '\.py$'
# Directories Black must skip. A multi-line pattern is compiled by Black as
# a verbose regex, so the layout whitespace below is not part of the match.
# Every literal dot is escaped so that it only matches a real ".".
exclude = '''
(
  /(
      \.eggs
    | \.git
    | \.github
    | \.tox
    | \.venv
    | \.misc
    | \.vscode
    | \.pyc
    | dist
    | external
    | \.pytest_cache
    | build
    | build-rocprof_compute
  )/
)
'''
|
|
|
|
[tool.isort]
# Use isort's Black-compatible profile so the two formatters agree.
profile = "black"
|
|
|
|
[tool.pytest.ini_options]
addopts = [
    "--import-mode=importlib",
]

# Directories added to sys.path for the test session.
pythonpath = [
    ".",
    "src",
    "src/rocprof_compute_soc",
    "src/utils",
    "src/rocprof_compute_analyze/utils",
    "tests",
]

# Custom markers registered with pytest. Each name is listed exactly once.
markers = [
    "section",
    "kernel_execution",
    "block",
    "misc",
    "mem",
    "sort",
    "join",
    "verbosity",
    "dispatch",
    "list_metrics",
    "filter_block",
    "filter_kernel",
    "normal_unit",
    "max_stat",
    "time_unit",
    "decimal",
    "col",
    "kernel_verbose",
    "serial",
]
|