94f4f56c40
* Initial commit: Need to implement wrapper function to collect data and test that wrapper function is correctly replacing core HSA functions
* Attempted to implement wrapper implementation for hsa memory allocation functions. Need to modify generate record files and test if implementation is working as expected
* Debugging and implementing generateCSV function
* Memory allocation size and starting address outputted to csv and json file formats
* Formatting
* Initial setup for OTF2 and Perfetto generation
* Collecting agent id for memory_allocation and formatting
* Modified memory_allocation.cpp to set up code for AMD_EXT commands
* Support for memory_pool_allocate added
* Removed accidently added file
* Made flag optional and added more OTF2 and Perfetto code. Needs testing to ensure perfetto and OTF2 works
* Formatting
* Fixed perfetto and otf2 output
* Fixed flag issue due to incorrect buffer use
* Updated documentation
* Small cleaning and comments
* Added test for HSA memory allocation tracing
* Fixed summary test validation errors due to allocation tracing. Added type to location_base to create unique event ids for allocation due to OTF2 trace error
* Decreased lower limit of hip calls for test
* Modified summary tests to vary number of allocate requests
* Minor fixes to address comments. Still need to address OTF2 comments
* Fix docs and changed OTF2 to use enum for type specified in location_base construction
* Fixed schema error
* Added vmem command tracking. Need to add test
* Updated test to work with vmem command and updated generateCSV to output int instead of hex string.
* OTF2 enum update and mispelling fix
* CI does not support Virtual Memory API. Removed vmem test. Will add back if CI is modifed to suport vmem API
* Update CMakeLists.txt for memory allocation test
* Updated summary test
* Minor fixes to address comments
* Moved domain_type.hpp enum to before LAST
* Fixed compile errors and formatting
* Fixed stats summary domain name error
* Added rocprofv3 test
* Page migration test fix
* Undo page migration test changes. Failures do not appear to have to do with memory allocation
[ROCm/rocprofiler-sdk commit: 3bd7773cf7]
153 satır
5.7 KiB
JSON
153 satır
5.7 KiB
JSON
{
|
|
"$schema": "http://json-schema.org/draft-07/schema#",
|
|
"type": "object",
|
|
"description": "Schema for the rocprofv3 JSON input",
|
|
"properties": {
|
|
"jobs": {
|
|
"type": "array",
|
|
"description": "rocprofv3 input data per application run",
|
|
"items": {
|
|
"type" : "object",
|
|
"description": "data for rocprofv3",
|
|
"properties": {
|
|
|
|
"pmc": {
|
|
"type" : "array",
|
|
"description": "list of counters to collect"
|
|
},
|
|
|
|
"kernel_include_regex":{
|
|
"type": "string",
|
|
"description": "Include the kernels matching this filter"
|
|
},
|
|
|
|
"kernel_exclude_regex": {
|
|
"type": "string",
|
|
"description": "Exclude the kernels matching this filter"
|
|
},
|
|
|
|
"kernel_iteration_range": {
|
|
"type": "string",
|
|
"description": "Iteration range for each kernel that match the filter [start-stop]"
|
|
},
|
|
|
|
"hip_trace": {
|
|
"type": "boolean",
|
|
"description": "For Collecting HIP Traces (runtime + compiler)"
|
|
},
|
|
|
|
"hip_runtime_trace": {
|
|
"type": "boolean",
|
|
"description": "For Collecting HIP Runtime API Traces"
|
|
},
|
|
|
|
"hip_compiler_trace": {
|
|
"type": "boolean",
|
|
"description": "For Collecting HIP Compiler generated code Traces"
|
|
},
|
|
|
|
"marker_trace": {
|
|
"type": "boolean",
|
|
"description": "For Collecting Marker (ROCTx) Traces"
|
|
},
|
|
|
|
"kernel_trace": {
|
|
"type": "boolean",
|
|
"description": "For Collecting Kernel Dispatch Traces"
|
|
},
|
|
|
|
"memory_copy_trace": {
|
|
"type": "boolean",
|
|
"description": "For Collecting Memory Copy Traces"
|
|
},
|
|
|
|
"memory_allocation_trace": {
|
|
"type": "boolean",
|
|
"description": "For Collecting Memory Allocation Traces"
|
|
},
|
|
|
|
"scratch_memory_trace": {
|
|
"type": "boolean",
|
|
"description": "For Collecting Scratch Memory operations Traces"
|
|
},
|
|
|
|
"stats": {
|
|
"type": "boolean",
|
|
"description": "For Collecting statistics of enabled tracing types"
|
|
},
|
|
|
|
"hsa_trace": {
|
|
"type": "boolean",
|
|
"description":"For Collecting HSA Traces (core + amd + image + finalizer)"
|
|
},
|
|
|
|
"hsa_core_trace": {
|
|
"type": "boolean",
|
|
"description": "For Collecting HSA API Traces (core API)"
|
|
},
|
|
|
|
"hsa_amd_trace": {
|
|
"type": "boolean",
|
|
"description": "For Collecting HSA API Traces (AMD-extension API)"
|
|
},
|
|
|
|
"hsa_finalize_trace": {
|
|
"type": "boolean",
|
|
"description": "For Collecting HSA API Traces (Finalizer-extension API)"
|
|
},
|
|
|
|
"hsa_image_trace": {
|
|
"type": "boolean",
|
|
"description": "For Collecting HSA API Traces (Image-extenson API)"
|
|
},
|
|
|
|
"sys_trace" : {
|
|
"type": "boolean",
|
|
"description": "For Collecting HIP, HSA, Marker (ROCTx), Memory copy, Memory allocation, Scratch memory, and Kernel dispatch traces"
|
|
},
|
|
|
|
"mangled_kernels": {
|
|
"type": "boolean",
|
|
"description": "Do not demangle the kernel names"
|
|
},
|
|
|
|
"truncate_kernels": {
|
|
"type": "boolean",
|
|
"description": "Truncate the demangled kernel names"
|
|
},
|
|
|
|
"output_file":{
|
|
"type": "string",
|
|
"description": "For the output file name"
|
|
},
|
|
|
|
"output_directory":{
|
|
"type": "string",
|
|
"description": "For adding output path where the output files will be saved"
|
|
},
|
|
|
|
"output_format":{
|
|
"type": "array",
|
|
"description": "For adding output format (supported formats: csv, json, pftrace)"
|
|
},
|
|
|
|
"list_metrics" : {
|
|
"type" : "boolean",
|
|
"description": "List the metrics"
|
|
},
|
|
|
|
"log_level":{
|
|
"type": "string",
|
|
"description": "fatal, error, warning, info, trace"
|
|
},
|
|
|
|
"preload":{
|
|
"type": "array",
|
|
"description": "Libraries to prepend to LD_PRELOAD (usually for sanitizers)"
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|