42cc721a4b
* remove references to --kernel-names * ruff format * remove redundant comments * update docs and roofline image * added two output lines to docs
62 строки
2.4 KiB
Bash
Исполняемый файл
62 строки
2.4 KiB
Bash
Исполняемый файл
#!/bin/bash
|
|
declare -A commands=(
|
|
[path]=' '
|
|
[no_roof]='--no-roof'
|
|
[kernel_names]='--roof-only'
|
|
[device_filter]='--device 0'
|
|
[kernel]='--kernel "vecCopy(double*, double*, double*, int, int) [clone .kd]"'
|
|
[ipblocks_SQ]='-b SQ'
|
|
[ipblocks_SQC]='-b SQC'
|
|
[ipblocks_TA]='-b TA'
|
|
[ipblocks_TD]='-b TD'
|
|
[ipblocks_TCP]='-b TCP'
|
|
[ipblocks_TCC]='-b TCC'
|
|
[ipblocks_SPI]='-b SPI'
|
|
[ipblocks_CPC]='-b CPC'
|
|
[ipblocks_CPF]='-b CPF'
|
|
[ipblocks_SQ_CPC]='-b SQ CPC'
|
|
[ipblocks_SQ_TA]='-b SQ TA'
|
|
[ipblocks_SQ_SPI]='-b SQ SPI'
|
|
[ipblocks_SQ_SQC_TCP_CPC]='-b SQ SQC TCP CPC'
|
|
[ipblocks_SQ_SPI_TA_TCC_CPF]='-b SQ SPI TA TCC CPF'
|
|
[dispatch_0]='--dispatch 0'
|
|
[dispatch_0_1]='--dispatch 0:2'
|
|
[dispatch_2]='--dispatch 1'
|
|
[kernel_verbose_0]='--kernel-verbose 0'
|
|
[kernel_verbose_1]='--kernel-verbose 1'
|
|
[kernel_verbose_2]='--kernel-verbose 2'
|
|
[kernel_verbose_3]='--kernel-verbose 3'
|
|
[kernel_verbose_4]='--kernel-verbose 4'
|
|
[kernel_verbose_5]='--kernel-verbose 5'
|
|
[join_type_grid]='--join-type grid'
|
|
[join_type_kernel]='--join-type kernel'
|
|
[sort_dispatches]='--roof-only --sort dispatches'
|
|
[sort_kernels]='--roof-only --sort kernels'
|
|
[mem_levels_HBM]='--roof-only --mem-level HBM'
|
|
[mem_levels_L2]='--roof-only --mem-level L2'
|
|
[mem_levels_vL1D]='--roof-only --mem-level vL1D'
|
|
[mem_levels_LDS]='--roof-only --mem-level LDS'
|
|
[mem_levels_HBM_LDS]='--roof-only --mem-level HBM LDS'
|
|
[mem_levels_vL1d_LDS]='--roof-only --mem-level vL1D LDS'
|
|
[mem_levels_L2_vL1d_LDS]='--roof-only --mem-level L2 vL1D LDS'
|
|
#########################################################
|
|
# Attempt to break rocprofiler-compute #
|
|
#########################################################
|
|
[dispatch_7]='--dispatch 7'
|
|
[dispatch_6_8]='--dispatch 6:8'
|
|
[dispatch_inv]='--dispatch invalid'
|
|
[kernel_substr]='--kernel vecCopy'
|
|
[kernel_inv_str]='--kernel vecPaste'
|
|
[kernel_inv_int]='--kernel 42'
|
|
[device_inv]='--device invalid' # does not generate a workload
|
|
[device_inv_int]='--device -1'
|
|
)
|
|
soc=MI300X_A1
|
|
echo "starting"
|
|
for key in "${!commands[@]}"; do
|
|
echo profiling $key;
|
|
command="${commands[$key]}"
|
|
echo "$key = ./src/rocprof-compute profile -n $key ${dirs[@]}"
|
|
./src/rocprof-compute profile -n $key $command -p tests/workloads/$key/$soc -- ./tests/vcopy -n 1048576 -b 256 -i 3 ;
|
|
echo "done" ; done
|