diff --git a/projects/rocprofiler-compute/src/omniperf_soc/profile_configs/gfx90a/pmc_tcc_perf.txt b/projects/rocprofiler-compute/src/omniperf_soc/profile_configs/gfx90a/pmc_tcc_perf.txt index 5586b0d3e0..0494f2b6f9 100644 --- a/projects/rocprofiler-compute/src/omniperf_soc/profile_configs/gfx90a/pmc_tcc_perf.txt +++ b/projects/rocprofiler-compute/src/omniperf_soc/profile_configs/gfx90a/pmc_tcc_perf.txt @@ -5,9 +5,8 @@ pmc: TCC_NC_REQ_sum TCC_UC_REQ_sum pmc: TCC_REQ_sum TCC_STREAMING_REQ_sum TCC_HIT_sum TCC_MISS_sum pmc: TCC_READ_sum TCC_WRITE_sum TCC_ATOMIC_sum TCC_WRITEBACK_sum pmc: TCC_EA_WRREQ_sum TCC_EA_WRREQ_64B_sum TCC_EA_WR_UNCACHED_32B_sum TCC_EA_WRREQ_DRAM_sum -pmc: TCC_EA_WRREQ_STALL_sum TCC_EA_WRREQ_IO_CREDIT_STALL_sum TCC_EA_WRREQ_GMI_CREDIT_STALL_sum TCC_EA_WRREQ_DRAM_CREDIT_STALL_sum +pmc: TCC_EA_WRREQ_STALL_sum pmc: TCC_EA_RDREQ_sum TCC_EA_RDREQ_32B_sum TCC_EA_RD_UNCACHED_32B_sum TCC_EA_RDREQ_DRAM_sum -pmc: TCC_EA_RDREQ_IO_CREDIT_STALL_sum TCC_EA_RDREQ_GMI_CREDIT_STALL_sum TCC_EA_RDREQ_DRAM_CREDIT_STALL_sum pmc: TCC_TAG_STALL_sum TCC_NORMAL_WRITEBACK_sum TCC_ALL_TC_OP_WB_WRITEBACK_sum TCC_NORMAL_EVICT_sum pmc: TCC_ALL_TC_OP_INV_EVICT_sum TCC_TOO_MANY_EA_WRREQS_STALL_sum TCC_EA_ATOMIC_sum pmc: TCC_EA_RDREQ_LEVEL_sum TCC_EA_WRREQ_LEVEL_sum TCC_EA_ATOMIC_LEVEL_sum diff --git a/projects/rocprofiler-compute/src/omniperf_soc/profile_configs/gfx940/pmc_tcc_perf.txt b/projects/rocprofiler-compute/src/omniperf_soc/profile_configs/gfx940/pmc_tcc_perf.txt index 923fc5b26c..3d0fc79d74 100644 --- a/projects/rocprofiler-compute/src/omniperf_soc/profile_configs/gfx940/pmc_tcc_perf.txt +++ b/projects/rocprofiler-compute/src/omniperf_soc/profile_configs/gfx940/pmc_tcc_perf.txt @@ -4,13 +4,11 @@ pmc: TCC_CYCLE_sum TCC_BUSY_sum pmc: TCC_NC_REQ_sum TCC_UC_REQ_sum TCC_CC_REQ_sum TCC_RW_REQ_sum pmc: TCC_REQ_sum TCC_STREAMING_REQ_sum TCC_HIT_sum TCC_MISS_sum pmc: TCC_READ_sum TCC_WRITE_sum TCC_ATOMIC_sum TCC_WRITEBACK_sum -pmc: TCC_EA0_WRREQ_sum TCC_EA0_WRREQ_64B_sum TCC_EA0_WR_UNCACHED_32B_sum -pmc: TCC_EA0_WRREQ_STALL_sum -pmc: TCC_TOO_MANY_EA_WRREQS_STALL_sum TCC_EA0_ATOMIC_sum TCC_EA0_RDREQ_sum TCC_EA0_RDREQ_32B_sum -pmc: TCC_EA0_RD_UNCACHED_32B_sum +pmc: TCC_EA0_WRREQ_sum TCC_EA0_WRREQ_64B_sum TCC_EA0_WR_UNCACHED_32B_sum TCC_EA0_WRREQ_DRAM_sum +pmc: TCC_EA0_RDREQ_sum TCC_EA0_RDREQ_32B_sum TCC_EA0_RD_UNCACHED_32B_sum TCC_EA0_RDREQ_DRAM_sum pmc: TCC_TAG_STALL_sum TCC_NORMAL_WRITEBACK_sum TCC_ALL_TC_OP_WB_WRITEBACK_sum TCC_NORMAL_EVICT_sum -pmc: TCC_ALL_TC_OP_INV_EVICT_sum TCC_EA0_RDREQ_DRAM_sum TCC_EA0_WRREQ_DRAM_sum -pmc: TCC_EA0_RDREQ_LEVEL_sum TCC_EA0_WRREQ_LEVEL_sum TCC_EA0_ATOMIC_LEVEL_sum +pmc: TCC_ALL_TC_OP_INV_EVICT_sum TCC_TOO_MANY_EA_WRREQS_STALL_sum TCC_EA0_ATOMIC_sum +pmc: TCC_EA0_RDREQ_LEVEL_sum TCC_EA0_WRREQ_LEVEL_sum TCC_EA0_ATOMIC_LEVEL_sum TCC_EA0_WRREQ_STALL_sum gpu: kernel: diff --git a/projects/rocprofiler-compute/src/omniperf_soc/soc_gfx940.py b/projects/rocprofiler-compute/src/omniperf_soc/soc_gfx940.py index 3e23f630a7..504f14a523 100644 --- a/projects/rocprofiler-compute/src/omniperf_soc/soc_gfx940.py +++ b/projects/rocprofiler-compute/src/omniperf_soc/soc_gfx940.py @@ -33,6 +33,7 @@ SOC_PARAM = { "numSE": 8, "numCU": 38, "numSIMD": 4, + "numPipes": 4, "numWavesPerCU": 32, "numSQC": 56, "L2Banks": 16, diff --git a/projects/rocprofiler-compute/src/omniperf_soc/soc_gfx941.py b/projects/rocprofiler-compute/src/omniperf_soc/soc_gfx941.py index bea911ac01..6b8865b820 100644 --- a/projects/rocprofiler-compute/src/omniperf_soc/soc_gfx941.py +++ b/projects/rocprofiler-compute/src/omniperf_soc/soc_gfx941.py @@ -33,6 +33,7 @@ SOC_PARAM = { "numSE": 8, "numCU": 38, "numSIMD": 4, + "numPipes": 4, "numWavesPerCU": 32, "numSQC": 56, "L2Banks": 16, diff --git a/projects/rocprofiler-compute/src/omniperf_soc/soc_gfx942.py b/projects/rocprofiler-compute/src/omniperf_soc/soc_gfx942.py index 77c21cde5d..064dd9792d 100644 --- a/projects/rocprofiler-compute/src/omniperf_soc/soc_gfx942.py +++ b/projects/rocprofiler-compute/src/omniperf_soc/soc_gfx942.py @@ -33,6 +33,7 @@ SOC_PARAM = { "numSE": 8, "numCU": 38, "numSIMD": 4, + "numPipes": 4, "numWavesPerCU": 32, "numSQC": 56, "L2Banks": 16,