Fix Stochastic sampling trap handler

The trap handler should read the PERF_SNAPSHOT_DATA after all of
PERF_SNAPSHOT_DATA, PERF_SNAPSHOT_PC_LO and PERF_SNAPSHOT_PC_HI.  This
patch fixes this.

Change-Id: I7f78e16d7a0d8bfebb34906b4dff73c2eaeb5658
Этот коммит содержится в:
Lancelot SIX
2025-03-21 14:38:01 +00:00
коммит произвёл Six, Lancelot
родитель eece210a5c
Коммит 6a4785f650
+3 -3
Просмотреть файл
@@ -507,12 +507,12 @@ trap_entry:
s_waitcnt lgkmcnt(0) // Wait for timestamp
s_store_dwordx2 ttmp[4:5], ttmp[2:3] 0x30 // Store timestamp
s_getreg_b32 ttmp4, hwreg(HW_REG_SQ_PERF_SNAPSHOT_DATA)
s_getreg_b32 ttmp5, hwreg(HW_REG_SQ_PERF_SNAPSHOT_DATA1)
s_store_dwordx2 ttmp[4:5], ttmp[2:3], 0x24 // store snapshot PC
s_getreg_b32 ttmp4, hwreg(HW_REG_SQ_PERF_SNAPSHOT_PC_LO)
s_getreg_b32 ttmp5, hwreg(HW_REG_SQ_PERF_SNAPSHOT_PC_HI)
s_store_dwordx2 ttmp[4:5], ttmp[2:3] 0x00 // store snapshot data
s_getreg_b32 ttmp5, hwreg(HW_REG_SQ_PERF_SNAPSHOT_DATA1)
s_getreg_b32 ttmp4, hwreg(HW_REG_SQ_PERF_SNAPSHOT_DATA)
s_store_dwordx2 ttmp[4:5], ttmp[2:3], 0x24 // store snapshot PC
s_mov_b32 ttmp6, exec_lo
s_store_dword ttmp6, ttmp[2:3], 0x8 // store EXEC_LO