Update CopyOnSignal shader for GFX12

Minor instruction changes for GFX12.

Change-Id: I78a37fa37950b378cdd2a1618c71c97c6ba66aac
Signed-off-by: David Belanger <david.belanger@amd.com>
Signed-off-by: Chris Freehill <cfreehil@amd.com>
Этот коммит содержится в:
David Belanger
2024-05-30 12:55:20 -04:00
коммит произвёл Chris Freehill
родитель 6e6f445f75
Коммит 39f4fbee10
+29 -10
Просмотреть файл
@@ -299,19 +299,38 @@ const char *CopyOnSignalIsa =
.else
s_mov_b32 s18, 0xcafe
.endif
POLLSIGNAL:
s_load_dword s16, s[0:1], 0x0 glc
s_cmp_eq_i32 s16, s18
s_cbranch_scc0 POLLSIGNAL
s_load_dword s17, s[0:1], 0x4 glc
s_waitcnt vmcnt(0) & lgkmcnt(0)
.if (.amdgcn.gfx_generation_number >= 10)
.if (.amdgcn.gfx_generation_number >= 12)
POLLSIGNAL:
s_load_dword s16, s[0:1], 0x0 scope:SCOPE_CU
s_cmp_eq_i32 s16, s18
s_cbranch_scc0 POLLSIGNAL
s_load_dword s17, s[0:1], 0x4 scope:SCOPE_CU
s_wait_kmcnt 0
v_mov_b32 v2, s17
flat_store_dword v[4:5], v2 glc
flat_store_dword v[4:5], v2 scope:SCOPE_CU
s_wait_storecnt 0
.else
s_store_dword s17, s[0:1], 0x8 glc
POLLSIGNAL:
s_load_dword s16, s[0:1], 0x0 glc
s_cmp_eq_i32 s16, s18
s_cbranch_scc0 POLLSIGNAL
s_load_dword s17, s[0:1], 0x4 glc
s_waitcnt vmcnt(0) & lgkmcnt(0)
.if (.amdgcn.gfx_generation_number >= 10)
v_mov_b32 v2, s17
flat_store_dword v[4:5], v2 glc
.else
s_store_dword s17, s[0:1], 0x8 glc
.endif
s_waitcnt vmcnt(0) & lgkmcnt(0)
.endif
s_waitcnt vmcnt(0) & lgkmcnt(0)
s_endpgm
)";