Files
rocm-systems/tests/kfdtest/scripts/kfdtest.exclude
T
Felix Kuehling 5c742f3e5e kfdtest: Blacklist Fragmentation test on all chips
This test has been intermittently failing for various reasons and
was already disabled on all chips except Ellesmere. It stresses
memory management in unusual ways by having lots of memory allocated
but +# not mapped, which is not relevant to compute applications over
ROCr.



Change-Id: I6b791ca7e2e0fcfe93fc720063b4b56acfded751
Signed-off-by: Felix Kuehling <Felix.Kuehling@amd.com>
2018-08-03 20:14:46 -04:00

142 строки
5.1 KiB
Plaintext

# Permanent exclusions
# These tests are included for debugging, but are not executed in normal execution on any ASIC:
#
# Fragmentation test fails intermittently on different systems (see KFD-344). It
# stresses memory management in unusual ways by having lots of memory allocated but
# not mapped, which is not relevant to compute applications over ROCr.
#
# CU Masking Linear/Split are not working correctly due to how the HW distributes work over CUs.
# They are available for testing but are not currently expected to pass on CI/VI/AI.
PERMANENT_BLACKLIST_ALL_ASICS=\
"-KFDEventTest.MeasureInterruptConsumption:"\
"KFDLocalMemoryTest.Fragmentation:"\
"KFDQMTest.BasicCuMaskingLinear:"\
"RDMATest.GPUDirect"
# This is the temporary blacklist for all ASICs. This is to be used when a test is failing consistently
# on every ASIC (Kaveri, Carrizo, Hawaii, Tonga, Fiji, Polaris10, Polaris11 and Vega10 .
# TODO means that a JIRA ticket needs to be created for this issue, as no documentation regarding
# failures can be found
# NOTE: If you update this alphabetical listing, add the corresponding JIRA ticket for reference
#
# KFDGraphicsInterop.RegisterForeignDeviceMem (KFD-366)
# KFDPMTest.SuspendWith[ActiveProcess|IdleQueue|IdleQueueAfterWork] (KFD-326|327|328)
# KFDPNPTest.DisableAndCreateQueue (KFD-329)
# KFDQMTest.GPUDoorbellWrite fails intermittently (KFD-318)
# KFDQMTest.mGPUShareBO (KFD-334)
TEMPORARY_BLACKLIST_ALL_ASICS=\
"KFDGraphicsInterop.RegisterForeignDeviceMem:"\
"KFDPMTest.SuspendWithActiveProcess:"\
"KFDPMTest.SuspendWithIdleQueue:"\
"KFDPMTest.SuspendWithIdleQueueAfterWork:"\
"KFDPNPTest.DisableAndCreateQueue:"\
"KFDQMTest.GPUDoorbellWrite:"\
"KFDQMTest.mGPUShareBO"
BLACKLIST_ALL_ASICS=\
"$PERMANENT_BLACKLIST_ALL_ASICS:"\
"$TEMPORARY_BLACKLIST_ALL_ASICS"
# SDMA-based tests (KFDIPCTest.BasicTest, KFDQM.*Sdma*, KFDMemoryTest.MMBench) are all
# disabled on non-Hawaii due to SDMA instability - SWDEV-101666
SDMA_BLACKLIST=\
"KFDIPCTest.*:"\
"KFDMemoryTest.MMBench:"\
"KFDQMTest.*Sdma*:"\
"KFDQMTest.P2PTest"
# Anything involving CP queue creation is failing on Kaveri. Separate them here for convenience (KFD-336)
KV_QUEUE_BLACKLIST=\
"KFDExceptionTest.InvalidBadAddress:"\
"KFDExceptionTest.InvalidWriteAddress:"\
"KFDExceptionTest.InvalidPPR*:"\
"KFDLocalMemoryTest.*:"\
"KFDEventTest.Signal*Event*:"\
"KFDQMTest.CreateQueueStressSingleThreaded:"\
"KFDQMTest.*CpQueue*:"\
"KFDQMTest.*Dispatch*:"\
"KFDQMTest.Atomics:"\
"KFDQMTest.GPUDoorbellWrite"
# KFDQMTest.CpuWriteCoherence fails. 0 dwordsAvailable (KFD-338)
# KFDMemoryTest.MemoryRegister fails on SDMA queue creation (KFD-337)
KV_TESTS_BLACKLIST=\
"$BLACKLIST_ALL_ASICS:"\
"$SDMA_BLACKLIST:"\
"$KV_QUEUE_BLACKLIST:"\
"KFDMemoryTest.MemoryRegister:"\
"KFDQMTest.CpuWriteCoherence"
# KFDLocalMemoryTest.BasicTest is failing intermittently (KFD-368)
# KFDMemoryTest.BigBufferStressTest was failing intermittently on 4.9 and hangs when executed twice (KFD-312)
# KFDQMTest.GPUDoorbellWrite fails on Hawaii. Could be HW-related (KFD-342)
HI_TESTS_BLACKLIST=\
"$BLACKLIST_ALL_ASICS:"\
"KFDLocalMemoryTest.BasicTest:"\
"KFDMemoryTest.BigBufferStressTest:"\
"KFDQMTest.GPUDoorbellWrite"
CZ_TESTS_BLACKLIST=\
"$BLACKLIST_ALL_ASICS:"\
"$SDMA_BLACKLIST:"\
"KFDExceptionTest.InvalidWriteAddress"
# KFDPerfCountersTest.*Trace fail (KFD-339)
# KFDMemoryTest.QueryPointerInfo/MemoryRegister* (KFD-341)
# The remaining tests listed here fail on map memory to GPU with a VA conflict (KFD-340)
TONGA_TESTS_BLACKLIST=\
"$BLACKLIST_ALL_ASICS:"\
"$SDMA_BLACKLIST:"\
"KFDCWSRTest.BasicTest:"\
"KFDEventTest.*:"\
"KFDLocalMemoryTest.*:"\
"KFDMemoryTest.FlatScratchAccess:"\
"KFDMemoryTest.MapMemoryToGPU:"\
"KFDMemoryTest.MemoryRegister*:"\
"KFDMemoryTest.QueryPointerInfo:"\
"KFDPerfCountersTest.*:"\
"KFDDBGTest.BasicAddressWatch:"\
"KFDQMTest.*"
FIJI_TESTS_BLACKLIST=\
"$BLACKLIST_ALL_ASICS:"\
"$SDMA_BLACKLIST"
ELLESMERE_TESTS_BLACKLIST=\
"$BLACKLIST_ALL_ASICS:"\
"$SDMA_BLACKLIST"
BAFFIN_TESTS_BLACKLIST=\
"$BLACKLIST_ALL_ASICS:"\
"$SDMA_BLACKLIST"
# KFDDBG.BasicAddressWatch fails with message "E,INTERR: Setting ASIC VI (was previously set to GFX9), this changes the backend after we have already started parsing the shader, not currently supported by sp3, sorry." (KFD-317)
# KFDExceptionTest.InvalidBadAddress causes some following tests to fail on SRIOV (KFD-343)
# KFDQMTest.BasicCuMaskingEven fails intermittently (WIP)
# KFDExceptionTest.InvalidWriteAddress is failing once we enable no-retry (KFD-380)
VEGA10_TESTS_BLACKLIST=\
"$BLACKLIST_ALL_ASICS:"\
"KFDDBGTest.BasicAddressWatch:"\
"KFDExceptionTest.InvalidBadAddress:"\
"KFDExceptionTest.InvalidWriteAddress:"\
"KFDQMTest.CreateQueueStressSingleThreaded:"\
"KFDQMTest.GPUDoorbellWrite:"\
"KFDMemoryTest.MemoryRegister"
VEGA20_TESTS_BLACKLIST=\
"$BLACKLIST_ALL_ASICS:"\
"KFDDBGTest.BasicAddressWatch:"\
"KFDExceptionTest.InvalidBadAddress:"\
"KFDExceptionTest.InvalidWriteAddress:"\
"KFDQMTest.CreateQueueStressSingleThreaded:"\
"KFDQMTest.GPUDoorbellWrite:"\
"KFDMemoryTest.MemoryRegister"
RAVEN_TESTS_BLACKLIST=\
"$BLACKLIST_ALL_ASICS:"\
"KFDDBGTest.BasicAddressWatch:"\
"KFDQMTest.CreateQueueStressSingleThreaded:"\
"KFDQMTest.GPUDoorbellWrite:"\
"KFDMemoryTest.MemoryRegister"