Files
rocm-systems/projects/rocr-runtime/rocrtst/suites/test_common/main.cc
T
2026-01-21 10:39:50 +08:00

706 řádky
18 KiB
C++

/*
* =============================================================================
* ROC Runtime Conformance Release License
* =============================================================================
* The University of Illinois/NCSA
* Open Source License (NCSA)
*
* Copyright (c) 2017, Advanced Micro Devices, Inc.
* All rights reserved.
*
* Developed by:
*
* AMD Research and AMD ROC Software Development
*
* Advanced Micro Devices, Inc.
*
* www.amd.com
*
* Permission is hereby granted, free of charge, to any person obtaining a copy
* of this software and associated documentation files (the "Software"), to
* deal with the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* - Redistributions of source code must retain the above copyright notice,
* this list of conditions and the following disclaimers.
* - Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimers in
* the documentation and/or other materials provided with the distribution.
* - Neither the names of <Name of Development Group, Name of Institution>,
* nor the names of its contributors may be used to endorse or promote
* products derived from this Software without specific prior written
* permission.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE CONTRIBUTORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR
* OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
* ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS WITH THE SOFTWARE.
*
*/
#include <string>
#include <vector>
#include <memory>
#include "gtest/gtest.h"
#include "suites/functional/agent_props.h"
#include "suites/functional/debug_basic.h"
#include "suites/functional/memory_basic.h"
#include "suites/functional/memory_access.h"
#include "suites/functional/ipc.h"
#include "suites/functional/memory_alignment.h"
#include "suites/functional/memory_atomics.h"
#include "suites/functional/memory_allocation.h"
#include "suites/functional/deallocation_notifier.h"
#include "suites/functional/virtual_memory.h"
#include "suites/functional/svm_memory.h"
#include "suites/performance/dispatch_time.h"
#include "suites/performance/memory_async_copy.h"
#include "suites/performance/memory_async_copy_numa.h"
#include "suites/performance/memory_async_copy_on_engine.h"
#include "suites/performance/enqueueLatency.h"
#include "suites/negative/memory_allocate_negative_tests.h"
#include "suites/negative/queue_validation.h"
#include "suites/stress/memory_concurrent_tests.h"
#include "suites/stress/queue_write_index_concurrent_tests.h"
#include "suites/test_common/test_case_template.h"
#include "suites/test_common/main.h"
#include "suites/test_common/test_common.h"
#include "suites/functional/concurrent_init.h"
#include "suites/functional/concurrent_init_shutdown.h"
#include "suites/functional/concurrent_shutdown.h"
#include "suites/functional/reference_count.h"
#include "suites/functional/signal_concurrent.h"
#include "suites/functional/aql_barrier_bit.h"
#include "suites/functional/signal_kernel.h"
#include "suites/functional/cu_masking.h"
#include "suites/functional/filter_devices.h"
#include "amd_smi/amdsmi.h"
#include "common/common.h"
#include "common/os.h"
static RocrTstGlobals *sRocrtstGlvalues = nullptr;
static void SetFlags(TestBase *test) {
assert(sRocrtstGlvalues != nullptr);
test->set_num_iteration(sRocrtstGlvalues->num_iterations);
test->set_verbosity(sRocrtstGlvalues->verbosity);
test->set_monitor_verbosity(sRocrtstGlvalues->monitor_verbosity);
}
static void RunCustomTestProlog(TestBase *test) {
SetFlags(test);
test->DisplayTestInfo();
test->SetUp();
test->Run();
return;
}
static void RunCustomTestEpilog(TestBase *test) {
test->DisplayResults();
test->Close();
return;
}
// If the test case one big test, you should use RunGenericTest()
// to run the test case. OTOH, if the test case consists of multiple
// functions to be run as separate tests, follow this pattern:
// * RunCustomTestProlog(test) // Run() should contain minimal code
// * <insert call to actual test function within test case>
// * RunCustomTestEpilog(test)
static void RunGenericTest(TestBase *test) {
RunCustomTestProlog(test);
RunCustomTestEpilog(test);
return;
}
// TEST ENTRY TEMPLATE:
// TEST(rocrtst, Perf_<test name>) {
// <Test Implementation class> <test_obj>;
//
// // Copy and modify implementation of RunGenericTest() if you need to deviate
// // from the standard pattern implemented there.
// RunGenericTest(&<test_obj>);
// }
TEST(rocrtst, Test_Example) {
TestExample tst;
RunGenericTest(&tst);
}
TEST(rocrtst, Test_Example_InterruptDisabled) {
TestExample tst;
rocrtst::SetEnv("HSA_ENABLE_INTERRUPT", "0");
RunGenericTest(&tst);
}
TEST(rocrtstFunc, MemoryAccessTests) {
MemoryAccessTest mt;
RunCustomTestProlog(&mt);
mt.CPUAccessToGPUMemoryTest();
mt.GPUAccessToCPUMemoryTest();
RunCustomTestEpilog(&mt);
}
TEST(rocrtstFunc, MemoryAccessCoherent) {
MemoryAccessTest mt;
RunCustomTestProlog(&mt);
mt.MemoryAccessCoherentTest();
RunCustomTestEpilog(&mt);
}
TEST(rocrtstFunc, GroupMemoryAllocationTest) {
MemoryAllocationTest ma(true, false);
RunCustomTestProlog(&ma);
ma.GroupMemoryDynamicAllocation();
RunCustomTestEpilog(&ma);
}
TEST(rocrtstFunc, MemoryAllocateAndFreeTest) {
MemoryAllocationTest ma(false, true);
RunCustomTestProlog(&ma);
ma.MemoryBasicAllocationAndFree();
RunCustomTestEpilog(&ma);
}
TEST(rocrtstFunc, MemoryAllocateContiguousTest) {
MemoryAllocationTest ma(false, true);
RunCustomTestProlog(&ma);
ma.MemoryAllocateContiguousTest();
RunCustomTestEpilog(&ma);
}
TEST(rocrtstFunc, Concurrent_Init_Test) {
ConcurrentInitTest ci;
RunCustomTestProlog(&ci);
ci.TestConcurrentInit();
RunCustomTestEpilog(&ci);
}
TEST(rocrtstFunc, Concurrent_Init_Shutdown_Test) {
ConcurrentInitShutdownTest ci;
RunCustomTestProlog(&ci);
ci.TestConcurrentInitShutdown();
RunCustomTestEpilog(&ci);
}
TEST(rocrtstFunc, Concurrent_Shutdown) {
ConcurrentShutdownTest cs;
RunCustomTestProlog(&cs);
cs.TestConcurrentShutdown();
RunCustomTestEpilog(&cs);
}
TEST(rocrtstFunc, Reference_Count) {
ReferenceCountTest rc(true, false);
RunCustomTestProlog(&rc);
rc.TestReferenceCount();
RunCustomTestEpilog(&rc);
}
TEST(rocrtstFunc, Max_Reference_Count) {
ReferenceCountTest rc(false, true);
RunCustomTestProlog(&rc);
rc.TestMaxReferenceCount();
RunCustomTestEpilog(&rc);
}
TEST(rocrtstFunc, Signal_Destroy_Concurrently) {
SignalConcurrentTest sd(true, false, false, false);
RunCustomTestProlog(&sd);
sd.TestSignalDestroyConcurrent();
RunCustomTestEpilog(&sd);
}
TEST(rocrtstFunc, Signal_Max_Consumer) {
SignalConcurrentTest sd(false, true, false, false);
RunCustomTestProlog(&sd);
sd.TestSignalCreateMaxConsumers();
RunCustomTestEpilog(&sd);
}
TEST(rocrtstFunc, Signal_Create_Concurrently) {
SignalConcurrentTest sd(false, false, false, true);
RunCustomTestProlog(&sd);
sd.TestSignalCreateConcurrent();
RunCustomTestEpilog(&sd);
}
/* Temporary: Disable CU Masking until it is fixed */
TEST(rocrtstFunc, DISABLED_CU_Masking) {
CU_Masking sd;
RunGenericTest(&sd);
}
TEST(rocrtstFunc, IPC) {
RUN_IF_NOT_EMU_MODE(
IPCTest ipc;
RunGenericTest(&ipc);
);
}
TEST(rocrtstFunc, DISABLED_Signal_Kernel_Set) {
RUN_IF_NOT_EMU_MODE(
SignalKernelTest sk(SET);
RunCustomTestProlog(&sk);
sk.TestSignalKernelSet();
RunCustomTestEpilog(&sk);
);
}
TEST(rocrtstFunc, DISABLED_Signal_Kernel_Multi_Set) {
RUN_IF_NOT_EMU_MODE(
SignalKernelTest sk(MULTISET);
RunCustomTestProlog(&sk);
sk.TestSignalKernelMultiSet();
RunCustomTestEpilog(&sk);
);
}
TEST(rocrtstFunc, DISABLED_Signal_Kernel_Wait) {
RUN_IF_NOT_EMU_MODE(
SignalKernelTest sw(WAIT);
RunCustomTestProlog(&sw);
sw.TestSignalKernelWait();
RunCustomTestEpilog(&sw);
);
}
TEST(rocrtstFunc, DISABLED_Signal_Kernel_Multi_Wait) {
RUN_IF_NOT_EMU_MODE(
SignalKernelTest sw(MULTIWAIT);
RunCustomTestProlog(&sw);
sw.TestSignalKernelMultiWait();
RunCustomTestEpilog(&sw);
);
}
TEST(rocrtstFunc, DISABLED_Aql_Barrier_Bit_Set) {
RUN_IF_NOT_EMU_MODE(
AqlBarrierBitTest ab(true, false);
RunCustomTestProlog(&ab);
ab.BarrierBitSet();
RunCustomTestEpilog(&ab);
);
}
TEST(rocrtstFunc, DISABLED_Aql_Barrier_Bit_Not_Set) {
RUN_IF_NOT_EMU_MODE(
AqlBarrierBitTest ab(false, true);
RunCustomTestProlog(&ab);
ab.BarrierBitNotSet();
RunCustomTestEpilog(&ab);
);
}
TEST(rocrtstFunc, Memory_Max_Mem) {
RUN_IF_NOT_EMU_MODE(
MemoryTest mt;
RunCustomTestProlog(&mt);
mt.MaxSingleAllocationTest();
RunCustomTestEpilog(&mt);
);
}
TEST(rocrtstFunc, Memory_Available) {
RUN_IF_NOT_EMU_MODE(
MemoryTest mt;
RunCustomTestProlog(&mt);
mt.MemAvailableTest();
RunCustomTestEpilog(&mt);
);
}
TEST(rocrtstFunc, Memory_Atomic_Add_Test) {
RUN_IF_NOT_EMU_MODE(
MemoryAtomic ma(ADD);
RunCustomTestProlog(&ma);
ma.MemoryAtomicTest();
RunCustomTestEpilog(&ma);
);
}
TEST(rocrtstFunc, Memory_Atomic_Sub_Test) {
RUN_IF_NOT_EMU_MODE(
MemoryAtomic ma(SUB);
RunCustomTestProlog(&ma);
ma.MemoryAtomicTest();
RunCustomTestEpilog(&ma);
);
}
TEST(rocrtstFunc, Memory_Atomic_And_Test) {
RUN_IF_NOT_EMU_MODE(
MemoryAtomic ma(AND);
RunCustomTestProlog(&ma);
ma.MemoryAtomicTest();
RunCustomTestEpilog(&ma);
);
}
TEST(rocrtstFunc, Memory_Atomic_Or_Test) {
RUN_IF_NOT_EMU_MODE(
MemoryAtomic ma(OR);
RunCustomTestProlog(&ma);
ma.MemoryAtomicTest();
RunCustomTestEpilog(&ma);
);
}
TEST(rocrtstFunc, Memory_Atomic_Xor_Test) {
RUN_IF_NOT_EMU_MODE(
MemoryAtomic ma(XOR);
RunCustomTestProlog(&ma);
ma.MemoryAtomicTest();
RunCustomTestEpilog(&ma);
);
}
TEST(rocrtstFunc, Memory_Atomic_Min_Test) {
RUN_IF_NOT_EMU_MODE(
MemoryAtomic ma(MIN);
RunCustomTestProlog(&ma);
ma.MemoryAtomicTest();
RunCustomTestEpilog(&ma);
);
}
TEST(rocrtstFunc, Memory_Atomic_Max_Test) {
RUN_IF_NOT_EMU_MODE(
MemoryAtomic ma(MAX);
RunCustomTestProlog(&ma);
ma.MemoryAtomicTest();
RunCustomTestEpilog(&ma);
);
}
TEST(rocrtstFunc, Memory_Atomic_Inc_Test) {
RUN_IF_NOT_EMU_MODE(
MemoryAtomic ma(INC);
RunCustomTestProlog(&ma);
ma.MemoryAtomicTest();
RunCustomTestEpilog(&ma);
);
}
TEST(rocrtstFunc, Memory_Atomic_Dec_Test) {
RUN_IF_NOT_EMU_MODE(
MemoryAtomic ma(DEC);
RunCustomTestProlog(&ma);
ma.MemoryAtomicTest();
RunCustomTestEpilog(&ma);
);
}
TEST(rocrtstFunc, Memory_Atomic_Xchg_Test) {
RUN_IF_NOT_EMU_MODE(
MemoryAtomic ma(XCHG);
RunCustomTestProlog(&ma);
ma.MemoryAtomicTest();
RunCustomTestEpilog(&ma);
);
}
TEST(rocrtstFunc, DISABLED_DebugBasicTests) {
RUN_IF_NOT_EMU_MODE(
DebugBasicTest mt;
RunCustomTestProlog(&mt);
mt.VectorAddDebugTrapTest();
RunCustomTestEpilog(&mt);
);
}
TEST(rocrtstFunc, Memory_Alignment_Test) {
RUN_IF_NOT_EMU_MODE(
MemoryAlignmentTest ma;
RunCustomTestProlog(&ma);
ma.MemoryPoolAlignment();
RunCustomTestEpilog(&ma);
);
}
TEST(rocrtstFunc, Deallocation_Notifier_Test) {
RUN_IF_NOT_EMU_MODE(
DeallocationNotifierTest notifier;
RunGenericTest(&notifier);
);
}
TEST(rocrtstFunc, AgentPropertiesTests) {
RUN_IF_NOT_EMU_MODE(
AgentPropTest propTest;
RunCustomTestProlog(&propTest);
propTest.QueryAgentUUID();
propTest.QueryAgentClockCounters();
RunCustomTestEpilog(&propTest);
);
}
TEST(rocrtstFunc, SvmMemory_Basic_Test) {
RUN_IF_NOT_EMU_MODE(
SvmMemoryTestBasic smt;
RunCustomTestProlog(&smt);
smt.TestCreateDestroy();
smt.TestSVMPrefetch();
RunCustomTestEpilog(&smt);
);
}
TEST(rocrtstFunc, VirtMemory_Basic_Test) {
RUN_IF_NOT_EMU_MODE(
VirtMemoryTestBasic vmt;
RunCustomTestProlog(&vmt);
vmt.TestCreateDestroy();
vmt.TestRefCount();
vmt.TestPartialMapping();
RunCustomTestEpilog(&vmt);
);
}
TEST(rocrtstFunc, VirtMemory_Access_Test) {
RUN_IF_NOT_EMU_MODE(
VirtMemoryTestBasic vmt;
RunCustomTestProlog(&vmt);
vmt.CPUAccessToGPUMemoryTest();
vmt.GPUAccessToCPUMemoryTest();
vmt.GPUAccessToGPUMemoryTest();
RunCustomTestEpilog(&vmt);
);
}
TEST(rocrtstFunc, VirtMemory_Accounting_Test) {
RUN_IF_NOT_EMU_MODE(
VirtMemoryTestBasic vmt;
RunCustomTestProlog(&vmt);
vmt.MemoryAccountingTest();
RunCustomTestEpilog(&vmt);
);
}
TEST(rocrtstFunc, VirtMemory_Interprocess_Test) {
RUN_IF_NOT_EMU_MODE(
VirtMemoryTestInterProcess vmt;
RunCustomTestProlog(&vmt);
RunCustomTestEpilog(&vmt);
);
}
TEST(rocrtstFunc, Filter_Devices_Test) {
RUN_IF_NOT_EMU_MODE(
FilterDevicesTest fd;
RunCustomTestProlog(&fd);
fd.TestRocrVisibleDevicesFiltering();
RunCustomTestEpilog(&fd);
);
}
TEST(rocrtstNeg, Memory_Negative_Tests) {
RUN_IF_NOT_EMU_MODE(
MemoryAllocateNegativeTest mt;
RunCustomTestProlog(&mt);
mt.ZeroMemoryAllocateTest();
mt.MaxMemoryAllocateTest();
// Disabled temporarily - Renable this test only
// on recent GPUs - gfx94x+
// mt.FreeQueueRingBufferTest();
RunCustomTestEpilog(&mt);
);
}
TEST(rocrtstNeg, Queue_Validation_InvalidDimension) {
RUN_IF_NOT_EMU_MODE(
QueueValidation qv(true, false, false, false, false);
RunCustomTestProlog(&qv);
qv.QueueValidationForInvalidDimension();
RunCustomTestEpilog(&qv);
);
}
TEST(rocrtstNeg, Queue_Validation_InvalidGroupMemory) {
RUN_IF_NOT_EMU_MODE(
QueueValidation qv(false, true, false, false, false);
RunCustomTestProlog(&qv);
qv.QueueValidationInvalidGroupMemory();
RunCustomTestEpilog(&qv);
);
}
TEST(rocrtstNeg, Queue_Validation_InvalidKernelObject) {
RUN_IF_NOT_EMU_MODE(
QueueValidation qv(false, false, true, false, false);
RunCustomTestProlog(&qv);
qv.QueueValidationForInvalidKernelObject();
RunCustomTestEpilog(&qv);
);
}
TEST(rocrtstNeg, Queue_Validation_InvalidPacket) {
RUN_IF_NOT_EMU_MODE(
QueueValidation qv(false, false, false, true, false);
RunCustomTestProlog(&qv);
qv.QueueValidationForInvalidPacket();
RunCustomTestEpilog(&qv);
);
}
TEST(rocrtstNeg, DISABLED_Queue_Validation_InvalidWorkGroupSize) {
RUN_IF_NOT_EMU_MODE(
QueueValidation qv(false, false, false, false, true);
RunCustomTestProlog(&qv);
qv.QueueValidationForInvalidWorkGroupSize();
RunCustomTestEpilog(&qv);
);
}
TEST(rocrtstStress, Memory_Concurrent_Allocate_Test) {
RUN_IF_NOT_EMU_MODE(
MemoryConcurrentTest mt(true, false, false);
RunCustomTestProlog(&mt);
mt.MemoryConcurrentAllocate();
RunCustomTestEpilog(&mt);
);
}
TEST(rocrtstStress, Memory_Concurrent_Free_Test) {
RUN_IF_NOT_EMU_MODE(
MemoryConcurrentTest mt(false, true, false);
RunCustomTestProlog(&mt);
mt.MemoryConcurrentFree();
RunCustomTestEpilog(&mt);
);
}
TEST(rocrtstStress, Memory_Concurrent_Pool_Info_Test) {
RUN_IF_NOT_EMU_MODE(
MemoryConcurrentTest mt(false, false, true);
RunCustomTestProlog(&mt);
mt.MemoryConcurrentPoolGetInfo();
RunCustomTestEpilog(&mt);
);
}
TEST(rocrtstStress, Queue_Add_Write_Index_ConcurrentTest) {
RUN_IF_NOT_EMU_MODE(
QueueWriteIndexConcurrentTest Qw(true, false, false);
RunCustomTestProlog(&Qw);
Qw.QueueAddWriteIndexAtomic();
RunCustomTestEpilog(&Qw);
);
}
TEST(rocrtstStress, Queue_CAS_Write_Index_ConcurrentTest) {
RUN_IF_NOT_EMU_MODE(
QueueWriteIndexConcurrentTest Qw(false, true, false);
RunCustomTestProlog(&Qw);
Qw.QueueCasWriteIndexAtomic();
RunCustomTestEpilog(&Qw);
);
}
TEST(rocrtstStress, Queue_LoadStore_Write_Index_ConcurrentTest) {
RUN_IF_NOT_EMU_MODE(
QueueWriteIndexConcurrentTest Qw(false, false, true);
RunCustomTestProlog(&Qw);
Qw.QueueLoadStoreWriteIndexAtomic();
RunCustomTestEpilog(&Qw);
);
}
TEST(rocrtstPerf, Memory_Async_Copy) {
RUN_IF_NOT_EMU_MODE(
MemoryAsyncCopy mac;
// To do full test, uncomment this:
// mac.set_full_test(true);
// To test only 1 path, add lines like this:
// mac.set_src_pool(<src pool id>);
// mac.set_dst_pool(<dst pool id>);
// The default is to and from the cpu to 1 gpu, and to/from a gpu to
// another gpu
RunGenericTest(&mac);
);
}
TEST(rocrtstPerf, Memory_Async_Copy_On_Engine) {
RUN_IF_NOT_EMU_MODE(
MemoryAsyncCopyOnEngine mac;
RunGenericTest(&mac);
);
}
TEST(rocrtstPerf, ENQUEUE_LATENCY) {
EnqueueLatency singlePacketequeue(true);
EnqueueLatency multiPacketequeue(false);
RunGenericTest(&singlePacketequeue);
RunGenericTest(&multiPacketequeue);
}
TEST(rocrtstPerf, DISABLED_Memory_Async_Copy_NUMA) {
MemoryAsyncCopyNUMA numa;
RunGenericTest(&numa);
}
TEST(rocrtstPerf, AQL_Dispatch_Time_Single_SpinWait) {
DispatchTime dt(true, true);
RunGenericTest(&dt);
}
TEST(rocrtstPerf, AQL_Dispatch_Time_Single_Interrupt) {
DispatchTime dt(false, true);
RunGenericTest(&dt);
}
TEST(rocrtstPerf, AQL_Dispatch_Time_Multi_SpinWait) {
DispatchTime dt(true, false);
RunGenericTest(&dt);
}
TEST(rocrtstPerf, AQL_Dispatch_Time_Multi_Interrupt) {
DispatchTime dt(false, false);
RunGenericTest(&dt);
}
int main(int argc, char** argv) {
::testing::InitGoogleTest(&argc, argv);
if (rocrtst::isEmuModeEnabled()) {
std::cout << "--- Emulation build ---" << std::endl;
}
RocrTstGlobals settings;
// Set some default values
settings.verbosity = 1;
settings.monitor_verbosity = 0;
settings.num_iterations = 5;
if (ProcessCmdline(&settings, argc, argv)) {
return 1;
}
sRocrtstGlvalues = &settings;
if (settings.monitor_verbosity > 0) {
amdsmi_status_t amdsmi_ret = amdsmi_init(AMDSMI_INIT_AMD_GPUS);
if (amdsmi_ret != AMDSMI_STATUS_SUCCESS) {
std::cout << "Failed to initialize AMD smi" << std::endl;
return 1;
}
DumpMonitorInfo();
}
return RUN_ALL_TESTS();
}