358 líneas
11 KiB
C++
358 líneas
11 KiB
C++
/*
|
|
Copyright (c) 2025 Advanced Micro Devices, Inc. All rights reserved.
|
|
Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
of this software and associated documentation files (the "Software"), to deal
|
|
in the Software without restriction, including without limitation the rights
|
|
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
copies of the Software, and to permit persons to whom the Software is
|
|
furnished to do so, subject to the following conditions:
|
|
|
|
The above copyright notice and this permission notice shall be included in
|
|
all copies or substantial portions of the Software.
|
|
|
|
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
|
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
|
|
THE SOFTWARE.
|
|
*/
|
|
|
|
#include <hip_test_common.hh>
|
|
#include <utils.hh>
|
|
#if __linux__
|
|
#include <numa.h>
|
|
#include <numaif.h>
|
|
#endif
|
|
|
|
/**
|
|
* Kernel to fill value for each element in the given array
|
|
*/
|
|
static __global__ void fillDataKernel(int *arr, int value) {
|
|
arr[threadIdx.x] = value;
|
|
}
|
|
|
|
/**
|
|
* Kernel to copy data from source array to destination array
|
|
*/
|
|
static __global__ void copyDataKernel(int *dstArr, int *srcArr) {
|
|
dstArr[threadIdx.x] = srcArr[threadIdx.x];
|
|
}
|
|
|
|
/**
|
|
* Helper function to get the list of devices which supports
|
|
* Managed memory
|
|
*/
|
|
static std::vector<int> getSupportedDevices() {
|
|
const auto deviceCount = HipTest::getDeviceCount();
|
|
std::vector<int> supportedDevices;
|
|
supportedDevices.reserve(deviceCount + 1);
|
|
for (int i = 0; i < deviceCount; ++i) {
|
|
if (DeviceAttributesSupport(i, hipDeviceAttributeManagedMemory,
|
|
hipDeviceAttributeConcurrentManagedAccess)) {
|
|
supportedDevices.push_back(i);
|
|
}
|
|
}
|
|
return supportedDevices;
|
|
}
|
|
|
|
/**
|
|
* Test Description
|
|
* ------------------------
|
|
* - This test case checks the following scenarios
|
|
* - 1) With Location type Device
|
|
* - 2) With Location type Host
|
|
* Test source
|
|
* ------------------------
|
|
* - unit/memory/hipMemPrefetchAsync_v2.cc
|
|
* Test requirements
|
|
* ------------------------
|
|
* - HIP_VERSION >= 7.1
|
|
*/
|
|
TEST_CASE("Unit_hipMemPrefetchAsync_v2_Device_Host", "[multigpu]") {
|
|
auto supportedDevices = getSupportedDevices();
|
|
if (supportedDevices.empty()) {
|
|
HipTest::HIP_SKIP_TEST(
|
|
"Test need at least one device with managed memory support");
|
|
}
|
|
|
|
HIP_CHECK(hipSetDevice(supportedDevices[0]));
|
|
|
|
constexpr int N = 1024;
|
|
constexpr int Nbytes = N * sizeof(int);
|
|
constexpr int value = 10;
|
|
int *memPtr = nullptr;
|
|
|
|
hipStream_t stream;
|
|
HIP_CHECK(hipStreamCreate(&stream));
|
|
|
|
HIP_CHECK(hipMallocManaged(reinterpret_cast<void **>(&memPtr), Nbytes,
|
|
hipMemAttachGlobal));
|
|
REQUIRE(memPtr != nullptr);
|
|
|
|
SECTION("With Device") {
|
|
int currentValue = value;
|
|
std::fill_n(memPtr, N, value);
|
|
|
|
for (int deviceId : supportedDevices) {
|
|
HIP_CHECK(hipSetDevice(deviceId));
|
|
|
|
hipMemLocation location;
|
|
location.type = hipMemLocationTypeDevice;
|
|
location.id = deviceId;
|
|
|
|
HIP_CHECK(hipMemPrefetchAsync_v2(memPtr, Nbytes, location, 0, stream));
|
|
HIP_CHECK(hipStreamSynchronize(stream));
|
|
|
|
int *devArr = nullptr;
|
|
HIP_CHECK(hipMalloc(&devArr, Nbytes));
|
|
REQUIRE(devArr != nullptr);
|
|
|
|
copyDataKernel<<<1, N>>>(devArr, memPtr);
|
|
|
|
int hostArr[N];
|
|
HIP_CHECK(hipMemcpy(hostArr, devArr, Nbytes, hipMemcpyDeviceToHost));
|
|
HIP_CHECK(hipDeviceSynchronize());
|
|
|
|
for (int i = 0; i < N; i++) {
|
|
INFO("For Device " << deviceId << " At index " << i
|
|
<< " Expected value = " << currentValue
|
|
<< " Got value = " << hostArr[i]);
|
|
REQUIRE(hostArr[i] == currentValue);
|
|
}
|
|
|
|
currentValue = currentValue + 1;
|
|
fillDataKernel<<<1, N>>>(memPtr, currentValue);
|
|
HIP_CHECK(hipDeviceSynchronize());
|
|
|
|
for (int i = 0; i < N; i++) {
|
|
INFO("At index " << i << " Expected value = " << currentValue
|
|
<< " Got value = " << memPtr[i]);
|
|
REQUIRE(memPtr[i] == currentValue);
|
|
}
|
|
|
|
HIP_CHECK(hipFree(devArr));
|
|
}
|
|
}
|
|
|
|
SECTION("With Host") {
|
|
fillDataKernel<<<1, N>>>(memPtr, value);
|
|
HIP_CHECK(hipDeviceSynchronize());
|
|
|
|
hipMemLocation location;
|
|
location.type = hipMemLocationTypeHost;
|
|
|
|
HIP_CHECK(hipMemPrefetchAsync_v2(memPtr, Nbytes, location, 0, stream));
|
|
HIP_CHECK(hipStreamSynchronize(stream));
|
|
|
|
for (int i = 0; i < N; i++) {
|
|
INFO("At index " << i << " Expected value = " << value
|
|
<< " Got value = " << memPtr[i]);
|
|
REQUIRE(memPtr[i] == value);
|
|
}
|
|
|
|
constexpr int newValue = 20;
|
|
std::fill_n(memPtr, N, newValue);
|
|
|
|
for (int i = 0; i < N; i++) {
|
|
INFO("At index " << i << " Expected value = " << newValue
|
|
<< " Got value = " << memPtr[i]);
|
|
REQUIRE(memPtr[i] == newValue);
|
|
}
|
|
}
|
|
|
|
HIP_CHECK(hipStreamDestroy(stream));
|
|
HIP_CHECK(hipFree(memPtr));
|
|
// Reset to default device
|
|
HIP_CHECK(hipSetDevice(0));
|
|
}
|
|
|
|
/**
|
|
* Test Description
|
|
* ------------------------
|
|
* - This test case checks the following scenarios
|
|
* - 1) With Location type Host Numa
|
|
* - 2) With Location type Host Numa Current
|
|
* Test source
|
|
* ------------------------
|
|
* - unit/memory/hipMemPrefetchAsync_v2.cc
|
|
* Test requirements
|
|
* ------------------------
|
|
* - HIP_VERSION >= 7.1
|
|
*/
|
|
#if __linux__
|
|
TEST_CASE("Unit_hipMemPrefetchAsync_v2_HostNuma_HostNumaCurrent") {
|
|
auto supportedDevices = getSupportedDevices();
|
|
if (supportedDevices.empty() || numa_available() < 0) {
|
|
HipTest::HIP_SKIP_TEST("Skipping as System does not have managed memory "
|
|
"supported devices or No Numa nodes in system");
|
|
}
|
|
|
|
HIP_CHECK(hipSetDevice(supportedDevices[0]));
|
|
|
|
int maxNode = numa_max_node();
|
|
REQUIRE(maxNode >= 0);
|
|
|
|
constexpr int N = 1024;
|
|
constexpr int Nbytes = N * sizeof(int);
|
|
constexpr int value = 10;
|
|
int *memPtr = nullptr;
|
|
|
|
hipStream_t stream;
|
|
HIP_CHECK(hipStreamCreate(&stream));
|
|
|
|
HIP_CHECK(hipMallocManaged(reinterpret_cast<void **>(&memPtr), Nbytes,
|
|
hipMemAttachGlobal));
|
|
REQUIRE(memPtr != nullptr);
|
|
fillDataKernel<<<1, N>>>(memPtr, value);
|
|
HIP_CHECK(hipDeviceSynchronize());
|
|
|
|
SECTION("With Host NUMA") {
|
|
hipMemLocation location;
|
|
int currentValue = value;
|
|
for (int node = 0; node <= maxNode; ++node) {
|
|
location.type = hipMemLocationTypeHostNuma;
|
|
location.id = node;
|
|
|
|
HIP_CHECK(hipMemPrefetchAsync_v2(memPtr, Nbytes, location, 0, stream));
|
|
HIP_CHECK(hipStreamSynchronize(stream));
|
|
|
|
for (int i = 0; i < N; i++) {
|
|
INFO("For Node " << node << " At index " << i << " Expected value = "
|
|
<< currentValue << " Got value = " << memPtr[i]);
|
|
REQUIRE(memPtr[i] == currentValue);
|
|
}
|
|
|
|
currentValue = currentValue + 1;
|
|
std::fill_n(memPtr, N, currentValue);
|
|
|
|
for (int i = 0; i < N; i++) {
|
|
INFO("For Node " << node << " At index " << i << " Expected value = "
|
|
<< currentValue << " Got value = " << memPtr[i]);
|
|
REQUIRE(memPtr[i] == currentValue);
|
|
}
|
|
|
|
#if 0 // To work this part, fix provided in SWDEV-548802 is required
|
|
// verify placement
|
|
void* page = memPtr;
|
|
int status = -1;
|
|
int ret = move_pages(0, 1, &page, nullptr, &status, 0);
|
|
REQUIRE(ret == 0);
|
|
REQUIRE(status == node);
|
|
#endif
|
|
}
|
|
}
|
|
|
|
SECTION("With Host Numa Current") {
|
|
hipMemLocation location;
|
|
location.type = hipMemLocationTypeHostNumaCurrent;
|
|
|
|
HIP_CHECK(hipMemPrefetchAsync_v2(memPtr, Nbytes, location, 0, stream));
|
|
HIP_CHECK(hipStreamSynchronize(stream));
|
|
|
|
for (int i = 0; i < N; i++) {
|
|
INFO("At index " << i << " Expected value = " << value
|
|
<< " Got value = " << memPtr[i]);
|
|
REQUIRE(memPtr[i] == value);
|
|
}
|
|
|
|
constexpr int newValue = 20;
|
|
std::fill_n(memPtr, N, newValue);
|
|
|
|
for (int i = 0; i < N; i++) {
|
|
INFO("At index " << i << " Expected value = " << newValue
|
|
<< " Got value = " << memPtr[i]);
|
|
REQUIRE(memPtr[i] == newValue);
|
|
}
|
|
|
|
// determine current CPU’s NUMA node
|
|
int cpu = sched_getcpu();
|
|
int cur_node = numa_node_of_cpu(cpu);
|
|
REQUIRE(cur_node >= 0);
|
|
|
|
// verify that the page is on the current node
|
|
void *page = memPtr;
|
|
int status = -1;
|
|
int ret = move_pages(0, 1, &page, nullptr, &status, 0);
|
|
REQUIRE(ret == 0);
|
|
REQUIRE(status == cur_node);
|
|
}
|
|
|
|
HIP_CHECK(hipStreamDestroy(stream));
|
|
HIP_CHECK(hipFree(memPtr));
|
|
// Reset to default device
|
|
HIP_CHECK(hipSetDevice(0));
|
|
}
|
|
#endif
|
|
|
|
/**
|
|
* Test Description
|
|
* ------------------------
|
|
* - This test case checks the following Negative scenarios
|
|
* - 1) With dev_ptr as nullptr
|
|
* - 2) With count 0
|
|
* - 3) With count larger than actual size
|
|
* - 4) With invalid device
|
|
* Test source
|
|
* ------------------------
|
|
* - unit/memory/hipMemPrefetchAsync_v2.cc
|
|
* Test requirements
|
|
* ------------------------
|
|
* - HIP_VERSION >= 7.1
|
|
*/
|
|
TEST_CASE("Unit_hipMemPrefetchAsync_v2_Negative") {
|
|
auto supportedDevices = getSupportedDevices();
|
|
if (supportedDevices.empty()) {
|
|
HipTest::HIP_SKIP_TEST(
|
|
"Test need at least one device with managed memory support");
|
|
}
|
|
|
|
HIP_CHECK(hipSetDevice(supportedDevices[0]));
|
|
|
|
constexpr int N = 16;
|
|
constexpr int Nbytes = N * sizeof(int);
|
|
|
|
hipStream_t stream;
|
|
HIP_CHECK(hipStreamCreate(&stream));
|
|
|
|
void *memPtr = nullptr;
|
|
HIP_CHECK(hipMallocManaged(&memPtr, Nbytes, hipMemAttachGlobal));
|
|
|
|
hipMemLocation location;
|
|
location.type = hipMemLocationTypeDevice;
|
|
|
|
SECTION("With dev_ptr as nullptr") {
|
|
HIP_CHECK_ERROR(
|
|
hipMemPrefetchAsync_v2(nullptr, Nbytes, location, 0, stream),
|
|
hipErrorInvalidValue);
|
|
}
|
|
|
|
SECTION("With count 0") {
|
|
HIP_CHECK_ERROR(hipMemPrefetchAsync_v2(memPtr, 0, location, 0, stream),
|
|
hipErrorInvalidValue);
|
|
}
|
|
|
|
SECTION("With count larger than actual size") {
|
|
HIP_CHECK_ERROR(
|
|
hipMemPrefetchAsync_v2(memPtr, Nbytes + 10, location, 0, stream),
|
|
hipErrorInvalidValue);
|
|
}
|
|
|
|
SECTION("With invalid device") {
|
|
hipMemLocation dstLocation;
|
|
dstLocation.type = hipMemLocationTypeDevice;
|
|
int deviceCount = 0;
|
|
HIP_CHECK(hipGetDeviceCount(&deviceCount));
|
|
dstLocation.id = deviceCount;
|
|
HIP_CHECK_ERROR(
|
|
hipMemPrefetchAsync_v2(memPtr, Nbytes, dstLocation, 0, stream),
|
|
hipErrorInvalidDevice);
|
|
}
|
|
|
|
HIP_CHECK(hipStreamDestroy(stream));
|
|
HIP_CHECK(hipFree(memPtr));
|
|
// Reset to default device
|
|
HIP_CHECK(hipSetDevice(0));
|
|
}
|