Files
2025-08-20 19:58:06 +05:30

409 lines
12 KiB
C++

/*
Copyright (c) 2022 Advanced Micro Devices, Inc. All rights reserved.
Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the "Software"), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:
The above copyright notice and this permission notice shall be included in
all copies or substantial portions of the Software.
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
THE SOFTWARE.
*/
#ifdef _WIN32
#define NOMINMAX
#endif /* _WIN32 */
#include <hip/hip_runtime_api.h>
#include <hip_test_common.hh>
#ifdef __linux__
#include <sys/sysinfo.h>
#else
#include <windows.h>
#include <sysinfoapi.h>
#endif
static constexpr size_t ONE_MB = 1024 * 1024;
TEST_CASE("Unit_hipMalloc_Positive_Basic") {
constexpr size_t page_size = 4096;
void* ptr = nullptr;
const auto alloc_size =
GENERATE_COPY(10, page_size / 2, page_size, page_size * 3 / 2, page_size * 2);
HIP_CHECK(hipMalloc(&ptr, alloc_size));
CHECK(ptr != nullptr);
CHECK(reinterpret_cast<intptr_t>(ptr) % 256 == 0);
HIP_CHECK(hipFree(ptr));
}
TEST_CASE("Unit_hipMalloc_Positive_Zero_Size") {
void* ptr = reinterpret_cast<void*>(0x1);
HIP_CHECK(hipMalloc(&ptr, 0));
REQUIRE(ptr == nullptr);
}
TEST_CASE("Unit_hipMalloc_Positive_Alignment") {
void *ptr1 = nullptr, *ptr2 = nullptr;
HIP_CHECK(hipMalloc(&ptr1, 1));
HIP_CHECK(hipMalloc(&ptr2, 10));
CHECK(reinterpret_cast<intptr_t>(ptr1) % 256 == 0);
CHECK(reinterpret_cast<intptr_t>(ptr2) % 256 == 0);
HIP_CHECK(hipFree(ptr1));
HIP_CHECK(hipFree(ptr2));
}
TEST_CASE("Unit_hipMalloc_Negative_Parameters") {
SECTION("ptr == nullptr") { HIP_CHECK_ERROR(hipMalloc(nullptr, 4096), hipErrorInvalidValue); }
SECTION("size == max size_t") {
void* ptr;
HIP_CHECK_ERROR(hipMalloc(&ptr, std::numeric_limits<size_t>::max()), hipErrorOutOfMemory);
}
}
// Commenting this due to defect SWDEV-501675, used in below commented tests
#if 0
/**
/**
* Local Function to Get total RAM size in bytes
*/
static inline size_t getTotalRAM() {
#ifdef __linux__
struct sysinfo info {};
sysinfo(&info);
return info.totalram;
#else
MEMORYSTATUSEX statex;
statex.dwLength = sizeof(statex);
GlobalMemoryStatusEx(&statex);
return (statex.ullTotalPhys);
#endif
}
/**
* Local Function to Get Available RAM size in bytes
*/
static inline size_t getAvailableRAM() {
#ifdef __linux__
struct sysinfo info {};
sysinfo(&info);
return info.freeram;
#else
MEMORYSTATUSEX statex;
statex.dwLength = sizeof(statex);
GlobalMemoryStatusEx(&statex);
return (statex.ullAvailPhys);
#endif
}
#endif
/**
* In addKernel function, all elements of the array a increased by 1
*/
static __global__ void addKernel(char* a, size_t size) {
for (int i = 0; i < size; i++) {
a[i] += 1;
}
}
/**
* Local Function to perform some operations on device memory and validate it
*/
static void performOperations(char* devMem, size_t size) {
/**
* Validating 1MB or less than that, since the most of the scenarios uses
* this function allocates memory in GB's and execution time will be more
*/
const size_t sizeToCheck = (size < ONE_MB) ? size : ONE_MB;
constexpr char value = 'A';
HIP_CHECK(hipMemset(devMem, value, sizeToCheck));
addKernel<<<1, 1>>>(devMem, sizeToCheck);
char* arrToCheck = new char[sizeToCheck];
memset(arrToCheck, '0', sizeToCheck);
HIP_CHECK(hipMemcpy(arrToCheck, devMem, sizeToCheck, hipMemcpyDeviceToHost));
for (int i = 0; i < sizeToCheck; i++) {
INFO("At index : " << i << " Got value : " << arrToCheck[i] << " Expected value : B ");
REQUIRE(arrToCheck[i] == 'B');
}
delete[] arrToCheck;
}
/**
* Test Description
* ------------------------
* - This test case tests the following scenario:-
* - 1) Get the Available VRAM size
* - 2) Allocate 90% of that using hipMalloc
* - 3) Perform operations on device memory
* Test source
* ------------------------
* - unit/memory/hipMalloc.cc
*/
TEST_CASE("Unit_hipMalloc_Allocate90PercentOfDeviceMemory") {
char* devMem = nullptr;
size_t freeVRAM = 0, totalVRAM = 0;
HIP_CHECK(hipMemGetInfo(&freeVRAM, &totalVRAM));
INFO("Available device memory : " << freeVRAM);
/**
* Allocating 90% of available VRAM.
* Avoided allocating total available VRAM just for stability
* and to keep some buffer memory.
*/
size_t size = freeVRAM * 0.9;
INFO("Size going to allocate : " << size);
HIP_CHECK(hipMalloc(&devMem, size));
REQUIRE(devMem != nullptr);
performOperations(devMem, size);
HIP_CHECK(hipFree(devMem));
}
// Commenting this due to defect SWDEV-501675
#if 0
/**
* Test Description
* ------------------------
* - This test case tests the following scenario:-
* - 1) Get the Available VRAM size
* - 2) Allocate 110% of that using hipMalloc
* - 3) Check the behaviour in linux and windows
* - 4) In linux it should give hipErrorOutOfMemory
* - 5) In windows it should success by using the Shared GPU memory
* - 6) Perform operations on device memory
* Test source
* ------------------------
* - unit/memory/hipMalloc.cc
* Test requirements
* ------------------------
* - HIP_VERSION >= 6.4
*/
TEST_CASE("Unit_hipMalloc_Allocate110PercentOfDeviceMemory") {
char *devMem = nullptr;
size_t freeVRAM = 0, totalVRAM = 0;
HIP_CHECK(hipMemGetInfo(&freeVRAM, &totalVRAM));
INFO("Available Free device memory : " << freeVRAM);
// Allocating 110% of available VRAM
size_t size = freeVRAM * 1.1;
INFO("Size Planning to allocate : " << size);
// Determine amount of memory which is needed from RAM
size_t requiredMemFromRAM = size - freeVRAM;
INFO("Required Memory From RAM : " << requiredMemFromRAM);
#ifdef __linux__
INFO("LINUX");
HIP_CHECK_ERROR(hipMalloc(&devMem, size), hipErrorOutOfMemory);
#else
INFO("WINDOWS");
size_t totalRAM = getTotalRAM();
size_t availableRAM = getAvailableRAM();
INFO("Total RAM : " << totalRAM);
INFO("Available RAM : " << availableRAM);
/**
* Validating size of Required Memory From RAM,
* 1) Since we can use half of RAM as shared GPU memory,
* Required Memory From RAM should be less than that.
* 2) And Required Memory From RAM should be less than Available RAM.
* If Required Memory From RAM is crossing the threshold,
* allocating 90% available VRAM
*/
if ((requiredMemFromRAM < (totalRAM / 2)) &&
(requiredMemFromRAM < availableRAM)) {
INFO("Required Memory From RAM is Available");
} else {
INFO("Required Memory From RAM is Not available, "
"allocating 90% of available VRAM");
// Avoided using total available VRAM for stability, to keep buffer memory
size = freeVRAM * 0.9;
}
INFO("Size going to allocate : " << size);
HIP_CHECK(hipMalloc(&devMem, size));
REQUIRE(devMem != nullptr);
performOperations(devMem, size);
HIP_CHECK(hipFree(devMem));
#endif
}
#endif
// Commenting this due to defect SWDEV-501675
#if 0
/**
* Test Description
* ------------------------
* - This test case tests the following scenario:-
* - 1) Get the Available VRAM size, Total RAM size and Available RAM size
* - 2) In case if Available RAM size is greater than half of Total RAM,
* - allocate 90% of half of Total RAM
* - 3) In case if Available RAM size is less than half of Total RAM,
* - allocate 50% of half of Available RAM
* - 4) Check the behaviour in linux and windows,
* - In linux it should give hipErrorOutOfMemory and
* - in windows it should success by using the Shared GPU memory
* - 5) Perform operations on device memory
* Test source
* ------------------------
* - unit/memory/hipMalloc.cc
* Test requirements
* ------------------------
* - HIP_VERSION >= 6.4
*/
TEST_CASE("Unit_hipMalloc_AllocateAvailableVRAMAndPossibleRAM") {
char *devMem = nullptr;
size_t freeVRAM = 0, totalVRAM = 0;
HIP_CHECK(hipMemGetInfo(&freeVRAM, &totalVRAM));
INFO("Available Free device memory : " << freeVRAM);
size_t totalRAM = getTotalRAM();
size_t availableRAM = getAvailableRAM();
INFO("Total RAM : " << totalRAM);
INFO("Available RAM : " << availableRAM);
// Determine usable Shared GPU Memory by GPU From RAM which is half of RAM
size_t usableSharedGPUMemFromRam = totalRAM / 2;
if (availableRAM > usableSharedGPUMemFromRam) {
/*
* If Available RAM is greater than the usable Shared GPU Memory
* Allocating 90% of Usable Shared GPU Memory
* Not allocating 100% of Usable Shared GPU Memory just to keep
* buffer memory and for stability
*/
usableSharedGPUMemFromRam = usableSharedGPUMemFromRam * 0.9;
} else {
/*
* If Available RAM is less than the usable Shared GPU Memory
* Allocating 50% of RAM only just to keep buffer memory and for stability
*/
usableSharedGPUMemFromRam = availableRAM * 0.5;
}
INFO("Usable Shared GPU Memory from RAM : " << usableSharedGPUMemFromRam);
size_t size = freeVRAM + usableSharedGPUMemFromRam;
INFO("Size going to allocate : " << size);
#ifdef __linux__
INFO("LINUX");
HIP_CHECK_ERROR(hipMalloc(&devMem, size), hipErrorOutOfMemory);
#else
INFO("WINDOWS");
HIP_CHECK(hipMalloc(&devMem, size));
REQUIRE(devMem != nullptr);
performOperations(devMem, size);
HIP_CHECK(hipFree(devMem));
#endif
}
/**
* Test Description
* ------------------------
* - This test case tests the following scenario:-
* - 1) Get the Total RAM size
* - 2) Allocate 1MB more than that using hipMalloc
* - 3) Check the behaviour in linux and windows.
* - In linux, windows it should give hipErrorOutOfMemory
* Test source
* ------------------------
* - unit/memory/hipMalloc.cc
* Test requirements
* ------------------------
* - HIP_VERSION >= 6.4
*/
TEST_CASE("Unit_hipMalloc_AllocateMoreThanTotalRAM") {
char *devMem = nullptr;
size_t totalRAM = getTotalRAM();
INFO("Total RAM : " << totalRAM);
size_t size = totalRAM + ONE_MB;
INFO("Size going to allocate : " << size);
HIP_CHECK_ERROR(hipMalloc(&devMem, size), hipErrorOutOfMemory);
}
/**
* Test Description
* ------------------------
* - This test case tests the following scenario:-
* - 1) Get the Total VRAM size
* - 2) Allocate 1MB more than total VRAM size using hipMalloc
* - 3) Check the behaviour in linux and windows
* - 4) In linux it should give hipErrorOutOfMemory
* - 5) In windows it should success using shared GPU memory
* - 6) Perform operations on device memory
* Test source
* ------------------------
* - unit/memory/hipMalloc.cc
* Test requirements
* ------------------------
* - HIP_VERSION >= 6.4
*/
TEST_CASE("Unit_hipMalloc_AllocateMoreThanTotalVRAM") {
char *devMem = nullptr;
size_t freeVRAM = 0, totalVRAM = 0;
HIP_CHECK(hipMemGetInfo(&freeVRAM, &totalVRAM));
INFO("Available total device memory : " << totalVRAM);
size_t size = totalVRAM + ONE_MB;
INFO("Size Planning to allocate : " << size);
#ifdef __linux__
INFO("LINUX");
HIP_CHECK_ERROR(hipMalloc(&devMem, size), hipErrorOutOfMemory);
#else
INFO("WINDOWS");
size_t requiredMemFromRAM = size - freeVRAM;
INFO("Required Memory From RAM : " << requiredMemFromRAM);
size_t totalRAM = getTotalRAM();
size_t availableRAM = getAvailableRAM();
INFO("Total RAM : " << totalRAM);
INFO("Available RAM : " << availableRAM);
/**
* Validating size of Required Memory From RAM,
* 1) Since we can use half of RAM as shared GPU memory,
* Required Memory From RAM should be less than that.
* 2) And Required Memory From RAM should be less than Available RAM.
* If Required Memory From RAM is crossing the threshold,
* allocating 90% available VRAM
*/
if ((requiredMemFromRAM < (totalRAM / 2)) &&
(requiredMemFromRAM < availableRAM)) {
INFO("Required Memory From RAM is Available");
} else {
INFO("Required Memory From RAM is Not available, "
"allocating 90% of available VRAM");
// Avoided using total available VRAM for stability, to keep buffer memory
size = freeVRAM * 0.9;
}
INFO("Size going to allocate : " << size);
HIP_CHECK(hipMalloc(&devMem, size));
REQUIRE(devMem != nullptr);
performOperations(devMem, size);
HIP_CHECK(hipFree(devMem));
#endif
}
#endif