2023-08-14 21:17:55 +05:30
|
|
|
|
/*
|
|
|
|
|
|
Copyright (c) 2023 Advanced Micro Devices, Inc. All rights reserved.
|
|
|
|
|
|
Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
|
|
|
|
of this software and associated documentation files (the "Software"), to deal
|
|
|
|
|
|
in the Software without restriction, including without limitation the rights
|
|
|
|
|
|
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
|
|
|
|
copies of the Software, and to permit persons to whom the Software is
|
|
|
|
|
|
furnished to do so, subject to the following conditions:
|
|
|
|
|
|
The above copyright notice and this permission notice shall be included in
|
|
|
|
|
|
all copies or substantial portions of the Software.
|
|
|
|
|
|
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
|
|
|
|
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
|
|
|
|
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
|
|
|
|
|
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
|
|
|
|
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
|
|
|
|
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
|
|
|
|
|
|
THE SOFTWARE.
|
|
|
|
|
|
*/
|
|
|
|
|
|
|
|
|
|
|
|
/**
|
2025-08-15 16:09:19 -04:00
|
|
|
|
* @addtogroup hipMemcpy hipMemcpy
|
|
|
|
|
|
* @{
|
|
|
|
|
|
* @ingroup perfMemoryTest
|
|
|
|
|
|
* `hipMemcpy(void* dst, const void* src, size_t count, hipMemcpyKind kind)` -
|
|
|
|
|
|
* Copies data between host and device.
|
|
|
|
|
|
*/
|
|
|
|
|
|
// #define ENABLE_DEBUG 1
|
2023-08-14 21:17:55 +05:30
|
|
|
|
#include <time.h>
|
|
|
|
|
|
#include <hip_test_common.hh>
|
|
|
|
|
|
|
|
|
|
|
|
#define NUM_SIZE 19 // size up to 16M
|
|
|
|
|
|
#define NUM_ITER 500 // Total GPU memory up to 16M*500=8G
|
|
|
|
|
|
|
|
|
|
|
|
/**
 * Fills a host buffer of ints with a single value.
 *
 * @param A    Buffer to fill; must hold at least size / sizeof(int) ints.
 * @param val  Value stored in every element.
 * @param size Buffer size in bytes. Trailing bytes that do not make up a
 *             whole int are left untouched.
 */
void valSet(int* A, int val, size_t size) {
  const size_t len = size / sizeof(int);
  // The index has the same type as the bound: no signed/unsigned comparison
  // and no int overflow for buffers holding more than INT_MAX elements.
  for (size_t i = 0; i < len; i++) {
    A[i] = val;
  }
}
|
|
|
|
|
|
|
2025-08-15 16:09:19 -04:00
|
|
|
|
void setup(size_t* size, int* num, int** pA, const size_t totalGlobalMem) {
|
2023-08-14 21:17:55 +05:30
|
|
|
|
for (int i = 0; i < *num; i++) {
|
|
|
|
|
|
size[i] = 1 << (i + 6);
|
|
|
|
|
|
if ((NUM_ITER + 1) * size[i] > totalGlobalMem) {
|
|
|
|
|
|
*num = i;
|
|
|
|
|
|
break;
|
|
|
|
|
|
}
|
|
|
|
|
|
}
|
|
|
|
|
|
*pA = reinterpret_cast<int*>(malloc(size[*num - 1]));
|
|
|
|
|
|
valSet(*pA, 1, size[*num - 1]);
|
|
|
|
|
|
}
|
|
|
|
|
|
|
2025-08-15 16:09:19 -04:00
|
|
|
|
void testInit(size_t size, int* A) {
|
|
|
|
|
|
int* Ad;
|
2023-08-14 21:17:55 +05:30
|
|
|
|
|
|
|
|
|
|
clock_t start = clock();
|
2025-08-15 16:09:19 -04:00
|
|
|
|
HIP_CHECK(hipMalloc(&Ad, size)); // hip::init() will be called
|
2023-08-14 21:17:55 +05:30
|
|
|
|
clock_t end = clock();
|
|
|
|
|
|
double uS = (end - start) * 1000000. / CLOCKS_PER_SEC;
|
2025-08-15 16:09:19 -04:00
|
|
|
|
CONSOLE_PRINT("Initial: hipMalloc(%zu) cost %.2fus\n", size, uS);
|
2023-08-14 21:17:55 +05:30
|
|
|
|
|
|
|
|
|
|
start = clock();
|
|
|
|
|
|
HIP_CHECK(hipMemcpy(Ad, A, size, hipMemcpyHostToDevice));
|
|
|
|
|
|
HIP_CHECK(hipDeviceSynchronize());
|
|
|
|
|
|
end = clock();
|
|
|
|
|
|
uS = (end - start) * 1000000. / CLOCKS_PER_SEC;
|
2025-08-15 16:09:19 -04:00
|
|
|
|
CONSOLE_PRINT("hipMemcpy(%zu) cost %.2fus\n", size, uS);
|
2023-08-14 21:17:55 +05:30
|
|
|
|
|
|
|
|
|
|
start = clock();
|
|
|
|
|
|
HIP_CHECK(hipFree(Ad));
|
|
|
|
|
|
end = clock();
|
|
|
|
|
|
uS = (end - start) * 1000000. / CLOCKS_PER_SEC;
|
2025-08-15 16:09:19 -04:00
|
|
|
|
CONSOLE_PRINT("hipFree(%zu) cost %.2fus\n", size, uS);
|
2023-08-14 21:17:55 +05:30
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
static bool hipPerfMemMallocCpyFree_test() {
|
|
|
|
|
|
double uS;
|
|
|
|
|
|
clock_t start, end;
|
2025-08-15 16:09:19 -04:00
|
|
|
|
size_t size[NUM_SIZE] = {0};
|
|
|
|
|
|
int* Ad[NUM_ITER] = {nullptr};
|
|
|
|
|
|
int* A;
|
2023-08-14 21:17:55 +05:30
|
|
|
|
hipDeviceProp_t props;
|
|
|
|
|
|
memset(&props, 0, sizeof(props));
|
|
|
|
|
|
HIP_CHECK(hipGetDeviceProperties(&props, 0));
|
2025-08-15 16:09:19 -04:00
|
|
|
|
CONSOLE_PRINT("totalGlobalMem: %zu\n", props.totalGlobalMem);
|
2023-08-14 21:17:55 +05:30
|
|
|
|
|
|
|
|
|
|
int num = NUM_SIZE;
|
|
|
|
|
|
setup(size, &num, &A, props.totalGlobalMem);
|
|
|
|
|
|
testInit(size[0], A);
|
|
|
|
|
|
|
|
|
|
|
|
for (int i = 0; i < num; i++) {
|
|
|
|
|
|
start = clock();
|
|
|
|
|
|
for (int j = 0; j < NUM_ITER; j++) {
|
2025-08-15 16:09:19 -04:00
|
|
|
|
HIP_CHECK(hipMalloc(&Ad[j], size[i]));
|
2023-08-14 21:17:55 +05:30
|
|
|
|
}
|
|
|
|
|
|
end = clock();
|
|
|
|
|
|
uS = (end - start) * 1000000. / (NUM_ITER * CLOCKS_PER_SEC);
|
2025-08-15 16:09:19 -04:00
|
|
|
|
CONSOLE_PRINT("hipMalloc(%zu) cost %.2fus\n", size[i], uS);
|
2023-08-14 21:17:55 +05:30
|
|
|
|
|
|
|
|
|
|
start = clock();
|
|
|
|
|
|
for (int j = 0; j < NUM_ITER; j++) {
|
2025-08-15 16:09:19 -04:00
|
|
|
|
HIP_CHECK(hipMemcpy(Ad[j], A, size[i], hipMemcpyHostToDevice));
|
2023-08-14 21:17:55 +05:30
|
|
|
|
}
|
|
|
|
|
|
HIP_CHECK(hipDeviceSynchronize());
|
|
|
|
|
|
end = clock();
|
|
|
|
|
|
uS = (end - start) * 1000000. / (NUM_ITER * CLOCKS_PER_SEC);
|
2025-08-15 16:09:19 -04:00
|
|
|
|
CONSOLE_PRINT("hipMemcpy(%zu) cost %.2fus\n", size[i], uS);
|
2023-08-14 21:17:55 +05:30
|
|
|
|
|
|
|
|
|
|
start = clock();
|
|
|
|
|
|
for (int j = 0; j < NUM_ITER; j++) {
|
2025-08-15 16:09:19 -04:00
|
|
|
|
HIP_CHECK(hipFree(Ad[j]));
|
|
|
|
|
|
Ad[j] = nullptr;
|
2023-08-14 21:17:55 +05:30
|
|
|
|
}
|
|
|
|
|
|
end = clock();
|
|
|
|
|
|
double uS = (end - start) * 1000000. / (NUM_ITER * CLOCKS_PER_SEC);
|
2025-08-15 16:09:19 -04:00
|
|
|
|
CONSOLE_PRINT("hipFree(%zu) cost %.2fus\n", size[i], uS);
|
2023-08-14 21:17:55 +05:30
|
|
|
|
}
|
|
|
|
|
|
free(A);
|
|
|
|
|
|
return true;
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
/**
|
2025-08-15 16:09:19 -04:00
|
|
|
|
* Test Description
|
|
|
|
|
|
* ------------------------
|
|
|
|
|
|
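* - Measures the average per-call cost of hipMalloc, hipMemcpy (host to device) and hipFree for power-of-two buffer sizes from 64 bytes up to 16M bytes, and prints the results.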
|
|
|
|
|
|
* Test source
|
|
|
|
|
|
* ------------------------
|
|
|
|
|
|
* - perftests/memory/hipPerfMemMallocCpyFree.cc
|
|
|
|
|
|
* Test requirements
|
|
|
|
|
|
* ------------------------
|
|
|
|
|
|
* - HIP_VERSION >= 5.6
|
|
|
|
|
|
*/
|
2023-08-14 21:17:55 +05:30
|
|
|
|
|
|
|
|
|
|
TEST_CASE("Perf_hipPerfMemMallocCpyFree_test") {
  int numDevices = 0;
  HIP_CHECK(hipGetDeviceCount(&numDevices));

  if (numDevices <= 0) {
    // Without a device there is nothing to measure; report success with a
    // message that names this test.
    SUCCEED(
        "Skipped testcase hipPerfMemMallocCpyFree as "
        "there is no device to test.");
  } else {
    REQUIRE(true == hipPerfMemMallocCpyFree_test());
  }
}
|
2024-03-22 11:17:00 +01:00
|
|
|
|
|
|
|
|
|
|
/**
|
2025-08-15 16:09:19 -04:00
|
|
|
|
* End doxygen group perfMemoryTest.
|
|
|
|
|
|
* @}
|
|
|
|
|
|
*/
|