SWDEV-433563 - [catch2][dtest] Functional testcases for hipGetFuncBySymbol API

Change-Id: Ic1bcfe35d124da990e6f1868475ba2ed1752b1d5
Tá an tiomantas seo le fáil i:
Rambabu Swargam
2024-03-21 16:40:27 +05:30
tiomanta ag Rakesh Roy
tuismitheoir 27d173286c
tiomantas 73ccc66ca2
D'athraigh 3 comhad le 363 breiseanna agus 12 scriosta
+4
Féach ar an gComhad
@@ -32,6 +32,7 @@ set(TEST_SRC
hipModuleLaunchCooperativeKernel.cc
hipModuleLaunchCooperativeKernelMultiDevice.cc
hipFuncGetAttribute.cc
hipGetFuncBySymbol.cc
)
add_custom_command(OUTPUT ${CMAKE_CURRENT_BINARY_DIR}/get_function_module.code
@@ -178,3 +179,6 @@ add_dependencies(build_tests copiousArgKernel.code copiousArgKernel0.code copiou
copiousArgKernel3.code copiousArgKernel16.code copiousArgKernel17.code)
endif()
endif()
add_executable(hipGetFuncBySymbol_exe EXCLUDE_FROM_ALL hipGetFuncBySymbol_exe.cc)
add_dependencies(build_tests hipGetFuncBySymbol_exe)
+247 -12
Féach ar an gComhad
@@ -16,12 +16,28 @@ LIABILITY, WHETHER INN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR INN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
THE SOFTWARE.
*/
/**
* @addtogroup hipGetFuncBySymbol hipGetFuncBySymbol
* @{
* @ingroup KernelTest
* `hipError_t hipGetFuncBySymbol (hipFunction_t* functionPtr,
* const void* symbolPtr
* )` -
* Gets pointer to device entry function that matches entry function symbolPtr.
*/
#include <hip_test_common.hh>
#include <hip_test_defgroups.hh>
#include <hip_test_checkers.hh>
#include <hip_test_process.hh>
#define LEN 64
#define SIZE LEN * sizeof(float)
#define ARR_SIZE (32*32)
#define SIZE_BYTES (ARR_SIZE*sizeof(int))
extern "C" __global__ void bit_extract_kernel(uint32_t* C_d, const uint32_t*
A_d, size_t N) {
size_t offset = (blockIdx.x * blockDim.x + threadIdx.x);
@@ -36,16 +52,35 @@ extern "C" __global__ void bit_extract_kernel(uint32_t* C_d, const uint32_t*
}
/**
* @addtogroup hipGetFuncBySymbol hipModuleLaunchKernel
* @{
* @ingroup KernelTest
* `hipError_t hipGetFuncBySymbol(hipFunction_t*, const void*)` -
* function with kernelname will be fetched when pointer to the kernel function is passed.
* `hipError_t hipModuleLaunchKernel(hipFunction_t, unsigned int,
* unsigned int, unsigned int, unsigned int, unsigned int,
* unsigned int, unsigned int, hipStream_t, void**, void**)` -
* launches Kernel with launch parameters and shared memory on stream with arguments passed.
*/
* Host Function to check for negative case.
*/
__host__ void hostFunction() {
printf("hostFunction\n");
}
/**
* Sample Kernel to be used for functional test cases
*/
__global__ void hipKernel(int *a) {
int offset = blockDim.x * blockIdx.x + threadIdx.x;
int stride = blockDim.x * gridDim.x;
for (int i = offset; i < ARR_SIZE; i+= stride) {
a[i] += a[i];
}
}
/**
* Local Function to validate the result
*/
bool verifyResult(int *a, int *output_ref, int arrSize) {
for (int i = 0; i < arrSize; i++) {
if (a[i] != output_ref[i]) {
return false;
}
}
return true;
}
/**
* Test Description
@@ -61,7 +96,7 @@ extern "C" __global__ void bit_extract_kernel(uint32_t* C_d, const uint32_t*
* - HIP_VERSION >= 6.2
*/
TEST_CASE("Unit_hipGetFuncBySymbol") {
TEST_CASE("Unit_hipGetFuncBySymbol_PositiveTest") {
uint32_t *A_d, *C_d;
uint32_t *A_h, *C_h;
size_t N = 1000000;
@@ -100,7 +135,8 @@ TEST_CASE("Unit_hipGetFuncBySymbol") {
HIP_LAUNCH_PARAM_BUFFER_SIZE, &size, HIP_LAUNCH_PARAM_END};
hipFunction_t Function;
HIPCHECK(hipGetFuncBySymbol(&Function, reinterpret_cast<void*>(bit_extract_kernel)));
HIPCHECK(hipGetFuncBySymbol(&Function,
reinterpret_cast<void*>(bit_extract_kernel)));
HIPCHECK(hipModuleLaunchKernel(Function, 1, 1, 1, LEN, 1, 1, 0, 0, NULL,
reinterpret_cast<void**>(&config)));
@@ -118,3 +154,202 @@ TEST_CASE("Unit_hipGetFuncBySymbol") {
free(A_h);
free(C_h);
}
/**
* Test Description
* ------------------------
* - Pass the NULL as a symbolPtr it should return
* hipErrorInvalidDeviceFunction
* - Pass a host function as a symbolPtr it should return
* hipErrorInvalidDeviceFunction
* Test source
* ------------------------
* - catch/unit/module/hipGetFuncBySymbol.cc
* Test requirements
* ------------------------
* - HIP_VERSION >= 6.2
*/
TEST_CASE("Unit_hipGetFuncBySymbol_NegativeTests") {
hipFunction_t funcPointer;
// Passing NULL as second parameter
REQUIRE(hipGetFuncBySymbol(&funcPointer, NULL) != hipSuccess);
// Passing hostFunction as second parameter
REQUIRE(hipGetFuncBySymbol(&funcPointer,
reinterpret_cast<const void*>(hostFunction)));
}
/**
* Test Description
* ------------------------
* - Create a child process and pass the __global__ function as a symbolPtr
* it should return hipSuccess, and kernel launch and execution with
* functionPtr should success.
* Test source
* ------------------------
* - catch/unit/module/hipGetFuncBySymbol.cc
* Test requirements
* ------------------------
* - HIP_VERSION >= 6.2
*/
TEST_CASE("Unit_hipGetFuncBySymbol_InChildProcess") {
hip::SpawnProc proc("hipGetFuncBySymbol_exe", true);
REQUIRE(proc.run() == 0);
}
/**
* Test Description
* ------------------------
* - For all the GPU devices in the system and pass the __global__ function
* as a symbolPtr it should return hipSuccess, and kernel launch and
* execution with functionPtr should success.
* Test source
* ------------------------
* - catch/unit/module/hipGetFuncBySymbol.cc
* Test requirements
* ------------------------
* - HIP_VERSION >= 6.2
*/
TEST_CASE("Unit_hipGetFuncBySymbol_MultiDev") {
int deviceCount = 0;
HIP_CHECK(hipGetDeviceCount(&deviceCount));
if (deviceCount < 2) {
HipTest::HIP_SKIP_TEST("Skipping because this machine has total GPUs < 2");
return;
}
hipFunction_t funcPointer;
for (int deviceId = 0; deviceId < deviceCount; deviceId++) {
HIP_CHECK(hipSetDevice(deviceId));
REQUIRE(hipGetFuncBySymbol(&funcPointer,
reinterpret_cast<const void*>(hipKernel))== hipSuccess);
int *h_a = reinterpret_cast<int *>(malloc(SIZE_BYTES));
REQUIRE(h_a != nullptr);
int *output_ref = reinterpret_cast<int *>(malloc(SIZE_BYTES));
REQUIRE(output_ref != nullptr);
for (int i = 0; i < ARR_SIZE; i++) {
h_a[i] = 2;
output_ref[i] = 4;
}
int *d_a = nullptr;
HIP_CHECK(hipMalloc(&d_a, SIZE_BYTES));
REQUIRE(d_a != nullptr);
HIP_CHECK(hipMemcpy(d_a, h_a, SIZE_BYTES, hipMemcpyHostToDevice));
dim3 blocksPerGrid(1, 1, 1);
dim3 threadsPerBlock(1, 1, 64);
void* kernelParam[] = {d_a};
auto size = sizeof(kernelParam);
void* kernel_parameter[] = {HIP_LAUNCH_PARAM_BUFFER_POINTER, &kernelParam,
HIP_LAUNCH_PARAM_BUFFER_SIZE, &size,
HIP_LAUNCH_PARAM_END};
REQUIRE(hipModuleLaunchKernel(funcPointer,
blocksPerGrid.x, blocksPerGrid.y, blocksPerGrid.z,
threadsPerBlock.x, threadsPerBlock.y, threadsPerBlock.z,
0, 0, nullptr, kernel_parameter) == hipSuccess);
HIP_CHECK(hipMemcpy(h_a, d_a, SIZE_BYTES, hipMemcpyDeviceToHost));
REQUIRE(verifyResult(h_a, output_ref, ARR_SIZE) == true);
free(h_a);
free(output_ref);
HIP_CHECK(hipFree(d_a));
}
}
/**
* Local function useful to create stream and memory copy and launch kernel
*/
void MultiThreadMultiDevFunc(int DevId) {
HIP_CHECK(hipSetDevice(DevId));
int *h_a = reinterpret_cast<int *>(malloc(SIZE_BYTES));
REQUIRE(h_a != nullptr);
int *output_ref = reinterpret_cast<int *>(malloc(SIZE_BYTES));
REQUIRE(output_ref != nullptr);
for (int i = 0; i < ARR_SIZE; i++) {
h_a[i] = 2;
output_ref[i] = 4;
}
hipStream_t stream;
HIP_CHECK(hipSetDevice(DevId));
HIP_CHECK(hipStreamCreate(&stream));
int *d_a = nullptr;
HIP_CHECK(hipMalloc(&d_a, SIZE_BYTES));
REQUIRE(d_a != nullptr);
HIP_CHECK(hipMemcpyAsync(d_a, h_a, SIZE_BYTES,
hipMemcpyHostToDevice, stream));
dim3 blocksPerGrid(1, 1, 1);
dim3 threadsPerBlock(1, 1, 64);
hipFunction_t funcPointer;
REQUIRE(hipGetFuncBySymbol(&funcPointer,
reinterpret_cast<const void*>(hipKernel))== hipSuccess);
void* kernelParam[] = {d_a};
auto size = sizeof(kernelParam);
void* kernel_parameter[] = {HIP_LAUNCH_PARAM_BUFFER_POINTER, &kernelParam,
HIP_LAUNCH_PARAM_BUFFER_SIZE, &size,
HIP_LAUNCH_PARAM_END};
REQUIRE(hipModuleLaunchKernel(funcPointer,
blocksPerGrid.x, blocksPerGrid.y, blocksPerGrid.z,
threadsPerBlock.x, threadsPerBlock.y, threadsPerBlock.z,
0, stream, nullptr, kernel_parameter) == hipSuccess);
HIP_CHECK(hipMemcpyAsync(h_a, d_a, SIZE_BYTES,
hipMemcpyDeviceToHost, stream));
REQUIRE(verifyResult(h_a, output_ref, ARR_SIZE) == true);
free(h_a);
free(output_ref);
HIP_CHECK(hipStreamDestroy(stream));
HIP_CHECK(hipFree(d_a));
}
/**
* Test Description
* ------------------------
* - Create number of threads equals to number of devices and in each devices
* pass the __global__ function as a symbolPtr it should return hipSuccess,
* and kernel launch and execution with functionPtr should success.
* Test source
* ------------------------
* - catch/unit/module/hipGetFuncBySymbol.cc
* Test requirements
* ------------------------
* - HIP_VERSION >= 6.2
*/
TEST_CASE("Unit_hipGetFuncBySymbol_MultiDevMultiThread") {
int deviceCount = 0;
HIP_CHECK(hipGetDeviceCount(&deviceCount));
if (deviceCount < 2) {
HipTest::HIP_SKIP_TEST("Skipping because this machine has total GPUs < 2");
return;
}
::std::vector< ::std::thread> threads;
for (int dev = 0; dev < deviceCount; dev++) {
threads.push_back(::std::thread(MultiThreadMultiDevFunc, dev));
}
for (int dev = 0; (dev < deviceCount) && (dev < threads.size()); dev++) {
threads[dev].join();
}
}
+112
Féach ar an gComhad
@@ -0,0 +1,112 @@
/*
Copyright (c) 2024 Advanced Micro Devices, Inc. All rights reserved.
Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the "Software"), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:
The above copyright notice and this permission notice shall be included in
all copies or substantial portions of the Software.
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANNTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER INN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR INN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
THE SOFTWARE.
*/
#include "hip/hip_runtime.h"
#define ARR_SIZE (32*32)
#define SIZE (ARR_SIZE*sizeof(int))
#define HIP_CHECK(error) \
{ \
hipError_t localError = error; \
if ((localError != hipSuccess) && \
(localError != hipErrorPeerAccessAlreadyEnabled)) { \
printf("error: '%s'(%d) from %s at %s:%d\n", \
hipGetErrorString(localError), \
localError, #error, __FUNCTION__, __LINE__);\
exit(0); \
} \
}
/**
* Sample Kernel to be used for functional test cases
*/
__global__ void hipKernel(int *a) {
int offset = blockDim.x * blockIdx.x + threadIdx.x;
int stride = blockDim.x * gridDim.x;
for (int i = offset; i < ARR_SIZE; i+= stride) {
a[i] += a[i];
}
}
/**
* This function gets the function pointer and launches the kernel and
* verifies the reult
*/
int main() {
hipFunction_t funcPointer;
if (hipGetFuncBySymbol(&funcPointer,
reinterpret_cast<const void*>(hipKernel)) != hipSuccess) {
return -1;
}
int *h_a = reinterpret_cast<int *>(malloc(SIZE));
if (h_a == nullptr) {
return -1;
}
int *output_ref = reinterpret_cast<int *>(malloc(SIZE));
if (output_ref == nullptr) {
return -1;
}
for (int i = 0; i < ARR_SIZE; i++) {
h_a[i] = 2;
output_ref[i] = 4;
}
int *d_a = nullptr;
HIP_CHECK(hipMalloc(&d_a, SIZE));
if (d_a == nullptr) {
return -1;
}
HIP_CHECK(hipMemcpy(d_a, h_a, SIZE, hipMemcpyHostToDevice));
dim3 blocksPerGrid(1, 1, 1);
dim3 threadsPerBlock(1, 1, 64);
void* kernelParam[] = {d_a};
auto size = sizeof(kernelParam);
void* kernel_parameter[] = {HIP_LAUNCH_PARAM_BUFFER_POINTER, &kernelParam,
HIP_LAUNCH_PARAM_BUFFER_SIZE, &size,
HIP_LAUNCH_PARAM_END};
if (hipModuleLaunchKernel(funcPointer,
blocksPerGrid.x, blocksPerGrid.y, blocksPerGrid.z,
threadsPerBlock.x, threadsPerBlock.y, threadsPerBlock.z,
0, 0, nullptr, kernel_parameter) != hipSuccess) {
return -1;
}
HIP_CHECK(hipMemcpy(h_a, d_a, SIZE, hipMemcpyDeviceToHost));
for (int i = 0; i < ARR_SIZE; i++) {
if (h_a[i] != output_ref[i]) {
return -1;
}
}
free(h_a);
free(output_ref);
HIP_CHECK(hipFree(d_a));
return 0;
}