/* Copyright (c) 2022 Advanced Micro Devices, Inc. All rights reserved. Permission is hereby granted, free of charge, to any person obtaining a copy of this software and associated documentation files (the "Software"), to deal in the Software without restriction, including without limitation the rights to use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of the Software, and to permit persons to whom the Software is furnished to do so, subject to the following conditions: The above copyright notice and this permission notice shall be included in all copies or substantial portions of the Software. THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. */ /* Added Negative and Functional tests for hipPointerGetAttribute API Functional Scenarios: 1. Allocate memory using different Allocation APIs and check whether correct memory type and device oridinal are returned. 2. Allocate device variable and get the pointer info by calling hipPointerGetAttribute API with HIP_POINTER_ATTRIBUTE_DEVICE_POINTER/HIP_POINTER_ATTRIBUTE_START_ADDRESS and Launch kernel with device variable and verify whether the pointer variable of hipPointerGetAttribute is getting updated or not 3. Allocate device memory in GPU-0 and get the pointer info in peer GPU 4. Allocate device memory and get the buffer ID by calling hipPointerGetAttribute API with HIP_POINTER_ATTRIBUTE_BUFFER_ID, DeAllocate and Allocate the memory again and ensure that the buffer ID is unique 5. Allocate host memory and get the device ordinal by calling hipPointerGetAttribute API with HIP_POINTER_ATTRIBUTE_DEVICE_ORDINAL and ensure that it matches with CUDA result(which returns 100) 6. Allocate managed memory with different flags and trigger hipPointerGetAttribute with the following flags HIP_POINTER_ATTRIBUTE_MAPPED and verify the behaviour */ #define checkVMMSupported(device) { \ int value = 0; \ hipDeviceAttribute_t attr = hipDeviceAttributeVirtualMemoryManagementSupported; \ HIP_CHECK(hipDeviceGetAttribute(&value, attr, device)); \ if (value == 0) { \ printf("Machine does not support VMM. Skipping this test.."); \ return; \ } \ } #include #include static constexpr auto NUM_W{16}; static constexpr auto NUM_H{16}; static constexpr size_t N{10}; #define INT_VAL 10 #define VAL_DATA 99 static __global__ void var_update(int* data) { for (unsigned int i = 0; i < N; i++) { data[i] = VAL_DATA; } } /* Allocate memory using different Allocation APIs and check whether correct memory type and device oridinal are returned */ TEST_CASE("Unit_hipPointerGetAttribute_MemoryTypes") { CHECK_IMAGE_SUPPORT HIP_CHECK(hipSetDevice(0)); size_t pitch_A; size_t width{NUM_W * sizeof(char)}; unsigned int datatype; SECTION("Malloc Pitch Allocation") { char* A_d; HIP_CHECK(hipMallocPitch(reinterpret_cast(&A_d), &pitch_A, width, NUM_H)); HIP_CHECK(hipPointerGetAttribute(&datatype, HIP_POINTER_ATTRIBUTE_MEMORY_TYPE, reinterpret_cast(A_d))); REQUIRE(datatype == hipMemoryTypeDevice); } #if HT_AMD SECTION("Malloc Array Allocation") { hipArray_t B_d; hipChannelFormatDesc desc = hipCreateChannelDesc(); HIP_CHECK(hipMallocArray(&B_d, &desc, NUM_W, NUM_H, hipArrayDefault)); HIP_CHECK(hipPointerGetAttribute(&datatype, HIP_POINTER_ATTRIBUTE_MEMORY_TYPE, reinterpret_cast(B_d))); REQUIRE(datatype == hipMemoryTypeArray); HIP_CHECK(hipFreeArray(B_d)); } SECTION("Malloc 3D Array Allocation") { int width = 10, height = 10, depth = 10; hipArray_t arr; hipChannelFormatDesc channelDesc = hipCreateChannelDesc(sizeof(float) * 8, 0, 0, 0, hipChannelFormatKindFloat); HIP_CHECK(hipMalloc3DArray(&arr, &channelDesc, make_hipExtent(width, height, depth), hipArrayDefault)); HIP_CHECK(hipPointerGetAttribute(&datatype, HIP_POINTER_ATTRIBUTE_MEMORY_TYPE, reinterpret_cast(arr))); REQUIRE(datatype == hipMemoryTypeArray); HIP_CHECK(hipFreeArray(arr)); } #endif } /* * This testcase verifies the following scenario * Initializes A_d with A_h and get pointer info using hipPointerGetAttribute * The result of the API is passed to kernel for validation * and modifies it in kernel. * Validates the device variable to check whether the * data is updated or not. */ TEST_CASE("Unit_hipPointerGetAttribute_KernelUpdation") { HIP_CHECK(hipSetDevice(0)); size_t Nbytes = 0; Nbytes = N * sizeof(int); int *A_d, *A_h; HIP_CHECK(hipMalloc(&A_d, Nbytes)); hipDeviceptr_t data = 0; A_h = reinterpret_cast(malloc(Nbytes)); for (unsigned int i = 0; i < N; i++) { A_h[i] = INT_VAL; } HIP_CHECK(hipMemcpy(A_d, A_h, Nbytes, hipMemcpyHostToDevice)); HIP_CHECK(hipPointerGetAttribute(&data, HIP_POINTER_ATTRIBUTE_DEVICE_POINTER, reinterpret_cast(A_d))); hipLaunchKernelGGL(var_update, dim3(1), dim3(1), 0, 0, reinterpret_cast(data)); HIP_CHECK(hipGetLastError()); HIP_CHECK(hipDeviceSynchronize()); HIP_CHECK(hipMemcpy(A_h, A_d, Nbytes, hipMemcpyDeviceToHost)); for (unsigned int i = 0; i < N; i++) { REQUIRE(A_h[i] == VAL_DATA); } HIP_CHECK(hipFree(A_d)); free(A_h); } /* * This testcase verifies the pointer info of device variable * from peer GPU device.It validates the memory type and * device ordinal in peer GPU */ TEST_CASE("Unit_hipPointerGetAttribute_PeerGPU", "[multigpu]") { HIP_CHECK(hipSetDevice(0)); size_t Nbytes = 0; Nbytes = N * sizeof(int); int* A_d; HIP_CHECK(hipMalloc(&A_d, Nbytes)); unsigned int data = 0; int numDevices = 0; int canAccessPeer = 0; HIP_CHECK(hipGetDeviceCount(&numDevices)); if (numDevices > 1) { HIP_CHECK(hipDeviceCanAccessPeer(&canAccessPeer, 0, 1)); if (canAccessPeer) { HIP_CHECK(hipSetDevice(1)); HIP_CHECK(hipPointerGetAttribute(&data, HIP_POINTER_ATTRIBUTE_MEMORY_TYPE, reinterpret_cast(A_d))); REQUIRE(data == hipMemoryTypeDevice); HIP_CHECK(hipPointerGetAttribute(&data, HIP_POINTER_ATTRIBUTE_DEVICE_ORDINAL, reinterpret_cast(A_d))); REQUIRE(data == 0); } else { SUCCEED("Machine does not seem to have P2P"); } } else { SUCCEED("skipped the testcase as no of devices is less than 2"); } HIP_CHECK(hipFree(A_d)); } /* Allocate device memory and get the buffer ID by calling hipPointerGetAttribute API with HIP_POINTER_ATTRIBUTE_BUFFER_ID, DeAllocate and Allocate the memory again and ensure that the buffer ID is unique */ TEST_CASE("Unit_hipPointerGetAttribute_BufferID") { HIP_CHECK(hipSetDevice(0)); size_t Nbytes = 0; Nbytes = N * sizeof(int); int* A_d; HIP_CHECK(hipMalloc(&A_d, Nbytes)); unsigned int bufid1, bufid2; HIP_CHECK(hipPointerGetAttribute(&bufid1, HIP_POINTER_ATTRIBUTE_BUFFER_ID, reinterpret_cast(A_d))); HIP_CHECK(hipFree(A_d)); HIP_CHECK(hipMalloc(&A_d, Nbytes)); HIP_CHECK(hipPointerGetAttribute(&bufid2, HIP_POINTER_ATTRIBUTE_BUFFER_ID, reinterpret_cast(A_d))); REQUIRE(bufid1 != bufid2); HIP_CHECK(hipFree(A_d)); } /* Allocate host memory and get the device ordinal by calling hipPointerGetAttribute API with HIP_POINTER_ATTRIBUTE_DEVICE_ORDINAL and ensure that it matches with CUDA result */ #if HT_AMD TEST_CASE("Unit_hipPointerGetAttribute_HostDeviceOrdinal") { size_t Nbytes = 0; Nbytes = N * sizeof(int); int* A_h; unsigned int data = 0, data1 = 0; A_h = reinterpret_cast(malloc(Nbytes)); for (unsigned int i = 0; i < N; i++) { A_h[i] = INT_VAL; } REQUIRE(hipPointerGetAttribute(&data, HIP_POINTER_ATTRIBUTE_DEVICE_ORDINAL, reinterpret_cast(A_h)) == hipErrorInvalidValue); REQUIRE(hipPointerGetAttribute(&data1, HIP_POINTER_ATTRIBUTE_RANGE_SIZE, reinterpret_cast(A_h)) == hipErrorInvalidValue); free(A_h); } #endif /* Allocate managed memory with different flags and trigger hipPointerGetAttribute with the following flags HIP_POINTER_ATTRIBUTE_MAPPED and verify the behaviour */ TEST_CASE("Unit_hipPointerGetAttribute_MappedMem") { HIP_CHECK(hipSetDevice(0)); size_t Nbytes = 0; Nbytes = N * sizeof(int); int *A_d, *A_h; HIP_CHECK(hipMalloc(&A_d, Nbytes)); A_h = reinterpret_cast(malloc(Nbytes)); for (unsigned int i = 0; i < N; i++) { A_h[i] = INT_VAL; } HIP_CHECK(hipMemcpy(A_d, A_h, Nbytes, hipMemcpyHostToDevice)); int *ptr1 = 0, *ptr2 = 0; unsigned int hostMalloc_mapped = 0; unsigned int mallocManaged = 0; HIP_CHECK(hipHostMalloc(&ptr1, Nbytes, hipHostMallocMapped)); HIP_CHECK(hipMallocManaged(&ptr2, Nbytes, hipMemAttachGlobal)); HIP_CHECK(hipPointerGetAttribute(&hostMalloc_mapped, HIP_POINTER_ATTRIBUTE_MAPPED, reinterpret_cast(A_d))); HIP_CHECK(hipPointerGetAttribute(&mallocManaged, HIP_POINTER_ATTRIBUTE_MAPPED, reinterpret_cast(ptr2))); REQUIRE(hostMalloc_mapped == 1); REQUIRE(mallocManaged == 1); HIP_CHECK(hipFree(A_d)); HIP_CHECK(hipHostFree(ptr1)); HIP_CHECK(hipFree(ptr2)); free(A_h); } /* This testcase verifies negative scenarios of hipPointerGetAttribute API */ TEST_CASE("Unit_hipPointerGetAttribute_Negative") { HIP_CHECK(hipSetDevice(0)); size_t Nbytes = 0; constexpr size_t N{100}; Nbytes = N * sizeof(char); char* A_d; HIP_CHECK(hipMalloc(&A_d, Nbytes)); hipDeviceptr_t data = 0; char* A_h; A_h = reinterpret_cast(malloc(Nbytes)); SECTION("Pass nullptr to data") { REQUIRE(hipPointerGetAttribute(nullptr, HIP_POINTER_ATTRIBUTE_DEVICE_POINTER, reinterpret_cast(A_d)) == hipErrorInvalidValue); } SECTION("Pass nullptr to device attribute") { #if HT_AMD REQUIRE(hipPointerGetAttribute(&data, HIP_POINTER_ATTRIBUTE_DEVICE_POINTER, nullptr) == hipErrorInvalidValue); #else REQUIRE(hipPointerGetAttribute(&data, HIP_POINTER_ATTRIBUTE_DEVICE_POINTER, reinterpret_cast(nullptr)) == hipErrorInvalidValue); #endif } SECTION("DeAllocateMem and get the pointer info") { char* B_d; HIP_CHECK(hipMalloc(&B_d, Nbytes)); HIP_CHECK(hipFree(B_d)); REQUIRE(hipPointerGetAttribute(&data, HIP_POINTER_ATTRIBUTE_DEVICE_POINTER, reinterpret_cast(B_d)) == hipErrorInvalidValue); } SECTION("Get Start address of host pointer") { REQUIRE(hipPointerGetAttribute(&data, HIP_POINTER_ATTRIBUTE_RANGE_START_ADDR, reinterpret_cast(A_h)) == hipErrorInvalidValue); } SECTION("Pass HIP_POINTER_ATTRIBUTE_HOST_POINTER to device pointer") { REQUIRE(hipPointerGetAttribute(&data, HIP_POINTER_ATTRIBUTE_HOST_POINTER, reinterpret_cast(A_d)) == hipErrorInvalidValue); } SECTION("Pass BUFFER_ID attribute to host pointer") { REQUIRE(hipPointerGetAttribute(&data, HIP_POINTER_ATTRIBUTE_BUFFER_ID, reinterpret_cast(A_h)) == hipErrorInvalidValue); } SECTION("Pass invalid attribute") { REQUIRE(hipPointerGetAttribute(&data, static_cast(-1), reinterpret_cast(A_h)) == hipErrorInvalidValue); } #if HT_AMD SECTION( "Pass HIP_POINTER_ATTRIBUTE_IS_GPU_DIRECT_RDMA_CAPABLE" "not supported by HIP") { REQUIRE(hipPointerGetAttribute(&data, HIP_POINTER_ATTRIBUTE_IS_GPU_DIRECT_RDMA_CAPABLE, reinterpret_cast(A_d)) == hipErrorNotSupported); } SECTION("Pass HIP_POINTER_ATTRIBUTE_MEMPOOL_HANDLE not supported by HIP") { REQUIRE(hipPointerGetAttribute(&data, HIP_POINTER_ATTRIBUTE_MEMPOOL_HANDLE, reinterpret_cast(A_d)) == hipErrorNotSupported); } SECTION("Pass HIP_POINTER_ATTRIBUTE_P2P_TOKENS not supported by HIP") { REQUIRE(hipPointerGetAttribute(&data, HIP_POINTER_ATTRIBUTE_P2P_TOKENS, reinterpret_cast(A_d)) == hipErrorNotSupported); } SECTION( "Pass HIP_POINTER_ATTRIBUTE_ALLOWED_HANDLE_TYPES" "not supported by HIP") { REQUIRE(hipPointerGetAttribute(&data, HIP_POINTER_ATTRIBUTE_ALLOWED_HANDLE_TYPES, reinterpret_cast(A_d)) == hipErrorNotSupported); } #endif HIP_CHECK(hipFree(A_d)); free(A_h); } /* Allocate memory using different Allocation APIs and check whether IPC CAPABLE attribute returns correctly */ TEST_CASE("Unit_hipPointerGetAttribute_ipc_capable") { HIP_CHECK(hipSetDevice(0)); size_t Nbytes = N * sizeof(int); unsigned int datatype; SECTION("Malloc Allocation") { int *A_d; HIP_CHECK(hipMalloc(&A_d, Nbytes)); HIP_CHECK(hipPointerGetAttribute(&datatype, HIP_POINTER_ATTRIBUTE_IS_LEGACY_HIP_IPC_CAPABLE, reinterpret_cast(A_d))); REQUIRE(datatype == 1); } size_t pitch_A; size_t width{NUM_W * sizeof(char)}; SECTION("Malloc Pitch Allocation") { CHECK_IMAGE_SUPPORT char* A_d; HIP_CHECK(hipMallocPitch(reinterpret_cast(&A_d), &pitch_A, width, NUM_H)); HIP_CHECK(hipPointerGetAttribute(&datatype, HIP_POINTER_ATTRIBUTE_IS_LEGACY_HIP_IPC_CAPABLE, reinterpret_cast(A_d))); REQUIRE(datatype == 1); } #if HT_AMD SECTION("Malloc Array Allocation") { CHECK_IMAGE_SUPPORT hipArray_t B_d; hipChannelFormatDesc desc = hipCreateChannelDesc(); HIP_CHECK(hipMallocArray(&B_d, &desc, NUM_W, NUM_H, hipArrayDefault)); HIP_CHECK_ERROR(hipPointerGetAttribute(&datatype, HIP_POINTER_ATTRIBUTE_IS_LEGACY_HIP_IPC_CAPABLE, reinterpret_cast(B_d)), hipErrorInvalidValue); HIP_CHECK(hipFreeArray(B_d)); } SECTION("Malloc 3D Array Allocation") { CHECK_IMAGE_SUPPORT int width = 10, height = 10, depth = 10; hipArray_t arr; hipChannelFormatDesc channelDesc = hipCreateChannelDesc(sizeof(float) * 8, 0, 0, 0, hipChannelFormatKindFloat); HIP_CHECK(hipMalloc3DArray(&arr, &channelDesc, make_hipExtent(width, height, depth), hipArrayDefault)); HIP_CHECK_ERROR(hipPointerGetAttribute(&datatype, HIP_POINTER_ATTRIBUTE_IS_LEGACY_HIP_IPC_CAPABLE, reinterpret_cast(arr)), hipErrorInvalidValue); HIP_CHECK(hipFreeArray(arr)); } #endif SECTION("VMM Memory Allocation") { size_t granularity = 0; int deviceId = 0; size_t buffer_size = N * sizeof(int); hipDevice_t device; HIP_CHECK(hipDeviceGet(&device, deviceId)); checkVMMSupported(device); hipMemAllocationProp prop{}; prop.type = hipMemAllocationTypePinned; prop.location.type = hipMemLocationTypeDevice; prop.location.id = device; // Current Devices HIP_CHECK( hipMemGetAllocationGranularity(&granularity, &prop, hipMemAllocationGranularityMinimum)); REQUIRE(granularity > 0); size_t size_mem = ((granularity + buffer_size - 1) / granularity) * granularity; hipMemGenericAllocationHandle_t handle; // Allocate physical memory HIP_CHECK(hipMemCreate(&handle, size_mem, &prop, 0)); // Allocate virtual address range void* ptrA; HIP_CHECK(hipMemAddressReserve(&ptrA, size_mem, 0, 0, 0)); HIP_CHECK(hipMemMap(ptrA, size_mem, 0, handle, 0)); // Set access hipMemAccessDesc accessDesc = {}; accessDesc.location.type = hipMemLocationTypeDevice; accessDesc.location.id = device; accessDesc.flags = hipMemAccessFlagsProtReadWrite; // Make the address accessible to GPU 0 HIP_CHECK(hipMemSetAccess(ptrA, size_mem, &accessDesc, 1)); HIP_CHECK(hipPointerGetAttribute(&datatype, HIP_POINTER_ATTRIBUTE_IS_LEGACY_HIP_IPC_CAPABLE, reinterpret_cast(ptrA))); REQUIRE(datatype == 0); } }