680 regels
22 KiB
C++
680 regels
22 KiB
C++
/*
|
|
Copyright (c) 2021-2023 Advanced Micro Devices, Inc. All rights reserved.
|
|
Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
of this software and associated documentation files (the "Software"), to deal
|
|
in the Software without restriction, including without limitation the rights
|
|
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
copies of the Software, and to permit persons to whom the Software is
|
|
furnished to do so, subject to the following conditions:
|
|
The above copyright notice and this permission notice shall be included in
|
|
all copies or substantial portions of the Software.
|
|
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
|
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
|
|
THE SOFTWARE.
|
|
*/
|
|
|
|
/**
|
|
* @addtogroup hipMemcpy3D hipMemcpy3D
|
|
* @{
|
|
* @ingroup MemoryTest
|
|
* `hipMemcpy3D(const hipMemcpy3DParms* p)` -
|
|
* Copies data between 3D objects.
|
|
*/
|
|
|
|
/*
|
|
* This testfile verifies the following scenarios of hipMemcpy3D API
|
|
*
|
|
* 1. Verifying hipMemcpy3D API for H2D,D2D and D2H scenarios for
|
|
different datatypes and sizes.
|
|
* 2. Verifying Negative Scenarios
|
|
* 3. Verifying Extent validation scenarios by passing 0
|
|
* 4. Verifying hipMemcpy3D API by allocating Memory in
|
|
* one GPU and trigger hipMemcpy3D from peer GPU
|
|
*
|
|
*/
|
|
|
|
#include <hip_test_common.hh>
|
|
#include <hip_test_checkers.hh>
|
|
|
|
static constexpr auto width{10};
|
|
static constexpr auto height{10};
|
|
static constexpr auto depth{10};
|
|
|
|
template <typename T> class Memcpy3D {
|
|
size_t width, height, depth;
|
|
size_t size;
|
|
hipArray_t arr, arr1;
|
|
hipChannelFormatKind formatKind;
|
|
hipMemcpy3DParms myparms;
|
|
T* hData;
|
|
|
|
public:
|
|
Memcpy3D(size_t l_width, size_t l_height, size_t l_depth, hipChannelFormatKind l_format);
|
|
void simple_Memcpy3D();
|
|
void Extent_Validation();
|
|
void NegativeTests();
|
|
void AllocateMemory();
|
|
void DeAllocateMemory();
|
|
void SetDefaultData();
|
|
void D2D_DeviceMem_OnDiffDevice();
|
|
void D2H_H2D_DeviceMem_OnDiffDevice();
|
|
};
|
|
|
|
/*
|
|
* This API sets the default values of hipMemcpy3DParms structure
|
|
*/
|
|
template <typename T> void Memcpy3D<T>::SetDefaultData() {
|
|
myparms.srcPos = make_hipPos(0, 0, 0);
|
|
myparms.dstPos = make_hipPos(0, 0, 0);
|
|
myparms.extent = make_hipExtent(width, height, depth);
|
|
}
|
|
|
|
/*
|
|
* Constructor initalized width,depth and height
|
|
*/
|
|
template <typename T> Memcpy3D<T>::Memcpy3D(size_t l_width, size_t l_height, size_t l_depth,
|
|
hipChannelFormatKind l_format) {
|
|
width = l_width;
|
|
height = l_height;
|
|
depth = l_depth;
|
|
formatKind = l_format;
|
|
}
|
|
|
|
/*
|
|
* Allocating Memory and initalizing data for both
|
|
* device and host variables
|
|
*/
|
|
template <typename T> void Memcpy3D<T>::AllocateMemory() {
|
|
size = width * height * depth * sizeof(T);
|
|
hData = reinterpret_cast<T*>(malloc(size));
|
|
memset(hData, 0, size);
|
|
for (int i = 0; i < depth; i++) {
|
|
for (int j = 0; j < height; j++) {
|
|
for (int k = 0; k < width; k++) {
|
|
hData[i * width * height + j * width + k] = i * width * height + j * width + k;
|
|
}
|
|
}
|
|
}
|
|
hipChannelFormatDesc channelDesc = hipCreateChannelDesc(sizeof(T) * 8, 0, 0, 0, formatKind);
|
|
HIP_CHECK(
|
|
hipMalloc3DArray(&arr, &channelDesc, make_hipExtent(width, height, depth), hipArrayDefault));
|
|
HIP_CHECK(
|
|
hipMalloc3DArray(&arr1, &channelDesc, make_hipExtent(width, height, depth), hipArrayDefault));
|
|
}
|
|
|
|
/*
|
|
* DeAllocates the Memory of device and host variables
|
|
*/
|
|
template <typename T> void Memcpy3D<T>::DeAllocateMemory() {
|
|
HIP_CHECK(hipFreeArray(arr));
|
|
HIP_CHECK(hipFreeArray(arr1));
|
|
free(hData);
|
|
}
|
|
|
|
/*
|
|
* This API verifies both H2D & D2H functionalities of hipMemcpy3D API
|
|
* by allocating memory in one GPU and calling the hipMemcpy3D API
|
|
* from another GPU.
|
|
* H2D case:
|
|
* Input : "hData" is initialized with the respective offset value
|
|
* Output: Destination array "arr" variable.
|
|
*
|
|
* D2H case:
|
|
* Input: "arr" array variable from the above output
|
|
* Output: "hOutputData" variable data is copied from "arr" variable
|
|
*
|
|
* Validating the result by comparing "hData" and "hOutputData" variables
|
|
*/
|
|
template <typename T> void Memcpy3D<T>::D2H_H2D_DeviceMem_OnDiffDevice() {
|
|
HIP_CHECK(hipSetDevice(0));
|
|
int peerAccess = 0;
|
|
HIP_CHECK(hipDeviceCanAccessPeer(&peerAccess, 1, 0));
|
|
if (peerAccess) {
|
|
AllocateMemory();
|
|
// Memory is allocated on device 0 and Memcpy3DAsync triggered from device 1
|
|
HIP_CHECK(hipSetDevice(1));
|
|
|
|
// H2D Scenario
|
|
memset(&myparms, 0x0, sizeof(hipMemcpy3DParms));
|
|
SetDefaultData();
|
|
myparms.srcPtr = make_hipPitchedPtr(hData, width * sizeof(T), width, height);
|
|
myparms.dstArray = arr;
|
|
#ifdef __HIP_PLATFORM_NVIDIA__
|
|
myparms.kind = cudaMemcpyHostToDevice;
|
|
#else
|
|
myparms.kind = hipMemcpyHostToDevice;
|
|
#endif
|
|
REQUIRE(hipMemcpy3D(&myparms) == hipSuccess);
|
|
HIP_CHECK(hipDeviceSynchronize());
|
|
|
|
// Device to host
|
|
memset(&myparms, 0x0, sizeof(hipMemcpy3DParms));
|
|
T* hOutputData = reinterpret_cast<T*>(malloc(size));
|
|
memset(hOutputData, 0, size);
|
|
SetDefaultData();
|
|
myparms.dstPtr = make_hipPitchedPtr(hOutputData, width * sizeof(T), width, height);
|
|
myparms.srcArray = arr;
|
|
#ifdef __HIP_PLATFORM_NVIDIA__
|
|
myparms.kind = cudaMemcpyDeviceToHost;
|
|
#else
|
|
myparms.kind = hipMemcpyDeviceToHost;
|
|
#endif
|
|
REQUIRE(hipMemcpy3D(&myparms) == hipSuccess);
|
|
HIP_CHECK(hipDeviceSynchronize());
|
|
|
|
// Validating the result
|
|
HipTest::checkArray(hData, hOutputData, width, height, depth);
|
|
free(hOutputData);
|
|
DeAllocateMemory();
|
|
} else {
|
|
SUCCEED("Skipped the test as there is no peer access\n");
|
|
}
|
|
}
|
|
/*
|
|
* This API verifies both D2D functionalities of hipMemcpy3D API
|
|
* by allocating memory in one GPU and calling the hipMemcpy3D API
|
|
* from another GPU.
|
|
*
|
|
* D2D case:
|
|
* Input : "arr" variable is initialized with the "hData" variable in GPU-0
|
|
* Output: "arr2" variable in GPU-0
|
|
*
|
|
* hipMemcpy3D API is triggered from GPU-1
|
|
* The "arr2" variable is then copied to "hOutputData" for validating
|
|
* the result
|
|
*
|
|
* Validating the result by comparing "hData" and "hOutputData" variables
|
|
*/
|
|
template <typename T> void Memcpy3D<T>::D2D_DeviceMem_OnDiffDevice() {
|
|
HIP_CHECK(hipSetDevice(0));
|
|
int peerAccess = 0;
|
|
HIP_CHECK(hipDeviceCanAccessPeer(&peerAccess, 0, 1));
|
|
if (peerAccess) {
|
|
AllocateMemory();
|
|
memset(&myparms, 0x0, sizeof(hipMemcpy3DParms));
|
|
SetDefaultData();
|
|
|
|
// Host to device copy
|
|
myparms.srcPtr = make_hipPitchedPtr(hData, width * sizeof(T), width, height);
|
|
myparms.dstArray = arr;
|
|
#ifdef __HIP_PLATFORM_NVIDIA__
|
|
myparms.kind = cudaMemcpyHostToDevice;
|
|
#else
|
|
myparms.kind = hipMemcpyHostToDevice;
|
|
#endif
|
|
REQUIRE(hipMemcpy3D(&myparms) == hipSuccess);
|
|
hipArray_t arr2;
|
|
hipChannelFormatDesc channelDesc1 = hipCreateChannelDesc(sizeof(T) * 8, 0, 0, 0, formatKind);
|
|
HIP_CHECK(hipMalloc3DArray(&arr2, &channelDesc1, make_hipExtent(width, height, depth),
|
|
hipArrayDefault));
|
|
|
|
// Allocating Mem on GPU device 0 and trigger hipMemcpy3D from GPU 1
|
|
HIP_CHECK(hipSetDevice(1));
|
|
|
|
// D2D Scenario
|
|
memset(&myparms, 0x0, sizeof(hipMemcpy3DParms));
|
|
SetDefaultData();
|
|
myparms.srcArray = arr;
|
|
myparms.dstArray = arr2;
|
|
#ifdef __HIP_PLATFORM_NVIDIA__
|
|
myparms.kind = cudaMemcpyDeviceToDevice;
|
|
#else
|
|
myparms.kind = hipMemcpyDeviceToDevice;
|
|
#endif
|
|
REQUIRE(hipMemcpy3D(&myparms) == hipSuccess);
|
|
HIP_CHECK(hipDeviceSynchronize());
|
|
|
|
// For validating the D2D copy copying it again to hOutputData and
|
|
// verifying it with iniital data hData
|
|
memset(&myparms, 0x0, sizeof(hipMemcpy3DParms));
|
|
T* hOutputData = reinterpret_cast<T*>(malloc(size));
|
|
memset(hOutputData, 0, size);
|
|
SetDefaultData();
|
|
|
|
// Device to host
|
|
myparms.dstPtr = make_hipPitchedPtr(hOutputData, width * sizeof(T), width, height);
|
|
myparms.srcArray = arr2;
|
|
#ifdef __HIP_PLATFORM_NVIDIA__
|
|
myparms.kind = cudaMemcpyDeviceToHost;
|
|
#else
|
|
myparms.kind = hipMemcpyDeviceToHost;
|
|
#endif
|
|
REQUIRE(hipMemcpy3D(&myparms) == hipSuccess);
|
|
HIP_CHECK(hipDeviceSynchronize());
|
|
HipTest::checkArray(hData, hOutputData, width, height, depth);
|
|
|
|
// DeAllocating Memory
|
|
free(hOutputData);
|
|
DeAllocateMemory();
|
|
} else {
|
|
SUCCEED("Skipped the test as there is no peer access\n");
|
|
}
|
|
}
|
|
/*
|
|
* This API verifies all the negative scenarios of hipMemcpy3D API
|
|
*/
|
|
template <typename T> void Memcpy3D<T>::NegativeTests() {
|
|
HIP_CHECK(hipSetDevice(0));
|
|
AllocateMemory();
|
|
|
|
// Initialization of data
|
|
memset(&myparms, 0, sizeof(myparms));
|
|
myparms.srcPos = make_hipPos(0, 0, 0);
|
|
myparms.dstPos = make_hipPos(0, 0, 0);
|
|
myparms.extent = make_hipExtent(width, height, depth);
|
|
#ifdef __HIP_PLATFORM_NVIDIA__
|
|
myparms.kind = cudaMemcpyHostToDevice;
|
|
#else
|
|
myparms.kind = hipMemcpyHostToDevice;
|
|
#endif
|
|
|
|
SECTION("Nullptr to destination array") {
|
|
myparms.srcPtr = make_hipPitchedPtr(hData, width * sizeof(T), width, height);
|
|
myparms.dstArray = nullptr;
|
|
REQUIRE(hipMemcpy3D(&myparms) != hipSuccess);
|
|
}
|
|
|
|
SECTION("Nullptr to source array") {
|
|
myparms.srcArray = nullptr;
|
|
myparms.dstPtr = make_hipPitchedPtr(hData, width * sizeof(T), width, height);
|
|
REQUIRE(hipMemcpy3D(&myparms) != hipSuccess);
|
|
}
|
|
|
|
SECTION("Passing both Source ptr and array") {
|
|
myparms.srcPtr = make_hipPitchedPtr(hData, width * sizeof(T), width, height);
|
|
myparms.srcArray = arr;
|
|
myparms.dstArray = arr1;
|
|
REQUIRE(hipMemcpy3D(&myparms) != hipSuccess);
|
|
}
|
|
|
|
SECTION("Passing both destination ptr and array") {
|
|
myparms.dstPtr = make_hipPitchedPtr(hData, width * sizeof(T), width, height);
|
|
myparms.dstArray = arr;
|
|
myparms.srcArray = arr1;
|
|
REQUIRE(hipMemcpy3D(&myparms) != hipSuccess);
|
|
}
|
|
|
|
SECTION("Passing Max value to extent") {
|
|
myparms.srcPtr = make_hipPitchedPtr(hData, width * sizeof(T), width, height);
|
|
myparms.dstArray = arr;
|
|
myparms.extent =
|
|
make_hipExtent(std::numeric_limits<int>::max(), std::numeric_limits<int>::max(),
|
|
std::numeric_limits<int>::max());
|
|
REQUIRE(hipMemcpy3D(&myparms) != hipSuccess);
|
|
}
|
|
|
|
SECTION("Passing Source pitchedPtr as nullptr") {
|
|
myparms.srcPtr = make_hipPitchedPtr(nullptr, width * sizeof(T), width, height);
|
|
myparms.dstArray = arr;
|
|
REQUIRE(hipMemcpy3D(&myparms) != hipSuccess);
|
|
}
|
|
|
|
SECTION("Passing Dst pitchedPtr as nullptr") {
|
|
myparms.dstPtr = make_hipPitchedPtr(nullptr, width * sizeof(T), width, height);
|
|
myparms.srcArray = arr;
|
|
REQUIRE(hipMemcpy3D(&myparms) != hipSuccess);
|
|
}
|
|
|
|
SECTION("Passing width > max width size in extent") {
|
|
myparms.extent = make_hipExtent(width + 1, height, depth);
|
|
myparms.dstArray = arr;
|
|
myparms.srcPtr = make_hipPitchedPtr(hData, width * sizeof(T), width, height);
|
|
REQUIRE(hipMemcpy3D(&myparms) != hipSuccess);
|
|
}
|
|
|
|
SECTION("Passing hgt > max width size in extent") {
|
|
myparms.extent = make_hipExtent(width, height + 1, depth);
|
|
myparms.srcPtr = make_hipPitchedPtr(hData, width * sizeof(T), width, height);
|
|
myparms.dstArray = arr;
|
|
REQUIRE(hipMemcpy3D(&myparms) != hipSuccess);
|
|
}
|
|
|
|
SECTION("Passing depth > max width size in extent") {
|
|
myparms.extent = make_hipExtent(width, height, depth + 1);
|
|
myparms.dstArray = arr;
|
|
myparms.srcPtr = make_hipPitchedPtr(hData, width * sizeof(T), width, height);
|
|
REQUIRE(hipMemcpy3D(&myparms) != hipSuccess);
|
|
}
|
|
|
|
SECTION("Passing dst width pos > max allocated width") {
|
|
myparms.dstPos = make_hipPos(width + 1, 0, 0);
|
|
myparms.dstArray = arr;
|
|
myparms.srcPtr = make_hipPitchedPtr(hData, width * sizeof(T), width, height);
|
|
REQUIRE(hipMemcpy3D(&myparms) != hipSuccess);
|
|
}
|
|
|
|
SECTION("Passing dst height pos > max allocated hgt") {
|
|
myparms.dstPos = make_hipPos(0, height + 1, 0);
|
|
myparms.dstArray = arr;
|
|
myparms.srcPtr = make_hipPitchedPtr(hData, width * sizeof(T), width, height);
|
|
REQUIRE(hipMemcpy3D(&myparms) != hipSuccess);
|
|
}
|
|
|
|
SECTION("Passing dst depth pos > max allocated depth") {
|
|
myparms.dstPos = make_hipPos(0, 0, depth + 1);
|
|
myparms.dstArray = arr;
|
|
myparms.srcPtr = make_hipPitchedPtr(hData, width * sizeof(T), width, height);
|
|
REQUIRE(hipMemcpy3D(&myparms) != hipSuccess);
|
|
}
|
|
|
|
SECTION("Passing src width pos > max allocated width") {
|
|
myparms.srcPos = make_hipPos(width + 1, 0, 0);
|
|
myparms.srcArray = arr;
|
|
myparms.dstArray = arr1;
|
|
#ifdef __HIP_PLATFORM_NVIDIA__
|
|
myparms.kind = cudaMemcpyDeviceToDevice;
|
|
#else
|
|
myparms.kind = hipMemcpyDeviceToDevice;
|
|
#endif
|
|
REQUIRE(hipMemcpy3D(&myparms) != hipSuccess);
|
|
}
|
|
|
|
SECTION("Passing src height pos > max allocated hgt") {
|
|
myparms.srcPos = make_hipPos(0, height + 1, 0);
|
|
myparms.srcArray = arr;
|
|
myparms.dstArray = arr1;
|
|
#ifdef __HIP_PLATFORM_NVIDIA__
|
|
myparms.kind = cudaMemcpyDeviceToDevice;
|
|
#else
|
|
myparms.kind = hipMemcpyDeviceToDevice;
|
|
#endif
|
|
REQUIRE(hipMemcpy3D(&myparms) != hipSuccess);
|
|
}
|
|
|
|
SECTION("Passing src height pos > max allocated hgt") {
|
|
myparms.srcPos = make_hipPos(0, 0, depth + 1);
|
|
myparms.srcArray = arr;
|
|
myparms.dstArray = arr1;
|
|
#ifdef __HIP_PLATFORM_NVIDIA__
|
|
myparms.kind = cudaMemcpyDeviceToDevice;
|
|
#else
|
|
myparms.kind = hipMemcpyDeviceToDevice;
|
|
#endif
|
|
REQUIRE(hipMemcpy3D(&myparms) != hipSuccess);
|
|
}
|
|
|
|
SECTION("Passing src array size > dst array size") {
|
|
// Passing src array size greater than destination array size
|
|
hipArray_t arr2;
|
|
hipChannelFormatDesc channelDesc1 = hipCreateChannelDesc(sizeof(T) * 8, 0, 0, 0, formatKind);
|
|
HIP_CHECK(hipMalloc3DArray(&arr2, &channelDesc1, make_hipExtent(3, 3, 3), hipArrayDefault));
|
|
myparms.srcArray = arr;
|
|
myparms.dstArray = arr2;
|
|
#ifdef __HIP_PLATFORM_NVIDIA__
|
|
myparms.kind = cudaMemcpyDeviceToDevice;
|
|
#else
|
|
myparms.kind = hipMemcpyDeviceToDevice;
|
|
#endif
|
|
REQUIRE(hipMemcpy3D(&myparms) != hipSuccess);
|
|
}
|
|
|
|
// DeAllocation of memory
|
|
DeAllocateMemory();
|
|
}
|
|
|
|
/*
|
|
* This API verifies the Extent validation Scenarios
|
|
*/
|
|
template <typename T> void Memcpy3D<T>::Extent_Validation() {
|
|
HIP_CHECK(hipSetDevice(0));
|
|
AllocateMemory();
|
|
memset(&myparms, 0x0, sizeof(hipMemcpy3DParms));
|
|
myparms.srcPos = make_hipPos(0, 0, 0);
|
|
myparms.dstPos = make_hipPos(0, 0, 0);
|
|
myparms.srcPtr = make_hipPitchedPtr(hData, width * sizeof(T), width, height);
|
|
myparms.dstArray = arr;
|
|
#ifdef __HIP_PLATFORM_NVIDIA__
|
|
myparms.kind = cudaMemcpyHostToDevice;
|
|
#else
|
|
myparms.kind = hipMemcpyHostToDevice;
|
|
#endif
|
|
SECTION("Passing Extent as 0") {
|
|
myparms.extent = make_hipExtent(0, 0, 0);
|
|
REQUIRE(hipMemcpy3D(&myparms) == hipSuccess);
|
|
}
|
|
SECTION("Passing Width 0 in Extent") {
|
|
myparms.extent = make_hipExtent(0, height, depth);
|
|
REQUIRE(hipMemcpy3D(&myparms) == hipSuccess);
|
|
}
|
|
SECTION("Passing Height 0 in Extent") {
|
|
myparms.extent = make_hipExtent(width, 0, depth);
|
|
REQUIRE(hipMemcpy3D(&myparms) == hipSuccess);
|
|
}
|
|
SECTION("Passing Depth 0 in Extent") {
|
|
myparms.extent = make_hipExtent(width, height, 0);
|
|
REQUIRE(hipMemcpy3D(&myparms) == hipSuccess);
|
|
}
|
|
SECTION("Passing Depth 0 in Extent") { REQUIRE(hipMemcpy3D(nullptr) != hipSuccess); }
|
|
DeAllocateMemory();
|
|
}
|
|
|
|
/*
|
|
* This API verifies H2H-D2D-D2H functionalities of hipMemcpy3D API
|
|
*
|
|
* Input : "arr" variable is initialized with the "hData" variable in GPU-0
|
|
* Output: "arr1" variable in GPU-0
|
|
*
|
|
* The "arr1" variable is then copied to "hOutputData" for validating
|
|
* the result
|
|
*
|
|
* Validating the result by comparing "hData" and "hOutputData" variables
|
|
*/
|
|
|
|
template <typename T> void Memcpy3D<T>::simple_Memcpy3D() {
|
|
HIP_CHECK(hipSetDevice(0));
|
|
AllocateMemory();
|
|
|
|
// Host to Device
|
|
memset(&myparms, 0x0, sizeof(hipMemcpy3DParms));
|
|
SetDefaultData();
|
|
myparms.srcPtr = make_hipPitchedPtr(hData, width * sizeof(T), width, height);
|
|
myparms.dstArray = arr;
|
|
#ifdef __HIP_PLATFORM_NVIDIA__
|
|
myparms.kind = cudaMemcpyHostToDevice;
|
|
#else
|
|
myparms.kind = hipMemcpyHostToDevice;
|
|
#endif
|
|
REQUIRE(hipMemcpy3D(&myparms) == hipSuccess);
|
|
|
|
// Array to Array
|
|
memset(&myparms, 0x0, sizeof(hipMemcpy3DParms));
|
|
SetDefaultData();
|
|
myparms.srcArray = arr;
|
|
myparms.dstArray = arr1;
|
|
#ifdef __HIP_PLATFORM_NVIDIA__
|
|
myparms.kind = cudaMemcpyDeviceToDevice;
|
|
#else
|
|
myparms.kind = hipMemcpyDeviceToDevice;
|
|
#endif
|
|
REQUIRE(hipMemcpy3D(&myparms) == hipSuccess);
|
|
T* hOutputData = reinterpret_cast<T*>(malloc(size));
|
|
memset(hOutputData, 0, size);
|
|
|
|
// Device to host
|
|
memset(&myparms, 0x0, sizeof(hipMemcpy3DParms));
|
|
SetDefaultData();
|
|
myparms.dstPtr = make_hipPitchedPtr(hOutputData, width * sizeof(T), width, height);
|
|
myparms.srcArray = arr1;
|
|
#ifdef __HIP_PLATFORM_NVIDIA__
|
|
myparms.kind = cudaMemcpyDeviceToHost;
|
|
#else
|
|
myparms.kind = hipMemcpyDeviceToHost;
|
|
#endif
|
|
REQUIRE(hipMemcpy3D(&myparms) == hipSuccess);
|
|
|
|
// Validating the result
|
|
HipTest::checkArray(hData, hOutputData, width, height, depth);
|
|
|
|
// DeAllocating the Memory
|
|
free(hOutputData);
|
|
DeAllocateMemory();
|
|
}
|
|
|
|
/**
|
|
* Test Description
|
|
* ------------------------
|
|
* - This testcase performs hipMemcpy3D API validation for
|
|
different datatypes and different sizes
|
|
* Test source
|
|
* ------------------------
|
|
* - unit/memory/hipMemcpy3D_old.cc
|
|
* Test requirements
|
|
* ------------------------
|
|
* - HIP_VERSION >= 5.2
|
|
*/
|
|
|
|
TEMPLATE_TEST_CASE("Unit_hipMemcpy3D_Basic", "[hipMemcpy3D]", int, unsigned int, float) {
|
|
CHECK_IMAGE_SUPPORT
|
|
int device = -1;
|
|
HIP_CHECK(hipGetDevice(&device));
|
|
hipDeviceProp_t prop;
|
|
HIP_CHECK(hipGetDeviceProperties(&prop, device));
|
|
auto i = GENERATE_COPY(10, 100, 1024, prop.maxTexture3D[0]);
|
|
auto j = GENERATE(10, 100);
|
|
int numDevices = 0;
|
|
HIP_CHECK(hipGetDeviceCount(&numDevices));
|
|
if (numDevices > 1) {
|
|
if (std::is_same<TestType, float>::value) {
|
|
Memcpy3D<TestType> memcpy3d_obj(i, j, j, hipChannelFormatKindFloat);
|
|
memcpy3d_obj.simple_Memcpy3D();
|
|
} else if (std::is_same<TestType, unsigned int>::value) {
|
|
Memcpy3D<TestType> memcpy3d_obj(i, j, j, hipChannelFormatKindUnsigned);
|
|
memcpy3d_obj.simple_Memcpy3D();
|
|
} else if (std::is_same<TestType, int>::value) {
|
|
Memcpy3D<TestType> memcpy3d_obj(i, j, j, hipChannelFormatKindSigned);
|
|
memcpy3d_obj.simple_Memcpy3D();
|
|
}
|
|
} else {
|
|
SUCCEED("skipping the testcases as numDevices < 2");
|
|
}
|
|
}
|
|
|
|
/**
|
|
* Test Description
|
|
* ------------------------
|
|
* - This testcase performs the extent validation scenarios of hipMemcpy3D API
|
|
* Test source
|
|
* ------------------------
|
|
* - unit/memory/hipMemcpy3D_old.cc
|
|
* Test requirements
|
|
* ------------------------
|
|
* - HIP_VERSION >= 5.2
|
|
*/
|
|
|
|
TEST_CASE("Unit_hipMemcpy3D_ExtentValidation") {
|
|
CHECK_IMAGE_SUPPORT
|
|
Memcpy3D<int> memcpy3d(width, height, depth, hipChannelFormatKindSigned);
|
|
memcpy3d.Extent_Validation();
|
|
}
|
|
|
|
/**
|
|
* Test Description
|
|
* ------------------------
|
|
* - This testcase performs the negative scenarios of hipMemcpy3D API
|
|
* Test source
|
|
* ------------------------
|
|
* - unit/memory/hipMemcpy3D_old.cc
|
|
* Test requirements
|
|
* ------------------------
|
|
* - HIP_VERSION >= 5.2
|
|
*/
|
|
|
|
TEST_CASE("Unit_hipMemcpy3D_multiDevice-Negative") {
|
|
CHECK_IMAGE_SUPPORT
|
|
int numDevices = 0;
|
|
HIP_CHECK(hipGetDeviceCount(&numDevices));
|
|
if (numDevices > 1) {
|
|
Memcpy3D<int> memcpy3d(width, height, depth, hipChannelFormatKindSigned);
|
|
memcpy3d.NegativeTests();
|
|
} else {
|
|
SUCCEED("skipping the testcases as numDevices < 2");
|
|
}
|
|
}
|
|
|
|
/**
|
|
* Test Description
|
|
* ------------------------
|
|
* - This testcase performs the D2H,H2D and D2D on peer GPU device
|
|
1. Verify with D2H & H2D On DiffDevice
|
|
2. Verify with D2D On DiffDevice
|
|
* Test source
|
|
* ------------------------
|
|
* - unit/memory/hipMemcpy3D_old.cc
|
|
* Test requirements
|
|
* ------------------------
|
|
* - HIP_VERSION >= 5.2
|
|
*/
|
|
|
|
TEST_CASE("Unit_hipMemcpy3D_multiDevice-OnPeerDevice", "[multigpu]") {
|
|
CHECK_IMAGE_SUPPORT
|
|
int numDevices = 0;
|
|
HIP_CHECK(hipGetDeviceCount(&numDevices));
|
|
if (numDevices > 1) {
|
|
SECTION("D2H & H2D On DiffDevice") {
|
|
Memcpy3D<float> memcpy3d_d2h_obj(width, height, depth, hipChannelFormatKindFloat);
|
|
memcpy3d_d2h_obj.D2H_H2D_DeviceMem_OnDiffDevice();
|
|
}
|
|
|
|
SECTION("D2D On DiffDevice") {
|
|
Memcpy3D<float> memcpy3d_d2d_obj(width, height, depth, hipChannelFormatKindFloat);
|
|
memcpy3d_d2d_obj.D2D_DeviceMem_OnDiffDevice();
|
|
}
|
|
} else {
|
|
SUCCEED("skipping the testcases as numDevices < 2");
|
|
}
|
|
}
|
|
|
|
/**
|
|
* Test Description
|
|
* ------------------------
|
|
* - This testcase performs multidevice size check on hipMemcpy3D API
|
|
1. Verify with 128 for all height, width & depth value
|
|
2. Verify with 256 for height and 128 for width & depth value
|
|
3. Verify with 256 for width and 128 for height & depth value
|
|
4. Verify with 256 for depth and 128 for height & width value
|
|
* Test source
|
|
* ------------------------
|
|
* - unit/memory/hipMemcpy3D_old.cc
|
|
* Test requirements
|
|
* ------------------------
|
|
* - HIP_VERSION >= 6.0
|
|
*/
|
|
|
|
TEST_CASE("Unit_hipMemcpy3D_multiDevice_Basic_Size_Test", "[multigpu]") {
|
|
CHECK_IMAGE_SUPPORT
|
|
constexpr int size_128b = 128, size_256b = 256;
|
|
int numDevices = 0;
|
|
HIP_CHECK(hipGetDeviceCount(&numDevices));
|
|
|
|
for (int i = 0; i < numDevices; i++) {
|
|
HIP_CHECK(hipSetDevice(i));
|
|
|
|
SECTION("Verify with 128 for all height, width & depth value") {
|
|
Memcpy3D<int> memcpy3d_obj1(size_128b, size_128b, size_128b, hipChannelFormatKindUnsigned);
|
|
memcpy3d_obj1.simple_Memcpy3D();
|
|
}
|
|
SECTION("Verify with 256 for height and 128 for width & depth value") {
|
|
Memcpy3D<int> memcpy3d_obj2(size_256b, size_128b, size_128b, hipChannelFormatKindUnsigned);
|
|
memcpy3d_obj2.simple_Memcpy3D();
|
|
}
|
|
SECTION("Verify with 256 for width and 128 for height & depth value") {
|
|
Memcpy3D<float> memcpy3d_obj3(size_128b, size_256b, size_128b, hipChannelFormatKindFloat);
|
|
memcpy3d_obj3.simple_Memcpy3D();
|
|
}
|
|
SECTION("Verify with 256 for depth and 128 for height & width value") {
|
|
Memcpy3D<unsigned int> memcpy3d_obj4(size_128b, size_128b, size_256b,
|
|
hipChannelFormatKindUnsigned);
|
|
memcpy3d_obj4.simple_Memcpy3D();
|
|
}
|
|
}
|
|
}
|
|
|
|
/**
|
|
* End doxygen group MemoryTest.
|
|
* @}
|
|
*/
|