Files

244 строки
8.1 KiB
C++

/*
Copyright (c) 2024 Advanced Micro Devices, Inc. All rights reserved.
Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the "Software"), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:
The above copyright notice and this permission notice shall be included in
all copies or substantial portions of the Software.
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
THE SOFTWARE.
*/
#include <hip_test_common.hh>
#include <hip_test_checkers.hh>
#include <hip_test_defgroups.hh>
#include <numeric>
#define N 32
TEMPLATE_TEST_CASE("Unit_hipMemcpyHtoAAsync_Basic", "", char, int, float) {
CHECK_IMAGE_SUPPORT
hipArray_t dst_array = nullptr;
std::vector<TestType> host_src(N);
std::vector<TestType> host_dst(N);
size_t copy_size = N * sizeof(TestType);
size_t offset = GENERATE(0, N * sizeof(TestType) / 2);
std::iota(host_src.begin(), host_src.end(), 0);
auto channel_descriptor = hipCreateChannelDesc<TestType>();
HIP_CHECK(hipMallocArray(&dst_array, &channel_descriptor, copy_size));
HIP_CHECK(hipMemcpyHtoAAsync(dst_array, offset, host_src.data(), copy_size - offset, nullptr));
HIP_CHECK(hipStreamSynchronize(nullptr));
HIP_CHECK(hipMemcpyAtoH(host_dst.data(), dst_array, offset, copy_size - offset));
for (int i = 0; i < offset / sizeof(TestType); i++) {
if (host_src[i] != host_dst[i]) {
REQUIRE(false);
}
}
HIP_CHECK(hipFreeArray(dst_array));
}
TEST_CASE("Unit_hipMemcpyHtoAAsync_Negative") {
CHECK_IMAGE_SUPPORT
hipArray_t dst_array = nullptr;
std::vector<int> host_src(N);
size_t copy_size = N * sizeof(int);
std::iota(host_src.begin(), host_src.end(), 0);
auto channel_descriptor = hipCreateChannelDesc<int>();
HIP_CHECK(hipMallocArray(&dst_array, &channel_descriptor, copy_size));
SECTION("dst array is null") {
HIP_CHECK_ERROR(hipMemcpyHtoAAsync(nullptr, 0, host_src.data(), copy_size, nullptr),
hipErrorInvalidValue);
}
SECTION("src is nullptr") {
HIP_CHECK_ERROR(hipMemcpyHtoAAsync(dst_array, 0, nullptr, copy_size, nullptr),
hipErrorInvalidValue);
}
SECTION("copy size is negative") {
HIP_CHECK_ERROR(hipMemcpyHtoAAsync(dst_array, 0, host_src.data(), -1, nullptr),
hipErrorInvalidValue);
}
HIP_CHECK(hipFreeArray(dst_array));
}
/**
* @addtogroup hipMemcpyHtoAAsync hipMemcpyHtoAAsync
* @{
* @ingroup MemoryTest
* `hipError_t hipMemcpyHtoAAsync(hipArray_t dstArray, size_t dstOffset,
* const void* srcHost,
size_t ByteCount, hipStream_t stream)` -
* Copies from host memory to a 1D array.
*/
/**
* Test Description
* ------------------------
* - This testcase is to verify the basic functionality of hipMemcpyHtoAAsync API
* with different streams.
* Test source
* ------------------------
* - unit/memory/hipMemcpyHtoAAsync.cc
* Test requirements
* ------------------------
* - HIP_VERSION >= 6.2
*/
TEST_CASE("Unit_hipMemcpyHtoAAsync_BasicTstsWithDiffStreams") {
#if HT_NVIDIA
HipTest::HIP_SKIP_TEST("API currently unsupported on nvidia, skipping...");
return;
#else
CHECK_IMAGE_SUPPORT
HIP_CHECK(hipSetDevice(0));
int row, col;
row = 1;
col = GENERATE(3, 4, 100);
int* A_h = reinterpret_cast<int*>(malloc(sizeof(int) * row * col));
int* B_h = reinterpret_cast<int*>(malloc(sizeof(int) * row * col));
for (int i = 0; i < (row * col); i++) {
B_h[i] = i;
}
hipArray_t A_a;
hipChannelFormatDesc desc = hipCreateChannelDesc<int>();
HIP_CHECK(hipMallocArray(&A_a, &desc, col, row, hipArrayDefault));
SECTION("With Default Stream") {
HIP_CHECK(hipMemcpyHtoAAsync(A_a, 0, B_h, sizeof(int) * col * row, 0));
HIP_CHECK(hipMemcpyAtoHAsync(A_h, A_a, 0, sizeof(int) * col * row, 0));
HIP_CHECK(hipStreamSynchronize(0));
}
SECTION("With User Stream") {
hipStream_t stream;
HIP_CHECK(hipStreamCreate(&stream));
HIP_CHECK(hipMemcpyHtoAAsync(A_a, 0, B_h, sizeof(int) * col * row, stream));
HIP_CHECK(hipMemcpyAtoHAsync(A_h, A_a, 0, sizeof(int) * col * row, stream));
HIP_CHECK(hipStreamSynchronize(stream));
HIP_CHECK(hipStreamDestroy(stream));
}
SECTION("With Stream per thread") {
HIP_CHECK(hipMemcpyHtoAAsync(A_a, 0, B_h, sizeof(int) * col * row, hipStreamPerThread));
HIP_CHECK(hipMemcpyAtoHAsync(A_h, A_a, 0, sizeof(int) * col * row, hipStreamPerThread));
HIP_CHECK(hipStreamSynchronize(hipStreamPerThread));
}
SECTION("With Legacy Stream") {
HIP_CHECK(hipMemcpyHtoAAsync(A_a, 0, B_h, sizeof(int) * col * row, hipStreamLegacy));
HIP_CHECK(hipMemcpyAtoHAsync(A_h, A_a, 0, sizeof(int) * col * row, hipStreamLegacy));
HIP_CHECK(hipStreamSynchronize(hipStreamLegacy));
}
for (int i = 0; i < (row * col); i++) {
REQUIRE(A_h[i] == B_h[i]);
}
HIP_CHECK(hipFreeArray(A_a));
free(A_h);
free(B_h);
#endif
}
/**
* Test Description
* ------------------------
* - This testcase is to verify the basic functionality of hipMemcpyHtoAAsync API
* with different streams on multiple devices.
* Test source
* ------------------------
* - unit/memory/hipMemcpyHtoAAsync.cc
* Test requirements
* ------------------------
* - HIP_VERSION >= 6.2
*/
TEST_CASE("Unit_hipMemcpyHtoAAsync_MultiDevice", "[multigpu]") {
#if HT_NVIDIA
HipTest::HIP_SKIP_TEST("API currently unsupported on nvidia, skipping...");
return;
#else
CHECK_IMAGE_SUPPORT
int devCount = 0;
HIP_CHECK(hipGetDeviceCount(&devCount));
for (int i = 0; i < devCount; i++) {
HIP_CHECK(hipSetDevice(i));
int row, col;
row = 1;
col = GENERATE(3, 4, 100);
int* A_h = reinterpret_cast<int*>(malloc(sizeof(int) * row * col));
int* B_h = reinterpret_cast<int*>(malloc(sizeof(int) * row * col));
for (int i = 0; i < (row * col); i++) {
B_h[i] = i;
}
hipArray_t A_a;
hipChannelFormatDesc desc = hipCreateChannelDesc<int>();
HIP_CHECK(hipMallocArray(&A_a, &desc, col, row, hipArrayDefault));
hipStream_t stream;
HIP_CHECK(hipStreamCreate(&stream));
HIP_CHECK(hipMemcpyHtoAAsync(A_a, 0, B_h, sizeof(int) * col * row, stream));
HIP_CHECK(hipMemcpyAtoHAsync(A_h, A_a, 0, sizeof(int) * col * row, stream));
HIP_CHECK(hipStreamSynchronize(stream));
for (int i = 0; i < (row * col); i++) {
REQUIRE(A_h[i] == B_h[i]);
}
HIP_CHECK(hipFreeArray(A_a));
HIP_CHECK(hipStreamDestroy(stream));
free(A_h);
free(B_h);
}
#endif
}
TEST_CASE("UnitHipMemcpyHtoAAsync_Capture") {
CHECK_IMAGE_SUPPORT
auto host_src = std::make_unique<std::vector<int>>(N);
auto host_dst = std::make_unique<std::vector<int>>(N);
constexpr size_t kCopySize = N * sizeof(int);
size_t offset = GENERATE(0, N * sizeof(int) / 2);
std::iota(host_src->begin(), host_src->end(), 0);
auto channel_desc = hipCreateChannelDesc<int>();
hipArray_t dst_array = nullptr;
HIP_CHECK(hipMallocArray(&dst_array, &channel_desc, kCopySize));
hipStream_t stream = nullptr;
HIP_CHECK(hipStreamCreate(&stream));
GENERATE_CAPTURE();
BEGIN_CAPTURE(stream);
HIP_CHECK(hipMemcpyHtoAAsync(dst_array, offset, host_src->data(), kCopySize - offset, nullptr));
END_CAPTURE(stream);
HIP_CHECK(hipStreamSynchronize(nullptr));
HIP_CHECK(hipMemcpyAtoH(host_dst->data(), dst_array, offset, kCopySize - offset));
for (size_t i = 0; i < offset / sizeof(int); ++i) {
REQUIRE((*host_src)[i] == (*host_dst)[i]);
}
HIP_CHECK(hipFreeArray(dst_array));
HIP_CHECK(hipStreamDestroy(stream));
}
/**
* End doxygen group MemoryTest.
* @}
*/