146 lines
6.2 KiB
C++
146 lines
6.2 KiB
C++
/*
|
|
Copyright (c) 2021 Advanced Micro Devices, Inc. All rights reserved.
|
|
Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
of this software and associated documentation files (the "Software"), to deal
|
|
in the Software without restriction, including without limitation the rights
|
|
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
copies of the Software, and to permit persons to whom the Software is
|
|
furnished to do so, subject to the following conditions:
|
|
The above copyright notice and this permission notice shall be included in
|
|
all copies or substantial portions of the Software.
|
|
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
|
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
|
|
THE SOFTWARE.
|
|
*/
|
|
|
|
#include <hip_test_common.hh>
|
|
#include <hip_test_kernels.hh>
|
|
#include <hip_test_checkers.hh>
|
|
/*
|
|
This testfile verifies the following scenarios of hipMemcpyPeer API
|
|
1. Negative Scenarios
|
|
2. Basic scenario of hipMemcpyPeer API
|
|
*/
|
|
|
|
/*This testcase verifies the negative scenarios of hipmemcpypeer
|
|
*/
|
|
TEST_CASE("Unit_hipMemcpyPeer_Negative", "[multigpu]") {
|
|
constexpr auto numElements{10};
|
|
constexpr auto copy_bytes{numElements * sizeof(int)};
|
|
int numDevices = 0;
|
|
HIP_CHECK(hipGetDeviceCount(&numDevices));
|
|
if (numDevices > 1) {
|
|
int canAccessPeer = 0;
|
|
HIP_CHECK(hipDeviceCanAccessPeer(&canAccessPeer, 0, 1));
|
|
if (canAccessPeer) {
|
|
// Initialization of variables
|
|
int *A_d{nullptr}, *B_d{nullptr};
|
|
int *A_h{nullptr}, *B_h{nullptr};
|
|
HIP_CHECK(hipSetDevice(0));
|
|
HipTest::initArrays<int>(&A_d, nullptr, nullptr, &A_h, &B_h, nullptr,
|
|
numElements * sizeof(int));
|
|
HipTest::setDefaultData<int>(numElements, A_h, B_h, nullptr);
|
|
HIP_CHECK(hipSetDevice(1));
|
|
HipTest::initArrays<int>(nullptr, &B_d, nullptr, nullptr, nullptr, nullptr,
|
|
numElements * sizeof(int));
|
|
HIP_CHECK(hipMemcpy(B_d, B_h, numElements * sizeof(int), hipMemcpyHostToDevice));
|
|
|
|
SECTION("Nullptr to Destination Pointer") {
|
|
REQUIRE(hipMemcpyPeer(nullptr, 1, A_d, 0, copy_bytes) != hipSuccess);
|
|
}
|
|
|
|
SECTION("Nullptr to Source Pointer") {
|
|
REQUIRE(hipMemcpyPeer(B_d, 1, nullptr, 0, copy_bytes) != hipSuccess);
|
|
}
|
|
|
|
SECTION("Pass NumElements as 0") {
|
|
HIP_CHECK(hipMemcpy(A_d, A_h, numElements * sizeof(int), hipMemcpyHostToDevice));
|
|
HIP_CHECK(hipMemcpyPeer(B_d, 1, A_d, 0, 0));
|
|
HIP_CHECK(hipMemcpy(A_h, B_d, numElements * sizeof(int), hipMemcpyDeviceToHost));
|
|
HipTest::checkTest<int>(A_h, B_h, numElements);
|
|
}
|
|
|
|
SECTION("Passing more than allocated size") {
|
|
REQUIRE(hipMemcpyPeer(B_d, 1, A_d, 0, ((numElements + 40) * sizeof(int))) != hipSuccess);
|
|
}
|
|
|
|
SECTION("Passing invalid Destination device ID") {
|
|
REQUIRE(hipMemcpyPeer(B_d, numDevices, A_d, 0, copy_bytes) != hipSuccess);
|
|
}
|
|
|
|
SECTION("Passing invalid Source device ID") {
|
|
REQUIRE(hipMemcpyPeer(B_d, 1, A_d, numDevices, copy_bytes) != hipSuccess);
|
|
}
|
|
HipTest::freeArrays<int>(A_d, B_d, nullptr, A_h, B_h, nullptr, false);
|
|
} else {
|
|
SUCCEED("Machine Does not have P2P capability");
|
|
}
|
|
} else {
|
|
SUCCEED("Number of devices are < 2");
|
|
}
|
|
}
|
|
|
|
/*
|
|
* This test case verifies the basic scenario of hipMemcpyPeer API
|
|
* Initializes data in GPU-0
|
|
* Launches the kernel and performs addition in GPU-0
|
|
* Copies the data from GPU-0 to GPU-1 using hipMemcpyPeer API
|
|
* Then performs the addition and validates the sum
|
|
*/
|
|
TEST_CASE("Unit_hipMemcpyPeer_Basic", "[multigpu]") {
|
|
constexpr auto numElements{10};
|
|
constexpr auto copy_bytes{numElements * sizeof(int)};
|
|
int numDevices = 0;
|
|
HIP_CHECK(hipGetDeviceCount(&numDevices));
|
|
if (numDevices > 1) {
|
|
int canAccessPeer = 0;
|
|
HIP_CHECK(hipDeviceCanAccessPeer(&canAccessPeer, 0, 1));
|
|
if (canAccessPeer) {
|
|
int *A_d{nullptr}, *B_d{nullptr}, *C_d{nullptr};
|
|
int *X_d{nullptr}, *Y_d{nullptr}, *Z_d{nullptr};
|
|
int *A_h{nullptr}, *B_h{nullptr}, *C_h{nullptr};
|
|
|
|
// Initialization of Variables on GPU-0
|
|
HIP_CHECK(hipSetDevice(0));
|
|
HipTest::initArrays<int>(&A_d, &B_d, &C_d, &A_h, &B_h, &C_h, numElements * sizeof(int));
|
|
HIP_CHECK(hipMemcpy(A_d, A_h, numElements * sizeof(int), hipMemcpyHostToDevice));
|
|
HIP_CHECK(hipMemcpy(B_d, B_h, numElements * sizeof(int), hipMemcpyHostToDevice));
|
|
|
|
// Initialization of Variables on GPU-1
|
|
HIP_CHECK(hipSetDevice(1));
|
|
HipTest::initArrays<int>(&X_d, &Y_d, &Z_d, nullptr, nullptr, nullptr,
|
|
numElements * sizeof(int));
|
|
|
|
// Launching kernel and performing vector addition on GPU-0
|
|
HIP_CHECK(hipSetDevice(0));
|
|
hipLaunchKernelGGL(HipTest::vectorADD, dim3(1), dim3(1), 0, 0, static_cast<const int*>(A_d),
|
|
static_cast<const int*>(B_d), C_d, numElements * sizeof(int));
|
|
HIP_CHECK(hipGetLastError());
|
|
HIP_CHECK(hipMemcpy(C_h, C_d, numElements * sizeof(int), hipMemcpyDeviceToHost));
|
|
HipTest::checkVectorADD<int>(A_h, B_h, C_h, numElements);
|
|
|
|
HIP_CHECK(hipSetDevice(1));
|
|
// Copying data from GPU-0 to GPU-1 and performing vector addition
|
|
HIP_CHECK(hipMemcpyPeer(X_d, 1, A_d, 0, copy_bytes));
|
|
HIP_CHECK(hipMemcpyPeer(Y_d, 1, B_d, 0, copy_bytes));
|
|
hipLaunchKernelGGL(HipTest::vectorADD, dim3(1), dim3(1), 0, 0, static_cast<const int*>(X_d),
|
|
static_cast<const int*>(Y_d), Z_d, numElements * sizeof(int));
|
|
HIP_CHECK(hipGetLastError());
|
|
HIP_CHECK(hipMemcpy(C_h, Z_d, numElements * sizeof(int), hipMemcpyDeviceToHost));
|
|
HipTest::checkVectorADD<int>(A_h, B_h, C_h, numElements);
|
|
|
|
// Cleaning the memory
|
|
HipTest::freeArrays<int>(A_d, B_d, C_d, A_h, B_h, C_h, false);
|
|
HipTest::freeArrays<int>(X_d, Y_d, Z_d, nullptr, nullptr, nullptr, false);
|
|
} else {
|
|
SUCCEED("Machine Does not have P2P capability");
|
|
}
|
|
} else {
|
|
SUCCEED("Number of devices are < 2");
|
|
}
|
|
}
|