/* Copyright (c) 2022 Advanced Micro Devices, Inc. All rights reserved. Permission is hereby granted, free of charge, to any person obtaining a copy of this software and associated documentation files (the "Software"), to deal in the Software without restriction, including without limitation the rights to use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of the Software, and to permit persons to whom the Software is furnished to do so, subject to the following conditions: The above copyright notice and this permission notice shall be included in all copies or substantial portions of the Software. THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANNTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER INN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR INN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. */ /** Testcase Scenarios of hipGraphAddHostNode API: Functional: 1. Creates graph, Adds HostNode which updates the variable and validates the result 2. Create graph, Add Graphnodes and clones the graph. Add Hostnode to the cloned graph and validate the result 3. Creates graph which performs the square of number in the kernel function and the result is validated in the callback function of hipGraphAddHostNode API Negative: 1) Pass pGraphNode as nullptr and verify api doesn’t crash, returns error code. 2) Pass graph as nullptr and verify api doesn’t crash, returns error code. 3) Pass pNodeParams as nullptr and verify api doesn’t crash, returns error code. 4) Pass hipHostNodeParams::hipHostFn_t as nullptr and verify api doesn't crash, returns error code. */ #include #include #define SIZE 1024 static int *B_h; static int *D_h; static void callbackfunc(void *A_h) { int *A = reinterpret_cast(A_h); for (int i = 0; i < SIZE; i++) { A[i] = i; } } static void __global__ vector_square(int *B_d, int *D_d) { for (int i = 0; i < SIZE; i++) { D_d[i] = B_d[i] * B_d[i]; } } static void vectorsquare_callback(void* ptr) { // The callback func is not working with zero parameters // Temporary fix for adding the below 2 lines and ticket // has been raised for the same. int *A = reinterpret_cast(ptr); A++; for (int i = 0; i < SIZE; i++) { if (D_h[i] != B_h[i] * B_h[i]) { INFO("Validation failed " << D_h[i] << B_h[i]); REQUIRE(false); } } } /* This testcase verifies the negative scenarios of hipGraphAddHostNode API */ TEST_CASE("Unit_hipGraphAddHostNode_Negative") { constexpr size_t N = 1024; hipGraph_t graph; int *A_d{nullptr}, *C_d{nullptr}; int *A_h{nullptr}, *C_h{nullptr}; HipTest::initArrays(&A_d, nullptr, &C_d, &A_h, nullptr, &C_h, N, false); HIP_CHECK(hipGraphCreate(&graph, 0)); hipGraphNode_t hostNode; hipHostNodeParams hostParams = {0, 0}; hostParams.fn = callbackfunc; hostParams.userData = A_h; SECTION("Passing nullptr to graph node") { REQUIRE(hipGraphAddHostNode(nullptr, graph, nullptr, 0, &hostParams) == hipErrorInvalidValue); } SECTION("Passing nullptr to graph") { REQUIRE(hipGraphAddHostNode(&hostNode, nullptr, nullptr, 0, &hostParams) == hipErrorInvalidValue); } #if HT_NVIDIA SECTION("Passing nullptr to host params") { REQUIRE(hipGraphAddHostNode(&hostNode, graph, nullptr, 0, nullptr) == hipErrorInvalidValue); } #endif SECTION("Passing nullptr to host func") { hostParams.fn = nullptr; REQUIRE(hipGraphAddHostNode(&hostNode, graph, nullptr, 0, &hostParams) == hipErrorInvalidValue); } HIP_CHECK(hipGraphDestroy(graph)); } /* This testcase verifies hipGraphAddHostNode API in cloned graph Creates graph, Add graph nodes and clone the graph Add HostNode to the cloned graph and validate the result */ TEST_CASE("Unit_hipGraphAddHostNode_ClonedGraphwithHostNode") { constexpr size_t N = 1024; constexpr size_t Nbytes = N * sizeof(int); hipGraph_t graph; hipGraphExec_t graphExec; int *A_d{nullptr}, *C_d{nullptr}; int *A_h{nullptr}, *C_h{nullptr}; HipTest::initArrays(&A_d, nullptr, &C_d, &A_h, nullptr, &C_h, N, false); HIP_CHECK(hipGraphCreate(&graph, 0)); hipGraphNode_t memcpyH2D_A, memcpyH2D_C, memcpyD2H_AC; hipStream_t streamForGraph; HIP_CHECK(hipStreamCreate(&streamForGraph)); HIP_CHECK(hipGraphAddMemcpyNode1D(&memcpyH2D_A, graph, nullptr, 0, A_d, A_h, Nbytes, hipMemcpyHostToDevice)); HIP_CHECK(hipGraphAddMemcpyNode1D(&memcpyH2D_C, graph, nullptr, 0, C_d, C_h, Nbytes, hipMemcpyHostToDevice)); HIP_CHECK(hipGraphAddMemcpyNode1D(&memcpyD2H_AC, graph, nullptr, 0, A_h, C_d, Nbytes, hipMemcpyDeviceToHost)); hipGraph_t clonedgraph; HIP_CHECK(hipGraphClone(&clonedgraph, graph)); hipGraphNode_t hostNode; hipHostNodeParams hostParams = {0, 0}; hostParams.fn = callbackfunc; hostParams.userData = A_h; HIP_CHECK(hipGraphAddHostNode(&hostNode, clonedgraph, nullptr, 0, &hostParams)); HIP_CHECK(hipGraphAddDependencies(graph, &memcpyH2D_A, &memcpyD2H_AC, 1)); HIP_CHECK(hipGraphAddDependencies(graph, &memcpyH2D_C, &memcpyD2H_AC, 1)); // Instantiate and launch the cloned graph HIP_CHECK(hipGraphInstantiate(&graphExec, clonedgraph, nullptr, nullptr, 0)); HIP_CHECK(hipGraphLaunch(graphExec, streamForGraph)); HIP_CHECK(hipStreamSynchronize(streamForGraph)); // Verify execution result for (size_t i = 0; i < N; i++) { if (A_h[i] != static_cast(i)) { INFO("Validation failed i " << i << "C_h[i] "<< C_h[i]); REQUIRE(false); } } HipTest::freeArrays(A_d, nullptr, C_d, A_h, nullptr, C_h, false); HIP_CHECK(hipGraphExecDestroy(graphExec)); HIP_CHECK(hipGraphDestroy(graph)); HIP_CHECK(hipGraphDestroy(clonedgraph)); HIP_CHECK(hipStreamDestroy(streamForGraph)); } /* This testcase verifies the square of number by creating graph, Add kernel node which does the square of number and the result is validated byhipGrahAddHostNode API */ TEST_CASE("Unit_hipGraphAddHostNode_VectorSquare") { constexpr size_t N = 1024; constexpr size_t Nbytes = N * sizeof(int); hipGraph_t graph; hipGraphExec_t graphExec; int *A_d{nullptr}, *A_h{nullptr}, *B_d{nullptr}, *D_d{nullptr}; int *param = reinterpret_cast(sizeof(int));; HipTest::initArrays(&A_d, &B_d, &D_d, &A_h, &B_h, &D_h, N, false); HIP_CHECK(hipGraphCreate(&graph, 0)); hipGraphNode_t memcpyH2D_B, memcpyH2D_D, memcpyD2H_D, kernel_vecAdd; hipKernelNodeParams kernelNodeParams{}; hipStream_t streamForGraph; HIP_CHECK(hipStreamCreate(&streamForGraph)); hipGraphNode_t hostNode; hipHostNodeParams hostParams = {0, 0}; hostParams.fn = vectorsquare_callback; hostParams.userData = param; HIP_CHECK(hipGraphAddMemcpyNode1D(&memcpyH2D_B, graph, nullptr, 0, B_d, B_h, Nbytes, hipMemcpyHostToDevice)); HIP_CHECK(hipGraphAddMemcpyNode1D(&memcpyH2D_D, graph, nullptr, 0, D_d, D_h, Nbytes, hipMemcpyHostToDevice)); void* kernelArgs2[] = {&B_d, &D_d}; kernelNodeParams.func = reinterpret_cast(vector_square); kernelNodeParams.gridDim = dim3(1); kernelNodeParams.blockDim = dim3(1); kernelNodeParams.sharedMemBytes = 0; kernelNodeParams.kernelParams = reinterpret_cast(kernelArgs2); kernelNodeParams.extra = nullptr; HIP_CHECK(hipGraphAddKernelNode(&kernel_vecAdd, graph, nullptr, 0, &kernelNodeParams)); HIP_CHECK(hipGraphAddMemcpyNode1D(&memcpyD2H_D, graph, nullptr, 0, D_h, D_d, Nbytes, hipMemcpyDeviceToHost)); HIP_CHECK(hipGraphAddHostNode(&hostNode, graph, nullptr, 0, &hostParams)); HIP_CHECK(hipGraphAddDependencies(graph, &memcpyH2D_B, &kernel_vecAdd, 1)); HIP_CHECK(hipGraphAddDependencies(graph, &memcpyH2D_D, &kernel_vecAdd, 1)); HIP_CHECK(hipGraphAddDependencies(graph, &kernel_vecAdd, &memcpyD2H_D, 1)); HIP_CHECK(hipGraphAddDependencies(graph, &memcpyD2H_D, &hostNode, 1)); // Instantiate and launch the graph HIP_CHECK(hipGraphInstantiate(&graphExec, graph, nullptr, nullptr, 0)); HIP_CHECK(hipGraphLaunch(graphExec, streamForGraph)); HIP_CHECK(hipStreamSynchronize(streamForGraph)); HipTest::freeArrays(A_d, B_d, D_d, A_h, B_h, D_h, false); HIP_CHECK(hipGraphExecDestroy(graphExec)); HIP_CHECK(hipGraphDestroy(graph)); HIP_CHECK(hipStreamDestroy(streamForGraph)); } /* This testcase verifies the following scenario Create graph, calls the host function and updates the parameters in the callback function and validates it. */ TEST_CASE("Unit_hipGraphAddHostNode_BasicFunc") { constexpr size_t N = 1024; constexpr size_t Nbytes = N * sizeof(int); hipGraph_t graph; hipGraphExec_t graphExec; int *A_d{nullptr}, *C_d{nullptr}; int *A_h{nullptr}, *C_h{nullptr}; HipTest::initArrays(&A_d, nullptr, &C_d, &A_h, nullptr, &C_h, N, false); HIP_CHECK(hipGraphCreate(&graph, 0)); hipGraphNode_t memcpyH2D_A, memcpyD2H_AC, memcpyH2D_C; hipStream_t streamForGraph; HIP_CHECK(hipStreamCreate(&streamForGraph)); HIP_CHECK(hipGraphAddMemcpyNode1D(&memcpyH2D_A, graph, nullptr, 0, A_d, A_h, Nbytes, hipMemcpyHostToDevice)); HIP_CHECK(hipGraphAddMemcpyNode1D(&memcpyH2D_C, graph, nullptr, 0, C_d, C_h, Nbytes, hipMemcpyHostToDevice)); HIP_CHECK(hipGraphAddMemcpyNode1D(&memcpyD2H_AC, graph, nullptr, 0, A_h, C_d, Nbytes, hipMemcpyDeviceToHost)); hipGraphNode_t hostNode; hipHostNodeParams hostParams = {0, 0}; hostParams.fn = callbackfunc; hostParams.userData = A_h; HIP_CHECK(hipGraphAddHostNode(&hostNode, graph, nullptr, 0, &hostParams)); HIP_CHECK(hipGraphAddDependencies(graph, &memcpyH2D_A, &memcpyD2H_AC, 1)); HIP_CHECK(hipGraphAddDependencies(graph, &memcpyH2D_C, &memcpyD2H_AC, 1)); HIP_CHECK(hipGraphAddDependencies(graph, &memcpyD2H_AC, &hostNode, 1)); // Instantiate and launch the graph HIP_CHECK(hipGraphInstantiate(&graphExec, graph, nullptr, nullptr, 0)); HIP_CHECK(hipGraphLaunch(graphExec, streamForGraph)); HIP_CHECK(hipStreamSynchronize(streamForGraph)); // Verify execution result for (size_t i = 0; i < N; i++) { if (A_h[i] != static_cast(i)) { INFO("Validation failed i " << i << "A_h[i] "<< A_h[i]); REQUIRE(false); } } HipTest::freeArrays(A_d, nullptr, C_d, A_h, nullptr, C_h, false); HIP_CHECK(hipGraphExecDestroy(graphExec)); HIP_CHECK(hipGraphDestroy(graph)); HIP_CHECK(hipStreamDestroy(streamForGraph)); }