/* Copyright (c) 2022 Advanced Micro Devices, Inc. All rights reserved. Permission is hereby granted, free of charge, to any person obtaining a copy of this software and associated documentation files (the "Software"), to deal in the Software without restriction, including without limitation the rights to use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of the Software, and to permit persons to whom the Software is furnished to do so, subject to the following conditions: The above copyright notice and this permission notice shall be included in all copies or substantial portions of the Software. THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANNTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER INN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR INN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. */ /** Testcase Scenarios ------------------ Functional: 1) Start stream capture and get capture info. Verify api is success, capture status is hipStreamCaptureStatusActive and identifier returned is valid/non-zero. 2) End stream capture and get capture info. Verify api is success, capture status is hipStreamCaptureStatusNone and identifier is not returned/updated by api. 3) Begin capture on hipStreamPerThread and get capture info. Verify api is success, capture status is hipStreamCaptureStatusActive and identifier returned is valid/non-zero. 4) End capture on hipStreamPerThread, get capture info. Verify api is success, capture status is hipStreamCaptureStatusNone and identifier is not returned/updated by api. 5) Perform multiple captures and verify the identifier returned is unique. Argument Validation/Negative: 1) Pass pId as nullptr and verify api doesn’t crash and returns success. 2) Pass pCaptureStatus as nullptr and verify api doesn’t crash and returns error code. */ #include #include #include constexpr size_t N = 1000000; constexpr int LAUNCH_ITERS = 1; /** * Validates stream capture info, launches graph and verify results */ void validateStreamCaptureInfo(hipStream_t mstream) { hipStream_t stream1{nullptr}, stream2{nullptr}, streamForLaunch{nullptr}; hipEvent_t memsetEvent1, memsetEvent2, forkStreamEvent; hipGraph_t graph{nullptr}; hipGraphExec_t graphExec{nullptr}; constexpr unsigned blocks = 512; constexpr unsigned threadsPerBlock = 256; size_t Nbytes = N * sizeof(float); float *A_d, *C_d; float *A_h, *C_h; A_h = reinterpret_cast(malloc(Nbytes)); C_h = reinterpret_cast(malloc(Nbytes)); REQUIRE(A_h != nullptr); REQUIRE(C_h != nullptr); HIP_CHECK(hipMalloc(&A_d, Nbytes)); HIP_CHECK(hipMalloc(&C_d, Nbytes)); REQUIRE(A_d != nullptr); REQUIRE(C_d != nullptr); HIP_CHECK(hipStreamCreate(&streamForLaunch)); // Initialize input buffer for (size_t i = 0; i < N; ++i) { A_h[i] = 3.146f + i; // Pi } // Create cross stream dependencies. // memset operations are done on stream1 and stream2 // and they are joined back to mainstream HIP_CHECK(hipStreamCreate(&stream1)); HIP_CHECK(hipStreamCreate(&stream2)); HIP_CHECK(hipEventCreate(&memsetEvent1)); HIP_CHECK(hipEventCreate(&memsetEvent2)); HIP_CHECK(hipEventCreate(&forkStreamEvent)); HIP_CHECK(hipStreamBeginCapture(mstream, hipStreamCaptureModeGlobal)); HIP_CHECK(hipEventRecord(forkStreamEvent, mstream)); HIP_CHECK(hipStreamWaitEvent(stream1, forkStreamEvent, 0)); HIP_CHECK(hipStreamWaitEvent(stream2, forkStreamEvent, 0)); HIP_CHECK(hipMemsetAsync(A_d, 0, Nbytes, stream1)); HIP_CHECK(hipEventRecord(memsetEvent1, stream1)); HIP_CHECK(hipMemsetAsync(C_d, 0, Nbytes, stream2)); HIP_CHECK(hipEventRecord(memsetEvent2, stream2)); HIP_CHECK(hipStreamWaitEvent(mstream, memsetEvent1, 0)); HIP_CHECK(hipStreamWaitEvent(mstream, memsetEvent2, 0)); HIP_CHECK(hipMemcpyAsync(A_d, A_h, Nbytes, hipMemcpyHostToDevice, mstream)); hipLaunchKernelGGL(HipTest::vector_square, dim3(blocks), dim3(threadsPerBlock), 0, mstream, A_d, C_d, N); hipStreamCaptureStatus captureStatus{hipStreamCaptureStatusNone}; unsigned long long capSequenceID = 0; // NOLINT HIP_CHECK(hipStreamGetCaptureInfo(mstream, &captureStatus, &capSequenceID)); // verify capture status is active and sequence id is valid REQUIRE(captureStatus == hipStreamCaptureStatusActive); REQUIRE(capSequenceID > 0); // End capture and verify graph is returned HIP_CHECK(hipMemcpyAsync(C_h, C_d, Nbytes, hipMemcpyDeviceToHost, mstream)); HIP_CHECK(hipStreamEndCapture(mstream, &graph)); REQUIRE(graph != nullptr); // verify capture status is inactive and sequence id is not updated capSequenceID = 0; HIP_CHECK(hipStreamGetCaptureInfo(mstream, &captureStatus, &capSequenceID)); REQUIRE(captureStatus == hipStreamCaptureStatusNone); REQUIRE(capSequenceID == 0); HIP_CHECK(hipGraphInstantiate(&graphExec, graph, nullptr, nullptr, 0)); REQUIRE(graphExec != nullptr); // Replay the recorded sequence multiple times for (int i = 0; i < LAUNCH_ITERS; i++) { HIP_CHECK(hipGraphLaunch(graphExec, streamForLaunch)); } HIP_CHECK(hipStreamSynchronize(streamForLaunch)); HIP_CHECK(hipGraphDestroy(graph)); HIP_CHECK(hipStreamDestroy(streamForLaunch)); HIP_CHECK(hipStreamDestroy(stream1)); HIP_CHECK(hipStreamDestroy(stream2)); HIP_CHECK(hipEventDestroy(forkStreamEvent)); HIP_CHECK(hipEventDestroy(memsetEvent1)); HIP_CHECK(hipEventDestroy(memsetEvent2)); HIP_CHECK(hipFree(A_d)); HIP_CHECK(hipFree(C_d)); // Validate the computation for (size_t i = 0; i < N; i++) { if (C_h[i] != A_h[i] * A_h[i]) { INFO("A and C not matching at " << i << " C_h[i] " << C_h[i] << " A_h[i] " << A_h[i]); REQUIRE(false); } } free(A_h); free(C_h); } /** * Basic Functional Test for stream capture and getting capture info. * Regular/custom stream is used for stream capture. */ TEST_CASE("Unit_hipStreamGetCaptureInfo_BasicFunctional") { hipStream_t streamForCapture; HIP_CHECK(hipStreamCreate(&streamForCapture)); validateStreamCaptureInfo(streamForCapture); HIP_CHECK(hipStreamDestroy(streamForCapture)); } /** * Test performs stream capture on hipStreamPerThread and validates * capture info. */ TEST_CASE("Unit_hipStreamGetCaptureInfo_hipStreamPerThread") { validateStreamCaptureInfo(hipStreamPerThread); } /** * Test starts stream capture on multiple streams and verifies uniqueness of * identifiers returned. */ TEST_CASE("Unit_hipStreamGetCaptureInfo_UniqueID") { constexpr int numStreams = 100; hipStream_t streams[numStreams]{}; hipStreamCaptureStatus captureStatus{hipStreamCaptureStatusNone}; std::vector idlist; unsigned long long capSequenceID{}; // NOLINT hipGraph_t graph{nullptr}; for (int i = 0; i < numStreams; i++) { HIP_CHECK(hipStreamCreate(&streams[i])); HIP_CHECK(hipStreamBeginCapture(streams[i], hipStreamCaptureModeGlobal)); HIP_CHECK(hipStreamGetCaptureInfo(streams[i], &captureStatus, &capSequenceID)); REQUIRE(captureStatus == hipStreamCaptureStatusActive); REQUIRE(capSequenceID > 0); idlist.push_back(capSequenceID); } for (int i = 0; i < numStreams; i++) { for (int j = i+1; j < numStreams; j++) { if (idlist[i] == idlist[j]) { INFO("Same identifier returned for stream " << i << " and stream " << j); REQUIRE(false); } } } for (int i = 0; i < numStreams; i++) { HIP_CHECK(hipStreamEndCapture(streams[i], &graph)); HIP_CHECK(hipGraphDestroy(graph)); HIP_CHECK(hipStreamDestroy(streams[i])); } } /** * Argument validation/Negative tests for api */ TEST_CASE("Unit_hipStreamGetCaptureInfo_ArgValidation") { hipError_t ret; hipStream_t stream; hipStreamCaptureStatus captureStatus; unsigned long long capSequenceID; // NOLINT HIP_CHECK(hipStreamCreate(&stream)); SECTION("Capture ID location as nullptr") { ret = hipStreamGetCaptureInfo(stream, &captureStatus, nullptr); // Capture ID is optional REQUIRE(ret == hipSuccess); } SECTION("Capture Status location as nullptr") { ret = hipStreamGetCaptureInfo(stream, nullptr, &capSequenceID); REQUIRE(ret == hipErrorInvalidValue); } HIP_CHECK(hipStreamDestroy(stream)); }