431c938938
Change-Id: I73d42a87797cf70c5ac6093bc308203eae5cca00
232 строки
8.5 KiB
C++
232 строки
8.5 KiB
C++
/*
|
||
Copyright (c) 2022 Advanced Micro Devices, Inc. All rights reserved.
|
||
Permission is hereby granted, free of charge, to any person obtaining a copy
|
||
of this software and associated documentation files (the "Software"), to deal
|
||
in the Software without restriction, including without limitation the rights
|
||
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
||
copies of the Software, and to permit persons to whom the Software is
|
||
furnished to do so, subject to the following conditions:
|
||
The above copyright notice and this permission notice shall be included in
|
||
all copies or substantial portions of the Software.
|
||
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANNTY OF ANY KIND, EXPRESS OR
|
||
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
||
FITNNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
||
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
||
LIABILITY, WHETHER INN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
||
OUT OF OR INN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
|
||
THE SOFTWARE.
|
||
*/
|
||
|
||
/**
|
||
|
||
Testcase Scenarios
|
||
------------------
|
||
Functional:
|
||
1) Start stream capture and get capture info. Verify api is success, capture status is hipStreamCaptureStatusActive
|
||
and identifier returned is valid/non-zero.
|
||
2) End stream capture and get capture info. Verify api is success, capture status is hipStreamCaptureStatusNone
|
||
and identifier is not returned/updated by api.
|
||
3) Begin capture on hipStreamPerThread and get capture info. Verify api is success, capture status is hipStreamCaptureStatusActive
|
||
and identifier returned is valid/non-zero.
|
||
4) End capture on hipStreamPerThread, get capture info. Verify api is success, capture status is hipStreamCaptureStatusNone
|
||
and identifier is not returned/updated by api.
|
||
5) Perform multiple captures and verify the identifier returned is unique.
|
||
|
||
Argument Validation/Negative:
|
||
1) Pass pId as nullptr and verify api doesn’t crash and returns success.
|
||
2) Pass pCaptureStatus as nullptr and verify api doesn’t crash and returns error code.
|
||
|
||
*/
|
||
|
||
#include <hip_test_common.hh>
|
||
#include <hip_test_checkers.hh>
|
||
#include <hip_test_kernels.hh>
|
||
|
||
constexpr size_t N = 1000000;
|
||
constexpr int LAUNCH_ITERS = 1;
|
||
|
||
/**
|
||
* Validates stream capture info, launches graph and verify results
|
||
*/
|
||
void validateStreamCaptureInfo(hipStream_t mstream) {
|
||
hipStream_t stream1{nullptr}, stream2{nullptr}, streamForLaunch{nullptr};
|
||
hipEvent_t memsetEvent1, memsetEvent2, forkStreamEvent;
|
||
hipGraph_t graph{nullptr};
|
||
hipGraphExec_t graphExec{nullptr};
|
||
constexpr unsigned blocks = 512;
|
||
constexpr unsigned threadsPerBlock = 256;
|
||
size_t Nbytes = N * sizeof(float);
|
||
float *A_d, *C_d;
|
||
float *A_h, *C_h;
|
||
A_h = reinterpret_cast<float*>(malloc(Nbytes));
|
||
C_h = reinterpret_cast<float*>(malloc(Nbytes));
|
||
REQUIRE(A_h != nullptr);
|
||
REQUIRE(C_h != nullptr);
|
||
HIP_CHECK(hipMalloc(&A_d, Nbytes));
|
||
HIP_CHECK(hipMalloc(&C_d, Nbytes));
|
||
REQUIRE(A_d != nullptr);
|
||
REQUIRE(C_d != nullptr);
|
||
HIP_CHECK(hipStreamCreate(&streamForLaunch));
|
||
|
||
// Initialize input buffer
|
||
for (size_t i = 0; i < N; ++i) {
|
||
A_h[i] = 3.146f + i; // Pi
|
||
}
|
||
|
||
// Create cross stream dependencies.
|
||
// memset operations are done on stream1 and stream2
|
||
// and they are joined back to mainstream
|
||
HIP_CHECK(hipStreamCreate(&stream1));
|
||
HIP_CHECK(hipStreamCreate(&stream2));
|
||
HIP_CHECK(hipEventCreate(&memsetEvent1));
|
||
HIP_CHECK(hipEventCreate(&memsetEvent2));
|
||
HIP_CHECK(hipEventCreate(&forkStreamEvent));
|
||
|
||
HIP_CHECK(hipStreamBeginCapture(mstream, hipStreamCaptureModeGlobal));
|
||
HIP_CHECK(hipEventRecord(forkStreamEvent, mstream));
|
||
HIP_CHECK(hipStreamWaitEvent(stream1, forkStreamEvent, 0));
|
||
HIP_CHECK(hipStreamWaitEvent(stream2, forkStreamEvent, 0));
|
||
HIP_CHECK(hipMemsetAsync(A_d, 0, Nbytes, stream1));
|
||
HIP_CHECK(hipEventRecord(memsetEvent1, stream1));
|
||
HIP_CHECK(hipMemsetAsync(C_d, 0, Nbytes, stream2));
|
||
HIP_CHECK(hipEventRecord(memsetEvent2, stream2));
|
||
HIP_CHECK(hipStreamWaitEvent(mstream, memsetEvent1, 0));
|
||
HIP_CHECK(hipStreamWaitEvent(mstream, memsetEvent2, 0));
|
||
HIP_CHECK(hipMemcpyAsync(A_d, A_h, Nbytes, hipMemcpyHostToDevice, mstream));
|
||
hipLaunchKernelGGL(HipTest::vector_square, dim3(blocks),
|
||
dim3(threadsPerBlock), 0, mstream, A_d, C_d, N);
|
||
|
||
hipStreamCaptureStatus captureStatus{hipStreamCaptureStatusNone};
|
||
unsigned long long capSequenceID = 0; // NOLINT
|
||
HIP_CHECK(hipStreamGetCaptureInfo(mstream, &captureStatus, &capSequenceID));
|
||
|
||
// verify capture status is active and sequence id is valid
|
||
REQUIRE(captureStatus == hipStreamCaptureStatusActive);
|
||
REQUIRE(capSequenceID > 0);
|
||
|
||
// End capture and verify graph is returned
|
||
HIP_CHECK(hipMemcpyAsync(C_h, C_d, Nbytes, hipMemcpyDeviceToHost, mstream));
|
||
HIP_CHECK(hipStreamEndCapture(mstream, &graph));
|
||
REQUIRE(graph != nullptr);
|
||
|
||
// verify capture status is inactive and sequence id is not updated
|
||
capSequenceID = 0;
|
||
HIP_CHECK(hipStreamGetCaptureInfo(mstream, &captureStatus, &capSequenceID));
|
||
REQUIRE(captureStatus == hipStreamCaptureStatusNone);
|
||
REQUIRE(capSequenceID == 0);
|
||
|
||
HIP_CHECK(hipGraphInstantiate(&graphExec, graph, nullptr, nullptr, 0));
|
||
REQUIRE(graphExec != nullptr);
|
||
|
||
// Replay the recorded sequence multiple times
|
||
for (int i = 0; i < LAUNCH_ITERS; i++) {
|
||
HIP_CHECK(hipGraphLaunch(graphExec, streamForLaunch));
|
||
}
|
||
|
||
HIP_CHECK(hipStreamSynchronize(streamForLaunch));
|
||
|
||
HIP_CHECK(hipGraphDestroy(graph));
|
||
HIP_CHECK(hipStreamDestroy(streamForLaunch));
|
||
HIP_CHECK(hipStreamDestroy(stream1));
|
||
HIP_CHECK(hipStreamDestroy(stream2));
|
||
HIP_CHECK(hipEventDestroy(forkStreamEvent));
|
||
HIP_CHECK(hipEventDestroy(memsetEvent1));
|
||
HIP_CHECK(hipEventDestroy(memsetEvent2));
|
||
HIP_CHECK(hipFree(A_d));
|
||
HIP_CHECK(hipFree(C_d));
|
||
|
||
// Validate the computation
|
||
for (size_t i = 0; i < N; i++) {
|
||
if (C_h[i] != A_h[i] * A_h[i]) {
|
||
INFO("A and C not matching at " << i << " C_h[i] " << C_h[i]
|
||
<< " A_h[i] " << A_h[i]);
|
||
REQUIRE(false);
|
||
}
|
||
}
|
||
free(A_h);
|
||
free(C_h);
|
||
}
|
||
|
||
/**
|
||
* Basic Functional Test for stream capture and getting capture info.
|
||
* Regular/custom stream is used for stream capture.
|
||
*/
|
||
TEST_CASE("Unit_hipStreamGetCaptureInfo_BasicFunctional") {
|
||
hipStream_t streamForCapture;
|
||
|
||
HIP_CHECK(hipStreamCreate(&streamForCapture));
|
||
validateStreamCaptureInfo(streamForCapture);
|
||
HIP_CHECK(hipStreamDestroy(streamForCapture));
|
||
}
|
||
|
||
/**
|
||
* Test performs stream capture on hipStreamPerThread and validates
|
||
* capture info.
|
||
*/
|
||
TEST_CASE("Unit_hipStreamGetCaptureInfo_hipStreamPerThread") {
|
||
validateStreamCaptureInfo(hipStreamPerThread);
|
||
}
|
||
|
||
/**
|
||
* Test starts stream capture on multiple streams and verifies uniqueness of
|
||
* identifiers returned.
|
||
*/
|
||
TEST_CASE("Unit_hipStreamGetCaptureInfo_UniqueID") {
|
||
constexpr int numStreams = 100;
|
||
hipStream_t streams[numStreams]{};
|
||
hipStreamCaptureStatus captureStatus{hipStreamCaptureStatusNone};
|
||
std::vector<int> idlist;
|
||
unsigned long long capSequenceID{}; // NOLINT
|
||
hipGraph_t graph{nullptr};
|
||
|
||
for (int i = 0; i < numStreams; i++) {
|
||
HIP_CHECK(hipStreamCreate(&streams[i]));
|
||
HIP_CHECK(hipStreamBeginCapture(streams[i], hipStreamCaptureModeGlobal));
|
||
HIP_CHECK(hipStreamGetCaptureInfo(streams[i], &captureStatus,
|
||
&capSequenceID));
|
||
REQUIRE(captureStatus == hipStreamCaptureStatusActive);
|
||
REQUIRE(capSequenceID > 0);
|
||
idlist.push_back(capSequenceID);
|
||
}
|
||
|
||
for (int i = 0; i < numStreams; i++) {
|
||
for (int j = i+1; j < numStreams; j++) {
|
||
if (idlist[i] == idlist[j]) {
|
||
INFO("Same identifier returned for stream "
|
||
<< i << " and stream " << j);
|
||
REQUIRE(false);
|
||
}
|
||
}
|
||
}
|
||
|
||
for (int i = 0; i < numStreams; i++) {
|
||
HIP_CHECK(hipStreamEndCapture(streams[i], &graph));
|
||
HIP_CHECK(hipGraphDestroy(graph));
|
||
HIP_CHECK(hipStreamDestroy(streams[i]));
|
||
}
|
||
}
|
||
|
||
/**
|
||
* Argument validation/Negative tests for api
|
||
*/
|
||
TEST_CASE("Unit_hipStreamGetCaptureInfo_ArgValidation") {
|
||
hipError_t ret;
|
||
hipStream_t stream;
|
||
hipStreamCaptureStatus captureStatus;
|
||
unsigned long long capSequenceID; // NOLINT
|
||
HIP_CHECK(hipStreamCreate(&stream));
|
||
|
||
SECTION("Capture ID location as nullptr") {
|
||
ret = hipStreamGetCaptureInfo(stream, &captureStatus, nullptr);
|
||
// Capture ID is optional
|
||
REQUIRE(ret == hipSuccess);
|
||
}
|
||
|
||
SECTION("Capture Status location as nullptr") {
|
||
ret = hipStreamGetCaptureInfo(stream, nullptr, &capSequenceID);
|
||
REQUIRE(ret == hipErrorInvalidValue);
|
||
}
|
||
|
||
HIP_CHECK(hipStreamDestroy(stream));
|
||
}
|