bb791d8e86
Change-Id: I4e51bb999f43c4f304ed4712dadc3fc1aae3f7a4
104 строки
4.2 KiB
C++
104 строки
4.2 KiB
C++
/*
|
|
Copyright (c) 2022 Advanced Micro Devices, Inc. All rights reserved.
|
|
Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
of this software and associated documentation files (the "Software"), to deal
|
|
in the Software without restriction, including without limitation the rights
|
|
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
copies of the Software, and to permit persons to whom the Software is
|
|
furnished to do so, subject to the following conditions:
|
|
The above copyright notice and this permission notice shall be included in
|
|
all copies or substantial portions of the Software.
|
|
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
|
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
|
|
THE SOFTWARE.
|
|
*/
|
|
/*
|
|
Testcase Scenarios :
|
|
Unit_hipModuleOccupancyMaxActiveBlocksPerMultiprocessorWithFlags_Positive_RangeValidation - Test
|
|
correct execution of hipModuleOccupancyMaxActiveBlocksPerMultiprocessorWithFlags for different
|
|
parameter values
|
|
Unit_hipModuleOccupancyMaxActiveBlocksPerMultiprocessorWithFlags_Negative_Parameters - Test
|
|
unsuccessful execution of hipModuleOccupancyMaxActiveBlocksPerMultiprocessorWithFlags API when
|
|
parameters are invalid
|
|
*/
|
|
#include "occupancy_common.hh"
|
|
|
|
/**
 * Negative-parameter test for
 * hipModuleOccupancyMaxActiveBlocksPerMultiprocessorWithFlags.
 *
 * Steps:
 *  1. Load the module "simple_kernel.code" and look up the function "SimpleKernel".
 *  2. Query a block size with hipModuleOccupancyMaxPotentialBlockSize
 *     (dynamic shared memory = 0, block size limit = 0).
 *  3. Hand a wrapper around the API under test (always called with hipOccupancyDefault) to
 *     MaxActiveBlocksPerMultiprocessorNegative, a helper defined outside this file, together
 *     with the queried block size.
 *  4. In its own SECTION, call the API with flag value 2 and expect hipErrorInvalidValue.
 *  5. Unload the module.
 */
TEST_CASE("Unit_hipModuleOccupancyMaxActiveBlocksPerMultiprocessorWithFlags_Negative_Parameters") {
  hipModule_t module;
  hipFunction_t function;
  int numBlocks = 0;
  int blockSize = 0;
  int gridSize = 0;

  // NOTE(review): presumably issued to force runtime initialization before the module API
  // is used - confirm.
  HIP_CHECK(hipFree(nullptr));

  HIP_CHECK(hipModuleLoad(&module, "simple_kernel.code"));
  // Uses HIP_CHECK like every other call in this test so failures are reported uniformly.
  HIP_CHECK(hipModuleGetFunction(&function, module, "SimpleKernel"));

  // Get potential blocksize
  HIP_CHECK(hipModuleOccupancyMaxPotentialBlockSize(&gridSize, &blockSize, function, 0, 0));

  // Common negative tests
  MaxActiveBlocksPerMultiprocessorNegative(
      [&function](int* numBlocks, int blockSize, size_t dynSharedMemPerBlk) {
        return hipModuleOccupancyMaxActiveBlocksPerMultiprocessorWithFlags(
            numBlocks, function, blockSize, dynSharedMemPerBlk, hipOccupancyDefault);
      },
      blockSize);

  SECTION("Flag is invalid") {
    // Only default flag is supported
    HIP_CHECK_ERROR(hipModuleOccupancyMaxActiveBlocksPerMultiprocessorWithFlags(
                        &numBlocks, function, blockSize, 0, 2),
                    hipErrorInvalidValue);
  }

  HIP_CHECK(hipModuleUnload(module));
}
|
|
|
|
/**
 * Positive range-validation test for
 * hipModuleOccupancyMaxActiveBlocksPerMultiprocessorWithFlags.
 *
 * Loads "SimpleKernel" from the module "simple_kernel.code", reads the properties of device 0,
 * and then, in two separate SECTIONs, queries a block size with
 * hipModuleOccupancyMaxPotentialBlockSize and passes a wrapper around the API under test to
 * MaxActiveBlocksPerMultiprocessor (a helper defined outside this file) together with the
 * block size and devProp.maxThreadsPerMultiProcessor:
 *  - "dynSharedMemPerBlk = 0": no dynamic shared memory requested.
 *  - "dynSharedMemPerBlk = sharedMemPerBlock": dynamic shared memory set to
 *    devProp.sharedMemPerBlock.
 * The module is unloaded at the end.
 */
TEST_CASE(
    "Unit_hipModuleOccupancyMaxActiveBlocksPerMultiprocessorWithFlags_Positive_RangeValidation") {
  hipDeviceProp_t devProp;
  hipModule_t module;
  hipFunction_t function;
  int blockSize = 0;
  int gridSize = 0;

  // NOTE(review): presumably issued to force runtime initialization before the module API
  // is used - confirm.
  HIP_CHECK(hipFree(nullptr));

  HIP_CHECK(hipModuleLoad(&module, "simple_kernel.code"));
  // Uses HIP_CHECK like every other call in this test so failures are reported uniformly.
  HIP_CHECK(hipModuleGetFunction(&function, module, "SimpleKernel"));

  HIP_CHECK(hipGetDeviceProperties(&devProp, 0));

  SECTION("dynSharedMemPerBlk = 0") {
    // Get potential blocksize
    HIP_CHECK(hipModuleOccupancyMaxPotentialBlockSize(&gridSize, &blockSize, function, 0, 0));

    MaxActiveBlocksPerMultiprocessor(
        [blockSize, &function](int* numBlocks) {
          return hipModuleOccupancyMaxActiveBlocksPerMultiprocessorWithFlags(
              numBlocks, function, blockSize, 0, hipOccupancyDefault);
        },
        blockSize, devProp.maxThreadsPerMultiProcessor);
  }

  SECTION("dynSharedMemPerBlk = sharedMemPerBlock") {
    // Get potential blocksize
    HIP_CHECK(hipModuleOccupancyMaxPotentialBlockSize(&gridSize, &blockSize, function,
                                                      devProp.sharedMemPerBlock, 0));

    MaxActiveBlocksPerMultiprocessor(
        // devProp is captured by reference, as function already is, to avoid copying the
        // whole device-properties struct into the closure.
        [blockSize, &devProp, &function](int* numBlocks) {
          return hipModuleOccupancyMaxActiveBlocksPerMultiprocessorWithFlags(
              numBlocks, function, blockSize, devProp.sharedMemPerBlock, hipOccupancyDefault);
        },
        blockSize, devProp.maxThreadsPerMultiProcessor);
  }

  HIP_CHECK(hipModuleUnload(module));
}
|