65a428aaff
* test fixes
* address PR comment
* PR comment fixing Nvidia pass
* add additional kernel launch checks
* pr comments
[ROCm/hip-tests commit: da453211ed]
104 líneas
3.9 KiB
C++
104 líneas
3.9 KiB
C++
/*
|
|
Copyright (c) 2021 Advanced Micro Devices, Inc. All rights reserved.
|
|
|
|
Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
of this software and associated documentation files (the "Software"), to deal
|
|
in the Software without restriction, including without limitation the rights
|
|
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
copies of the Software, and to permit persons to whom the Software is
|
|
furnished to do so, subject to the following conditions:
|
|
|
|
The above copyright notice and this permission notice shall be included in
|
|
all copies or substantial portions of the Software.
|
|
|
|
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
|
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
|
|
THE SOFTWARE.
|
|
*/
|
|
|
|
#include <hip_test_common.hh>
|
|
|
|
#include <stdio.h>
|
|
#include <algorithm>
|
|
#include <stdlib.h>
|
|
#include <hip/hip_runtime.h>
|
|
#include <hip/device_functions.h>
|
|
|
|
__global__ void HIP_kernel(unsigned int* mbcnt_lo, unsigned int* mbcnt_hi, unsigned int* lane_id) {
|
|
int x = blockDim.x * blockIdx.x + threadIdx.x;
|
|
mbcnt_lo[x] = __builtin_amdgcn_mbcnt_lo(0xFFFFFFFF, 0);
|
|
mbcnt_hi[x] = __builtin_amdgcn_mbcnt_hi(0xFFFFFFFF, 0);
|
|
lane_id[x] = __lane_id();
|
|
}
|
|
|
|
|
|
TEST_CASE("Unit_mbcnt") {
|
|
using namespace std;
|
|
unsigned int* device_mbcnt_lo;
|
|
unsigned int* device_mbcnt_hi;
|
|
unsigned int* device_lane_id;
|
|
|
|
hipDeviceProp_t devProp;
|
|
HIP_CHECK(hipGetDeviceProperties(&devProp, 0));
|
|
INFO("System minor : " << devProp.minor);
|
|
INFO("System major : " << devProp.major);
|
|
INFO("agent prop name : " << devProp.name);
|
|
|
|
INFO("hip Device prop succeeded");
|
|
|
|
constexpr unsigned int num_waves_per_block = 2;
|
|
const unsigned int wave_size = devProp.warpSize;
|
|
const unsigned int num_threads_per_block = wave_size * num_waves_per_block;
|
|
const unsigned int num_blocks = 2;
|
|
const unsigned int num_threads = num_threads_per_block * num_blocks;
|
|
const size_t buffer_size = num_threads * sizeof(unsigned int);
|
|
|
|
HIP_CHECK(hipMalloc((void**)&device_mbcnt_lo, buffer_size));
|
|
HIP_CHECK(hipMalloc((void**)&device_mbcnt_hi, buffer_size));
|
|
HIP_CHECK(hipMalloc((void**)&device_lane_id, buffer_size));
|
|
|
|
hipLaunchKernelGGL(HIP_kernel, dim3(num_blocks), dim3(num_threads_per_block), 0, 0,
|
|
device_mbcnt_lo, device_mbcnt_hi, device_lane_id);
|
|
HIP_CHECK(hipGetLastError());
|
|
unsigned int* host_mbcnt_lo = (unsigned int*)malloc(buffer_size);
|
|
unsigned int* host_mbcnt_hi = (unsigned int*)malloc(buffer_size);
|
|
unsigned int* host_lane_id = (unsigned int*)malloc(buffer_size);
|
|
|
|
HIP_CHECK(hipMemcpy(host_mbcnt_lo, device_mbcnt_lo, buffer_size, hipMemcpyDeviceToHost));
|
|
HIP_CHECK(hipMemcpy(host_mbcnt_hi, device_mbcnt_hi, buffer_size, hipMemcpyDeviceToHost));
|
|
HIP_CHECK(hipMemcpy(host_lane_id, device_lane_id, buffer_size, hipMemcpyDeviceToHost));
|
|
|
|
// verify the results
|
|
int mbcnt_lo_errors = 0;
|
|
int mbcnt_hi_errors = 0;
|
|
int lane_id_errors = 0;
|
|
for (unsigned int i = 0; i < num_threads; i++) {
|
|
unsigned int this_lane_id = i % wave_size;
|
|
unsigned int this_mbcnt_lo = this_lane_id >= 32 ? 32 : this_lane_id;
|
|
unsigned int this_mbcnt_hi = this_lane_id < 32 ? 0 : (this_lane_id - 32);
|
|
|
|
if (host_mbcnt_lo[i] != this_mbcnt_lo) mbcnt_lo_errors++;
|
|
|
|
if (host_mbcnt_hi[i] != this_mbcnt_hi) mbcnt_hi_errors++;
|
|
|
|
if (host_lane_id[i] != this_lane_id) lane_id_errors++;
|
|
}
|
|
|
|
|
|
HIP_CHECK(hipFree(device_mbcnt_lo));
|
|
HIP_CHECK(hipFree(device_mbcnt_hi));
|
|
HIP_CHECK(hipFree(device_lane_id));
|
|
|
|
free(host_mbcnt_lo);
|
|
free(host_mbcnt_hi);
|
|
free(host_lane_id);
|
|
|
|
REQUIRE(mbcnt_lo_errors == 0);
|
|
REQUIRE(mbcnt_hi_errors == 0);
|
|
REQUIRE(lane_id_errors == 0);
|
|
}
|