60e1733afe
module_api_global relies on an HCC-only feature that allows host code to write directly to device variables. This feature does not exist in CUDA or hip-clang, so the sample does not work with either of them. This patch fixes the sample by using standard features of CUDA and hip-clang. The fixed sample works with HCC, CUDA, and hip-clang.
39 righe
1.5 KiB
C++
39 righe
1.5 KiB
C++
/*
|
|
Copyright (c) 2017-present Advanced Micro Devices, Inc. All rights reserved.
|
|
|
|
Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
of this software and associated documentation files (the "Software"), to deal
|
|
in the Software without restriction, including without limitation the rights
|
|
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
copies of the Software, and to permit persons to whom the Software is
|
|
furnished to do so, subject to the following conditions:
|
|
|
|
The above copyright notice and this permission notice shall be included in
|
|
all copies or substantial portions of the Software.
|
|
|
|
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
|
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
|
|
THE SOFTWARE.
|
|
*/
|
|
|
|
#include "hip/hip_runtime.h"
|
|
|
|
#define ARRAY_SIZE (16)
|
|
|
|
__device__ float myDeviceGlobal;
|
|
__device__ float myDeviceGlobalArray[16];
|
|
|
|
// Copies one float per thread from `a` to `b`.
//
// The element index is the thread's x index within its block only, so every
// block touches the same elements. No bounds check is performed: both buffers
// must hold at least as many floats as there are threads along x in a block.
// Declared extern "C" so the symbol name is not mangled.
extern "C" __global__ void hello_world(const float* a, float* b) {
    const int tid = hipThreadIdx_x;
    const float value = a[tid];
    b[tid] = value;
}
|
|
|
|
// Writes b[i] = a[i] + myDeviceGlobal + myDeviceGlobalArray[i % ARRAY_SIZE],
// where i is the thread's x index within its block.
//
// No bounds check is performed on `a` or `b`: both must hold at least as many
// floats as there are threads along x in a block. The array index is wrapped
// with ARRAY_SIZE, so the global array read stays in range for any thread
// index. Declared extern "C" so the symbol name is not mangled.
extern "C" __global__ void test_globals(const float* a, float* b) {
    const int tid = hipThreadIdx_x;
    const float scalarTerm = myDeviceGlobal;
    const float arrayTerm = myDeviceGlobalArray[tid % ARRAY_SIZE];
    // Keep the original left-to-right summation order.
    b[tid] = (a[tid] + scalarTerm) + arrayTerm;
}
|