Added compiler flag for Polaris

Change-Id: Ib14c14c0618982ac7b48f5bc704c04b54ff40ed9


[ROCm/hip commit: 90a71c4be4]
This commit is contained in:
Aditya Atluri
2016-10-13 14:16:48 -05:00
parent 252e32859e
commit d06509f680
3 changed files with 10 additions and 8 deletions
+3
View File
@@ -119,6 +119,9 @@ if ($HIP_PLATFORM eq "hcc") {
# Pick the -amdgpu-target value for the selected ROCm target and append it
# to the linker flags. Targets not listed here leave $HIPLDFLAGS untouched.
my %amdgpu_target_for = (
    "hawaii"  => "AMD:AMDGPU:7:0:1",
    "polaris" => "AMD:AMDGPU:8:0:3",
);
if (exists $amdgpu_target_for{$ROCM_TARGET}) {
    $HIPLDFLAGS .= " -amdgpu-target=" . $amdgpu_target_for{$ROCM_TARGET};
}
# Add trace marker library:
# TODO - once we cleanly separate the HIP API headers from the HIP library headers, this logic should move to a CMake build option - apps do not need to see the marker library.
@@ -34,13 +34,6 @@ typedef struct __attribute__((aligned(4))){
/* Unprefixed aliases for the __half and __half2 types. */
typedef __half half;
typedef __half2 half2;
/*
 * struct_float wraps an anonymous union, so the same storage can be accessed
 * either as a float (member f) or as an unsigned integer (member u).
 * NOTE(review): presumably used to read or build the raw bits of a float;
 * that relies on float and unsigned having the same size - confirm for the
 * supported targets.
 */
typedef struct{
union{
float f;
unsigned u;
};
} struct_float;
/*
Arithmetic functions
*/
+7 -1
View File
@@ -25,6 +25,13 @@ static const __half __half_value_zero_float = {0x0};
/*
 * 16-bit patterns with bits 10-14 all set and bits 0-9 clear; the two values
 * differ only in bit 15.
 * NOTE(review): presumably the IEEE 754 binary16 encodings of +infinity and
 * -infinity - confirm against the __half bit layout.
 */
static const unsigned __half_pos_inf = 0x7C00;
static const unsigned __half_neg_inf = 0xFC00;
/*
 * struct_float wraps an anonymous union, so the same storage can be accessed
 * either as a float (member f) or as an unsigned integer (member u).
 * cvt_half_to_float zero-initialises one of these as its working value.
 * NOTE(review): presumably used to build the raw bits of a float; that relies
 * on float and unsigned having the same size - confirm for the supported
 * targets.
 */
typedef struct{
union{
float f;
unsigned u;
};
} struct_float;
static __device__ float cvt_half_to_float(__half a){
struct_float ret = {0};
if(a.x == 0){
@@ -362,4 +369,3 @@ __device__ __half2 __lowhigh2highlow(const __half2 a){
/*
 * Builds a __half2 whose first initialiser is a.q and whose second is b.q,
 * and returns it by value.
 * NOTE(review): the name suggests the "low" half of each input is combined;
 * confirm that q is the low half in the __half2 layout.
 */
__device__ __half2 __low2half2(const __half2 a, const __half2 b){
    __half2 combined = {a.q, b.q};
    return combined;
}