b723169ee9
1. All fp32 and fp64 math device/host functions should be in math_functions.h/.cpp. 2. All fp32 and fp64 fast-math intrinsics for device/host functions should be in device_functions.h/.cpp. 3. All device code implementations should be in device_util.h/.cpp. 4. Accordingly, moved code and created new header files. 5. Added math_functions.cpp/.h. 6. Changed the #ifndef signatures to avoid conflicts between headers with the same name in hip/hip_runtime.h and hip/hcc_detail/hip_runtime.h. 7. Updated the tests to match the code changes so that they include the appropriate headers. 8. Added math_functions.cpp to CMakeLists.txt. 9. Some of the tests are still broken, mostly those for host math functions; they will be fixed in the next commit. 10. TODO: fix compilation issues for host math functions. Change-Id: I7a17637d7e294a7d224ffba932c1a08668febd26
83 lines
2.9 KiB
C++
83 lines
2.9 KiB
C++
/*
|
|
Copyright (c) 2015-2016 Advanced Micro Devices, Inc. All rights reserved.
|
|
|
|
Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
of this software and associated documentation files (the "Software"), to deal
|
|
in the Software without restriction, including without limitation the rights
|
|
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
copies of the Software, and to permit persons to whom the Software is
|
|
furnished to do so, subject to the following conditions:
|
|
|
|
The above copyright notice and this permission notice shall be included in
|
|
all copies or substantial portions of the Software.
|
|
|
|
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
|
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
|
|
THE SOFTWARE.
|
|
*/
|
|
|
|
/* HIT_START
|
|
* BUILD: %t %s
|
|
* RUN: %t
|
|
* HIT_END
|
|
*/
|
|
|
|
#include<hip/hip_runtime_api.h>
|
|
#include<hip/hip_runtime.h>
|
|
#include<iostream>
|
|
#include"test_common.h"
|
|
#include<hip/device_functions.h>
|
|
|
|
// Number of float elements in every host and device buffer of this test.
#define LEN 512
// Size of one buffer in bytes. Parenthesized so the macro expands safely
// inside larger expressions (the bare `LEN<<2` form binds looser than `*`,
// `+` and stream `<<`), and written with sizeof(float) instead of a
// hard-coded shift by 2.
#define SIZE (LEN * sizeof(float))
|
|
|
|
// Evaluates the fast-math trig intrinsics on one input element per thread.
//
// Each thread computes a flat index from its block and thread x-coordinates,
// reads In at that index and stores:
//   sin_d  <- __sinf(In)
//   cos_d  <- __cosf(In)
//   tan_d  <- __tanf(In)
//   sin_pd, cos_pd <- the two outputs of __sincosf(In)
//
// There is no bounds guard, so the launch must not create more threads than
// there are elements in the six buffers.
__global__ void kernel_trig(hipLaunchParm lp, float *In, float *sin_d, float *cos_d, float *tan_d, float *sin_pd, float *cos_pd){
    const int idx = hipBlockIdx_x * hipBlockDim_x + hipThreadIdx_x;
    const float *src = In + idx;

    // Separate sine / cosine / tangent intrinsics.
    *(sin_d + idx) = __sinf(*src);
    *(cos_d + idx) = __cosf(*src);
    *(tan_d + idx) = __tanf(*src);

    // Combined intrinsic writes both results through its pointer arguments.
    __sincosf(*src, sin_pd + idx, cos_pd + idx);
}
|
|
|
|
int main(){
|
|
float *In, *sin_h, *cos_h, *tan_h, *sin_ph, *cos_ph;
|
|
float *In_d, *sin_d, *cos_d, *tan_d, *sin_pd, *cos_pd;
|
|
In = new float[LEN];
|
|
sin_h = new float[LEN];
|
|
cos_h = new float[LEN];
|
|
tan_h = new float[LEN];
|
|
sin_ph = new float[LEN];
|
|
cos_ph = new float[LEN];
|
|
for(int i=0;i<LEN;i++){
|
|
In[i] = 1.0f;
|
|
sin_h[i] = 0.0f;
|
|
cos_h[i] = 0.0f;
|
|
tan_h[i] = 0.0f;
|
|
sin_ph[i] = 0.0f;
|
|
cos_ph[i] = 0.0f;
|
|
}
|
|
hipMalloc((void**)&In_d, SIZE);
|
|
hipMalloc((void**)&sin_d, SIZE);
|
|
hipMalloc((void**)&cos_d, SIZE);
|
|
hipMalloc((void**)&tan_d, SIZE);
|
|
hipMalloc((void**)&sin_pd, SIZE);
|
|
hipMalloc((void**)&cos_pd, SIZE);
|
|
hipMemcpy(In_d, In, SIZE, hipMemcpyHostToDevice);
|
|
hipLaunchKernel(kernel_trig, dim3(LEN,1,1), dim3(1,1,1), 0, 0, In_d, sin_d, cos_d, tan_d, sin_pd, cos_pd);
|
|
hipMemcpy(sin_h, sin_d, SIZE, hipMemcpyDeviceToHost);
|
|
hipMemcpy(cos_h, cos_d, SIZE, hipMemcpyDeviceToHost);
|
|
hipMemcpy(tan_h, tan_d, SIZE, hipMemcpyDeviceToHost);
|
|
hipMemcpy(sin_ph, sin_pd, SIZE, hipMemcpyDeviceToHost);
|
|
hipMemcpy(cos_ph, cos_pd, SIZE, hipMemcpyDeviceToHost);
|
|
for(int i=0;i<LEN;i++) {
|
|
if(sin_h[i] != sin_ph[i] || cos_h[i] != cos_ph[i] || tan_h[i]*cos_h[i] != sin_h[i]){
|
|
std::cout<<"Failed!"<<std::endl;
|
|
}
|
|
}
|
|
passed();
|
|
}
|