2016-06-10 09:46:31 -05:00
|
|
|
/*
|
|
|
|
|
Copyright (c) 2015-2016 Advanced Micro Devices, Inc. All rights reserved.
|
|
|
|
|
Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
|
|
|
of this software and associated documentation files (the "Software"), to deal
|
|
|
|
|
in the Software without restriction, including without limitation the rights
|
|
|
|
|
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
|
|
|
copies of the Software, and to permit persons to whom the Software is
|
|
|
|
|
furnished to do so, subject to the following conditions:
|
|
|
|
|
The above copyright notice and this permission notice shall be included in
|
|
|
|
|
all copies or substantial portions of the Software.
|
|
|
|
|
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
|
|
|
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
|
|
|
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
|
|
|
|
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
|
|
|
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
|
|
|
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
|
|
|
|
|
THE SOFTWARE.
|
|
|
|
|
*/
|
|
|
|
|
#include"test_common.h"
|
|
|
|
|
#include"hip_runtime.h"
|
|
|
|
|
#include"hip_runtime_api.h"
|
|
|
|
|
|
|
|
|
|
#define N 512
|
|
|
|
|
#define SIZE N*sizeof(double)
|
|
|
|
|
|
|
|
|
|
__global__ void test_sincos(hipLaunchParm lp, double* a, double* b, double *c){
|
|
|
|
|
int tid = hipThreadIdx_x;
|
|
|
|
|
sincos(a[tid], b+tid, c+tid);
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
__global__ void test_sincospi(hipLaunchParm lp, double* a, double* b, double *c){
|
|
|
|
|
int tid = hipThreadIdx_x;
|
|
|
|
|
sincospi(a[tid], b+tid, c+tid);
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
__global__ void test_llrint(hipLaunchParm lp, double *a, long long int *b){
|
|
|
|
|
int tid = hipThreadIdx_x;
|
|
|
|
|
b[tid] = llrint(a[tid]);
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
__global__ void test_lrint(hipLaunchParm lp, double *a, long int *b){
|
|
|
|
|
int tid = hipThreadIdx_x;
|
|
|
|
|
b[tid] = lrint(a[tid]);
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
__global__ void test_rint(hipLaunchParm lp, double *a, double *b){
|
|
|
|
|
int tid = hipThreadIdx_x;
|
|
|
|
|
b[tid] = rint(a[tid]);
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
__global__ void test_llround(hipLaunchParm lp, double *a, long long int *b){
|
|
|
|
|
int tid = hipThreadIdx_x;
|
|
|
|
|
b[tid] = llround(a[tid]);
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
__global__ void test_lround(hipLaunchParm lp, double *a, long int *b){
|
|
|
|
|
int tid = hipThreadIdx_x;
|
|
|
|
|
b[tid] = lround(a[tid]);
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
__global__ void test_rhypot(hipLaunchParm lp, double *a, double* b, double *c){
|
|
|
|
|
int tid = hipThreadIdx_x;
|
|
|
|
|
c[tid] = rhypot(a[tid], b[tid]);
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
__global__ void test_norm3d(hipLaunchParm lp, double *a, double* b, double *c, double *d){
|
|
|
|
|
int tid = hipThreadIdx_x;
|
|
|
|
|
d[tid] = norm3d(a[tid], b[tid], c[tid]);
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
__global__ void test_norm4d(hipLaunchParm lp, double *a, double* b, double *c, double *d, double *e){
|
|
|
|
|
int tid = hipThreadIdx_x;
|
|
|
|
|
e[tid] = norm4d(a[tid], b[tid], c[tid], d[tid]);
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
__global__ void test_rnorm3d(hipLaunchParm lp, double *a, double* b, double *c, double *d){
|
|
|
|
|
int tid = hipThreadIdx_x;
|
|
|
|
|
d[tid] = rnorm3d(a[tid], b[tid], c[tid]);
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
__global__ void test_rnorm4d(hipLaunchParm lp, double *a, double* b, double *c, double *d, double *e){
|
|
|
|
|
int tid = hipThreadIdx_x;
|
|
|
|
|
e[tid] = rnorm4d(a[tid], b[tid], c[tid], d[tid]);
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
__global__ void test_rnorm(hipLaunchParm lp, double *a, double *b){
|
|
|
|
|
int tid = hipThreadIdx_x;
|
|
|
|
|
b[tid] = rnorm(N, a);
|
|
|
|
|
}
|
|
|
|
|
|
2016-06-13 14:44:18 -05:00
|
|
|
__global__ void test_erfinv(hipLaunchParm lp, double *a, double *b){
|
|
|
|
|
int tid = hipThreadIdx_x;
|
|
|
|
|
b[tid] = erf(erfinv(a[tid]));
|
|
|
|
|
}
|
|
|
|
|
|
2016-06-10 09:46:31 -05:00
|
|
|
bool run_sincos(){
|
|
|
|
|
double *A, *Ad, *B, *C, *Bd, *Cd;
|
|
|
|
|
A = new double[N];
|
|
|
|
|
B = new double[N];
|
|
|
|
|
C = new double[N];
|
|
|
|
|
for(int i=0;i<N;i++){
|
|
|
|
|
A[i] = 1.0;
|
|
|
|
|
}
|
|
|
|
|
hipMalloc((void**)&Ad, SIZE);
|
|
|
|
|
hipMalloc((void**)&Bd, SIZE);
|
|
|
|
|
hipMalloc((void**)&Cd, SIZE);
|
|
|
|
|
hipMemcpy(Ad, A, SIZE, hipMemcpyHostToDevice);
|
|
|
|
|
hipLaunchKernel(test_sincos, dim3(1), dim3(N), 0, 0, Ad, Bd, Cd);
|
|
|
|
|
hipMemcpy(B, Bd, SIZE, hipMemcpyDeviceToHost);
|
|
|
|
|
hipMemcpy(C, Cd, SIZE, hipMemcpyDeviceToHost);
|
|
|
|
|
int passed = 0;
|
|
|
|
|
for(int i=0;i<512;i++){
|
|
|
|
|
if(B[i] == sin(1.0)){
|
|
|
|
|
passed = 1;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
passed = 0;
|
|
|
|
|
for(int i=0;i<512;i++){
|
|
|
|
|
if(C[i] == cos(1.0)){
|
|
|
|
|
passed = 1;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
free(A);
|
|
|
|
|
if(passed == 1){
|
|
|
|
|
return true;
|
|
|
|
|
}
|
|
|
|
|
assert(passed == 1);
|
|
|
|
|
return false;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
bool run_sincospi(){
|
|
|
|
|
double *A, *Ad, *B, *C, *Bd, *Cd;
|
|
|
|
|
A = new double[N];
|
|
|
|
|
B = new double[N];
|
|
|
|
|
C = new double[N];
|
|
|
|
|
for(int i=0;i<N;i++){
|
|
|
|
|
A[i] = 1.0;
|
|
|
|
|
}
|
|
|
|
|
hipMalloc((void**)&Ad, SIZE);
|
|
|
|
|
hipMalloc((void**)&Bd, SIZE);
|
|
|
|
|
hipMalloc((void**)&Cd, SIZE);
|
|
|
|
|
hipMemcpy(Ad, A, SIZE, hipMemcpyHostToDevice);
|
|
|
|
|
hipLaunchKernel(test_sincospi, dim3(1), dim3(N), 0, 0, Ad, Bd, Cd);
|
|
|
|
|
hipMemcpy(B, Bd, SIZE, hipMemcpyDeviceToHost);
|
|
|
|
|
hipMemcpy(C, Cd, SIZE, hipMemcpyDeviceToHost);
|
|
|
|
|
int passed = 0;
|
|
|
|
|
for(int i=0;i<512;i++){
|
|
|
|
|
if(B[i] - sinpi(1.0) < 0.1){
|
|
|
|
|
passed = 1;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
passed = 0;
|
|
|
|
|
for(int i=0;i<512;i++){
|
|
|
|
|
if(C[i] - cospi(1.0) < 0.1){
|
|
|
|
|
passed = 1;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
free(A);
|
|
|
|
|
if(passed == 1){
|
|
|
|
|
return true;
|
|
|
|
|
}
|
|
|
|
|
assert(passed == 1);
|
|
|
|
|
return false;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
bool run_llrint(){
|
|
|
|
|
double *A, *Ad;
|
|
|
|
|
long long int *B, *Bd;
|
|
|
|
|
A = new double[N];
|
|
|
|
|
B = new long long int[N];
|
|
|
|
|
for(int i=0;i<N;i++){
|
|
|
|
|
A[i] = 1.345;
|
|
|
|
|
}
|
|
|
|
|
hipMalloc((void**)&Ad, SIZE);
|
|
|
|
|
hipMalloc((void**)&Bd, N*sizeof(long long int));
|
|
|
|
|
hipMemcpy(Ad, A, SIZE, hipMemcpyHostToDevice);
|
|
|
|
|
hipLaunchKernel(test_llrint, dim3(1), dim3(N), 0, 0, Ad, Bd);
|
|
|
|
|
hipMemcpy(B, Bd, N*sizeof(long long int), hipMemcpyDeviceToHost);
|
|
|
|
|
int passed = 0;
|
|
|
|
|
for(int i=0;i<512;i++){
|
|
|
|
|
int x = round(A[i]);
|
|
|
|
|
long long int y = x;
|
|
|
|
|
if(B[i] == x){
|
|
|
|
|
passed = 1;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
free(A);
|
|
|
|
|
if(passed == 1){
|
|
|
|
|
return true;
|
|
|
|
|
}
|
|
|
|
|
assert(passed == 1);
|
|
|
|
|
return false;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
bool run_lrint(){
|
|
|
|
|
double *A, *Ad;
|
|
|
|
|
long int *B, *Bd;
|
|
|
|
|
A = new double[N];
|
|
|
|
|
B = new long int[N];
|
|
|
|
|
for(int i=0;i<N;i++){
|
|
|
|
|
A[i] = 1.345;
|
|
|
|
|
}
|
|
|
|
|
hipMalloc((void**)&Ad, SIZE);
|
|
|
|
|
hipMalloc((void**)&Bd, N*sizeof(long int));
|
|
|
|
|
hipMemcpy(Ad, A, SIZE, hipMemcpyHostToDevice);
|
|
|
|
|
hipLaunchKernel(test_lrint, dim3(1), dim3(N), 0, 0, Ad, Bd);
|
|
|
|
|
hipMemcpy(B, Bd, N*sizeof(long int), hipMemcpyDeviceToHost);
|
|
|
|
|
int passed = 0;
|
|
|
|
|
for(int i=0;i<512;i++){
|
|
|
|
|
long int x = round(A[i]);
|
|
|
|
|
if(B[i] == x){
|
|
|
|
|
passed = 1;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
free(A);
|
|
|
|
|
if(passed == 1){
|
|
|
|
|
return true;
|
|
|
|
|
}
|
|
|
|
|
assert(passed == 1);
|
|
|
|
|
return false;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
bool run_rint(){
|
|
|
|
|
double *A, *Ad;
|
|
|
|
|
double *B, *Bd;
|
|
|
|
|
A = new double[N];
|
|
|
|
|
B = new double[N];
|
|
|
|
|
for(int i=0;i<N;i++){
|
|
|
|
|
A[i] = 1.345;
|
|
|
|
|
}
|
|
|
|
|
hipMalloc((void**)&Ad, SIZE);
|
|
|
|
|
hipMalloc((void**)&Bd, SIZE);
|
|
|
|
|
hipMemcpy(Ad, A, SIZE, hipMemcpyHostToDevice);
|
|
|
|
|
hipLaunchKernel(test_rint, dim3(1), dim3(N), 0, 0, Ad, Bd);
|
|
|
|
|
hipMemcpy(B, Bd, SIZE, hipMemcpyDeviceToHost);
|
|
|
|
|
int passed = 0;
|
|
|
|
|
for(int i=0;i<512;i++){
|
|
|
|
|
double x = round(A[i]);
|
|
|
|
|
if(B[i] == x){
|
|
|
|
|
passed = 1;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
free(A);
|
|
|
|
|
if(passed == 1){
|
|
|
|
|
return true;
|
|
|
|
|
}
|
|
|
|
|
assert(passed == 1);
|
|
|
|
|
return false;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
bool run_llround(){
|
|
|
|
|
double *A, *Ad;
|
|
|
|
|
long long int *B, *Bd;
|
|
|
|
|
A = new double[N];
|
|
|
|
|
B = new long long int[N];
|
|
|
|
|
for(int i=0;i<N;i++){
|
|
|
|
|
A[i] = 1.345;
|
|
|
|
|
}
|
|
|
|
|
hipMalloc((void**)&Ad, SIZE);
|
|
|
|
|
hipMalloc((void**)&Bd, N*sizeof(long long int));
|
|
|
|
|
hipMemcpy(Ad, A, SIZE, hipMemcpyHostToDevice);
|
|
|
|
|
hipLaunchKernel(test_llround, dim3(1), dim3(N), 0, 0, Ad, Bd);
|
|
|
|
|
hipMemcpy(B, Bd, N*sizeof(long long int), hipMemcpyDeviceToHost);
|
|
|
|
|
int passed = 0;
|
|
|
|
|
for(int i=0;i<512;i++){
|
|
|
|
|
long long int x = round(A[i]);
|
|
|
|
|
if(B[i] == x){
|
|
|
|
|
passed = 1;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
free(A);
|
|
|
|
|
if(passed == 1){
|
|
|
|
|
return true;
|
|
|
|
|
}
|
|
|
|
|
assert(passed == 1);
|
|
|
|
|
return false;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
bool run_lround(){
|
|
|
|
|
double *A, *Ad;
|
|
|
|
|
long int *B, *Bd;
|
|
|
|
|
A = new double[N];
|
|
|
|
|
B = new long int[N];
|
|
|
|
|
for(int i=0;i<N;i++){
|
|
|
|
|
A[i] = 1.345;
|
|
|
|
|
}
|
|
|
|
|
hipMalloc((void**)&Ad, SIZE);
|
|
|
|
|
hipMalloc((void**)&Bd, N*sizeof(long int));
|
|
|
|
|
hipMemcpy(Ad, A, SIZE, hipMemcpyHostToDevice);
|
|
|
|
|
hipLaunchKernel(test_lround, dim3(1), dim3(N), 0, 0, Ad, Bd);
|
|
|
|
|
hipMemcpy(B, Bd, N*sizeof(long int), hipMemcpyDeviceToHost);
|
|
|
|
|
int passed = 0;
|
|
|
|
|
for(int i=0;i<512;i++){
|
|
|
|
|
long int x = round(A[i]);
|
|
|
|
|
if(B[i] == x){
|
|
|
|
|
passed = 1;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
free(A);
|
|
|
|
|
if(passed == 1){
|
|
|
|
|
return true;
|
|
|
|
|
}
|
|
|
|
|
assert(passed == 1);
|
|
|
|
|
return false;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
bool run_norm3d(){
|
|
|
|
|
double *A, *Ad, *B, *Bd, *C, *Cd, *D, *Dd;
|
|
|
|
|
A = new double[N];
|
|
|
|
|
B = new double[N];
|
|
|
|
|
C = new double[N];
|
|
|
|
|
D = new double[N];
|
|
|
|
|
double val = 0.0;
|
|
|
|
|
for(int i=0;i<N;i++){
|
|
|
|
|
A[i] = 1.0;
|
|
|
|
|
B[i] = 2.0;
|
|
|
|
|
C[i] = 3.0;
|
|
|
|
|
}
|
|
|
|
|
val = sqrt(1.0 + 4.0 + 9.0);
|
|
|
|
|
hipMalloc((void**)&Ad, SIZE);
|
|
|
|
|
hipMalloc((void**)&Bd, SIZE);
|
|
|
|
|
hipMalloc((void**)&Cd, SIZE);
|
|
|
|
|
hipMalloc((void**)&Dd, SIZE);
|
|
|
|
|
hipMemcpy(Ad, A, SIZE, hipMemcpyHostToDevice);
|
|
|
|
|
hipMemcpy(Bd, B, SIZE, hipMemcpyHostToDevice);
|
|
|
|
|
hipMemcpy(Cd, C, SIZE, hipMemcpyHostToDevice);
|
|
|
|
|
hipLaunchKernel(test_norm3d, dim3(1), dim3(N), 0, 0, Ad, Bd, Cd, Dd);
|
|
|
|
|
hipMemcpy(D, Dd, SIZE, hipMemcpyDeviceToHost);
|
|
|
|
|
int passed = 0;
|
|
|
|
|
for(int i=0;i<512;i++){
|
|
|
|
|
if(D[i] - val < 0.000001){
|
|
|
|
|
passed = 1;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
free(A);
|
|
|
|
|
if(passed == 1){
|
|
|
|
|
return true;
|
|
|
|
|
}
|
|
|
|
|
assert(passed == 1);
|
|
|
|
|
return false;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
bool run_norm4d(){
|
|
|
|
|
double *A, *Ad, *B, *Bd, *C, *Cd, *D, *Dd, *E, *Ed;
|
|
|
|
|
A = new double[N];
|
|
|
|
|
B = new double[N];
|
|
|
|
|
C = new double[N];
|
|
|
|
|
D = new double[N];
|
|
|
|
|
E = new double[N];
|
|
|
|
|
double val = 0.0;
|
|
|
|
|
for(int i=0;i<N;i++){
|
|
|
|
|
A[i] = 1.0;
|
|
|
|
|
B[i] = 2.0;
|
|
|
|
|
C[i] = 3.0;
|
|
|
|
|
D[i] = 4.0;
|
|
|
|
|
}
|
|
|
|
|
val = sqrt(1.0 + 4.0 + 9.0 + 16.0);
|
|
|
|
|
hipMalloc((void**)&Ad, SIZE);
|
|
|
|
|
hipMalloc((void**)&Bd, SIZE);
|
|
|
|
|
hipMalloc((void**)&Cd, SIZE);
|
|
|
|
|
hipMalloc((void**)&Dd, SIZE);
|
|
|
|
|
hipMalloc((void**)&Ed, SIZE);
|
|
|
|
|
hipMemcpy(Ad, A, SIZE, hipMemcpyHostToDevice);
|
|
|
|
|
hipMemcpy(Bd, B, SIZE, hipMemcpyHostToDevice);
|
|
|
|
|
hipMemcpy(Cd, C, SIZE, hipMemcpyHostToDevice);
|
|
|
|
|
hipMemcpy(Dd, D, SIZE, hipMemcpyHostToDevice);
|
|
|
|
|
hipLaunchKernel(test_norm4d, dim3(1), dim3(N), 0, 0, Ad, Bd, Cd, Dd, Ed);
|
|
|
|
|
hipMemcpy(E, Ed, SIZE, hipMemcpyDeviceToHost);
|
|
|
|
|
int passed = 0;
|
|
|
|
|
for(int i=0;i<512;i++){
|
|
|
|
|
if(E[i] - val < 0.000001){
|
|
|
|
|
passed = 1;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
free(A);
|
|
|
|
|
if(passed == 1){
|
|
|
|
|
return true;
|
|
|
|
|
}
|
|
|
|
|
assert(passed == 1);
|
|
|
|
|
return false;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
bool run_rhypot(){
|
|
|
|
|
double *A, *Ad, *B, *Bd, *C, *Cd;
|
|
|
|
|
A = new double[N];
|
|
|
|
|
B = new double[N];
|
|
|
|
|
C = new double[N];
|
|
|
|
|
double val = 0.0;
|
|
|
|
|
for(int i=0;i<N;i++){
|
|
|
|
|
A[i] = 1.0;
|
|
|
|
|
B[i] = 2.0;
|
|
|
|
|
}
|
|
|
|
|
val = 1/sqrt(1.0 + 4.0);
|
|
|
|
|
hipMalloc((void**)&Ad, SIZE);
|
|
|
|
|
hipMalloc((void**)&Bd, SIZE);
|
|
|
|
|
hipMalloc((void**)&Cd, SIZE);
|
|
|
|
|
hipMemcpy(Ad, A, SIZE, hipMemcpyHostToDevice);
|
|
|
|
|
hipMemcpy(Bd, B, SIZE, hipMemcpyHostToDevice);
|
|
|
|
|
hipLaunchKernel(test_rhypot, dim3(1), dim3(N), 0, 0, Ad, Bd, Cd);
|
|
|
|
|
hipMemcpy(C, Cd, SIZE, hipMemcpyDeviceToHost);
|
|
|
|
|
int passed = 0;
|
|
|
|
|
for(int i=0;i<512;i++){
|
|
|
|
|
if(C[i] - val < 0.000001){
|
|
|
|
|
passed = 1;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
free(A);
|
|
|
|
|
if(passed == 1){
|
|
|
|
|
return true;
|
|
|
|
|
}
|
|
|
|
|
assert(passed == 1);
|
|
|
|
|
return false;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
bool run_rnorm3d(){
|
|
|
|
|
double *A, *Ad, *B, *Bd, *C, *Cd, *D, *Dd;
|
|
|
|
|
A = new double[N];
|
|
|
|
|
B = new double[N];
|
|
|
|
|
C = new double[N];
|
|
|
|
|
D = new double[N];
|
|
|
|
|
double val = 0.0;
|
|
|
|
|
for(int i=0;i<N;i++){
|
|
|
|
|
A[i] = 1.0;
|
|
|
|
|
B[i] = 2.0;
|
|
|
|
|
C[i] = 3.0;
|
|
|
|
|
}
|
|
|
|
|
val = 1/sqrt(1.0 + 4.0 + 9.0);
|
|
|
|
|
hipMalloc((void**)&Ad, SIZE);
|
|
|
|
|
hipMalloc((void**)&Bd, SIZE);
|
|
|
|
|
hipMalloc((void**)&Cd, SIZE);
|
|
|
|
|
hipMalloc((void**)&Dd, SIZE);
|
|
|
|
|
hipMemcpy(Ad, A, SIZE, hipMemcpyHostToDevice);
|
|
|
|
|
hipMemcpy(Bd, B, SIZE, hipMemcpyHostToDevice);
|
|
|
|
|
hipMemcpy(Cd, C, SIZE, hipMemcpyHostToDevice);
|
|
|
|
|
hipLaunchKernel(test_rnorm3d, dim3(1), dim3(N), 0, 0, Ad, Bd, Cd, Dd);
|
|
|
|
|
hipMemcpy(D, Dd, SIZE, hipMemcpyDeviceToHost);
|
|
|
|
|
int passed = 0;
|
|
|
|
|
for(int i=0;i<512;i++){
|
|
|
|
|
if(D[i] - val < 0.000001){
|
|
|
|
|
passed = 1;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
free(A);
|
|
|
|
|
if(passed == 1){
|
|
|
|
|
return true;
|
|
|
|
|
}
|
|
|
|
|
assert(passed == 1);
|
|
|
|
|
return false;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
bool run_rnorm4d(){
|
|
|
|
|
double *A, *Ad, *B, *Bd, *C, *Cd, *D, *Dd, *E, *Ed;
|
|
|
|
|
A = new double[N];
|
|
|
|
|
B = new double[N];
|
|
|
|
|
C = new double[N];
|
|
|
|
|
D = new double[N];
|
|
|
|
|
E = new double[N];
|
|
|
|
|
double val = 0.0;
|
|
|
|
|
for(int i=0;i<N;i++){
|
|
|
|
|
A[i] = 1.0;
|
|
|
|
|
B[i] = 2.0;
|
|
|
|
|
C[i] = 3.0;
|
|
|
|
|
D[i] = 4.0;
|
|
|
|
|
}
|
|
|
|
|
val = 1/sqrt(1.0 + 4.0 + 9.0 + 16.0);
|
|
|
|
|
hipMalloc((void**)&Ad, SIZE);
|
|
|
|
|
hipMalloc((void**)&Bd, SIZE);
|
|
|
|
|
hipMalloc((void**)&Cd, SIZE);
|
|
|
|
|
hipMalloc((void**)&Dd, SIZE);
|
|
|
|
|
hipMalloc((void**)&Ed, SIZE);
|
|
|
|
|
hipMemcpy(Ad, A, SIZE, hipMemcpyHostToDevice);
|
|
|
|
|
hipMemcpy(Bd, B, SIZE, hipMemcpyHostToDevice);
|
|
|
|
|
hipMemcpy(Cd, C, SIZE, hipMemcpyHostToDevice);
|
|
|
|
|
hipMemcpy(Dd, D, SIZE, hipMemcpyHostToDevice);
|
|
|
|
|
hipLaunchKernel(test_rnorm4d, dim3(1), dim3(N), 0, 0, Ad, Bd, Cd, Dd, Ed);
|
|
|
|
|
hipMemcpy(E, Ed, SIZE, hipMemcpyDeviceToHost);
|
|
|
|
|
int passed = 0;
|
|
|
|
|
for(int i=0;i<512;i++){
|
|
|
|
|
if(E[i] - val < 0.000001){
|
|
|
|
|
passed = 1;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
free(A);
|
|
|
|
|
if(passed == 1){
|
|
|
|
|
return true;
|
|
|
|
|
}
|
|
|
|
|
assert(passed == 1);
|
|
|
|
|
return false;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
bool run_rnorm(){
|
|
|
|
|
double *A, *Ad, *B, *Bd;
|
|
|
|
|
A = new double[N];
|
|
|
|
|
B = new double[N];
|
|
|
|
|
double val = 0.0;
|
|
|
|
|
for(int i=0;i<N;i++){
|
|
|
|
|
A[i] = 1.0;
|
|
|
|
|
B[i] = 0.0;
|
|
|
|
|
val += 1.0;
|
|
|
|
|
}
|
|
|
|
|
val = 1/sqrt(val);
|
|
|
|
|
hipMalloc((void**)&Ad, SIZE);
|
|
|
|
|
hipMalloc((void**)&Bd, SIZE);
|
|
|
|
|
hipMemcpy(Ad, A, SIZE, hipMemcpyHostToDevice);
|
|
|
|
|
hipLaunchKernel(test_rnorm, dim3(1), dim3(N), 0, 0, Ad, Bd);
|
|
|
|
|
hipMemcpy(B, Bd, SIZE, hipMemcpyDeviceToHost);
|
|
|
|
|
int passed = 0;
|
|
|
|
|
for(int i=0;i<512;i++){
|
|
|
|
|
if(B[0] - val < 0.000001){
|
|
|
|
|
passed = 1;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
free(A);
|
|
|
|
|
if(passed == 1){
|
|
|
|
|
return true;
|
|
|
|
|
}
|
|
|
|
|
assert(passed == 1);
|
|
|
|
|
return false;
|
|
|
|
|
}
|
|
|
|
|
|
2016-06-13 14:44:18 -05:00
|
|
|
bool run_erfinv(){
|
|
|
|
|
double *A, *Ad, *B, *Bd;
|
|
|
|
|
A = new double[N];
|
|
|
|
|
B = new double[N];
|
|
|
|
|
for(int i=0;i<N;i++){
|
|
|
|
|
A[i] = -0.6;
|
|
|
|
|
B[i] = 0.0;
|
|
|
|
|
}
|
|
|
|
|
hipMalloc((void**)&Ad, SIZE);
|
|
|
|
|
hipMalloc((void**)&Bd, SIZE);
|
|
|
|
|
hipMemcpy(Ad, A, SIZE, hipMemcpyHostToDevice);
|
|
|
|
|
hipLaunchKernel(test_erfinv, dim3(1), dim3(N), 0, 0, Ad, Bd);
|
|
|
|
|
hipMemcpy(B, Bd, SIZE, hipMemcpyDeviceToHost);
|
|
|
|
|
int passed = 0;
|
|
|
|
|
for(int i=0;i<512;i++){
|
|
|
|
|
if(B[i] - A[i] < 0.000001){
|
|
|
|
|
passed = 1;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
free(A);
|
|
|
|
|
if(passed == 1){
|
|
|
|
|
return true;
|
|
|
|
|
}
|
|
|
|
|
assert(passed == 1);
|
|
|
|
|
return false;
|
|
|
|
|
}
|
2016-06-10 09:46:31 -05:00
|
|
|
|
|
|
|
|
int main(){
|
|
|
|
|
if(run_sincos() && run_sincospi() && run_llrint() && run_norm3d() && run_norm4d() &&
|
|
|
|
|
run_rnorm3d() && run_rnorm4d() &&
|
|
|
|
|
run_rnorm() && run_lround() && run_llround() &&
|
2016-06-13 14:44:18 -05:00
|
|
|
run_rint() && run_rhypot() && run_erfinv()
|
2016-06-10 09:46:31 -05:00
|
|
|
){
|
|
|
|
|
passed();
|
|
|
|
|
}
|
|
|
|
|
}
|