[nvccTests] Enabled inline_asm_vadd on nvcc

[ROCm/hip commit: 18f6e31d1d]
This commit is contained in:
Phaneendr-kumar Lanka
2017-11-14 16:37:59 +05:30
parent 0fd5239b14
commit 65a8021933
@@ -39,7 +39,13 @@ __global__ void vadd_asm(hipLaunchParm lp,
{
int i = hipBlockDim_x * hipBlockIdx_x + hipThreadIdx_x;
asm volatile ("v_add_f32_e32 %0, %1, %2" : "=v" (out[i]) : "v"(in[i]),"v" (out[i]));
#ifdef __HIP_PLATFORM_NVCC__
asm volatile("add.f32 %0,%1,%2;":"=f"(out[i]):"f"(in[i]),"f"(out[i]));
#endif
#ifdef __HIP_PLATFORM_HCC__
asm volatile ("v_add_f32_e32 %0, %1, %2" : "=v" (out[i]) : "v"(in[i]),"v" (out[i]));
#endif
}
// CPU implementation of Vector Result