Fix warpSize for gfx10
Change-Id: I8029ebeb91db1efa8e166ad349aaae6364e8069d
[ROCm/clr commit: 71586b02e3]
This commit is contained in:
committed by
Yaxun Liu
parent
b022db2663
commit
f3663d440c
@@ -306,7 +306,17 @@ __device__ static inline int __hip_move_dpp_N(int src) {
|
||||
bound_ctrl);
|
||||
}
|
||||
|
||||
static constexpr int warpSize = 64;
|
||||
// FIXME: Remove the following workaround once the clang change that defines __AMDGCN_WAVEFRONT_SIZE is released.
|
||||
// This is for backward compatibility with older clang which does not define
|
||||
// __AMDGCN_WAVEFRONT_SIZE. Note that this fallback does not take -mwavefrontsize64 into account.
|
||||
#ifndef __AMDGCN_WAVEFRONT_SIZE
|
||||
#if __gfx1010__ || __gfx1011__ || __gfx1012__ || __gfx1030__ || __gfx1031__
|
||||
#define __AMDGCN_WAVEFRONT_SIZE 32
|
||||
#else
|
||||
#define __AMDGCN_WAVEFRONT_SIZE 64
|
||||
#endif
|
||||
#endif
|
||||
static constexpr int warpSize = __AMDGCN_WAVEFRONT_SIZE;
|
||||
|
||||
__device__
|
||||
inline
|
||||
|
||||
Reference in New Issue
Block a user