diff --git a/src/device/prims_ll.h b/src/device/prims_ll.h index d5867ef4b1..2cf1045c84 100644 --- a/src/device/prims_ll.h +++ b/src/device/prims_ll.h @@ -268,7 +268,7 @@ private: i4.flag2 = flag; __builtin_nontemporal_store(i4.v[0], dst->v); __builtin_nontemporal_store(i4.v[1], dst->v+1); -#if defined(__gfx950__) +#if defined(__gfx950__) && ROCM_VERSION < 70200 __builtin_amdgcn_fence(__ATOMIC_RELEASE, ""); // flush cache #endif #else @@ -344,7 +344,7 @@ private: __builtin_nontemporal_store(u4, (uint32_t*)dst); else __builtin_nontemporal_store(u8, (uint64_t*)dst); -#if defined(__gfx950__) +#if defined(__gfx950__) && ROCM_VERSION < 70200 __builtin_amdgcn_fence(__ATOMIC_RELEASE, ""); // flush cache #endif #else