SWDEV-525969 - add gfx950 to use ocp type for fp8 (#157)
* do not use __gfx94plus_clr__ macro in fp8 header
[ROCm/clr commit: 5214d1ca07]
This commit is contained in:
zatwierdzone przez
GitHub
rodzic
ef52738425
commit
b0d9ea7454
@@ -30,8 +30,9 @@
|
||||
#ifndef _HIP_INCLUDE_HIP_AMD_DETAIL_HIP_FP8_H_
|
||||
#define _HIP_INCLUDE_HIP_AMD_DETAIL_HIP_FP8_H_
|
||||
|
||||
#if (defined(__gfx94plus_clr__) || defined(__gfx1200__) || defined(__gfx1201__)) && \
|
||||
__HIP_DEVICE_COMPILE__
|
||||
#if (defined(__gfx942__) || defined(__gfx1200__) || defined(__gfx1201__) || \
|
||||
defined(__gfx950__)) && \
|
||||
__HIP_DEVICE_COMPILE__
|
||||
#define HIP_FP8_CVT_FAST_PATH 1
|
||||
#else
|
||||
#define HIP_FP8_CVT_FAST_PATH 0
|
||||
@@ -40,7 +41,8 @@
|
||||
#if defined(__gfx942__) && __HIP_DEVICE_COMPILE__
|
||||
#define HIP_FP8_TYPE_OCP 0
|
||||
#define HIP_FP8_TYPE_FNUZ 1
|
||||
#elif (defined(__gfx1200__) || defined(__gfx1201__)) && __HIP_DEVICE_COMPILE__
|
||||
#elif (defined(__gfx1200__) || defined(__gfx1201__) || defined(__gfx950__)) && \
|
||||
__HIP_DEVICE_COMPILE__
|
||||
#define HIP_FP8_TYPE_OCP 1
|
||||
#define HIP_FP8_TYPE_FNUZ 0
|
||||
#else
|
||||
|
||||
Reference in New Issue
Block a user