Updated envs for better Strix Halo support on vLLM
Šī revīzija ir iekļauta:
@@ -1,4 +1,8 @@
 # Required for Strix Halo / RDNA3.5 on vLLM
 export TORCH_ROCM_AOTRITON_ENABLE_EXPERIMENTAL=1
 export FLASH_ATTENTION_TRITON_AMD_ENABLE="TRUE"
 export VLLM_TARGET_DEVICE=rocm
+export VLLM_USE_MMAP=0
+export VLLM_ROCM_USE_AITER=0
+export VLLM_ROCM_USE_AITER_MOE=0
+export VLLM_USE_TRITON_AWQ=1
Atsaukties uz šo jaunā problēmā
Block a user