Updated envs for better Strix Halo support on vLLM
This commit is contained in:
@@ -2,3 +2,7 @@
|
||||
export TORCH_ROCM_AOTRITON_ENABLE_EXPERIMENTAL=1
|
||||
export FLASH_ATTENTION_TRITON_AMD_ENABLE="TRUE"
|
||||
export VLLM_TARGET_DEVICE=rocm
|
||||
export VLLM_USE_MMAP=0
|
||||
export VLLM_ROCM_USE_AITER=0
|
||||
export VLLM_ROCM_USE_AITER_MOE=0
|
||||
export VLLM_USE_TRITON_AWQ=1
|
||||
Reference in a new issue
Block a user