Updated environment variables for better Strix Halo support on vLLM
This commit is contained in:
@@ -2,3 +2,7 @@
|
|||||||
export TORCH_ROCM_AOTRITON_ENABLE_EXPERIMENTAL=1
|
export TORCH_ROCM_AOTRITON_ENABLE_EXPERIMENTAL=1
|
||||||
export FLASH_ATTENTION_TRITON_AMD_ENABLE="TRUE"
|
export FLASH_ATTENTION_TRITON_AMD_ENABLE="TRUE"
|
||||||
export VLLM_TARGET_DEVICE=rocm
|
export VLLM_TARGET_DEVICE=rocm
|
||||||
|
export VLLM_USE_MMAP=0
|
||||||
|
export VLLM_ROCM_USE_AITER=0
|
||||||
|
export VLLM_ROCM_USE_AITER_MOE=0
|
||||||
|
export VLLM_USE_TRITON_AWQ=1
|
||||||
مرجع در شماره جدید
Block a user