# Original snippet: Bash, 8 lines, 285 B
# Required for Strix Halo / RDNA3.5 on vLLM.
#
# Plain environment exports: source this file (or paste it into the shell)
# before launching vLLM so that the launched process inherits the variables.
# NOTE(review): the precise effect of each flag is defined by PyTorch,
# flash-attention and vLLM, not by this file -- confirm against their docs
# for the versions in use.

# PyTorch (ROCm) and flash-attention toggles.
export TORCH_ROCM_AOTRITON_ENABLE_EXPERIMENTAL=1
export FLASH_ATTENTION_TRITON_AMD_ENABLE="TRUE"

# vLLM: target device is rocm; the USE_MMAP and both AITER switches are set
# to 0, and the Triton AWQ switch is set to 1.
export VLLM_TARGET_DEVICE=rocm
export VLLM_USE_MMAP=0
export VLLM_ROCM_USE_AITER=0
export VLLM_ROCM_USE_AITER_MOE=0
export VLLM_USE_TRITON_AWQ=1