Installing flash_attn, as this is now needed by vLLM
This commit is contained in:
@@ -1,3 +1,4 @@
|
||||
# Required for Strix Halo / RDNA3.5 on vLLM
|
||||
export TORCH_ROCM_AOTRITON_ENABLE_EXPERIMENTAL=1
|
||||
export FLASH_ATTENTION_TRITON_AMD_ENABLE="TRUE"
|
||||
export VLLM_TARGET_DEVICE=rocm
|
||||
Referens i nytt ärende
Block a user