removing llvm flags as they have no impact on performance

Bu işleme şunda yer alıyor:
Donato Capitella
2026-02-24 08:27:57 +00:00
ebeveyn e726d406fa
işleme 1af159af81
-8
Dosyayı Görüntüle
@@ -38,8 +38,6 @@ ENV FLASH_ATTENTION_TRITON_AMD_ENABLE="TRUE"
RUN git clone https://github.com/ROCm/flash-attention.git &&\
cd flash-attention &&\
git checkout main_perf &&\
export CXXFLAGS="-mllvm --amdgpu-unroll-threshold-local=600" && \
export HIPCXXFLAGS="-mllvm --amdgpu-unroll-threshold-local=600" && \
python setup.py install && \
cd /opt && rm -rf /opt/flash-attention
@@ -70,10 +68,6 @@ ENV CXX="/opt/rocm/llvm/bin/clang++"
RUN export HIP_DEVICE_LIB_PATH=$(find /opt/rocm -type d -name bitcode -print -quit) && \
echo "Compiling with Bitcode: $HIP_DEVICE_LIB_PATH" && \
export CXXFLAGS="-mllvm --amdgpu-unroll-threshold-local=600" && \
export CFLAGS="-mllvm --amdgpu-unroll-threshold-local=600" && \
export HIPFLAGS="-mllvm --amdgpu-unroll-threshold-local=600" && \
export HIPCXXFLAGS="-mllvm --amdgpu-unroll-threshold-local=600" && \
export CMAKE_ARGS="-DROCM_PATH=/opt/rocm -DHIP_PATH=/opt/rocm -DAMDGPU_TARGETS=gfx1151 -DHIP_ARCHITECTURES=gfx1151" && \
python -m pip wheel --no-build-isolation --no-deps -w /tmp/dist -v . && \
python -m pip install /tmp/dist/*.whl
@@ -96,8 +90,6 @@ RUN cmake -S . \
-DCOMPUTE_BACKEND=hip \
-DCMAKE_HIP_COMPILER=/opt/rocm/llvm/bin/clang++ \
-DCMAKE_CXX_COMPILER=/opt/rocm/llvm/bin/clang++ \
-DCMAKE_CXX_FLAGS="-mllvm --amdgpu-unroll-threshold-local=600" \
-DCMAKE_HIP_FLAGS="-mllvm --amdgpu-unroll-threshold-local=600" \
&& \
make -j$(nproc) && \
python -m pip install --no-cache-dir . --no-build-isolation --no-deps