Skip to content

Commit a14f48b

Browse files
committed
Use prebuilt flash_attn_3 wheel
1 parent 2981be4 commit a14f48b

File tree

1 file changed

+6
-1
lines changed

1 file changed

+6
-1
lines changed

Dockerfile

Lines changed: 6 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -79,7 +79,12 @@ RUN echo "🔧 Building lightllm-kernel package..." && \
7979
CMAKE_PREFIX_PATH="$TORCH_CMAKE_PATH:$CMAKE_PREFIX_PATH" python -m build --wheel --outdir /out/ && \
8080
echo "✅ lightllm-kernel build completed"
8181

82-
# # Build flash_attn_3 package (hopper)
82+
# Use the prebuilt flash_attn_3 wheel instead of compiling it (saves 50+ minutes of build time)
83+
RUN echo "📦 Using prebuilt flash_attn_3 wheel..." && \
84+
cp flash-attention/hopper/dist/flash_attn_3-3.0.0b1-cp39-abi3-linux_x86_64.whl /out/ && \
85+
echo "✅ flash_attn_3 wheel copied successfully"
86+
87+
# Fallback: uncomment the lines below to build flash_attn_3 from source instead
8388
# RUN echo "🔧 Building flash_attn_3 package..." && \
8489
# cd flash-attention/hopper && \
8590
# MAX_JOBS=2 NVCC_THREADS=2 FLASH_ATTN_CUDA_ARCHS=90 FLASH_ATTENTION_DISABLE_SM80=TRUE python setup.py bdist_wheel && \

0 commit comments

Comments
 (0)