@@ -16,6 +16,7 @@ RUN chmod 777 -R /tmp && apt-get update && DEBIAN_FRONTEND=noninteractive apt-ge
1616 make \
1717 git \
1818 cmake \
19+ ninja-build \
1920 build-essential && \
2021 rm -rf /var/lib/apt/lists/*
2122
@@ -43,7 +44,7 @@ WORKDIR /workspace
4344RUN pip install torch==2.7.1
4445
4546# Install build dependencies
46- RUN pip install --upgrade pip setuptools wheel build scikit-build-core[pyproject] pybind11
47+ RUN pip install --upgrade pip setuptools wheel build scikit-build-core[pyproject] pybind11 ninja
4748
4849# Copy source code to container
4950COPY . .
@@ -78,20 +79,11 @@ RUN echo "🔧 Building lightllm-kernel package..." && \
7879 CMAKE_PREFIX_PATH="$TORCH_CMAKE_PATH:$CMAKE_PREFIX_PATH" python -m build --wheel --outdir /out/ && \
7980 echo "✅ lightllm-kernel build completed"
8081
81- # Build flash_attn_3 package (hopper)
82- RUN echo "🔧 Building flash_attn_3 package..." && \
83- cd flash-attention/hopper && \
84- MAX_JOBS=2 NVCC_THREADS=2 FLASH_ATTN_CUDA_ARCHS=90 FLASH_ATTENTION_DISABLE_SM80=TRUE python setup.py bdist_wheel && \
85- cp dist/*.whl /out/ && \
86- echo "✅ flash_attn_3 build completed"
82+ # # Build flash_attn_3 package (hopper)
83+ # RUN echo "🔧 Building flash_attn_3 package..." && \
84+ # cd flash-attention/hopper && \
85+ # MAX_JOBS=2 NVCC_THREADS=2 FLASH_ATTN_CUDA_ARCHS=90 FLASH_ATTENTION_DISABLE_SM80=TRUE python setup.py bdist_wheel && \
86+ # cp dist/*.whl /out/ && \
87+ # echo "✅ flash_attn_3 build completed"
8788
88- # Verify all wheels are built
89- RUN echo "📦 Final wheel packages:" && \
90- ls -la /out/ && \
91- WHEEL_COUNT=$(ls -1 /out/*.whl | wc -l) && \
92- echo "Total wheels built: $WHEEL_COUNT" && \
93- if [ "$WHEEL_COUNT" -ne 2 ]; then \
94- echo "❌ Error: Expected 2 wheels, found $WHEEL_COUNT" && exit 1; \
95- else \
96- echo "✅ Successfully built all wheel packages" ; \
97- fi
89+ # Verify all wheels are built
0 commit comments