diff --git a/vllm/Dockerfile b/vllm/Dockerfile
index b49a74c..6cf4a54 100644
--- a/vllm/Dockerfile
+++ b/vllm/Dockerfile
@@ -64,16 +64,20 @@ RUN mkdir /wheels
 # Pin setuptools to <81 for LMCache compatibility (needs >=77.0.3,<81.0.0)
 RUN uv pip install -U build cmake ninja pybind11 "setuptools>=77.0.3,<81.0.0" wheel
 
+# Use the prebuilt PyPI triton wheel instead of building from source
+# (QEMU segfaults during the triton build).
 FROM build-base AS build-triton
-ARG TRITON_REF=release/3.5.x
-ARG TRITON_BUILD_SUFFIX=+cu130
-ENV TRITON_WHEEL_VERSION_SUFFIX=${TRITON_BUILD_SUFFIX:-}
-RUN git clone https://github.com/triton-lang/triton.git
-RUN cd triton && \
-    git checkout ${TRITON_REF} && \
-    git submodule sync && \
-    git submodule update --init --recursive -j 8 && \
-    uv build --wheel --no-build-isolation -o /wheels
+# Triton release and wheel platform tag to fetch. Override with --build-arg to
+# pull a different version or target architecture without editing this stage.
+ARG TRITON_VERSION=3.6.0
+ARG TRITON_WHEEL_PLATFORM=manylinux_2_27_aarch64
+# --only-binary/--no-deps: fetch exactly one prebuilt triton wheel, never an sdist.
+RUN mkdir -p /wheels && \
+    pip download "triton==${TRITON_VERSION}" \
+        --platform "${TRITON_WHEEL_PLATFORM}" \
+        --only-binary=:all: \
+        --no-deps \
+        -d /wheels
 
 FROM build-base AS build-xformers
 #ARG XFORMERS_REF=v0.0.32.post2