From 0698298d13435f980f194aa336fb67e82f8194b2 Mon Sep 17 00:00:00 2001
From: biondizzle
Date: Tue, 28 Apr 2026 10:17:50 +0000
Subject: [PATCH] Bleeding edge: vLLM main branch, flashinfer v0.6.7, Gitea fork source

---
Review notes (commentary only; nothing in this section changes the diff):

* Line structure was restored from a copy of this patch that had been
  collapsed onto a single line. Both hunks match the line counts declared
  in their headers (7/7 and 10/10). The indentation of the shell
  continuation lines in the second hunk could not be recovered and is
  assumed to be four spaces; the spacing before the inline comment on the
  commented-out FLASHINFER_REF line is likewise assumed. Verify against
  vllm/Dockerfile, or apply with `git apply --ignore-whitespace`.
* The From: header carries no e-mail address in the copy reviewed; restore
  it if the tool used to apply this patch requires one.
* VLLM_REF now defaults to the moving `main` branch, so two builds of the
  same Dockerfile can produce different images. For release images pass an
  immutable ref, e.g. `--build-arg VLLM_REF=<tag-or-commit-sha>`.
* vLLM is now cloned from a fork on sweetapi.com instead of
  github.com/vllm-project. Confirm the fork is trusted and kept in sync
  with upstream before relying on it.
* The comment block above FLASHINFER_REF still pairs v0.6.6 with vLLM
  v0.19.0, and the commented-out `ARG FLASHINFER_REF=v0.6.7` line now
  duplicates the active value. TODO(review): refresh those comments in a
  follow-up once the v0.6.7 + main combination is confirmed.

 vllm/Dockerfile | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/vllm/Dockerfile b/vllm/Dockerfile
index 5564f10..738e525 100644
--- a/vllm/Dockerfile
+++ b/vllm/Dockerfile
@@ -102,7 +102,7 @@ ARG FLASHINFER_ENABLE_AOT=1
 # - v0.6.7 works with vLLM v0.18.2rc0 (Build #43)
 # - v0.6.6 works with vLLM v0.19.0 (for Gemma 4 support)
 # ARG FLASHINFER_REF=v0.6.7 # For vLLM v0.18.2rc0
-ARG FLASHINFER_REF=v0.6.6
+ARG FLASHINFER_REF=v0.6.7
 ARG FLASHINFER_BUILD_SUFFIX=cu132
 ENV FLASHINFER_LOCAL_VERSION=${FLASHINFER_BUILD_SUFFIX:-}
 RUN git clone https://github.com/flashinfer-ai/flashinfer.git
@@ -151,10 +151,10 @@ RUN apt-get update && apt-get install -y build-essential cmake gcc && \
 # ==============================================================================
 FROM build-base AS build-vllm
 # vLLM version to build
-ARG VLLM_REF=v0.19.0
+ARG VLLM_REF=main
 # Install ccache for faster compilation
 RUN apt-get update && apt-get install -y ccache
-RUN git clone https://github.com/vllm-project/vllm.git
+RUN git clone https://sweetapi.com/biondizzle/vllm.git
 RUN cd vllm && \
     git checkout ${VLLM_REF} && \
     echo "\n\n========================================" && \