From 10c71a446c3834843a14828a60385e86fcd2c5af Mon Sep 17 00:00:00 2001
From: biondizzle
Date: Tue, 28 Apr 2026 03:07:14 +0000
Subject: [PATCH] =?UTF-8?q?Remove=20flash-attn=20GIT=5FTAG=20override=20to?=
 =?UTF-8?q?=20main=20=E2=80=94=20causes=20FLASHATTENTION=5FFP8=5FTWO=5FLEV?=
 =?UTF-8?q?EL=5FINTERVAL=20undefined=20error?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

v0.19.0 pins a compatible flash-attn commit (2921022). The sed that
forced GIT_TAG to main pulled in newer code that references
FLASHATTENTION_FP8_TWO_LEVEL_INTERVAL which isn't defined in v0.19.0's
build config. Use the pinned commit instead.
---
 vllm/Dockerfile | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

diff --git a/vllm/Dockerfile b/vllm/Dockerfile
index 3030348..5564f10 100644
--- a/vllm/Dockerfile
+++ b/vllm/Dockerfile
@@ -166,7 +166,9 @@ RUN cd vllm && \
  echo "========================================\n\n" && \
  git submodule sync && \
  git submodule update --init --recursive -j 8 && \
- sed -i 's/GIT_TAG [a-f0-9]\{40\}/GIT_TAG main/' cmake/external_projects/vllm_flash_attn.cmake && \
+ # NOTE: Removed the sed that forced flash-attn GIT_TAG to main.
+ # v0.19.0 pins a compatible commit; building from main causes
+ # FLASHATTENTION_FP8_TWO_LEVEL_INTERVAL undefined errors.
  sed -i 's/register_opaque_type(ModuleName, typ="value", hoist=True)/register_opaque_type(ModuleName, typ="value")/' vllm/utils/torch_utils.py && \
  export MAX_JOBS=8 && \
  export CMAKE_BUILD_PARALLEL_LEVEL=$MAX_JOBS && \