From 68a275ee38d509d56c900343e4c03bf6f946890d Mon Sep 17 00:00:00 2001
From: Matthew Harris
Date: Mon, 1 Jun 2026 19:54:26 -0400
Subject: [PATCH] Patch deepseek_v4 sparse attn cutedsl op for cutlass.min

In the same RUN step that force-reinstalls
nvidia-cutlass-dsl-libs-cu13==4.5.2, rewrite every occurrence of
cute.arch.fmin to cutlass.min in vLLM's
deepseek_v4/nvidia/ops/sparse_attn_compress_cutedsl.py using sed.

The dots in the sed pattern are escaped so that only the literal text
"cute.arch.fmin" is matched; an unescaped "." matches any character.
---
Review notes (ignored by git am):
- The empty context line between FROM and RUN is reconstructed from the
  hunk header counts (-1,3 +1,4); confirm against the real Dockerfile.
- The post-image blob id on the index line (99fdd0b) predates the sed
  pattern change below; regenerate the patch to refresh it.
- NOTE(review): sed exits 0 when nothing matches, so this step becomes a
  silent no-op if the nightly base image stops using cute.arch.fmin.

 Dockerfile | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/Dockerfile b/Dockerfile
index 2469e0f..99fdd0b 100644
--- a/Dockerfile
+++ b/Dockerfile
@@ -1,3 +1,4 @@
 FROM vllm/vllm-openai:nightly
 
-RUN pip3 install --force-reinstall --no-deps nvidia-cutlass-dsl-libs-cu13==4.5.2
+RUN pip3 install --force-reinstall --no-deps nvidia-cutlass-dsl-libs-cu13==4.5.2 && \
+    sed -i 's/cute\.arch\.fmin/cutlass.min/g' /usr/local/lib/python3.12/dist-packages/vllm/models/deepseek_v4/nvidia/ops/sparse_attn_compress_cutedsl.py