From c8564caf9d8551fe6cd8e5af478d6daec6b5ff51 Mon Sep 17 00:00:00 2001
From: biondizzle
Date: Mon, 11 May 2026 06:09:40 +0000
Subject: [PATCH] fix: patch vLLM deepseek_v4.py directly in image

---
Review notes (this region is ignored by `git am`):
- The patch file is copied straight over the module inside the installed vllm
  package instead of being staged under /defaults.
- The destination hard-codes the python3.12 dist-packages path. COPY creates
  any missing destination directories, so if vllm is installed elsewhere in
  the base image this step would still succeed without replacing the module
  that is actually loaded.
- NOTE(review): the hunk context ends partway through the "Verify everything
  imports" RUN command; confirm that it also imports the patched vllm module.

 Dockerfile | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/Dockerfile b/Dockerfile
index 0277f24..f136533 100644
--- a/Dockerfile
+++ b/Dockerfile
@@ -18,8 +18,8 @@ ENV PYTHONPATH="/root/DeepGEMM:${PYTHONPATH}"
 RUN ln -sf /usr/local/lib/python3.12/dist-packages/nvidia/cu13/lib/libnvrtc.so.13 /usr/local/cuda/lib64/libnvrtc.so
 RUN cd /root/DeepGEMM && python3 setup.py build_ext --inplace
 
-# Copy our DeepSeek V4 patch into the image
-COPY patches/deepseek_v4.py /defaults/deepseek_v4.py
+# Copy our DeepSeek V4 patch over vLLM's model file
+COPY patches/deepseek_v4.py /usr/local/lib/python3.12/dist-packages/vllm/model_executor/models/deepseek_v4.py
 
 # Verify everything imports
 RUN python3 -c "import deep_gemm; print('DeepGEMM NVFP4 OK')" && \