fix: patch vLLM deepseek_v4.py directly in image

This commit is contained in:
2026-05-11 06:09:40 +00:00
parent 7c8c6cd67f
commit c8564caf9d

View File

@@ -18,8 +18,8 @@ ENV PYTHONPATH="/root/DeepGEMM:${PYTHONPATH}"
# Make the libnvrtc.so.13 found under the Python dist-packages nvidia/cu13 directory
# available under the unversioned name /usr/local/cuda/lib64/libnvrtc.so.
# -s creates a symlink; -f replaces whatever already exists at the destination.
RUN ln -sf /usr/local/lib/python3.12/dist-packages/nvidia/cu13/lib/libnvrtc.so.13 /usr/local/cuda/lib64/libnvrtc.so
# Build DeepGEMM's extension modules in place inside /root/DeepGEMM.
# NOTE(review): presumably --inplace is what makes the build importable through the
# /root/DeepGEMM entry on PYTHONPATH — confirm against the ENV line above this step.
RUN cd /root/DeepGEMM && python3 setup.py build_ext --inplace
# Copy our DeepSeek V4 patch into the image under /defaults.
# NOTE(review): this text comes from a diff hunk (-18,8 +18,8) whose +/- markers are
# missing; this COPY may be the pre-change version of the step that follows rather than
# a second, live copy — confirm whether /defaults/deepseek_v4.py is still wanted.
COPY patches/deepseek_v4.py /defaults/deepseek_v4.py
# Copy our DeepSeek V4 patch over vLLM's model file: the destination is deepseek_v4.py
# inside the vllm package under the Python 3.12 dist-packages directory, so any file
# already at that path is overwritten by the patched version from the build context.
COPY patches/deepseek_v4.py /usr/local/lib/python3.12/dist-packages/vllm/model_executor/models/deepseek_v4.py
# Verify everything imports
RUN python3 -c "import deep_gemm; print('DeepGEMM NVFP4 OK')" && \