Files
vllm-image/Dockerfile

4 lines
188 B
Docker

# Start from the upstream vLLM image, tag `cu129-nightly`.
# NOTE(review): a `-nightly` tag presumably moves over time, so a rebuild may
# pick up a different vLLM than the one this patch was written against;
# consider pinning by digest once a known-good build is identified.
FROM vllm/vllm-openai:cu129-nightly

# Patch the vLLM module installed in the image: replace every occurrence of the
# text `cute.arch.fmin` with `cutlass.min` in the file below.
# The dots in the search pattern are escaped so they match only a literal '.';
# unescaped, each '.' is a regex wildcard and could rewrite unintended text.
# sed exits 0 even when nothing matches, so this step becomes a silent no-op if
# the file no longer contains the old name.
# NOTE(review): the reason for this substitution is not recorded here —
# presumably a workaround for an incompatibility in the nightly build; confirm
# and link the upstream issue so the patch can be dropped once it is fixed.
RUN sed -i 's/cute\.arch\.fmin/cutlass.min/g' \
    /usr/local/lib/python3.12/dist-packages/vllm/models/deepseek_v4/nvidia/ops/sparse_attn_compress_cutedsl.py