4 lines
188 B
Docker
4 lines
188 B
Docker
# Start from the vllm/vllm-openai image at the cu129-nightly tag.
# NOTE(review): "nightly" is presumably a moving tag, so the patched file below
# may change or move between builds; pin by digest if reproducibility matters.
FROM vllm/vllm-openai:cu129-nightly

# Patch the installed vLLM source in place: every occurrence of the literal
# name `cute.arch.fmin` in the target file is rewritten to `cutlass.min`.
# The dots in the pattern are escaped so that sed matches only the literal
# dotted name rather than any character in those positions.
# NOTE(review): the reason for the substitution is not recorded here
# (presumably an API mismatch in the bundled kernel code); confirm and note
# the upstream issue so this step can be removed once it is fixed.
RUN sed -i 's/cute\.arch\.fmin/cutlass.min/g' \
    /usr/local/lib/python3.12/dist-packages/vllm/models/deepseek_v4/nvidia/ops/sparse_attn_compress_cutedsl.py