6 lines
276 B
Docker
6 lines
276 B
Docker
# Base image for this build. The default is the vLLM image bundled with
# LMCache (per its repository name). To build on a different base without
# editing this file, override the argument, e.g.:
#   docker build --build-arg BASE_IMAGE=vllm/vllm-openai:v0.19.0-cu130 .
ARG BASE_IMAGE=atl.vultrcr.com/vllm/vllm-with-lmcache:v0.19.0-cu130-mla-multi-group-kv-cache
FROM ${BASE_IMAGE}

# Patch tool parser for GLM regex fix: copy the parser module from the build
# context into the vllm package directory of the image (presumably replacing
# the version shipped with the base image).
# NOTE(review): the destination assumes vllm is installed under the Python 3.12
# dist-packages directory -- confirm this still holds when BASE_IMAGE changes.
# NOTE(review): the fix is described as GLM-related, but the patched file is
# the deepseekv32 parser -- confirm this is the intended module.
COPY deepseekv32_tool_parser.py /usr/local/lib/python3.12/dist-packages/vllm/tool_parsers/deepseekv32_tool_parser.py