Files
vllm-kimi25-eagle/Dockerfile

12 lines
581 B
Docker

# ---- Stage 1: fetch and unpack the Eagle3 drafter model ---------------------
# The downloaded archive and the unzip tool exist only in this throwaway stage.
# Removing them in a later layer of the runtime image would not reclaim any
# space: the layers created by ADD and by `apt-get install` would still ship.
FROM vllm/vllm-openai:v0.19.0 AS eagle3-fetch

RUN apt-get update \
    && apt-get install -y --no-install-recommends unzip \
    && rm -rf /var/lib/apt/lists/*

# NOTE(review): this download is not integrity-checked. Once the archive's
# digest is known, pin it with `ADD --checksum=sha256:<digest> <url> <dest>`.
ADD https://ewr1.vultrobjects.com/artifacts/models--nvidia--Kimi-K2.5-Thinking-Eagle3.zip /tmp/eagle3.zip

RUN unzip /tmp/eagle3.zip -d /opt/nvidia-Kimi-K2.5-Thinking-Eagle3

# ---- Stage 2: runtime image -------------------------------------------------
FROM vllm/vllm-openai:v0.19.0

# Carry over only the extracted model files; the zip archive and unzip never
# enter this image, and no apt-get remove/autoremove touches the base packages.
COPY --from=eagle3-fetch /opt/nvidia-Kimi-K2.5-Thinking-Eagle3 /opt/nvidia-Kimi-K2.5-Thinking-Eagle3
# Patch the Kimi K2 tool parser for MTP: copy the patched module from the build
# context into vLLM's tool_parsers package directory.
# The destination hard-codes python3.12, so revisit this path if the base
# image moves to a different Python version.
COPY kimi_k2_tool_parser.py \
     /usr/local/lib/python3.12/dist-packages/vllm/tool_parsers/kimi_k2_tool_parser.py