2026-04-11 23:39:36 +00:00
|
|
|
# Base image: the lmsysorg SGLang ROCm image, pinned to an explicit version
# tag (never :latest) so rebuilds start from the same upstream release.
FROM lmsysorg/sglang-rocm:v0.5.10rc0-rocm700-mi30x-20260411
|
|
|
|
|
|
2026-04-12 17:09:58 +00:00
|
|
|
# ---------------------------------------------------------------
# haproxy: serves a stub for /metrics and proxies all other
# traffic through to SGLang
# ---------------------------------------------------------------
# update + install + list cleanup stay in one RUN so the apt index is
# never stale and never persisted in an image layer.
RUN apt-get update \
    && apt-get install -y --no-install-recommends \
        haproxy \
    && rm -rf /var/lib/apt/lists/*
|
|
|
|
|
|
2026-04-12 02:47:33 +00:00
|
|
|
# ---------------------------------------------------------------
# Replace the vllm binary with our shim
# ---------------------------------------------------------------
# The shim script is installed under the name `vllm` in /usr/local/bin.
# --chmod makes it executable as part of the copy itself, so no follow-up
# `RUN chmod` layer (which would store the file a second time) is needed.
# NOTE: COPY --chmod requires BuildKit.
COPY --chmod=0755 vllm-shim.sh /usr/local/bin/vllm
|
2026-04-11 23:39:36 +00:00
|
|
|
|
2026-04-12 02:47:33 +00:00
|
|
|
# Shadow `python -m vllm.*` invocations: lay out the directory skeleton
# of a stand-in `vllm` package under /opt/vllm-shim.
RUN mkdir -p \
    /opt/vllm-shim/vllm/entrypoints/cli \
    /opt/vllm-shim/vllm/entrypoints/openai
|
|
|
|
|
# One shim module is installed at every module path it stands in for:
#   vllm.entrypoints.cli.main
#   vllm.entrypoints.openai.api_server
#   vllm (via __main__.py)
COPY vllm_shim_module.py /opt/vllm-shim/vllm/entrypoints/cli/main.py
COPY vllm_shim_module.py /opt/vllm-shim/vllm/entrypoints/openai/api_server.py
COPY vllm_shim_module.py /opt/vllm-shim/vllm/__main__.py
|
2026-04-12 18:58:37 +00:00
|
|
|
# Installed at the shim root rather than inside the vllm/ package, so it is
# a top-level module (vllm_middleware) whenever /opt/vllm-shim is on PYTHONPATH.
COPY vllm_middleware.py /opt/vllm-shim/vllm_middleware.py
|
2026-04-12 02:19:55 +00:00
|
|
|
# Create an __init__.py at every level of the shim tree so each directory
# is a regular Python package.
RUN touch \
    /opt/vllm-shim/vllm/__init__.py \
    /opt/vllm-shim/vllm/entrypoints/__init__.py \
    /opt/vllm-shim/vllm/entrypoints/cli/__init__.py \
    /opt/vllm-shim/vllm/entrypoints/openai/__init__.py
|
|
|
|
|
|
2026-04-12 04:16:50 +00:00
|
|
|
# ---------------------------------------------------------------
# PYTHONPATH: two fixes in one
#   1. /sgl-workspace/aiter — use the source-built aiter instead
#      of the broken pip version in site-packages
#   2. /opt/vllm-shim       — shadow vllm for python -m invocations
#
# Any PYTHONPATH inherited from the base image is appended after the
# two entries above. The ${VAR:+...} form adds the ':' separator only
# when a value is actually inherited; a plain ":${PYTHONPATH}" would
# leave a trailing ':' when the variable is unset, and Python treats
# that empty entry as the current working directory.
# ---------------------------------------------------------------
ENV PYTHONPATH="/sgl-workspace/aiter:/opt/vllm-shim${PYTHONPATH:+:${PYTHONPATH}}"
|
2026-04-12 02:19:55 +00:00
|
|
|
|
2026-04-12 02:47:33 +00:00
|
|
|
# ---------------------------------------------------------------
# MI300X tuning
# ---------------------------------------------------------------
# Runtime environment defaults, grouped in one ENV instruction so the
# whole tuning set is read and edited in a single place.
ENV HIP_FORCE_DEV_KERNARG=1 \
    NCCL_MIN_NCHANNELS=112 \
    GPU_MAX_HW_QUEUES=2 \
    SGLANG_USE_AITER=1
|