NOTE(review): hunk re-flowed to one record per line and extended with apt cleanup;
regenerate with `git diff` so the post-image hash on the index line is refreshed.
diff --git a/Dockerfile b/Dockerfile
index 658d268..fd4a365 100644
--- a/Dockerfile
+++ b/Dockerfile
@@ -10,9 +10,13 @@ COPY utils.py /usr/local/lib/python3.12/dist-packages/vllm/tool_parsers/utils.py
 COPY vllm_patches/hf.py /usr/local/lib/python3.12/dist-packages/vllm/renderers/hf.py
 
 # Install LMCache for KV cache offloading / sharing across nodes
-# Build from source to match CUDA 13 (pip wheel is CUDA 12)
-RUN apt-get update && apt-get install -y git && \
+# NO_CUDA_EXT=1 skips CUDA extension build (not needed for Redis backend)
+# Regular (non-editable) install: the checkout is removed at the end of this RUN,
+# so `-e` would leave the package pointing at a deleted directory.
+# ca-certificates is named explicitly because --no-install-recommends would
+# otherwise skip it and the HTTPS clone needs it.
+RUN apt-get update && \
+    apt-get install -y --no-install-recommends ca-certificates git && \
+    rm -rf /var/lib/apt/lists/* && \
     git clone --depth 1 https://github.com/LMCache/LMCache.git /tmp/lmcache && \
     cd /tmp/lmcache && \
-    pip install --no-cache-dir -e . && \
+    NO_CUDA_EXT=1 pip install --no-cache-dir . && \
     rm -rf /tmp/lmcache