diff --git a/Dockerfile b/Dockerfile
index 658d268..fd4a365 100644
--- a/Dockerfile
+++ b/Dockerfile
@@ -10,9 +10,12 @@ COPY utils.py /usr/local/lib/python3.12/dist-packages/vllm/tool_parsers/utils.py
 COPY vllm_patches/hf.py /usr/local/lib/python3.12/dist-packages/vllm/renderers/hf.py
 
 # Install LMCache for KV cache offloading / sharing across nodes
-# Build from source to match CUDA 13 (pip wheel is CUDA 12)
+# NO_CUDA_EXT=1 skips the CUDA extension build (not needed for the Redis backend).
+# Non-editable install: the clone is deleted at the end of this RUN, so an
+# editable (-e) install would point at a source tree that no longer exists.
+# apt package lists are removed in the same layer so they do not bloat the image.
-RUN apt-get update && apt-get install -y git && \
+RUN apt-get update && apt-get install -y --no-install-recommends ca-certificates git && \
     git clone --depth 1 https://github.com/LMCache/LMCache.git /tmp/lmcache && \
     cd /tmp/lmcache && \
-    pip install --no-cache-dir -e . && \
+    NO_CUDA_EXT=1 pip install --no-cache-dir . && \
-    rm -rf /tmp/lmcache
+    rm -rf /tmp/lmcache /var/lib/apt/lists/*