[V1] Allow sliding window + prefix caching (#13069)
Signed-off-by: Woosuk Kwon <woosuk.kwon@berkeley.edu>
This commit is contained in:
@@ -1146,7 +1146,7 @@ class CacheConfig:
         if not self.enable_prefix_caching:
             return
 
-        if self.sliding_window is not None:
+        if self.sliding_window is not None and not envs.VLLM_USE_V1:
             raise NotImplementedError(
                 "Prefix caching is not supported with sliding window. "
                 "Run with --disable-sliding-window to use prefix caching.")
Reference in New Issue
Block a user