[Core] Support reset_prefix_cache (#12284)

This commit is contained in:
Cody Yu
2025-01-22 10:52:27 -08:00
committed by GitHub
parent 96f6a7596f
commit 7206ce4ce1
27 changed files with 300 additions and 21 deletions

View File

@@ -194,11 +194,6 @@ class ExecutorBase(ABC):
self.collective_rpc("stop_profile")
def sleep(self, level: int = 1):
    """Forward a ``sleep`` request through ``collective_rpc``.

    Args:
        level: Sleep level, passed along unchanged as the ``level``
            keyword argument of the ``"sleep"`` RPC. Defaults to 1.

    Raises:
        ValueError: If ``self.cache_config.enable_prefix_caching`` is
            truthy; no RPC is issued in that case.
    """
    prefix_caching_on = self.cache_config.enable_prefix_caching
    if not prefix_caching_on:
        # Nothing blocks sleeping: hand the request to collective_rpc.
        self.collective_rpc("sleep", kwargs={"level": level})
        return
    # TODO: support sleep with prefix caching
    # by resetting the prefix cache state,
    # after https://github.com/vllm-project/vllm/pull/12284
    raise ValueError("Cannot sleep when prefix caching is enabled.")
def wake_up(self):