[BUG] Reset running requests when clearing cache for pause/resume (#34382)
Signed-off-by: hao-aaron <ahao@anyscale.com>
This commit is contained in:
@@ -793,7 +793,7 @@ class AsyncLLM(EngineClient):
|
||||
|
||||
# Clear cache
|
||||
if clear_cache:
|
||||
await self.reset_prefix_cache()
|
||||
await self.reset_prefix_cache(reset_running_requests=True)
|
||||
await self.reset_mm_cache()
|
||||
await self.reset_encoder_cache()
|
||||
|
||||
|
||||
Reference in New Issue
Block a user