[BUG] Reset running requests when clearing cache for pause/resume (#34382)
Signed-off-by: hao-aaron <ahao@anyscale.com>
This commit is contained in:
@@ -793,7 +793,7 @@ class AsyncLLM(EngineClient):
 
 # Clear cache
 if clear_cache:
-await self.reset_prefix_cache()
+await self.reset_prefix_cache(reset_running_requests=True)
 await self.reset_mm_cache()
 await self.reset_encoder_cache()
 
Reference in New Issue
Block a user