[Misc] Separate out utils.counter and move utils.Device to engine (#27588)

Signed-off-by: DarkLight1337 <tlleungac@connect.ust.hk>
This commit is contained in:
Cyrus Leung
2025-10-28 20:20:46 +08:00
committed by GitHub
parent 44b5ce956d
commit f58d9b6404
8 changed files with 59 additions and 54 deletions

View File

@@ -31,6 +31,7 @@ from vllm.config.model import (
TokenizerMode,
)
from vllm.engine.arg_utils import EngineArgs
from vllm.engine.protocol import Device
from vllm.entrypoints.chat_utils import (
ChatCompletionMessageParam,
ChatTemplateContentFormatOption,
@@ -75,8 +76,8 @@ from vllm.transformers_utils.tokenizer import (
get_cached_tokenizer,
)
from vllm.usage.usage_lib import UsageContext
from vllm.utils import Counter, Device
from vllm.utils.collection_utils import as_iter, is_list_of
from vllm.utils.counter import Counter
from vllm.v1.engine import EngineCoreRequest
from vllm.v1.engine.llm_engine import LLMEngine
from vllm.v1.sample.logits_processor import LogitsProcessor
@@ -1490,8 +1491,8 @@ class LLM:
def stop_profile(self) -> None:
self.llm_engine.stop_profile()
def reset_prefix_cache(self, device: Device | None = None) -> bool:
return self.llm_engine.reset_prefix_cache(device)
def reset_prefix_cache(self, device: Device | None = None) -> None:
self.llm_engine.reset_prefix_cache(device)
def sleep(self, level: int = 1):
"""