[V1][Core][1/n] Logging and Metrics (#11962)

Signed-off-by: rshaw@neuralmagic.com <rshaw@neuralmagic.com>
This commit is contained in:
Robert Shaw
2025-01-12 16:02:02 -05:00
committed by GitHub
parent 263a870ee1
commit 9597a095f2
11 changed files with 129 additions and 84 deletions

View File

@@ -74,7 +74,6 @@ class LLMEngine:
asyncio_mode=False,
vllm_config=vllm_config,
executor_class=executor_class,
log_stats=False,
)
@classmethod
@@ -147,11 +146,11 @@ class LLMEngine:
def step(self) -> List[RequestOutput]:
# 1) Get EngineCoreOutput from the EngineCore.
engine_core_outputs = self.engine_core.get_output()
outputs = self.engine_core.get_output()
# 2) Detokenize the EngineCoreOutput.
request_outputs, requests_to_abort = self.detokenizer.step(
engine_core_outputs)
outputs.outputs)
# 3) Abort requests that finished due to stopping criteria.
if requests_to_abort: