Export NaNs in logits to scheduler_stats if output is corrupted (#18777)

Signed-off-by: Vlad Mihailescu <vtmihailescu@gmail.com>
This commit is contained in:
Vlad Tiberiu Mihailescu
2025-06-20 07:47:16 -07:00
committed by GitHub
parent 7e8977fcd4
commit 2e3e3c86dc
7 changed files with 104 additions and 2 deletions

View File

@@ -97,6 +97,10 @@ class Request:
# The number of tokens with prefix cache hits.
self.num_cached_tokens = -1
# The number of NaNs in logits. A value greater than 0
# indicates that the output is corrupted.
self.num_nans_in_logits = 0
@classmethod
def from_engine_core_request(cls, request: EngineCoreRequest) -> "Request":
if request.mm_inputs is not None:
@@ -132,6 +136,10 @@ class Request:
self._output_token_ids.extend(token_ids)
self._all_token_ids.extend(token_ids)
@property
def is_output_corrupted(self) -> bool:
    """Report whether any NaNs have been counted in this request's logits.

    Returns:
        True when ``num_nans_in_logits`` is greater than zero, False
        otherwise.
    """
    nan_count = self.num_nans_in_logits
    return nan_count > 0
@property
def num_tokens(self) -> int:
    """Return how many entries ``_all_token_ids`` currently holds."""
    all_ids = self._all_token_ids
    return len(all_ids)