[Frontend] Add logits_processors as an extra completion argument (#11150)

Signed-off-by: Brad Hilton <brad.hilton.nw@gmail.com>
This commit is contained in:
Brad Hilton
2024-12-14 09:46:42 -07:00
committed by GitHub
parent 3cb5769883
commit 9c3dadd1c9
6 changed files with 127 additions and 39 deletions

View File

@@ -197,7 +197,8 @@ class OpenAIServingChat(OpenAIServing):
default_max_tokens)
else:
sampling_params = request.to_sampling_params(
-default_max_tokens)
+default_max_tokens,
+self.model_config.logits_processor_pattern)
self._log_inputs(request_id,
request_prompts[i],