[Core] Remove prompt string from engine core data structures (#17214)

Signed-off-by: Nick Hill <nhill@redhat.com>
This commit is contained in:
Nick Hill
2025-04-25 23:41:05 -07:00
committed by GitHub
parent 513f074766
commit df6f3ce883
21 changed files with 40 additions and 76 deletions

View File

@@ -202,7 +202,7 @@ class Processor:
trace_headers: Optional[Mapping[str, str]] = None,
prompt_adapter_request: Optional[PromptAdapterRequest] = None,
priority: int = 0,
) -> EngineCoreRequest:
) -> tuple[Optional[str], EngineCoreRequest]:
# TODO(woosuk): Support pooling models.
# TODO(woosuk): Support encoder-decoder models.
@@ -306,9 +306,8 @@ class Processor:
else:
sorted_mm_inputs = orig_sorted_mm_inputs
return EngineCoreRequest(
return decoder_inputs.get("prompt"), EngineCoreRequest(
request_id=request_id,
prompt=decoder_inputs.get("prompt"),
prompt_token_ids=decoder_inputs["prompt_token_ids"],
mm_inputs=sorted_mm_inputs,
mm_hashes=sorted_mm_hashes,