[DisaggEverything] Tokens in<>out /generate endpoint (#24261)

Signed-off-by: NickLucche <nlucches@redhat.com>
Signed-off-by: Harry Mellor <19981378+hmellor@users.noreply.github.com>
Co-authored-by: Harry Mellor <19981378+hmellor@users.noreply.github.com>
This commit is contained in:
Nicolò Lucchesi
2025-11-14 17:58:01 +01:00
committed by GitHub
parent d54a18a47e
commit 6f1e7f7226
12 changed files with 822 additions and 9 deletions

View File

@@ -15,6 +15,7 @@ from pydantic.dataclasses import dataclass
from vllm.logger import init_logger
from vllm.logits_process import LogitsProcessor
from vllm.transformers_utils.tokenizer import AnyTokenizer
from vllm.v1.serial_utils import PydanticMsgspecMixin
logger = init_logger(__name__)
@@ -122,6 +123,7 @@ class RequestOutputKind(Enum):
class SamplingParams(
PydanticMsgspecMixin,
msgspec.Struct,
omit_defaults=True, # type: ignore[call-arg]
# required for @cached_property.