29 lines
937 B
Python
29 lines
937 B
Python
# SPDX-License-Identifier: Apache-2.0
|
|
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
|
|
from typing import Literal, get_args
|
|
|
|
GenerationTask = Literal["generate", "transcription", "realtime"]
|
|
GENERATION_TASKS: tuple[GenerationTask, ...] = get_args(GenerationTask)
|
|
|
|
PoolingTask = Literal[
|
|
"embed",
|
|
"classify",
|
|
"score",
|
|
"token_embed",
|
|
"token_classify",
|
|
"plugin",
|
|
"embed&token_classify",
|
|
]
|
|
POOLING_TASKS: tuple[PoolingTask, ...] = get_args(PoolingTask)
|
|
|
|
# Score API handles score/rerank for:
|
|
# - "score" task (score_type: cross-encoder models)
|
|
# - "embed" task (score_type: bi-encoder models)
|
|
# - "token_embed" task (score_type: late interaction models)
|
|
ScoreType = Literal["bi-encoder", "cross-encoder", "late-interaction"]
|
|
|
|
FrontendTask = Literal["render"]
|
|
FRONTEND_TASKS: tuple[FrontendTask, ...] = get_args(FrontendTask)
|
|
|
|
SupportedTask = Literal[GenerationTask, PoolingTask, FrontendTask]
|