[Model] Consolidate score logic by introduce score_type (#36479)

Signed-off-by: wang.yuqi <yuqi.wang@daocloud.io>
2026-03-10 21:32:25 +08:00
parent 409c4e632d
commit a3189a08b0
14 changed files with 213 additions and 194 deletions
--- a/vllm/entrypoints/llm.py
+++ b/vllm/entrypoints/llm.py
@@ -1584,8 +1584,11 @@ class LLM:
            )

        supported_tasks = self.supported_tasks
+        score_type = self.model_config.score_type
+        is_late_interaction = score_type == "late-interaction"
+        is_cross_encoder = score_type == "cross-encoder"
+
        # Late interaction models (e.g., ColBERT) use token_embed for scoring
-        is_late_interaction = model_config.is_late_interaction
        if not is_late_interaction and all(
            t not in supported_tasks for t in ("embed", "classify")
        ):
@@ -1595,13 +1598,10 @@ class LLM:
                "`--convert embed` or `--convert classify`."
            )

-        if (
-            model_config.is_cross_encoder
-            and getattr(model_config.hf_config, "num_labels", 0) != 1
-        ):
+        if is_cross_encoder and getattr(model_config.hf_config, "num_labels", 0) != 1:
            raise ValueError("Score API is only enabled for num_labels == 1.")

-        if not model_config.is_cross_encoder and chat_template is not None:
+        if not is_cross_encoder and chat_template is not None:
            raise ValueError(
                "chat_template is only supported for cross-encoder models."
            )
@@ -1622,7 +1622,7 @@ class LLM:
        )
        encode_kwargs = tok_params.get_encode_kwargs()

-        if model_config.is_cross_encoder:
+        if is_cross_encoder:
            return self._cross_encoding_score(
                score_data_1,
                score_data_2,