[Model] Interface to enable batch-level DP support (#23733)

Signed-off-by: DarkLight1337 <tlleungac@connect.ust.hk>
Signed-off-by: Cyrus Leung <cyrus.tl.leung@gmail.com>
Co-authored-by: gemini-code-assist[bot] <176961590+gemini-code-assist[bot]@users.noreply.github.com>
This commit is contained in:
Cyrus Leung
2025-08-27 21:41:22 +08:00
committed by GitHub
parent 16dc4052b0
commit fe8d7b6f03
8 changed files with 38 additions and 4 deletions

View File

@@ -27,8 +27,10 @@ from vllm.transformers_utils.dynamic_module import (
 from .interfaces import (has_inner_state, has_noops, is_attention_free,
 is_hybrid, supports_cross_encoding,
-supports_multimodal, supports_multimodal_raw_input,
-supports_pp, supports_transcription, supports_v0_only)
+supports_multimodal,
+supports_multimodal_encoder_tp_data,
+supports_multimodal_raw_input, supports_pp,
+supports_transcription, supports_v0_only)
 from .interfaces_base import (get_default_pooling_type, is_pooling_model,
 is_text_generation_model)
@@ -324,6 +326,7 @@ class _ModelInfo:
 supports_cross_encoding: bool
 supports_multimodal: bool
 supports_multimodal_raw_input: bool
+supports_multimodal_encoder_tp_data: bool
 supports_pp: bool
 has_inner_state: bool
 is_attention_free: bool
@@ -343,6 +346,8 @@ class _ModelInfo:
 supports_cross_encoding=supports_cross_encoding(model),
 supports_multimodal=supports_multimodal(model),
 supports_multimodal_raw_input=supports_multimodal_raw_input(model),
+supports_multimodal_encoder_tp_data=
+supports_multimodal_encoder_tp_data(model),
 supports_pp=supports_pp(model),
 has_inner_state=has_inner_state(model),
 is_attention_free=is_attention_free(model),