[bugfix] add api process rank in default multimodal request (#36150)

Signed-off-by: fake0fan <645327136@qq.com>
Signed-off-by: Chenguang ZHENG <645327136@qq.com>
2026-03-06 20:00:09 +08:00
parent e2090bf3af
commit fcb73f306c
7 changed files with 46 additions and 9 deletions
--- a/tests/entrypoints/openai/test_completion_error.py
+++ b/tests/entrypoints/openai/test_completion_error.py
@@ -58,9 +58,15 @@ class MockModelConfig:
         return self.diff_sampling_param or {}


+@dataclass
+class MockParallelConfig:
+    _api_process_rank: int = 0
+
+
 @dataclass
 class MockVllmConfig:
     model_config: MockModelConfig
+    parallel_config: MockParallelConfig


 def _build_serving_completion(engine: AsyncLLM) -> OpenAIServingCompletion:
@@ -79,7 +85,7 @@ def _build_renderer(model_config: MockModelConfig):
     _, tokenizer_name, _, kwargs = tokenizer_args_from_config(model_config)

     return HfRenderer.from_config(
-        MockVllmConfig(model_config),
+        MockVllmConfig(model_config, parallel_config=MockParallelConfig()),
         tokenizer_kwargs={**kwargs, "tokenizer_name": tokenizer_name},
     )