[V0 Deprecation] Enable the remaining multimodal tests in V1 (#25307)

Signed-off-by: DarkLight1337 <tlleungac@connect.ust.hk>
2025-09-21 01:50:58 +08:00
parent d88918e4c2
commit bef180f009
8 changed files with 195 additions and 214 deletions
--- a/tests/models/multimodal/generation/test_qwen2_vl.py
+++ b/tests/models/multimodal/generation/test_qwen2_vl.py
@@ -10,7 +10,6 @@ from PIL import Image

 from vllm.multimodal.image import rescale_image_size
 from vllm.multimodal.video import rescale_video_size, sample_frames_from_video
-from vllm.utils import set_default_torch_num_threads

 from ....conftest import (IMAGE_ASSETS, VIDEO_ASSETS, PromptImageInput,
                          PromptVideoInput, VllmRunner)
@@ -264,8 +263,7 @@ def run_embedding_input_test(
    processor = AutoProcessor.from_pretrained(model)

    # max_model_len should be greater than image_feature_size
-    with set_default_torch_num_threads(1):
-        vllm_model = vllm_runner(
+    with vllm_runner(
            model,
            runner="generate",
            max_model_len=4000,
@@ -277,9 +275,8 @@ def run_embedding_input_test(
            },
            tensor_parallel_size=tensor_parallel_size,
            distributed_executor_backend=distributed_executor_backend,
-        )
-
-    with vllm_model:
+            default_torch_num_threads=1,
+    ) as vllm_model:
        outputs_per_case_for_original_input = [
            vllm_model.generate_greedy_logprobs(prompts,
                                                max_tokens,