[Core] Update dtype detection and defaults (#14858)

Signed-off-by: DarkLight1337 <tlleungac@connect.ust.hk>
2025-03-19 13:49:33 +08:00
parent 8b3e94a357
commit f690372b68
22 changed files with 175 additions and 227 deletions
--- a/tests/models/encoder_decoder/vision_language/test_mllama.py
+++ b/tests/models/encoder_decoder/vision_language/test_mllama.py
@@ -4,8 +4,7 @@ from typing import Optional, overload

 import pytest
 import torch
-from transformers import (AutoConfig, AutoModelForImageTextToText,
-                          AutoTokenizer, BatchEncoding)
+from transformers import AutoConfig, AutoModelForImageTextToText, AutoTokenizer

 from vllm import LLM, SamplingParams
 from vllm.attention.backends.flash_attn import FlashAttentionMetadata
@@ -227,13 +226,9 @@ def _run_test(
            for prompts, images in inputs
        ]

-    def process(hf_inputs: BatchEncoding, **kwargs):
-        return hf_inputs
-
    with hf_runner(model,
                   dtype=dtype,
                   model_kwargs={"device_map": "auto"},
-                   postprocess_inputs=process,
                   auto_cls=AutoModelForImageTextToText) as hf_model:
        hf_outputs_per_image = [
            hf_model.generate_greedy_logprobs_limit(prompts,