[Model] Support Qwen2 embeddings and use tags to select model tests (#10184)

2024-11-15 12:23:09 +08:00
parent 2885ba0e24
commit b40cf6402e
19 changed files with 252 additions and 178 deletions
--- a/tests/models/encoder_decoder/vision_language/test_mllama.py
+++ b/tests/models/encoder_decoder/vision_language/test_mllama.py
@@ -233,6 +233,7 @@ def clear_cache():


@large_gpu_test(min_gb=48)
+@pytest.mark.core_model
@pytest.mark.parametrize("model", models)
@pytest.mark.parametrize(
    "sizes",
@@ -278,6 +279,7 @@ def test_models_single_leading_image(hf_runner, vllm_runner, image_assets,


@large_gpu_test(min_gb=48)
+@pytest.mark.core_model
@pytest.mark.parametrize("model", models)
@pytest.mark.parametrize("dtype", ["bfloat16"])
@pytest.mark.parametrize("max_tokens", [128])
@@ -326,6 +328,7 @@ def test_models_multi_leading_images(hf_runner, vllm_runner, image_assets,


@large_gpu_test(min_gb=48)
+@pytest.mark.core_model
@pytest.mark.parametrize("model", models)
@pytest.mark.parametrize("dtype", ["bfloat16"])
@pytest.mark.parametrize("max_tokens", [128])