2025-09-10 21:16:39 +08:00
|
|
|
# SPDX-License-Identifier: Apache-2.0
|
|
|
|
|
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
|
|
|
|
|
|
|
|
|
|
import pytest
|
|
|
|
|
|
|
|
|
|
from tests.models.utils import GenerateModelInfo
|
|
|
|
|
|
|
|
|
|
from .ppl_utils import wikitext_ppl_test
|
|
|
|
|
|
|
|
|
|
# Models exercised by the perplexity test, written as (model name, hf_ppl)
# pairs and expanded into GenerateModelInfo entries in the order listed.
# NOTE(review): hf_ppl is presumably the reference perplexity obtained from
# the Hugging Face implementation -- confirm against ppl_utils.
MODELS = [
    GenerateModelInfo(model_name, hf_ppl=reference_ppl)
    for model_name, reference_ppl in (
        # for Qwen3
        ("Qwen/Qwen3-0.6B", 23.864173889160156),
        ("Qwen/Qwen3-0.6B-FP8", 24.313045501708984),
        # for Qwen3.5
        ("Qwen/Qwen3.5-0.8B", 19.38858413696289),
    )
]
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
@pytest.mark.parametrize("model_info", MODELS)
def test_ppl(hf_runner, vllm_runner, model_info: GenerateModelInfo):
    """Run the wikitext perplexity check for one entry of ``MODELS``.

    The runner fixtures and ``model_info`` are forwarded unchanged to
    ``wikitext_ppl_test``. The only per-model customisation is that
    ``Qwen/Qwen3.5-0.8B`` is started with ``language_model_only=True``;
    every other model gets an empty set of extra vLLM kwargs.

    NOTE(review): presumably the Qwen3.5 checkpoint ships non-text
    components that this text-only test should skip -- confirm.
    """
    needs_language_model_only = model_info.name == "Qwen/Qwen3.5-0.8B"
    extra = {"language_model_only": True} if needs_language_model_only else {}

    wikitext_ppl_test(hf_runner, vllm_runner, model_info, vllm_extra_kwargs=extra)
|