diff --git a/tests/evals/gsm8k/test_gsm8k_correctness.py b/tests/evals/gsm8k/test_gsm8k_correctness.py index 6b2cb02e9..c8028c0b8 100644 --- a/tests/evals/gsm8k/test_gsm8k_correctness.py +++ b/tests/evals/gsm8k/test_gsm8k_correctness.py @@ -11,9 +11,11 @@ pytest -s -v tests/evals/gsm8k/test_gsm8k_correctness.py \ import shlex +import pytest import yaml from tests.utils import RemoteOpenAIServer +from vllm.platforms import current_platform from .gsm8k_eval import evaluate_gsm8k @@ -53,6 +55,15 @@ def test_gsm8k_correctness(config_filename): """Test GSM8K correctness for a given model configuration.""" eval_config = yaml.safe_load(config_filename.read_text(encoding="utf-8")) + if ( + not current_platform.is_cuda() + and "Qwen3-30B-A3B-MXFP4A16" in eval_config["model_name"] + ): + pytest.skip( + "Skipping Qwen3-30B-A3B-MXFP4A16 on non-CUDA platforms. " + "Marlin kernels are not supported." + ) + # Parse server arguments from config (use shlex to handle quoted strings) server_args_str = eval_config.get("server_args", "") server_args = shlex.split(server_args_str) if server_args_str else []