diff --git a/tests/models/language/generation/conftest.py b/tests/models/language/generation/conftest.py index f423b656b..aeb13bde4 100644 --- a/tests/models/language/generation/conftest.py +++ b/tests/models/language/generation/conftest.py @@ -2,6 +2,7 @@ # SPDX-FileCopyrightText: Copyright contributors to the vLLM project """Pytest configuration for vLLM language generation tests.""" +import os import warnings import torch @@ -9,6 +10,23 @@ import torch from vllm.platforms import current_platform +def pytest_configure(config): + """Early ROCm configuration that must happen before test collection.""" + if not current_platform.is_rocm(): + return + + # Disable skinny GEMM on ROCm to avoid non-deterministic results + # from atomic reductions in wvSplitKrc kernel. + # See: https://github.com/vllm-project/vllm/pull/33493#issuecomment-3906083975 + os.environ["VLLM_ROCM_USE_SKINNY_GEMM"] = "0" + warnings.warn( + "ROCm: Set VLLM_ROCM_USE_SKINNY_GEMM=0 to avoid non-deterministic " + "results from skinny GEMM atomic reductions", + UserWarning, + stacklevel=1, + ) + + def pytest_sessionstart(session): """Configure ROCm-specific settings before test session starts.""" if not current_platform.is_rocm():