[V0 Deprecation] Remove VLLM_USE_V1 from tests (#26341)

Signed-off-by: DarkLight1337 <tlleungac@connect.ust.hk>
2025-10-07 23:42:31 +08:00
parent c0a7b89d8e
commit 1e4ecca1d0
51 changed files with 817 additions and 1275 deletions
--- a/tests/compile/test_fusion_attn.py
+++ b/tests/compile/test_fusion_attn.py
@@ -303,7 +303,6 @@ def test_attention_quant_pattern(
    model_class: type[AttentionQuantPatternModel],
    backend: _Backend,
    use_inductor_graph_partition: bool,
-    monkeypatch,
    dist_init,
    caplog_vllm,
 ):
@@ -312,8 +311,6 @@ def test_attention_quant_pattern(
    if use_inductor_graph_partition and not is_torch_equal_or_newer("2.9.0.dev"):
        pytest.skip("inductor graph partition is only available in PyTorch 2.9+")

-    monkeypatch.setenv("VLLM_USE_V1", "1")
-
    device = torch.device("cuda:0")
    torch.manual_seed(42)