From 43877a620bf629d3625c870ef787e590101e0518 Mon Sep 17 00:00:00 2001 From: Woosuk Kwon Date: Sun, 22 Mar 2026 16:30:25 -0700 Subject: [PATCH] [MRV2] Enable PP CUDA graph test (#37830) Signed-off-by: Woosuk Kwon --- .buildkite/test_areas/model_runner_v2.yaml | 5 ++--- 1 file changed, 2 insertions(+), 3 deletions(-) diff --git a/.buildkite/test_areas/model_runner_v2.yaml b/.buildkite/test_areas/model_runner_v2.yaml index 238d5956a..dd64a0d23 100644 --- a/.buildkite/test_areas/model_runner_v2.yaml +++ b/.buildkite/test_areas/model_runner_v2.yaml @@ -87,13 +87,12 @@ steps: - vllm/v1/worker/gpu/ - vllm/v1/worker/gpu_worker.py - tests/distributed/test_pipeline_parallel.py - #- tests/distributed/test_pp_cudagraph.py + - tests/distributed/test_pp_cudagraph.py commands: - set -x - export VLLM_USE_V2_MODEL_RUNNER=1 - pytest -v -s distributed/test_pipeline_parallel.py -k "not ray and not Jamba" - # TODO: Uncomment once https://github.com/vllm-project/vllm/pull/35162 is merged. - #- pytest -v -s distributed/test_pp_cudagraph.py -k "not ray" + - pytest -v -s distributed/test_pp_cudagraph.py -k "not ray" - label: Model Runner V2 Spec Decode timeout_in_minutes: 30