[MRV2] Enable PP CUDA graph test (#37830)

Signed-off-by: Woosuk Kwon <woosuk@inferact.ai>
This commit is contained in:
Woosuk Kwon
2026-03-22 16:30:25 -07:00
committed by GitHub
parent 63f49b8bd4
commit 43877a620b

View File

@@ -87,13 +87,12 @@ steps:
 - vllm/v1/worker/gpu/
 - vllm/v1/worker/gpu_worker.py
 - tests/distributed/test_pipeline_parallel.py
-#- tests/distributed/test_pp_cudagraph.py
+- tests/distributed/test_pp_cudagraph.py
 commands:
 - set -x
 - export VLLM_USE_V2_MODEL_RUNNER=1
 - pytest -v -s distributed/test_pipeline_parallel.py -k "not ray and not Jamba"
-# TODO: Uncomment once https://github.com/vllm-project/vllm/pull/35162 is merged.
-#- pytest -v -s distributed/test_pp_cudagraph.py -k "not ray"
+- pytest -v -s distributed/test_pp_cudagraph.py -k "not ray"
 - label: Model Runner V2 Spec Decode
 timeout_in_minutes: 30