# .buildkite/test_areas/engine.yaml

# Test-area definition for the "Engine" group.
group: Engine
# Group-level dependency (presumably every step below waits for this job --
# confirm against the pipeline generator).
depends_on:
  - image-build
steps:
# Engine step: a single pytest invocation over the `engine` directory and the
# test_sequence / test_config / test_logger / test_vllm_port modules.
# NOTE(review): command paths are relative; presumably the working directory
# is tests/ -- confirm against the pipeline generator.
- label: Engine
  timeout_in_minutes: 15
  # Paths associated with this step (presumably used to decide when the step
  # is triggered -- confirm against the pipeline generator).
  source_file_dependencies:
    - vllm/
    - tests/engine
    - tests/test_sequence
    - tests/test_config
    - tests/test_logger
    - tests/test_vllm_port
  commands:
    - pytest -v -s engine test_sequence.py test_config.py test_logger.py test_vllm_port.py

# Single-GPU V1 step covering the v1/e2e and v1/engine test directories.
- label: V1 e2e + engine (1 GPU)
  timeout_in_minutes: 45
  source_file_dependencies:
    - vllm/
    - tests/v1
  commands:
    # TODO: accuracy does not match on H100, whether or not
    # VLLM_USE_FLASHINFER_SAMPLER is set.
    - pytest -v -s v1/e2e
    # Run this test standalone for now; the (implicit) use of spawn/fork
    # across the tests still needs to be untangled.
    - pytest -v -s v1/engine/test_preprocess_error_handling.py
    # Run the remaining v1/engine tests.
    - pytest -v -s v1/engine --ignore v1/engine/test_preprocess_error_handling.py
  # AMD mirror of this step. Its command list runs v1/engine in a single
  # pytest invocation, without the standalone split used above.
  mirror:
    amd:
      device: mi325_1
      depends_on:
        - image-build-amd
      commands:
        - pytest -v -s v1/e2e
        - pytest -v -s v1/engine

# Optional 2-device step: runs only the tests in v1/e2e/test_spec_decode.py
# selected by the "tensor_parallelism" -k expression.
- label: V1 e2e (2 GPUs)
  # TODO: Fix timeout after we have more confidence in the test stability
  timeout_in_minutes: 60
  optional: true
  num_devices: 2
  source_file_dependencies:
    - vllm/
    - tests/v1/e2e
  commands:
    # Only run tests that need exactly 2 GPUs
    - pytest -v -s v1/e2e/test_spec_decode.py -k "tensor_parallelism"
  # AMD mirror; no commands are listed here (presumably the step's own
  # commands are reused -- confirm against the pipeline generator).
  mirror:
    amd:
      device: mi325_2
      depends_on:
        - image-build-amd

# Optional 4-device step: runs only the tests in v1/e2e/test_spec_decode.py
# selected by the "eagle_correctness_heavy" -k expression.
- label: V1 e2e (4 GPUs)
  # TODO: Fix timeout after we have more confidence in the test stability
  timeout_in_minutes: 60
  optional: true
  num_devices: 4
  source_file_dependencies:
    - vllm/
    - tests/v1/e2e
  commands:
    # Only run tests that need 4 GPUs
    - pytest -v -s v1/e2e/test_spec_decode.py -k "eagle_correctness_heavy"
  # AMD mirror; no commands are listed here (presumably the step's own
  # commands are reused -- confirm against the pipeline generator).
  mirror:
    amd:
      device: mi325_4
      depends_on:
        - image-build-amd
[ci] Refactor CI file structure (#29343) 2025-12-08 18:25:43 -08:00			`group: Engine`
			`depends_on:`
			`- image-build`
			`steps:`
			`- label: Engine`
			`timeout_in_minutes: 15`
			`source_file_dependencies:`
			`- vllm/`
			`- tests/engine`
			`- tests/test_sequence`
			`- tests/test_config`
			`- tests/test_logger`
			`- tests/test_vllm_port`
			`commands:`
			`- pytest -v -s engine test_sequence.py test_config.py test_logger.py test_vllm_port.py`

[CI] Defining extended V1 e2e + engine tests (#35580) Signed-off-by: Andreas Karatzas <akaratza@amd.com> 2026-03-02 02:10:54 -06:00			`- label: V1 e2e + engine (1 GPU)`
[ci] Refactor CI file structure (#29343) 2025-12-08 18:25:43 -08:00			`timeout_in_minutes: 45`
			`source_file_dependencies:`
			`- vllm/`
			`- tests/v1`
			`commands:`
			`# TODO: accuracy does not match, whether setting`
			`# VLLM_USE_FLASHINFER_SAMPLER or not on H100.`
			`- pytest -v -s v1/e2e`
[ci] Sync test areas with test-pipeline.yaml and enable new pipeline generator (#33080) Signed-off-by: Kevin H. Luu <khluu000@gmail.com> Signed-off-by: khluu <khluu000@gmail.com> Co-authored-by: Kevin Luu <khluu@Kevins-MacBook-Pro.local> 2026-01-26 12:28:20 -08:00			`# Run this test standalone for now;`
			`# need to untangle use (implicit) use of spawn/fork across the tests.`
			`- pytest -v -s v1/engine/test_preprocess_error_handling.py`
			`# Run the rest of v1/engine tests`
			`- pytest -v -s v1/engine --ignore v1/engine/test_preprocess_error_handling.py`
[ROCm][CI] Added MI325 mirrors (#34923) Signed-off-by: Andreas Karatzas <akaratza@amd.com> 2026-02-24 15:37:15 -06:00			`mirror:`
			`amd:`
[ROCm][CI] Extending attention backend coverage for Eagle spec decode tests (#35265) Signed-off-by: Andreas Karatzas <akaratza@amd.com> 2026-02-25 16:16:18 -06:00			`device: mi325_1`
[ROCm][CI] Added MI325 mirrors (#34923) Signed-off-by: Andreas Karatzas <akaratza@amd.com> 2026-02-24 15:37:15 -06:00			`depends_on:`
			`- image-build-amd`
			`commands:`
			`- pytest -v -s v1/e2e`
			`- pytest -v -s v1/engine`
[CI] Defining extended V1 e2e + engine tests (#35580) Signed-off-by: Andreas Karatzas <akaratza@amd.com> 2026-03-02 02:10:54 -06:00
			`- label: V1 e2e (2 GPUs)`
			`timeout_in_minutes: 60 # TODO: Fix timeout after we have more confidence in the test stability`
			`optional: true`
			`num_devices: 2`
			`source_file_dependencies:`
			`- vllm/`
			`- tests/v1/e2e`
			`commands:`
			`# Only run tests that need exactly 2 GPUs`
			`- pytest -v -s v1/e2e/test_spec_decode.py -k "tensor_parallelism"`
			`mirror:`
			`amd:`
			`device: mi325_2`
			`depends_on:`
			`- image-build-amd`

			`- label: V1 e2e (4 GPUs)`
			`timeout_in_minutes: 60 # TODO: Fix timeout after we have more confidence in the test stability`
			`optional: true`
			`num_devices: 4`
			`source_file_dependencies:`
			`- vllm/`
			`- tests/v1/e2e`
			`commands:`
			`# Only run tests that need 4 GPUs`
			`- pytest -v -s v1/e2e/test_spec_decode.py -k "eagle_correctness_heavy"`
			`mirror:`
			`amd:`
			`device: mi325_4`
			`depends_on:`
			`- image-build-amd`