2025-12-08 18:25:43 -08:00
|
|
|
# Pipeline group holding the expert-parallelism test steps.
group: Expert Parallelism

# Prerequisite declared for the whole group.
depends_on:
  - image-build

# Individual test steps follow.
steps:
|
|
|
|
|
# EPLB algorithm/utility tests: runs the two pytest modules listed under
# `commands` from the tests working directory.
- label: EPLB Algorithm
  timeout_in_minutes: 15
  working_dir: "/vllm-workspace/tests"
  # NOTE(review): presumably the paths whose changes select this step;
  # confirm against the pipeline generator.
  source_file_dependencies:
  - vllm/distributed/eplb
  - tests/distributed/test_eplb_algo.py
  - tests/distributed/test_eplb_utils.py
  # Paths below are relative to working_dir.
  commands:
  - pytest -v -s distributed/test_eplb_algo.py
  - pytest -v -s distributed/test_eplb_utils.py
|
2025-12-08 18:25:43 -08:00
|
|
|
|
2026-03-31 14:17:12 +02:00
|
|
|
# EPLB execution tests: runs the execute and spec-decode pytest modules
# listed under `commands` from the tests working directory.
- label: EPLB Execution # 17min
  timeout_in_minutes: 27
  working_dir: "/vllm-workspace/tests"
  # NOTE(review): presumably the number of accelerators requested for the
  # step; confirm against the pipeline generator.
  num_devices: 4
  # NOTE(review): presumably the paths whose changes select this step;
  # confirm against the pipeline generator.
  source_file_dependencies:
  - vllm/distributed/eplb
  - tests/distributed/test_eplb_execute.py
  # Listed because this step also runs the spec-decode module below; every
  # test module a step runs should appear here, as in the EPLB Algorithm step.
  - tests/distributed/test_eplb_spec_decode.py
  # Paths below are relative to working_dir.
  commands:
  - pytest -v -s distributed/test_eplb_execute.py
  - pytest -v -s distributed/test_eplb_spec_decode.py
|
|
|
|
|
|
|
|
|
|
# Elastic expert-parallel scaling test: runs a single pytest module from the
# tests working directory.
- label: Elastic EP Scaling Test
  timeout_in_minutes: 20
  # Device type requested for this step.
  device: h100
  working_dir: "/vllm-workspace/tests"
  # NOTE(review): presumably the number of accelerators requested for the
  # step; confirm against the pipeline generator.
  num_devices: 4
  # NOTE(review): presumably the paths whose changes select this step.
  # Verify that each directory still exists in the repository
  # (vllm/executor/ in particular could not be checked from this file).
  source_file_dependencies:
  - vllm/distributed/
  - vllm/engine/
  - vllm/executor/
  - vllm/compilation/
  - tests/distributed/
  # Path below is relative to working_dir.
  commands:
  - pytest -v -s distributed/test_elastic_ep.py
|