2025-12-08 18:25:43 -08:00
|
|
|
group: E2E Integration
|
|
|
|
|
depends_on:
|
|
|
|
|
- image-build
|
|
|
|
|
steps:
|
|
|
|
|
- label: DeepSeek V2-Lite Accuracy
|
|
|
|
|
timeout_in_minutes: 60
|
2026-01-26 12:28:20 -08:00
|
|
|
device: h100
|
2025-12-08 18:25:43 -08:00
|
|
|
optional: true
|
2026-01-26 12:28:20 -08:00
|
|
|
num_devices: 4
|
2025-12-08 18:25:43 -08:00
|
|
|
working_dir: "/vllm-workspace"
|
|
|
|
|
commands:
|
|
|
|
|
- bash .buildkite/scripts/scheduled_integration_test/deepseek_v2_lite_ep_eplb.sh 0.25 200 8010
|
|
|
|
|
|
|
|
|
|
- label: Qwen3-30B-A3B-FP8-block Accuracy
|
|
|
|
|
timeout_in_minutes: 60
|
2026-01-26 12:28:20 -08:00
|
|
|
device: h100
|
2025-12-08 18:25:43 -08:00
|
|
|
optional: true
|
2026-01-26 12:28:20 -08:00
|
|
|
num_devices: 4
|
2025-12-08 18:25:43 -08:00
|
|
|
working_dir: "/vllm-workspace"
|
|
|
|
|
commands:
|
|
|
|
|
- bash .buildkite/scripts/scheduled_integration_test/qwen30b_a3b_fp8_block_ep_eplb.sh 0.8 200 8020
|
|
|
|
|
|
|
|
|
|
- label: Qwen3-30B-A3B-FP8-block Accuracy (B200)
|
|
|
|
|
timeout_in_minutes: 60
|
2026-01-26 12:28:20 -08:00
|
|
|
device: b200
|
2025-12-08 18:25:43 -08:00
|
|
|
optional: true
|
2026-01-26 12:28:20 -08:00
|
|
|
num_devices: 2
|
2025-12-08 18:25:43 -08:00
|
|
|
working_dir: "/vllm-workspace"
|
|
|
|
|
commands:
|
|
|
|
|
- bash .buildkite/scripts/scheduled_integration_test/qwen30b_a3b_fp8_block_ep_eplb.sh 0.8 200 8020 2 1
|
2026-02-25 17:20:59 -08:00
|
|
|
|
|
|
|
|
- label: DeepSeek V2-Lite Prefetch Offload Accuracy (H100)
|
|
|
|
|
timeout_in_minutes: 60
|
|
|
|
|
device: h100
|
|
|
|
|
optional: true
|
|
|
|
|
num_devices: 1
|
|
|
|
|
working_dir: "/vllm-workspace"
|
|
|
|
|
commands:
|
|
|
|
|
- bash .buildkite/scripts/scheduled_integration_test/deepseek_v2_lite_prefetch_offload.sh 0.25 200 8030
|