# Source listing metadata (file-viewer header, not part of the config): 22 lines, 526 B, YAML
# CI test group "Attention": runs the v1/attention pytest suite once per GPU
# type listed in the steps below.
group: Attention
# NOTE(review): presumably the key of the step that must finish before this
# group runs - confirm against the pipeline definition.
depends_on:
  - image-build
steps:
  - label: V1 attention (H100)
    timeout_in_minutes: 30
    gpu: h100
    # NOTE(review): presumably the step is only triggered when files under
    # these paths change - confirm against the pipeline generator.
    source_file_dependencies:
      - vllm/v1/attention
      - tests/v1/attention
    commands:
      # NOTE(review): relative path; presumably the working directory is
      # tests/ (cf. tests/v1/attention above) - confirm.
      - pytest -v -s v1/attention

  - label: V1 attention (B200)
    timeout_in_minutes: 30
    gpu: b200
    # Same trigger paths as the H100 step.
    source_file_dependencies:
      - vllm/v1/attention
      - tests/v1/attention
    commands:
      # TODO: FI prefill is bugged and causes incorrectness, fix this
      - VLLM_DISABLE_FLASHINFER_PREFILL=1 pytest -v -s v1/attention