# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project

# Configuration for one model: the model identifier, a score threshold,
# and the server flags / environment used to run it.

# Identifier of the model this configuration applies to.
model_name: amd/gpt-oss-20b-w-mxfp4-a-bf16

# NOTE(review): presumably the minimum score a run must reach to pass; the
# metric itself is not named in this file - confirm against the consumer.
metric_threshold: 0.568

# Reasoning-effort setting used for this model.
reasoning_effort: low

# Extra command-line flags, kept as a single string.
# NOTE(review): presumably appended to the server launch command - confirm.
server_args: "--attention-backend ROCM_AITER_UNIFIED_ATTN --moe-backend aiter"

# Environment variables for the run. Values are quoted so they stay strings
# rather than being typed as integers/booleans by the YAML parser.
env:
  VLLM_ROCM_USE_AITER: "1"