diff --git a/tests/evals/gpt_oss/configs/gpt-oss-20b-rocm-mxfp4-fp8.yaml b/tests/evals/gpt_oss/configs/gpt-oss-20b-rocm-mxfp4-fp8.yaml new file mode 100644 index 000000000..f7dd14784 --- /dev/null +++ b/tests/evals/gpt_oss/configs/gpt-oss-20b-rocm-mxfp4-fp8.yaml @@ -0,0 +1,8 @@ +# SPDX-License-Identifier: Apache-2.0 +# SPDX-FileCopyrightText: Copyright contributors to the vLLM project +model_name: amd/gpt-oss-20b-MoE-Quant-W-MXFP4-A-FP8-KV-FP8 +metric_threshold: 0.568 +reasoning_effort: low +server_args: "--attention-backend ROCM_AITER_UNIFIED_ATTN" +env: + VLLM_ROCM_USE_AITER: "1" \ No newline at end of file diff --git a/tests/evals/gpt_oss/configs/models-gfx950.txt b/tests/evals/gpt_oss/configs/models-gfx950.txt index 2b6ff4f4a..5085aa9f2 100644 --- a/tests/evals/gpt_oss/configs/models-gfx950.txt +++ b/tests/evals/gpt_oss/configs/models-gfx950.txt @@ -1,3 +1,4 @@ # GFX950 model configurations for GPQA evaluation # Tests different environment variable combinations -gpt-oss-20b-rocm-baseline.yaml \ No newline at end of file +gpt-oss-20b-rocm-baseline.yaml +gpt-oss-20b-rocm-mxfp4-fp8.yaml \ No newline at end of file