Signed-off-by: khluu <khluu000@gmail.com>
This commit is contained in:
Vadim Gimpelson
2026-03-26 12:21:47 +04:00
committed by khluu
parent ccbc5ac449
commit 05d96d7991
10 changed files with 73 additions and 10 deletions

View File

@@ -1,5 +1,6 @@
model_name: "Qwen/Qwen3.5-35B-A3B"
-accuracy_threshold: 0.86
+accuracy_threshold: 0.84
+tolerance: 0.03
num_questions: 1319
num_fewshot: 5
server_args: >-

View File

@@ -1,5 +1,6 @@
model_name: "Qwen/Qwen3.5-35B-A3B-FP8"
-accuracy_threshold: 0.86
+accuracy_threshold: 0.79
+tolerance: 0.03
num_questions: 1319
num_fewshot: 5
server_args: >-

View File

@@ -0,0 +1,9 @@
model_name: "nvidia/Qwen3.5-397B-A17B-NVFP4"
accuracy_threshold: 0.88
tolerance: 0.03
num_questions: 1319
num_fewshot: 5
server_args: >-
  --max-model-len 4096
  --data-parallel-size 2
  --enable-expert-parallel

View File

@@ -1,2 +1,3 @@
Qwen3.5-35B-A3B-DEP2.yaml
Qwen3.5-35B-A3B-FP8-DEP2.yaml
Qwen3.5-397B-A17B-NVFP4-DEP2.yaml