# Evaluation config for a single model.
# NOTE(review): field meanings below are inferred from the key names —
# confirm against the harness that loads this file.

# Model identifier; quoted so it is always read as a string.
model_name: "nvidia/Qwen3.5-397B-A17B-NVFP4"

# Presumably the expected accuracy and the allowed deviation from it —
# TODO confirm whether tolerance applies below the threshold only or both ways.
accuracy_threshold: 0.88
tolerance: 0.03

# Presumably the number of questions evaluated and the number of few-shot
# examples per prompt — verify against the loader.
num_questions: 1319
num_fewshot: 5

# Folded block scalar (`>-`): the indented lines below are joined with single
# spaces into one string with no trailing newline. Every flag must stay
# indented under the key, and comments must not be placed inside the block
# (they would become part of the value).
server_args: >-
  --max-model-len 4096
  --data-parallel-size 2
  --enable-expert-parallel
  --max-num-seqs 512