diff --git a/scripts/model_opt_nvfp4_experts_only.py b/scripts/model_opt_nvfp4_experts_only.py index 70d080a..4558251 100644 --- a/scripts/model_opt_nvfp4_experts_only.py +++ b/scripts/model_opt_nvfp4_experts_only.py @@ -30,7 +30,7 @@ import sys import os # ── Config ────────────────────────────────────────────────────────────────── -MODEL = "/root/nvidia-meeting/DeepSeek-V4-Pro" # Mixed-precision source +MODEL = "/root/nvidia-meeting/DeepSeek-V4-Pro-BF16" # Dequantized BF16 (from scripts/dequant_fp8_to_bf16.py) QUANT = "nvfp4_experts_only" TP = 8 CALIB = 256