Update nvfp4_experts_only to use dequantized BF16 model
This commit is contained in:
@@ -30,7 +30,7 @@ import sys
|
||||
import os
|
||||
|
||||
# ── Config ──────────────────────────────────────────────────────────────────
|
||||
-MODEL = "/root/nvidia-meeting/DeepSeek-V4-Pro" # Mixed-precision source
|
||||
+MODEL = "/root/nvidia-meeting/DeepSeek-V4-Pro-BF16" # Dequantized BF16 (from scripts/dequant_fp8_to_bf16.py)
|
||||
QUANT = "nvfp4_experts_only"
|
||||
TP = 8
|
||||
CALIB = 256
|
||||
|
||||
Reference in New Issue
Block a user