diff --git a/scripts/quantize_nvfp4.py b/scripts/quantize_nvfp4.py index f45d11d..4532a73 100644 --- a/scripts/quantize_nvfp4.py +++ b/scripts/quantize_nvfp4.py @@ -212,12 +212,12 @@ def run_calibration(model_path, export_dir, calib_save_path, amax_snapshot_path, saved_argv = sys.argv sys.argv = [ "hf_ptq.py", - "--model", model_path, - "--quant", QUANT, + "--pyt_ckpt_path", model_path, + "--qformat", QUANT, "--calib_size", str(calib_size), "--calib_seq", str(calib_seq), "--kv_cache_qformat", KV_CACHE_QUANT, - "--tp", str(TP), + "--inference_tensor_parallel", str(TP), "--export_path", export_dir, "--trust_remote_code", "--use_seq_device_map",