Fix: use hf_ptq.py arg names (--pyt_ckpt_path, --qformat, --inference_tensor_parallel)
This commit is contained in:
@@ -212,12 +212,12 @@ def run_calibration(model_path, export_dir, calib_save_path, amax_snapshot_path,
|
||||
 saved_argv = sys.argv
 sys.argv = [
 "hf_ptq.py",
-"--model", model_path,
-"--quant", QUANT,
+"--pyt_ckpt_path", model_path,
+"--qformat", QUANT,
 "--calib_size", str(calib_size),
 "--calib_seq", str(calib_seq),
 "--kv_cache_qformat", KV_CACHE_QUANT,
-"--tp", str(TP),
+"--inference_tensor_parallel", str(TP),
 "--export_path", export_dir,
 "--trust_remote_code",
 "--use_seq_device_map",
|
||||
|
||||
Reference in New Issue
Block a user