Fix: skip .cuda() when low_memory_mode is set; switch default to nvfp4

This commit is contained in:
2026-05-07 03:06:33 +00:00
parent b8bdd00d19
commit 116933dcf6

View File

@@ -110,7 +110,7 @@ def main():
     model = AutoModelForCausalLM.from_pretrained(args.model, **model_kwargs)
-    if not args.use_seq_device_map:
+    if not args.use_seq_device_map and not args.low_memory_mode:
         model = model.cuda()
     # Build calibration dataloader