Fix: skip .cuda() when low_memory_mode is enabled; switch default to nvfp4
This commit is contained in:
@@ -110,7 +110,7 @@ def main():
|
||||
|
||||
model = AutoModelForCausalLM.from_pretrained(args.model, **model_kwargs)
|
||||
|
||||
- if not args.use_seq_device_map:
|
||||
+ if not args.use_seq_device_map and not args.low_memory_mode:
|
||||
model = model.cuda()
|
||||
|
||||
# Build calibration dataloader
|
||||
|
||||
Reference in New Issue
Block a user