From 9a3bb43f205da80b27b308aa61209bb02414dc9e Mon Sep 17 00:00:00 2001 From: biondizzle Date: Mon, 1 Jun 2026 17:27:01 +0000 Subject: [PATCH] Set default max-tokens=512 for reasoning model --- single_shot_inference.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/single_shot_inference.py b/single_shot_inference.py index d33f4160..c29a4315 100644 --- a/single_shot_inference.py +++ b/single_shot_inference.py @@ -18,7 +18,7 @@ log = logging.getLogger("single_shot") def parse_args(): p = argparse.ArgumentParser() - p.add_argument('--max-tokens', type=int, default=128) + p.add_argument('--max-tokens', type=int, default=512) p.add_argument('--temperature', type=float, default=0.0, help='Sampling temperature (0=greedy)') p.add_argument('--repetition-penalty', type=float, default=1.2, help='Repetition penalty factor') p.add_argument('--prompt', type=str, default=None)