[Core] Support min_tokens with speculative decoding (#32642)
Signed-off-by: qianlihuang <yiliu.dong@qq.com>
Co-authored-by: qianlihuang <yiliu.dong@qq.com>
This commit is contained in:
@@ -32,8 +32,7 @@ example_prompts = [first_prompt, "In one word, the capital of France is "] + [
|
||||
default_params = dict(
|
||||
temperature=0.0, # greedy
|
||||
max_tokens=30,
|
||||
# spec decoding currently doesn't support min_tokens
|
||||
# min_tokens=28,
|
||||
min_tokens=28,
|
||||
)
|
||||
|
||||
|
||||
|
||||
Reference in New Issue
Block a user