[Bugfix][SpecDecode] apply sampling parameters to target probabilities for consistency in rejection sampling. (#10198)
Signed-off-by: jeongin601 <0200angela@gmail.com> Signed-off-by: jeong_in.bae <jeong_in.bae@navercorp.com>
This commit is contained in:
@@ -90,6 +90,14 @@ def test_create_single_target_seq_group_metadata(k: int):
|
||||
)
|
||||
|
||||
assert output.request_id == input_seq_group_metadata.request_id
|
||||
assert output.sampling_params.repetition_penalty == \
|
||||
input_seq_group_metadata.sampling_params.repetition_penalty
|
||||
assert output.sampling_params.temperature == \
|
||||
input_seq_group_metadata.sampling_params.temperature
|
||||
assert output.sampling_params.top_p == \
|
||||
input_seq_group_metadata.sampling_params.top_p
|
||||
assert output.sampling_params.top_k == \
|
||||
input_seq_group_metadata.sampling_params.top_k
|
||||
assert len(output.seq_data) == 1
|
||||
assert output.seq_data[target_seq_id].get_prompt_token_ids() == tuple(
|
||||
prompt_tokens)
|
||||
|
||||
Reference in New Issue
Block a user