[Frontend] New allowed_token_ids decoding request parameter (#6753)
This commit is contained in:
@@ -95,7 +95,7 @@ class OpenAIServingCompletion(OpenAIServing):
|
||||
|
||||
tokenizer = await self.engine.get_tokenizer(lora_request)
|
||||
|
||||
- sampling_params = request.to_sampling_params()
|
||||
+ sampling_params = request.to_sampling_params(tokenizer)
|
||||
decoding_config = await self.engine.get_decoding_config()
|
||||
guided_decoding_backend = request.guided_decoding_backend \
|
||||
or decoding_config.guided_decoding_backend
|
||||
|
||||
Reference in New Issue
Block a user