Signed-off-by: NickLucche <nlucches@redhat.com>
This commit is contained in:
@@ -524,7 +524,7 @@ class Worker(WorkerBase):
|
||||
|
||||
@torch.inference_mode()
|
||||
def sample_tokens(
|
||||
self, grammar_output: "GrammarOutput | None"
|
||||
self, grammar_output: "GrammarOutput"
|
||||
) -> ModelRunnerOutput | AsyncModelRunnerOutput:
|
||||
return self.model_runner.sample_tokens(grammar_output)
|
||||
|
||||
|
||||
Reference in New Issue
Block a user