Provide default max model length (#1224)

This commit is contained in:
Woosuk Kwon
2023-09-28 14:44:02 -07:00
committed by GitHub
parent 6f88f762bf
commit f936657eb6
4 changed files with 14 additions and 9 deletions

View File

@@ -615,7 +615,7 @@ if __name__ == "__main__":
engine_args = AsyncEngineArgs.from_cli_args(args)
engine = AsyncLLMEngine.from_engine_args(engine_args)
engine_model_config = asyncio.run(engine.get_model_config())
-max_model_len = engine_model_config.get_max_model_len()
+max_model_len = engine_model_config.max_model_len
# A separate tokenizer to map token IDs to strings.
tokenizer = get_tokenizer(engine_args.tokenizer,