[LoRA] Change lora_tokenizers capacity (#10796)

Signed-off-by: Xin Yang <xyang19@gmail.com>
This commit is contained in:
Xin Yang
2024-12-04 09:40:16 -08:00
committed by GitHub
parent c92acb9693
commit 01d079fd8e
7 changed files with 31 additions and 10 deletions

View File

@@ -51,7 +51,7 @@ class AsyncLLM(EngineClient):
model_config=vllm_config.model_config,
scheduler_config=vllm_config.scheduler_config,
parallel_config=vllm_config.parallel_config,
enable_lora=bool(vllm_config.lora_config))
lora_config=vllm_config.lora_config)
self.tokenizer.ping()
# Request streams (map of request_id -> AsyncStream).