[Frontend] Perform offline path replacement to tokenizer (#29706)

Signed-off-by: Tsukasa OI <floss_llm@irq.a4lg.com>
This commit is contained in:
Tsukasa OI
2025-11-29 11:32:08 +09:00
committed by GitHub
parent b2c50eda50
commit 762a4a6ca9
2 changed files with 27 additions and 6 deletions

View File

@@ -23,6 +23,16 @@ MODEL_CONFIGS = [
"max_num_seqs": 64,
"tensor_parallel_size": 1,
},
{
"model": "Qwen/Qwen3-0.6B",
"enforce_eager": True,
"gpu_memory_utilization": 0.50,
"max_model_len": 64,
"max_num_batched_tokens": 64,
"max_num_seqs": 64,
"tensor_parallel_size": 1,
"tokenizer": "Qwen/Qwen3-4B",
},
{
"model": "mistralai/Mistral-7B-Instruct-v0.1",
"enforce_eager": True,