[spec decode] Fix MTP inference path for MiMo-7B model (#25136)
Signed-off-by: zixi-qi <qizixi@meta.com>
Co-authored-by: Cyrus Leung <tlleungac@connect.ust.hk>
This commit is contained in:
@@ -31,7 +31,7 @@ logger = init_logger(__name__)
|
||||
|
||||
 SpeculativeMethod = Literal["ngram", "eagle", "eagle3", "medusa",
                             "mlp_speculator", "draft_model", "deepseek_mtp",
-                            "ernie_mtp", "qwen3_next_mtp"]
+                            "ernie_mtp", "qwen3_next_mtp", "mimo_mtp"]
|
||||
|
||||
|
||||
@config
|
||||
|
||||
Reference in New Issue
Block a user