[spec decode] Fix MTP inference path for MiMo-7B model (#25136)

Signed-off-by: zixi-qi <qizixi@meta.com>
Co-authored-by: Cyrus Leung <tlleungac@connect.ust.hk>
This commit is contained in:
qizixi
2025-09-18 09:12:19 -07:00
committed by GitHub
parent 1c3b1634aa
commit c4cb0af98a
3 changed files with 20 additions and 6 deletions

View File

@@ -31,7 +31,7 @@ logger = init_logger(__name__)
SpeculativeMethod = Literal["ngram", "eagle", "eagle3", "medusa",
"mlp_speculator", "draft_model", "deepseek_mtp",
-"ernie_mtp", "qwen3_next_mtp"]
+"ernie_mtp", "qwen3_next_mtp", "mimo_mtp"]
@config