Kimi K2.5 MLA-based Eagle3 (#36361)

Signed-off-by: Izzy Putterman <iputterman@nvidia.com>
Signed-off-by: Jhao-Ting Chen <jhaotingc@nvidia.com>
Co-authored-by: Izzy Putterman <iputterman@nvidia.com>
This commit is contained in:
Jhao-Ting Chen
2026-03-11 08:36:11 -07:00
committed by GitHub
parent d5816c8c2f
commit 5573894737
8 changed files with 499 additions and 8 deletions

View File

@@ -551,6 +551,8 @@ _SPECULATIVE_DECODING_MODELS = {
"mistral_large_3_eagle",
"EagleMistralLarge3ForCausalLM",
),
"Eagle3DeepseekV2ForCausalLM": ("deepseek_eagle3", "Eagle3DeepseekV2ForCausalLM"),
"Eagle3DeepseekV3ForCausalLM": ("deepseek_eagle3", "Eagle3DeepseekV2ForCausalLM"),
"EagleDeepSeekMTPModel": ("deepseek_eagle", "EagleDeepseekV3ForCausalLM"),
"DeepSeekMTPModel": ("deepseek_mtp", "DeepSeekMTP"),
"ErnieMTPModel": ("ernie_mtp", "ErnieMTP"),