Kimi K2.5 MLA-based Eagle3 (#36361)
Signed-off-by: Izzy Putterman <iputterman@nvidia.com>
Signed-off-by: Jhao-Ting Chen <jhaotingc@nvidia.com>
Co-authored-by: Izzy Putterman <iputterman@nvidia.com>
This commit is contained in:
@@ -779,6 +779,10 @@ class SpeculativeConfig:
|
||||
"hunyuan_v1_dense",
|
||||
"afmoe",
|
||||
"nemotron_h",
|
||||
"deepseek_v2",
|
||||
"deepseek_v3",
|
||||
"kimi_k2",
|
||||
"kimi_k25",
|
||||
]
|
||||
if (
|
||||
self.method in ("eagle3", "extract_hidden_states")
|
||||
|
||||
Reference in New Issue
Block a user