[VLM] Add MLA with pure RoPE support for deepseek-vl2 models (#12729)
This commit is contained in:
@@ -414,7 +414,8 @@ class DeepseekV2MLAAttention(nn.Module):
|
||||
quant_config=quant_config,
|
||||
prefix=f"{prefix}.o_proj")
|
||||
|
||||
rope_scaling["rope_type"] = 'deepseek_yarn'
|
||||
if rope_scaling:
|
||||
rope_scaling["rope_type"] = 'deepseek_yarn'
|
||||
self.rotary_emb = get_rope(qk_rope_head_dim,
|
||||
rotary_dim=qk_rope_head_dim,
|
||||
max_position=max_position_embeddings,
|
||||
|
||||
Reference in New Issue
Block a user