[Models] Lfm2Moe: minor name changes for resolving lora conflicts (#29063)
Signed-off-by: Paul Pak <paulpak58@gmail.com>
@@ -248,7 +248,7 @@ class Lfm2ShortConvDecoderLayer(nn.Module):
     ) -> None:
         super().__init__()
         self.layer_idx = layer_idx
-        self.conv = ShortConv(
+        self.short_conv = ShortConv(
             config=config,
             dim=config.conv_dim,
             layer_idx=layer_idx,
@@ -281,7 +281,7 @@ class Lfm2ShortConvDecoderLayer(nn.Module):
         else:
             hidden_states, residual = self.operator_norm(hidden_states, residual)
         output = torch.empty_like(hidden_states)
-        self.conv(
+        self.short_conv(
             hidden_states,
             output,
         )
@@ -380,6 +380,9 @@ class Lfm2Model(nn.Module):
         params_dict = dict(self.named_parameters())
         loaded_params: set[str] = set()
         for name, loaded_weight in weights:
+            if ".conv." in name:
+                name = name.replace(".conv.", ".short_conv.", 1)
+
             for param_name, weight_name, shard_id in stacked_params_mapping:
                 if weight_name not in name:
                     continue
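The hunk above keeps the weight-loading loop in Lfm2Model compatible with checkpoints that still name the module ".conv.": incoming keys are rewritten to the renamed ".short_conv." attribute before parameter lookup. A minimal standalone sketch of that remapping; the helper name remap_legacy_keys and the sample key are hypothetical, not part of this diff:

from collections.abc import Iterable

import torch


def remap_legacy_keys(
    weights: Iterable[tuple[str, torch.Tensor]],
) -> Iterable[tuple[str, torch.Tensor]]:
    for name, tensor in weights:
        if ".conv." in name:
            # Replace only the first occurrence, mirroring the hunk above.
            name = name.replace(".conv.", ".short_conv.", 1)
        yield name, tensor


# Hypothetical checkpoint key using the pre-rename attribute name:
legacy = [("model.layers.0.conv.in_proj.weight", torch.zeros(2))]
remapped = dict(remap_legacy_keys(legacy))
assert "model.layers.0.short_conv.in_proj.weight" in remapped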
@@ -414,6 +417,7 @@ class Lfm2ForCausalLM(
             "w1",
             "w3",
         ],
         "in_proj": ["in_proj"],
     }
 
+    # LoRA specific attributes
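The mapping shown in this hunk follows vLLM's packed-modules convention: several source projections (here w1 and w3) are fused into a single matrix in the vLLM module, and the mapping tells the loader and the LoRA machinery how adapter or checkpoint weights saved under the unfused names map onto slices of the fused weight. A rough standalone sketch of that idea, with hypothetical names and shapes rather than vLLM's implementation:

import torch

# Fused gate/up projection: rows 0..inter hold "w1", rows inter..2*inter "w3".
hidden, inter = 4, 6
fused = torch.zeros(2 * inter, hidden)

packed_modules_mapping = {"gate_up_proj": ["w1", "w3"]}

# Copy per-source checkpoint shards into their slice of the fused weight.
shards = {"w1": torch.randn(inter, hidden), "w3": torch.randn(inter, hidden)}
for i, src in enumerate(packed_modules_mapping["gate_up_proj"]):
    fused[i * inter : (i + 1) * inter].copy_(shards[src])

assert torch.equal(fused[:inter], shards["w1"])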