Fix NVFP4 mapper: strip `model.` prefix from checkpoint keys

The NVFP4 checkpoint names its weights `model.layers.*`, but vLLM's AutoWeightsLoader expects `layers.*` (names relative to the model module). Strip the `model.` prefix from the checkpoint keys instead of adding it.
2026-05-18 22:46:04 +00:00
parent 5d37674fb1
commit 1528d4e182
1 changed files with 2 additions and 3 deletions
--- a/vllm/patches/deepseek_v4.py
+++ b/vllm/patches/deepseek_v4.py
@@ -1667,9 +1667,8 @@ def _make_deepseek_v4_nvfp4_weights_mapper() -> WeightsMapper:

    return WeightsMapper(
        orig_to_new_prefix={
-            "layers.": "model.layers.",
-            "embed.": "model.embed.",
-            "norm.": "model.norm.",
+            # Strip model. prefix (checkpoint has it, model params don't)
+            "model.": "",
        },
        orig_to_new_regex=expert_rename_regex,
        orig_to_new_suffix=suffix_renames,