diff --git a/vllm/patches/deepseek_v4.py b/vllm/patches/deepseek_v4.py index 3551dc0c..b71d93be 100644 --- a/vllm/patches/deepseek_v4.py +++ b/vllm/patches/deepseek_v4.py @@ -1412,8 +1412,10 @@ class DeepseekV4Model(nn.Module): ) if success: name = name_mapped + loaded_params.add(name_mapped) break - loaded_params.add(name_mapped) + else: + continue continue elif "attn_sink" in name: narrow_weight = loaded_weight[head_rank_start:head_rank_end]