more fixes2

This commit is contained in:
2026-05-14 19:43:24 +00:00
parent 4749a92fca
commit c68f4e9d6e

View File

@@ -1412,8 +1412,10 @@ class DeepseekV4Model(nn.Module):
)
if success:
name = name_mapped
loaded_params.add(name_mapped)
break
loaded_params.add(name_mapped)
else:
continue
continue
elif "attn_sink" in name:
narrow_weight = loaded_weight[head_rank_start:head_rank_end]