From d2965b432db80723e1f3e14938c8a3645a1fd979 Mon Sep 17 00:00:00 2001 From: biondizzle Date: Sun, 17 May 2026 03:35:20 +0000 Subject: [PATCH] =?UTF-8?q?fix:=20set=20=5Fl1=5Factivation=5Fglobal=5Fscal?= =?UTF-8?q?e=20(with=20underscore)=20=E2=80=94=20attribute=20name=20mismat?= =?UTF-8?q?ch?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- vllm/patches/deepseek_v4.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/vllm/patches/deepseek_v4.py b/vllm/patches/deepseek_v4.py index abf2a2ad..61625034 100644 --- a/vllm/patches/deepseek_v4.py +++ b/vllm/patches/deepseek_v4.py @@ -526,8 +526,8 @@ class DeepseekV4MegaMoEExperts(nn.Module): l2_igs = w2_igs[:, 0] else: l2_igs = w2_igs - self._cutedsl_runner.l1_activation_global_scale = l1_igs.mean().item() - self._cutedsl_runner.l2_activation_global_scale = l2_igs.mean().item() + self._cutedsl_runner._l1_activation_global_scale = l1_igs.mean().item() + self._cutedsl_runner._l2_activation_global_scale = l2_igs.mean().item() # Drop the original loader-side parameters self._w13_input_scale = self.w13_input_scale.data.clone()