From 707b240d7e7523c652b8a5b075ffc1ee9e1120ae Mon Sep 17 00:00:00 2001
From: Xin Yang <105740670+xyang16@users.noreply.github.com>
Date: Thu, 8 Jan 2026 21:54:05 -0800
Subject: [PATCH] [Bugfix] Fix FusedMoE LoRA w2_output_size (#31949)

Signed-off-by: Xin Yang
---
 vllm/lora/layers/fused_moe.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/vllm/lora/layers/fused_moe.py b/vllm/lora/layers/fused_moe.py
index 093737f11..99242806c 100644
--- a/vllm/lora/layers/fused_moe.py
+++ b/vllm/lora/layers/fused_moe.py
@@ -720,7 +720,7 @@ class FusedMoE3DWithLoRA(FusedMoEWithLoRA):
         """
         Full size
         """
-        return self.w2_lora_a_stacked[0].shape[-2]
+        return self.base_layer.hidden_size
 
     @classmethod
     def can_replace_layer(