diff --git a/vllm/lora/layers/fused_moe.py b/vllm/lora/layers/fused_moe.py index 093737f11..99242806c 100644 --- a/vllm/lora/layers/fused_moe.py +++ b/vllm/lora/layers/fused_moe.py @@ -720,7 +720,7 @@ class FusedMoE3DWithLoRA(FusedMoEWithLoRA): """ Full size """ - return self.w2_lora_a_stacked[0].shape[-2] + return self.base_layer.hidden_size @classmethod def can_replace_layer(