From ec7d9e67459dd8ca6e2e3e77a40993291cab152c Mon Sep 17 00:00:00 2001
From: danisereb
Date: Mon, 16 Feb 2026 17:33:09 +0200
Subject: [PATCH] Fix call to moe_mk in modelopt MoE modules (required for LoRA) (#34575)

Signed-off-by: Daniel Serebrenik
---
 .../layers/quantization/modelopt.py | 20 +++++++++----------
 1 file changed, 10 insertions(+), 10 deletions(-)

diff --git a/vllm/model_executor/layers/quantization/modelopt.py b/vllm/model_executor/layers/quantization/modelopt.py
index 9af815ee9..1991c6935 100644
--- a/vllm/model_executor/layers/quantization/modelopt.py
+++ b/vllm/model_executor/layers/quantization/modelopt.py
@@ -977,11 +977,11 @@ class ModelOptFp8MoEMethod(FusedMoEMethodBase):
 
         assert self.moe_mk is not None
         return self.moe_mk(
-            x,
-            layer.w13_weight,
-            layer.w2_weight,
-            topk_weights,
-            topk_ids,
+            hidden_states=x,
+            w1=layer.w13_weight,
+            w2=layer.w2_weight,
+            topk_weights=topk_weights,
+            topk_ids=topk_ids,
             activation=layer.activation,
             global_num_experts=layer.global_num_experts,
             expert_map=layer.expert_map,
@@ -1549,11 +1549,11 @@ class ModelOptNvFp4FusedMoE(FusedMoEMethodBase):
         else:
             assert self.moe_mk is not None
             return self.moe_mk(
-                x,
-                layer.w13_weight,
-                layer.w2_weight,
-                topk_weights,
-                topk_ids,
+                hidden_states=x,
+                w1=layer.w13_weight,
+                w2=layer.w2_weight,
+                topk_weights=topk_weights,
+                topk_ids=topk_ids,
                 activation=layer.activation,
                 global_num_experts=layer.global_num_experts,
                 expert_map=layer.expert_map,