From ec7d9e67459dd8ca6e2e3e77a40993291cab152c Mon Sep 17 00:00:00 2001
From: danisereb <daserebrenik@nvidia.com>
Date: Mon, 16 Feb 2026 17:33:09 +0200
Subject: [PATCH] Fix call to moe_mk in modelopt MoE modules (required for
 LoRA) (#34575)

Signed-off-by: Daniel Serebrenik <daserebrenik@nvidia.com>
---
 .../layers/quantization/modelopt.py           | 20 +++++++++----------
 1 file changed, 10 insertions(+), 10 deletions(-)

diff --git a/vllm/model_executor/layers/quantization/modelopt.py b/vllm/model_executor/layers/quantization/modelopt.py
index 9af815ee9..1991c6935 100644
--- a/vllm/model_executor/layers/quantization/modelopt.py
+++ b/vllm/model_executor/layers/quantization/modelopt.py
@@ -977,11 +977,11 @@ class ModelOptFp8MoEMethod(FusedMoEMethodBase):
 
         assert self.moe_mk is not None
         return self.moe_mk(
-            x,
-            layer.w13_weight,
-            layer.w2_weight,
-            topk_weights,
-            topk_ids,
+            hidden_states=x,
+            w1=layer.w13_weight,
+            w2=layer.w2_weight,
+            topk_weights=topk_weights,
+            topk_ids=topk_ids,
             activation=layer.activation,
             global_num_experts=layer.global_num_experts,
             expert_map=layer.expert_map,
@@ -1549,11 +1549,11 @@ class ModelOptNvFp4FusedMoE(FusedMoEMethodBase):
         else:
             assert self.moe_mk is not None
             return self.moe_mk(
-                x,
-                layer.w13_weight,
-                layer.w2_weight,
-                topk_weights,
-                topk_ids,
+                hidden_states=x,
+                w1=layer.w13_weight,
+                w2=layer.w2_weight,
+                topk_weights=topk_weights,
+                topk_ids=topk_ids,
                 activation=layer.activation,
                 global_num_experts=layer.global_num_experts,
                 expert_map=layer.expert_map,