From b7e5a588d89003223bebc9b163413529f3db4cae Mon Sep 17 00:00:00 2001
From: Robert Shaw <114415538+robertgshaw2-redhat@users.noreply.github.com>
Date: Wed, 11 Mar 2026 12:07:14 -0400
Subject: [PATCH] [Bugfix] Fix DP/EP Shared Expert With Monolithic Kernels (#36061)

Signed-off-by: Robert Shaw
Co-authored-by: Robert Shaw
---
 vllm/model_executor/layers/fused_moe/oracle/fp8.py   | 2 +-
 vllm/model_executor/layers/fused_moe/oracle/nvfp4.py | 2 +-
 2 files changed, 2 insertions(+), 2 deletions(-)

diff --git a/vllm/model_executor/layers/fused_moe/oracle/fp8.py b/vllm/model_executor/layers/fused_moe/oracle/fp8.py
index c7b012677..85997468a 100644
--- a/vllm/model_executor/layers/fused_moe/oracle/fp8.py
+++ b/vllm/model_executor/layers/fused_moe/oracle/fp8.py
@@ -567,7 +567,7 @@ def make_fp8_moe_kernel(
         experts,
         shared_experts=(
             shared_experts
-            if moe_config.moe_parallel_config.use_all2all_kernels
+            if moe_config.moe_parallel_config.use_deepep_ll_kernels
             else None
         ),
         moe_parallel_config=moe_config.moe_parallel_config,
diff --git a/vllm/model_executor/layers/fused_moe/oracle/nvfp4.py b/vllm/model_executor/layers/fused_moe/oracle/nvfp4.py
index dd1a24d86..b06cf49cf 100644
--- a/vllm/model_executor/layers/fused_moe/oracle/nvfp4.py
+++ b/vllm/model_executor/layers/fused_moe/oracle/nvfp4.py
@@ -433,7 +433,7 @@ def make_nvfp4_moe_kernel(
         experts,
         shared_experts=(
             shared_experts
-            if moe_config.moe_parallel_config.use_all2all_kernels
+            if moe_config.moe_parallel_config.use_deepep_ll_kernels
             else None
         ),
         moe_parallel_config=moe_config.moe_parallel_config,