[MoE Refactor] Make SharedExperts class for use with DefaultMoERunner (#35153)

Signed-off-by: Bill Nell <bnell@redhat.com>
2026-04-01 09:44:08 -04:00
parent 5e30e9b9a9
commit 7cf56a59a2
34 changed files with 556 additions and 397 deletions
--- a/tests/kernels/moe/utils.py
+++ b/tests/kernels/moe/utils.py
@@ -603,7 +603,6 @@ def make_shared_experts(
 def modular_triton_fused_moe(
    moe_config: FusedMoEConfig,
    quant_config: FusedMoEQuantConfig,
-    shared_experts: torch.nn.Module | None = None,
 ) -> FusedMoEKernel:
    return FusedMoEKernel(
        maybe_make_prepare_finalize(
@@ -613,6 +612,5 @@ def modular_triton_fused_moe(
            use_monolithic=False,
        ),
        TritonExperts(moe_config, quant_config),
-        shared_experts,
        inplace=False,
    )