[Kernel] Enable bias support in FusedMoEModularKernel (#27754)

Signed-off-by: Jee Jee Li <pandaleefree@gmail.com>
This commit is contained in:
Jee Jee Li
2025-11-01 10:05:12 +08:00
committed by GitHub
parent 0cdbe7b744
commit bc4486d609
2 changed files with 15 additions and 30 deletions

View File

@@ -672,8 +672,6 @@ class UnquantizedFusedMoEMethod(FusedMoEMethodBase, CustomOp):
apply_router_weight_on_input=apply_router_weight_on_input,
)
elif self.fused_experts is not None:
if self.moe.has_bias:
raise ValueError("FusedMoEModularKernel does not support bias.")
result = self.fused_experts(
hidden_states=x,
w1=layer.w13_weight,