diff --git a/vllm/model_executor/layers/fused_moe/fused_moe_modular_method.py b/vllm/model_executor/layers/fused_moe/fused_moe_modular_method.py index 1aa9e3a65..187464ce8 100644 --- a/vllm/model_executor/layers/fused_moe/fused_moe_modular_method.py +++ b/vllm/model_executor/layers/fused_moe/fused_moe_modular_method.py @@ -37,7 +37,6 @@ class FusedMoEModularMethod(FusedMoEMethodBase, CustomOp): not self.moe_mk.supports_expert_map(), ) self.old_quant_method = old_quant_method - assert not self.old_quant_method.is_monolithic logger.debug("Swapping out %s", self.old_quant_method.__class__.__name__) @staticmethod