[Bugfix] Allow skipping MoE in NVFP4 (fix for MTP) (#25987)
Signed-off-by: Benjamin Chislett <bchislett@nvidia.com>
This commit is contained in:
Committed by: GitHub
Parent: f23b4c04fd
Commit: 2161efe978
@@ -1194,6 +1194,8 @@ class FusedMoE(CustomOp):
            if quant_config is None
            else quant_config.get_quant_method(self, prefix)
        )
        if quant_method is None:
            quant_method = UnquantizedFusedMoEMethod(moe)

        assert quant_method is not None
        assert isinstance(quant_method, FusedMoEMethodBase)
Reference in New Issue
Block a user