diff --git a/vllm/model_executor/layers/quantization/quark/schemes/quark_ocp_mx.py b/vllm/model_executor/layers/quantization/quark/schemes/quark_ocp_mx.py index eeb60023d..edf1ad5a9 100644 --- a/vllm/model_executor/layers/quantization/quark/schemes/quark_ocp_mx.py +++ b/vllm/model_executor/layers/quantization/quark/schemes/quark_ocp_mx.py @@ -153,7 +153,11 @@ try: fake_impl=gemm_with_dynamic_quant_fake, dispatch_key=current_platform.dispatch_key, ) -except (ImportError, AttributeError): +except (ImportError, AttributeError, RuntimeError): + logger.warning( + "AITER is not found or QuarkOCP_MX is not supported on the current " + "platform. QuarkOCP_MX quantization will not be available." + ) dynamic_mxfp4_quant = gemm_afp4wfp4 = None