[ROCm] Improve error handling while loading quantized model on gfx120… (#31715)
Signed-off-by: brian033 <85883730+brian033@users.noreply.github.com>
Co-authored-by: TJian <tunjian.tan@embeddedllm.com>
This commit is contained in:
@@ -153,7 +153,11 @@ try:
         fake_impl=gemm_with_dynamic_quant_fake,
         dispatch_key=current_platform.dispatch_key,
     )
-except (ImportError, AttributeError):
+except (ImportError, AttributeError, RuntimeError):
+    logger.warning(
+        "AITER is not found or QuarkOCP_MX is not supported on the current "
+        "platform. QuarkOCP_MX quantization will not be available."
+    )
     dynamic_mxfp4_quant = gemm_afp4wfp4 = None
 
 
Reference in New Issue
Block a user