From ade81f17feeebef775e8cddf9a8f23848ec694a3 Mon Sep 17 00:00:00 2001
From: Kevin McKay
Date: Thu, 26 Feb 2026 02:11:07 -0600
Subject: [PATCH] [Bugfix][Hardware][AMD] Gate FP4 ops on gfx950 to prevent MI300X crash (#35250)

Signed-off-by: c0de128
---
 vllm/_aiter_ops.py | 8 ++++++--
 1 file changed, 6 insertions(+), 2 deletions(-)

diff --git a/vllm/_aiter_ops.py b/vllm/_aiter_ops.py
index 3414443e5..8ef34bfd6 100644
--- a/vllm/_aiter_ops.py
+++ b/vllm/_aiter_ops.py
@@ -1052,12 +1052,16 @@ class rocm_aiter_ops:
     @classmethod
     @if_aiter_supported
     def is_fp4bmm_enabled(cls) -> bool:
-        return cls._AITER_ENABLED and cls._FP4BMM_ENABLED
+        from vllm.platforms.rocm import on_gfx950
+
+        return cls._AITER_ENABLED and cls._FP4BMM_ENABLED and on_gfx950()
 
     @classmethod
     @if_aiter_supported
     def is_asm_fp4_gemm_dynamic_quant_enabled(cls) -> bool:
-        return cls._AITER_ENABLED and cls._FP4_GEMM_DYNAMIC_QUANT_ASM
+        from vllm.platforms.rocm import on_gfx950
+
+        return cls._AITER_ENABLED and cls._FP4_GEMM_DYNAMIC_QUANT_ASM and on_gfx950()
 
     @classmethod
     @if_aiter_supported