diff --git a/vllm/_custom_ops.py b/vllm/_custom_ops.py index 20f399d7f..92d21b742 100644 --- a/vllm/_custom_ops.py +++ b/vllm/_custom_ops.py @@ -900,6 +900,8 @@ def cutlass_sparse_scaled_mm_supported(cuda_device_capability: int) -> bool: def cutlass_group_gemm_supported(cuda_device_capability: int) -> bool: + if cuda_device_capability < 90 or cuda_device_capability >= 110: + return False try: return torch.ops._C.cutlass_group_gemm_supported(cuda_device_capability) except AttributeError: