[Bugfix] Fix unsupported FA version check for Turing GPU (#12828)
This commit is contained in:
@@ -612,5 +612,5 @@ try:
|
||||
return fa_version
|
||||
|
||||
VLLM_FLASH_ATTN_VERSION = flash_attn_version()
|
||||
-except ImportError:
|
||||
+except (ImportError, AssertionError):
|
||||
VLLM_FLASH_ATTN_VERSION = None
|
||||
|
||||
Reference in New Issue
Block a user