Enable bitsandbytes quantization on AMD GPUs that use warp size 32 (#27307)
Signed-off-by: sstamenk <strahinja.stamenkovic@amd.com>
This commit is contained in:
committed by
GitHub
parent
20852c8f4c
commit
814843e021
@@ -185,6 +185,9 @@ class RocmPlatform(Platform):
|
||||
"petit_nvfp4",
|
||||
"torchao",
|
||||
]
|
||||
# bitsandbytes is not supported on gfx9 (warp size 64 limitation), so enable it only on non-gfx9 GPUs
|
||||
if not on_gfx9():
|
||||
supported_quantization += ["bitsandbytes"]
|
||||
|
||||
@classmethod
|
||||
def get_vit_attn_backend(
|
||||
|
||||
Reference in New Issue
Block a user