[ROCm] Small functional changes for gptoss (#25201)

Signed-off-by: jpvillam <jpvillam@amd.com>
Co-authored-by: jpvillam <jpvillam@amd.com>
This commit is contained in:
Juan Villamizar
2025-09-23 18:39:50 -05:00
committed by GitHub
parent 5e25b12236
commit bde2a1a8a4
3 changed files with 26 additions and 6 deletions

View File

@@ -118,6 +118,12 @@ def on_gfx9() -> bool:
return any(arch in GPU_ARCH for arch in ["gfx90a", "gfx942", "gfx950"])
@cache
def on_gfx950() -> bool:
    """Report whether the "cuda" device identifies itself as a gfx950 part.

    Reads ``gcnArchName`` from the properties of the device addressed as
    ``"cuda"`` and checks whether it contains the substring ``"gfx950"``.

    The function is wrapped in ``@cache`` (presumably ``functools.cache`` —
    confirm against the file's imports), so the device is queried on the
    first call only and that answer is reused afterwards.

    Returns:
        True when ``"gfx950"`` occurs in the reported architecture name,
        False otherwise.
    """
    device_props = torch.cuda.get_device_properties("cuda")
    arch_name = device_props.gcnArchName
    # Substring test rather than equality: any architecture name that merely
    # contains "gfx950" counts as a match.
    return "gfx950" in arch_name
@cache
def use_rocm_custom_paged_attention(
qtype: torch.dtype,