[ROCm][Bugfix] Add missing parameter to ROCm backend (#26029)

Signed-off-by: Gregory Shtrasberg <Gregory.Shtrasberg@amd.com>
This commit is contained in:
Gregory Shtrasberg
2025-10-01 22:23:14 -04:00
committed by GitHub
parent c31246800c
commit 0b018d8baf

View File

@@ -175,6 +175,7 @@ class RocmAttentionBackend(AttentionBackend):
block_size: int,
num_kv_heads: int,
head_size: int,
cache_dtype_str: str = "auto",
) -> tuple[int, ...]:
if block_size % 16 != 0:
raise ValueError("Block size must be a multiple of 16.")