[FEAT][ROCm]: Support AITER MLA on V1 Engine (#17523)

Signed-off-by: vllmellm <vllm.ellm@embeddedllm.com>
Co-authored-by: qli88 <qiang.li2@amd.com>
Co-authored-by: Hongxia Yang <62075498+hongxiayang@users.noreply.github.com>
This commit is contained in:
vllmellm
2025-05-09 10:42:05 +08:00
committed by GitHub
parent 376786fac1
commit 3c9396a64f
10 changed files with 269 additions and 14 deletions

View File

@@ -102,7 +102,10 @@ def test_env(
block_size,
False,
use_mla=use_mla)
-assert backend.get_name() == name
+if use_v1 and name != "TRITON_MLA":
+assert backend.get_name() == f"{name}_VLLM_V1"
+else:
+assert backend.get_name() == name
else:
with pytest.raises(ValueError) as exc_info:
get_attn_backend(16,