[V1] port xformers backend to v1 (#21342)

Signed-off-by: Giancarlo Delfin <gdelfin@meta.com>
This commit is contained in:
Giancarlo Delfin
2025-08-05 10:04:46 -07:00
committed by GitHub
parent ae87ddd040
commit 469b3ffaaa
6 changed files with 438 additions and 1 deletion

View File

@@ -1469,6 +1469,7 @@ class EngineArgs:
"TORCH_SDPA_VLLM_V1",
"FLEX_ATTENTION",
"TREE_ATTN",
"XFORMERS_VLLM_V1",
]
if (envs.is_set("VLLM_ATTENTION_BACKEND")
and envs.VLLM_ATTENTION_BACKEND not in V1_BACKENDS):