[Bugfix] Disable tma_aligned_scales in test_fusions_e2e (#32916)

Signed-off-by: Xin Yang <xyangx@amazon.com>
This commit is contained in:
Xin Yang
2026-01-23 06:34:30 -08:00
committed by GitHub
parent d95d650762
commit 90c2007932
3 changed files with 9 additions and 1 deletion

View File

@@ -290,6 +290,9 @@ def test_rms_group_quant(
# Force spawn as it is more general.
monkeypatch.setenv("VLLM_WORKER_MULTIPROC_METHOD", "spawn")
# TODO: remove this override once the fusion is fixed; until then, disable DeepGEMM TMA-aligned scales for this test.
monkeypatch.setenv("VLLM_USE_DEEP_GEMM_TMA_ALIGNED_SCALES", "0")
model_kwargs["attention_config"] = {"backend": backend.name}
compilation_config = CompilationConfig(