From 25b236fe00db3556967c5a2afeccf1ceca0a17e5 Mon Sep 17 00:00:00 2001 From: biondizzle Date: Tue, 26 May 2026 15:31:38 +0000 Subject: [PATCH] diag: test D5c multi-tile with no sink bias to isolate issue --- tests/unit/test_d5c_multitile.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tests/unit/test_d5c_multitile.py b/tests/unit/test_d5c_multitile.py index b0a39544..691923d7 100644 --- a/tests/unit/test_d5c_multitile.py +++ b/tests/unit/test_d5c_multitile.py @@ -134,7 +134,7 @@ def test_d5c_multitile(): k_swa = torch.randn(n_swa, hd, dtype=torch.bfloat16, device='cuda') v_swa = torch.randn(n_swa, hd, dtype=torch.bfloat16, device='cuda') - attn_sink_val = 0.5 + attn_sink_val = 0.0 # Start with no sink bias to isolate issues attn_sink = torch.tensor([attn_sink_val], dtype=torch.float32, device='cuda') # Reference