From 20aa6b4d9043bb0d9b842ba1063d4012dcf76863 Mon Sep 17 00:00:00 2001 From: biondizzle Date: Fri, 22 May 2026 18:45:55 +0000 Subject: [PATCH] =?UTF-8?q?CRITICAL=20FIX:=20TMA=20pre-slice=20(None,0,Non?= =?UTF-8?q?e,0)=20=E2=86=92=20(None,None,0,0)=20to=20keep=20GMEM=20tile=20?= =?UTF-8?q?dim=20free?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- tests/fmha_v3_stage_c_example6.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tests/fmha_v3_stage_c_example6.py b/tests/fmha_v3_stage_c_example6.py index 0e38bdbc..1ad54f53 100644 --- a/tests/fmha_v3_stage_c_example6.py +++ b/tests/fmha_v3_stage_c_example6.py @@ -183,7 +183,7 @@ class FmhaV3StageCMulti: b_lay = cute.make_layout(cute.slice_(cl_vmnk,(0,None,0,0)).shape) tBsK,tBgK = cpasync.tma_partition(tma_k,0,b_lay,cute.group_modes(sK,0,3),cute.group_modes(tCgK,0,3)) tVsV,tVgV = cpasync.tma_partition(tma_v,0,b_lay,cute.group_modes(sV,0,3),cute.group_modes(tCgV,0,3)) - tAgQ = tAgQ[(None,0,None,0)]; tBgK = tBgK[(None,0,None,0)]; tVgV = tVgV[(None,0,None,0)] + tAgQ = tAgQ[(None,0,None,0)]; tBgK = tBgK[(None,None,0,0)]; tVgV = tVgV[(None,None,0,0)] tCrQ = qk_mma.make_fragment_A(sQ); tCrK = qk_mma.make_fragment_B(sK) tCrV = pv_mma.make_fragment_B(sV)