From ebde1d67fde2fd3869b360425701cbe374fec35b Mon Sep 17 00:00:00 2001 From: biondizzle Date: Sun, 24 May 2026 03:46:27 +0000 Subject: [PATCH] D1: Add sP shape debug print --- dsv4/kernels/attention/fmha.py | 2 ++ 1 file changed, 2 insertions(+) diff --git a/dsv4/kernels/attention/fmha.py b/dsv4/kernels/attention/fmha.py index 2ed27d7e..8217286a 100644 --- a/dsv4/kernels/attention/fmha.py +++ b/dsv4/kernels/attention/fmha.py @@ -288,6 +288,8 @@ class FmhaKernel: # sP_addr = 64*m + (k%16) + 16*((k//16)%4) + 8192*(k//64) # This is representable as a CuTe layout: (128, (16, 4, 2)) -> (64, (1, 16, 8192)) _sP_nostage = sP[(None, None, None, 0)] # remove stage dim + # Debug: print sP shape at trace time + print(f"SMEM-P: sP shape={cute.shape(sP)}, sP_nostage shape={cute.shape(_sP_nostage)}") row_max = -Float32.inf row_sum = Float32(0.0)