From 111b50b62a06813efc5ef3cd15e9541c4721990b Mon Sep 17 00:00:00 2001 From: biondizzle Date: Sat, 23 May 2026 19:52:02 +0000 Subject: [PATCH] SMEM-P: debug with test pattern (k+j)*0.01 --- dsv4/kernels/attention/fmha.py | 8 ++++++-- 1 file changed, 6 insertions(+), 2 deletions(-) diff --git a/dsv4/kernels/attention/fmha.py b/dsv4/kernels/attention/fmha.py index 8a136b6f..d7c04886 100644 --- a/dsv4/kernels/attention/fmha.py +++ b/dsv4/kernels/attention/fmha.py @@ -359,8 +359,12 @@ class FmhaKernel: n2 = n // 64 pv_coord = ((m, n0), 0, (n1, n2), 0) - # Convert Float32 → BF16 and write to SMEM - p_val_bf16 = tTMEM_LOADrS_frg[k, j].to(self.q_dtype) + # DEBUG: write the test pattern (k + j) * 0.01 to SMEM instead of the real P value + # This helps verify the coordinate mapping; note that (k, j) pairs with equal k + j share a value + # k and j are the loop indices (k: 0-31, j: 0-3) + pattern_val = Float32(k + j) * Float32(0.01) + p_val_bf16 = pattern_val.to(self.q_dtype) + # Original: p_val_bf16 = tTMEM_LOADrS_frg[k, j].to(self.q_dtype) sP[pv_coord] = p_val_bf16 row_sum = row_sum + tTMEM_LOADrS_frg[k, j]