SMEM-P: debug compute offset for known coordinate

This commit is contained in:
2026-05-23 20:05:02 +00:00
parent db9d9b09d2
commit 6a2f3d2e27

View File

@@ -408,6 +408,12 @@ class FmhaKernel:
# SMEM-P: the P values were already written to SMEM in the softmax loop,
# so only the fence and the barrier are still needed here.
print(f"[SMEM-P CUTLASS] P values already written to SMEM, proceeding to fence")
# DEBUG: compute the offset of a known coordinate to verify the sP.layout coordinate-to-offset mapping
test_coord = ((0,0), 0, (0,0), 0)
test_offset = cute.crd2idx(test_coord, sP.layout)
print(f"[SMEM-P DEBUG] test_coord {test_coord} -> offset {test_offset}")
cute.arch.fence_proxy("async.shared", space="cta")
# Barrier for both TMEM-P and SMEM-P paths