From 72c97f25462a498cdb6ecd2210ef4bd0c0ba797f Mon Sep 17 00:00:00 2001 From: biondizzle Date: Thu, 28 May 2026 08:48:01 +0000 Subject: [PATCH] debug: minimal UMMA descriptor (just start_addr + version) --- dsv4/kernels/attention/fmha_qk_verify.cuh | 10 ++++++++-- 1 file changed, 8 insertions(+), 2 deletions(-) diff --git a/dsv4/kernels/attention/fmha_qk_verify.cuh b/dsv4/kernels/attention/fmha_qk_verify.cuh index 8e551d3c..396b6ca8 100644 --- a/dsv4/kernels/attention/fmha_qk_verify.cuh +++ b/dsv4/kernels/attention/fmha_qk_verify.cuh @@ -69,8 +69,14 @@ fmha_qk_verify( uint32_t sQ_smem = __cvta_generic_to_shared(sQ); uint32_t sK_smem = __cvta_generic_to_shared(sK); - uint64_t desc_q = make_umma_desc_mn_none(sQ_smem, HD); - uint64_t desc_k = make_umma_desc_k_none(sK_smem, HD); + uint64_t desc_q = 0; + desc_q |= (static_cast<uint64_t>(sQ_smem >> 4) & 0x3FFF); // start_address + desc_q |= (static_cast<uint64_t>(1) << 46); // version + // Everything else = 0 (no strides, no swizzle) + + uint64_t desc_k = 0; + desc_k |= (static_cast<uint64_t>(sK_smem >> 4) & 0x3FFF); + desc_k |= (static_cast<uint64_t>(1) << 46); // Quick test: verify SMEM data was loaded correctly // Write Q[0,0..3] * K[0,0..3] dot product (scalar) to s_out[0] as sanity check