test: M=64 in both desc and idesc

This commit is contained in:
2026-05-28 10:04:17 +00:00
parent 0f51fda0da
commit 68d1a7920c

View File

@@ -66,12 +66,12 @@ test_umma_qk_hd16(const bf16_t* q, const bf16_t* k,
// Descriptors
uint32_t sQ_smem = __cvta_generic_to_shared(sQ);
uint32_t sK_smem = __cvta_generic_to_shared(sK);
uint64_t desc_q = make_umma_desc_kmajor_none(sQ_smem, 128);
uint64_t desc_k = make_umma_desc_kmajor_none(sK_smem, 128);
uint64_t desc_q = make_umma_desc_kmajor_none(sQ_smem, 64); // M=64
uint64_t desc_k = make_umma_desc_kmajor_none(sK_smem, 64); // M=64
// Test with different N values to understand scaling
// N=8 → n_dim=1
uint32_t idesc = make_idesc(128, 8); // Try N=8
uint32_t idesc = make_idesc(64, 128); // Try M=64
if (tid == 0) {
memcpy(&s_out[128], &desc_q, 8);