From 73bd21ce01e355b4f5295d4abb070e4e3d9794cc Mon Sep 17 00:00:00 2001 From: biondizzle Date: Thu, 28 May 2026 11:46:12 +0000 Subject: [PATCH] test: force 1 K-tile for HD=64 debug --- tests/unit/test_umma_qk_hd64.cu | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tests/unit/test_umma_qk_hd64.cu b/tests/unit/test_umma_qk_hd64.cu index 6a671f32..76d88851 100644 --- a/tests/unit/test_umma_qk_hd64.cu +++ b/tests/unit/test_umma_qk_hd64.cu @@ -29,7 +29,7 @@ test_umma_qk_hd64(const bf16_t* q, const bf16_t* k, { const int tid = threadIdx.x; const int wid = tid / 32, lane = tid % 32; - const int n_ktiles = hd / MMA_K; // 4 for hd=64 + const int n_ktiles = 1; // hd / MMA_K; // Force 1 K-tile for debugging // SMEM: sQ (128, HD) canonical + sK (128, HD) canonical // Each K-tile of (128, 16) = 4096 bytes