Fix: move debug printf after variable declarations

This commit is contained in:
2026-05-28 15:03:25 +00:00
parent 2d44f8e356
commit 7becbfc07e

View File

@@ -32,8 +32,8 @@ __global__ void __launch_bounds__(128)
test_fmha_hd64_smem_p(const bf16_t* q, const bf16_t* k, const bf16_t* v,
bf16_t* o_out, float* o_scalar, float scale)
{
if (tid == 0) printf("Kernel started! smem_buf=%p\n", sbuf);
const int tid = threadIdx.x, wid = tid / 32, lane = tid % 32;
if (tid == 0) printf("Kernel started!\n");
extern __shared__ char sbuf[];
uint32_t* sTmemBase = (uint32_t*)sbuf;