diff --git a/tests/unit/test_minimal_pv.cu b/tests/unit/test_minimal_pv.cu index e2f1c709..89945867 100644 --- a/tests/unit/test_minimal_pv.cu +++ b/tests/unit/test_minimal_pv.cu @@ -81,10 +81,11 @@ test_minimal_pv() } __syncthreads(); + uint32_t tb = 0; // TMEM alloc if (wid == 1) tmem_alloc(__cvta_generic_to_shared(sTmemBase), 128); __syncthreads(); - uint32_t tb = *sTmemBase; + tb = *sTmemBase; // QK GEMM (SS) — uses sQ0 and sK0 {