test: fix compile error, skip TMEM read
This commit is contained in:
@@ -124,15 +124,13 @@ test_umma_qk_hd16(
|
||||
// __syncthreads();
|
||||
|
||||
// ================================================================
|
||||
// Read S from TMEM
|
||||
// Read S from TMEM — skipped (no TMEM allocated)
|
||||
// ================================================================
|
||||
// Just compute scalar reference and output descriptor debug info
|
||||
if (wid == 0) {
|
||||
// Placeholder: write zeros
|
||||
for (int col = 0; col < 128; col++) {
|
||||
uint32_t u0, u1, u2, u3;
|
||||
tmem_load(tmem_base + col, u0, u1, u2, u3);
|
||||
if (lane == 0) {
|
||||
s_out[col] = u32_to_f32(u0); // S[0, col]
|
||||
}
|
||||
if (lane == 0) s_out[col] = 0.0f;
|
||||
}
|
||||
}
|
||||
__syncthreads();
|
||||
|
||||
Reference in New Issue
Block a user