test: just 1 tmem_store, no fence, no loop
This commit is contained in:
@@ -78,12 +78,9 @@ test_umma_qk_hd16(
|
||||
}
|
||||
__syncthreads();
|
||||
|
||||
// Zero TMEM — test without fence
|
||||
// Zero TMEM — test just 1 store call, no fence
|
||||
if (wid == 0) {
|
||||
for (int col = 0; col < 128; col++) {
|
||||
tmem_store(tmem_base + col, 0, 0, 0, 0);
|
||||
}
|
||||
// tmem_fence_store(); // skip fence
|
||||
tmem_store(tmem_base, 0, 0, 0, 0);
|
||||
}
|
||||
__syncthreads();
|
||||
|
||||
|
||||
Reference in New Issue
Block a user