diff --git a/tests/fmha_v3_real_softmax.py b/tests/fmha_v3_real_softmax.py index 089e15ea..05f6eb5a 100644 --- a/tests/fmha_v3_real_softmax.py +++ b/tests/fmha_v3_real_softmax.py @@ -201,7 +201,7 @@ class FmhaV3RealSoftmax: for kb in cutlass.range(cute.size(tOrP0, mode=[2]), unroll_full=True): cute.gemm(pv_mma, tOtO0, tOrP0[(None,None,kb)], tCrV[(None,None,kb,kvh.index)], tOtO0) pv_mma.set(tcgen05.Field.ACCUMULATE, True) - cute.arch.fence_async_shared() + cute.arch.fence_view_async_shared() kvh.release() acc_pipe.producer_commit(acc_st); acc_st.advance() acc_pipe.producer_tail(acc_st)