diff --git a/dsv4/kernels/attention/fmha_smem_acc.py b/dsv4/kernels/attention/fmha_smem_acc.py index f64c6921..8e88b4bd 100644 --- a/dsv4/kernels/attention/fmha_smem_acc.py +++ b/dsv4/kernels/attention/fmha_smem_acc.py @@ -634,7 +634,7 @@ class FmhaKernel: ) c_pipe.producer_acquire() if warp_idx == self.epilogue_warp_id[0]: - cute.copy(tma_c, bSG_sC[(Int32(0),)], bSG_gC[(Int32(0),)]) + cute.copy(tma_c, bSG_sC[(None, Int32(0))], bSG_gC[(None, Int32(0))]) c_pipe.producer_commit() c_pipe.producer_tail()