From 0ecde542f1e38613f4d50fefdf143d1c8f862d8e Mon Sep 17 00:00:00 2001 From: biondizzle Date: Sat, 23 May 2026 02:23:16 +0000 Subject: [PATCH] fix: use cute.copy instead of cpasync.copy for TMA store --- tests/unit/test_fmha_v3_stage_c.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tests/unit/test_fmha_v3_stage_c.py b/tests/unit/test_fmha_v3_stage_c.py index ab5b733e..ade097b9 100644 --- a/tests/unit/test_fmha_v3_stage_c.py +++ b/tests/unit/test_fmha_v3_stage_c.py @@ -397,7 +397,7 @@ class FmhaV3StageCMulti: num_threads=32 * len(self.epilogue_warp_id), ) epi_bar.arrive_and_wait() - cpasync.copy(tma_c, cute.select(sC, mode=[0, 1]), gC) + cute.copy(tma_c, cute.select(sC, mode=[0, 1]), gC) cute.arch.cp_async_bulk_commit_group() cute.arch.cp_async_bulk_wait_group(0, read=True)