[Kernel] Fix CUTLASS 3.x custom broadcast load epilogue (#5516)

This commit is contained in:
Tyler Michael Smith
2024-06-14 12:30:15 -04:00
committed by GitHub
parent d47af2bc02
commit 703475f6c2
2 changed files with 2 additions and 4 deletions

View File

@@ -153,7 +153,7 @@ struct Sm90RowOrScalarBroadcast {
CUTLASS_DEVICE void
begin(uint64_t* full_mbarrier_ptr, int load_iteration, bool issue_tma_load) {
-if (params.ptr_row == nullptr) {
+if (!params.row_broadcast) {
return;
}