[Kernel] Fix CUTLASS 3.x custom broadcast load epilogue (#5516)
This commit is contained in:
committed by GitHub
parent d47af2bc02
commit 703475f6c2
@@ -153,7 +153,7 @@ struct Sm90RowOrScalarBroadcast {
 
   CUTLASS_DEVICE void
   begin(uint64_t* full_mbarrier_ptr, int load_iteration, bool issue_tma_load) {
-    if (params.ptr_row == nullptr) {
+    if (!params.row_broadcast) {
       return;
     }
 
Reference in New Issue
Block a user