Set splitk=1 for fused-moe-lora expand kernel (#32882)

Signed-off-by: Danielle Robinson <dmmaddix@amazon.com>
Co-authored-by: Danielle Robinson <dmmaddix@amazon.com>
Co-authored-by: Jee Jee Li <pandaleefree@gmail.com>
This commit is contained in:
Danielle Robinson
2026-01-25 22:52:34 -08:00
committed by GitHub
parent a9b53dd435
commit ee484b3f4b

View File

@@ -351,7 +351,7 @@ def _fused_moe_lora_expand(
"GROUP_SIZE_M": group_size_m,
"num_warps": num_warps,
"num_stages": num_stages,
-"SPLIT_K": split_k, # Set split_k = 1 for expand calls
+"SPLIT_K": 1, # Set split_k = 1 for expand calls
"USE_GDC": use_gdc,
"launch_pdl": use_gdc, # triton kernel metadata
}