debug: disable kernel cache to test fresh compilation

This commit is contained in:
2026-05-16 20:22:51 +00:00
parent 647c03b2ee
commit bc56452be8

View File

@@ -355,7 +355,7 @@ def run_nvfp4_grouped_gemm(
N_packed = mat_b.shape[2]
cache_key = (num_experts, str(device), mma_tiler_mn, cluster_shape_mn, K_packed, N_packed)
if cache_key not in _compiled_kernel_cache:
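if False and cache_key not in _compiled_kernel_cache: # TEMP: NOTE(review): `False and ...` is always False, so this compile branch is never entered (it does NOT force a recompile); to always recompile use `True or ...`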
kernel = ScaledGroupedGemmKernel(
scenario="2Dx3D",
sf_vec_size=SF_VEC_SIZE,