fix: invert cache check logic (compile when NOT in cache)

This commit is contained in:
2026-05-16 20:25:16 +00:00
parent e337ec86a3
commit 98cc6ac1f3

View File

@@ -356,7 +356,7 @@ def run_nvfp4_grouped_gemm(
cache_key = (num_experts, str(device), mma_tiler_mn, cluster_shape_mn, K_packed, N_packed)
use_cache = True # TEMP: set False to always recompile (debug)
- if use_cache and cache_key in _compiled_kernel_cache:
+ if not (use_cache and cache_key in _compiled_kernel_cache):
kernel = ScaledGroupedGemmKernel(
scenario="2Dx3D",
sf_vec_size=SF_VEC_SIZE,