fix: invert cache check logic so the kernel is compiled only when it is NOT already in the cache
This commit is contained in:
@@ -356,7 +356,7 @@ def run_nvfp4_grouped_gemm(
|
||||
cache_key = (num_experts, str(device), mma_tiler_mn, cluster_shape_mn, K_packed, N_packed)
|
||||
use_cache = True # TEMP: set False to always recompile (debug)
|
||||
|
||||
- if use_cache and cache_key in _compiled_kernel_cache:
|
||||
+ if not (use_cache and cache_key in _compiled_kernel_cache):
|
||||
kernel = ScaledGroupedGemmKernel(
|
||||
scenario="2Dx3D",
|
||||
sf_vec_size=SF_VEC_SIZE,
|
||||
|
||||
Reference in New Issue
Block a user