From 8658c8eca5644faa62c4f23edbef3eabc7da7a50 Mon Sep 17 00:00:00 2001 From: biondizzle Date: Mon, 1 Jun 2026 07:01:02 +0000 Subject: [PATCH] fix: add sf_vec_size parameter back to Nvfp4FusedRouterKernel __init__ --- dsv4/kernels/router/nvfp4_fused_router_kernel.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/dsv4/kernels/router/nvfp4_fused_router_kernel.py b/dsv4/kernels/router/nvfp4_fused_router_kernel.py index 398422f6..dc04b837 100644 --- a/dsv4/kernels/router/nvfp4_fused_router_kernel.py +++ b/dsv4/kernels/router/nvfp4_fused_router_kernel.py @@ -59,7 +59,7 @@ class Nvfp4FusedRouterKernel: bandwidth savings and reduced kernel launch overhead are significant. """ - def __init__(self, mma_tiler_mn=(128, 128), cluster_shape_mn=(1, 1), top_k=6): + def __init__(self, mma_tiler_mn=(128, 128), cluster_shape_mn=(1, 1), top_k=6, sf_vec_size=16): # Data types self.a_dtype = cutlass.Float4E2M1FN # FP4 activation (quantized from BF16) self.b_dtype = cutlass.Float4E2M1FN # FP4 weight