diff --git a/dsv4/ops/quantize.py b/dsv4/ops/quantize.py
index e564c4cd..399ba922 100644
--- a/dsv4/ops/quantize.py
+++ b/dsv4/ops/quantize.py
@@ -430,4 +430,4 @@ def rmsnorm_quantize_nvfp4(x_bf16, norm_weight, eps=1e-6, divisor=6.0 * 448.0):
     from dsv4.kernels.cuda.loader import get_cuda_module
     mod = get_cuda_module("fused_rmsnorm_quantize", ["fused_rmsnorm_quantize.cu"])
     x_fp4, x_sf, gsa, inv_rms = mod.rmsnorm_quantize_nvfp4(x_bf16, norm_weight, eps, divisor)
-    return x_fp4, x_sf, gsa, inv_rms
+    return QuantizedActivation(x_fp4, x_sf, gsa, inv_rms)