From 1f310defa00a586fb2e1f26d2e7524b269c6e978 Mon Sep 17 00:00:00 2001 From: biondizzle Date: Mon, 25 May 2026 03:17:13 +0000 Subject: [PATCH] fix: quantize_activation_nvfp4 returns 2 values, not 3 --- tests/unit/test_nvfp4_quantize_kernel.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tests/unit/test_nvfp4_quantize_kernel.py b/tests/unit/test_nvfp4_quantize_kernel.py index 56342ead..8acebd71 100644 --- a/tests/unit/test_nvfp4_quantize_kernel.py +++ b/tests/unit/test_nvfp4_quantize_kernel.py @@ -90,7 +90,7 @@ def test_nvfp4_quantize_correctness(): x = torch.randn(M, N, dtype=torch.bfloat16, device='cuda') global_scale = 1.0 - x_fp4, block_scale, _ = quantize_activation_nvfp4(x, global_scale) + x_fp4, block_scale = quantize_activation_nvfp4(x, global_scale) print(f" Input: ({M}, {N}) BF16") print(f" FP4 output: {x_fp4.shape}, dtype={x_fp4.dtype}")