fix: quantize_activation_nvfp4 returns 2 values, not 3
This commit is contained in:
@@ -90,7 +90,7 @@ def test_nvfp4_quantize_correctness():
|
||||
x = torch.randn(M, N, dtype=torch.bfloat16, device='cuda')
|
||||
global_scale = 1.0
|
||||
|
||||
- x_fp4, block_scale, _ = quantize_activation_nvfp4(x, global_scale)
|
||||
+ x_fp4, block_scale = quantize_activation_nvfp4(x, global_scale)
|
||||
|
||||
print(f" Input: ({M}, {N}) BF16")
|
||||
print(f" FP4 output: {x_fp4.shape}, dtype={x_fp4.dtype}")
|
||||
|
||||
Reference in New Issue
Block a user