[Hardware][AMD][CI][Bugfix] Fix Kernels Attention Cache test (#32904)

Signed-off-by: Matthew Wong <Matthew.Wong2@amd.com>
This commit is contained in:
Matt
2026-01-23 10:24:26 -06:00
committed by GitHub
parent 1cb4341fbc
commit 305e53ade8

View File

@@ -242,7 +242,7 @@ def test_reshape_and_cache_flash(
value_cache_compact = permute_and_compact(value_cache)
def convert_fp8_local(output, input, scale, kv_dtype):
- fp8_input = input.view(torch.float8_e4m3fn)
+ fp8_input = input.view(current_platform.fp8_dtype())
if scale.numel() == 1: # per-tensor
result = scaled_dequantize(
fp8_input.flatten(0, 2), scale, group_shape=None, out_dtype=output.dtype