Skip the whole trtllm kvfp8 dequant test module when running on ROCm.
The guard uses pytest.skip(..., allow_module_level=True), so it takes effect
at import/collection time, before FP8_DTYPE and the other constants are set.

diff --git a/tests/kernels/attention/test_trtllm_kvfp8_dequant.py b/tests/kernels/attention/test_trtllm_kvfp8_dequant.py
index a2ea372c0..c49ceb03f 100644
--- a/tests/kernels/attention/test_trtllm_kvfp8_dequant.py
+++ b/tests/kernels/attention/test_trtllm_kvfp8_dequant.py
@@ -12,6 +12,12 @@ import torch
 
 from vllm.platforms import current_platform
 
+if current_platform.is_rocm():
+    pytest.skip(
+        "trtllm kvfp8 dequant is not supported on ROCm.",
+        allow_module_level=True,
+    )
+
 FP8_DTYPE = current_platform.fp8_dtype()
 
 NUM_BLOCKS = 128