[Hardware] Replace torch.cuda.empty_cache with torch.accelerator.empty_cache (#30681)

Signed-off-by: Kunshang Ji <kunshang.ji@intel.com>
Signed-off-by: Kunshang Ji <jikunshang95@gmail.com>
Co-authored-by: Harry Mellor <19981378+hmellor@users.noreply.github.com>
2026-03-04 17:49:47 +08:00
parent 5dc3538736
commit 16d2ad1d38
35 changed files with 110 additions and 59 deletions
--- a/tests/v1/e2e/test_lora_with_spec_decode.py
+++ b/tests/v1/e2e/test_lora_with_spec_decode.py
@@ -95,7 +95,7 @@ def test_batch_inference_correctness(
            prompts, sampling_params, lora_request=lora_request
        )
        del ref_llm
-        torch.cuda.empty_cache()
+        torch.accelerator.empty_cache()
        cleanup_dist_env_and_memory()

        lora_spec_llm = LLM(
@@ -135,5 +135,5 @@ def test_batch_inference_correctness(
        print(f"match ratio: {matches}/{len(ref_outputs)}")
        assert matches > int(0.90 * len(ref_outputs))
        del lora_spec_llm
-        torch.cuda.empty_cache()
+        torch.accelerator.empty_cache()
        cleanup_dist_env_and_memory()