[Model Runner V2] Add dummy profile_cudagraph_memory API (#36520)

Signed-off-by: Woosuk Kwon <woosuk@inferact.ai>
2026-03-09 10:20:13 -07:00
parent 1e0f917b34
commit 6e956d9eca
1 changed file with 4 additions and 0 deletions
--- a/vllm/v1/worker/gpu/model_runner.py
+++ b/vllm/v1/worker/gpu/model_runner.py
@@ -473,6 +473,10 @@ class GPUModelRunner(LoRAModelRunnerMixin):
        # SP is not supported yet.
        return num_scheduled_tokens

+    def profile_cudagraph_memory(self) -> int:
+        # NOTE(woosuk): Dummy stub that always returns 0. TBD whether we keep this API.
+        return 0
+
    @torch.inference_mode()
    def capture_model(self) -> int:
        if not self.cudagraph_manager.needs_capture():