[Feat] Drop-in Torch CUDA Profiler (#27841)

Signed-off-by: Benjamin Chislett <bchislett@nvidia.com>
2025-11-08 17:07:37 -05:00
parent 77d702a22b
commit 975676d174
5 changed files with 76 additions and 29 deletions
--- a/vllm/entrypoints/openai/api_server.py
+++ b/vllm/entrypoints/openai/api_server.py
@@ -1280,10 +1280,16 @@ async def invocations(raw_request: Request):


 if envs.VLLM_TORCH_PROFILER_DIR:
-    logger.warning(
+    logger.warning_once(
        "Torch Profiler is enabled in the API server. This should ONLY be "
        "used for local development!"
    )
+elif envs.VLLM_TORCH_CUDA_PROFILE:
+    logger.warning_once(
+        "CUDA Profiler is enabled in the API server. This should ONLY be "
+        "used for local development!"
+    )
+if envs.VLLM_TORCH_PROFILER_DIR or envs.VLLM_TORCH_CUDA_PROFILE:

    @router.post("/start_profile")
    async def start_profile(raw_request: Request):