[Misc] Remove use of CUDA_VISIBLE_DEVICES for device selection (fix DP slow startup time &c) (#26709)

Signed-off-by: ilmarkov <markovilya197@gmail.com>
Co-authored-by: Tyler Michael Smith <tlrmchlsmth@gmail.com>
This commit is contained in:
Ilya Markov
2025-10-23 14:58:39 +02:00
committed by GitHub
parent faee3ccdc2
commit 237cf6d32a
4 changed files with 35 additions and 7 deletions

View File

@@ -134,9 +134,12 @@ class CoreEngineProcManager:
data_parallel = vllm_config.parallel_config.data_parallel_size > 1
try:
for proc, local_dp_rank in zip(self.processes, local_dp_ranks):
+# Adjust device control in DP for non-CUDA platforms
+# For CUDA platforms, setting same device id for different DP
+# processes affects NCCL init performance.
 with (
 set_device_control_env_var(vllm_config, local_dp_rank)
-if (data_parallel)
+if (data_parallel and not current_platform.is_cuda_alike())
else contextlib.nullcontext()
):
proc.start()