[Core] Support multi-node inference (eager and CUDA graph) (#3686)

This commit is contained in:
Roy
2024-03-29 06:01:55 +08:00
committed by GitHub
parent a4075cba4d
commit 515386ef3c
7 changed files with 25 additions and 22 deletions

View File

@@ -188,8 +188,6 @@ class RayGPUExecutor(ExecutorBase):
is_driver_worker=True,
)
# FIXME(woosuk): We are not properly initializing pynccl when
# we have multiple nodes.
self._run_workers("init_device")
self._run_workers(
"load_model",