[Core] Support multi-node inference (eager and CUDA graph) (#3686)
This commit is contained in:
@@ -188,8 +188,6 @@ class RayGPUExecutor(ExecutorBase):
|
||||
is_driver_worker=True,
|
||||
)
|
||||
|
||||
# FIXME(woosuk): We are not properly initializing pynccl when
|
||||
# we have multiple nodes.
|
||||
self._run_workers("init_device")
|
||||
self._run_workers(
|
||||
"load_model",
|
||||
|
||||
Reference in New Issue
Block a user