[V1][PP] Enable true PP with Ray executor (#13472)

Signed-off-by: Woosuk Kwon <woosuk.kwon@berkeley.edu>
This commit is contained in:
Woosuk Kwon
2025-02-18 09:15:32 -08:00
committed by GitHub
parent a02c86b4dd
commit 4fb8142a0e

View File

@@ -32,7 +32,7 @@ class RayDistributedExecutor(RayDistributedExecutorV0, Executor):
 """Ray distributed executor supports pipeline parallelism,
 meaning that it allows PP size batches to be executed concurrently.
 """
-return 1 #self.vllm_config.parallel_config.pipeline_parallel_size
+return self.parallel_config.pipeline_parallel_size
 def execute_model(
 self,