[Bugfix] Fix torchrun PP broadcast deadlock with async scheduling (#33701)

Signed-off-by: Isotr0py <mozf@mail2.sysu.edu.cn>
This commit is contained in:
Isotr0py
2026-02-04 10:17:37 +08:00
committed by GitHub
parent 1b8fe6f7c4
commit 02080179a3
3 changed files with 4 additions and 7 deletions

View File

@@ -32,9 +32,6 @@ llm = LLM(
gpu_memory_utilization=random.uniform(0.7, 0.9),
swap_space=random.randint(1, 4),
seed=0,
# FIXME(Isotr0py): async scheduling causes deadlock
# on torchrun with PP, need to investigate further.
async_scheduling=False,
)
outputs = llm.generate(prompts, sampling_params)