Allow data-parallel (DP) processes to start in parallel (#7426)

This commit is contained in:
RichardWooSJTU
2026-04-16 18:43:09 +08:00
committed by GitHub
parent 420a8c1af5
commit d2d633b05c
+7 -1
View File
@@ -876,8 +876,14 @@ class LLMEngine:
+ f" data parallel id {i}"
)
self.dp_processed[-1].start()
for i in range(
1,
self.cfg.parallel_config.data_parallel_size // self.cfg.nnode,
):
while self.launched_expert_service_signal.value[i] == 0:
time.sleep(1)
time.sleep(0.1)
def check_worker_initialize_status(self):
"""