[Model Runner] Support overlap schedule (#6259)

This commit is contained in:
sunxin
2026-02-04 10:49:44 +08:00
committed by GitHub
parent 6225439778
commit 9b0a82cfa9
8 changed files with 132 additions and 57 deletions
+1
View File
@@ -1989,6 +1989,7 @@ class EngineService:
"enable_logprob": self.cfg.model_config.enable_logprob,
"lm_head_fp32": self.cfg.model_config.lm_head_fp32,
"enable_entropy": self.cfg.model_config.enable_entropy,
"enable_overlap_schedule": self.cfg.scheduler_config.enable_overlap_schedule,
}
for worker_flag, value in worker_store_true_flag.items():
if value: