[Model Runner] Support overlap schedule (#6259)

This commit is contained in:
sunxin
2026-02-04 10:49:44 +08:00
committed by GitHub
parent 6225439778
commit 9b0a82cfa9
8 changed files with 132 additions and 57 deletions
+1
View File
@@ -272,6 +272,7 @@ class SchedulerConfig:
self.max_extra_num_batched_tokens = 16384 # extra token_num for multimodal inputs
self.max_num_seqs = 34
self.splitwise_role = "mixed"
self.enable_overlap_schedule = False
self.config = None
for key, value in args.items():