mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2026-04-23 00:17:25 +08:00
[Model Runner] Support overlap schedule (#6259)
This commit is contained in:
@@ -272,6 +272,7 @@ class SchedulerConfig:
|
||||
self.max_extra_num_batched_tokens = 16384 # extra token_num for multimodal inputs
|
||||
self.max_num_seqs = 34
|
||||
self.splitwise_role = "mixed"
|
||||
self.enable_overlap_schedule = False
|
||||
self.config = None
|
||||
|
||||
for key, value in args.items():
|
||||
|
||||
Reference in New Issue
Block a user