mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2026-04-23 00:17:25 +08:00
[Optimization][DeepSeekV3.2]Reducing slot_mapping compute frequency from twice per layer to a single pre-processing step. (#7367)
This commit is contained in:
@@ -85,6 +85,7 @@ class MockFDConfig:
|
||||
name = "default"
|
||||
splitwise_role = "mixed"
|
||||
max_num_seqs = 2
|
||||
max_num_batched_tokens = 2048
|
||||
|
||||
parallel_config = ParallelConfig()
|
||||
scheduler_config = SchedulerConfig()
|
||||
|
||||
Reference in New Issue
Block a user