mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2026-04-23 00:17:25 +08:00
[FDConfig] disable chunked_mm_input in ernie5 (#5774)
* disable chunked_mm_input in ernie5 * update code * update code * update test case * update testcase * update case
This commit is contained in:
@@ -55,6 +55,7 @@ class TestRedundantExpertManager(unittest.TestCase):
|
||||
model_cfg.moe_num_experts = 64
|
||||
model_cfg.moe_layer_start_index = 1
|
||||
model_cfg.model = "/test/model"
|
||||
model_cfg.architectures = ["test_model"]
|
||||
cache_cfg.bytes_per_layer_per_block = 1
|
||||
|
||||
parallel_cfg = ParallelConfig(args)
|
||||
|
||||
Reference in New Issue
Block a user