mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2026-04-23 00:17:25 +08:00
[Loader] add multi-thread model loading (#6877)
* multi-thread-loader
* fix ut
This commit is contained in:
@@ -613,6 +613,7 @@ class LLMEngine:
|
||||
f" --early_stop_config '{self.cfg.early_stop_config.to_json_string()}'"
|
||||
f" --reasoning_parser {self.cfg.structured_outputs_config.reasoning_parser}"
|
||||
f" --load_choices {self.cfg.load_config.load_choices}"
|
||||
f" --model_loader_extra_config '{json.dumps(self.cfg.load_config.model_loader_extra_config)}'"
|
||||
f" --plas_attention_config '{self.cfg.plas_attention_config.to_json_string()}'"
|
||||
f" --ips {ips}"
|
||||
f" --max_encoder_cache {self.cfg.cache_config.max_encoder_cache}"
|
||||
|
||||
Reference in New Issue
Block a user