Mirror of https://github.com/PaddlePaddle/FastDeploy.git (synced 2026-04-23 00:17:25 +08:00)
qwen loader (#3057)
This commit is contained in:
@@ -84,9 +84,10 @@ class MTPProposer(Proposer):
|
||||
"""
|
||||
Load MTP Layer
|
||||
"""
|
||||
from fastdeploy.model_executor.model_loader import get_model_from_loader
|
||||
from fastdeploy.model_executor.model_loader import get_model_loader
|
||||
|
||||
self.model = get_model_from_loader(self.cfg)
|
||||
model_loader = get_model_loader(load_config=self.cfg.load_config)
|
||||
self.model = model_loader.load_model(fd_config=self.cfg)
|
||||
|
||||
def dummy_prefill_inputs(self, num_tokens: int, batch_size: int, expected_decode_len: int):
|
||||
"""Set dummy prefill inputs to model_inputs"""
|
||||
|
||||
Reference in New Issue
Block a user