mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2026-04-23 00:17:25 +08:00
fix mtp acceptance rate decline (#6470)
This commit is contained in:
@@ -890,7 +890,8 @@ class ProposerInputBatch(InputBatch):
|
||||
self.block_tables = paddle.clone(self.target_model_input_batch["block_tables"])
|
||||
self.input_ids = paddle.clone(self.target_model_input_batch["input_ids"])
|
||||
fill_paddle_tensor(self, "input_ids_cpu", -1)
|
||||
self.seq_lens_this_time_buffer = paddle.clone(self.target_model_input_batch["seq_lens_this_time"])
|
||||
# acceptance rate decline when reset seq_lens_this_time
|
||||
# self.seq_lens_this_time_buffer = paddle.clone(self.target_model_input_batch["seq_lens_this_time"])
|
||||
|
||||
self.seq_lens_encoder = paddle.clone(self.target_model_input_batch["seq_lens_encoder"])
|
||||
self.seq_lens_decoder = paddle.clone(self.target_model_input_batch["seq_lens_decoder"])
|
||||
|
||||
Reference in New Issue
Block a user