mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2026-04-22 16:07:51 +08:00
2.4_fix_mtp_forward_meta (#5977)
This commit is contained in:
@@ -1014,7 +1014,9 @@ class MTPProposer(Proposer):
 # 4. Compute logits, Sample
 logits = self.model.compute_logits(hidden_states, forward_meta=self.forward_meta)
 if self.enable_logprob and self.enable_draft_logprob and substep == 0:
-    first_token_logits = self.model.compute_logits(self.model_inputs["first_token_hidden_states"])
+    first_token_logits = self.model.compute_logits(
+        self.model_inputs["first_token_hidden_states"], forward_meta=self.forward_meta
+    )
 
     speculate_get_logits(
         self.model_inputs["draft_logits"],
|
||||
Reference in New Issue
Block a user