mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2026-04-23 00:17:25 +08:00
2.4_fix_mtp_forward_meta (#5977)
This commit is contained in:
@@ -1014,7 +1014,9 @@ class MTPProposer(Proposer):
|
|||||||
# 4. Compute logits, Sample
|
# 4. Compute logits, Sample
|
||||||
logits = self.model.compute_logits(hidden_states, forward_meta=self.forward_meta)
|
logits = self.model.compute_logits(hidden_states, forward_meta=self.forward_meta)
|
||||||
if self.enable_logprob and self.enable_draft_logprob and substep == 0:
|
if self.enable_logprob and self.enable_draft_logprob and substep == 0:
|
||||||
first_token_logits = self.model.compute_logits(self.model_inputs["first_token_hidden_states"])
|
first_token_logits = self.model.compute_logits(
|
||||||
|
self.model_inputs["first_token_hidden_states"], forward_meta=self.forward_meta
|
||||||
|
)
|
||||||
|
|
||||||
speculate_get_logits(
|
speculate_get_logits(
|
||||||
self.model_inputs["draft_logits"],
|
self.model_inputs["draft_logits"],
|
||||||
|
|||||||
Reference in New Issue
Block a user