mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2026-04-24 09:44:10 +08:00
[Feature] Support mtp overlap schedule (#7001)
This commit is contained in:
@@ -123,7 +123,7 @@ def gather_logprobs(
|
||||
indices = token_ids
|
||||
top_logprobs = token_logprobs
|
||||
|
||||
return LogprobsTensors(indices, top_logprobs, token_ranks)
|
||||
return LogprobsTensors(indices.cpu(), top_logprobs.cpu(), token_ranks.cpu())
|
||||
|
||||
|
||||
def build_output_logprobs(
|
||||
|
||||
Reference in New Issue
Block a user