mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2026-04-23 00:17:25 +08:00
[BugFix] Fix redundant prompt_logprobs in the second chunk of streaming response when return_token_ids is enabled for v1/completions and fix trace file name (#5829)
* fix prompt logprobs bug
* fix trace file name

---------

Co-authored-by: qwes5s5 <root@yq01-sys-rpm26xc1knu.yq01.baidu.com>
This commit is contained in:
@@ -546,7 +546,9 @@ class OpenAIServingCompletion:
 reasoning_content="",
 arrival_time=arrival_time,
 logprobs=logprobs_res,
-prompt_logprobs=clamp_prompt_logprobs(prompt_logprobs_res),
+prompt_logprobs=(
+    clamp_prompt_logprobs(prompt_logprobs_res) if not request.return_token_ids else None
+),
 draft_logprobs=draft_logprobs_res,
 speculate_metrics=output_speculate_metrics,
 )
Reference in New Issue
Block a user