[XPU] fix thinking bug where output only contains reasoning_content (#4760)

Co-authored-by: ddchenhao66 <dhaochen163.com>
2026-04-23 00:17:25 +08:00 · 2025-11-04 12:47:34 +08:00
parent ffa57dbfac
commit 78a1451eb7
8 changed files with 201 additions and 21 deletions
@@ -202,6 +202,8 @@ def xpu_post_process(
        max_think_lens = share_inputs["max_think_lens"]
        step_idx = share_inputs["step_idx"]
        limit_think_status = share_inputs["limit_think_status"]
+        stop_flags = share_inputs["stop_flags"]
+        eos_token_ids = share_inputs["eos_token_id"]
        if limit_strategy == "</think>":
            # for ernie-45-vl
            limit_thinking_content_length_v1(
@@ -209,6 +211,8 @@ def xpu_post_process(
                max_think_lens,
                step_idx,
                limit_think_status,
+                stop_flags,
+                eos_token_ids,  # handle the model emitting an EOS token in the middle of thinking (a model-quality issue)
                think_end_id,
            )
        elif limit_strategy == "\n</think>\n\n":
@@ -219,6 +223,7 @@ def xpu_post_process(
                max_think_lens,
                step_idx,
                limit_think_status,
+                stop_flags,
                think_end_id,
                line_break_id,
            )