[Others] Support constrained decoding when enable_thinking is false (#6248)

* support constrained decoding when enable_thinking is false

* fix

* fix

* fix
This commit is contained in:
GoldPancake
2026-01-28 00:05:17 -08:00
committed by GitHub
parent 27f8799f04
commit 7d6c87c29e
6 changed files with 88 additions and 4 deletions
@@ -243,6 +243,7 @@ def reasoning_phase_token_constraint(
reasoning_status: paddle.Tensor,
output_padding_offset: paddle.Tensor,
output_cum_offsets: paddle.Tensor,
enable_thinking: paddle.Tensor,
think_end_id: int,
line_break_id: int,
):
@@ -263,6 +264,7 @@ def reasoning_phase_token_constraint(
reasoning_status,
output_padding_offset,
output_cum_offsets,
enable_thinking,
think_end_id,
line_break_id,
)