mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2026-04-23 00:17:25 +08:00
[Feature] support stop_token_ids (#5399)
* support stop_token_ids * fix * delete chinese * support both * delete print
This commit is contained in:
@@ -420,6 +420,7 @@ void GetStopFlagsMulti(const paddle::Tensor& topk_ids,
|
||||
const paddle::Tensor& step_idx,
|
||||
const paddle::Tensor& stop_seqs,
|
||||
const paddle::Tensor& stop_seqs_len,
|
||||
const paddle::Tensor& min_tokens,
|
||||
const bool beam_search);
|
||||
|
||||
void UpdateInputs(const paddle::Tensor& stop_flags,
|
||||
@@ -764,7 +765,8 @@ void SpecGetStopFlagsMultiSeqs(const paddle::Tensor& accept_tokens,
|
||||
const paddle::Tensor& seq_lens,
|
||||
const paddle::Tensor& stop_seqs,
|
||||
const paddle::Tensor& stop_seqs_len,
|
||||
const paddle::Tensor& end_ids);
|
||||
const paddle::Tensor& end_ids,
|
||||
const paddle::Tensor& min_tokens);
|
||||
|
||||
void SpeculateVerify(const paddle::Tensor& sampled_token_ids,
|
||||
const paddle::Tensor& accept_tokens,
|
||||
|
||||
Reference in New Issue
Block a user