[Fix] Fix top_k_top_p sampling (#2801)
Deploy GitHub Pages / deploy (push) Has been cancelled

* fix topk-topp

* update

* add base_non_truncated
This commit is contained in:
Sunny-bot1
2025-07-10 22:35:10 +08:00
committed by GitHub
parent 59071268b6
commit 240d6236bc
8 changed files with 23 additions and 123 deletions
+1 -1
View File
@@ -51,7 +51,7 @@ environment_variables: dict[str, Callable[[], Any]] = {
"FD_ATTENTION_BACKEND":
lambda: os.getenv("FD_ATTENTION_BACKEND", "APPEND_ATTN"),
-# 设置采样类别,当前可设置为 "base"、"air" 或 "rejection"
+# 设置采样类别,当前可设置为 "base"、"base_non_truncated"、"air" 或 "rejection"
"FD_SAMPLING_CLASS":
lambda: os.getenv("FD_SAMPLING_CLASS", "base"),