mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2026-04-23 17:11:21 +08:00
[Feature] Config eviction_duration (#7125)
* [Feature] Config eviction_duration
* [Feature] Config eviction_duration
* [Feature] Config eviction_duration
* [Feature] Config eviction_duration

---------

Co-authored-by: mouxin <mouxin@baidu.com>
This commit is contained in:
@@ -9,6 +9,7 @@ scheduler:
|
||||
prefill-policy: "cache_aware"
|
||||
decode-policy: "request_num"
|
||||
eviction-interval-secs: 60
|
||||
eviction-duration-mins: 30 # eviction duration for cache-aware radix tree nodes (minutes); default: 30
|
||||
balance-abs-threshold: 1
|
||||
balance-rel-threshold: 0.2
|
||||
hit-ratio-weight: 1.0
|
||||
|
||||
Reference in New Issue
Block a user