Files
FastDeploy/fastdeploy/golang_router/examples/run_with_config/config/config.example.yaml
T
mouxin 0a92e96f20 [Feature] Add Golang-based Router for Request Scheduling and Load Balancing (#5882)
* [Feature] add golang router

* [Feature] add golang router

* [Feature] add golang router

* [Feature] add golang router

* [Feature] add golang router

* [Feature] Add Golang-based Router for Request Scheduling and Load Balancing

* [Feature] Add Golang-based Router for Request Scheduling and Load Balancing

* [Feature] Add Golang-based Router for Request Scheduling and Load Balancing

* [Feature] Add Golang-based Router for Request Scheduling and Load Balancing

---------

Co-authored-by: mouxin <mouxin@baidu.com>
2026-01-07 21:28:08 +08:00

32 lines
821 B
YAML

# Server section: listen address, port and run mode of the router.
server:
  port: "8080"  # quoted, so it is loaded as a string rather than an integer
  host: "0.0.0.0"
  mode: "debug"  # debug, release, test
  splitwise: true  # true means pd mode, false means mixed mode
# Scheduler section: policy names plus the numeric knobs that tune them.
# NOTE(review): prefill-policy / decode-policy presumably only matter when
# splitwise (pd mode) is enabled — confirm against the router code.
scheduler:
  policy: "power_of_two"
  prefill-policy: "cache_aware"
  decode-policy: "fd_metrics_score"
  eviction-interval-secs: 60
  balance-abs-threshold: 1
  balance-rel-threshold: 0.2
  hit-ratio-weight: 1.0
  load-balance-weight: 0.05
  cache-block-size: 4
  # NOTE(review): 0.0.0.0 is a bind-all address; as a client target it is
  # usually replaced by 127.0.0.1 or the real tokenizer host — confirm.
  tokenizer-url: "http://0.0.0.0:8098"  # optional tokenizer service endpoint
  tokenizer-timeout-secs: 2
  waiting-weight: 10
# Manager section: health-check thresholds and timing, plus the path of the
# registration file.
manager:
  health-failure-threshold: 3
  health-success-threshold: 2
  health-check-timeout-secs: 5
  health-check-interval-secs: 5
  health-check-endpoint: "/health"
  register-path: "config/register.yaml"
# Log section: verbosity level and output destination.
log:
  level: "info"  # debug, info, warn, error
  output: "file"  # stdout, file