From bd57b1e2a79fd18a1cf7a7c217fcb4e7d9c5c22a Mon Sep 17 00:00:00 2001 From: Jiang-Jia-Jun <163579578+Jiang-Jia-Jun@users.noreply.github.com> Date: Wed, 22 Apr 2026 11:02:26 +0800 Subject: [PATCH] Update args_utils.py --- fastdeploy/engine/args_utils.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/fastdeploy/engine/args_utils.py b/fastdeploy/engine/args_utils.py index 01b0c9de8e..1b9e21c202 100644 --- a/fastdeploy/engine/args_utils.py +++ b/fastdeploy/engine/args_utils.py @@ -263,7 +263,7 @@ class EngineArgs: """ Flag to enable prefix caching. """ - enable_output_caching: bool = False + enable_output_caching: bool = True """ Flag to enable kv cache for output tokens, only valid in V1 scheduler. """