[XPU] Align MAX_BSZ with GPU settings and disable prefix caching in OCR VL (#5831)

This commit is contained in:
ddchenhao66
2025-12-31 09:49:12 +08:00
committed by GitHub
parent 74e162697f
commit 9e45ef7ca9
6 changed files with 25 additions and 27 deletions
+3
View File
@@ -564,6 +564,9 @@ class EngineArgs:
if "PaddleOCR" in get_model_architecture(self.model, self.model_config_name):
envs.FD_ENABLE_MAX_PREFILL = 1
# TODO: support PaddleOCR prefix caching on XPU; until then it is forced off below.
if current_platform.is_xpu():
self.enable_prefix_caching = False
if self.kvcache_storage_backend is not None:
if not self.enable_prefix_caching: