[XPU] Align MAX_BSZ with GPU settings and disable prefix caching in OCR VL (#5831)

2026-04-23 00:17:25 +08:00 · 2025-12-31 09:49:12 +08:00
parent 74e162697f
commit 9e45ef7ca9
6 changed files with 25 additions and 27 deletions
@@ -564,6 +564,9 @@ class EngineArgs:

        if "PaddleOCR" in get_model_architecture(self.model, self.model_config_name):
            envs.FD_ENABLE_MAX_PREFILL = 1
+            # TODO: support prefix caching for PaddleOCR on XPU; disabled until then.
+            if current_platform.is_xpu():
+                self.enable_prefix_caching = False

        if self.kvcache_storage_backend is not None:
            if not self.enable_prefix_caching: