[Feature] consider multimodal model when dummy run (#6045)

* add mm do profile * updata code * update code * update code * update code * update test case * update code * update code * fix xpu bug * update code * add mm do profile * update test case * update code
2026-04-23 00:17:25 +08:00 · 2026-02-09 17:49:55 +08:00
parent 783d56e28a
commit d60daca4a8
25 changed files with 166 additions and 19 deletions
@@ -584,6 +584,7 @@ class TestCommonEngineAdditionalCoverage(unittest.TestCase):
        with patch("fastdeploy.engine.common_engine.EngineWorkerQueue", DummyQ):
            eng = EngineService(cfg, start_queue=False, use_async_llm=True)
        eng.data_processor = self._stub_processor()
+        eng.mm_max_tokens_per_item = None

        captured = {"cmd": None}