[Feature] Consider multimodal models during the dummy run (#6045)

* add mm do profile

* update code

* update code

* update code

* update code

* update test case

* update code

* update code

* fix xpu bug

* update code

* add mm do profile

* update test case

* update code
This commit is contained in:
kevin
2026-02-09 17:49:55 +08:00
committed by GitHub
parent 783d56e28a
commit d60daca4a8
25 changed files with 166 additions and 19 deletions
@@ -98,6 +98,7 @@ class TestGraphOptBackend(unittest.TestCase):
model_config = Mock()
model_config.max_model_len = 512
model_config.architectures = ["test_model"]
model_config.mm_max_tokens_per_item = None
self.baseline_fd_config = FDConfig(
graph_opt_config=baseline_graph_opt_config,
scheduler_config=baseline_scheduler_config,
@@ -146,6 +147,7 @@ class TestGraphOptBackend(unittest.TestCase):
model_config = Mock()
model_config.max_model_len = 512
model_config.architectures = ["test_model"]
model_config.mm_max_tokens_per_item = None
# Create FD config
return FDConfig(