[DataProcessor] Refactor multimodal processor: extract encoding strategies and unify MM processing pipeline (#7298)

* merge mm processor
This commit is contained in:
luukunn
2026-04-15 19:01:06 +08:00
committed by GitHub
parent a218d29488
commit 3f84d8d893
36 changed files with 4016 additions and 681 deletions
+2 -2
View File
@@ -94,13 +94,13 @@ class InputPreprocessor:
tool_parser_obj=tool_parser_obj,
)
else:
-from fastdeploy.input.multimodal_processor import (
+from fastdeploy.input.mm_model_config import (
ERNIE4_5_VL,
PADDLEOCR_VL,
QWEN3_VL,
QWEN_VL,
-MultiModalProcessor,
)
+from fastdeploy.input.multimodal_processor import MultiModalProcessor
if ErnieArchitectures.contains_ernie_arch(architecture):
model_type = ERNIE4_5_VL