[Iluvatar GPU] Adapt VL model (#4313)

This commit is contained in:
yzwu
2025-10-17 16:13:38 +08:00
committed by GitHub
parent ba5c2b7e37
commit 4b661512ca
15 changed files with 345 additions and 228 deletions
@@ -35,6 +35,7 @@ from paddleformers.transformers.model_utils import PretrainedModel
from fastdeploy.model_executor.layers.utils import divide, get_tensor
from fastdeploy.model_executor.utils import set_weight_attrs
from fastdeploy.platforms import current_platform
from .activation import ACT2FN
from .configuration import DFNRopeVisionTransformerConfig
@@ -174,7 +175,7 @@ class VisionFlashAttention2(nn.Layer):
mp_group=fleet.get_hybrid_communicate_group().get_model_parallel_group(),
weight_attr=None,
has_bias=True,
fuse_matmul_bias=True,
fuse_matmul_bias=False if current_platform.is_iluvatar() else True,
gather_output=False,
)
self.proj = RowParallelLinear(
@@ -26,6 +26,11 @@ elif current_platform.is_xpu():
text_image_gather_scatter,
text_image_index_out,
)
elif current_platform.is_iluvatar():
from fastdeploy.model_executor.ops.iluvatar import (
text_image_gather_scatter,
text_image_index_out,
)
else:
raise ImportError("Unsupported platform, only support CUDA and XPU")
@@ -31,6 +31,7 @@ from fastdeploy.model_executor.models.ernie4_5_vl.dist_utils import (
scatter_axis,
)
from fastdeploy.model_executor.utils import set_weight_attrs
from fastdeploy.platforms import current_platform
class ScatterOp(PyLayer):
@@ -172,7 +173,7 @@ class VariableResolutionResamplerModel(nn.Layer):
self.spatial_dim,
input_is_parallel=True,
has_bias=True,
fuse_matmul_bias=True,
fuse_matmul_bias=False if current_platform.is_iluvatar() else True,
)
if self.tensor_parallel_degree > 1
else nn.Linear(self.spatial_dim, self.spatial_dim)