mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2026-04-23 00:17:25 +08:00
[BugFix] Fix return value inconsistency for ep_moe_expert_combine op (#5812)
This commit is contained in:
@@ -210,7 +210,7 @@ class CutlassMoEMethod(UnquantizedFusedMoEMethod):
|
||||
None, # down_proj_bias,
|
||||
False, # norm_topk_prob
|
||||
1.0,
|
||||
)[0]
|
||||
)
|
||||
else:
|
||||
tmp_ffn_out = recv_x
|
||||
|
||||
|
||||
@@ -250,7 +250,7 @@ class DeepGemmFusedMoeMethod(MoEMethodBase):
|
||||
None, # down_proj_bias
|
||||
False, # norm_topk_prob
|
||||
1.0,
|
||||
)[0]
|
||||
)
|
||||
|
||||
else:
|
||||
tmp_ffn_out = paddle.cast(recv_x[0], paddle.bfloat16)
|
||||
@@ -448,6 +448,6 @@ class DeepGemmFusedMoeMethod(MoEMethodBase):
|
||||
None,
|
||||
False, # norm_topk_prob
|
||||
1.0,
|
||||
)[0]
|
||||
)
|
||||
|
||||
return tmp_ffn_out
|
||||
|
||||
Reference in New Issue
Block a user