mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2026-04-23 08:21:53 +08:00
remove dev sync in prefill (#4598)
This commit is contained in:
@@ -435,6 +435,7 @@ class EPPrefillRunner(EPRunner):
|
||||
x: paddle.Tensor,
|
||||
topk_idx: paddle.Tensor,
|
||||
topk_weights: paddle.Tensor,
|
||||
expert_alignment: int = 1,
|
||||
*args,
|
||||
**kwargs,
|
||||
):
|
||||
@@ -461,6 +462,7 @@ class EPPrefillRunner(EPRunner):
|
||||
"async_finish": self.ep_engine.async_finish,
|
||||
"topk_idx": topk_idx,
|
||||
"topk_weights": topk_weights,
|
||||
"expert_alignment": expert_alignment,
|
||||
}
|
||||
return buffer.dispatch(**dispatch_args)
|
||||
|
||||
|
||||
Reference in New Issue
Block a user