mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2026-04-24 09:44:10 +08:00
moe preprocess op support 160 experts and fused_moe triton kernel name add K (#3121)
This commit is contained in:
@@ -168,6 +168,8 @@ std::vector<paddle::Tensor> tritonmoe_preprocess_kernel(const paddle::Tensor& to
       run_align_kernel(64);
     } else if (num_experts == 128) {
       run_align_kernel(128);
+    } else if (num_experts == 160) {
+      run_align_kernel(160);
     } else {
       PD_THROW("Not support num_experts: %d", num_experts);
     }
Reference in New Issue
Block a user