[XPU] refine fused moe (#4219)

This commit is contained in:
zhupengyang
2025-10-16 19:04:07 +08:00
committed by GitHub
parent 3bbe99eae7
commit 26ff2f8683
7 changed files with 354 additions and 585 deletions
+3 -3
View File
@@ -404,9 +404,9 @@ class PaddleDisWorkerProc:
if num_blocks_local <= 0:
raise ValueError(
- "The total number of blocks cannot be less than zero."
- "Please increase gpu_memory_utilization"
- "Or decrease max_num_batched_tokens(max model length) "
+ "The total number of blocks cannot be less than zero. "
+ "Please increase gpu_memory_utilization "
+ "Or decrease max_num_batched_tokens(max model length)."
)
if self.ranks > 1: