Fix PFCC DeepEP in low-latency mode (#6440)

This commit is contained in:
RichardWooSJTU
2026-03-02 10:35:51 +08:00
committed by GitHub
parent 59b578c337
commit 7cfb0ffba0
+6 -3
View File
@@ -196,10 +196,13 @@ class DeepEPBuffer:
def _create_low_latency_buffer(self):
if self.deepep_buffer is None:
assert self.num_experts % self.ep_size == 0
if self.ep_size // 8 > 1:
num_qps_per_rank_now = self.ep_size // 8
if envs.FD_USE_PFCC_DEEP_EP:
num_qps_per_rank_now = self.num_experts // self.ep_size
else:
num_qps_per_rank_now = 1
if self.ep_size // 8 > 1:
num_qps_per_rank_now = self.ep_size // 8
else:
num_qps_per_rank_now = 1
self.deepep_buffer = deep_ep.Buffer(
self.group,
self.num_nvl_bytes,