[Feature] Support mtp overlap schedule (#7001)

This commit is contained in:
sunxin
2026-04-01 14:24:26 +08:00
committed by GitHub
parent c6f0c5c3a6
commit c29e86fc9d
23 changed files with 215 additions and 138 deletions
@@ -160,6 +160,8 @@ class ForwardMeta:
position_ids: Optional[paddle.Tensor] = None
real_bsz: int = 0
def clear_caches(self):
"""Safely clean up the caches"""
if self.caches: