mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2026-04-23 00:17:25 +08:00
[Feature] Support mtp overlap schedule (#7001)
This commit is contained in:
@@ -160,6 +160,8 @@ class ForwardMeta:

    position_ids: Optional[paddle.Tensor] = None

    real_bsz: int = 0

    def clear_caches(self):
        """Safely clean up the caches"""
        if self.caches:
Reference in New Issue
Block a user