[MTP] Support MTP reshard (#4099)

* Support RL reshard
* Modify model name
2026-04-23 00:17:25 +08:00 · 2025-09-15 17:13:53 +08:00
parent 46911f903d
commit 69aa2781a1
3 changed files with 4 additions and 0 deletions
@@ -63,6 +63,7 @@ class RolloutModelConfig:
        local_rank: int = 0,
        moba_attention_config: str = None,
        data_parallel_size: int = 1,
+        num_nextn_predict_layers: int = 0,
    ):
        # Required parameters
        self.model = model_name_or_path
@@ -109,6 +110,7 @@ class RolloutModelConfig:
        self.early_stop_config = early_stop_config
        self.ips = None
        self.moba_attention_config = moba_attention_config
+        self.num_nextn_predict_layers = num_nextn_predict_layers

    def __str__(self):
        return "\n".join(f"{k}: {v}" for k, v in self.__dict__.items())