[Others] upgrade paddleformer to 0.4.0 (#5599)

This commit is contained in:
bukejiyu
2025-12-23 21:08:01 +08:00
committed by GitHub
parent 85db9d5e56
commit d1c6e57341
21 changed files with 32 additions and 184 deletions
+3 -3
View File
@@ -815,8 +815,8 @@ def parse_args():
parser.add_argument(
"--load_choices",
type=str,
-default="default",
-help="The format of the model weights to load. default/new_loader.",
+default="default_v1",
+help="The format of the model weights to load. default/default_v1.",
)
parser.add_argument(
@@ -952,7 +952,7 @@ def initialize_fd_config(args, ranks: int = 1, local_rank: int = 0) -> FDConfig:
# Note(tangbinhan): used for load_checkpoint
model_config.pretrained_config.tensor_parallel_rank = parallel_config.tensor_parallel_rank
-model_config.pretrained_config.tensor_parallel_degree = parallel_config.tensor_parallel_size
+model_config.pretrained_config.tensor_model_parallel_size = parallel_config.tensor_parallel_size
model_config.pretrained_config.is_mtp = False
model_config.pretrained_config.head_dim = model_config.head_dim