diff --git a/examples/experiments/deepseek_v3_pretrain/run_pretrain.py b/examples/experiments/deepseek_v3_pretrain/run_pretrain.py index 8358c316224..e36d500ad52 100644 --- a/examples/experiments/deepseek_v3_pretrain/run_pretrain.py +++ b/examples/experiments/deepseek_v3_pretrain/run_pretrain.py @@ -239,10 +239,6 @@ class ModelArguments: "help": "Pre-training from existing paddleformers model weights. Default False and model will train from scratch. If set True, the model_name_or_path argument must exist in the paddleformers models." }, ) - num_hidden_layers: Optional[int] = field( - default=None, - metadata={"help": "num_hidden_layers."}, - ) def create_pretrained_dataset( diff --git a/paddleformers/cli/train/pretrain/workflow.py b/paddleformers/cli/train/pretrain/workflow.py index b2cea517dd3..a04cdf3eae2 100644 --- a/paddleformers/cli/train/pretrain/workflow.py +++ b/paddleformers/cli/train/pretrain/workflow.py @@ -176,10 +176,6 @@ class ModelArguments: "help": "Pre-training from existing paddleformers model weights. Default False and model will train from scratch. If set True, the model_name_or_path argument must exist in the paddleformers models." }, ) - num_hidden_layers: Optional[int] = field( - default=None, - metadata={"help": "num_hidden_layers."}, - ) def create_pretrained_dataset(