Merged
4 changes: 0 additions & 4 deletions model_zoo/bert/README.md
@@ -65,7 +65,6 @@ python -m paddle.distributed.launch --gpus "0" run_pretrain.py \
--weight_decay 1e-2 \
--adam_epsilon 1e-6 \
--warmup_steps 10000 \
--num_train_epochs 3 \
Contributor (author) comment: The `num_train_epochs` parameter is not used by the script, and setting it causes an error, so it was removed.

--input_dir data/ \
--output_dir pretrained_models/ \
--logging_steps 1 \
@@ -83,7 +82,6 @@ python -m paddle.distributed.launch --gpus "0" run_pretrain.py \
- `weight_decay`: the weight decay coefficient used by the AdamW optimizer.
- `adam_epsilon`: the epsilon value used by the AdamW optimizer.
- `warmup_steps`: the number of warmup steps for the dynamic learning-rate schedule.
- `num_train_epochs`: the number of training epochs.
- `input_dir`: the input data directory; all files under it whose names contain "training" are used as training data.
- `output_dir`: the directory where the model is saved.
- `logging_steps`: the logging interval, in steps.
@@ -128,7 +126,6 @@ python -m paddle.distributed.launch --xpus "0" run_pretrain.py \
--weight_decay 1e-2 \
--adam_epsilon 1e-6 \
--warmup_steps 10000 \
--num_train_epochs 3 \
--input_dir data/ \
--output_dir pretrained_models/ \
--logging_steps 1 \
@@ -146,7 +143,6 @@ python -m paddle.distributed.launch --xpus "0" run_pretrain.py \
- `weight_decay`: the weight decay coefficient used by the AdamW optimizer.
- `adam_epsilon`: the epsilon value used by the AdamW optimizer.
- `warmup_steps`: the number of warmup steps for the dynamic learning-rate schedule.
- `num_train_epochs`: the number of training epochs.
- `input_dir`: the input data directory; all files under it whose names contain "training" are used as training data.
- `output_dir`: the directory where the model is saved.
- `logging_steps`: the logging interval, in steps.
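The reviewer's comment notes that passing an unused flag makes the script error out. That is the usual behavior of a strict argument parser, which rejects any flag it does not define. A minimal, hypothetical illustration with the standard library's argparse (this is not the actual run_pretrain.py argument set):

```python
import argparse

# A strict parser rejects flags it does not define; an undefined
# --num_train_epochs makes parse_args() exit with an error.
parser = argparse.ArgumentParser()
parser.add_argument("--warmup_steps", type=int, default=10000)

ok = parser.parse_args(["--warmup_steps", "500"])

try:
    parser.parse_args(["--num_train_epochs", "3"])
    rejected = False
except SystemExit:
    # argparse prints a usage error and raises SystemExit for unknown flags.
    rejected = True
```

This is why the flag had to be dropped from the README rather than merely documented as optional.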
4 changes: 4 additions & 0 deletions paddlenlp/trainer/trainer.py
@@ -264,6 +264,10 @@ def __init__(
if model is None:
raise RuntimeError("`Trainer` requires either a `model` or `model_init` argument")

if self.args.to_static:
model = paddle.jit.to_static(model)
logger.info("Successfully applied @to_static to the whole model.")

if self.args.should_save or self.args.should_save_model_state:
os.makedirs(self.args.output_dir, exist_ok=True)

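The change above gates static-graph conversion on the new flag: the model is wrapped only when `to_static` is set, and a log line records the conversion. A runnable sketch of that gating pattern, with a hypothetical `maybe_to_static` helper and a `convert` stand-in for `paddle.jit.to_static` so the sketch runs without Paddle installed (the real code calls `paddle.jit.to_static` directly inside `Trainer.__init__`):

```python
# Sketch only: `maybe_to_static` and `convert` are illustrative names,
# not part of the PaddleNLP API.
def maybe_to_static(model, to_static, convert=None, log=print):
    """Return `model` unchanged unless `to_static` is True, in which
    case apply `convert` (stand-in for paddle.jit.to_static) and log."""
    if not to_static:
        return model
    convert = convert if convert is not None else (lambda m: m)
    model = convert(model)
    log("Successfully applied @to_static to the whole model.")
    return model
```

Gating the conversion behind a flag keeps dynamic-graph training the default, so existing users see no behavior change.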
4 changes: 4 additions & 0 deletions paddlenlp/trainer/training_args.py
@@ -705,6 +705,10 @@ class TrainingArguments:
default=False,
metadata={"help": "Whether to unify hybrid parallel checkpoint."},
)
to_static: Optional[bool] = field(
default=False,
metadata={"help": "Enable training under @to_static."},
)

def __post_init__(self):
env_local_rank = int(os.environ.get("PADDLE_RANK_IN_NODE", -1))
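The new `to_static` flag follows the `field(default=..., metadata={"help": ...})` convention that dataclass-based argument containers like `TrainingArguments` use throughout this file. A minimal stand-in showing the pattern (`Args` is illustrative, not the real `TrainingArguments`):

```python
from dataclasses import dataclass, field
from typing import Optional

# Illustrative container mirroring the TrainingArguments field style:
# the default keeps existing behavior, and the metadata "help" string
# is what argument-parsing machinery surfaces to users.
@dataclass
class Args:
    to_static: Optional[bool] = field(
        default=False,
        metadata={"help": "Enable training under @to_static."},
    )

args = Args()
```

Because the default is `False`, adding the field is backward compatible: only users who opt in get the static-graph path.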