Skip to content

Commit dc5a6af

Browse files
committed
save_model: checkpoint_done --> model_done
1 parent 6c1f449 commit dc5a6af

File tree

1 file changed

+2
-2
lines changed

1 file changed

+2
-2
lines changed

paddlenlp/trainer/trainer.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -2096,10 +2096,10 @@ def save_model(self, output_dir: Optional[str] = None, merge_tensor_parallel: Op
2096 2096
if not self.is_in_train:
2097 2097
self.args.unified_checkpoint_config = unified_checkpoint_config_backup
2098 2098
if strtobool(os.getenv("FLAG_LLM_PDC", "False")):
2099-
# save checkpoint_done file to ensure checkpoint is complete
2099+
# save model_done file to ensure model is complete
2100 2100
if self.args.should_save_model_state and self.args.should_save:
2101 2101
# For ckpt integrity
2102-
paddle.save(self.state.global_step, os.path.join(output_dir, ".checkpoint_done"))
2102+
paddle.save(self.state.global_step, os.path.join(output_dir, ".model_done"))
2103 2103

2104 2104
def _save_checkpoint(self, model, metrics=None):
2105 2105
# assert unwrap_model(model) is self.model, "internal model should be a reference to self.model"

0 commit comments

Comments (0)