Skip to content

Commit dcf0a13

Browse files
committed
default load_best_model_at_end=False (#432)
1 parent adf68d1 commit dcf0a13

File tree

2 files changed: +0 -7 lines changed

swift/llm/dpo.py

Lines changed: 0 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -119,10 +119,8 @@ def llm_dpo(args: DPOArguments) -> str:
 
     # Setting training_args
     evaluation_strategy = IntervalStrategy.STEPS
-    load_best_model_at_end = False
     if val_dataset is None:
         evaluation_strategy = IntervalStrategy.NO
-        load_best_model_at_end = False
     additional_saved_files = []
     if args.sft_type == 'full':
         additional_saved_files = get_additional_saved_files(args.model_type)
@@ -149,7 +147,6 @@ def llm_dpo(args: DPOArguments) -> str:
         fp16=args.fp16,
         eval_steps=args.eval_steps,
         dataloader_num_workers=args.dataloader_num_workers,
-        load_best_model_at_end=load_best_model_at_end,
         metric_for_best_model='rouge-l'
         if args.predict_with_generate else 'loss',
         greater_is_better=args.predict_with_generate,

swift/llm/sft.py

Lines changed: 0 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -170,11 +170,8 @@ def llm_sft(args: SftArguments) -> Dict[str, Union[str, Any]]:
     data_collator = partial(template.data_collator, padding_to=padding_to)
     # Setting training_args
     evaluation_strategy = args.evaluation_strategy
-    load_best_model_at_end = True
     if val_dataset is None:
         evaluation_strategy = 'no'
-    if evaluation_strategy == 'no':
-        load_best_model_at_end = False
     additional_saved_files = []
     if args.sft_type == 'full':
         additional_saved_files = get_additional_saved_files(args.model_type)
@@ -210,7 +207,6 @@ def llm_sft(args: SftArguments) -> Dict[str, Union[str, Any]]:
         eval_steps=args.eval_steps,
         dataloader_num_workers=args.dataloader_num_workers,
         dataloader_pin_memory=args.dataloader_pin_memory,
-        load_best_model_at_end=load_best_model_at_end,
         metric_for_best_model='rouge-l'
         if args.predict_with_generate else 'loss',
         greater_is_better=args.predict_with_generate,

0 commit comments

Comments (0)