2 files changed: +1 -8 lines changed
Original file line number | Diff line number | Diff line change
@@ -147,11 +147,6 @@ class TrainingConfig:
147
147
gradient_checkpointing : bool = True
148
148
gradient_checkpointing_kwargs : Dict [str , Any ] = field (default_factory = lambda : {"use_reentrant" : False })
149
149
150
- # Mixed precision
151
- fp16 : bool = False
152
- bf16 : bool = True
153
- tf32 : bool = True # Enable TF32 on Ampere GPUs
154
-
155
150
# Evaluation and checkpointing
156
151
evaluation_strategy : str = "steps"
157
152
eval_steps : int = 500
Original file line number | Diff line number | Diff line change
@@ -178,9 +178,7 @@ def main():
178
178
adam_epsilon = config .training .adam_epsilon ,
179
179
weight_decay = config .training .weight_decay ,
180
180
max_grad_norm = config .training .max_grad_norm ,
181
- fp16 = config .training .fp16 ,
182
- bf16 = config .training .bf16 ,
183
- tf32 = config .training .tf32 ,
181
+ bf16 = True , # We're sticking with this known good reduced precision option
184
182
eval_strategy = config .training .evaluation_strategy ,
185
183
eval_steps = config .training .eval_steps ,
186
184
save_strategy = config .training .save_strategy ,
You can’t perform that action at this time.
0 commit comments