Skip to content

Commit 60a8f09

Browse files
authored
zero val fix for beta: honor an explicitly configured beta of 0 instead of treating it as unset (axolotl-ai-cloud#2538)
1 parent 9da730d commit 60a8f09

File tree

1 file changed

+5
-3
lines changed

1 file changed

+5
-3
lines changed

src/axolotl/core/trainer_builder.py

Lines changed: 5 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -1040,9 +1040,11 @@ def build_training_arguments(self, total_num_steps):
10401040
if self.cfg.dataset_processes:
10411041
training_args_kwargs["dataset_num_proc"] = self.cfg.dataset_processes
10421042

1043-
if (self.cfg.trl and self.cfg.trl.beta) or self.cfg.rl_beta:
1044-
training_args_kwargs["beta"] = self.cfg.trl.beta or self.cfg.rl_beta
1045-
if self.cfg.orpo_alpha:
1043+
if self.cfg.trl and self.cfg.trl.beta is not None:
1044+
training_args_kwargs["beta"] = self.cfg.trl.beta
1045+
elif self.cfg.rl_beta is not None:
1046+
training_args_kwargs["beta"] = self.cfg.rl_beta
1047+
elif self.cfg.orpo_alpha is not None:
10461048
# trl does some odd mapping of alpha to beta to reuse the beta parameter ???
10471049
training_args_kwargs["beta"] = self.cfg.orpo_alpha
10481050

0 commit comments

Comments
 (0)