We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent bcb59c7, commit e4f73bc (Copy full SHA for e4f73bc)
src/axolotl/core/trainers/dpo/trainer.py
@@ -177,12 +177,8 @@ def tokenize_row(
177
# dpo trainer may incorrectly prepend the bos_token_id to the dpo outputs
178
if res["chosen_input_ids"][0] == processing_class.bos_token_id:
179
res["chosen_input_ids"] = res["chosen_input_ids"][1:]
180
- res["chosen_labels"] = res["chosen_labels"][1:]
181
- res["chosen_attention_mask"] = res["chosen_attention_mask"][1:]
182
if res["rejected_input_ids"][0] == processing_class.bos_token_id:
183
res["rejected_input_ids"] = res["rejected_input_ids"][1:]
184
- res["rejected_labels"] = res["rejected_labels"][1:]
185
- res["rejected_attention_mask"] = res["rejected_attention_mask"][1:]
186
187
return res
188
0 commit comments