Skip to content

Commit 0dc40b3

Browse files
committed
rollback trl
1 parent 5951c9a commit 0dc40b3

File tree

2 files changed

+4
-5
lines changed

2 files changed

+4
-5
lines changed

pyproject.toml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -34,7 +34,7 @@ dependencies = [
34 34
"sentencepiece>=0.1.99,<0.3",
35 35
"tokenizers>=0.13.3,<1.0",
36 36
"tqdm>=4.66.2,<5.0",
37-
"trl>=0.13,<0.18",
37+
"trl>=0.13,<0.17",
38 38
"peft>=0.15.0,<=0.15.2",
39 39
"protobuf>=5.28.0,<6.0.0",
40 40
"datasets>=3.5.0,<4.0",

tuning/data/data_preprocessing_utils.py

Lines changed: 3 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -98,10 +98,9 @@ def get_data_collator(
98 98
# was removed from tokenized data processing, should eventually
99 99
# be added back in with support directly in fms-hf-tuning, not
100 100
# dependent on trl.
101-
# return DataCollatorForSeq2Seq(
102-
# tokenizer=tokenizer, padding=True, max_length=max_seq_length
103-
# )
104-
return None
101+
return DataCollatorForSeq2Seq(
102+
tokenizer=tokenizer, padding=True, max_length=max_seq_length
103+
)
105 104

106 105
# TODO: near term - how response template ids are parsed out needs to be cleaned.
107 106
# The [2:] here applies if response template has \n prefix, it is needed to strip \n,

0 commit comments

Comments
 (0)