Skip to content

Commit a8862f4

Browse files
committed
Merge remote-tracking branch 'upstream/main'
2 parents 4e0fd36 + 806d6bc commit a8862f4

File tree

3 files changed

+776
-707
lines changed

3 files changed

+776
-707
lines changed

examples/kfto-sft-llm/sft.ipynb

Lines changed: 6 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -198,7 +198,12 @@
198198
" model_args.model_name_or_path, trust_remote_code=model_args.trust_remote_code, use_fast=True\n",
199199
" )\n",
200200
" if tokenizer.pad_token is None:\n",
201-
" tokenizer.pad_token = tokenizer.eos_token\n",
201+
" # Models like Llama 3 use a dedicated padding token\n",
202+
" right_pad_id = tokenizer.convert_tokens_to_ids('<|finetune_right_pad_id|>')\n",
203+
" if right_pad_id is not None:\n",
204+
" tokenizer.pad_token = '<|finetune_right_pad_id|>'\n",
205+
" else:\n",
206+
" tokenizer.pad_token = tokenizer.eos_token\n",
202207
"\n",
203208
" # Chat template\n",
204209
" # You may need to provide your own chat template if the model does not have a default one\n",

images/runtime/training/py311-rocm62-torch251/Pipfile

Lines changed: 4 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -9,18 +9,18 @@ verify_ssl = true
99
name = "pytorch"
1010

1111
[packages]
12-
peft = ">=0.14.0"
12+
peft = ">=0.15.2"
1313
datasets = ">=2.15.0"
1414
liger-kernel = "==0.5.4"
15-
transformers = ">=4.49.0"
15+
transformers = ">=4.51.3"
1616
numpy = "<2.0.0,>=1.23.5"
17-
accelerate = ">=1.4.0"
17+
accelerate = ">=1.6.0"
1818
torch = {version = "==2.5.1+rocm6.2", index = "pytorch"}
1919
pytorch-triton-rocm = {version = "*", index = "pytorch"}
2020
sentencepiece = "<0.3,>=0.1.99"
2121
tokenizers = "<1.0,>=0.13.3"
2222
tqdm = "<5.0,>=4.66.2"
23-
trl = ">=0.15.2"
23+
trl = ">=0.17.0"
2424
protobuf = "<6.0.0,>=5.28.0"
2525
simpleeval = "<1.0,>=0.9.13"
2626
safetensors = "*"

0 commit comments

Comments
 (0)