Skip to content

Commit eae2b7e

Browse files
authored
chore: Upgrade trl, vllm, and transformers in grpo_trl example (#1498)
- trl[vllm]: 0.19.1 -> 0.28.0
- vllm: 0.9.1 -> 0.12.0 (max supported by trl 0.28.0)
- transformers: 4.52.4 -> 4.57
- flashinfer-python: 0.2.6.post1 -> 0.5.3
1 parent cd91de3 commit eae2b7e

File tree

1 file changed

+5
-5
lines changed

1 file changed

+5
-5
lines changed

06_gpu_and_ml/reinforcement-learning/grpo_trl.py

Lines changed: 5 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -24,9 +24,9 @@
2424
# We define an image where we install the TRL library.
2525
# We also install vLLM for the next part of this example. We also use Weights & Biases for logging.
2626
image: modal.Image = modal.Image.debian_slim().uv_pip_install(
27-
"trl[vllm]==0.19.1",
28-
"vllm==0.9.1",
29-
"transformers==4.52.4",
27+
"trl[vllm]==0.28.0",
28+
"vllm==0.12.0",
29+
"transformers==4.57",
3030
"datasets==3.5.1",
3131
"wandb==0.17.6",
3232
)
@@ -236,8 +236,8 @@ def get_latest_checkpoint_file_path():
236236
vllm_image = (
237237
modal.Image.debian_slim(python_version="3.12")
238238
.uv_pip_install(
239-
"vllm==0.9.1",
240-
"flashinfer-python==0.2.6.post1",
239+
"vllm==0.12.0",
240+
"flashinfer-python==0.5.3",
241241
extra_index_url="https://download.pytorch.org/whl/cu128",
242242
extra_options="--index-strategy unsafe-best-match",
243243
)

0 commit comments

Comments
 (0)