Fix nits in rl_llama3_demo.ipynb: correct docs links and remove STEPS/PER_DEVICE_BATCH_SIZE overrides

mydatascience · mydatascience · commit cd25f174ba42 · 2025-11-25T23:11:24.000+04:00
Signed-off-by: Vladimir Suvorov <suvorovv@google.com>
diff --git a/src/MaxText/examples/rl_llama3_demo.ipynb b/src/MaxText/examples/rl_llama3_demo.ipynb
@@ -63,7 +63,7 @@
     "## Setup\n",
     "\n",
     "Install dependencies and set up the environment:\n",
-    "https://maxtext.readthedocs.io/latest/tutorials/grpo.html#from-github"
+    "https://maxtext.readthedocs.io/en/latest/tutorials/grpo.html#from-github"
    ]
   },
   {
@@ -130,8 +130,6 @@
     "    print(\"Authentication failed: Hugging Face token not set\")\n",
     "\n",
     "# Optional: Override training parameters\n",
-    "STEPS = 10  # Reduced for demo purposes\n",
-    "PER_DEVICE_BATCH_SIZE = 1\n",
     "LEARNING_RATE = 3e-6\n",
     "NUM_GENERATIONS = 2\n",
     "GRPO_BETA = 0.08\n",
@@ -197,8 +195,6 @@
     "    f\"load_parameters_path={MODEL_CHECKPOINT_PATH}\",\n",
     "    f\"base_output_directory={OUTPUT_DIRECTORY}\",\n",
     "    f\"hf_access_token={HF_TOKEN}\",\n",
-    "    f\"steps={STEPS}\",\n",
-    "    f\"per_device_batch_size={PER_DEVICE_BATCH_SIZE}\",\n",
     "    f\"learning_rate={LEARNING_RATE}\",\n",
     "    f\"num_generations={NUM_GENERATIONS}\",\n",
     "    f\"grpo_beta={GRPO_BETA}\",\n",
@@ -211,7 +207,6 @@
     "# Initialize configuration\n",
     "print(f\"🔧 Initializing configuration from: {config_file}\")\n",
     "config = pyconfig.initialize(config_argv)\n",
-    "max_utils.print_system_information()\n",
     "\n",
     "print(\"\\n✅ Configuration initialized successfully\")\n",
     "print(f\"📊 Training steps: {config.steps}\")\n",
@@ -261,10 +256,9 @@
    "source": [
     "## 📚 Learn More\n",
     "\n",
-    "- **CLI Usage**: Run `python3 -m src.MaxText.rl.train_rl src/MaxText/configs/rl.yml --model_name=llama3.1-8b ...`\n",
+    "- **CLI Usage**: https://maxtext.readthedocs.io/en/latest/tutorials/grpo.html#run-grpo\n",
     "- **Configuration**: See `src/MaxText/configs/rl.yml` for all available options\n",
-    "- **Documentation**: Check `src/MaxText/rl/train_rl.py` for the `rl_train` function implementation\n",
-    "- **Examples**: See other examples in `src/MaxText/examples/`"
+    "- **Documentation**: Check `src/MaxText/rl/train_rl.py` for the `rl_train` function implementation"
    ]
   }
  ],