|
6 | 6 | "id": "gOpYt-Zgspvw" |
7 | 7 | }, |
8 | 8 | "source": [ |
9 | | - "To run this, press \"*Runtime*\" and press \"*Run all*\" on a **free** Tesla T4 Google Colab instance!\n", |
| 9 | + "To run this, press \"*Runtime*\" and then press \"*Run all*\" on a Google Colab A100 instance!\n", |
10 | 10 | "<div class=\"align-center\">\n", |
11 | 11 | "<a href=\"https://unsloth.ai/\"><img src=\"https://github.com/unslothai/unsloth/raw/main/images/unsloth%20new%20logo.png\" width=\"115\"></a>\n", |
12 | 12 | "<a href=\"https://discord.gg/unsloth\"><img src=\"https://github.com/unslothai/unsloth/raw/main/images/Discord button.png\" width=\"145\"></a>\n", |
|
75 | 75 | " xformers = 'xformers==' + {'2.10':'0.0.34','2.9':'0.0.33.post1','2.8':'0.0.32.post2'}.get(v, \"0.0.34\")\n", |
76 | 76 | " !pip install sentencepiece protobuf \"datasets==4.3.0\" \"huggingface_hub>=0.34.0\" hf_transfer\n", |
77 | 77 | " !pip install --no-deps unsloth_zoo bitsandbytes accelerate {xformers} peft trl triton unsloth\n", |
78 | | - "!pip install --no-deps git+https://github.com/huggingface/transformers.git\n", |
| 78 | + "!pip install --no-deps transformers==5.5.0\n", |
79 | 79 | "!pip install torchcodec\n", |
80 | 80 | "import torch; torch._dynamo.config.recompile_limit = 64;" |
81 | 81 | ] |
|
112 | 112 | "from unsloth import FastVisionModel # FastLanguageModel for LLMs\n", |
113 | 113 | "import torch\n", |
114 | 114 | "\n", |
115 | | - "# 4bit pre quantized models we support for 4x faster downloading + no OOMs.\n", |
116 | | - "fourbit_models = [\n", |
117 | | - " # Gemma 4 models\n", |
| 115 | + "gemma4_models = [\n", |
| 116 | + " # Gemma-4 instruct models:\n", |
118 | 117 | " \"unsloth/gemma-4-E2B-it\",\n", |
119 | | - " \"unsloth/gemma-4-E2B\",\n", |
| 118 | + " \"unsloth/gemma-4-E4B-it\",\n", |
| 119 | + " \"unsloth/gemma-4-31B-it\",\n", |
120 | 120 | " \"unsloth/gemma-4-26B-A4B-it\",\n", |
| 121 | + " # Gemma-4 base models:\n", |
| 122 | + " \"unsloth/gemma-4-E2B\",\n", |
121 | 123 | " \"unsloth/gemma-4-E4B\",\n", |
122 | | - " \"unsloth/gemma-4-31B-it\",\n", |
123 | 124 | " \"unsloth/gemma-4-31B\",\n", |
124 | | - " \"unsloth/gemma-4-26B-A4B-it\",\n", |
125 | 125 | " \"unsloth/gemma-4-26B-A4B\",\n", |
126 | 126 | "] # More models at https://huggingface.co/unsloth\n", |
127 | 127 | "\n", |
|
394 | 394 | }, |
395 | 395 | "outputs": [], |
396 | 396 | "source": [ |
397 | | - "FastVisionModel.for_inference(model) # Enable for inference!\n", |
398 | | - "\n", |
399 | 397 | "image = dataset[2][\"image\"]\n", |
400 | 398 | "instruction = \"Write the LaTeX representation for this image.\"\n", |
401 | 399 | "\n", |
|
453 | 451 | "from unsloth.trainer import UnslothVisionDataCollator\n", |
454 | 452 | "from trl import SFTTrainer, SFTConfig\n", |
455 | 453 | "\n", |
456 | | - "FastVisionModel.for_training(model) # Enable for training!\n", |
457 | | - "\n", |
458 | 454 | "trainer = SFTTrainer(\n", |
459 | 455 | " model = model,\n", |
460 | 456 | " train_dataset = converted_dataset,\n", |
|
463 | 459 | " args = SFTConfig(\n", |
464 | 460 | " per_device_train_batch_size = 1,\n", |
465 | 461 | " gradient_accumulation_steps = 4,\n", |
466 | | - " gradient_checkpointing = True,\n", |
467 | | - "\n", |
468 | | - " # use reentrant checkpointing\n", |
469 | | - " gradient_checkpointing_kwargs = {\"use_reentrant\": False},\n", |
470 | | - " max_grad_norm = 0.3, # max gradient norm based on QLoRA paper\n", |
| 462 | + " max_grad_norm = 0.3,\n", |
471 | 463 | " warmup_ratio = 0.03,\n", |
472 | 464 | " max_steps = 60,\n", |
473 | | - " #num_train_epochs = 2, # Set this instead of max_steps for full training runs\n", |
| 465 | + " # num_train_epochs = 2, # Set this instead of max_steps for full training runs\n", |
474 | 466 | " learning_rate = 2e-4,\n", |
475 | 467 | " logging_steps = 1,\n", |
476 | 468 | " save_strategy = \"steps\",\n", |
477 | | - " optim = \"adamw_torch_fused\",\n", |
| 469 | + " optim = \"adamw_8bit\",\n", |
478 | 470 | " weight_decay = 0.001,\n", |
479 | 471 | " lr_scheduler_type = \"cosine\",\n", |
480 | 472 | " seed = 3407,\n", |
481 | 473 | " output_dir = \"outputs\",\n", |
482 | | - " report_to = \"none\", # For Weights and Biases\n", |
| 474 | + " report_to = \"none\", # For Weights and Biases or others\n", |
483 | 475 | "\n", |
484 | 476 | " # You MUST put the below items for vision finetuning:\n", |
485 | 477 | " remove_unused_columns = False,\n", |
|
563 | 555 | }, |
564 | 556 | "outputs": [], |
565 | 557 | "source": [ |
566 | | - "FastVisionModel.for_inference(model) # Enable for inference!\n", |
567 | | - "\n", |
568 | 558 | "image = dataset[10][\"image\"]\n", |
569 | 559 | "instruction = \"Write the LaTeX representation for this image.\"\n", |
570 | 560 | "\n", |
|
642 | 632 | " model_name = \"gemma_4_lora\", # YOUR MODEL YOU USED FOR TRAINING\n", |
643 | 633 | " load_in_4bit = True, # Set to False for 16bit LoRA\n", |
644 | 634 | " )\n", |
645 | | - " FastVisionModel.for_inference(model) # Enable for inference!\n", |
646 | | - "\n", |
647 | | - "FastVisionModel.for_inference(model) # Enable for inference!\n", |
648 | 635 | "\n", |
649 | 636 | "sample = dataset[1]\n", |
650 | 637 | "image = sample[\"image\"].convert(\"RGB\")\n", |
|
0 commit comments