1+ {
2+ "nbformat" : 4 ,
3+ "nbformat_minor" : 0 ,
4+ "metadata" : {
5+ "colab" : {
6+ "provenance" : [],
7+ "authorship_tag" : " ABX9TyNTUIlwVwyn/MGWQv2x/gQg" ,
8+ "include_colab_link" : true
9+ },
10+ "kernelspec" : {
11+ "name" : " python3" ,
12+ "display_name" : " Python 3"
13+ },
14+ "language_info" : {
15+ "name" : " python"
16+ }
17+ },
18+ "cells" : [
19+ {
20+ "cell_type" : " markdown" ,
21+ "metadata" : {
22+ "id" : " view-in-github" ,
23+ "colab_type" : " text"
24+ },
25+ "source" : [
26+ " <a href=\" https://colab.research.google.com/github/rawanaldaneen/pytorch_row/blob/main/letter_recognition_using_LoRA.ipynb\" target=\" _parent\" ><img src=\" https://colab.research.google.com/assets/colab-badge.svg\" alt=\" Open In Colab\" /></a>"
27+ ]
28+ },
29+ {
30+ "cell_type" : " markdown" ,
31+ "source" : [
32+ " The following code defines a neural network called NNet.\n " ,
33+ " \n " ,
" NNet is a neural network that was originally written to identify hand-written digits from 32x32 images. Your task is to fine-tune this network to perform letter recognition using LoRA.\n " ,
" To enhance your understanding, apply LoRA to just the second linear layer, and replace the last layer with a layer that has 26 outputs, one for each letter in the English alphabet."
36+ ],
37+ "metadata" : {
38+ "id" : " OFqk8sQxtT1d"
39+ }
40+ },
41+ {
42+ "cell_type" : " code" ,
43+ "execution_count" : null ,
44+ "metadata" : {
45+ "id" : " K9R2t_e0sWku"
46+ },
47+ "outputs" : [],
48+ "source" : []
49+ },
50+ {
51+ "cell_type" : " code" ,
52+ "metadata" : {
53+ "colab" : {
54+ "base_uri" : " https://localhost:8080/"
55+ },
56+ "id" : " 5dc070f1" ,
57+ "outputId" : " c1119959-0f30-4fb2-b4af-9d7dd8454769"
58+ },
59+ "source" : [
60+ " !pip install torch torchvision torchaudio"
61+ ],
62+ "execution_count" : 1 ,
63+ "outputs" : [
64+ {
65+ "output_type" : " stream" ,
66+ "name" : " stdout" ,
67+ "text" : [
68+ " Requirement already satisfied: torch in /usr/local/lib/python3.12/dist-packages (2.8.0+cu126)\n " ,
69+ " Requirement already satisfied: torchvision in /usr/local/lib/python3.12/dist-packages (0.23.0+cu126)\n " ,
70+ " Requirement already satisfied: torchaudio in /usr/local/lib/python3.12/dist-packages (2.8.0+cu126)\n " ,
71+ " Requirement already satisfied: filelock in /usr/local/lib/python3.12/dist-packages (from torch) (3.19.1)\n " ,
72+ " Requirement already satisfied: typing-extensions>=4.10.0 in /usr/local/lib/python3.12/dist-packages (from torch) (4.15.0)\n " ,
73+ " Requirement already satisfied: setuptools in /usr/local/lib/python3.12/dist-packages (from torch) (75.2.0)\n " ,
74+ " Requirement already satisfied: sympy>=1.13.3 in /usr/local/lib/python3.12/dist-packages (from torch) (1.13.3)\n " ,
75+ " Requirement already satisfied: networkx in /usr/local/lib/python3.12/dist-packages (from torch) (3.5)\n " ,
76+ " Requirement already satisfied: jinja2 in /usr/local/lib/python3.12/dist-packages (from torch) (3.1.6)\n " ,
77+ " Requirement already satisfied: fsspec in /usr/local/lib/python3.12/dist-packages (from torch) (2025.3.0)\n " ,
78+ " Requirement already satisfied: nvidia-cuda-nvrtc-cu12==12.6.77 in /usr/local/lib/python3.12/dist-packages (from torch) (12.6.77)\n " ,
79+ " Requirement already satisfied: nvidia-cuda-runtime-cu12==12.6.77 in /usr/local/lib/python3.12/dist-packages (from torch) (12.6.77)\n " ,
80+ " Requirement already satisfied: nvidia-cuda-cupti-cu12==12.6.80 in /usr/local/lib/python3.12/dist-packages (from torch) (12.6.80)\n " ,
81+ " Requirement already satisfied: nvidia-cudnn-cu12==9.10.2.21 in /usr/local/lib/python3.12/dist-packages (from torch) (9.10.2.21)\n " ,
82+ " Requirement already satisfied: nvidia-cublas-cu12==12.6.4.1 in /usr/local/lib/python3.12/dist-packages (from torch) (12.6.4.1)\n " ,
83+ " Requirement already satisfied: nvidia-cufft-cu12==11.3.0.4 in /usr/local/lib/python3.12/dist-packages (from torch) (11.3.0.4)\n " ,
84+ " Requirement already satisfied: nvidia-curand-cu12==10.3.7.77 in /usr/local/lib/python3.12/dist-packages (from torch) (10.3.7.77)\n " ,
85+ " Requirement already satisfied: nvidia-cusolver-cu12==11.7.1.2 in /usr/local/lib/python3.12/dist-packages (from torch) (11.7.1.2)\n " ,
86+ " Requirement already satisfied: nvidia-cusparse-cu12==12.5.4.2 in /usr/local/lib/python3.12/dist-packages (from torch) (12.5.4.2)\n " ,
87+ " Requirement already satisfied: nvidia-cusparselt-cu12==0.7.1 in /usr/local/lib/python3.12/dist-packages (from torch) (0.7.1)\n " ,
88+ " Requirement already satisfied: nvidia-nccl-cu12==2.27.3 in /usr/local/lib/python3.12/dist-packages (from torch) (2.27.3)\n " ,
89+ " Requirement already satisfied: nvidia-nvtx-cu12==12.6.77 in /usr/local/lib/python3.12/dist-packages (from torch) (12.6.77)\n " ,
90+ " Requirement already satisfied: nvidia-nvjitlink-cu12==12.6.85 in /usr/local/lib/python3.12/dist-packages (from torch) (12.6.85)\n " ,
91+ " Requirement already satisfied: nvidia-cufile-cu12==1.11.1.6 in /usr/local/lib/python3.12/dist-packages (from torch) (1.11.1.6)\n " ,
92+ " Requirement already satisfied: triton==3.4.0 in /usr/local/lib/python3.12/dist-packages (from torch) (3.4.0)\n " ,
93+ " Requirement already satisfied: numpy in /usr/local/lib/python3.12/dist-packages (from torchvision) (2.0.2)\n " ,
94+ " Requirement already satisfied: pillow!=8.3.*,>=5.3.0 in /usr/local/lib/python3.12/dist-packages (from torchvision) (11.3.0)\n " ,
95+ " Requirement already satisfied: mpmath<1.4,>=1.1.0 in /usr/local/lib/python3.12/dist-packages (from sympy>=1.13.3->torch) (1.3.0)\n " ,
96+ " Requirement already satisfied: MarkupSafe>=2.0 in /usr/local/lib/python3.12/dist-packages (from jinja2->torch) (3.0.2)\n "
97+ ]
98+ }
99+ ]
100+ },
101+ {
102+ "cell_type" : " code" ,
103+ "metadata" : {
104+ "id" : " fd55627b"
105+ },
106+ "source" : [
107+ " import torch\n " ,
108+ " import torch.nn as nn\n " ,
109+ " import torch.nn.functional as F\n " ,
110+ " import torch.optim as optim"
111+ ],
112+ "execution_count" : 2 ,
113+ "outputs" : []
114+ },
115+ {
116+ "cell_type" : " code" ,
117+ "source" : [
118+ " class NNet(nn.Module):\n " ,
119+ " \n " ,
120+ " def __init__(self):\n " ,
121+ " super(NNet, self).__init__()\n " ,
122+ " # 1 input image channel, 6 output channels, 5x5 square convolution\n " ,
123+ " # kernel\n " ,
124+ " self.conv1 = nn.Conv2d(1, 6, 5)\n " ,
125+ " self.conv2 = nn.Conv2d(6, 16, 5)\n " ,
126+ " # an affine operation: y = Wx + b\n " ,
127+ " self.fc1 = nn.Linear(16 * 5 * 5, 120) # 5*5 from image dimension\n " ,
128+ " self.fc2 = nn.Linear(120, 84)\n " ,
129+ " self.fc3 = nn.Linear(84, 10)\n " ,
130+ " \n " ,
131+ " def forward(self, input):\n " ,
132+ " # Convolution layer C1: 1 input image channel, 6 output channels,\n " ,
133+ " # 5x5 square convolution, it uses RELU activation function, and\n " ,
134+ " # outputs a Tensor with size (N, 6, 28, 28), where N is the size of the batch\n " ,
135+ " c1 = F.relu(self.conv1(input))\n " ,
136+ " # Subsampling layer S2: 2x2 grid, purely functional,\n " ,
137+ " # this layer does not have any parameter, and outputs a (N, 6, 14, 14) Tensor\n " ,
138+ " s2 = F.max_pool2d(c1, (2, 2))\n " ,
139+ " # Convolution layer C3: 6 input channels, 16 output channels,\n " ,
140+ " # 5x5 square convolution, it uses RELU activation function, and\n " ,
141+ " # outputs a (N, 16, 10, 10) Tensor\n " ,
142+ " c3 = F.relu(self.conv2(s2))\n " ,
143+ " # Subsampling layer S4: 2x2 grid, purely functional,\n " ,
144+ " # this layer does not have any parameter, and outputs a (N, 16, 5, 5) Tensor\n " ,
145+ " s4 = F.max_pool2d(c3, 2)\n " ,
146+ " # Flatten operation: purely functional, outputs a (N, 400) Tensor\n " ,
147+ " s4 = torch.flatten(s4, 1)\n " ,
148+ " # Fully connected layer F5: (N, 400) Tensor input,\n " ,
149+ " # and outputs a (N, 120) Tensor, it uses RELU activation function\n " ,
150+ " f5 = F.relu(self.fc1(s4))\n " ,
151+ " # Fully connected layer F6: (N, 120) Tensor input,\n " ,
152+ " # and outputs a (N, 84) Tensor, it uses RELU activation function\n " ,
153+ " f6 = F.relu(self.fc2(f5))\n " ,
154+ " # Gaussian layer OUTPUT: (N, 84) Tensor input, and\n " ,
155+ " # outputs a (N, 10) Tensor\n " ,
156+ " output = self.fc3(f6)\n " ,
157+ " return output\n " ,
158+ " \n " ,
159+ " # Define device\n " ,
160+ " device = torch.device(\" cuda\" if torch.cuda.is_available() else \" cpu\" )\n " ,
161+ " \n " ,
162+ " model_exercise = NNet()\n " ,
163+ " model_exercise.to(device)\n " ,
164+ " \n " ,
165+ " print('This is what the model looked like before applying LoRA:')\n " ,
166+ " print(model_exercise)\n " ,
167+ " print(\"\\ n###############\\ n\" )\n " ,
168+ " \n " ,
169+ " # Freeze all parameters:\n " ,
170+ " for parm in model_exercise.parameters():\n " ,
171+ " parm.requires_grad=False\n " ,
172+ " \n " ,
173+ " # Change final layer for one with 26 outputs:\n " ,
174+ " model_exercise.fc3=nn.Linear(in_features=84, out_features=26, bias=True).to(device)\n " ,
175+ " \n " ,
176+ " # Apply LoRA to the second linear layer\n " ,
177+ " model_exercise.fc2=LinearWithLoRA(model_exercise.fc2,rank=2, alpha=0.1).to(device)\n " ,
178+ " \n " ,
179+ " print('This is what the model looked like after applying LoRA:')\n " ,
180+ " print(model_exercise)"
181+ ],
182+ "metadata" : {
183+ "colab" : {
184+ "base_uri" : " https://localhost:8080/"
185+ },
186+ "id" : " lmZOWpy5sXR0" ,
187+ "outputId" : " e8a453cf-db32-4fde-c59a-d5ce83695750"
188+ },
189+ "execution_count" : 6 ,
190+ "outputs" : [
191+ {
192+ "output_type" : " stream" ,
193+ "name" : " stdout" ,
194+ "text" : [
195+ " This is what the model looked like before applying LoRA:\n " ,
196+ " NNet(\n " ,
197+ " (conv1): Conv2d(1, 6, kernel_size=(5, 5), stride=(1, 1))\n " ,
198+ " (conv2): Conv2d(6, 16, kernel_size=(5, 5), stride=(1, 1))\n " ,
199+ " (fc1): Linear(in_features=400, out_features=120, bias=True)\n " ,
200+ " (fc2): Linear(in_features=120, out_features=84, bias=True)\n " ,
201+ " (fc3): Linear(in_features=84, out_features=10, bias=True)\n " ,
202+ " )\n " ,
203+ " \n " ,
204+ " ###############\n " ,
205+ " \n " ,
206+ " This is what the model looked like after applying LoRA:\n " ,
207+ " NNet(\n " ,
208+ " (conv1): Conv2d(1, 6, kernel_size=(5, 5), stride=(1, 1))\n " ,
209+ " (conv2): Conv2d(6, 16, kernel_size=(5, 5), stride=(1, 1))\n " ,
210+ " (fc1): Linear(in_features=400, out_features=120, bias=True)\n " ,
211+ " (fc2): LinearWithLoRA(\n " ,
212+ " (linear): Linear(in_features=120, out_features=84, bias=True)\n " ,
213+ " )\n " ,
214+ " (fc3): Linear(in_features=84, out_features=26, bias=True)\n " ,
215+ " )\n "
216+ ]
217+ }
218+ ]
219+ }
220+ ]
221+ }
0 commit comments