MITDeepLearning
diff --git a/‎lab2/PT_Part1_MNIST.ipynb‎
Lines changed: 41 additions & 80 deletions b/‎lab2/PT_Part1_MNIST.ipynb‎
Lines changed: 41 additions & 80 deletions
@@ -10,9 +10,9 @@
         "  <td align=\"center\"><a target=\"_blank\" href=\"http://introtodeeplearning.com\">\n",
         "        <img src=\"https://i.ibb.co/Jr88sn2/mit.png\" style=\"padding-bottom:5px;\" />\n",
         "      Visit MIT Deep Learning</a></td>\n",
-        "  <td align=\"center\"><a target=\"_blank\" href=\"https://colab.research.google.com/github/aamini/introtodeeplearning/blob/master/lab2/solutions/PT_Part1_MNIST_Solution.ipynb\">\n",
+        "  <td align=\"center\"><a target=\"_blank\" href=\"https://colab.research.google.com/github/MITDeepLearning/introtodeeplearning/blob/master/lab2/PT_Part1_MNIST.ipynb\">\n",
         "        <img src=\"https://i.ibb.co/2P3SLwK/colab.png\"  style=\"padding-bottom:5px;\" />Run in Google Colab</a></td>\n",
-        "  <td align=\"center\"><a target=\"_blank\" href=\"https://github.com/aamini/introtodeeplearning/blob/master/lab2/solutions/PT_Part1_MNIST_Solution.ipynb\">\n",
+        "  <td align=\"center\"><a target=\"_blank\" href=\"https://github.com/MITDeepLearning/introtodeeplearning/blob/master/lab2/PT_Part1_MNIST.ipynb\">\n",
         "        <img src=\"https://i.ibb.co/xfJbPmL/github.png\"  height=\"70px\" style=\"padding-bottom:5px;\"  />View Source on GitHub</a></td>\n",
         "</table>\n",
         "\n",
@@ -252,13 +252,9 @@
         "\n",
         "        # '''TODO: Define the activation function for the first fully connected (Dense/Linear) layer.'''\n",
         "        nn.Linear(28 * 28, 128),\n",
-        "        nn.ReLU(),\n",
-        "        # activation function = '''TODO'''\n",
+        "        '''TODO'''\n",
         "\n",
-        "        # '''TODO: Define the second Linear layer to output the classification probabilities'''\n",
-        "        nn.Linear(128, 10),\n",
-        "        nn.Softmax(dim=1) # Softmax activation for probabilities\n",
-        "        # '''TODO: Linear layer and activation to output classification probabilities'''\n",
+        "        '''TODO: Define the second Linear layer to output the classification probabilities'''\n",
         "        )\n",
         "    return fc_model\n",
         "\n",
@@ -321,27 +317,17 @@
         "        self.fc1 = nn.Linear(28 * 28, 128)\n",
         "\n",
         "        # '''TODO: Define the activation function for the first fully connected layer'''\n",
-        "        self.relu = nn.ReLU()\n",
+        "        self.relu = # TODO\n",
         "\n",
         "        # '''TODO: Define the second Linear layer to output the classification probabilities'''\n",
-        "        self.fc2 = nn.Linear(128, 10)\n",
-        "        self.softmax = nn.Softmax(dim=1)\n",
-        "        # self.fc2 = # TODO\n",
-        "        # self.softmax = # TODO\n",
+        "        self.fc2 = # TODO\n",
         "\n",
         "    def forward(self, x):\n",
         "        x = self.flatten(x)\n",
         "        x = self.fc1(x)\n",
         "\n",
         "        # '''TODO: Implement the rest of forward pass of the model using the layers you have defined above'''\n",
-        "        x = self.relu(x)\n",
-        "        x = self.fc2(x)\n",
-        "        # '''TODO'''\n",
-        "\n",
-        "        '''NOTE: In Pytorch, softmax is omitted in training since CrossEntropyLoss includes\n",
-        "            LogSoftmax; using both would result in incorrect loss values.\n",
-        "            Since we will train with CrossEntropyLoss, we do not need something like:\n",
-        "              x = self.softmax(x) '''\n",
+        "        '''TODO'''\n",
         "\n",
         "        return x\n",
         "\n",
@@ -430,15 +416,18 @@
         "        for images, labels in trainset_loader:\n",
         "            # Move tensors to GPU so compatible with model\n",
         "            images, labels = images.to(device), labels.to(device)\n",
-        "            # Clear gradients before performing backward pass\n",
-        "            optimizer.zero_grad()\n",
+        "\n",
         "            # Forward pass\n",
         "            outputs = fc_model(images)\n",
+        "\n",
+        "            # Clear gradients before performing backward pass\n",
+        "            optimizer.zero_grad()\n",
         "            # Calculate loss based on model predictions\n",
         "            loss = loss_function(outputs, labels)\n",
         "            # Backpropagate and update model parameters\n",
         "            loss.backward()\n",
         "            optimizer.step()\n",
+        "\n",
         "            # multiply loss by total number of samples in batch\n",
         "            total_loss += loss.item()*images.size(0)\n",
         "\n",
@@ -463,8 +452,7 @@
       "source": [
         "# TODO: Train the model by calling the function appropriately\n",
         "EPOCHS = 5\n",
-        "train(fc_model, trainset_loader, loss_function, optimizer, EPOCHS)\n",
-        "# train('''TODO''') # TODO\n",
+        "train('''TODO''') # TODO\n",
         "\n",
         "comet_model_1.end()"
       ]
@@ -512,39 +500,33 @@
         "    with torch.no_grad():\n",
         "        for images, labels in testset_loader:\n",
         "            # TODO: ensure evaluation happens on the GPU\n",
-        "            images, labels = images.to(device), labels.to(device)\n",
-        "            # images, labels = # TODO\n",
+        "            images, labels = # TODO\n",
         "\n",
         "            # TODO: feed the images into the model and obtain the predictions (forward pass)\n",
-        "            outputs = model(images)\n",
-        "            # outputs = # TODO\n",
+        "            outputs = # TODO\n",
         "\n",
         "            loss = loss_function(outputs, labels)\n",
         "\n",
         "            # TODO: Calculate test loss\n",
-        "            test_loss += loss.item() * images.size(0)\n",
-        "            # test_loss += # TODO\n",
+        "            test_loss += # TODO\n",
         "\n",
         "            '''TODO: make a prediction and determine whether it is correct!'''\n",
         "            # TODO: identify the digit with the highest probability prediction for the images in the test dataset.\n",
-        "            predicted = torch.argmax(outputs, dim=1)\n",
-        "            # predicted = # TODO\n",
+        "            predicted = # torch.argmax('''TODO''')\n",
         "\n",
         "            # TODO: tally the number of correct predictions\n",
-        "            correct_pred += (predicted == labels).sum().item()\n",
-        "            # correct_pred += TODO\n",
+        "            correct_pred += TODO\n",
+        "\n",
         "            # TODO: tally the total number of predictions\n",
-        "            total_pred += labels.size(0)\n",
-        "            # total_pred += TODO\n",
+        "            total_pred += TODO\n",
         "\n",
         "    # Compute average loss and accuracy\n",
         "    test_loss /= total_pred\n",
         "    test_acc = correct_pred / total_pred\n",
         "    return test_loss, test_acc\n",
         "\n",
         "# TODO: call the evaluate function to evaluate the trained model!!\n",
-        "test_loss, test_acc = evaluate(fc_model, trainset_loader, loss_function)\n",
-        "# test_loss, test_acc = # TODO\n",
+        "test_loss, test_acc = # TODO\n",
         "\n",
         "print('Test accuracy:', test_acc)"
       ]
@@ -607,29 +589,24 @@
         "    def __init__(self):\n",
         "        super(CNN, self).__init__()\n",
         "        # TODO: Define the first convolutional layer\n",
-        "        self.conv1 = nn.Conv2d(1, 24, kernel_size=3)\n",
-        "        # self.conv1 = # TODO\n",
+        "        self.conv1 = # TODO\n",
         "\n",
         "        # TODO: Define the first max pooling layer\n",
-        "        self.pool1 = nn.MaxPool2d(kernel_size=2)\n",
-        "        # self.pool1 = # TODO\n",
+        "        self.pool1 = # TODO\n",
         "\n",
         "        # TODO: Define the second convolutional layer\n",
-        "        self.conv2 = nn.Conv2d(24, 36, kernel_size=3)\n",
-        "        # self.conv2 = # TODO\n",
+        "        self.conv2 = # TODO\n",
         "\n",
         "        # TODO: Define the second max pooling layer\n",
-        "        self.pool2 = nn.MaxPool2d(kernel_size=2)\n",
-        "        # self.pool2 = # TODO\n",
+        "        self.pool2 = # TODO\n",
         "\n",
         "        self.flatten = nn.Flatten()\n",
         "        self.fc1 = nn.Linear(36 * 5 * 5, 128)\n",
         "        self.relu = nn.ReLU()\n",
         "\n",
         "        # TODO: Define the Linear layer that outputs the classification\n",
         "        # logits over class labels. Remember that CrossEntropyLoss operates over logits.\n",
-        "        self.fc2 = nn.Linear(128, 10)\n",
-        "        # self.fc2 = # TODO\n",
+        "        self.fc2 = # TODO\n",
         "\n",
         "\n",
         "    def forward(self, x):\n",
@@ -640,18 +617,7 @@
         "\n",
         "        # '''TODO: Implement the rest of forward pass of the model using the layers you have defined above'''\n",
         "        #     '''hint: this will involve another set of convolutional/pooling layers and then the linear layers'''\n",
-        "        x = self.conv2(x)\n",
-        "        x = self.relu(x)\n",
-        "        x = self.pool2(x)\n",
-        "\n",
-        "        x = self.flatten(x)\n",
-        "        x = self.fc1(x)\n",
-        "        x = self.relu(x)\n",
-        "        x = self.fc2(x)\n",
-        "\n",
-        "        '''NOTE: Remember that we do not need to define/execute softmax (self.softmax(x))\n",
-        "              in the forward pass since we will use CrossEntropyLoss for training,\n",
-        "              which operates directly on logits'''\n",
+        "        '''TODO'''\n",
         "\n",
         "        return x\n",
         "\n",
@@ -697,8 +663,7 @@
         "optimizer = optim.SGD(cnn_model.parameters(), lr=1e-2)\n",
         "\n",
         "# TODO: instantiate the cross entropy loss function\n",
-        "loss_function = nn.CrossEntropyLoss()\n",
-        "# loss_function = # TODO\n",
+        "loss_function = # TODO\n",
         "\n",
         "# Redefine trainloader with new batch size parameter (tweak as you see fit when optimizing)\n",
         "trainset_loader = DataLoader(train_dataset, batch_size=batch_size, shuffle=True)\n",
@@ -735,13 +700,12 @@
         "        images, labels = images.to(device), labels.to(device)\n",
         "\n",
         "        # Forward pass\n",
-        "        #'''TODO: feed the images into the model and obtain the predictions'''\n",
-        "        logits = cnn_model(images)\n",
-        "        # logits = # TODO\n",
+        "        # TODO: feed the images into the model and obtain the predictions\n",
+        "        logits = # TODO\n",
+        "\n",
+        "        # TODO: compute the categorical cross entropy loss using the predicted logits\n",
+        "        loss = # TODO\n",
         "\n",
-        "        #'''TODO: compute the categorical cross entropy loss\n",
-        "        loss = loss_function(logits, labels)\n",
-        "        # loss = # TODO\n",
         "        # Get the loss and log it to comet and the loss_history record\n",
         "        loss_value = loss.item()\n",
         "        comet_model_2.log_metric(\"loss\", loss_value, step=idx)\n",
@@ -751,9 +715,9 @@
         "        # Backpropagation/backward pass\n",
         "        '''TODO: Compute gradients for all model parameters and propagate backwads\n",
         "            to update model parameters. Remember to reset your optimizer!'''\n",
-        "        optimizer.zero_grad()\n",
-        "        loss.backward()\n",
-        "        optimizer.step()\n",
+        "        # TODO: reset optimizer\n",
+        "        # TODO: compute gradients\n",
+        "        # TODO: update model parameters\n",
         "\n",
         "        # Get the prediction and tally metrics\n",
         "        predicted = torch.argmax(logits, dim=1)\n",
@@ -788,9 +752,7 @@
       "outputs": [],
       "source": [
         "'''TODO: Evaluate the CNN model!'''\n",
-        "\n",
-        "test_loss, test_acc = evaluate(cnn_model, trainset_loader, loss_function)\n",
-        "# test_loss, test_acc = # TODO\n",
+        "test_loss, test_acc = evaluate('''TODO''')\n",
         "\n",
         "print('Test accuracy:', test_acc)"
       ]
@@ -850,7 +812,7 @@
       },
       "outputs": [],
       "source": [
-        "predictions_test_image"
+        "print(predictions_test_image)"
       ]
     },
     {
@@ -875,8 +837,7 @@
         "'''TODO: identify the digit with the highest likelihood prediction for the first\n",
         "    image in the test dataset. '''\n",
         "predictions_value = predictions_test_image.cpu().detach().numpy() #.cpu() to copy tensor to memory first\n",
-        "prediction = np.argmax(predictions_value)\n",
-        "# prediction = # TODO\n",
+        "prediction = # TODO\n",
         "print(prediction)"
       ]
     },
@@ -935,7 +896,7 @@
         "        probabilities = torch.nn.functional.softmax(outputs, dim=1)\n",
         "\n",
         "        # Get predicted classes\n",
-        "        predicted = torch.argmax(outputs, dim=1)\n",
+        "        predicted = torch.argmax(probabilities, dim=1)\n",
         "\n",
         "        all_predictions.append(probabilities)\n",
         "        all_labels.append(labels)\n",
@@ -1018,7 +979,7 @@
       "collapsed_sections": [
         "Xmf_JRJa_N8C"
       ],
-      "name": "PT_Part1_MNIST_Solution.ipynb",
+      "name": "PT_Part1_MNIST.ipynb",
       "provenance": []
     },
     "kernelspec": {