fixing todos

aamini · aamini · commit a7a96c22613b · 2022-01-26T04:13:54.000-05:00
diff --git a/lab3/solutions/RL_Solution.ipynb b/lab3/solutions/RL_Solution.ipynb
@@ -249,10 +249,10 @@
         "        # First Dense layer\n",
         "        tf.keras.layers.Dense(units=32, activation='relu'),\n",
         "\n",
-        "        # TODO: Define the last Dense layer, which will provide the network's output.\n",
-        "        # Think about the space the agent needs to act in!\n",
+        "        ''' TODO: Define the last Dense layer, which will provide the network's output.\n",
+        "            Think about the space the agent needs to act in! '''\n",
         "        tf.keras.layers.Dense(units=n_actions, activation=None) # TODO\n",
-        "        # [TODO Dense layer to output action probabilities]\n",
+        "        # ['''TODO''' Dense layer to output action probabilities]\n",
         "    ])\n",
         "    return model\n",
         "\n",
@@ -720,12 +720,46 @@
     },
     {
       "cell_type": "code",
-      "execution_count": null,
+      "execution_count": 3,
       "metadata": {
         "scrolled": true,
-        "id": "JrTpTBJsJ9Bp"
+        "colab": {
+          "base_uri": "https://localhost:8080/",
+          "height": 530
+        },
+        "id": "JrTpTBJsJ9Bp",
+        "outputId": "c6a7e93c-a9c1-4a15-b550-0dd4db94d05c"
       },
-      "outputs": [],
+      "outputs": [
+        {
+          "output_type": "stream",
+          "name": "stdout",
+          "text": [
+            "vista_traces.zip     29%[====>               ] 180.35M  68.8MB/s               ^C\n",
+            "Unzipping data...\n",
+            "[vista_traces.zip]\n",
+            "  End-of-central-directory signature not found.  Either this file is not\n",
+            "  a zipfile, or it constitutes one disk of a multi-part archive.  In the\n",
+            "  latter case the central directory and zipfile comment will be found on\n",
+            "  the last disk(s) of this archive.\n",
+            "unzip:  cannot find zipfile directory in one of vista_traces.zip or\n",
+            "        vista_traces.zip.zip, and cannot find vista_traces.zip.ZIP, period.\n",
+            "Done downloading and unzipping data!\n"
+          ]
+        },
+        {
+          "output_type": "error",
+          "ename": "NameError",
+          "evalue": "ignored",
+          "traceback": [
+            "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
+            "\u001b[0;31mNameError\u001b[0m                                 Traceback (most recent call last)",
+            "\u001b[0;32m<ipython-input-3-06a67e1ffe73>\u001b[0m in \u001b[0;36m<module>\u001b[0;34m()\u001b[0m\n\u001b[1;32m     12\u001b[0m     \u001b[0;34m\"20210726-184956_lexus_devens_center_reverse\"\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m     13\u001b[0m ]\n\u001b[0;32m---> 14\u001b[0;31m \u001b[0mtrace_path\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;34m[\u001b[0m\u001b[0mos\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mpath\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mjoin\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mtrace_root\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mp\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;32mfor\u001b[0m \u001b[0mp\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mtrace_path\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m     15\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m     16\u001b[0m \u001b[0;31m# Create a virtual world with VISTA, the world is defined by a series of data traces\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
+            "\u001b[0;32m<ipython-input-3-06a67e1ffe73>\u001b[0m in \u001b[0;36m<listcomp>\u001b[0;34m(.0)\u001b[0m\n\u001b[1;32m     12\u001b[0m     \u001b[0;34m\"20210726-184956_lexus_devens_center_reverse\"\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m     13\u001b[0m ]\n\u001b[0;32m---> 14\u001b[0;31m \u001b[0mtrace_path\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;34m[\u001b[0m\u001b[0mos\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mpath\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mjoin\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mtrace_root\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mp\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;32mfor\u001b[0m \u001b[0mp\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mtrace_path\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m     15\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m     16\u001b[0m \u001b[0;31m# Create a virtual world with VISTA, the world is defined by a series of data traces\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
+            "\u001b[0;31mNameError\u001b[0m: name 'os' is not defined"
+          ]
+        }
+      ],
       "source": [
         "# Download and extract the data for vista (auto-skip if already downloaded)\n",
         "!wget -nc -q --show-progress https://www.dropbox.com/s/3qogfzuugi852du/vista_traces.zip\n",
@@ -735,8 +769,6 @@
         "\n",
         "trace_root = \"./vista_traces\"\n",
         "trace_path = [\n",
-        "#     \"20210726-131322_lexus_devens_center\", \n",
-        "#     \"20210726-131912_lexus_devens_center_reverse\", \n",
         "    \"20210726-154641_lexus_devens_center\", \n",
         "    \"20210726-155941_lexus_devens_center_reverse\", \n",
         "    \"20210726-184624_lexus_devens_center\", \n",
@@ -1093,11 +1125,11 @@
         "        # First, 32 5x5 filters and 2x2 stride\n",
         "        Conv2D(filters=32, kernel_size=5, strides=2),\n",
         "\n",
-        "        # TODO: define convolutional layers with 48 5x5 filters and 2x2 stride\n",
+        "        ''' TODO: define convolutional layers with 48 5x5 filters and 2x2 stride '''\n",
         "        Conv2D(filters=48, kernel_size=5, strides=2), # TODO\n",
         "        # Conv2D('''TODO'''),\n",
         "\n",
-        "        # TODO: define two convolutional layers with 64 3x3 filters and 2x2 stride\n",
+        "        ''' TODO: define two convolutional layers with 64 3x3 filters and 2x2 stride '''\n",
         "        Conv2D(filters=64, kernel_size=3, strides=2), # TODO\n",
         "        Conv2D(filters=64, kernel_size=3, strides=2), # TODO\n",
         "        # Conv2D('''TODO'''),\n",
@@ -1106,10 +1138,10 @@
         "\n",
         "        # Fully connected layer and output\n",
         "        Dense(units=128, activation=act),\n",
-        "        # TODO: define the output dimension of the last Dense layer. \n",
-        "        # Pay attention to the space the agent needs to act in.\n",
-        "        # Remember that this model is outputing *continuous* actions, \n",
-        "        # which take a different shape than discrete actions (like in Cartpole).\n",
+        "        ''' TODO: define the output dimension of the last Dense layer. \n",
+        "            Pay attention to the space the agent needs to act in.\n",
+        "            Remember that this model is outputting *continuous* actions, \n",
+        "            which take a different shape than discrete actions (like in Cartpole). '''\n",
         "        Dense(units=2, activation=None) # TODO\n",
         "        # Dense('''TODO''')\n",
         "\n",
@@ -1200,7 +1232,7 @@
         "## Training parameters ##\n",
         "## Re-run this cell to restart training from scratch ##\n",
         "\n",
-        "# TODO: Learning rate and optimizer\n",
+        "''' TODO: Learning rate and optimizer '''\n",
         "learning_rate = 5e-4\n",
         "# learning_rate = '''TODO'''\n",
         "optimizer = tf.keras.optimizers.Adam(learning_rate)\n",
@@ -1256,27 +1288,27 @@
         "    observation = grab_and_preprocess_obs(car)\n",
         "\n",
         "    while True:\n",
-        "        # TODO: using the car's current observation compute the desired \n",
-        "        # action (curvature) distribution by feeding it into our \n",
-        "        # driving model (use the function you already built to do this!)\n",
+        "        '''TODO: using the car's current observation compute the desired \n",
+        "           action (curvature) distribution by feeding it into our \n",
+        "           driving model (use the function you already built to do this!) '''\n",
         "        curvature_dist = run_driving_model(observation)\n",
         "        # curvature_dist = '''TODO'''\n",
         "        \n",
-        "        # TODO: sample from the action distribution to decide how to step\n",
-        "        # the car in the environment. You may want to check the documentation\n",
-        "        # for tfp.distributions.Normal online. Remember that the sampled action\n",
-        "        # should be a single scalar value after this step.\n",
+        "        ''' TODO: sample from the action distribution to decide how to step\n",
+        "            the car in the environment. You may want to check the documentation\n",
+        "            for tfp.distributions.Normal online. Remember that the sampled action\n",
+        "            should be a single scalar value after this step.'''\n",
         "        curvature_action = curvature_dist.sample()[0,0]\n",
         "        # curvature_action = '''TODO'''\n",
         "        \n",
         "        # Step the simulated car with the same action\n",
         "        vista_step(curvature_action)\n",
         "        observation = grab_and_preprocess_obs(car)\n",
         "               \n",
-        "        # TODO: Compute the reward for this iteration. You define \n",
-        "        # the reward function for this policy, start with something \n",
-        "        # simple - for example, give a reward of 1 if the car did not \n",
-        "        # crash and a reward of 0 if it did crash.\n",
+        "        '''TODO: Compute the reward for this iteration. You define \n",
+        "           the reward function for this policy, start with something \n",
+        "           simple - for example, give a reward of 1 if the car did not \n",
+        "           crash and a reward of 0 if it did crash.'''\n",
         "        reward = 1.0 if not check_crash(car) else 0.0\n",
         "        #  reward = '''TODO'''\n",
         "        \n",