|
89 | 89 | "id": "EvdePP-VyVWp"
|
90 | 90 | },
|
91 | 91 | "source": [
|
| 92 | + "#Install some dependencies for visualizing the agents\n", |
| 93 | + "!apt-get install -y xvfb python-opengl x11-utils > /dev/null 2>&1\n", |
| 94 | + "!pip install gym pyvirtualdisplay scikit-video > /dev/null 2>&1\n", |
| 95 | + "\n", |
92 | 96 | "# Import Tensorflow 2.0\n",
|
93 | 97 | "%tensorflow_version 2.x\n",
|
94 | 98 | "import tensorflow as tf\n",
|
|
241 | 245 | "\n",
|
242 | 246 | "cartpole_model = create_cartpole_model()"
|
243 | 247 | ],
|
244 |
| - "execution_count": null, |
| 248 | + "execution_count": 6, |
245 | 249 | "outputs": []
|
246 | 250 | },
|
247 | 251 | {
|
|
289 | 293 | "\n",
|
290 | 294 | " return action[0] if single else action"
|
291 | 295 | ],
|
292 |
| - "execution_count": null, |
| 296 | + "execution_count": 7, |
293 | 297 | "outputs": []
|
294 | 298 | },
|
295 | 299 | {
|
|
352 | 356 | "# Instantiate a single Memory buffer\n",
|
353 | 357 | "memory = Memory()"
|
354 | 358 | ],
|
355 |
| - "execution_count": null, |
| 359 | + "execution_count": 8, |
356 | 360 | "outputs": []
|
357 | 361 | },
|
358 | 362 | {
|
|
404 | 408 | " \n",
|
405 | 409 | " return normalize(discounted_rewards)"
|
406 | 410 | ],
|
407 |
| - "execution_count": null, |
| 411 | + "execution_count": 9, |
408 | 412 | "outputs": []
|
409 | 413 | },
|
410 | 414 | {
|
|
448 | 452 | " # loss = tf.reduce_mean('''TODO''')\n",
|
449 | 453 | " return loss"
|
450 | 454 | ],
|
451 |
| - "execution_count": null, |
| 455 | + "execution_count": 10, |
452 | 456 | "outputs": []
|
453 | 457 | },
|
454 | 458 | {
|
|
482 | 486 | " # grads = tape.gradient('''TODO''', model.trainable_variables)\n",
|
483 | 487 | " optimizer.apply_gradients(zip(grads, model.trainable_variables))\n"
|
484 | 488 | ],
|
485 |
| - "execution_count": null, |
| 489 | + "execution_count": 11, |
486 | 490 | "outputs": []
|
487 | 491 | },
|
488 | 492 | {
|
|
0 commit comments