kangwonlee
diff --git a/‎15_optimization/035_colab_mnist_keras_example.ipynb‎
Lines changed: 316 additions & 0 deletions b/‎15_optimization/035_colab_mnist_keras_example.ipynb‎
Lines changed: 316 additions & 0 deletions
@@ -0,0 +1,316 @@
+{
+ "cells": [
+  {
+   "cell_type": "markdown",
+   "metadata": {
+    "id": "view-in-github",
+    "colab_type": "text"
+   },
+   "source": [
+    "<a href=\"https://colab.research.google.com/github/kangwonlee/nmisp/blob/main/15_optimization/035_colab_mnist_keras_example.ipynb\" target=\"_parent\"><img src=\"https://colab.research.google.com/assets/colab-badge.svg\" alt=\"Open In Colab\"/></a>\n"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## 2.1 A first look at a neural network\n",
+    "\n",
+    "* from : F. Chollet, Deep Learning with Python, ISBN 9781617294433, 2017\n",
+    "* https://github.com/fchollet/deep-learning-with-python-notebooks\n",
+    "* https://www.manning.com/books/deep-learning-with-python\n",
+    "\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import os\n",
+    "import pathlib\n",
+    "\n",
+    "import keras\n",
+    "import numpy as np\n",
+    "import pandas as pd\n",
+    "import tensorflow as tf\n",
+    "\n"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### Listing 2.1 Loading the MNIST dataset in Keras\n",
+    "\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "def read_data(data_path):\n",
+    "  \"\"\"Read a header-less CSV and split it into (images, labels).\n",
+    "\n",
+    "  Column 0 is returned as the label array; all remaining columns are\n",
+    "  returned as the image array, one row per sample.\n",
+    "  \"\"\"\n",
+    "  df = pd.read_csv(data_path, header=None)\n",
+    "  labels = np.array(df.iloc[:, 0])\n",
+    "  images = np.array(df.iloc[:, 1:])\n",
+    "  return images, labels\n",
+    "\n",
+    "\n",
+    "data_folder = pathlib.Path('sample_data')\n",
+    "train_csv = data_folder / 'mnist_train_small.csv'\n",
+    "test_csv = data_folder / 'mnist_test.csv'\n",
+    "\n",
+    "# Explicit file checks instead of `assert`: assertions are stripped under `python -O`,\n",
+    "# and a CSV missing from an existing folder should also trigger the fallback.\n",
+    "if train_csv.is_file() and test_csv.is_file():\n",
+    "  train_images, train_labels = read_data(train_csv)\n",
+    "  test_images, test_labels = read_data(test_csv)\n",
+    "else:\n",
+    "  # No local CSV copies: load the dataset through Keras instead.\n",
+    "  (train_images, train_labels), (test_images, test_labels) = tf.keras.datasets.mnist.load_data()\n",
+    "\n"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### Listing 2.2 The training data\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "train_images.shape\n",
+    "\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "n_train = len(train_labels)\n",
+    "\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "train_labels\n",
+    "\n"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### Listing 2.3 The test data\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "test_images.shape\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "n_test = len(test_labels)\n",
+    "\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "test_labels\n"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### Listing 2.4 The network architecture\n",
+    "\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Fully connected classifier: flattened 28 * 28 input -> 512 ReLU units -> 10-way softmax.\n",
+    "network = keras.models.Sequential([\n",
+    "    keras.layers.Input(shape=(28 * 28,)),\n",
+    "    keras.layers.Dense(512, activation='relu'),\n",
+    "    keras.layers.Dense(10, activation='softmax'),\n",
+    "])\n",
+    "\n"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### Listing 2.5 The compilation step\n",
+    "\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Training configuration: 'rmsprop' optimizer, categorical cross-entropy loss\n",
+    "# (the labels are one-hot encoded before fitting), and accuracy as the reported metric.\n",
+    "network.compile(loss='categorical_crossentropy', optimizer='rmsprop', metrics=['accuracy'])\n",
+    "\n"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### Listing 2.6 Preparing the image data\n",
+    "\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Flatten each sample to a 28 * 28 vector and convert to float32 divided by 255.\n",
+    "# NOTE: both names are reassigned here, so re-running only this cell divides by 255 again;\n",
+    "# re-run from the data-loading cell to start over.\n",
+    "train_images = np.asarray(train_images, dtype='float32').reshape((n_train, 28 * 28)) / 255\n",
+    "test_images = np.asarray(test_images, dtype='float32').reshape((n_test, 28 * 28)) / 255\n",
+    "\n"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### Listing 2.7 Preparing the labels\n",
+    "\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# One-hot encode the labels. `num_classes=10` pins the encoded width to the 10 softmax\n",
+    "# outputs instead of inferring it from the largest label that happens to be present.\n",
+    "train_labels = keras.utils.to_categorical(train_labels, num_classes=10)\n",
+    "test_labels = keras.utils.to_categorical(test_labels, num_classes=10)\n",
+    "\n"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### Listing 2.8 Training the network\n",
+    "\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Train for a single epoch when the GITHUB_ACTIONS environment variable holds a\n",
+    "# non-empty value; otherwise train for five epochs.\n",
+    "n_epoch = 1 if os.environ.get('GITHUB_ACTIONS') else 5\n",
+    "\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "%%time\n",
+    "# Fit on the prepared training arrays in batches of 128 for `n_epoch` epochs.\n",
+    "network.fit(x=train_images, y=train_labels, batch_size=128, epochs=n_epoch)\n",
+    "\n"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### Listing 2.9 Evaluating the network\n",
+    "\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Compute loss and accuracy on the test arrays, then report the accuracy.\n",
+    "test_loss, test_acc = network.evaluate(x=test_images, y=test_labels)\n",
+    "print('test_acc:', test_acc)\n",
+    "\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": []
+  }
+ ],
+ "metadata": {
+  "colab": {
+   "provenance": []
+  },
+  "kernelspec": {
+   "display_name": "Python 3 (ipykernel)",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.10.0"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 4
+}