Merge branch 'damienlancry-pytorch-integration' into dev

cosmic-cortex · cosmic-cortex · commit f40935870e2e · 2019-06-07T11:16:21.000+02:00
diff --git a/docs/source/content/examples/Pytorch_integration.ipynb b/docs/source/content/examples/Pytorch_integration.ipynb
@@ -0,0 +1,277 @@
+{
+ "cells": [
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "Pytorch models in modAL workflows\n",
+    "=============================\n",
+    "\n",
+    "Thanks to Skorch API, you can seamlessly integrate Pytorch models into your modAL workflow. In this tutorial, we shall quickly introduce how to use Skorch API of Keras and we are going to see how to do active learning with it. More details on the Keras scikit-learn API [can be found here](https://skorch.readthedocs.io/en/stable/).\n",
+    "\n",
+    "The executable script for this example can be [found here](https://github.com/cosmic-cortex/modAL/blob/master/examples/pytorch_integration.py)!"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "Skorch API\n",
+    "-----------------------\n",
+    "\n",
+    "By default, a Pytorch model's interface differs from what is used for scikit-learn estimators. However, with the use of Skorch wrapper, it is possible to adapt your model."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import torch\n",
+    "from torch import nn\n",
+    "from skorch import NeuralNetClassifier\n",
+    "\n",
+    "# build class for the skorch API\n",
+    "class Torch_Model(nn.Module):\n",
+    "    def __init__(self,):\n",
+    "        super(Torch_Model, self).__init__()\n",
+    "        self.convs = nn.Sequential(\n",
+    "                                nn.Conv2d(1,32,3),\n",
+    "                                nn.ReLU(),\n",
+    "                                nn.Conv2d(32,64,3),\n",
+    "                                nn.ReLU(),\n",
+    "                                nn.MaxPool2d(2),\n",
+    "                                nn.Dropout(0.25)\n",
+    "        )\n",
+    "        self.fcs = nn.Sequential(\n",
+    "                                nn.Linear(12*12*64,128),\n",
+    "                                nn.ReLU(),\n",
+    "                                nn.Dropout(0.5),\n",
+    "                                nn.Linear(128,10),\n",
+    "        )\n",
+    "\n",
+    "    def forward(self, x):\n",
+    "        out = x\n",
+    "        out = self.convs(out)\n",
+    "        out = out.view(-1,12*12*64)\n",
+    "        out = self.fcs(out)\n",
+    "        return out"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "For our purposes, the ``classifier`` which we will initialize now acts just like any scikit-learn estimator."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 2,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# create the classifier\n",
+    "device = \"cuda\" if torch.cuda.is_available() else \"cpu\"\n",
+    "classifier = NeuralNetClassifier(Torch_Model,\n",
+    "                                 criterion=nn.CrossEntropyLoss,\n",
+    "                                 optimizer=torch.optim.Adam,\n",
+    "                                 train_split=None,\n",
+    "                                 verbose=1,\n",
+    "                                 device=device)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "Active learning with Pytorch\n",
+    "---------------------------------------\n",
+    "\n",
+    "In this example, we are going to use the famous MNIST dataset, which is available as a built-in for PyTorch."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "\r",
+      "0it [00:00, ?it/s]"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Downloading http://yann.lecun.com/exdb/mnist/train-images-idx3-ubyte.gz to ./MNIST/raw/train-images-idx3-ubyte.gz\n"
+     ]
+    },
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      " 97%|█████████▋| 9584640/9912422 [00:15<00:00, 1777143.52it/s]"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Extracting ./MNIST/raw/train-images-idx3-ubyte.gz\n"
+     ]
+    },
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "\n",
+      "0it [00:00, ?it/s]\u001b[A"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Downloading http://yann.lecun.com/exdb/mnist/train-labels-idx1-ubyte.gz to ./MNIST/raw/train-labels-idx1-ubyte.gz\n"
+     ]
+    },
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "\n",
+      "  0%|          | 0/28881 [00:00<?, ?it/s]\u001b[A\n",
+      " 57%|█████▋    | 16384/28881 [00:00<00:00, 62622.03it/s]\u001b[A\n",
+      "32768it [00:00, 41627.01it/s]                           \u001b[A\n",
+      "0it [00:00, ?it/s]\u001b[A"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Extracting ./MNIST/raw/train-labels-idx1-ubyte.gz\n",
+      "Downloading http://yann.lecun.com/exdb/mnist/t10k-images-idx3-ubyte.gz to ./MNIST/raw/t10k-images-idx3-ubyte.gz\n"
+     ]
+    },
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "\n",
+      "  0%|          | 0/1648877 [00:00<?, ?it/s]\u001b[A"
+     ]
+    }
+   ],
+   "source": [
+    "import numpy as np\n",
+    "from torch.utils.data import DataLoader\n",
+    "from torchvision.transforms import ToTensor\n",
+    "from torchvision.datasets import MNIST\n",
+    "\n",
+    "\n",
+    "mnist_data = MNIST('.', download=True, transform=ToTensor())\n",
+    "dataloader = DataLoader(mnist_data, shuffle=True, batch_size=60000)\n",
+    "X, y = next(iter(dataloader))\n",
+    "\n",
+    "# read training data\n",
+    "X_train, X_test, y_train, y_test = X[:50000], X[50000:], y[:50000], y[50000:]\n",
+    "X_train = X_train.reshape(50000, 1, 28, 28)\n",
+    "X_test = X_test.reshape(10000, 1, 28, 28)\n",
+    "\n",
+    "# assemble initial data\n",
+    "n_initial = 1000\n",
+    "initial_idx = np.random.choice(range(len(X_train)), size=n_initial, replace=False)\n",
+    "X_initial = X_train[initial_idx]\n",
+    "y_initial = y_train[initial_idx]\n",
+    "\n",
+    "# generate the pool\n",
+    "# remove the initial data from the training dataset\n",
+    "X_pool = np.delete(X_train, initial_idx, axis=0)[:5000]\n",
+    "y_pool = np.delete(y_train, initial_idx, axis=0)[:5000]"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "Active learning with data and classifier ready is as easy as always. Because training is *very* expensive in large neural networks, this time we are going to query the best 200 instances each time we measure the uncertainty of the pool."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "from modAL.models import ActiveLearner\n",
+    "\n",
+    "# initialize ActiveLearner\n",
+    "learner = ActiveLearner(\n",
+    "    estimator=classifier,\n",
+    "    X_training=X_initial, y_training=y_initial,\n",
+    ")"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "To make sure that you train only on newly queried labels, pass ``only_new=True`` to the ``.teach()`` method of the learner."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# the active learning loop\n",
+    "n_queries = 10\n",
+    "for idx in range(n_queries):\n",
+    "    print('Query no. %d' % (idx + 1))\n",
+    "    query_idx, query_instance = learner.query(X_pool, n_instances=100)\n",
+    "    learner.teach(\n",
+    "        X=X_pool[query_idx], y=y_pool[query_idx], only_new=True,\n",
+    "    )\n",
+    "    # remove queried instance from pool\n",
+    "    X_pool = np.delete(X_pool, query_idx, axis=0)\n",
+    "    y_pool = np.delete(y_pool, query_idx, axis=0)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": []
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "Python [conda env:modAL] *",
+   "language": "python",
+   "name": "conda-env-modAL-py"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.7.3"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 2
+}
diff --git a/docs/source/index.rst b/docs/source/index.rst
@@ -67,6 +67,7 @@ Currently supported active learning strategies are
    content/examples/query_by_committee
    content/examples/bootstrapping_and_bagging
    content/examples/Keras_integration
+   content/examples/Pytorch_integration
    
 .. toctree::
    :glob:
diff --git a/examples/pytorch_integration.py b/examples/pytorch_integration.py
@@ -0,0 +1,103 @@
+"""
+This example demonstrates how to use the active learning interface with Pytorch.
+The example uses Skorch, a scikit learn wrapper of Pytorch.
+For more info, see https://skorch.readthedocs.io/en/stable/
+"""
+
+import torch
+import numpy as np
+
+from torch import nn
+from torch.utils.data import DataLoader
+from torchvision.transforms import ToTensor
+from torchvision.datasets import MNIST
+from skorch import NeuralNetClassifier
+
+from modAL.models import ActiveLearner
+
+
+# build class for the skorch API
+class Torch_Model(nn.Module):
+    def __init__(self,):
+        super(Torch_Model, self).__init__()
+        self.convs = nn.Sequential(
+                                nn.Conv2d(1,32,3),
+                                nn.ReLU(),
+                                nn.Conv2d(32,64,3),
+                                nn.ReLU(),
+                                nn.MaxPool2d(2),
+                                nn.Dropout(0.25)
+        )
+        self.fcs = nn.Sequential(
+                                nn.Linear(12*12*64,128),
+                                nn.ReLU(),
+                                nn.Dropout(0.5),
+                                nn.Linear(128,10),
+        )
+
+    def forward(self, x):
+        out = x
+        out = self.convs(out)
+        out = out.view(-1,12*12*64)
+        out = self.fcs(out)
+        return out
+
+
+# create the classifier
+device = "cuda" if torch.cuda.is_available() else "cpu"
+classifier = NeuralNetClassifier(Torch_Model,
+                                 # max_epochs=100,
+                                 criterion=nn.CrossEntropyLoss,
+                                 optimizer=torch.optim.Adam,
+                                 train_split=None,
+                                 verbose=1,
+                                 device=device)
+
+"""
+Data wrangling
+1. Reading data from torchvision
+2. Assembling initial training data for ActiveLearner
+3. Generating the pool
+"""
+
+mnist_data = MNIST('.', download=True, transform=ToTensor())
+dataloader = DataLoader(mnist_data, shuffle=True, batch_size=60000)
+X, y = next(iter(dataloader))
+
+# read training data
+X_train, X_test, y_train, y_test = X[:50000], X[50000:], y[:50000], y[50000:]
+X_train = X_train.reshape(50000, 1, 28, 28)
+X_test = X_test.reshape(10000, 1, 28, 28)
+
+# assemble initial data
+n_initial = 1000
+initial_idx = np.random.choice(range(len(X_train)), size=n_initial, replace=False)
+X_initial = X_train[initial_idx]
+y_initial = y_train[initial_idx]
+
+# generate the pool
+# remove the initial data from the training dataset
+X_pool = np.delete(X_train, initial_idx, axis=0)
+y_pool = np.delete(y_train, initial_idx, axis=0)
+
+"""
+Training the ActiveLearner
+"""
+
+# initialize ActiveLearner
+learner = ActiveLearner(
+    estimator=classifier,
+    X_training=X_initial, y_training=y_initial,
+)
+
+# the active learning loop
+n_queries = 10
+for idx in range(n_queries):
+    query_idx, query_instance = learner.query(X_pool, n_instances=100)
+    learner.teach(X_pool[query_idx], y_pool[query_idx], only_new=True)
+    # remove queried instance from pool
+    X_pool = np.delete(X_pool, query_idx, axis=0)
+    y_pool = np.delete(y_pool, query_idx, axis=0)
+
+# the final accuracy score
+print(learner.score(X_test, y_test))
diff --git a/modAL/utils/data.py b/modAL/utils/data.py
@@ -25,4 +25,7 @@ def data_vstack(blocks: Container) -> modALinput:
     elif sp.issparse(blocks[0]):
         return sp.vstack(blocks)
     else:
-        raise TypeError('%s datatype is not supported' % type(blocks[0]))
+        try:
+            return np.concatenate(blocks)
+        except:
+            raise TypeError('%s datatype is not supported' % type(blocks[0]))