"""
This example walks through the basic modAL PyTorch DeepActiveLearner workflow
on the MNIST dataset, using the MC-Dropout BALD query strategy.
"""
import torch
from torch import nn
from skorch import NeuralNetClassifier

from modAL.models import DeepActiveLearner

# query strategies (mc_dropout_mean_st is imported as an alternative to mc_dropout_bald)
from modAL.dropout import mc_dropout_bald, mc_dropout_mean_st

import numpy as np
from torch.utils.data import DataLoader
from torchvision.transforms import ToTensor
from torchvision.datasets import MNIST

# A standard PyTorch model (see the PyTorch documentation for details)
class Torch_Model(nn.Module):
    def __init__(self):
        super(Torch_Model, self).__init__()
        # convolutional part: (N, 1, 28, 28) -> (N, 64, 12, 12)
        self.convs = nn.Sequential(
            nn.Conv2d(1, 32, 3),
            nn.ReLU(),
            nn.Conv2d(32, 64, 3),
            nn.ReLU(),
            nn.MaxPool2d(2),
            nn.Dropout(0.25)
        )
        # fully connected part: flattened features -> 10 class logits
        self.fcs = nn.Sequential(
            nn.Linear(12*12*64, 128),
            nn.ReLU(),
            nn.Dropout(0.5),
            nn.Linear(128, 10),
        )

    def forward(self, x):
        out = x
        out = self.convs(out)
        out = out.view(-1, 12*12*64)  # flatten: (N, 64, 12, 12) -> (N, 9216)
        out = self.fcs(out)
        return out


torch_model = Torch_Model()
"""
From layer_list you can read off the dropout_layer_indexes, which can then be
passed to the query strategies to decide which dropout layers should be active
during prediction. When no dropout_layer_indexes are passed, all dropout layers
are activated by default.
"""
layer_list = list(torch_model.modules())
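
# A small illustration (added to the original example): the dropout layer
# indexes used further below can be derived from layer_list instead of being
# hard-coded, since Module.modules() enumerates every submodule in order.
dropout_layer_indexes = [idx for idx, module in enumerate(layer_list)
                         if isinstance(module, nn.Dropout)]
print("Dropout layers found at indexes:", dropout_layer_indexes)  # [7, 11]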

device = "cuda" if torch.cuda.is_available() else "cpu"

# Use the NeuralNetClassifier from skorch to wrap the PyTorch model in the scikit-learn API
classifier = NeuralNetClassifier(Torch_Model,
                                 criterion=torch.nn.CrossEntropyLoss,
                                 optimizer=torch.optim.Adam,
                                 train_split=None,
                                 verbose=1,
                                 device=device)
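
# Note added for clarity (based on skorch's documented behaviour):
# train_split=None disables skorch's internal train/validation split, so all
# data passed to fit() is used for training; learner.teach() below ultimately
# calls fit() on this wrapped estimator.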


# load the dataset
mnist_data = MNIST('.', download=True, transform=ToTensor())
dataloader = DataLoader(mnist_data, shuffle=True, batch_size=60000)
X, y = next(iter(dataloader))

# split into training and test data
X_train, X_test, y_train, y_test = X[:50000], X[50000:], y[:50000], y[50000:]
X_train = X_train.reshape(50000, 1, 28, 28)
X_test = X_test.reshape(10000, 1, 28, 28)
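
# Sanity check (added to the original example): ToTensor plus the DataLoader
# already yield batches of shape (N, 1, 28, 28), so the reshapes above are
# effectively no-ops; these asserts just make the expected shapes explicit.
assert X_train.shape == (50000, 1, 28, 28)
assert X_test.shape == (10000, 1, 28, 28)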

# assemble the initial labeled data
n_initial = 1000
initial_idx = np.random.choice(
    range(len(X_train)), size=n_initial, replace=False)
X_initial = X_train[initial_idx]
y_initial = y_train[initial_idx]


# generate the pool: remove the initial data from the training dataset
# (only the first 5000 samples are kept, presumably to keep the demo fast;
# note that np.delete on a torch tensor returns a NumPy array, so the pool
# is NumPy from here on)
X_pool = np.delete(X_train, initial_idx, axis=0)[:5000]
y_pool = np.delete(y_train, initial_idx, axis=0)[:5000]


# initialize the DeepActiveLearner (pass it the skorch-wrapped PyTorch model
# and the query strategy)
learner = DeepActiveLearner(
    estimator=classifier,
    query_strategy=mc_dropout_bald,
)
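# The query strategy is interchangeable (an illustration added to the original
# example): the imported mc_dropout_mean_st could be plugged in the same way.
# learner_mean_st = DeepActiveLearner(
#     estimator=classifier,
#     query_strategy=mc_dropout_mean_st,
# )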
# initial teaching if desired (not necessary)
learner.teach(X_initial, y_initial)

print("Score on the pool (sklearn accuracy): {}".format(learner.score(X_pool, y_pool)))


# the active learning loop
n_queries = 10
X_teach = X_initial
y_teach = y_initial


for idx in range(n_queries):
    print('Query no. %d' % (idx + 1))
    """
    Query new data (num_cycles is the number of dropout forward passes to perform)
    --> check the documentation of mc_dropout_bald in modAL/dropout.py to see all available parameters
    """
    query_idx, metric_values = learner.query(
        X_pool, n_instances=100, dropout_layer_indexes=[7, 11], num_cycles=10)
    # add the queried instances to the accumulated training set
    # (X_pool is a NumPy array by now, so convert the slices back to tensors)
    X_teach = torch.cat((X_teach, torch.from_numpy(X_pool[query_idx])))
    y_teach = torch.cat((y_teach, torch.from_numpy(y_pool[query_idx])))
    learner.teach(X_teach, y_teach)

    # remove the queried instances from the pool
    X_pool = np.delete(X_pool, query_idx, axis=0)
    y_pool = np.delete(y_pool, query_idx, axis=0)

    # report the model performance on the held-out test set
    print("Model score: {}".format(learner.score(X_test, y_test)))