Addressed reviewer's comments. Added test that demonstrates that 'bias' is not clustered by default.

wwwind · wwwind · commit c5f42abc55c7 · 2021-02-18T18:10:07.000Z
Change-Id: I6e21506d8c44cb6dbaa9200d1f87918df1982da9
diff --git a/tensorflow_model_optimization/python/core/clustering/keras/BUILD b/tensorflow_model_optimization/python/core/clustering/keras/BUILD
@@ -166,8 +166,19 @@ py_test(
 )
 
 py_test(
-    name = "mnist_customerable_test",
-    srcs = ["mnist_customerable_test.py"],
+    name = "mnist_clusterable_layer_test",
+    srcs = ["mnist_clusterable_layer_test.py"],
+    python_version = "PY3",
+    visibility = ["//visibility:public"],
+    deps = [
+        ":cluster"
+        # tensorflow dep1,
+    ],
+)
+
+py_test(
+    name = "mnist_clustering_test",
+    srcs = ["mnist_clustering_test.py"],
     python_version = "PY3",
     visibility = ["//visibility:public"],
     deps = [
diff --git a/tensorflow_model_optimization/python/core/clustering/keras/cluster_test.py b/tensorflow_model_optimization/python/core/clustering/keras/cluster_test.py
@@ -55,7 +55,7 @@ class CustomNonClusterableLayer(layers.Dense):
   pass
 
 
-class MyCustomerableLayer(keras.layers.Dense,
+class MyClusterableLayer(keras.layers.Dense,
   clusterable_layer.ClusterableLayer):
 
   def __init__(self, num_units):
@@ -65,7 +65,7 @@ def get_clusterable_weights(self):
     # Cluster kernel and bias.
     return [('kernel', self.kernel), ('bias', self.bias)]
 
-class MyCustomerableLayerInvalid(keras.layers.Dense,
+class MyClusterableLayerInvalid(keras.layers.Dense,
   clusterable_layer.ClusterableLayer):
   """ This layer is invalid, because it does not provide
   get_clusterable_weights function.
@@ -107,8 +107,7 @@ def setUp(self):
     self.custom_clusterable_layer = CustomClusterableLayer(10)
     self.custom_non_clusterable_layer = CustomNonClusterableLayer(10)
     self.keras_depthwiseconv2d_layer = layers.DepthwiseConv2D((3, 3), (1, 1))
-    self.customerable_layer = MyCustomerableLayer(10)
-    self.keras_custom_layer = KerasCustomLayer()
+    self.clusterable_layer = MyClusterableLayer(10)
 
     clustering_registry.ClusteringLookupRegistry.register_new_implementation(
         {
@@ -225,12 +224,12 @@ def testClusterCustomNonClusterableLayer(self):
       cluster_wrapper.ClusterWeights(custom_non_clusterable_layer,
                                      **self.params)
 
-  def testClusterMyCustomerableLayer(self):
+  def testClusterMyClusterableLayer(self):
     # we have weights to cluster.
-    customerable_layer = self.customerable_layer
-    customerable_layer.build(input_shape=(10, 10))
+    clusterable_layer = self.clusterable_layer
+    clusterable_layer.build(input_shape=(10, 10))
 
-    wrapped_layer = cluster_wrapper.ClusterWeights(customerable_layer,
+    wrapped_layer = cluster_wrapper.ClusterWeights(clusterable_layer,
                                      **self.params)
 
     self.assertIsInstance(wrapped_layer, cluster_wrapper.ClusterWeights)
@@ -239,40 +238,24 @@ def testKerasCustomLayerClusterable(self):
     """
-    Verifies that we can wrap keras custom layer that is customerable.
+    Verifies that we can wrap keras custom layer that is clusterable.
     """
-    customerable_layer = KerasCustomLayerClusterable()
-    wrapped_layer = cluster_wrapper.ClusterWeights(customerable_layer,
+    clusterable_layer = KerasCustomLayerClusterable()
+    wrapped_layer = cluster_wrapper.ClusterWeights(clusterable_layer,
                                      **self.params)
 
     self.assertIsInstance(wrapped_layer, cluster_wrapper.ClusterWeights)
 
-  def testClusterMyCustomerableLayerInvalid(self):
+  def testClusterMyClusterableLayerInvalid(self):
     """
     Verifies that assertion is thrown when function
     get_clusterable_weights is not provided.
     """
     with self.assertRaises(TypeError):
-      MyCustomerableLayerInvalid(10) # pylint: disable=abstract-class-instantiated
+      MyClusterableLayerInvalid(10) # pylint: disable=abstract-class-instantiated
 
-  def testClusterKerasCustomLayer(self):
-    """
-    Verifies that attempting to cluster a keras custom layer raises
-    an exception.
-    """
-    # If layer is not built, it has not weights, so
-    # we just skip it.
-    keras_custom_layer = self.keras_custom_layer
-    cluster_wrapper.ClusterWeights(keras_custom_layer,
-                                  **self.params)
-    # We need to build weights before check that clustering is not supported.
-    keras_custom_layer.build(input_shape=(10, 10))
-    with self.assertRaises(ValueError):
-      cluster_wrapper.ClusterWeights(keras_custom_layer,
-                                     **self.params)
-
->>>>>>> 8fe29ec... MLTOOLS-1031 Customerable layer API.
   @keras_parameterized.run_all_keras_modes
   def testClusterSequentialModelSelectively(self):
     clustered_model = keras.Sequential()
+    clustered_model.add(cluster.cluster_weights(self.keras_clusterable_layer, **self.params))
     clustered_model.add(self.keras_clusterable_layer)
     clustered_model.build(input_shape=(1, 10))
 
diff --git a/tensorflow_model_optimization/python/core/clustering/keras/mnist_clusterable_layer_test.py b/tensorflow_model_optimization/python/core/clustering/keras/mnist_clusterable_layer_test.py
@@ -12,7 +12,7 @@
 # See the License for the specific language governing permissions and
 # limitations under the License.
 # ==============================================================================
-"""Tests for a simple convnet with customerable layer on the MNIST dataset. """
+"""Tests for a simple convnet with clusterable layer on the MNIST dataset. """
 
 import tensorflow as tf
 
@@ -38,7 +38,7 @@ def get_clusterable_weights(self):
     # Cluster kernel and bias.
     return [('kernel', self.kernel), ('bias', self.bias)]
 
-class CustomerableWeightsCA(clustering_registry.AbstractClusteringAlgorithm):
+class ClusterableWeightsCA(clustering_registry.AbstractClusteringAlgorithm):
   """
-    This class provided a special lookup function for the the weights 'w'.
+    This class provides a special lookup function for the weights 'w'.
     It reshapes and tile centroids the same way as the weights. This allows us
@@ -58,10 +58,10 @@ def get_pulling_indices(self, weight):
 
     return pulling_indices
 
-class MyCustomerableLayer(keras.layers.Layer, clusterable_layer.ClusterableLayer):
+class MyClusterableLayer(keras.layers.Layer, clusterable_layer.ClusterableLayer):
 
   def __init__(self, units=32):
-    super(MyCustomerableLayer, self).__init__()
+    super(MyClusterableLayer, self).__init__()
     self.units = units
 
   def build(self, input_shape):
@@ -87,7 +87,7 @@ def get_clusterable_algorithm(self, weight_name):
     """ Returns clustering algorithm for the custom weights 'w'.
     """
     if weight_name == 'w':
-      return CustomerableWeightsCA
+      return ClusterableWeightsCA
     else:
       # We don't cluster other weights.
       return None
@@ -110,7 +110,7 @@ def _build_model():
 
 def _build_model_2():
   """
-  Builds model with MyCustomerableLayer layer.
+  Builds model with MyClusterableLayer layer.
   """
   i = tf.keras.layers.Input(shape=(28, 28), name='input')
   x = tf.keras.layers.Reshape((28, 28, 1))(i)
@@ -119,7 +119,7 @@ def _build_model_2():
           x)
   x = tf.keras.layers.MaxPool2D(2, 2)(x)
   x = tf.keras.layers.Flatten()(x)
-  output = MyCustomerableLayer(units=10)(x)
+  output = MyClusterableLayer(units=10)(x)
 
   model = tf.keras.Model(inputs=[i], outputs=[output])
   return model
@@ -220,13 +220,13 @@ def testMnistMyDenseLayer(self):
     self.assertLessEqual(nr_of_unique_weights, NUMBER_OF_CLUSTERS)
 
     # checks 'bias' weights of the last layer: MyDenseLayer
-    nr_of_unique_weights = _get_number_of_unique_weights(clustered_model, -1, 0)
+    nr_of_unique_weights = _get_number_of_unique_weights(clustered_model, -1, 1)
     self.assertLessEqual(nr_of_unique_weights, NUMBER_OF_CLUSTERS)
 
-  def testMnistCustomerableLayer(self):
+  def testMnistClusterableLayer(self):
     """ We test the keras custom layer with the provided
-      clustering algorithm (see MyCustomerableLayer above).
-      We cluster only 'w' weights and the class CustomerableWeightsCA
+      clustering algorithm (see MyClusterableLayer above).
+      We cluster only 'w' weights and the class ClusterableWeightsCA
       provides the function get_pulling_indices for the
       layer-out of 'w' weights.
 
diff --git a/tensorflow_model_optimization/python/core/clustering/keras/mnist_clustering_test.py b/tensorflow_model_optimization/python/core/clustering/keras/mnist_clustering_test.py
@@ -0,0 +1,143 @@
+# Copyright 2021 The TensorFlow Authors. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# ==============================================================================
+"""Tests default weight clustering of a simple convnet on the MNIST dataset."""
+
+import tensorflow as tf
+
+from tensorflow_model_optimization.python.core.clustering.keras import cluster
+from tensorflow_model_optimization.python.core.clustering.keras import cluster_config
+from tensorflow_model_optimization.python.core.clustering.keras import clusterable_layer
+from tensorflow_model_optimization.python.core.clustering.keras import clustering_registry
+
+tf.random.set_seed(42)
+
+keras = tf.keras
+
+EPOCHS = 7
+EPOCHS_FINE_TUNING = 4
+NUMBER_OF_CLUSTERS = 8
+
+def _build_model():
+  """
+  Builds simple CNN model.
+  """
+  i = tf.keras.layers.Input(shape=(28, 28), name='input')
+  x = tf.keras.layers.Reshape((28, 28, 1))(i)
+  x = tf.keras.layers.Conv2D(
+      filters=12, kernel_size=(3, 3), activation='relu', name='conv1')(
+          x)
+  x = tf.keras.layers.MaxPool2D(2, 2)(x)
+  x = tf.keras.layers.Flatten()(x)
+  output = tf.keras.layers.Dense(units=10)(x)
+
+  model = tf.keras.Model(inputs=[i], outputs=[output])
+  return model
+
+def _get_dataset():
+  mnist = tf.keras.datasets.mnist
+  (x_train, y_train), (x_test, y_test) = mnist.load_data()
+  x_train, x_test = x_train / 255.0, x_test / 255.0
+  # Use only the first 1000 of the 60000 training examples to keep the test fast.
+  x_train = x_train[0:1000]
+  y_train = y_train[0:1000]
+  return (x_train, y_train), (x_test, y_test)
+
+
+def _train_model(model):
+  loss_fn = tf.keras.losses.SparseCategoricalCrossentropy(from_logits=True)
+
+  model.compile(optimizer='adam', loss=loss_fn, metrics=['accuracy'])
+
+  (x_train, y_train), _ = _get_dataset()
+
+  model.fit(x_train, y_train, epochs=EPOCHS)
+
+def _cluster_model(model, number_of_clusters):
+  """Clusters `model`, fine-tunes it and returns it with clustering stripped."""
+  (x_train, y_train), _ = _get_dataset()
+
+  clustering_params = {
+      # Use the caller-supplied value, not the module-level constant.
+      'number_of_clusters': number_of_clusters,
+      'cluster_centroids_init':
+          cluster_config.CentroidInitialization.KMEANS_PLUS_PLUS,
+  }
+
+  # Cluster model
+  clustered_model = cluster.cluster_weights(model, **clustering_params)
+
+  # Use a smaller learning rate for fine-tuning the clustered model.
+  opt = tf.keras.optimizers.Adam(learning_rate=1e-5)
+
+  clustered_model.compile(
+      loss=tf.keras.losses.SparseCategoricalCrossentropy(from_logits=True),
+      optimizer=opt,
+      metrics=['accuracy'])
+
+  # Fine-tune clustered model
+  clustered_model.fit(x_train, y_train, epochs=EPOCHS_FINE_TUNING)
+
+  # Remove the clustering wrappers, then re-compile so that the returned
+  # model can be evaluated by the caller.
+  stripped_model = cluster.strip_clustering(clustered_model)
+  stripped_model.compile(
+      loss=tf.keras.losses.SparseCategoricalCrossentropy(from_logits=True),
+      optimizer=opt,
+      metrics=['accuracy'])
+
+  return stripped_model
+
+def _get_number_of_unique_weights(stripped_model, layer_nr, weights_nr):
+  weights_as_list = stripped_model.layers[layer_nr].get_weights()[weights_nr].reshape(-1,).tolist()
+  nr_of_unique_weights = len(set(weights_as_list))
+
+  return nr_of_unique_weights
+
+class FunctionalTest(tf.test.TestCase):
+
+  def testMnist(self):
+    """ In this test we test that 'kernel' weights
+    are clustered and that 'bias' weights are not.
+    """
+    model = _build_model()
+    _train_model(model)
+
+    # Checks that number of original weights('kernel') is greater than the number of clusters
+    nr_of_unique_weights = _get_number_of_unique_weights(model, -1, 0)
+    self.assertGreater(nr_of_unique_weights, NUMBER_OF_CLUSTERS)
+
+    # Record the number of unique values of 'bias'
+    nr_of_bias_weights = _get_number_of_unique_weights(model, -1, 1)
+
+    _, (x_test, y_test) = _get_dataset()
+
+    results_original = model.evaluate(x_test, y_test)
+    self.assertGreater(results_original[1], 0.85)
+
+    clustered_model = _cluster_model(model, NUMBER_OF_CLUSTERS)
+
+    results = clustered_model.evaluate(x_test, y_test)
+
+    self.assertGreater(results[1], 0.85)
+
+    nr_of_unique_weights = _get_number_of_unique_weights(clustered_model, -1, 0)
+    self.assertLessEqual(nr_of_unique_weights, NUMBER_OF_CLUSTERS)
+
+    # checks that we don't cluster 'bias' weights
+    clustered_nr_of_bias_weights = _get_number_of_unique_weights(clustered_model, -1, 1)
+    self.assertEqual(nr_of_bias_weights, clustered_nr_of_bias_weights)
+
+if __name__ == '__main__':
+  tf.test.main()