
Commit 18e87d2

Xhark authored and tensorflower-gardener committed
Add all trainable variables to the wrapper and preserve the order of the trainable weights as much as possible for custom layers.
Note that this CL increases the coverage of weight-order preservation, but it doesn't guarantee the same order in every case, because it relies on the Keras _dedup_weights method, which removes duplicated weights while maintaining order as much as possible. PiperOrigin-RevId: 391542287
1 parent d155948 commit 18e87d2
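The ordering behavior described in the commit message comes from Keras's internal _dedup_weights helper, which drops duplicate variable references while keeping the first occurrence of each. A minimal standalone sketch of that order-preserving deduplication (illustrative only, not the Keras internal itself):

def dedup_weights(weights):
  # Keep the first occurrence of each variable (identity-based), so weights
  # the wrapper collected first keep their position and repeats contributed
  # by the inner layer are dropped.
  seen_ids = set()
  deduped = []
  for weight in weights:
    if id(weight) not in seen_ids:
      seen_ids.add(id(weight))
      deduped.append(weight)
  return deduped

With this change, the wrapper effectively returns dedup_weights(wrapper_weights + inner_layer_weights), so the inner layer's weights, added to the wrapper during build(), come first and any duplicates are discarded.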

File tree

3 files changed: +69 −3 lines changed


tensorflow_model_optimization/python/core/quantization/keras/BUILD

Lines changed: 1 addition & 0 deletions
@@ -266,6 +266,7 @@ py_strict_test(
         ":quantize_config",
         ":quantize_layer",
         ":quantize_wrapper",
+        ":quantizers",
         # numpy dep1,
         # tensorflow dep1,
         "//tensorflow_model_optimization/python/core/keras:test_utils",

tensorflow_model_optimization/python/core/quantization/keras/quantize_test.py

Lines changed: 64 additions & 0 deletions
@@ -27,6 +27,7 @@
 from tensorflow_model_optimization.python.core.quantization.keras import quantize_config as quantize_config_mod
 from tensorflow_model_optimization.python.core.quantization.keras import quantize_layer
 from tensorflow_model_optimization.python.core.quantization.keras import quantize_wrapper as quantize_wrapper_mod
+from tensorflow_model_optimization.python.core.quantization.keras import quantizers
 from tensorflow_model_optimization.python.core.quantization.keras.default_8bit import default_8bit_quantize_registry
 
 quantize_annotate_layer = quantize.quantize_annotate_layer
@@ -513,6 +514,69 @@ def testQuantizeApply_RunsWhenNestedModelNotAnnotated(self):
 
     quantize_apply(annotated_model)
 
+  class CustomConvLayer(tf.keras.layers.Layer):
+
+    def __init__(self, name=None, **kwargs):
+      super().__init__(name=name, **kwargs)
+      self.conv1 = tf.keras.layers.Conv2D(2, 2)
+
+    def build(self, input_shape):
+      self.conv1.build(input_shape)
+
+    def call(self, inputs):
+      return self.conv1(inputs)
+
+    def get_config(self):
+      return {'name': self.name}
+
+  class CustomConvQuantizeConfig(quantize_config_mod.QuantizeConfig):
+
+    def get_weights_and_quantizers(self, layer):
+      return [(layer.conv1.kernel, quantizers.LastValueQuantizer(
+          num_bits=8, symmetric=True, narrow_range=False, per_axis=False)),]
+
+    def get_activations_and_quantizers(self, layer):
+      return []
+
+    def set_quantize_weights(self, layer, quantize_weights):
+      # layer.conv1._kernel_bak = layer.conv1.kernel
+      layer.conv1.kernel = quantize_weights[0]
+
+    def set_quantize_activations(self, layer, quantize_activations):
+      pass
+
+    def get_output_quantizers(self, layer):
+      return []
+
+    def get_config(self):
+      return {}
+
+  def testQuantizeApply_KeepTrainableWeightOrder(self):
+    layer = self.CustomConvLayer(input_shape=(28, 28, 3))
+    model = keras.Sequential([layer])
+
+    def apply_quantization_to_dense(layer):
+      if isinstance(layer, self.CustomConvLayer):
+        return quantize_annotate_layer(
+            layer, quantize_config=self.CustomConvQuantizeConfig())
+      return layer
+
+    annotated_model = tf.keras.models.clone_model(
+        model,
+        clone_function=apply_quantization_to_dense,
+    )
+
+    with quantize.quantize_scope({
+        'CustomConvQuantizeConfig': self.CustomConvQuantizeConfig,
+        'CustomConvLayer': self.CustomConvLayer
+    }):
+      quant_aware_model = quantize_apply(annotated_model)
+
+    self._assert_weights_different_objects(
+        model.trainable_weights, quant_aware_model.trainable_weights)
+    self._assert_weights_equal_value(
+        model.trainable_weights, quant_aware_model.trainable_weights)
+
 
 if __name__ == '__main__':
   tf.test.main()
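The new test relies on two assertion helpers, _assert_weights_different_objects and _assert_weights_equal_value, which are defined elsewhere in quantize_test.py and are not part of this diff. A plausible sketch of what they check, assuming tf.test.TestCase assertions (not the actual implementation):

  def _assert_weights_different_objects(self, weights1, weights2):
    # Same number of weights, and each position holds a distinct variable
    # object, since quantize_apply clones the model rather than reusing
    # the original variables.
    self.assertEqual(len(weights1), len(weights2))
    for w1, w2 in zip(weights1, weights2):
      self.assertIsNot(w1, w2)

  def _assert_weights_equal_value(self, weights1, weights2):
    # Position-by-position value equality, which only holds if the trainable
    # weight order is preserved after applying quantization.
    self.assertEqual(len(weights1), len(weights2))
    for w1, w2 in zip(weights1, weights2):
      self.assertAllEqual(w1, w2)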

tensorflow_model_optimization/python/core/quantization/keras/quantize_wrapper.py

Lines changed: 4 additions & 3 deletions
@@ -99,15 +99,14 @@ def build(self, input_shape):
         dtype=tf.dtypes.int32,
         trainable=False)
 
+    self._trainable_weights.extend(self.layer.trainable_weights)
     self._weight_vars = []
     for weight, quantizer in \
         self.quantize_config.get_weights_and_quantizers(self.layer):
       quantizer_vars = quantizer.build(weight.shape,
                                        self._weight_name(weight.name), self)
 
       self._weight_vars.append((weight, quantizer, quantizer_vars))
-      # Needed to ensure unquantized weights get trained as part of the wrapper.
-      self._trainable_weights.append(weight)
 
     self._quantize_activations = []
     for activation, quantizer in \
@@ -215,7 +214,9 @@ def trainable(self, value):
 
   @property
   def trainable_weights(self):
-    return self.layer.trainable_weights + self._trainable_weights
+    # Change the order to keep the weight order after applying QAT.
+    return self._dedup_weights(
+        self._trainable_weights + self.layer.trainable_weights)
 
   @property
   def non_trainable_weights(self):
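One way to observe the effect of this wrapper change is through the public tfmot API. A sketch (exact variable names and the set of trainable quantizer variables depend on the layer and quantization scheme):

import tensorflow as tf
import tensorflow_model_optimization as tfmot

float_model = tf.keras.Sequential([
    tf.keras.layers.Conv2D(2, 2, input_shape=(8, 8, 3)),
])
qat_model = tfmot.quantization.keras.quantize_model(float_model)

# With the ordering change, the float model's kernel and bias appear first in
# the quantize-aware model's trainable_weights, in the same relative order,
# followed by any trainable variables introduced by the quantize wrapper.
print([w.name for w in float_model.trainable_weights])
print([w.name for w in qat_model.trainable_weights])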
