
Commit eefc66a

Xhark authored and tensorflower-gardener committed
Add all trainable variables to the wrapper and keep the order of the training weights as much as possible for the custom layer.
Note that this CL increases the coverage of keeping weight order, but doesn't guarantee the same order in every case, because it uses the Keras _dedup_weights method, which removes duplicated weights while maintaining order as much as possible. PiperOrigin-RevId: 393035727
1 parent 18e87d2 commit eefc66a
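
The _dedup_weights behavior mentioned in the commit message removes duplicate variables from a weight list while preserving first-seen order. Below is a minimal illustrative sketch of that behavior; it is not the actual Keras implementation.

def dedup_weights(weights):
  # Order-preserving de-duplication by object identity. Illustrative sketch
  # only; the real Keras _dedup_weights helper may differ in details.
  output, seen = [], set()
  for w in weights:
    if id(w) not in seen:
      seen.add(id(w))
      output.append(w)
  return output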

File tree

3 files changed: +3, -69 lines


tensorflow_model_optimization/python/core/quantization/keras/BUILD

Lines changed: 0 additions & 1 deletion

@@ -266,7 +266,6 @@ py_strict_test(
         ":quantize_config",
         ":quantize_layer",
         ":quantize_wrapper",
-        ":quantizers",
         # numpy dep1,
         # tensorflow dep1,
         "//tensorflow_model_optimization/python/core/keras:test_utils",

tensorflow_model_optimization/python/core/quantization/keras/quantize_test.py

Lines changed: 0 additions & 64 deletions

@@ -27,7 +27,6 @@
 from tensorflow_model_optimization.python.core.quantization.keras import quantize_config as quantize_config_mod
 from tensorflow_model_optimization.python.core.quantization.keras import quantize_layer
 from tensorflow_model_optimization.python.core.quantization.keras import quantize_wrapper as quantize_wrapper_mod
-from tensorflow_model_optimization.python.core.quantization.keras import quantizers
 from tensorflow_model_optimization.python.core.quantization.keras.default_8bit import default_8bit_quantize_registry

 quantize_annotate_layer = quantize.quantize_annotate_layer

@@ -514,69 +513,6 @@ def testQuantizeApply_RunsWhenNestedModelNotAnnotated(self):

     quantize_apply(annotated_model)

-  class CustomConvLayer(tf.keras.layers.Layer):
-
-    def __init__(self, name=None, **kwargs):
-      super().__init__(name=name, **kwargs)
-      self.conv1 = tf.keras.layers.Conv2D(2, 2)
-
-    def build(self, input_shape):
-      self.conv1.build(input_shape)
-
-    def call(self, inputs):
-      return self.conv1(inputs)
-
-    def get_config(self):
-      return {'name': self.name}
-
-  class CustomConvQuantizeConfig(quantize_config_mod.QuantizeConfig):
-
-    def get_weights_and_quantizers(self, layer):
-      return [(layer.conv1.kernel, quantizers.LastValueQuantizer(
-          num_bits=8, symmetric=True, narrow_range=False, per_axis=False)),]
-
-    def get_activations_and_quantizers(self, layer):
-      return []
-
-    def set_quantize_weights(self, layer, quantize_weights):
-      # layer.conv1._kernel_bak = layer.conv1.kernel
-      layer.conv1.kernel = quantize_weights[0]
-
-    def set_quantize_activations(self, layer, quantize_activations):
-      pass
-
-    def get_output_quantizers(self, layer):
-      return []
-
-    def get_config(self):
-      return {}
-
-  def testQuantizeApply_KeepTrainableWeightOrder(self):
-    layer = self.CustomConvLayer(input_shape=(28, 28, 3))
-    model = keras.Sequential([layer])
-
-    def apply_quantization_to_dense(layer):
-      if isinstance(layer, self.CustomConvLayer):
-        return quantize_annotate_layer(
-            layer, quantize_config=self.CustomConvQuantizeConfig())
-      return layer
-
-    annotated_model = tf.keras.models.clone_model(
-        model,
-        clone_function=apply_quantization_to_dense,
-    )
-
-    with quantize.quantize_scope({
-        'CustomConvQuantizeConfig': self.CustomConvQuantizeConfig,
-        'CustomConvLayer': self.CustomConvLayer
-    }):
-      quant_aware_model = quantize_apply(annotated_model)
-
-    self._assert_weights_different_objects(
-        model.trainable_weights, quant_aware_model.trainable_weights)
-    self._assert_weights_equal_value(
-        model.trainable_weights, quant_aware_model.trainable_weights)
-

 if __name__ == '__main__':
   tf.test.main()
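
The removed test above calls two assertion helpers, _assert_weights_different_objects and _assert_weights_equal_value, which are defined elsewhere in quantize_test.py and are not part of this diff. The following is a hedged sketch of what such helpers typically check; the real implementations may differ.

import tensorflow as tf

class WeightAssertionsSketch(tf.test.TestCase):
  # Illustrative sketch only; not the helpers actually used by quantize_test.py.

  def _assert_weights_different_objects(self, weights_a, weights_b):
    # Quantization wrapping is expected to expose new variable objects.
    self.assertEqual(len(weights_a), len(weights_b))
    for a, b in zip(weights_a, weights_b):
      self.assertIsNot(a, b)

  def _assert_weights_equal_value(self, weights_a, weights_b):
    # The new variables should still hold the original values, in the same order.
    self.assertEqual(len(weights_a), len(weights_b))
    for a, b in zip(weights_a, weights_b):
      self.assertAllClose(a.numpy(), b.numpy())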

tensorflow_model_optimization/python/core/quantization/keras/quantize_wrapper.py

Lines changed: 3 additions & 4 deletions

@@ -99,14 +99,15 @@ def build(self, input_shape):
         dtype=tf.dtypes.int32,
         trainable=False)

-    self._trainable_weights.extend(self.layer.trainable_weights)
     self._weight_vars = []
     for weight, quantizer in \
         self.quantize_config.get_weights_and_quantizers(self.layer):
       quantizer_vars = quantizer.build(weight.shape,
                                        self._weight_name(weight.name), self)

       self._weight_vars.append((weight, quantizer, quantizer_vars))
+      # Needed to ensure unquantized weights get trained as part of the wrapper.
+      self._trainable_weights.append(weight)

     self._quantize_activations = []
     for activation, quantizer in \

@@ -214,9 +215,7 @@ def trainable(self, value):

   @property
   def trainable_weights(self):
-    # Change the order to keep the weight order after applying QAT.
-    return self._dedup_weights(
-        self._trainable_weights + self.layer.trainable_weights)
+    return self.layer.trainable_weights + self._trainable_weights

   @property
   def non_trainable_weights(self):
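
The quantize_wrapper.py hunks above change both where the wrapped layer's weights are registered (a per-weight append inside build rather than a bulk extend) and how the trainable_weights property orders them. Below is a simplified sketch of the two orderings as they appear in this diff, using hypothetical names inner_weights (standing in for self.layer.trainable_weights) and wrapper_weights (standing in for self._trainable_weights).

def dedup(weights):
  # Order-preserving de-duplication by identity (see the earlier sketch).
  output, seen = [], set()
  for w in weights:
    if id(w) not in seen:
      seen.add(id(w))
      output.append(w)
  return output

def trainable_weights_removed_variant(wrapper_weights, inner_weights):
  # Variant on the removed (-) lines: wrapper-held variables first, then the
  # inner layer's weights, with duplicates dropped while keeping first-seen order.
  return dedup(wrapper_weights + inner_weights)

def trainable_weights_added_variant(wrapper_weights, inner_weights):
  # Variant on the added (+) line: the inner layer's weights lead, followed by
  # the wrapper's own variables (quantizer state and the appended raw weights).
  return inner_weights + wrapper_weights

Only the removed variant de-duplicates, which matters when the two lists share variable objects; the ordering a training loop sees therefore depends on which variant is in effect.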
