Makes index_ranges always iterable.

Johannes Ballé · copybara-github · commit 0c0e40f3899b · 2021-02-03T15:29:23.000-08:00
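Previously, passing a single integer as index_ranges implied that `indexes`
has no channel dimension. We now allow an omitted channel dimension via
channel_axis=None instead (only permitted when index_ranges has length 1).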

PiperOrigin-RevId: 355495759
Change-Id: I52281d18d726384341c8a818c4b49b0d4196cc96
diff --git a/tensorflow_compression/python/entropy_models/continuous_indexed.py b/tensorflow_compression/python/entropy_models/continuous_indexed.py
@@ -59,16 +59,16 @@ class ContinuousIndexedEntropyModel(continuous_base.ContinuousEntropyModelBase):
   each bottleneck tensor element, it selects the appropriate scalar
   distribution.
 
-  The `indexes` tensor must contain only integer values (but may have
-  floating-point type for purposes of backpropagation) in a pre-specified range.
-  If `index_ranges` is a single integer, the index values must be in the range
-  `[0, index_ranges)` and `indexes` must have the same shape as the bottleneck
-  tensor. This only allows a one-dimensional conditional dependency. To make the
-  distribution conditional on `n`-dimensional indexes, `index_ranges` must be
-  specified as an iterable of `n` integers. Then, `indexes` must have the same
+  The `indexes` tensor must contain only integer values in a pre-specified range
+  (but may have floating-point type for purposes of backpropagation). To make
+  the distribution conditional on `n`-dimensional indexes, `index_ranges` must
+  be specified as an iterable of `n` integers. `indexes` must have the same
   shape as the bottleneck tensor with an additional channel dimension of length
   `n`. The position of the channel dimension is given by `channel_axis`. The
-  index values in the `n`th channel must be in the range `[0, index_ranges[n])`.
+  index values in the `k`th channel must be in the range `[0, index_ranges[k])`.
+  If `index_ranges` has only one element (i.e. `n == 1`), `channel_axis` may be
+  `None`. In that case, the additional channel dimension is omitted, and the
+  `indexes` tensor must have the same shape as the bottleneck tensor.
 
   The implied distribution for the bottleneck tensor is determined as:
   ```
@@ -89,12 +89,13 @@ class ContinuousIndexedEntropyModel(continuous_base.ContinuousEntropyModelBase):
   ```
   tfc.ContinuousIndexedEntropyModel(
       prior_fn=tfc.NoisyNormal,
-      index_ranges=64,
+      index_ranges=(64,),
       parameter_fns=dict(
           loc=lambda _: 0.,
           scale=lambda i: tf.exp(i / 8 - 5),
       ),
       coding_rank=1,
+      channel_axis=None,
   )
   ```
   Then, each element of `indexes` in the range `[0, 64)` would indicate that the
@@ -149,12 +150,10 @@ def __init__(self,
         since this is the marginal distribution for bottleneck dimensions that
         are constant. The callable will receive keyword arguments as determined
         by `parameter_fns`.
-      index_ranges: Integer or iterable of integers. If a single integer,
-        `indexes` must have the same shape as `bottleneck`, and `channel_axis`
-        is ignored. Its values must be in the range `[0, index_ranges)`. If an
-        iterable of integers, `indexes` must have an additional dimension at
-        position `channel_axis`, and the values of the `n`th channel must be in
-        the range `[0, index_ranges[n])`.
+      index_ranges: Iterable of integers. `indexes` must have the same shape as
+        the bottleneck tensor, with an additional dimension at position
+        `channel_axis`. The values of the `k`th channel must be in the range
+        `[0, index_ranges[k])`.
       parameter_fns: Dict of strings to callables. Functions mapping `indexes`
         to each distribution parameter. For each item, `indexes` is passed to
         the callable, and the string key and return value make up one keyword
@@ -167,9 +166,10 @@ def __init__(self,
         assumes eager mode (throws an error if in graph mode or inside a
         `tf.function` call). If set to `False`, these two methods will not be
         accessible.
-      channel_axis: Integer. For iterable `index_ranges`, determines the
-        position of the channel axis in `indexes`. Defaults to the last
-        dimension.
+      channel_axis: Integer or `None`. Determines the position of the channel
+        axis in `indexes`. Defaults to the last dimension. If set to `None`,
+        the index tensor is expected to have the same shape as the bottleneck
+        tensor (only allowed when `index_ranges` has length 1).
       dtype: `tf.dtypes.DType`. The data type of all floating-point
         computations carried out in this class.
       laplace_tail_mass: Float. If positive, will augment the prior with a
@@ -187,19 +187,24 @@ def __init__(self,
         `compression=True` and not in eager execution mode.
     """
     if coding_rank <= 0:
-      raise ValueError("`coding_rank` must be larger than 0.")
+      raise ValueError("coding_rank must be larger than 0.")
     if not callable(prior_fn):
-      raise TypeError("`prior_fn` must be a class or factory function.")
+      raise TypeError("prior_fn must be a class or factory function.")
     for name, fn in parameter_fns.items():
       if not isinstance(name, str):
-        raise TypeError("`parameter_fns` must have string keys.")
+        raise TypeError("parameter_fns must have string keys.")
       if not callable(fn):
-        raise TypeError("`parameter_fns['{}']` must be callable.".format(name))
-
-    prior = self._make_range_coding_prior(prior_fn, index_ranges, parameter_fns,
-                                          channel_axis, dtype)
+        raise TypeError(f"parameter_fns['{name}'] must be callable.")
+    self._index_ranges = tuple(int(r) for r in index_ranges)
+    if not self.index_ranges:
+      raise ValueError("index_ranges must have at least one element.")
+    self._channel_axis = None if channel_axis is None else int(channel_axis)
+    if self.channel_axis is None and len(self.index_ranges) > 1:
+      raise ValueError("channel_axis can't be None for len(index_ranges) > 1.")
+    self._prior_fn = prior_fn
+    self._parameter_fns = dict(parameter_fns)
     super().__init__(
-        prior=prior,
+        prior=self._make_range_coding_prior(self.index_ranges, dtype),
         coding_rank=coding_rank,
         compression=compression,
         laplace_tail_mass=laplace_tail_mass,
@@ -208,14 +213,6 @@ def __init__(self,
         range_coder_precision=range_coder_precision,
         no_variables=no_variables
     )
-    self._channel_axis = int(channel_axis)
-    self._prior_fn = prior_fn
-    # TODO(relational, jonycgn): Do we need special casing for int index_ranges?
-    try:
-      self._index_ranges = int(index_ranges)
-    except TypeError:
-      self._index_ranges = tuple(int(r) for r in index_ranges)  # pytype:disable=attribute-error
-    self._parameter_fns = dict(parameter_fns)
 
   @property
   def index_ranges(self):
@@ -242,23 +239,23 @@ def _make_prior(self, indexes, dtype=None):
     parameters = {k: f(indexes) for k, f in self.parameter_fns.items()}
     return self.prior_fn(**parameters)
 
-  def _make_range_coding_prior(self, prior_fn, index_ranges, parameter_fns,
-                               channel_axis, dtype):
-    del self  # Method does not depend on instance state.
+  def _make_range_coding_prior(self, index_ranges, dtype):
+    """Instantiates the range coding prior."""
     dtype = tf.as_dtype(dtype)
-    if isinstance(index_ranges, int):
-      indexes = tf.range(index_ranges, dtype=dtype)
+    if self.channel_axis is None:
+      index_range, = index_ranges
+      indexes = tf.range(index_range, dtype=dtype)
     else:
       indexes = [tf.range(r, dtype=dtype) for r in index_ranges]
       indexes = tf.meshgrid(*indexes, indexing="ij")
-      indexes = tf.stack(indexes, axis=channel_axis)
-    parameters = {k: f(indexes) for k, f in parameter_fns.items()}
-    return prior_fn(**parameters)
+      indexes = tf.stack(indexes, axis=self.channel_axis)
+    return self._make_prior(indexes, dtype=dtype)
 
   def _normalize_indexes(self, indexes):
     indexes = math_ops.lower_bound(indexes, 0)
-    if isinstance(self.index_ranges, int):
-      bounds = self.index_ranges - 1
+    if self.channel_axis is None:
+      index_range, = self.index_ranges
+      bounds = index_range - 1
     else:
       axes = [1] * indexes.shape.rank
       axes[self.channel_axis] = len(self.index_ranges)
@@ -268,7 +265,7 @@ def _normalize_indexes(self, indexes):
 
   def _flatten_indexes(self, indexes):
     indexes = tf.cast(indexes, tf.int32)
-    if isinstance(self.index_ranges, int):
+    if self.channel_axis is None:
       return indexes
     else:
       strides = tf.math.cumprod(self.index_ranges, exclusive=True, reverse=True)
@@ -509,13 +506,14 @@ def __init__(self, prior_fn, num_scales, scale_fn, coding_rank,
     num_scales = int(num_scales)
     super().__init__(
         prior_fn=prior_fn,
-        index_ranges=num_scales,
+        index_ranges=(num_scales,),
         parameter_fns=dict(
             loc=lambda _: 0.,
             scale=scale_fn,
         ),
         coding_rank=coding_rank,
         compression=compression,
+        channel_axis=None,
         dtype=dtype,
         tail_mass=tail_mass,
         range_coder_precision=range_coder_precision,
diff --git a/tensorflow_compression/python/entropy_models/continuous_indexed_test.py b/tensorflow_compression/python/entropy_models/continuous_indexed_test.py
@@ -26,9 +26,9 @@ class ContinuousIndexedEntropyModelTest(tf.test.TestCase):
 
   def test_can_instantiate_one_dimensional(self):
     em = continuous_indexed.ContinuousIndexedEntropyModel(
-        uniform_noise.NoisyNormal, 64,
+        uniform_noise.NoisyNormal, (64,),
         dict(loc=lambda _: 0, scale=lambda i: tf.exp(i / 8 - 5)), 1,
-        compression=True)
+        compression=True, channel_axis=None)
     self.assertIsInstance(em.prior, uniform_noise.NoisyNormal)
     self.assertEqual(em.coding_rank, 1)
     self.assertEqual(em.tail_mass, 2**-8)
diff --git a/tensorflow_compression/python/entropy_models/universal.py b/tensorflow_compression/python/entropy_models/universal.py
@@ -65,7 +65,7 @@ class UniversalBatchedEntropyModel(
     continuous_batched.ContinuousBatchedEntropyModel):
   """Batched entropy model model which implements Universal Quantization.
 
-  In contrast to the base class, which uses roundinig for quantization, here
+  In contrast to the base class, which uses rounding for quantization, here
   "quantization" is performed additive uniform noise, which is implemented with
   Universal Quantization.
 
@@ -232,7 +232,7 @@ class UniversalIndexedEntropyModel(
     continuous_indexed.ContinuousIndexedEntropyModel):
   """Indexed entropy model model which implements Universal Quantization.
 
-  In contrast to the base class, which uses roundinig for quantization, here
+  In contrast to the base class, which uses rounding for quantization, here
   "quantization" is performed additive uniform noise, which is implemented with
   Universal Quantization.
 
@@ -268,10 +268,9 @@ def __init__(self,
         since this is the marginal distribution for bottleneck dimensions that
         are constant. The callable will receive keyword arguments as determined
         by `parameter_fns`.
-      index_ranges: Iterable of integers. If (non-empty), compared to
-        `bottleneck`, `indexes` in __call__() must have an additional dimension
-        at position `channel_axis`, and the values of the `n`th channel must be
-        in the range `[0, index_ranges[n])`.
+      index_ranges: Iterable of integers. Compared to `bottleneck`, `indexes`
+        in `__call__()` must have an additional trailing dimension, and the
+        values of the `k`th channel must be in the range `[0, index_ranges[k])`.
       parameter_fns: Dict of strings to callables. Functions mapping `indexes`
         to each distribution parameter. For each item, `indexes` is passed to
         the callable, and the string key and return value make up one keyword
@@ -302,10 +301,6 @@ def __init__(self,
       RuntimeError: when attempting to instantiate an entropy model with
         `compression=True` and not in eager execution mode.
     """
-    if isinstance(index_ranges, int):
-      raise ValueError(
-          "An iterable of integers is only supported for `index_ranges`.")
-
     # Add extra indexes for noise levels.
     index_ranges_with_offsets = tuple([num_noise_levels] +
                                       [int(r) for r in index_ranges])
@@ -342,7 +337,7 @@ def index_ranges_without_offsets(self):
     return _index_ranges_without_offsets(self.index_ranges)
 
   def _normalize_indexes(self, indexes):
-    """See base  class."""
+    """See base class."""
     num_indexes = indexes.shape[-1]  # Last dim of `indexes` should be static.
     if num_indexes == len(self.index_ranges):
       # Indexes have offsets.
@@ -364,20 +359,10 @@ def _offset_from_indexes(self, indexes_with_offsets):
         offset_indexes, self._num_noise_levels, dtype=self.dtype)
     return offset
 
-  def _make_range_coding_prior(self, prior_fn, index_ranges_with_offsets,
-                               parameter_fns, channel_axis, dtype):
-    """Computes the range coding prior."""
-    del self  # Method does not depend on instance state.
-    dtype = tf.as_dtype(dtype)
-    index_ranges_without_offsets = _index_ranges_without_offsets(
-        index_ranges_with_offsets)
-    indexes = [
-        tf.range(r, dtype=dtype) for r in index_ranges_without_offsets
-    ]
-    indexes = tf.meshgrid(*indexes, indexing="ij")
-    indexes = tf.stack(indexes, axis=channel_axis)
-    parameters = {k: f(indexes) for k, f in parameter_fns.items()}
-    return prior_fn(**parameters)
+  def _make_range_coding_prior(self, index_ranges, dtype):
+    """Instantiates the range coding prior."""
+    return super()._make_range_coding_prior(
+        _index_ranges_without_offsets(index_ranges), dtype)
 
   def _offset_from_prior(self, prior):
     return _range_coding_offsets(self._num_noise_levels, self.prior_shape,
diff --git a/tensorflow_compression/python/entropy_models/universal_test.py b/tensorflow_compression/python/entropy_models/universal_test.py
@@ -149,15 +149,6 @@ def setUp(self):
     super().setUp()
     tf.random.set_seed(1234)
 
-  def test_cannot_instantiate_one_dimensional(self):
-    with self.assertRaises(ValueError):
-      universal.UniversalIndexedEntropyModel(
-          uniform_noise.NoisyNormal,
-          coding_rank=1,
-          index_ranges=64,
-          parameter_fns=dict(
-              loc=lambda _: 0, scale=lambda i: tf.exp(i / 8 - 5)))
-
   def test_can_instantiate_n_dimensional(self):
     em = universal.UniversalIndexedEntropyModel(
         uniform_noise.NoisyLogisticMixture,