
Commit ede69e0

davmre authored and tensorflower-gardener committed
Remove JD overrides of Distribution public methods for event and batch shape.
These are no longer needed since `Distribution` now supports structured shape. Using the public methods lets us benefit from static optimizations; e.g., `batch_shape_tensor` won't run if `batch_shape` is fully defined. This also removes the `sample_shape` argument to `event_shape_tensor` and `batch_shape_tensor`. This could theoretically be a breaking change, but we are proceeding without a deprecation cycle because passing a nontrivial sample shape was *already* broken (and has been since at least Jan 2020).

PiperOrigin-RevId: 380024311
1 parent 2d08c76 commit ede69e0
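
For context, here is a minimal sketch of the template-method dispatch the commit message refers to. This is illustrative only, not TFP's actual `Distribution` code: the public method consults the static shape first and falls back to the private `_batch_shape_tensor` hook only when the static shape is not fully defined, which is why overriding just the private hooks (as this commit does) inherits the fast path.

import tensorflow as tf

class SketchDistribution:
  """Illustrative stand-in for the `tfp.distributions.Distribution` pattern."""

  @property
  def batch_shape(self):
    return tf.TensorShape(self._batch_shape())  # Static subclass hook.

  def batch_shape_tensor(self):
    # Static fast path: if the shape is fully known, the dynamic hook never runs.
    if self.batch_shape.is_fully_defined():
      return tf.constant(self.batch_shape.as_list(), dtype=tf.int32)
    return self._batch_shape_tensor()  # Dynamic subclass hook.

class SketchVector(SketchDistribution):
  def _batch_shape(self):
    return [3]  # Fully defined, so batch_shape_tensor builds no graph op.

  def _batch_shape_tensor(self):
    return tf.shape(tf.zeros([3]))  # Only reached if the static shape were unknown.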

File tree

3 files changed: 37 additions & 103 deletions

tensorflow_probability/python/distributions/BUILD

Lines changed: 1 addition & 1 deletion
@@ -3075,7 +3075,7 @@ multi_substrate_py_test(
     name = "joint_distribution_coroutine_test",
     size = "medium",
     srcs = ["joint_distribution_coroutine_test.py"],
-    shard_count = 2,
+    shard_count = 5,
     deps = [
         # numpy dep,
         # tensorflow dep,

tensorflow_probability/python/distributions/joint_distribution.py

Lines changed: 19 additions & 75 deletions
@@ -35,7 +35,7 @@
 from tensorflow_probability.python.internal import distribution_util
 from tensorflow_probability.python.internal import docstring_util
 from tensorflow_probability.python.internal import nest_util
-from tensorflow_probability.python.internal import prefer_static
+from tensorflow_probability.python.internal import prefer_static as ps
 from tensorflow_probability.python.internal import samplers
 from tensorflow_probability.python.util.seed_stream import SeedStream
 from tensorflow_probability.python.util.seed_stream import TENSOR_SEED_MSG_PREFIX

@@ -315,56 +315,15 @@ def experimental_shard_axis_names(self):
   def use_vectorized_map(self):
     return False

-  @property
-  def batch_shape(self):
-    """Shape of a single sample from a single event index as a `TensorShape`.
-
-    May be partially defined or unknown.
-
-    The batch dimensions are indexes into independent, non-identical
-    parameterizations of this distribution.
-
-    Returns:
-      batch_shape: `tuple` of `TensorShape`s representing the `batch_shape` for
-        each distribution in `model`.
-    """
+  def _batch_shape(self):
     return self._model_unflatten([
         d.batch_shape for d in self._get_single_sample_distributions()])

-  def batch_shape_tensor(self, sample_shape=(), name='batch_shape_tensor'):
-    """Shape of a single sample from a single event index as a 1-D `Tensor`.
-
-    The batch dimensions are indexes into independent, non-identical
-    parameterizations of this distribution.
-
-    Args:
-      sample_shape: The sample shape under which to evaluate the joint
-        distribution. Sample shape at root (toplevel) nodes may affect the batch
-        or event shapes of child nodes.
-      name: name to give to the op
-
-    Returns:
-      batch_shape: `Tensor` representing batch shape of each distribution in
-        `model`.
-    """
-    with self._name_and_control_scope(name):
-      return self._model_unflatten(
-          self._map_attr_over_dists(
-              'batch_shape_tensor',
-              dists=(self.sample_distributions(sample_shape)
-                     if sample_shape else None)))
-
-  @property
-  def event_shape(self):
-    """Shape of a single sample from a single batch as a `TensorShape`.
+  def _batch_shape_tensor(self):
+    return self._model_unflatten(
+        self._map_attr_over_dists('batch_shape_tensor'))

-    May be partially defined or unknown.
-
-    Returns:
-      event_shape: `tuple` of `TensorShape`s representing the `event_shape` for
-        each distribution in `model`.
-    """
-    # Caching will not leak graph Tensors since this is a static attribute.
+  def _event_shape(self):
     if not hasattr(self, '_cached_event_shape'):
       self._cached_event_shape = [
           d.event_shape

@@ -373,24 +332,9 @@ def event_shape(self):
     # wrapping the returned value.
     return self._model_unflatten(self._cached_event_shape)

-  def event_shape_tensor(self, sample_shape=(), name='event_shape_tensor'):
-    """Shape of a single sample from a single batch as a 1-D int32 `Tensor`.
-
-    Args:
-      sample_shape: The sample shape under which to evaluate the joint
-        distribution. Sample shape at root (toplevel) nodes may affect the batch
-        or event shapes of child nodes.
-      name: name to give to the op
-    Returns:
-      event_shape: `tuple` of `Tensor`s representing the `event_shape` for each
-        distribution in `model`.
-    """
-    with self._name_and_control_scope(name):
-      return self._model_unflatten(
-          self._map_attr_over_dists(
-              'event_shape_tensor',
-              dists=(self.sample_distributions(sample_shape)
-                     if sample_shape else None)))
+  def _event_shape_tensor(self):
+    return self._model_unflatten(
+        self._map_attr_over_dists('event_shape_tensor'))

   def sample_distributions(self, sample_shape=(), seed=None, value=None,
                            name='sample_distributions', **kwargs):

@@ -847,9 +791,9 @@ def _assert_compatible_shape(self, index, sample_shape, samples):
     requested_shape, _ = self._expand_sample_shape_to_vector(
         tf.convert_to_tensor(sample_shape, dtype=tf.int32),
         name='requested_shape')
-    actual_shape = prefer_static.shape(samples)
-    actual_rank = prefer_static.rank_from_shape(actual_shape)
-    requested_rank = prefer_static.rank_from_shape(requested_shape)
+    actual_shape = ps.shape(samples)
+    actual_rank = ps.rank_from_shape(actual_shape)
+    requested_rank = ps.rank_from_shape(requested_shape)

     # We test for two properties we expect of yielded distributions:
     # (1) The rank of the tensor of generated samples must be at least

@@ -1068,8 +1012,8 @@ def maybe_check_wont_broadcast(flat_xs, validate_args):
     # Only when `validate_args` is `True` do we enforce the validation.
     return flat_xs
   msg = 'Broadcasting probably indicates an error in model specification.'
-  s = tuple(prefer_static.shape(x) for x in flat_xs)
-  if all(prefer_static.is_numpy(s_) for s_ in s):
+  s = tuple(ps.shape(x) for x in flat_xs)
+  if all(ps.is_numpy(s_) for s_ in s):
     if not all(np.all(a == b) for a, b in zip(s[1:], s[:-1])):
       raise ValueError(msg)
   return flat_xs

@@ -1092,7 +1036,7 @@ def __init__(self, jd, parameters=None, bijector_fn=None):
     bijectors = tuple(bijector_fn(d)
                       for d in jd._get_single_sample_distributions())
     i_min_event_ndims = tf.nest.map_structure(
-        prefer_static.size, jd.event_shape)
+        ps.size, jd.event_shape)
     f_min_event_ndims = jd._model_unflatten([
         b.inverse_event_ndims(nd) for b, nd in
         zip(bijectors, jd._model_flatten(i_min_event_ndims))])

@@ -1207,9 +1151,9 @@ def _jd_log_prob_ratio(p, x, q, y, name=None):
   """Implements `log_prob_ratio` for tfd.JointDistribution*."""
   with tf.name_scope(name or 'jd_log_prob_ratio'):
     tf.nest.assert_same_structure(x, y)
-    ps, _ = p.sample_distributions(value=x, seed=samplers.zeros_seed())
-    qs, _ = q.sample_distributions(value=y, seed=samplers.zeros_seed())
-    tf.nest.assert_same_structure(ps, qs)
+    p_dists, _ = p.sample_distributions(value=x, seed=samplers.zeros_seed())
+    q_dists, _ = q.sample_distributions(value=y, seed=samplers.zeros_seed())
+    tf.nest.assert_same_structure(p_dists, q_dists)
     log_prob_ratio_parts = nest.map_structure_up_to(
-        ps, log_prob_ratio.log_prob_ratio, ps, x, qs, y)
+        p_dists, log_prob_ratio.log_prob_ratio, p_dists, x, q_dists, y)
     return tf.add_n(tf.nest.flatten(log_prob_ratio_parts))
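
Two incidental points about the hunks above: the public `batch_shape` / `event_shape` overrides become the private `_batch_shape` / `_event_shape` hooks with their docstrings dropped (the inherited public methods carry the documentation), and the `ps`/`qs` locals in `_jd_log_prob_ratio` are renamed to `p_dists`/`q_dists` so they no longer shadow the new `prefer_static as ps` import alias. A hypothetical usage sketch of the resulting public API (the two-variable model below is invented for illustration):

import tensorflow_probability as tfp
tfd = tfp.distributions

jd = tfd.JointDistributionSequential([
    tfd.Normal(loc=0., scale=1.),           # z
    lambda z: tfd.Normal(loc=z, scale=1.),  # x given z
])
jd.event_shape           # Structured static shape, one entry per component.
jd.batch_shape_tensor()  # Inherited from Distribution; the `sample_shape`
                         # argument no longer exists.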

tensorflow_probability/python/distributions/joint_distribution_sample_path_mixin.py

Lines changed: 17 additions & 27 deletions
@@ -77,52 +77,42 @@ def __init__(self, *args, **kwargs):
   def batch_ndims(self):
     return self._batch_ndims

-  @property
   def _batch_shape_parts(self):
     return [d.batch_shape[:self.batch_ndims]
             for d in self._get_single_sample_distributions()]

-  @property
-  def batch_shape(self):
+  def _batch_shape(self):
     # Caching will not leak graph Tensors since this is a static attribute.
-    if not hasattr(self, '_cached_batch_shape'):
-      reduce_fn = ((lambda a, b: a.merge_with(b)) if self.validate_args
-                   else tf.broadcast_static_shape)  # Allows broadcasting.
-      self._cached_batch_shape = functools.reduce(
-          reduce_fn, self._batch_shape_parts)
-    return self._cached_batch_shape
+    reduce_fn = ((lambda a, b: a.merge_with(b)) if self.validate_args
+                 else tf.broadcast_static_shape)  # Allows broadcasting.
+    return functools.reduce(reduce_fn, self._batch_shape_parts())

   def _batch_shape_tensor_parts(self):
     return [d.batch_shape_tensor()[:self.batch_ndims]
             for d in self._get_single_sample_distributions()]

-  def batch_shape_tensor(self, sample_shape=(), name='batch_shape_tensor'):
-    del sample_shape  # Unused.
-    with self._name_and_control_scope(name):
-      return tf.convert_to_tensor(functools.reduce(
-          prefer_static.broadcast_shape, self._batch_shape_tensor_parts()))
+  def _batch_shape_tensor(self):
+    return tf.convert_to_tensor(functools.reduce(
+        prefer_static.broadcast_shape, self._batch_shape_tensor_parts()))

-  @property
-  def event_shape(self):
+  def _event_shape(self):
     if not hasattr(self, '_cached_event_shape'):
       self._cached_event_shape = list([
           tf.nest.map_structure(  # Recurse over joint component distributions.
              d.batch_shape[self.batch_ndims:].concatenate,
              d.event_shape) for d in self._get_single_sample_distributions()])
     return self._model_unflatten(self._cached_event_shape)

-  def event_shape_tensor(self, sample_shape=(), name='event_shape_tensor'):
+  def _event_shape_tensor(self):
     """Shape of a single sample from a single batch."""
-    del sample_shape  # Unused.
-    with self._name_and_control_scope(name):
-      component_shapes = []
-      for d in self._get_single_sample_distributions():
-        iid_event_shape = d.batch_shape_tensor()[self.batch_ndims:]
-        # Recurse over the (potentially joint) component distribution's event.
-        component_shapes.append(tf.nest.map_structure(
-            lambda a, b=iid_event_shape: prefer_static.concat([b, a], axis=0),
-            d.event_shape_tensor()))
-      return self._model_unflatten(component_shapes)
+    component_shapes = []
+    for d in self._get_single_sample_distributions():
+      iid_event_shape = d.batch_shape_tensor()[self.batch_ndims:]
+      # Recurse over the (potentially joint) component distribution's event.
+      component_shapes.append(tf.nest.map_structure(
+          lambda a, b=iid_event_shape: prefer_static.concat([b, a], axis=0),
+          d.event_shape_tensor()))
+    return self._model_unflatten(component_shapes)

   def _reduce_measure_over_dists(self, xs, reduce_fn):
     num_trailing_batch_dims_treated_as_event = [
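
One detail worth noting in `_batch_shape` above: with `validate_args=True` the component batch shapes are combined with `merge_with`, which demands exact agreement, while the default reducer `tf.broadcast_static_shape` only requires broadcast compatibility. A small standalone illustration (the example shapes are invented):

import functools
import tensorflow as tf

parts = [tf.TensorShape([3, 1]), tf.TensorShape([1, 4])]
functools.reduce(tf.broadcast_static_shape, parts)  # TensorShape([3, 4])
# The strict reducer raises instead: [3, 1] and [1, 4] broadcast but do not
# merge dimension-wise.
# functools.reduce(lambda a, b: a.merge_with(b), parts)  # ValueError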
