Modify gen_linear_operators to properly map broadcast_dynamic_shape.

srvasude · tensorflower-gardener · commit b0d85b130799 · 2022-08-03T15:22:49.000-07:00
- Add `LinearOperatorPermutation`.

PiperOrigin-RevId: 465162410
diff --git a/tensorflow_probability/python/internal/backend/jax/BUILD b/tensorflow_probability/python/internal/backend/jax/BUILD
@@ -91,6 +91,7 @@ GEN_FILENAMES = [
     "gen/linear_operator_kronecker",
     "gen/linear_operator_lower_triangular",
     "gen/linear_operator_low_rank_update",
+    "gen/linear_operator_permutation",
     "gen/linear_operator",
     "gen/linear_operator_toeplitz",
     "gen/linear_operator_util",
diff --git a/tensorflow_probability/python/internal/backend/meta/gen_linear_operators.py b/tensorflow_probability/python/internal/backend/meta/gen_linear_operators.py
@@ -45,6 +45,7 @@
     'ops import linalg_ops': 'linalg_impl as linalg_ops',
     'ops import math_ops': 'numpy_math as math_ops',
     'ops import nn': 'nn',
+    'ops import sort_ops': 'misc as sort_ops',
     'ops import variables as variables_module': 'ops as variables_module',
     'ops.linalg import linalg_impl as linalg': 'linalg_impl as linalg'
 }
@@ -185,6 +186,8 @@ def gen_module(module_name):
 
   code = code.replace('array_ops.shape', 'prefer_static.shape')
   code = code.replace('array_ops.concat', 'prefer_static.concat')
+  code = code.replace('array_ops.broadcast_dynamic_shape',
+                      '_ops.broadcast_dynamic_shape')
   code = code.replace('array_ops.broadcast_static_shape',
                       '_ops.broadcast_static_shape')
   code = code.replace('array_ops.broadcast_to', '_ops.broadcast_to')
diff --git a/tensorflow_probability/python/internal/backend/numpy/BUILD b/tensorflow_probability/python/internal/backend/numpy/BUILD
@@ -548,6 +548,7 @@ LINOP_FILES = [
     "linear_operator_kronecker",
     "linear_operator_lower_triangular",
     "linear_operator_low_rank_update",
+    "linear_operator_permutation",
     "linear_operator",
     "linear_operator_toeplitz",
     "linear_operator_util",
diff --git a/tensorflow_probability/python/internal/backend/numpy/gen/linear_operator_kronecker.py b/tensorflow_probability/python/internal/backend/numpy/gen/linear_operator_kronecker.py
@@ -292,7 +292,7 @@ def _shape_tensor(self):
     # broadcast_shape checks for compatibility.
     batch_shape = self.operators[0].batch_shape_tensor()
     for operator in self.operators[1:]:
-      batch_shape = array_ops.broadcast_dynamic_shape(
+      batch_shape = _ops.broadcast_dynamic_shape(
           batch_shape, operator.batch_shape_tensor())
 
     return prefer_static.concat((batch_shape, matrix_shape), 0)
diff --git a/tensorflow_probability/python/internal/backend/numpy/gen/linear_operator_low_rank_update.py b/tensorflow_probability/python/internal/backend/numpy/gen/linear_operator_low_rank_update.py
@@ -370,13 +370,13 @@ def _shape(self):
     return batch_shape.concatenate(tensor_shape.TensorShape(self.base_operator.shape)[-2:])
 
   def _shape_tensor(self):
-    batch_shape = array_ops.broadcast_dynamic_shape(
+    batch_shape = _ops.broadcast_dynamic_shape(
         self.base_operator.batch_shape_tensor(),
         self.diag_operator.batch_shape_tensor())
-    batch_shape = array_ops.broadcast_dynamic_shape(
+    batch_shape = _ops.broadcast_dynamic_shape(
         batch_shape,
         prefer_static.shape(self.u)[:-2])
-    batch_shape = array_ops.broadcast_dynamic_shape(
+    batch_shape = _ops.broadcast_dynamic_shape(
         batch_shape,
         prefer_static.shape(self.v)[:-2])
     return prefer_static.concat(
diff --git a/tensorflow_probability/python/internal/backend/numpy/gen/linear_operator_permutation.py b/tensorflow_probability/python/internal/backend/numpy/gen/linear_operator_permutation.py
@@ -0,0 +1,306 @@
+# Copyright 2020 The TensorFlow Probability Authors. All Rights Reserved.
+# @@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@
+# THIS FILE IS AUTO-GENERATED BY `gen_linear_operators.py`.
+# DO NOT MODIFY DIRECTLY.
+# @@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@
+# pylint: disable=g-import-not-at-top
+# pylint: disable=g-direct-tensorflow-import
+# pylint: disable=g-bad-import-order
+# pylint: disable=unused-import
+# pylint: disable=line-too-long
+# pylint: disable=reimported
+# pylint: disable=g-bool-id-comparison
+# pylint: disable=g-statement-before-imports
+# pylint: disable=bad-continuation
+# pylint: disable=useless-import-alias
+# pylint: disable=property-with-parameters
+# pylint: disable=trailing-whitespace
+# pylint: disable=g-inconsistent-quotes
+
+# Copyright 2019 The TensorFlow Authors. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# ==============================================================================
+"""`LinearOperator` acting like a permutation matrix."""
+
+import numpy as np
+
+from tensorflow_probability.python.internal.backend.numpy import dtype as dtypes
+from tensorflow_probability.python.internal.backend.numpy import ops
+from tensorflow_probability.python.internal.backend.numpy import ops
+from tensorflow_probability.python.internal.backend.numpy import numpy_array as array_ops
+from tensorflow_probability.python.internal.backend.numpy import control_flow as control_flow_ops
+from tensorflow_probability.python.internal.backend.numpy import numpy_math as math_ops
+from tensorflow_probability.python.internal.backend.numpy import misc as sort_ops
+from tensorflow_probability.python.internal.backend.numpy import linalg_impl as linalg
+from tensorflow_probability.python.internal.backend.numpy.gen import linear_operator
+from tensorflow_probability.python.internal.backend.numpy.gen import linear_operator_util
+# from tensorflow.python.util.tf_export import tf_export
+
+__all__ = ["LinearOperatorPermutation",]
+
+
+# @tf_export("linalg.LinearOperatorPermutation")
+# @linear_operator.make_composite_tensor
+class LinearOperatorPermutation(linear_operator.LinearOperator):
+  """`LinearOperator` acting like a [batch] of permutation matrices.
+
+  This operator acts like a [batch] of permutations with shape
+  `[B1,...,Bb, N, N]` for some `b >= 0`.  The first `b` indices index a
+  batch member.  For every batch index `(i1,...,ib)`, `A[i1,...,ib, : :]` is
+  an `N x N` matrix.  This matrix `A` is not materialized, but for
+  purposes of broadcasting this shape will be relevant.
+
+  `LinearOperatorPermutation` is initialized with a (batch) vector.
+
+  A permutation is defined by an integer vector `v` whose values are unique
+  and are in the range `[0, ..., N-1]`. Applying the permutation to an input
+  matrix has the following meaning: the value of `v` at index `i`
+  says to move the `v[i]`-th row of the input matrix to the `i`-th row.
+  Because all values are unique, this will result in a permutation of the
+  rows of the input matrix. Note that the permutation vector `v` has the same
+  semantics as the `perm` argument of `tf.transpose`.
+
+  ```python
+  # Create a 3 x 3 permutation matrix that swaps the last two columns.
+  vec = [0, 2, 1]
+  operator = LinearOperatorPermutation(vec)
+
+  operator.to_dense()
+  ==> [[1., 0., 0.]
+       [0., 0., 1.]
+       [0., 1., 0.]]
+
+  tensor_shape.TensorShape(operator.shape)
+  ==> [3, 3]
+
+  # This will be zero.
+  operator.log_abs_determinant()
+  ==> scalar Tensor
+
+  x = ... Shape [3, 4] Tensor
+  operator.matmul(x)
+  ==> Shape [3, 4] Tensor
+  ```
+
+  #### Shape compatibility
+
+  This operator acts on [batch] matrix with compatible shape.
+  `x` is a batch matrix with compatible shape for `matmul` and `solve` if
+
+  ```
+  tensor_shape.TensorShape(operator.shape) = [B1,...,Bb] + [N, N],  with b >= 0
+  tensor_shape.TensorShape(x.shape) =   [C1,...,Cc] + [N, R],
+  and [C1,...,Cc] broadcasts with [B1,...,Bb] to [D1,...,Dd]
+  ```
+
+  #### Matrix property hints
+
+  This `LinearOperator` is initialized with boolean flags of the form `is_X`,
+  for `X = non_singular, self_adjoint, positive_definite, square`.
+  These have the following meaning:
+
+  * If `is_X == True`, callers should expect the operator to have the
+    property `X`.  This is a promise that should be fulfilled, but is *not* a
+    runtime assert.  For example, finite floating point precision may result
+    in these promises being violated.
+  * If `is_X == False`, callers should expect the operator to not have `X`.
+  * If `is_X == None` (the default), callers should have no expectation either
+    way.
+  """
+
+  def __init__(self,
+               perm,
+               dtype=dtypes.float32,
+               is_non_singular=None,
+               is_self_adjoint=None,
+               is_positive_definite=None,
+               is_square=None,
+               name="LinearOperatorPermutation"):
+    r"""Initialize a `LinearOperatorPermutation`.
+
+    Args:
+      perm:  Shape `[B1,...,Bb, N]` Integer `Tensor` with `b >= 0` and
+        `N >= 0`. An integer vector that represents the permutation to apply.
+        Note that this argument is the same as `perm` in `tf.transpose`, but
+        this permutation is applied to the rows, while the permutation in
+        `tf.transpose` is applied to the dimensions of the `Tensor`. `perm`
+        is required to have unique entries from `{0, 1, ... N-1}`.
+      dtype: The `dtype` of arguments to this operator. Default: `float32`.
+        Allowed dtypes: `float16`, `float32`, `float64`, `complex64`,
+        `complex128`.
+      is_non_singular:  Expect that this operator is non-singular.
+      is_self_adjoint:  Expect that this operator is equal to its hermitian
+        transpose.  This hint is forwarded to the base class unchanged.
+      is_positive_definite:  Expect that this operator is positive definite,
+        meaning the quadratic form `x^H A x` has positive real part for all
+        nonzero `x`.  Note that we do not require the operator to be
+        self-adjoint to be positive-definite.  See:
+        https://en.wikipedia.org/wiki/Positive-definite_matrix#Extension_for_non-symmetric_matrices
+        This hint is forwarded to the base class unchanged.
+      is_square:  Expect that this operator acts like square [batch] matrices.
+        This is autoset to true.
+      name: A name for this `LinearOperator`.
+
+    Raises:
+      ValueError:  `is_non_singular` or `is_square` is `False`, or `perm`
+        fails the static rank/permutation checks (`TypeError` if non-integer).
+    """
+    parameters = dict(
+        perm=perm,
+        dtype=dtype,
+        is_non_singular=is_non_singular,
+        is_self_adjoint=is_self_adjoint,
+        is_positive_definite=is_positive_definite,
+        is_square=is_square,
+        name=name
+    )
+
+    with ops.name_scope(name, values=[perm]):
+      self._perm = linear_operator_util.convert_nonref_to_tensor(
+          perm, name="perm")
+      self._check_perm(self._perm)
+
+      # Check and auto-set hints.
+      if is_non_singular is False:  # pylint:disable=g-bool-id-comparison
+        raise ValueError(f"A Permutation operator is always non-singular. "
+                         f"Expected argument `is_non_singular` to be True. "
+                         f"Received: {is_non_singular}.")
+
+      if is_square is False:  # pylint:disable=g-bool-id-comparison
+        raise ValueError(f"A Permutation operator is always square. "
+                         f"Expected argument `is_square` to be True. "
+                         f"Received: {is_square}.")
+      is_square = True
+
+      super(LinearOperatorPermutation, self).__init__(
+          dtype=dtype,
+          is_non_singular=is_non_singular,
+          is_self_adjoint=is_self_adjoint,
+          is_positive_definite=is_positive_definite,
+          is_square=is_square,
+          parameters=parameters,
+          name=name)
+
+  def _check_perm(self, perm):
+    """Static check of perm."""
+    if (tensor_shape.TensorShape(perm.shape).ndims is not None and tensor_shape.TensorShape(perm.shape).ndims < 1):
+      raise ValueError(f"Argument `perm` must have at least 1 dimension. "
+                       f"Received: {perm}.")
+    if not np.issubdtype(perm.dtype, np.integer):
+      raise TypeError(f"Argument `perm` must be integer dtype. "
+                      f"Received: {perm}.")
+    # Check that the permutation satisfies the uniqueness constraint.
+    static_perm = ops.get_static_value(perm)
+    if static_perm is not None:
+      sorted_perm = np.sort(static_perm, axis=-1)
+      if np.any(sorted_perm != np.arange(0, tensor_shape.TensorShape(static_perm.shape)[-1])):
+        raise ValueError(
+            f"Argument `perm` must be a vector of unique integers from "
+            f"0 to {tensor_shape.TensorShape(static_perm.shape)[-1] - 1}.")
+
+  def _shape(self):
+    perm_shape = tensor_shape.TensorShape(self._perm.shape)
+    return perm_shape.concatenate(perm_shape[-1:])
+
+  def _shape_tensor(self):
+    perm_shape = prefer_static.shape(self._perm)
+    k = perm_shape[-1]
+    return prefer_static.concat((perm_shape, [k]), 0)
+
+  def _assert_non_singular(self):
+    return control_flow_ops.no_op("assert_non_singular")
+
+  def _domain_dimension_tensor(self, perm=None):
+    perm = perm if perm is not None else self.perm
+    return prefer_static.shape(perm)[-1]
+
+  def _matmul(self, x, adjoint=False, adjoint_arg=False):
+    perm = ops.convert_to_tensor(self.perm)
+    if adjoint and not self.is_self_adjoint:
+      # TODO(srvasude): invert_permutation doesn't work on batches so we use
+      # argsort.
+      perm = sort_ops.argsort(perm, axis=-1)
+    x = linalg.adjoint(x) if adjoint_arg else x
+
+    # We need to broadcast x and the permutation since tf.gather doesn't
+    # broadcast.
+    broadcast_shape = _ops.broadcast_dynamic_shape(
+        prefer_static.shape(x)[:-1], prefer_static.shape(perm))
+    k = prefer_static.shape(x)[-1]
+    broadcast_x_shape = prefer_static.concat([broadcast_shape, [k]], axis=-1)
+    x = _ops.broadcast_to(x, broadcast_x_shape)
+    perm = _ops.broadcast_to(perm, broadcast_shape)
+
+    m = prefer_static.shape(x)[-2]
+    x = array_ops.reshape(x, [-1, m, k])
+    perm = array_ops.reshape(perm, [-1, m])
+
+    y = array_ops.gather(x, perm, axis=-2, batch_dims=1)
+    return array_ops.reshape(y, broadcast_x_shape)
+
+  # TODO(srvasude): Permutation parity is equivalent to the determinant.
+
+  def _log_abs_determinant(self):
+    # Permutation matrices have determinant +/- 1.
+    return array_ops.zeros(shape=self.batch_shape_tensor(), dtype=self.dtype)
+
+  def _solve(self, rhs, adjoint=False, adjoint_arg=False):
+    # The inverse of a permutation matrix is the transpose matrix.
+    # Apply a matmul and flip the adjoint bit.
+    return self._matmul(rhs, adjoint=(not adjoint), adjoint_arg=adjoint_arg)
+
+  def _to_dense(self):
+    perm = ops.convert_to_tensor(self.perm)
+    return _ops.cast(math_ops.equal(
+        array_ops.range(0, self._domain_dimension_tensor(perm)),
+        perm[..., _ops.newaxis]), self.dtype)
+
+  def _diag_part(self):
+    perm = ops.convert_to_tensor(self.perm)
+    return _ops.cast(math_ops.equal(
+        array_ops.range(0, self._domain_dimension_tensor(perm)),
+        perm), self.dtype)
+
+  def _cond(self):
+    # Permutation matrices are orthogonal, so they have condition number 1.
+    return array_ops.ones(self.batch_shape_tensor(), dtype=self.dtype)
+
+  @property
+  def perm(self):
+    return self._perm
+
+  @property
+  def _composite_tensor_fields(self):
+    return ("perm", "dtype")
+
+  @property
+  def _experimental_parameter_ndims_to_matrix_ndims(self):
+    return {"perm": 1}
+
+import numpy as np
+from tensorflow_probability.python.internal.backend.numpy import linalg_impl as _linalg
+from tensorflow_probability.python.internal.backend.numpy import ops as _ops
+from tensorflow_probability.python.internal.backend.numpy.gen import tensor_shape
+
+from tensorflow_probability.python.internal.backend.numpy import private
+distribution_util = private.LazyLoader(
+    "distribution_util", globals(),
+    "tensorflow_probability.substrates.numpy.internal.distribution_util")
+tensorshape_util = private.LazyLoader(
+    "tensorshape_util", globals(),
+    "tensorflow_probability.substrates.numpy.internal.tensorshape_util")
+prefer_static = private.LazyLoader(
+    "prefer_static", globals(),
+    "tensorflow_probability.substrates.numpy.internal.prefer_static")
+
diff --git a/tensorflow_probability/python/internal/backend/numpy/gen/linear_operator_toeplitz.py b/tensorflow_probability/python/internal/backend/numpy/gen/linear_operator_toeplitz.py
@@ -204,7 +204,7 @@ def _shape(self):
   def _shape_tensor(self, row=None, col=None):
     row = self.row if row is None else row
     col = self.col if col is None else col
-    v_shape = array_ops.broadcast_dynamic_shape(
+    v_shape = _ops.broadcast_dynamic_shape(
         prefer_static.shape(row),
         prefer_static.shape(col))
     k = v_shape[-1]
@@ -262,7 +262,7 @@ def _diag_part(self):
   def _to_dense(self):
     row = ops.convert_to_tensor(self.row)
     col = ops.convert_to_tensor(self.col)
-    total_shape = array_ops.broadcast_dynamic_shape(
+    total_shape = _ops.broadcast_dynamic_shape(
         prefer_static.shape(row), prefer_static.shape(col))
     n = prefer_static.shape(row)[-1]
     row = _ops.broadcast_to(row, total_shape)
diff --git a/tensorflow_probability/python/internal/backend/numpy/gen/linear_operator_util.py b/tensorflow_probability/python/internal/backend/numpy/gen/linear_operator_util.py
@@ -367,7 +367,7 @@ def broadcast_matrix_batch_dims(batch_matrices, name=None):
     # Since static didn't work, do dynamic, which always copies data.
     bcast_batch_shape = prefer_static.shape(batch_matrices[0])[:-2]
     for mat in batch_matrices[1:]:
-      bcast_batch_shape = array_ops.broadcast_dynamic_shape(
+      bcast_batch_shape = _ops.broadcast_dynamic_shape(
           bcast_batch_shape,
           prefer_static.shape(mat)[:-2])
     for i, mat in enumerate(batch_matrices):
diff --git a/tensorflow_probability/python/internal/backend/numpy/gen/slicing.py b/tensorflow_probability/python/internal/backend/numpy/gen/slicing.py
diff --git a/tensorflow_probability/python/internal/backend/numpy/linalg.py b/tensorflow_probability/python/internal/backend/numpy/linalg.py
diff --git a/tensorflow_probability/python/internal/backend/numpy/numpy_test.py b/tensorflow_probability/python/internal/backend/numpy/numpy_test.py