freedomtan
diff --git a/‎keras_core/backend/jax/math.py‎
Lines changed: 7 additions & 0 deletions b/‎keras_core/backend/jax/math.py‎
Lines changed: 7 additions & 0 deletions
diff --git a/‎keras_core/backend/tensorflow/math.py‎
Lines changed: 4 additions & 0 deletions b/‎keras_core/backend/tensorflow/math.py‎
Lines changed: 4 additions & 0 deletions
diff --git a/‎keras_core/layers/__init__.py‎
Lines changed: 3 additions & 0 deletions b/‎keras_core/layers/__init__.py‎
Lines changed: 3 additions & 0 deletions
diff --git a/‎keras_core/layers/merging/__init__.py‎ b/‎keras_core/layers/merging/__init__.py‎
diff --git a/‎keras_core/layers/merging/add.py‎
Lines changed: 68 additions & 0 deletions b/‎keras_core/layers/merging/add.py‎
Lines changed: 68 additions & 0 deletions
diff --git a/‎keras_core/layers/merging/base_merge.py‎
Lines changed: 232 additions & 0 deletions b/‎keras_core/layers/merging/base_merge.py‎
Lines changed: 232 additions & 0 deletions
@@ -13,3 +13,10 @@ def top_k(x, k, sorted=True):
             "Jax backend does not support `sorted=False` for `ops.top_k`"
         )
     return jax.lax.top_k(x, k)
+
+
+def in_top_k(targets, predictions, k):
+    topk_indices = top_k(predictions, k)[1]
+    targets = targets[..., None]
+    mask = targets == topk_indices
+    return jax.numpy.any(mask, axis=1)
@@ -10,3 +10,7 @@ def segment_sum(data, segment_ids, num_segments=None, sorted=False):
 
 def top_k(x, k, sorted=True):
     return tf.math.top_k(x, k, sorted=sorted)
+
+
+def in_top_k(targets, predictions, k):
+    return tf.math.in_top_k(targets, predictions, k)
@@ -4,6 +4,8 @@
 from keras_core.layers.core.input_layer import Input
 from keras_core.layers.core.input_layer import InputLayer
 from keras_core.layers.layer import Layer
+from keras_core.layers.merging.add import Add
+from keras_core.layers.merging.add import add
 from keras_core.layers.regularization.activity_regularization import (
     ActivityRegularization,
 )
@@ -13,3 +15,4 @@
 from keras_core.layers.regularization.spatial_dropout import SpatialDropout1D
 from keras_core.layers.regularization.spatial_dropout import SpatialDropout2D
 from keras_core.layers.regularization.spatial_dropout import SpatialDropout3D
+from keras_core.layers.reshaping.reshape import Reshape
@@ -0,0 +1,68 @@
+from keras_core.api_export import keras_core_export
+from keras_core.layers.merging.base_merge import Merge
+
+
+@keras_core_export("keras_core.layers.Add")
+class Add(Merge):
+    """Performs elementwise addition operation.
+
+    It takes as input a list of tensors, all of the same shape,
+    and returns a single tensor (also of the same shape).
+
+    Examples:
+
+    >>> input_shape = (2, 3, 4)
+    >>> x1 = np.random.rand(*input_shape)
+    >>> x2 = np.random.rand(*input_shape)
+    >>> y = keras_core.layers.Add()([x1, x2])
+
+    Usage in a Keras model:
+
+    >>> input1 = keras_core.layers.Input(shape=(16,))
+    >>> x1 = keras_core.layers.Dense(8, activation='relu')(input1)
+    >>> input2 = keras_core.layers.Input(shape=(32,))
+    >>> x2 = keras_core.layers.Dense(8, activation='relu')(input2)
+    >>> # equivalent to `added = keras_core.layers.add([x1, x2])`
+    >>> added = keras_core.layers.Add()([x1, x2])
+    >>> out = keras_core.layers.Dense(4)(added)
+    >>> model = keras_core.models.Model(inputs=[input1, input2], outputs=out)
+
+    """
+
+    def _merge_function(self, inputs):
+        output = inputs[0]
+        for i in range(1, len(inputs)):
+            output += inputs[i]
+        return output
+
+
+@keras_core_export("keras_core.layers.add")
+def add(inputs, **kwargs):
+    """Functional interface to the `keras_core.layers.Add` layer.
+
+    Args:
+        inputs: A list of input tensors with the same shape.
+        **kwargs: Standard layer keyword arguments.
+
+    Returns:
+        A tensor as the sum of the inputs. It has the same shape as the inputs.
+
+    Examples:
+
+    >>> input_shape = (2, 3, 4)
+    >>> x1 = np.random.rand(*input_shape)
+    >>> x2 = np.random.rand(*input_shape)
+    >>> y = keras_core.layers.add([x1, x2])
+
+    Usage in a Keras model:
+
+    >>> input1 = keras_core.layers.Input(shape=(16,))
+    >>> x1 = keras_core.layers.Dense(8, activation='relu')(input1)
+    >>> input2 = keras_core.layers.Input(shape=(32,))
+    >>> x2 = keras_core.layers.Dense(8, activation='relu')(input2)
+    >>> added = keras_core.layers.add([x1, x2])
+    >>> out = keras_core.layers.Dense(4)(added)
+    >>> model = keras_core.models.Model(inputs=[input1, input2], outputs=out)
+
+    """
+    return Add(**kwargs)(inputs)
@@ -0,0 +1,232 @@
+from keras_core import backend
+from keras_core import operations as ops
+from keras_core.layers.layer import Layer
+
+
+class Merge(Layer):
+    """Generic merge layer for elementwise merge functions.
+
+    Used to implement `Sum`, `Average`, etc.
+
+    Args:
+        **kwargs: standard layer keyword arguments.
+    """
+
+    def __init__(self, **kwargs):
+        super().__init__(**kwargs)
+        self.supports_masking = True
+
+    def _merge_function(self, inputs):
+        raise NotImplementedError
+
+    def _compute_elemwise_op_output_shape(self, shape1, shape2):
+        """Computes the shape of the resultant of an elementwise operation.
+
+        Args:
+            shape1: Tuple or None. Shape of the first tensor
+            shape2: Tuple or None. Shape of the second tensor
+
+        Returns:
+            Expected output shape when an element-wise operation is
+            carried out on 2 tensors with shapes shape1 and shape2.
+            tuple or None.
+
+        Raises:
+            ValueError: If shape1 and shape2 are not compatible for
+                element-wise operations.
+        """
+
+        if None in [shape1, shape2]:
+            return None
+        elif len(shape1) < len(shape2):
+            return self._compute_elemwise_op_output_shape(shape2, shape1)
+        elif not shape2:
+            return shape1
+        output_shape = list(shape1[: -len(shape2)])
+        for i, j in zip(shape1[-len(shape2) :], shape2):
+            if i is None or j is None:
+                output_shape.append(None)
+            elif i == 1:
+                output_shape.append(j)
+            elif j == 1:
+                output_shape.append(i)
+            else:
+                if i != j:
+                    raise ValueError(
+                        "Inputs have incompatible shapes. "
+                        f"Received shapes {shape1} and {shape2}"
+                    )
+                output_shape.append(i)
+        return tuple(output_shape)
+
+    def build(self, input_shape):
+        # Used purely for shape validation.
+        if not isinstance(input_shape[0], tuple):
+            raise ValueError(
+                "A merge layer should be called on a list of inputs. "
+                f"Received: input_shape={input_shape} (not a list of shapes)"
+            )
+        if len(input_shape) < 1:
+            raise ValueError(
+                "A merge layer should be called "
+                "on a list of at least 1 input. "
+                f"Received {len(input_shape)} inputs. "
+                f"Full input_shape received: {input_shape}"
+            )
+
+        batch_sizes = {s[0] for s in input_shape if s} - {None}
+        if len(batch_sizes) > 1:
+            raise ValueError(
+                "Cannot merge tensors with different batch sizes. "
+                f"Received tensors with shapes {input_shape}"
+            )
+
+        if input_shape[0] is None:
+            output_shape = None
+        else:
+            output_shape = input_shape[0][1:]
+
+        for i in range(1, len(input_shape)):
+            if input_shape[i] is None:
+                shape = None
+            else:
+                shape = input_shape[i][1:]
+            output_shape = self._compute_elemwise_op_output_shape(
+                output_shape, shape
+            )
+
+        # If the inputs have different ranks, we have to reshape them
+        # to make them broadcastable.
+        if None not in input_shape and len(set(map(len, input_shape))) == 1:
+            self._reshape_required = False
+        else:
+            self._reshape_required = True
+        self.built = True
+
+    def call(self, inputs):
+        if not isinstance(inputs, (list, tuple)):
+            raise ValueError(
+                "A merge layer should be called on a list of inputs. "
+                f"Received: inputs={inputs} (not a list of tensors)"
+            )
+        if self._reshape_required:
+            reshaped_inputs = []
+            input_ndims = list(map(ops.ndim, inputs))
+            if None not in input_ndims:
+                # If ranks of all inputs are available,
+                # we simply expand each of them at axis=1
+                # until all of them have the same rank.
+                max_ndim = max(input_ndims)
+                for x in inputs:
+                    x_ndim = ops.ndim(x)
+                    for _ in range(max_ndim - x_ndim):
+                        x = ops.expand_dims(x, axis=1)
+                    reshaped_inputs.append(x)
+                return self._merge_function(reshaped_inputs)
+            else:
+                # Transpose all inputs so that batch size is the last dimension.
+                # (batch_size, dim1, dim2, ... ) -> (dim1, dim2, ... ,
+                # batch_size)
+                transposed = False
+                for x in inputs:
+                    x_ndim = ops.ndim(x)
+
+                    if x_ndim is None:
+                        x_shape = ops.shape(x)
+                        batch_size = x_shape[0]
+
+                        new_shape = backend.concatenate(
+                            [x_shape[1:], ops.expand_dims(batch_size, axis=-1)]
+                        )
+                        x_transposed = ops.reshape(
+                            x,
+                            ops.stack(
+                                [batch_size, ops.prod(x_shape[1:])],
+                                axis=0,
+                            ),
+                        )
+                        x_transposed = ops.transpose(x_transposed, perm=(1, 0))
+                        x_transposed = ops.reshape(x_transposed, new_shape)
+
+                        reshaped_inputs.append(x_transposed)
+                        transposed = True
+
+                    elif x_ndim > 1:
+                        dims = list(range(1, x_ndim)) + [0]
+                        reshaped_inputs.append(ops.transpose(x, perm=dims))
+                        print(dims)
+                        transposed = True
+                    else:
+                        # We don't transpose inputs if they are 1D vectors or
+                        # scalars.
+                        reshaped_inputs.append(x)
+
+                y = self._merge_function(reshaped_inputs)
+                y_ndim = ops.ndim(y)
+
+                if transposed:
+                    # If inputs have been transposed, we have to transpose the
+                    # output too.
+                    if y_ndim is None:
+                        y_shape = ops.shape(y)
+                        y_ndim = ops.shape(y_shape)[0]
+                        batch_size = y_shape[y_ndim - 1]
+                        new_shape = ops.concatenate(
+                            [
+                                ops.expand_dims(batch_size, axis=-1),
+                                y_shape[: y_ndim - 1],
+                            ]
+                        )
+                        y = ops.reshape(y, (-1, batch_size))
+                        y = ops.transpose(y, perm=(1, 0))
+                        y = ops.reshape(y, new_shape)
+                    elif y_ndim > 1:
+                        dims = [y_ndim - 1] + list(range(y_ndim - 1))
+                        y = ops.transpose(y, perm=dims)
+                return y
+        else:
+            return self._merge_function(inputs)
+
+    def compute_output_shape(self, input_shape):
+        if input_shape[0] is None:
+            output_shape = None
+        else:
+            output_shape = input_shape[0][1:]
+
+        for i in range(1, len(input_shape)):
+            if input_shape[i] is None:
+                shape = None
+            else:
+                shape = input_shape[i][1:]
+            output_shape = self._compute_elemwise_op_output_shape(
+                output_shape, shape
+            )
+        batch_sizes = {s[0] for s in input_shape if s is not None} - {None}
+        if len(batch_sizes) == 1:
+            output_shape = (list(batch_sizes)[0],) + output_shape
+        else:
+            output_shape = (None,) + output_shape
+        return output_shape
+
+    def compute_mask(self, inputs, mask=None):
+        if mask is None:
+            return None
+        if not isinstance(mask, (tuple, list)):
+            raise ValueError(f"`mask` should be a list. Received: mask={mask}")
+        if not isinstance(inputs, (tuple, list)):
+            raise ValueError(
+                f"`inputs` should be a list. Received: inputs={inputs}"
+            )
+        if len(mask) != len(inputs):
+            raise ValueError(
+                "The lists `inputs` and `mask` should have the same length. "
+                f"Received: inputs={inputs} of length {len(inputs)}, and "
+                f"mask={mask} of length {len(mask)}"
+            )
+        if all(m is None for m in mask):
+            return None
+        masks = [ops.expand_dims(m, axis=0) for m in mask if m is not None]
+        return ops.all(ops.concatenate(masks, axis=0), axis=0, keepdims=False)
+
+    def get_config(self):
+        return super().get_config()