import numpy as np

from mpi4py import MPI
from pylops.utils.backend import get_module
from pylops.utils.typing import DTypeLike, NDArray

from pylops_mpi import (
    DistributedArray,
    MPILinearOperator,
    Partition
)


class MPIFredholm1(MPILinearOperator):
    r"""Fredholm integral of first kind.

    Implement a multi-dimensional Fredholm integral of first kind distributed
    across the first dimension.

    Parameters
    ----------
    G : :obj:`numpy.ndarray`
        Multi-dimensional convolution kernel of size
        :math:`[n_{\text{slice}} \times n_x \times n_y]`
    nz : :obj:`int`, optional
        Additional dimension of model
    saveGt : :obj:`bool`, optional
        Save ``G`` and ``G.H`` to speed up the computation of the adjoint
        (``True``) or create ``G.H`` on-the-fly (``False``).
        Note that ``saveGt=True`` will double the amount of required memory.
    usematmul : :obj:`bool`, optional
        Use :func:`numpy.matmul` (``True``) or for-loop with :func:`numpy.dot`
        (``False``). As it is not possible to define which approach is more
        performant (this is highly dependent on the size of ``G`` and input
        arrays as well as the hardware used in the computation), we advise users
        to time both methods for their specific problem prior to making a
        choice.
    base_comm : :obj:`mpi4py.MPI.Comm`, optional
        MPI Base Communicator. Defaults to ``mpi4py.MPI.COMM_WORLD``.
    dtype : :obj:`str`, optional
        Type of elements in input array.

    Attributes
    ----------
    shape : :obj:`tuple`
        Operator shape

    Raises
    ------
    NotImplementedError
        If the size of the first dimension of ``G`` is equal to 1 in any of the ranks

    Notes
    -----
    A multi-dimensional Fredholm integral of first kind can be expressed as

    .. math::

        d(k, x, z) = \int{G(k, x, y) m(k, y, z) \,\mathrm{d}y}
        \quad \forall k=1,\ldots,n_{\text{slice}}

    whilst its adjoint is expressed as

    .. math::

        m(k, y, z) = \int{G^*(k, y, x) d(k, x, z) \,\mathrm{d}x}
        \quad \forall k=1,\ldots,n_{\text{slice}}

    This integral is implemented in a distributed fashion, where ``G``
    is split across ranks along its first dimension. The inputs of both
    the forward and adjoint operations are distributed arrays with broadcast
    partition: each rank takes a portion of such arrays, computes a partial
    integral, and the resulting outputs are then gathered by all ranks to
    return a distributed array with broadcast partition.

    """

    def __init__(
        self,
        G: NDArray,
        nz: int = 1,
        saveGt: bool = False,
        usematmul: bool = True,
        base_comm: MPI.Comm = MPI.COMM_WORLD,
        dtype: DTypeLike = "float64",
    ) -> None:
        self.nz = nz
        self.nsl, self.nx, self.ny = G.shape
        self.nsls = base_comm.allgather(self.nsl)
        # nsls is identical on all ranks after allgather, so raise on every
        # rank to avoid leaving some ranks hanging in later collective calls
        if 1 in self.nsls:
            raise NotImplementedError(f'All ranks must have at least two '
                                      f'elements in the first dimension: '
                                      f'local split is instead {self.nsls}...')
        nslstot = base_comm.allreduce(self.nsl)
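        # start/end indices of the slices owned by each rank within the
        # global first dimension (used to extract each rank's portion of x)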
        self.islstart = np.insert(np.cumsum(self.nsls)[:-1], 0, 0)
        self.islend = np.cumsum(self.nsls)
        self.rank = base_comm.Get_rank()
        self.dims = (nslstot, self.ny, self.nz)
        self.dimsd = (nslstot, self.nx, self.nz)
        shape = (np.prod(self.dimsd),
                 np.prod(self.dims))
        super().__init__(shape=shape, dtype=np.dtype(dtype), base_comm=base_comm)

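        # store the local kernel and, optionally, precompute its conjugate
        # transpose (saveGt trades extra memory for a faster adjoint)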
        self.G = G
        if saveGt:
            self.GT = G.transpose((0, 2, 1)).conj()
        self.usematmul = usematmul

    def _matvec(self, x: DistributedArray) -> DistributedArray:
        ncp = get_module(x.engine)
        if x.partition is not Partition.BROADCAST:
            raise ValueError(f"x should have partition={Partition.BROADCAST}, "
                             f"got {x.partition} instead")
        y = DistributedArray(global_shape=self.shape[0], partition=Partition.BROADCAST,
                             engine=x.engine, dtype=self.dtype)
        # select the slices of the broadcast model handled by this rank
        x = x.local_array.reshape(self.dims).squeeze()
        x = x[self.islstart[self.rank]:self.islend[self.rank]]
        # apply kernel to the portion of the slices owned by this rank
        if self.usematmul:
            if self.nz == 1:
                x = x[..., ncp.newaxis]
            y1 = ncp.matmul(self.G, x)
        else:
            y1 = ncp.squeeze(ncp.zeros((self.nsls[self.rank], self.nx, self.nz), dtype=self.dtype))
            for isl in range(self.nsls[self.rank]):
                y1[isl] = ncp.dot(self.G[isl], x[isl])
        # gather partial results from all ranks into the broadcast output
        y[:] = np.vstack(self.base_comm.allgather(y1)).ravel()
        return y

    def _rmatvec(self, x: DistributedArray) -> DistributedArray:
        ncp = get_module(x.engine)
        if x.partition is not Partition.BROADCAST:
            raise ValueError(f"x should have partition={Partition.BROADCAST}, "
                             f"got {x.partition} instead")
        y = DistributedArray(global_shape=self.shape[1], partition=Partition.BROADCAST,
                             engine=x.engine, dtype=self.dtype)
        # select the slices of the broadcast data handled by this rank
        x = x.local_array.reshape(self.dimsd).squeeze()
        x = x[self.islstart[self.rank]:self.islend[self.rank]]
        # apply adjoint kernel to the portion of the slices owned by this rank
        if self.usematmul:
            if self.nz == 1:
                x = x[..., ncp.newaxis]
            if hasattr(self, "GT"):
                y1 = ncp.matmul(self.GT, x)
            else:
                y1 = (
                    ncp.matmul(x.transpose(0, 2, 1).conj(), self.G)
                    .transpose(0, 2, 1)
                    .conj()
                )
        else:
            y1 = ncp.squeeze(ncp.zeros((self.nsls[self.rank], self.ny, self.nz), dtype=self.dtype))
            if hasattr(self, "GT"):
                for isl in range(self.nsls[self.rank]):
                    y1[isl] = ncp.dot(self.GT[isl], x[isl])
            else:
                for isl in range(self.nsls[self.rank]):
                    y1[isl] = ncp.dot(x[isl].T.conj(), self.G[isl]).T.conj()

        # gather partial results from all ranks into the broadcast output
        y[:] = np.vstack(self.base_comm.allgather(y1)).ravel()
        return y
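

# A minimal usage sketch (hypothetical sizes; run with e.g. ``mpirun -n 2``).
# Each rank holds its own block of slices of ``G``, while model and data are
# broadcast to all ranks; ``matvec``/``rmatvec`` then compute the distributed
# forward and adjoint integrals.
if __name__ == "__main__":
    nsl, nx, ny, nz = 4, 5, 3, 2  # per-rank slices and integral sizes (assumed)
    G = np.arange(nsl * nx * ny, dtype="float64").reshape(nsl, nx, ny)
    Fop = MPIFredholm1(G, nz=nz, saveGt=True, dtype="float64")
    # broadcast model: every rank holds the full flattened model
    m = DistributedArray(global_shape=Fop.shape[1],
                         partition=Partition.BROADCAST, dtype="float64")
    m[:] = np.ones(Fop.shape[1], dtype="float64")
    d = Fop.matvec(m)      # forward: d(k, x, z)
    madj = Fop.rmatvec(d)  # adjoint: m(k, y, z)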