
Added MPISecondDerivative #58

Merged 7 commits on Aug 6, 2023
1 change: 1 addition & 0 deletions docs/source/api/index.rst
@@ -53,6 +53,7 @@ Derivatives
:toctree: generated/

MPIFirstDerivative
MPISecondDerivative

Solvers
-------
86 changes: 86 additions & 0 deletions examples/plot_derivative.py
@@ -0,0 +1,86 @@
"""
Derivatives
===========
This example demonstrates how to use pylops-mpi's derivative operators, namely
:py:class:`pylops_mpi.basicoperators.MPIFirstDerivative` and
:py:class:`pylops_mpi.basicoperators.MPISecondDerivative`.

We focus here on the case where the input array :math:`x` is assumed to be
an n-dimensional :py:class:`pylops_mpi.DistributedArray` and the derivative is
applied over the first axis (``axis=0``). Since the array is distributed
over multiple processes, the derivative operators must apply the derivative
across the edges between processes, using information from the previous/next
process by means of so-called ghost cells.

Derivative operators are commonly used when solving inverse problems, within
regularization terms aimed at enforcing smooth solutions.

"""
from matplotlib import pyplot as plt
import numpy as np
from mpi4py import MPI

import pylops_mpi

plt.close("all")
np.random.seed(42)

rank = MPI.COMM_WORLD.Get_rank()
size = MPI.COMM_WORLD.Get_size()

###############################################################################
# Let’s start by applying the first derivative to a :py:class:`pylops_mpi.DistributedArray`
# in the first direction (i.e., along ``axis=0``) using the
# :py:class:`pylops_mpi.basicoperators.MPIFirstDerivative` operator.
nx, ny = 11, 21
x = np.zeros((nx, ny))
x[nx // 2, ny // 2] = 1.0

Fop = pylops_mpi.MPIFirstDerivative((nx, ny), dtype=np.float64)
x_dist = pylops_mpi.DistributedArray.to_dist(x=x.flatten())
y_dist = Fop @ x_dist
y = y_dist.asarray().reshape((nx, ny))

if rank == 0:
fig, axs = plt.subplots(1, 2, figsize=(10, 3), sharey=True)
fig.suptitle(
"First Derivative in 1st direction", fontsize=12, fontweight="bold", y=0.95
)
im = axs[0].imshow(x, interpolation="nearest", cmap="rainbow")
axs[0].axis("tight")
axs[0].set_title("x")
plt.colorbar(im, ax=axs[0])
im = axs[1].imshow(y, interpolation="nearest", cmap="rainbow")
axs[1].axis("tight")
axs[1].set_title("y")
plt.colorbar(im, ax=axs[1])
plt.tight_layout()
plt.subplots_adjust(top=0.8)

###############################################################################
# We can now do the same for the second derivative using the
# :py:class:`pylops_mpi.basicoperators.MPISecondDerivative` operator.
nx, ny = 11, 21
x = np.zeros((nx, ny))
x[nx // 2, ny // 2] = 1.0

Sop = pylops_mpi.MPISecondDerivative(dims=(nx, ny), dtype=np.float64)
x_dist = pylops_mpi.DistributedArray.to_dist(x=x.flatten())
y_dist = Sop @ x_dist
y = y_dist.asarray().reshape((nx, ny))

if rank == 0:
fig, axs = plt.subplots(1, 2, figsize=(10, 3), sharey=True)
fig.suptitle(
"Second Derivative in 1st direction", fontsize=12, fontweight="bold", y=0.95
)
im = axs[0].imshow(x, interpolation="nearest", cmap="rainbow")
axs[0].axis("tight")
axs[0].set_title("x")
plt.colorbar(im, ax=axs[0])
im = axs[1].imshow(y, interpolation="nearest", cmap="rainbow")
axs[1].axis("tight")
axs[1].set_title("y")
plt.colorbar(im, ax=axs[1])
plt.tight_layout()
plt.subplots_adjust(top=0.8)
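###############################################################################
# As a quick sanity check (not part of this PR), the distributed result can be
# cross-checked against the serial pylops operator on a single rank. This is a
# hedged sketch: it assumes ``pylops`` is installed (pylops-mpi depends on it)
# and that ``pylops.SecondDerivative`` with ``axis=0`` matches the defaults
# used above (centered stencil, unit sampling).
import pylops

if rank == 0:
    # apply the serial second derivative to the same flattened input
    Sop_serial = pylops.SecondDerivative(dims=(nx, ny), axis=0, dtype=np.float64)
    y_serial = (Sop_serial @ x.ravel()).reshape(nx, ny)
    # the distributed and serial results should agree to machine precision
    print("max |distributed - serial| =", np.abs(y - y_serial).max())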
240 changes: 240 additions & 0 deletions pylops_mpi/basicoperators/SecondDerivative.py
@@ -0,0 +1,240 @@
import numpy as np

from typing import Callable, Union
from pylops.utils.typing import DTypeLike, InputDimsLike
from pylops.utils._internal import _value_or_sized_to_tuple

from pylops_mpi import DistributedArray, MPILinearOperator, Partition
from pylops_mpi.utils.decorators import reshaped


class MPISecondDerivative(MPILinearOperator):
r"""MPI Second Derivative

Apply a second derivative using a three-point stencil finite-difference
approximation to a :class:`pylops_mpi.DistributedArray`. The second derivative
is computed along ``axis=0``.

Parameters
----------
dims : :obj:`int` or :obj:`tuple`
Number of samples for each dimension.
sampling : :obj:`float`, optional
Sampling step :math:`\Delta x`.
kind : :obj:`str`, optional
Derivative kind (``forward``, ``centered``, or ``backward``).
edge : :obj:`bool`, optional
Use reduced order derivative at edges (``True``) or
ignore them (``False``). This is currently only available
for the centered derivative.
dtype : :obj:`str`, optional
Type of elements in the input array.

Attributes
----------
shape : :obj:`tuple`
Operator shape

Notes
-----
The MPISecondDerivative operator applies a second derivative to a :class:`pylops_mpi.DistributedArray`
using a second-order forward, backward, or centered stencil.

Similar to :py:class:`pylops_mpi.basicoperators.MPIFirstDerivative`,
**ghosting** is applied at each rank to include duplicated copies of border cells
(ghost cells) from neighboring processes. These ghost cells enable each process
to perform its local computation independently, avoiding direct
communication with other processes during the stencil evaluation. As a result,
the second derivative of the entire distributed array can be computed efficiently.

For a one-dimensional DistributedArray, the second-order forward stencil is:

.. math::
    y[i] = (x[i+2] - 2x[i+1] + x[i]) / \Delta x^2

while the second-order backward stencil is:

.. math::
    y[i] = (x[i] - 2x[i-1] + x[i-2]) / \Delta x^2

and the second-order centered stencil is:

.. math::
    y[i] = (x[i+1] - 2x[i] + x[i-1]) / \Delta x^2

where :math:`y` is a DistributedArray and :math:`x` is a Ghosted array created
by adding border cells of neighboring processes to the local array at each rank.

"""

def __init__(
self,
dims: Union[int, InputDimsLike],
sampling: float = 1.0,
kind: str = "centered",
edge: bool = False,
dtype: DTypeLike = np.float64,
) -> None:
self.dims = _value_or_sized_to_tuple(dims)
shape = (int(np.prod(dims)),) * 2
super().__init__(shape=shape, dtype=np.dtype(dtype))
self.sampling = sampling
self.kind = kind
self.edge = edge
self._register_multiplications(self.kind)

def _register_multiplications(
self,
kind: str,
) -> None:
# choose _matvec and _rmatvec kind
self._hmatvec: Callable
self._hrmatvec: Callable
if kind == "forward":
self._hmatvec = self._matvec_forward
self._hrmatvec = self._rmatvec_forward
elif kind == "centered":
self._hmatvec = self._matvec_centered
self._hrmatvec = self._rmatvec_centered
elif kind == "backward":
self._hmatvec = self._matvec_backward
self._hrmatvec = self._rmatvec_backward
else:
raise NotImplementedError(
"'kind' must be 'forward', 'centered' or 'backward'"
)

def _matvec(self, x: DistributedArray) -> DistributedArray:
# If Partition.BROADCAST, then convert to Partition.SCATTER
if x.partition is Partition.BROADCAST:
x = DistributedArray.to_dist(x=x.local_array)
return self._hmatvec(x)

def _rmatvec(self, x: DistributedArray) -> DistributedArray:
# If Partition.BROADCAST, then convert to Partition.SCATTER
if x.partition is Partition.BROADCAST:
x = DistributedArray.to_dist(x=x.local_array)
return self._hrmatvec(x)

@reshaped
def _matvec_forward(self, x: DistributedArray) -> DistributedArray:
y = DistributedArray(global_shape=x.global_shape, dtype=self.dtype, axis=x.axis)
ghosted_x = x.add_ghost_cells(cells_back=2)
y_forward = ghosted_x[2:] - 2 * ghosted_x[1:-1] + ghosted_x[:-2]
if self.rank == self.size - 1:
y_forward = np.append(y_forward, np.zeros((min(y.global_shape[0], 2),) + self.dims[1:]), axis=0)
y[:] = y_forward / self.sampling ** 2
return y

@reshaped
def _rmatvec_forward(self, x: DistributedArray) -> DistributedArray:
y = DistributedArray(global_shape=x.global_shape, dtype=self.dtype, axis=x.axis)
y[:] = 0
if self.rank == self.size - 1:
y[:-2] += x[:-2]
else:
y[:] += x[:]

ghosted_x = x.add_ghost_cells(cells_front=1, cells_back=1)
y_forward = ghosted_x[:-2]
if self.rank == 0:
y_forward = np.insert(y_forward, 0, np.zeros((1,) + self.dims[1:]), axis=0)
if self.rank == self.size - 1:
y_forward = np.append(y_forward, np.zeros((min(1, y.global_shape[0] - 1),) + self.dims[1:]), axis=0)
y[:] -= 2 * y_forward

ghosted_x = x.add_ghost_cells(cells_front=2)
y_forward = ghosted_x[:-2]
if self.rank == 0:
y_forward = np.insert(y_forward, 0, np.zeros((min(y.global_shape[0], 2),) + self.dims[1:]), axis=0)
y[:] += y_forward
y[:] /= self.sampling ** 2
return y

@reshaped
def _matvec_backward(self, x: DistributedArray) -> DistributedArray:
y = DistributedArray(global_shape=x.global_shape, dtype=self.dtype, axis=x.axis)
ghosted_x = x.add_ghost_cells(cells_front=2)
y_backward = ghosted_x[2:] - 2 * ghosted_x[1:-1] + ghosted_x[:-2]
if self.rank == 0:
y_backward = np.insert(y_backward, 0, np.zeros((min(y.global_shape[0], 2),) + self.dims[1:]), axis=0)
y[:] = y_backward / self.sampling ** 2
return y

@reshaped
def _rmatvec_backward(self, x: DistributedArray) -> DistributedArray:
y = DistributedArray(global_shape=x.global_shape, dtype=self.dtype, axis=x.axis)
y[:] = 0
ghosted_x = x.add_ghost_cells(cells_back=2)
y_backward = ghosted_x[2:]
if self.rank == self.size - 1:
y_backward = np.append(y_backward, np.zeros((min(2, y.global_shape[0]),) + self.dims[1:]), axis=0)
y[:] += y_backward

ghosted_x = x.add_ghost_cells(cells_front=1, cells_back=1)
y_backward = 2 * ghosted_x[2:]
if self.rank == 0:
y_backward = np.insert(y_backward, 0, np.zeros((1,) + self.dims[1:]), axis=0)
if self.rank == self.size - 1:
y_backward = np.append(y_backward, np.zeros((min(1, y.global_shape[0] - 1),) + self.dims[1:]), axis=0)
y[:] -= y_backward

if self.rank == 0:
y[2:] += x[2:]
else:
y[:] += x[:]
y[:] /= self.sampling ** 2
return y

@reshaped
def _matvec_centered(self, x: DistributedArray) -> DistributedArray:
y = DistributedArray(global_shape=x.global_shape, dtype=self.dtype, axis=x.axis)
ghosted_x = x.add_ghost_cells(cells_front=1, cells_back=1)
y_centered = ghosted_x[2:] - 2 * ghosted_x[1:-1] + ghosted_x[:-2]
if self.rank == 0:
y_centered = np.insert(y_centered, 0, np.zeros((1,) + self.dims[1:]), axis=0)
if self.rank == self.size - 1:
y_centered = np.append(y_centered, np.zeros((min(1, y.global_shape[0] - 1),) + self.dims[1:]), axis=0)
y[:] = y_centered
if self.edge:
if self.rank == 0:
y[0] = x[0] - 2 * x[1] + x[2]
if self.rank == self.size - 1:
y[-1] = x[-3] - 2 * x[-2] + x[-1]
y[:] /= self.sampling ** 2
return y

@reshaped
def _rmatvec_centered(self, x: DistributedArray) -> DistributedArray:
y = DistributedArray(global_shape=x.global_shape, dtype=self.dtype, axis=x.axis)
y[:] = 0
ghosted_x = x.add_ghost_cells(cells_back=2)
y_centered = ghosted_x[1:-1]
if self.rank == self.size - 1:
y_centered = np.append(y_centered, np.zeros((min(2, y.global_shape[0]),) + self.dims[1:]), axis=0)
y[:] += y_centered

ghosted_x = x.add_ghost_cells(cells_front=1, cells_back=1)
y_centered = 2 * ghosted_x[1:-1]
if self.rank == 0:
y_centered = np.insert(y_centered, 0, np.zeros((1,) + self.dims[1:]), axis=0)
if self.rank == self.size - 1:
y_centered = np.append(y_centered, np.zeros((min(1, y.global_shape[0] - 1),) + self.dims[1:]), axis=0)
y[:] -= y_centered

ghosted_x = x.add_ghost_cells(cells_front=2)
y_centered = ghosted_x[1:-1]
if self.rank == 0:
y_centered = np.insert(y_centered, 0, np.zeros((min(2, y.global_shape[0]),) + self.dims[1:]), axis=0)
y[:] += y_centered
if self.edge:
if self.rank == 0:
y[0] += x[0]
y[1] -= 2 * x[0]
y[2] += x[0]
if self.rank == self.size - 1:
y[-3] += x[-1]
y[-2] -= 2 * x[-1]
y[-1] += x[-1]
y[:] /= self.sampling ** 2
return y
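Beyond the unit tests, a minimal adjoint ("dot") test illustrates that the forward and adjoint stencils above are consistent. This is a sketch under assumptions: it presumes ``MPILinearOperator`` exposes an ``.H`` adjoint like pylops operators do, and it can be run with e.g. ``mpiexec -n 2``.

import numpy as np
from mpi4py import MPI

import pylops_mpi

np.random.seed(42)
n = 30
Sop = pylops_mpi.MPISecondDerivative(dims=n, dtype=np.float64)
x = pylops_mpi.DistributedArray.to_dist(x=np.random.normal(size=n))
y = pylops_mpi.DistributedArray.to_dist(x=np.random.normal(size=n))

# <S x, y> should equal <x, S^H y> up to floating-point error
lhs = np.dot((Sop @ x).asarray(), y.asarray())
rhs = np.dot(x.asarray(), (Sop.H @ y).asarray())
if MPI.COMM_WORLD.Get_rank() == 0:
    print(f"dot test: {lhs:.8f} vs {rhs:.8f}")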
4 changes: 3 additions & 1 deletion pylops_mpi/basicoperators/__init__.py
@@ -18,10 +18,12 @@
from .VStack import *
from .HStack import *
from .FirstDerivative import *
from .SecondDerivative import *

__all__ = [
"MPIBlockDiag",
"MPIVStack",
"MPIHStack",
"MPIFirstDerivative"
"MPIFirstDerivative",
"MPISecondDerivative"
]
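For completeness, a one-line smoke test (a sketch, assuming the package is importable) confirms that the new operator is re-exported at the top level, as the example above relies on:

import numpy as np
import pylops_mpi

for kind in ("forward", "centered", "backward"):
    op = pylops_mpi.MPISecondDerivative(dims=(11, 21), kind=kind, dtype=np.float64)
    print(kind, op.shape)  # each kind maps a flattened (11 * 21,)-vector to itself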