__all__ = ["BlockDiag"]
import concurrent.futures as mt
import multiprocessing as mp
import numpy as np
import scipy as sp
# The private ``interface`` submodule of ``scipy.sparse.linalg`` was renamed
# to ``_interface`` in scipy 1.8.0, so the import path depends on the
# installed scipy version.
sp_version = sp.__version__.split(".")
# Compare (major, minor) as a tuple: a plain ``major <= 1 and minor < 8`` test
# wrongly sends releases such as 0.19 (minor >= 8) down the new-layout branch.
if (int(sp_version[0]), int(sp_version[1])) < (1, 8):
    from scipy.sparse.linalg.interface import LinearOperator as spLinearOperator
    from scipy.sparse.linalg.interface import _get_dtype
else:
    from scipy.sparse.linalg._interface import (
        _get_dtype,
        LinearOperator as spLinearOperator,
    )
from typing import Optional, Sequence
from pylops import LinearOperator
from pylops.basicoperators import MatrixMult
from pylops.utils.backend import get_array_module, get_module, inplace_set
from pylops.utils.typing import DTypeLike, NDArray
def _matvec_rmatvec_map(op, x: NDArray) -> NDArray:
    """Apply a single block's matvec/rmatvec callable to its chunk of data.

    Worker function handed to the process/thread pool by the parallel
    matvec/rmatvec implementations.

    Parameters
    ----------
    op : :obj:`callable`
        Callable evaluating the forward or adjoint of one block.
    x : :obj:`numpy.ndarray`
        Portion of the input vector associated with that block.

    Returns
    -------
    y : :obj:`numpy.ndarray`
        Result of ``op(x)`` with singleton dimensions removed.

    """
    result = op(x)
    return result.squeeze()
class BlockDiag(LinearOperator):
    r"""Block-diagonal operator.

    Create a block-diagonal operator from N linear operators.

    Parameters
    ----------
    ops : :obj:`list`
        Linear operators to be stacked. Alternatively,
        :obj:`numpy.ndarray` or :obj:`scipy.sparse` matrices can be passed
        in place of one or more operators. The input sequence is copied
        and never modified.
    nproc : :obj:`int`, optional
        Number of processes/threads used to evaluate the N operators in parallel using
        ``multiprocessing``/``concurrent.futures``. If ``nproc=1``, work in serial mode.
    forceflat : :obj:`bool`, optional
        .. versionadded:: 2.2.0

        Force an array to be flattened after matvec and rmatvec.
    inoutengine : :obj:`tuple`, optional
        .. versionadded:: 2.4.0

        Type of output vectors of `matvec` and `rmatvec`. If ``None``, this is
        inferred directly from the input vectors. Note that this is ignored
        if ``nproc>1``.
    parallel_kind : :obj:`str`, optional
        .. versionadded:: 2.6.0

        Parallelism kind when ``nproc>1``. Can be ``multiproc`` (using
        :mod:`multiprocessing`) or ``multithread`` (using
        :class:`concurrent.futures.ThreadPoolExecutor`). Defaults
        to ``multiproc``.
    dtype : :obj:`str`, optional
        Type of elements in input array.

    Attributes
    ----------
    nops : :obj:`int`
        Number of rows of the full operator (sum of rows of each block).
    mops : :obj:`int`
        Number of columns of the full operator (sum of columns of each block).
    nnops : :obj:`numpy.ndarray`
        Cumulative sum of rows of each block, with a leading zero.
    mmops : :obj:`numpy.ndarray`
        Cumulative sum of columns of each block, with a leading zero.
    dims : :obj:`tuple`
        Shape of the array after the adjoint, but before flattening.

        For example, ``x_reshaped = (Op.H * y.ravel()).reshape(Op.dims)``.
    dimsd : :obj:`tuple`
        Shape of the array after the forward, but before flattening.

        For example, ``y_reshaped = (Op * x.ravel()).reshape(Op.dimsd)``.
    pool : :obj:`multiprocessing.Pool` or :obj:`concurrent.futures.ThreadPoolExecutor` or :obj:`None`
        Pool of workers used to evaluate the N operators in parallel.
        When ``nproc=1``, no pool is created (i.e., ``pool=None``). The
        attribute is also reset to ``None`` once the pool has been closed.
    shape : :obj:`tuple`
        Operator shape.

    Raises
    ------
    ValueError
        If ``parallel_kind`` is neither ``multiproc`` nor ``multithread``.

    Notes
    -----
    A block-diagonal operator composed of N linear operators is created such
    as its application in forward mode leads to

    .. math::
        \begin{bmatrix}
            \mathbf{L}_1 & \mathbf{0}   & \ldots & \mathbf{0}  \\
            \mathbf{0}   & \mathbf{L}_2 & \ldots & \mathbf{0}  \\
            \vdots       & \vdots       & \ddots & \vdots      \\
            \mathbf{0}   & \mathbf{0}   & \ldots & \mathbf{L}_N
        \end{bmatrix}
        \begin{bmatrix}
            \mathbf{x}_{1}  \\
            \mathbf{x}_{2}  \\
            \vdots     \\
            \mathbf{x}_{N}
        \end{bmatrix} =
        \begin{bmatrix}
            \mathbf{L}_1 \mathbf{x}_{1}  \\
            \mathbf{L}_2 \mathbf{x}_{2}  \\
            \vdots     \\
            \mathbf{L}_N \mathbf{x}_{N}
        \end{bmatrix}

    while its application in adjoint mode leads to

    .. math::
        \begin{bmatrix}
            \mathbf{L}_1^H & \mathbf{0}     & \ldots & \mathbf{0}  \\
            \mathbf{0}     & \mathbf{L}_2^H & \ldots & \mathbf{0}  \\
            \vdots         & \vdots         & \ddots & \vdots      \\
            \mathbf{0}     & \mathbf{0}     & \ldots & \mathbf{L}_N^H
        \end{bmatrix}
        \begin{bmatrix}
            \mathbf{y}_{1}  \\
            \mathbf{y}_{2}  \\
            \vdots     \\
            \mathbf{y}_{N}
        \end{bmatrix} =
        \begin{bmatrix}
            \mathbf{L}_1^H \mathbf{y}_{1}  \\
            \mathbf{L}_2^H \mathbf{y}_{2}  \\
            \vdots     \\
            \mathbf{L}_N^H \mathbf{y}_{N}
        \end{bmatrix}

    """

    def __init__(
        self,
        ops: Sequence[LinearOperator],
        nproc: int = 1,
        forceflat: Optional[bool] = None,
        inoutengine: Optional[tuple] = None,
        parallel_kind: str = "multiproc",
        dtype: Optional[DTypeLike] = None,
    ) -> None:
        if parallel_kind not in ["multiproc", "multithread"]:
            raise ValueError("parallel_kind must be 'multiproc' or 'multithread'")

        # Work on a private copy: plain matrices are wrapped in MatrixMult
        # below, and doing that in place would silently rewrite the caller's
        # list (and fail outright for immutable sequences such as tuples).
        self.ops = list(ops)
        nblocks = len(self.ops)

        # identify dimensions
        mops = np.zeros(nblocks, dtype=int)
        nops = np.zeros(nblocks, dtype=int)
        for iop, oper in enumerate(self.ops):
            if not isinstance(oper, (LinearOperator, spLinearOperator)):
                self.ops[iop] = MatrixMult(oper, dtype=oper.dtype)
            nops[iop] = self.ops[iop].shape[0]
            mops[iop] = self.ops[iop].shape[1]
        self.nops = int(nops.sum())
        self.mops = int(mops.sum())
        self.nnops = np.insert(np.cumsum(nops), 0, 0)
        self.mmops = np.insert(np.cumsum(mops), 0, 0)

        # define dims (check if all operators have the same,
        # otherwise make same as self.mops and forceflat=True)
        dims = [op.dims for op in self.ops]
        if len(set(dims)) == 1:
            dims = (nblocks, *dims[0])
        else:
            dims = (self.mops,)
            forceflat = True

        # define dimsd (check if all operators have the same,
        # otherwise make same as self.nops and forceflat=True)
        dimsd = [op.dimsd for op in self.ops]
        if len(set(dimsd)) == 1:
            dimsd = (nblocks, *dimsd[0])
        else:
            dimsd = (self.nops,)
            forceflat = True

        # create pool for multithreading / multiprocessing
        # (multiprocessing pool, ThreadPoolExecutor, or None in serial mode)
        self.parallel_kind = parallel_kind
        self._nproc = nproc
        self.pool = self._create_pool(nproc)

        self.inoutengine = inoutengine
        dtype = _get_dtype(self.ops) if dtype is None else np.dtype(dtype)
        clinear = all(getattr(oper, "clinear", True) for oper in self.ops)
        super().__init__(
            dtype=dtype,
            dims=dims,
            dimsd=dimsd,
            clinear=clinear,
            forceflat=forceflat,
        )

    def _create_pool(self, nproc: int):
        """Return a new worker pool for ``nproc`` workers, or ``None`` if ``nproc<=1``."""
        if nproc <= 1:
            return None
        if self.parallel_kind == "multiproc":
            return mp.Pool(processes=nproc)
        return mt.ThreadPoolExecutor(max_workers=nproc)

    def _close_pool(self) -> None:
        """Shut down the current worker pool (if any) and reset ``self.pool`` to ``None``."""
        if self.pool is None:
            return
        if self.parallel_kind == "multiproc":
            self.pool.close()
            self.pool.join()
        else:
            self.pool.shutdown()
        # Never keep a reference to a closed pool: the dispatch in
        # _matvec/_rmatvec relies on ``pool is None`` to select serial mode.
        self.pool = None

    @property
    def nproc(self) -> int:
        """Number of processes/threads used to evaluate the blocks."""
        return self._nproc

    @nproc.setter
    def nproc(self, nprocnew: int) -> None:
        # Dispose of the previous pool before (possibly) creating a new one
        # sized for the new number of workers.
        self._close_pool()
        self.pool = self._create_pool(nprocnew)
        self._nproc = nprocnew

    def _block_tasks(self, x: NDArray, adjoint: bool) -> list:
        """Pair each block's private matvec/rmatvec with its slice of ``x``."""
        # Forward mode slices the model vector (column offsets), adjoint mode
        # slices the data vector (row offsets).
        offsets = self.nnops if adjoint else self.mmops
        return [
            (
                oper._rmatvec if adjoint else oper._matvec,
                x[offsets[iop] : offsets[iop + 1]],
            )
            for iop, oper in enumerate(self.ops)
        ]

    def _matvec_serial(self, x: NDArray) -> NDArray:
        """Forward mode, applying the blocks one after the other."""
        ncp = (
            get_array_module(x)
            if self.inoutengine is None
            else get_module(self.inoutengine[0])
        )
        y = ncp.zeros(self.nops, dtype=self.dtype)
        for iop, oper in enumerate(self.ops):
            # inplace_set hands back the updated array, which is re-bound to y
            y = inplace_set(
                oper.matvec(x[self.mmops[iop] : self.mmops[iop + 1]]).squeeze(),
                y,
                slice(self.nnops[iop], self.nnops[iop + 1]),
            )
        return y

    def _rmatvec_serial(self, x: NDArray) -> NDArray:
        """Adjoint mode, applying the blocks one after the other."""
        ncp = (
            get_array_module(x)
            if self.inoutengine is None
            else get_module(self.inoutengine[1])
        )
        y = ncp.zeros(self.mops, dtype=self.dtype)
        for iop, oper in enumerate(self.ops):
            # inplace_set hands back the updated array, which is re-bound to y
            y = inplace_set(
                oper.rmatvec(x[self.nnops[iop] : self.nnops[iop + 1]]).squeeze(),
                y,
                slice(self.mmops[iop], self.mmops[iop + 1]),
            )
        return y

    def _matvec_multiproc(self, x: NDArray) -> NDArray:
        """Forward mode, one task per block on the multiprocessing pool."""
        ys = self.pool.starmap(
            _matvec_rmatvec_map, self._block_tasks(x, adjoint=False)
        )
        return np.hstack(ys)

    def _rmatvec_multiproc(self, x: NDArray) -> NDArray:
        """Adjoint mode, one task per block on the multiprocessing pool."""
        ys = self.pool.starmap(
            _matvec_rmatvec_map, self._block_tasks(x, adjoint=True)
        )
        return np.hstack(ys)

    def _matvec_multithread(self, x: NDArray) -> NDArray:
        """Forward mode, one task per block on the thread pool."""
        ys = list(
            self.pool.map(
                lambda args: _matvec_rmatvec_map(*args),
                self._block_tasks(x, adjoint=False),
            )
        )
        return np.hstack(ys)

    def _rmatvec_multithread(self, x: NDArray) -> NDArray:
        """Adjoint mode, one task per block on the thread pool."""
        ys = list(
            self.pool.map(
                lambda args: _matvec_rmatvec_map(*args),
                self._block_tasks(x, adjoint=True),
            )
        )
        return np.hstack(ys)

    def _matvec(self, x: NDArray) -> NDArray:
        # Serial mode whenever there is no usable pool: ``nproc<=1`` or the
        # pool has been closed. Without this guard those cases would end up
        # calling a method on ``None``.
        if self.pool is None or self.nproc <= 1:
            return self._matvec_serial(x)
        if self.parallel_kind == "multiproc":
            return self._matvec_multiproc(x)
        return self._matvec_multithread(x)

    def _rmatvec(self, x: NDArray) -> NDArray:
        # Same dispatch rule as in _matvec.
        if self.pool is None or self.nproc <= 1:
            return self._rmatvec_serial(x)
        if self.parallel_kind == "multiproc":
            return self._rmatvec_multiproc(x)
        return self._rmatvec_multithread(x)

    def close(self) -> None:
        """Close the pool of workers used for multiprocessing
        / multithreading.

        Calling this method when no pool exists is a no-op. After the pool
        has been closed, ``pool`` is ``None`` and the operator is evaluated
        in serial mode.
        """
        self._close_pool()