Source code for pygeoinf.linear_operators

"""
Provides classes for linear operators between Hilbert spaces.

This module is the primary tool for defining and manipulating linear mappings
between `HilbertSpace` objects. It provides a powerful `LinearOperator` class
that supports a rich algebra and includes numerous factory methods for
convenient construction from matrices, forms, or tensor products.

Key Classes
-----------
- `LinearOperator`: The main workhorse for linear algebra. It represents a
  linear map `L(x) = Ax` and provides rich functionality, including composition
  (`@`), adjoints (`.adjoint`), duals (`.dual`), and matrix representations
  (`.matrix`).
- `DiagonalLinearOperator`: A specialized, efficient implementation for linear
  operators that are diagonal in their component representation, notable for
  supporting functional calculus (e.g., `.inverse`, `.sqrt`).
"""

from __future__ import annotations
from typing import Callable, List, Optional, Any, Union, Tuple, TYPE_CHECKING, Dict

from collections import defaultdict

import numpy as np
import scipy.sparse as sp
from scipy.sparse.linalg import LinearOperator as ScipyLinOp


from joblib import Parallel, delayed


from .nonlinear_operators import NonLinearOperator


from .parallel import parallel_compute_dense_matrix_from_scipy_op

from .checks.linear_operators import LinearOperatorAxiomChecks


if TYPE_CHECKING:
    from .hilbert_space import HilbertSpace, Vector
    from .linear_forms import LinearForm



[docs]
class LinearOperator(NonLinearOperator, LinearOperatorAxiomChecks):
    """A linear operator between two Hilbert spaces.

    This class represents a linear map `A(x)` and provides rich
    functionality for linear algebraic operations. It specializes
    `NonLinearOperator`, with the derivative mapping taking the
    required form (i.e., the derivative is just the operator itself).

    Key features include operator algebra (`@`, `+`, `*`), automatic
    derivation of adjoint (`.adjoint`) and dual (`.dual`) operators, and
    multiple matrix representations (`.matrix()`) for use with numerical
    solvers.
    """

    def __init__(
        self,
        domain: HilbertSpace,
        codomain: HilbertSpace,
        mapping: Callable[[Vector], Vector],
        /,
        *,
        dual_mapping: Optional[Callable[[Vector], Vector]] = None,
        adjoint_mapping: Optional[Callable[[Vector], Vector]] = None,
        dual_base: Optional[LinearOperator] = None,
        adjoint_base: Optional[LinearOperator] = None,
    ) -> None:
        """
        Initializes the LinearOperator.

        Args:
            domain (HilbertSpace): The domain of the operator.
            codomain (HilbertSpace): The codomain of the operator.
            mapping (callable): The function defining the linear mapping.
            dual_mapping (callable, optional): The action of the dual operator.
            adjoint_mapping (callable, optional): The action of the adjoint.
            dual_base (LinearOperator, optional): Internal use for duals.
            adjoint_base (LinearOperator, optional): Internal use for adjoints.

        Notes:
            If neither the dual or adjoint mappings are provided, an they are
            deduced internally using a correct but very inefficient method.
            In general this functionality should not be relied on other than
            for operators between low-dimensional spaces.
        """
        super().__init__(
            domain, codomain, self._mapping_impl, derivative=self._derivative_impl
        )
        self._mapping = mapping
        self._dual_base: Optional[LinearOperator] = dual_base
        self._adjoint_base: Optional[LinearOperator] = adjoint_base
        self.__adjoint_mapping: Callable[[Any], Any]
        self.__dual_mapping: Callable[[Any], Any]

        self.__using_default_dual_and_adjoint = False

        if dual_mapping is None:
            if adjoint_mapping is None:
                self.__dual_mapping = self._dual_mapping_default
                self.__adjoint_mapping = self._adjoint_mapping_from_dual
                self.__using_default_dual_and_adjoint = True
            else:
                self.__adjoint_mapping = adjoint_mapping
                self.__dual_mapping = self._dual_mapping_from_adjoint
        else:
            self.__dual_mapping = dual_mapping
            if adjoint_mapping is None:
                self.__adjoint_mapping = self._adjoint_mapping_from_dual
            else:
                self.__adjoint_mapping = adjoint_mapping


[docs]
    @staticmethod
    def self_dual(
        domain: HilbertSpace, mapping: Callable[[Any], Any]
    ) -> LinearOperator:
        """Creates a self-dual operator."""
        return LinearOperator(domain, domain.dual, mapping, dual_mapping=mapping)



[docs]
    @staticmethod
    def self_adjoint(
        domain: HilbertSpace, mapping: Callable[[Any], Any]
    ) -> LinearOperator:
        """Creates a self-adjoint operator."""
        return LinearOperator(domain, domain, mapping, adjoint_mapping=mapping)



[docs]
    @staticmethod
    def from_formal_adjoint(
        domain: HilbertSpace, codomain: HilbertSpace, operator: LinearOperator
    ) -> LinearOperator:
        """
        Constructs an operator on weighted spaces from one on the underlying spaces.

        This is a key method for working with `MassWeightedHilbertSpace`. It takes
        an operator `A` that is defined on the simple, unweighted underlying spaces
        and "lifts" it to be a proper operator on the mass-weighted spaces. It
        correctly defines the new operator's adjoint with respect to the
        weighted inner products.

        This method automatically handles cases where the domain and/or codomain
        are a `HilbertSpaceDirectSum`, recursively building the necessary
        block-structured mass operators.

        Args:
            domain: The (potentially) mass-weighted domain of the new operator.
            codomain: The (potentially) mass-weighted codomain of the new operator.
            operator: The original operator defined on the underlying,
                unweighted spaces.

        Returns:
            A new `LinearOperator` that acts between the mass-weighted spaces.
        """
        from .hilbert_space import MassWeightedHilbertSpace
        from .direct_sum import HilbertSpaceDirectSum, BlockDiagonalLinearOperator

        def get_properties(space: HilbertSpace):
            if isinstance(space, MassWeightedHilbertSpace):
                return (
                    space.underlying_space,
                    space.mass_operator,
                    space.inverse_mass_operator,
                )
            elif isinstance(space, HilbertSpaceDirectSum):
                properties = [get_properties(subspace) for subspace in space.subspaces]
                underlying_space = HilbertSpaceDirectSum(
                    [property[0] for property in properties]
                )
                mass_operator = BlockDiagonalLinearOperator(
                    [property[1] for property in properties]
                )
                inverse_mass_operator = BlockDiagonalLinearOperator(
                    [property[2] for property in properties]
                )
                return (
                    underlying_space,
                    mass_operator,
                    inverse_mass_operator,
                )
            else:
                return space, space.identity_operator(), space.identity_operator()

        domain_base, _, domain_inverse_mass_operator = get_properties(domain)
        codomain_base, codomain_mass_operator, _ = get_properties(codomain)

        if domain_base != operator.domain:
            raise ValueError("Domain mismatch")

        if codomain_base != operator.codomain:
            raise ValueError("Codomain mismatch")

        return LinearOperator(
            domain,
            codomain,
            operator,
            adjoint_mapping=domain_inverse_mass_operator

[docs]
            @ operator.adjoint
            @ codomain_mass_operator,
        )


    @staticmethod
    def from_formally_self_adjoint(
        domain: HilbertSpace, operator: LinearOperator
    ) -> LinearOperator:
        """
        Constructs a self-adjoint operator on a weighted space.

        This method takes an operator that is formally self-adjoint on an
        underlying (unweighted) space and promotes it to a truly self-adjoint
        operator on the `MassWeightedHilbertSpace`. It automatically handles
        `HilbertSpaceDirectSum` domains.

        Args:
            domain (HilbertSpace): The domain of the operator, which can be a
                `MassWeightedHilbertSpace` or a `HilbertSpaceDirectSum`.
            operator (LinearOperator): The operator to be converted.
        """
        return LinearOperator.from_formal_adjoint(domain, domain, operator)



[docs]
    @staticmethod
    def from_linear_forms(forms: List[LinearForm]) -> LinearOperator:
        """
        Creates an operator from a list of linear forms.

        The resulting operator maps from the forms' domain to an N-dimensional
        Euclidean space, where N is the number of forms.
        """
        from .hilbert_space import EuclideanSpace

        domain = forms[0].domain
        codomain = EuclideanSpace(len(forms))
        if not all(form.domain == domain for form in forms):
            raise ValueError("Forms need to be defined on a common domain")

        matrix = np.zeros((codomain.dim, domain.dim))
        for i, form in enumerate(forms):
            matrix[i, :] = form.components

        def mapping(x: Any) -> np.ndarray:
            cx = domain.to_components(x)
            cy = matrix @ cx
            return cy

        def dual_mapping(yp: Any) -> Any:
            cyp = codomain.dual.to_components(yp)
            cxp = matrix.T @ cyp
            return domain.dual.from_components(cxp)

        return LinearOperator(domain, codomain, mapping, dual_mapping=dual_mapping)



[docs]
    @staticmethod
    def from_linear_form(form: "LinearForm") -> "LinearOperator":
        """
        Creates a rank-1 LinearOperator from a single LinearForm.

        The resulting operator maps from the form's domain to a 1-dimensional
        Euclidean space.

        The forward mapping evaluates the form: A(x) = [form(x)].
        The dual mapping scales the form: A'(y') = y'_0 * form.
        The adjoint mapping is handled automatically by the base class.

        Args:
            form: A LinearForm representing a continuous linear functional.

        Returns:
            A LinearOperator mapping from 'form.domain' to EuclideanSpace(1).
        """
        from .hilbert_space import EuclideanSpace

        domain = form.domain
        codomain = EuclideanSpace(1)

        def mapping(x: "Vector") -> np.ndarray:
            # Evaluate the linear form and wrap it in a 1D array
            return np.array([form(x)])

        def dual_mapping(yp: Any) -> "LinearForm":
            # Map the 1D Euclidean dual vector to its scalar component
            scalar = codomain.from_dual(yp)[0]
            # The dual map simply scales the linear form in the dual space
            return domain.dual.multiply(scalar, form)

        return LinearOperator(
            domain,
            codomain,
            mapping,
            dual_mapping=dual_mapping,
        )



[docs]
    @staticmethod
    def from_vectors(domain: HilbertSpace, vectors: List[Vector]) -> "LinearOperator":
        """
        Creates a LinearOperator from a list of domain vectors.

        The resulting operator maps from the given domain to a Euclidean space
        of dimension n (where n is the number of vectors).

        The forward mapping is given by A(x)_i = <vectors[i], x>.
        The adjoint mapping is given by A*(y) = sum(y_i * vectors[i]).

        Args:
            domain: The Hilbert space the vectors belong to.
            vectors: A list of vectors in the domain space.

        Returns:
            A LinearOperator mapping from 'domain' to EuclideanSpace(len(vectors)).

        Raises:
            ValueError: If the list of vectors is empty.
        """
        from .hilbert_space import EuclideanSpace

        n = len(vectors)
        if n == 0:
            raise ValueError("Cannot create an operator from an empty list of vectors.")

        codomain = EuclideanSpace(n)

        def mapping(x: Vector) -> np.ndarray:
            # Evaluate the inner product of x with each vector
            return np.array([domain.inner_product(v, x) for v in vectors])

        def adjoint_mapping(y: np.ndarray) -> Vector:
            # Reconstruct a domain vector as a linear combination
            result = domain.zero
            for i in range(n):
                domain.axpy(y[i], vectors[i], result)
            return result

        return LinearOperator(
            domain,
            codomain,
            mapping,
            adjoint_mapping=adjoint_mapping,
        )



[docs]
    @staticmethod
    def from_vector(domain: HilbertSpace, vector: Vector) -> "LinearOperator":
        """
        Creates a rank-1 LinearOperator from a single domain vector.

        The resulting operator maps from the given domain to a 1-dimensional
        Euclidean space.

        The forward mapping evaluates the inner product: A(x) = [<vector, x>].
        The adjoint mapping scales the vector: A*(y) = y[0] * vector.

        Args:
            domain: The Hilbert space the vector belongs to.
            vector: A single vector in the domain space.

        Returns:
            A LinearOperator mapping from 'domain' to EuclideanSpace(1).
        """
        from .hilbert_space import EuclideanSpace

        codomain = EuclideanSpace(1)

        def mapping(x: Vector) -> np.ndarray:
            # Evaluate the inner product and wrap it in a 1D array
            return np.array([domain.inner_product(vector, x)])

        def adjoint_mapping(y: np.ndarray) -> Vector:
            # y is a 1D Euclidean vector (numpy array of size 1)
            return domain.multiply(y[0], vector)

        return LinearOperator(
            domain,
            codomain,
            mapping,
            adjoint_mapping=adjoint_mapping,
        )



[docs]
    @staticmethod
    def from_matrix(
        domain: HilbertSpace,
        codomain: HilbertSpace,
        matrix: Union[np.ndarray, sp.sparray, ScipyLinOp],
        /,
        *,
        galerkin: bool = False,
    ) -> MatrixLinearOperator:
        """
        Creates the most appropriate LinearOperator from a matrix representation.

        This factory method acts as a dispatcher, inspecting the type of the
        input matrix and returning the most specialized and optimized operator
        subclass (e.g., Dense, Sparse, or DiagonalSparse). It also handles
        matrix-free `scipy.sparse.linalg.LinearOperator` objects.

        Args:
            domain: The operator's domain space.
            codomain: The operator's codomain space.
            matrix: The matrix representation (NumPy ndarray, SciPy sparray,
                    or SciPy LinearOperator).
            galerkin: If `True`, the matrix is interpreted in Galerkin form.

        Returns:
            An instance of the most appropriate MatrixLinearOperator subclass.
        """
        # The order of these checks is important: from most specific to most general.

        # 1. Check for the most specific diagonal-sparse format
        if isinstance(matrix, sp.dia_array):
            diagonals_tuple = (matrix.data, matrix.offsets)
            return DiagonalSparseMatrixLinearOperator(
                domain, codomain, diagonals_tuple, galerkin=galerkin
            )

        # 2. Check for any other modern sparse format
        elif isinstance(matrix, sp.sparray):
            return SparseMatrixLinearOperator(
                domain, codomain, matrix, galerkin=galerkin
            )

        # 3. Check for a dense NumPy array
        elif isinstance(matrix, np.ndarray):
            return DenseMatrixLinearOperator(
                domain, codomain, matrix, galerkin=galerkin
            )

        # 4. Check for a matrix-free SciPy LinearOperator
        elif isinstance(matrix, ScipyLinOp):
            # This is matrix-free, so the general MatrixLinearOperator is the correct wrapper.
            return MatrixLinearOperator(domain, codomain, matrix, galerkin=galerkin)

        # 5. Handle legacy sparse matrix formats (optional but robust)
        elif sp.issparse(matrix):
            modern_array = sp.csr_array(matrix)
            return SparseMatrixLinearOperator(
                domain, codomain, modern_array, galerkin=galerkin
            )

        # 6. Raise an error for unsupported types
        else:
            raise TypeError(f"Unsupported matrix type: {type(matrix)}")



[docs]
    @staticmethod
    def self_adjoint_from_matrix(
        domain: HilbertSpace,
        matrix: Union[np.ndarray, sp.sparray, ScipyLinOp],
    ) -> MatrixLinearOperator:
        """
        Creates the most appropriate self-adjoint LinearOperator from a matrix.

        This factory acts as a dispatcher, returning the most specialized
        subclass for the given matrix type (e.g., Dense, Sparse).

        It ALWAYS assumes the provided matrix is the **Galerkin** representation
        of the operator. The user is responsible for ensuring the input matrix
        is symmetric (or self-adjoint for ScipyLinOp).

        Args:
            domain: The operator's domain and codomain space.
            matrix: The symmetric matrix representation.

        Returns:
            An instance of the most appropriate MatrixLinearOperator subclass.
        """
        # Dispatch to the appropriate subclass, always with galerkin=True
        if isinstance(matrix, sp.dia_array):
            diagonals_tuple = (matrix.data, matrix.offsets)
            return DiagonalSparseMatrixLinearOperator(
                domain, domain, diagonals_tuple, galerkin=True
            )
        elif isinstance(matrix, sp.sparray):
            return SparseMatrixLinearOperator(domain, domain, matrix, galerkin=True)
        elif isinstance(matrix, np.ndarray):
            return DenseMatrixLinearOperator(domain, domain, matrix, galerkin=True)
        elif isinstance(matrix, ScipyLinOp):
            return MatrixLinearOperator(domain, domain, matrix, galerkin=True)
        elif sp.issparse(matrix):
            modern_array = sp.csr_array(matrix)
            return SparseMatrixLinearOperator(
                domain, domain, modern_array, galerkin=True
            )
        else:
            raise TypeError(f"Unsupported matrix type: {type(matrix)}")



[docs]
    @staticmethod
    def from_tensor_product(
        domain: HilbertSpace,
        codomain: HilbertSpace,
        vector_pairs: List[Tuple[Any, Any]],
        /,
        *,
        weights: Optional[List[float]] = None,
    ) -> LinearOperator:
        """
        Creates an operator from a weighted sum of tensor products.

        The operator represents A(x) = sum_i( w_i * <x, v_i> * u_i ),
        where vector_pairs are (u_i, v_i).
        """
        _weights = [1.0] * len(vector_pairs) if weights is None else weights

        def mapping(x: Any) -> Any:
            y = codomain.zero
            for (left, right), weight in zip(vector_pairs, _weights):
                product = domain.inner_product(right, x)
                codomain.axpy(weight * product, left, y)
            return y

        def adjoint_mapping(y: Any) -> Any:
            x = domain.zero
            for (left, right), weight in zip(vector_pairs, _weights):
                product = codomain.inner_product(left, y)
                domain.axpy(weight * product, right, x)
            return x

        return LinearOperator(
            domain, codomain, mapping, adjoint_mapping=adjoint_mapping
        )



[docs]
    @staticmethod
    def self_adjoint_from_tensor_product(
        domain: HilbertSpace,
        vectors: List[Any],
        /,
        *,
        weights: Optional[List[float]] = None,
    ) -> LinearOperator:
        """Creates a self-adjoint operator from a tensor product sum."""
        _weights = [1.0] * len(vectors) if weights is None else weights

        def mapping(x: Any) -> Any:
            y = domain.zero
            for vector, weight in zip(vectors, _weights):
                product = domain.inner_product(vector, x)
                domain.axpy(weight * product, vector, y)
            return y

        return LinearOperator.self_adjoint(domain, mapping)


    @property
    def linear(self) -> bool:
        """True, as this is a LinearOperator."""
        return True

    @property
    def dual(self) -> LinearOperator:
        """The dual of the operator."""
        if self._dual_base is None:
            return LinearOperator(
                self.codomain.dual,
                self.domain.dual,
                self.__dual_mapping,
                dual_base=self,
            )
        else:
            return self._dual_base

    @property
    def adjoint(self) -> LinearOperator:
        """The adjoint of the operator."""
        if self._adjoint_base is None:
            return LinearOperator(
                self.codomain,
                self.domain,
                self.__adjoint_mapping,
                adjoint_base=self,
            )
        else:
            return self._adjoint_base


[docs]
    def matrix(
        self,
        /,
        *,
        dense: bool = False,
        galerkin: bool = False,
        parallel: bool = False,
        n_jobs: int = -1,
    ) -> Union[ScipyLinOp, np.ndarray]:
        """Returns a matrix representation of the operator.

        This provides a concrete matrix that represents the operator's action
        on the underlying component vectors.

        Args:
            dense: If `True`, returns a dense `numpy.ndarray`. If `False`
                (default), returns a memory-efficient, matrix-free
                `scipy.sparse.linalg.LinearOperator`.
            galerkin: If `True`, the returned matrix is the Galerkin
                representation, whose `rmatvec` corresponds to the
                **adjoint** operator. If `False` (default), the `rmatvec`
                corresponds to the **dual** operator. The Galerkin form is
                essential for algorithms that rely on symmetry/self-adjointness.
            parallel: If `True` and `dense=True`, computes the matrix columns
                in parallel.
            n_jobs: Number of parallel jobs to use. `-1` uses all available cores.

        Returns:
            The matrix representation, either dense or matrix-free.
        """

        if dense:
            return self._compute_dense_matrix(galerkin, parallel, n_jobs)
        else:
            if galerkin:

                def matvec(cx: np.ndarray) -> np.ndarray:
                    x = self.domain.from_components(cx)
                    y = self(x)
                    yp = self.codomain.to_dual(y)
                    return self.codomain.dual.to_components(yp)

                def rmatvec(cy: np.ndarray) -> np.ndarray:
                    y = self.codomain.from_components(cy)
                    x = self.adjoint(y)
                    xp = self.domain.to_dual(x)
                    return self.domain.dual.to_components(xp)

            else:

                def matvec(cx: np.ndarray) -> np.ndarray:
                    x = self.domain.from_components(cx)
                    y = self(x)
                    return self.codomain.to_components(y)

                def rmatvec(cyp: np.ndarray) -> np.ndarray:
                    yp = self.codomain.dual.from_components(cyp)
                    xp = self.dual(yp)
                    return self.domain.dual.to_components(xp)

            def matmat(xmat: np.ndarray) -> np.ndarray:
                _n, k = xmat.shape
                assert _n == self.domain.dim

                if not parallel:
                    ymat = np.zeros((self.codomain.dim, k))
                    for j in range(k):
                        ymat[:, j] = matvec(xmat[:, j])
                    return ymat
                else:
                    result_cols = Parallel(n_jobs=n_jobs)(
                        delayed(matvec)(xmat[:, j]) for j in range(k)
                    )
                    return np.column_stack(result_cols)

            def rmatmat(ymat: np.ndarray) -> np.ndarray:
                _m, k = ymat.shape
                assert _m == self.codomain.dim

                if not parallel:
                    xmat = np.zeros((self.domain.dim, k))
                    for j in range(k):
                        xmat[:, j] = rmatvec(ymat[:, j])
                    return xmat
                else:
                    result_cols = Parallel(n_jobs=n_jobs)(
                        delayed(rmatvec)(ymat[:, j]) for j in range(k)
                    )
                    return np.column_stack(result_cols)

            return ScipyLinOp(
                (self.codomain.dim, self.domain.dim),
                matvec=matvec,
                rmatvec=rmatvec,
                matmat=matmat,
                rmatmat=rmatmat,
            )



[docs]
    def extract_diagonal(
        self,
        /,
        *,
        galerkin: bool = False,
        parallel: bool = False,
        n_jobs: int = -1,
    ) -> np.ndarray:
        """
        Computes the main diagonal of the operator's matrix representation.

        This method is highly parallelizable and memory-efficient, as it
        avoids forming the full dense matrix.

        Args:
            galerkin: If True, computes the diagonal of the Galerkin matrix.
            parallel: If True, computes the entries in parallel.
            n_jobs: Number of parallel jobs to use.

        Returns:
            A NumPy array containing the diagonal entries.
        """

        dim = min(self.domain.dim, self.codomain.dim)
        jobs = n_jobs if parallel else 1

        def compute_entry(i: int) -> float:
            """Worker function to compute a single diagonal entry."""
            e_i = self.domain.basis_vector(i)
            L_e_i = self(e_i)

            if galerkin:
                return self.domain.inner_product(e_i, L_e_i)
            else:
                return self.codomain.to_components(L_e_i)[i]

        diagonal_entries = Parallel(n_jobs=jobs)(
            delayed(compute_entry)(i) for i in range(dim)
        )
        return np.array(diagonal_entries)



[docs]
    def extract_diagonals(
        self,
        offsets: List[int],
        /,
        *,
        galerkin: bool = False,
        parallel: bool = False,
        n_jobs: int = -1,
    ) -> Tuple[np.ndarray, List[int]]:
        """
        Computes specified diagonals of the operator's matrix representation.

        This is a memory-efficient and parallelizable method that computes
        the matrix one column at a time.

        Args:
            offsets: A list of diagonal offsets to extract (e.g., [0] for
                the main diagonal, [-1, 0, 1] for a tridiagonal matrix).
            galerkin: If True, computes the diagonals of the Galerkin matrix.
            parallel: If True, computes columns in parallel.
            n_jobs: Number of parallel jobs to use.

        Returns:
            A tuple containing:
            - A NumPy array where each row is a diagonal.
            - The list of offsets.
            This format is compatible with scipy.sparse.spdiags.
        """
        dim = min(self.domain.dim, self.codomain.dim)
        jobs = n_jobs if parallel else 1

        # Prepare a thread-safe dictionary to store results

        results: Dict[int, Dict[int, float]] = defaultdict(dict)

        def compute_column_entries(j: int) -> Dict[int, Dict[int, float]]:
            """
            Worker function to compute all needed entries for column j.
            """
            e_j = self.domain.basis_vector(j)
            L_e_j = self(e_j)

            col_results = defaultdict(dict)

            for k in offsets:
                i = j - k
                if 0 <= i < dim:
                    if galerkin:
                        e_i = self.domain.basis_vector(i)
                        val = self.domain.inner_product(e_i, L_e_j)
                    else:
                        val = self.codomain.to_components(L_e_j)[i]
                    col_results[k][i] = val
            return col_results

        # Run the computation in parallel
        column_data = Parallel(n_jobs=jobs)(
            delayed(compute_column_entries)(j) for j in range(dim)
        )

        # Aggregate results from the parallel computation
        for col_dict in column_data:
            for k, entries in col_dict.items():
                results[k].update(entries)

        # Format the results for spdiags
        # The array must have padding for shorter off-diagonals.
        diagonals_array = np.zeros((len(offsets), dim))
        for idx, k in enumerate(offsets):
            diag_entries = results[k]
            for i, val in diag_entries.items():
                j = i + k
                if 0 <= j < dim:
                    diagonals_array[idx, j] = val

        return diagonals_array, offsets



[docs]
    def with_dense_matrix(
        self,
        /,
        *,
        galerkin: bool = False,
        parallel: bool = False,
        n_jobs: int = -1,
    ) -> DenseMatrixLinearOperator:
        """
        Returns a new operator equivalent to the existing one, but with its
        matrix representation computed and stored internally in dense form.

        Args:
            galerkin: If True, the Galerkin representation is used. Default is False.
            parallel: If True, computes the dense matrix in parallel.
            n_jobs: Number of CPU cores to use. -1 means all available.

        Returns:
            A DenseMatrixLinearOperator instance.
        """

        return DenseMatrixLinearOperator.from_linear_operator(
            self, galerkin=galerkin, parallel=parallel, n_jobs=n_jobs
        )


    def _mapping_impl(self, x: Any) -> Any:
        return self._mapping(x)

    def _derivative_impl(self, _: Any) -> LinearOperator:
        return self

    def _dual_mapping_default(self, yp: Any) -> LinearForm:
        from .linear_forms import LinearForm

        return LinearForm(self.domain, mapping=lambda x: yp(self(x)))

    def _dual_mapping_from_adjoint(self, yp: Any) -> Any:
        y = self.codomain.from_dual(yp)
        x = self.__adjoint_mapping(y)
        return self.domain.to_dual(x)

    def _adjoint_mapping_from_dual(self, y: Any) -> Any:
        yp = self.codomain.to_dual(y)
        xp = self.__dual_mapping(yp)
        return self.domain.from_dual(xp)

    def _compute_dense_matrix(
        self, galerkin: bool, parallel: bool, n_jobs: int
    ) -> np.ndarray:

        if (
            self.codomain.dim < self.domain.dim
            and not self.__using_default_dual_and_adjoint
        ):
            if galerkin:
                return self.adjoint.matrix(
                    dense=True, galerkin=True, parallel=parallel, n_jobs=n_jobs
                ).T
            else:
                return self.dual.matrix(
                    dense=True, galerkin=False, parallel=parallel, n_jobs=n_jobs
                ).T

        scipy_op_wrapper = self.matrix(galerkin=galerkin)

        if not parallel:
            matrix = np.zeros((self.codomain.dim, self.domain.dim))
            cx = np.zeros(self.domain.dim)
            for i in range(self.domain.dim):
                cx[i] = 1.0
                matrix[:, i] = (scipy_op_wrapper @ cx)[:]
                cx[i] = 0.0
            return matrix
        else:
            return parallel_compute_dense_matrix_from_scipy_op(
                scipy_op_wrapper, n_jobs=n_jobs
            )

    def __call__(self, x: Any) -> Any:
        return super().__call__(x)

    def __neg__(self) -> LinearOperator:
        domain = self.domain
        codomain = self.codomain

        def mapping(x: Any) -> Any:
            return codomain.negative(self(x))

        def adjoint_mapping(y: Any) -> Any:
            return domain.negative(self.adjoint(y))

        return LinearOperator(
            domain, codomain, mapping, adjoint_mapping=adjoint_mapping
        )

    def __mul__(self, a: float) -> LinearOperator:
        domain = self.domain
        codomain = self.codomain

        def mapping(x: Any) -> Any:
            return codomain.multiply(a, self(x))

        def adjoint_mapping(y: Any) -> Any:
            return domain.multiply(a, self.adjoint(y))

        return LinearOperator(
            domain, codomain, mapping, adjoint_mapping=adjoint_mapping
        )

    def __rmul__(self, a: float) -> LinearOperator:
        return self * a

    def __truediv__(self, a: float) -> LinearOperator:
        return self * (1.0 / a)

    def __add__(
        self, other: NonLinearOperator | LinearOperator
    ) -> NonLinearOperator | LinearOperator:
        """Returns the sum of this operator and another.

        If `other` is also a `LinearOperator`, this performs an optimized
        addition that preserves linearity and correctly defines the new
        operator's `adjoint`. Otherwise, it delegates to the general
        implementation in the `NonLinearOperator` base class.

        Args:
            other: The operator to add to this one.

        Returns:
            A new `LinearOperator` if adding two linear operators, otherwise
            a `NonLinearOperator`.
        """

        if type(other).__name__ == "AffineOperator":
            return NotImplemented

        if isinstance(other, LinearOperator):
            domain = self.domain
            codomain = self.codomain

            def mapping(x: Any) -> Any:
                return codomain.add(self(x), other(x))

            def adjoint_mapping(y: Any) -> Any:
                return domain.add(self.adjoint(y), other.adjoint(y))

            return LinearOperator(
                domain, codomain, mapping, adjoint_mapping=adjoint_mapping
            )
        else:
            return super().__add__(other)

    def __sub__(
        self, other: NonLinearOperator | LinearOperator
    ) -> NonLinearOperator | LinearOperator:
        """Returns the difference between this operator and another.

        If `other` is also a `LinearOperator`, this performs an optimized
        subtraction that preserves linearity and correctly defines the new
        operator's `adjoint`. Otherwise, it delegates to the general
        implementation in the `NonLinearOperator` base class.

        Args:
            other: The operator to subtract from this one.

        Returns:
            A new `LinearOperator` if subtracting two linear operators,
            otherwise a `NonLinearOperator`.
        """

        # Yield to AffineOperator to preserve structure
        if type(other).__name__ == "AffineOperator":
            return NotImplemented

        if isinstance(other, LinearOperator):
            domain = self.domain
            codomain = self.codomain

            def mapping(x: Any) -> Any:
                return codomain.subtract(self(x), other(x))

            def adjoint_mapping(y: Any) -> Any:
                return domain.subtract(self.adjoint(y), other.adjoint(y))

            return LinearOperator(
                domain, codomain, mapping, adjoint_mapping=adjoint_mapping
            )
        else:
            return super().__sub__(other)

    def __matmul__(
        self, other: NonLinearOperator | LinearOperator
    ) -> NonLinearOperator | LinearOperator:
        """Composes this operator with another using the @ symbol.

        The composition `(self @ other)` results in a new operator that
        first applies `other` and then applies `self`, i.e.,
        `(self @ other)(x) = self(other(x))`.

        If `other` is also a `LinearOperator`, this creates a new `LinearOperator`
        whose adjoint is correctly defined using the composition rule:
        `(L1 @ L2)* = L2* @ L1*`. Otherwise, it delegates to the general
        `NonLinearOperator` implementation.

        Args:
            other: The operator to compose with (the right-hand operator).

        Returns:
            A new `LinearOperator` if composing two linear operators,
            otherwise a `NonLinearOperator`.
        """

        # Yield to AffineOperator to preserve structure
        if type(other).__name__ == "AffineOperator":
            return NotImplemented

        if isinstance(other, LinearOperator):
            domain = other.domain
            codomain = self.codomain

            def mapping(x: Any) -> Any:
                return self(other(x))

            def adjoint_mapping(y: Any) -> Any:
                return other.adjoint(self.adjoint(y))

            return LinearOperator(
                domain, codomain, mapping, adjoint_mapping=adjoint_mapping
            )

        else:
            return super().__matmul__(other)

    def __str__(self) -> str:
        return self.matrix(dense=True).__str__()




[docs]
class MatrixLinearOperator(LinearOperator):
    """
    A sub-class of LinearOperator for which the operator's action is
    defined internally through its matrix representation.

    This matrix can be either a dense numpy matrix or a
    scipy LinearOperator.
    """

    def __init__(
        self,
        domain: HilbertSpace,
        codomain: HilbertSpace,
        matrix: Union[np.ndarray, ScipyLinOp],
        /,
        *,
        galerkin=False,
    ):
        """
        Args:
            domain: The domain of the operator.
            codomain: The codomain of the operator.
            matrix: matrix representation of the linear operator in either standard
                 or Galerkin form.
            galerkin: If True, galerkin representation used. Default is false.
        """
        assert matrix.shape == (codomain.dim, domain.dim)

        self._matrix = matrix
        self._is_dense = isinstance(matrix, np.ndarray)
        self._galerkin = galerkin

        if galerkin:
            super().__init__(
                domain,
                codomain,
                self._mapping_galerkin,
                adjoint_mapping=self._adjoint_mapping_galerkin,
            )
        else:
            super().__init__(
                domain,
                codomain,
                self._mapping_standard,
                dual_mapping=self._dual_mapping_standard,
            )

    def _mapping_galerkin(self, x: Any) -> Any:
        cx = self.domain.to_components(x)
        cyp = self._matrix @ cx
        yp = self.codomain.dual.from_components(cyp)
        return self.codomain.from_dual(yp)

    def _adjoint_mapping_galerkin(self, y: Any) -> Any:
        cy = self.codomain.to_components(y)
        cxp = self._matrix.T @ cy
        xp = self.domain.dual.from_components(cxp)
        return self.domain.from_dual(xp)

    def _mapping_standard(self, x: Any) -> Any:
        cx = self.domain.to_components(x)
        cy = self._matrix @ cx
        return self.codomain.from_components(cy)

    def _dual_mapping_standard(self, yp: Any) -> Any:
        cyp = self.codomain.dual.to_components(yp)
        cxp = self._matrix.T @ cyp
        return self.domain.dual.from_components(cxp)

    @property
    def is_dense(self) -> bool:
        """
        Returns True if the matrix representation is stored internally in dense form.
        """
        return self._is_dense

    @property
    def is_galerkin(self) -> bool:
        """
        Returns True if the matrix representation is stored in Galerkin form.
        """
        return self._galerkin

    def _compute_dense_matrix(
        self, galerkin: bool, parallel: bool, n_jobs: int
    ) -> np.ndarray:
        """
        Overloaded method to efficiently compute the dense matrix.
        """

        if galerkin == self.is_galerkin and self.is_dense:
            return self._matrix
        else:
            return super()._compute_dense_matrix(galerkin, parallel, n_jobs)


[docs]
    def extract_diagonal(
        self,
        /,
        *,
        galerkin: bool = False,
        parallel: bool = False,
        n_jobs: int = -1,
    ) -> np.ndarray:
        """
        Overload for efficiency.
        """

        if galerkin == self.is_galerkin and self.is_dense:
            return self._matrix.diagonal()
        else:
            return super().extract_diagonal(
                galerkin=galerkin, parallel=parallel, n_jobs=n_jobs
            )



[docs]
    def extract_diagonals(
        self,
        offsets: List[int],
        /,
        *,
        galerkin: bool = False,
        parallel: bool = False,
        n_jobs: int = -1,
    ) -> Tuple[np.ndarray, List[int]]:
        """
        Overrides the base method for efficiency by extracting diagonals directly
        from the stored dense matrix when possible.
        """

        if self.is_dense and galerkin == self.is_galerkin:
            dim = self.domain.dim

            diagonals_array = np.zeros((len(offsets), dim))

            for i, k in enumerate(offsets):
                diag_k = np.diag(self._matrix, k=k)

                if k >= 0:
                    diagonals_array[i, k : k + len(diag_k)] = diag_k
                else:
                    diagonals_array[i, : len(diag_k)] = diag_k

            return diagonals_array, offsets

        else:
            return super().extract_diagonals(
                offsets, galerkin=galerkin, parallel=parallel, n_jobs=n_jobs
            )





[docs]
class DenseMatrixLinearOperator(MatrixLinearOperator):
    """
    A specialisation of the MatrixLinearOperator class to instances where
    the matrix representation is always provided as a numpy array.

    This is a class provides some additional methods for component-wise access.
    """

    def __init__(
        self,
        domain: HilbertSpace,
        codomain: HilbertSpace,
        matrix: np.ndarray,
        /,
        *,
        galerkin=False,
    ):
        """
        domain: The domain of the operator.
            codomain: The codomain of the operator.
            matrix: matrix representation of the linear operator in either standard
                 or Galerkin form.
            galerkin: If True, galerkin representation used. Default is false.
        """

        if not isinstance(matrix, np.ndarray):
            raise ValueError("Matrix must be input in dense form.")

        super().__init__(domain, codomain, matrix, galerkin=galerkin)


[docs]
    @staticmethod
    def from_linear_operator(
        operator: LinearOperator,
        /,
        *,
        galerkin: bool = False,
        parallel: bool = False,
        n_jobs: int = -1,
    ) -> DenseMatrixLinearOperator:
        """
        Converts a LinearOperator into a DenseMatrixLinearOperator by forming its dense matrix representation.

        Args:
            operator: The operator to be converted.
            galerkin: If True, the Galerkin representation is used. Default is False.
            parallel: If True, dense matrix calculation is done in parallel. Default is False.
            n_jobs: Number of jobs used for parallel calculations. Default is False.
        """

        if isinstance(operator, DenseMatrixLinearOperator):
            return operator

        domain = operator.domain
        codomain = operator.codomain

        matrix = operator.matrix(
            dense=True, galerkin=galerkin, parallel=parallel, n_jobs=n_jobs
        )

        return DenseMatrixLinearOperator(domain, codomain, matrix, galerkin=galerkin)





[docs]
class SparseMatrixLinearOperator(MatrixLinearOperator):
    """
    A specialization for operators represented by a modern SciPy sparse array.

    This class requires a `scipy.sparse.sparray` object (e.g., csr_array)
    and provides optimized methods that delegate to efficient SciPy routines.

    Upon initialization, the internal array is converted to the CSR
    (Compressed Sparse Row) format to ensure consistently fast matrix-vector
    products and row-slicing operations.
    """

    def __init__(
        self,
        domain: HilbertSpace,
        codomain: HilbertSpace,
        matrix: sp.sparray,
        /,
        *,
        galerkin: bool = False,
    ):
        """
        Args:
            domain: The domain of the operator.
            codomain: The codomain of the operator.
            matrix: The sparse array representation of the linear operator.
                    Must be a modern sparray object (e.g., csr_array).
            galerkin: If True, the matrix is in Galerkin form. Defaults to False.
        """
        # Strict check for the modern sparse array type
        if not isinstance(matrix, sp.sparray):
            raise TypeError(
                "Matrix must be a modern SciPy sparray object (e.g., csr_array)."
            )

        super().__init__(domain, codomain, matrix, galerkin=galerkin)
        self._matrix = self._matrix.asformat("csr")

    @property
    def sparse_array(self) -> sp.sparray:
        """
        Provides public read-only access to the underlying SciPy sparse array.
        """
        return self._matrix

    def _compute_dense_matrix(
        self, galerkin: bool, parallel: bool, n_jobs: int
    ) -> np.ndarray:
        """
        Overrides the base method to efficiently compute the dense matrix.
        """

        if galerkin == self.is_galerkin:
            return self._matrix.toarray()
        else:
            return super()._compute_dense_matrix(galerkin, parallel, n_jobs)


[docs]
    def extract_diagonal(
        self,
        /,
        *,
        galerkin: bool = False,
        parallel: bool = False,
        n_jobs: int = -1,
    ) -> np.ndarray:
        """
        Overrides the base method to efficiently extract the main diagonal.
        """
        if galerkin == self.is_galerkin:
            return self._matrix.diagonal(k=0)
        else:
            return super().extract_diagonal(
                galerkin=galerkin, parallel=parallel, n_jobs=n_jobs
            )



[docs]
    def extract_diagonals(
        self,
        offsets: List[int],
        /,
        *,
        galerkin: bool = False,
        parallel: bool = False,
        n_jobs: int = -1,
    ) -> Tuple[np.ndarray, List[int]]:
        """
        Overrides the base method for efficiency by extracting diagonals
        directly from the stored sparse array.
        """
        if galerkin != self.is_galerkin:
            return super().extract_diagonals(
                offsets, galerkin=galerkin, parallel=parallel, n_jobs=n_jobs
            )

        dim = self.domain.dim
        diagonals_array = np.zeros((len(offsets), dim))

        for i, k in enumerate(offsets):
            # Use the sparse array's fast .diagonal() method
            diag_k = self._matrix.diagonal(k=k)

            # Place the raw diagonal into the padded output array
            if k >= 0:
                diagonals_array[i, k : k + len(diag_k)] = diag_k
            else:
                diagonals_array[i, : len(diag_k)] = diag_k

        return diagonals_array, offsets





[docs]
class DiagonalSparseMatrixLinearOperator(MatrixLinearOperator):
    """
    A highly specialized operator for matrices defined purely by a set of
    non-zero diagonals.

    This class internally stores the operator using a `scipy.sparse.dia_array`
    for maximum efficiency in storage and matrix-vector products. It provides
    extremely fast methods for extracting diagonals, as this is its native
    storage format.

    Class Methods
    -------------
    from_diagonal_values:
        Constructs a strictly diagonal operator from a 1D array of values.
    from_operator:
        Creates a diagonal approximation of another LinearOperator.

    Properties
    ----------
    offsets:
        The array of stored diagonal offsets.
    is_strictly_diagonal:
        True if the operator only has a non-zero main diagonal.
    inverse:
        The inverse of a strictly diagonal operator.
    sqrt:
        The square root of a strictly diagonal operator.
    """

    def __init__(
        self,
        domain: HilbertSpace,
        codomain: HilbertSpace,
        diagonals: Tuple[np.ndarray, List[int]],
        /,
        *,
        galerkin: bool = False,
    ):
        """
        Args:
            domain: The domain of the operator.
            codomain: The codomain of the operator.
            diagonals: A tuple `(data, offsets)` where `data` is a 2D array
                       of diagonal values and `offsets` is a list of their
                       positions. This is the native format for a dia_array.
            galerkin: If True, the matrix is in Galerkin form. Defaults to False.
        """
        shape = (codomain.dim, domain.dim)
        dia_array = sp.dia_array(diagonals, shape=shape)

        super().__init__(domain, codomain, dia_array, galerkin=galerkin)


[docs]
    @classmethod
    def from_operator(
        cls, operator: LinearOperator, offsets: List[int], /, *, galerkin: bool = True
    ) -> DiagonalSparseMatrixLinearOperator:
        """
        Creates a diagonal approximation of another LinearOperator.

        This factory method works by calling the source operator's
        `.extract_diagonals()` method and using the result to construct a
        new, highly efficient DiagonalSparseMatrixLinearOperator.

        Args:
            operator: The source operator to approximate.
            offsets: The list of diagonal offsets to extract and keep.
            galerkin: Specifies which matrix representation to use.

        Returns:
            A new DiagonalSparseMatrixLinearOperator.
        """
        diagonals_data, extracted_offsets = operator.extract_diagonals(
            offsets, galerkin=galerkin
        )
        return cls(
            operator.domain,
            operator.codomain,
            (diagonals_data, extracted_offsets),
            galerkin=galerkin,
        )



[docs]
    @classmethod
    def from_diagonal_values(
        cls,
        domain: HilbertSpace,
        codomain: HilbertSpace,
        diagonal_values: np.ndarray,
        /,
        *,
        galerkin: bool = False,
    ) -> "DiagonalSparseMatrixLinearOperator":
        """
        Constructs a purely diagonal operator from a 1D array of values.

        This provides a convenient way to create an operator with non-zero
        entries only on its main diagonal (offset k=0).

        Args:
            domain: The domain of the operator.
            codomain: The codomain of the operator. Must have the same dimension.
            diagonal_values: A 1D NumPy array of the values for the main diagonal.
            galerkin: If True, the operator is in Galerkin form.

        Returns:
            A new DiagonalSparseMatrixLinearOperator.
        """
        if domain.dim != codomain.dim or domain.dim != len(diagonal_values):
            raise ValueError(
                "Domain, codomain, and diagonal_values must all have the same dimension."
            )

        diagonals_data = diagonal_values.reshape(1, -1)
        offsets = [0]

        return cls(domain, codomain, (diagonals_data, offsets), galerkin=galerkin)


    @property
    def offsets(self) -> np.ndarray:
        """Returns the array of stored diagonal offsets."""
        return self._matrix.offsets

    @property
    def is_strictly_diagonal(self) -> bool:
        """
        True if the operator only has a non-zero main diagonal (offset=0).
        """
        return len(self.offsets) == 1 and self.offsets[0] == 0


[docs]
    def extract_diagonal(
        self,
        /,
        *,
        galerkin: bool = False,
        parallel: bool = False,
        n_jobs: int = -1,
    ) -> np.ndarray:
        """
        Overrides the base method to efficiently extract the main diagonal.
        """
        if galerkin == self.is_galerkin:
            return self._matrix.diagonal(k=0)
        else:
            return super().extract_diagonal(
                galerkin=galerkin, parallel=parallel, n_jobs=n_jobs
            )



[docs]
    def extract_diagonals(
        self,
        offsets: List[int],
        /,
        *,
        galerkin: bool = False,
        parallel: bool = False,
        n_jobs: int = -1,
    ) -> Tuple[np.ndarray, List[int]]:
        """
        Overrides the base method for extreme efficiency.

        This operation is nearly free, as it involves selecting the requested
        diagonals from the data already stored in the native format.
        """
        if galerkin != self.is_galerkin:
            return super().extract_diagonals(offsets, galerkin=galerkin)

        result_diagonals = np.zeros((len(offsets), self.domain.dim))
        stored_diagonals = dict(zip(self.offsets, self._matrix.data))

        for i, k in enumerate(offsets):
            if k in stored_diagonals:
                result_diagonals[i, :] = stored_diagonals[k]

        return result_diagonals, offsets


    def _compute_dense_matrix(
        self, galerkin: bool, parallel: bool, n_jobs: int
    ) -> np.ndarray:
        """
        Overrides the base method to efficiently compute the dense matrix.
        """
        if galerkin == self.is_galerkin:
            return self._matrix.toarray()
        else:
            return super()._compute_dense_matrix(galerkin, parallel, n_jobs)