Source code for spacecore.linalg._power

from __future__ import annotations

from collections.abc import Callable
from typing import Any, NamedTuple, cast

from ..backend import Context
from ..functional import QuadraticForm
from ..linop import LinOp
from ..space import Space
from ._utils import DEFAULT_CONVERGENCE_CHECK_INTERVAL, SpaceCoreOps, check_interval
from ._utils import check_maxiter, core_normalize, default_initial_vector, is_converged
from ._utils import require_linop, require_square, resolve_apply, result_repr



[docs]
class PowerIterationResult(NamedTuple):
    """
    Store the result returned by :func:`power_iteration`.

    Parameters
    ----------
    eigenvalue : scalar
        Rayleigh-quotient estimate of the dominant eigenvalue.
    eigenvector : array-like
        Normalized eigenvector estimate in the operator domain.
    converged : bool-like
        Whether the residual norm satisfied ``tol``.
    num_iters : int-like
        Number of power iterations executed.
    residual_norm : scalar
        Norm of ``A x - eigenvalue * x``.
    """

    eigenvalue: Any
    eigenvector: Any
    converged: Any
    num_iters: Any
    residual_norm: Any

    def __repr__(self) -> str:
        """Return a compact summary without printing the full eigenvector."""
        return result_repr(
            "PowerIterationResult",
            {
                "converged": self.converged,
                "num_iters": self.num_iters,
                "eigenvalue": self.eigenvalue,
                "residual_norm": self.residual_norm,
                "eigenvector": self.eigenvector,
            },
        )



class _SelfAdjointAction(NamedTuple):
    """Store the callable action used by power iteration."""

    apply: Callable[[Any], Any]
    domain: Space
    ctx: Context
    rayleigh: Callable[[Any, Any], Any]
    residual_norm: Callable[[Any, Any, Any], Any]

    @property
    def ops(self) -> Any:
        """Backend operations for this action."""
        return self.ctx.ops

    @property
    def dtype(self) -> Any:
        """Default dtype for this action."""
        return self.ctx.dtype


def _action_from_linop(A: LinOp) -> _SelfAdjointAction:
    """Normalize a square linear operator into a self-adjoint action."""
    A = require_linop(A)
    require_square(A, "power_iteration")
    if A.is_hermitian() is False:
        raise ValueError("power_iteration requires A to be Hermitian/self-adjoint.")
    apply = resolve_apply(A)
    sops = SpaceCoreOps(A.domain)
    return _SelfAdjointAction(
        apply,
        A.domain,
        A.ctx,
        lambda x, y: A.ops.real(sops.inner(x, y)),
        lambda x, y, eigenvalue: sops.norm(sops.axpy(-eigenvalue, x, y)),
    )


def _action_from_quadratic_form(q: QuadraticForm) -> _SelfAdjointAction:
    """Normalize a quadratic form into its Hessian action."""
    sops = SpaceCoreOps(q.domain)
    hess_quad = getattr(q, "hess_quad", None)
    if callable(hess_quad):

        def rayleigh(x, y):
            return q.ops.real(cast(Any, hess_quad)(x, Hx=y))
    else:

        def rayleigh(x, y):
            return q.ops.real(sops.inner(x, y))

    hess_residual_norm = getattr(q, "hess_residual_norm", None)
    if callable(hess_residual_norm):
        residual_norm = hess_residual_norm
    else:

        def residual_norm(x, y, eigenvalue):
            return sops.norm(sops.axpy(-eigenvalue, x, y))

    return _SelfAdjointAction(q.hess_apply, q.domain, q.ctx, rayleigh, residual_norm)



[docs]
def power_iteration(
    A: LinOp | QuadraticForm,
    *,
    x0: Any | None = None,
    tol: float = 1e-6,
    maxiter: int | None = None,
    check_every: int = DEFAULT_CONVERGENCE_CHECK_INTERVAL,
) -> PowerIterationResult:
    r"""
    Estimate the dominant eigenpair of a self-adjoint action.

    Accept a square :class:`LinOp` or a :class:`QuadraticForm` exposing
    ``hess_apply``. Public dispatch converts either input into a fixed
    self-adjoint action before entering the numerical loop. Power iteration
    still requires ``hess_apply`` for quadratic forms because the vector update
    is ``x_next = normalize(H x)``. Optional two-sided scalar diagnostics such
    as ``hess_quad(x, Hx=None)`` can improve Rayleigh quotient evaluation, but
    they cannot replace the Hessian-vector action. "Dominant" means largest
    eigenvalue in absolute value, not necessarily the largest positive
    eigenvalue.

    Parameters
    ----------
    A : LinOp or QuadraticForm
        Square operator or quadratic form whose dominant eigenpair, largest in
        absolute value, is sought. Linear-operator inputs must satisfy
        ``A.domain == A.codomain``; this includes the underlying space type and
        inner-product geometry.
        Quadratic-form inputs must provide ``hess_apply``. If they also expose
        ``hess_quad(x, Hx=None)``, it is used for the Rayleigh quotient and
        must be compatible with being called as ``hess_quad(x, Hx=Hx)``. The
        ``Hx`` argument is the cached Hessian-vector product already computed
        by power iteration. If the quadratic form exposes
        ``hess_residual_norm(x, Hx, eigenvalue)``, it is used for the residual
        diagnostic. Otherwise generic space inner-product and norm diagnostics
        are used.
        For spectral-norm estimates of a rectangular operator, pass
        ``A.H @ A``.
    x0 : array-like or None, optional
        Initial vector in the action domain. Default is a normalized all-ones
        vector in the domain geometry.
    tol : float, optional
        Residual-norm tolerance. ``result.converged`` is ``True`` when
        ``norm(A @ x - lambda * x) < tol``. Default is 1e-6.
    maxiter : int or None, optional
        Maximum number of iterations. Default is ``prod(A.domain.shape)``.
    check_every : int, optional
        Accepted for backward compatibility. Residual diagnostics are now
        refreshed every iteration because the loop already carries ``A @ x``;
        this argument is ignored and may be removed in a future release.

    Returns
    -------
    PowerIterationResult
        Named tuple with fields:

        - ``eigenvalue``: Rayleigh-quotient eigenvalue estimate
        - ``eigenvector``: normalized eigenvector estimate
        - ``converged``: whether ``residual_norm < tol``
        - ``num_iters``: number of iterations executed
        - ``residual_norm``: norm of ``A x - eigenvalue * x``

    Raises
    ------
    TypeError
        If ``A`` is neither a :class:`LinOp` nor a :class:`QuadraticForm`.
    ValueError
        If a linear-operator input is not square, is known to be non-Hermitian,
        or if iteration parameters are invalid.

    See Also
    --------
    lanczos_smallest : Approximate the smallest eigenpair of a Hermitian
        operator.
    cg : Solve Hermitian positive-definite systems.

    Notes
    -----
    The residual-based stopping criterion uses
    :math:`\|A x - \lambda x\|` and is refreshed every iteration. The
    ``check_every`` argument is accepted for backward compatibility but is no
    longer used. This function is JIT-compatible on the JAX backend when
    ``maxiter`` is static.

    Inner products and norms use ``domain.inner`` and ``domain.norm`` through
    the normalized self-adjoint action. The method is correct on
    non-Euclidean geometries when the space supplies Riesz maps and the action
    is self-adjoint in that geometry.

    For operators with eigenvalues of mixed sign, the dominant eigenvalue is
    the one with largest absolute value, which may be negative. Convergence
    requires that this eigenvalue be separated from the rest in absolute value.
    If the dominant modulus is degenerate, for example both ``lambda`` and
    ``-lambda`` have maximum modulus, the iteration may oscillate between
    subspaces.

    For most dense vector-space problems, the generic Rayleigh quotient
    ``real(inner(x, Hx))`` is already cheap. Specialized quadratic-form scalar
    diagnostics are mainly useful when a subclass can evaluate ``<x, Hx>`` or
    the residual norm more accurately or with less overhead than reconstructing
    the scalar from generic space operations. A specialized ``hess_quad`` must
    accept the cached Hessian-vector product as ``hess_quad(x, Hx=Hx)``;
    implementations may ignore ``Hx`` or use it to avoid recomputation.

    Examples
    --------
    Estimate the largest eigenvalue of a diagonal operator.

    >>> import numpy as np
    >>> import spacecore as sc
    >>> ctx = sc.Context(sc.NumpyOps(), dtype=np.float64)
    >>> X = sc.DenseCoordinateSpace((3,), ctx)
    >>> A = sc.DiagonalLinOp(ctx.asarray([1.0, 3.0, 2.0]), X, ctx)
    >>> result = sc.power_iteration(A, maxiter=20, tol=1e-10)
    >>> np.allclose(result.eigenvalue, 3.0)
    True
    """
    if isinstance(A, QuadraticForm):
        action = _action_from_quadratic_form(A)
    elif isinstance(A, LinOp):
        action = _action_from_linop(A)
    else:
        raise TypeError(f"A must be a LinOp or QuadraticForm, got {type(A).__name__}.")

    maxiter = check_maxiter(maxiter, cast(Any, action))
    check_interval(check_every)

    x = default_initial_vector(cast(Any, action)) if x0 is None else x0
    action.domain.check_member(x)
    return PowerIterationResult(*_power_iteration_core(action, x, tol, maxiter))



def _power_iteration_core(
    action: _SelfAdjointAction,
    x: Any,
    tol: float,
    maxiter: int,
) -> tuple[Any, Any, Any, Any, Any]:
    """Run the backend-loop implementation of power iteration."""
    sops = SpaceCoreOps(action.domain)
    x, _ = core_normalize(sops, x)
    y = action.apply(x)
    zero = action.ops.asarray(0.0, dtype=action.dtype)
    residual_norm = sops.norm(x) + float("inf")

    # Carry: current eigenvalue estimate, normalized vector x, product y=A x,
    # residual norm, and iteration counter.
    def cond_fun(carry: tuple[Any, Any, Any, Any, int]) -> Any:
        _eigenvalue, _x, _y, res_norm, k = carry
        return (k < maxiter) & (res_norm > tol)

    def body_fun(carry: tuple[Any, Any, Any, Any, int]) -> tuple[Any, Any, Any, Any, int]:
        _eigenvalue, _x, y, _residual_norm, k = carry
        x_next, _norm_y = core_normalize(sops, y)
        y_next = action.apply(x_next)
        eigenvalue_next = action.rayleigh(x_next, y_next)
        k_next = k + 1

        residual_norm_next = action.residual_norm(x_next, y_next, eigenvalue_next)
        return eigenvalue_next, x_next, y_next, residual_norm_next, k_next

    eigenvalue, eigenvector, _y, residual_norm, num_iters = action.ops.while_loop(
        cond_fun,
        body_fun,
        (zero, x, y, residual_norm, 0),
    )
    return (
        eigenvalue,
        eigenvector,
        is_converged(residual_norm, tol),
        num_iters,
        residual_norm,
    )