Source code for low_rank_toolbox.randomized.randomized_svd

"""Randomized SVD algorithms for low-rank matrix approximation.

Author: Benjamin Carrel, University of Geneva, 2024
"""

from typing import Optional

import numpy as np
from scipy.sparse.linalg import LinearOperator

from ..matrices.low_rank_matrix import LowRankMatrix
from ..matrices.svd import SVD
from .rangefinder import adaptive_rangefinder, rangefinder



[docs]
def randomized_svd(
    X: LinearOperator,
    r: int,
    p: int = 10,
    q: int = 0,
    truncate: bool = True,
    seed: int = 1234,
    **extra_data,
) -> SVD:
    """
    Randomized SVD algorithm.

    Reference:
        "Finding structure with randomness: Probabilistic algorithms for constructing approximate matrix decompositions",
        Halko, Martinsson and Tropp 2010.

    The randomized SVD computes an approximate SVD of a matrix X with the following steps:
    1. Estimate the range with Q = rangefinder(X, r, p, q, seed)
    2. Form the smaller matrix C = Q^H X
    3. Compute the SVD of C: C = U_C S V^H
    4. Form the approximate SVD of X: X_approx = Q U_C S V^H


    Parameters
    ----------
    X : SVD | LowRankMatrix | ndarray | LinearOperator
        Matrix or operator to be decomposed
    r : int
        Rank of the decomposition, must be positive
    p : int, optional
        Oversampling parameter (default: 10)
    q : int, optional
        Number of power iterations (default: 0)
    truncate : bool, optional
        If True, truncate the SVD to rank r (default: True)
    seed : int, optional
        Random seed for reproducibility (default: 1234)
    **extra_data : dict
        Additional arguments passed to SVD constructor. If 'Omega' is provided, use it as the sketching matrix.

    Returns
    -------
    SVD
        Near-optimal best rank r approximation of X
    """
    # Input validation
    if r < 1:
        raise ValueError(f"Rank must be at least 1, got r={r}.")
    if p < 0:
        raise ValueError(f"Oversampling parameter must be non-negative, got p={p}.")
    if q < 0:
        raise ValueError(f"Number of power iterations must be non-negative, got q={q}.")
    if r + p > min(X.shape):
        raise ValueError(
            f"Rank + oversampling ({r + p}) exceeds minimum matrix dimension ({min(X.shape)})."
        )

    _, n = X.shape
    # Draw or extract the random matrix Omega
    if "Omega" in extra_data:
        Omega = extra_data["Omega"]
    else:
        np.random.seed(seed)
        Omega = np.random.randn(n, r + p)

    # Step 1: find the range of X
    Q = rangefinder(X, r, p, q, seed, Omega=Omega)

    # Step 2: Form smaller matrix C = Q^H @ X
    if isinstance(X, LowRankMatrix):
        C = X.dot(Q.T.conj(), side="left", dense_output=True)
    else:
        C = Q.T.conj().dot(X)

    # Step 3: Compute SVD of C using numpy
    U_C, s_C, Vh_C = np.linalg.svd(C, full_matrices=False)

    # Step 4: Truncate if requested
    if truncate and r < len(s_C):
        U_C = U_C[:, :r]
        s_C = s_C[:r]
        Vh_C = Vh_C[:r, :]

    # Step 5: Form final U = Q @ U_C
    U_final = Q.dot(U_C)
    V_final = Vh_C.T.conj()

    return SVD(U_final, s_C, V_final, **extra_data)




[docs]
def adaptive_randomized_svd(
    X: LinearOperator,
    tol: float = 1e-6,
    failure_prob: float = 1e-6,
    max_rank: Optional[int] = None,
    seed: int = 1234,
    **extra_data,
) -> SVD:
    """
    Adaptive randomized SVD algorithm.

    Reference:
        "Finding structure with randomness: Probabilistic algorithms for constructing approximate matrix decompositions",
        Halko, Martinsson and Tropp 2010.

    The adaptive randomized SVD computes an approximate SVD of a matrix X with the following steps:
    1. Estimate the range with Q = adaptive_rangefinder(X, tol, failure_prob, seed)
    2. Form the smaller matrix C = Q^H X
    3. Compute the SVD of C: C = U_C S V^H
    4. Form the approximate SVD of X: X_approx = Q U_C S V^H


    Parameters
    ----------
    X : SVD | LowRankMatrix | ndarray | LinearOperator
        Matrix or operator to be decomposed
    tol : float, optional
        Target approximation error (default: 1e-6)
    failure_prob : float, optional
        Failure probability for the approximation error, must be in (0, 1) (default: 1e-6)
    max_rank : int, optional
        Maximum rank for the approximation (default: None, no limit)
    seed : int, optional
        Random seed for reproducibility (default: 1234)
    **extra_data : dict
        Additional arguments passed to SVD constructor

    Returns
    -------
    SVD
        Near-optimal approximation of X with ||X - X_approx||_F <= tol with probability >= 1 - failure_prob
    """
    # Input validation
    if tol <= 0:
        raise ValueError(f"Tolerance must be positive, got tol={tol}.")
    if not (0 < failure_prob < 1):
        raise ValueError(
            f"Failure probability must be in (0, 1), got failure_prob={failure_prob}."
        )
    if max_rank is not None and max_rank < 1:
        raise ValueError(f"Maximum rank must be at least 1, got max_rank={max_rank}.")

    # Step 1: find the range of X adaptively
    Q = adaptive_rangefinder(X, tol, failure_prob, seed)
    if max_rank is not None:
        Q = Q[:, :max_rank]

    # Step 2: Form smaller matrix C = Q^H @ X
    if isinstance(X, LowRankMatrix):
        C = X.dot(Q.T.conj(), side="left", dense_output=True)
    else:
        C = Q.T.conj().dot(X)

    # Step 3: Compute SVD of C using numpy
    U_C, s_C, Vh_C = np.linalg.svd(C, full_matrices=False)

    # Step 4: Form final U = Q @ U_C
    U_final = Q.dot(U_C)
    V_final = Vh_C.T.conj()

    return SVD(U_final, s_C, V_final, **extra_data)