Source code for qvartools.krylov.basis.skqd

"""
skqd --- Classical Krylov subspace diagonalization
===================================================

Implements a classical Krylov subspace diagonalization algorithm that
constructs Krylov states via exact matrix exponentiation, samples
computational-basis configurations from each Krylov vector, and solves a
projected generalized eigenvalue problem in the sampled basis.

.. note::

   This module performs **classical** linear algebra (no quantum circuits).
   For the real SKQD algorithm using CUDA-Q Trotterized circuits, see
   :mod:`qvartools.krylov.circuits.circuit_skqd`.

Classes
-------
SKQDConfig
    Dataclass holding all hyperparameters for the algorithm.
ClassicalKrylovDiagonalization
    Core solver that builds and diagonalises the projected Hamiltonian.

References
----------
.. [1] Robledo-Moreno et al., "Chemistry beyond exact solutions on a
       quantum-centric supercomputer", arXiv:2405.05068 (2024).
"""

from __future__ import annotations

import logging
from dataclasses import dataclass
from itertools import combinations
from typing import Any

import numpy as np
import torch
from scipy.linalg import eigh as scipy_eigh
from scipy.sparse.linalg import expm_multiply

from qvartools.hamiltonians.hamiltonian import Hamiltonian

__all__ = [
    "SKQDConfig",
    "ClassicalKrylovDiagonalization",
    # Deprecated aliases (remove in v0.1.0)
    "SampleBasedKrylovDiagonalization",
    "FlowGuidedSKQD",
]


def __getattr__(name: str):
    """Lazy re-export with deprecation warnings for old names."""
    import warnings

    if name == "FlowGuidedKrylovDiag":
        from qvartools.krylov.basis.flow_guided import FlowGuidedKrylovDiag

        return FlowGuidedKrylovDiag

    _DEPRECATED = {
        "FlowGuidedSKQD": "FlowGuidedKrylovDiag",
        "SampleBasedKrylovDiagonalization": "ClassicalKrylovDiagonalization",
    }
    if name in _DEPRECATED:
        new_name = _DEPRECATED[name]
        warnings.warn(
            f"{name} is deprecated, use {new_name} instead. "
            "The old name will be removed in v0.1.0.",
            DeprecationWarning,
            stacklevel=2,
        )
        if name == "FlowGuidedSKQD":
            from qvartools.krylov.basis.flow_guided import FlowGuidedKrylovDiag

            return FlowGuidedKrylovDiag
        return ClassicalKrylovDiagonalization

    raise AttributeError(f"module {__name__!r} has no attribute {name!r}")


logger = logging.getLogger(__name__)


# ---------------------------------------------------------------------------
# Configuration
# ---------------------------------------------------------------------------



[docs]
@dataclass(frozen=True)
class SKQDConfig:
    """Hyperparameters for Sample-Based Krylov Quantum Diagonalization.

    Parameters
    ----------
    max_krylov_dim : int
        Maximum number of Krylov vectors to construct.
    time_step : float
        Time step for real-time evolution ``e^{-iH dt}``.
    total_evolution_time : float
        Total evolution time budget (informational; the algorithm uses
        ``max_krylov_dim * time_step`` Krylov vectors).
    shots_per_krylov : int
        Number of measurement shots per Krylov state for sampling
        computational-basis configurations.
    use_cumulative_basis : bool
        If ``True``, retain samples from all previous Krylov states
        (cumulative union).  If ``False``, only keep the latest set.
    num_eigenvalues : int
        Number of lowest eigenvalues to compute from the projected problem.
    which_eigenvalues : str
        Eigenvalue selection criterion passed to the eigensolver.
        ``"SA"`` = smallest algebraic (default).
    regularization : float
        Tikhonov regularization added to the overlap matrix diagonal to
        stabilise the generalized eigenvalue problem.
    use_gpu : bool
        If ``True``, attempt to use GPU-accelerated linear algebra.

    Examples
    --------
    >>> cfg = SKQDConfig(max_krylov_dim=5, time_step=0.05)
    >>> cfg.max_krylov_dim
    5
    """

    max_krylov_dim: int = 10
    time_step: float = 0.1
    total_evolution_time: float = 1.0
    shots_per_krylov: int = 1000
    use_cumulative_basis: bool = True
    num_eigenvalues: int = 1
    which_eigenvalues: str = "SA"
    regularization: float = 1e-8
    # NOTE: use_gpu is not yet forwarded to _solve_generalised_eigenproblem
    # from all call sites. The eigensolver defaults to GPU when available.
    # TODO: wire this through in a future PR.
    use_gpu: bool = False

    def __post_init__(self) -> None:
        """Validate configuration values."""
        if self.max_krylov_dim < 1:
            raise ValueError(f"max_krylov_dim must be >= 1, got {self.max_krylov_dim}")
        if self.time_step <= 0.0:
            raise ValueError(f"time_step must be > 0, got {self.time_step}")
        if self.shots_per_krylov < 1:
            raise ValueError(
                f"shots_per_krylov must be >= 1, got {self.shots_per_krylov}"
            )
        if self.num_eigenvalues < 1:
            raise ValueError(
                f"num_eigenvalues must be >= 1, got {self.num_eigenvalues}"
            )
        if self.regularization < 0.0:
            raise ValueError(f"regularization must be >= 0, got {self.regularization}")



# ---------------------------------------------------------------------------
# Helper: build projected matrices
# ---------------------------------------------------------------------------


def _build_projected_matrices(
    hamiltonian: Hamiltonian,
    basis_configs: torch.Tensor,
    device: torch.device | None = None,
) -> tuple[np.ndarray, np.ndarray]:
    """Build projected H and S matrices in a sampled configuration basis.

    Parameters
    ----------
    hamiltonian : Hamiltonian
        The system Hamiltonian.
    basis_configs : torch.Tensor
        Basis configurations, shape ``(n_basis, num_sites)``.
    device : torch.device or None, optional
        Device to use for computation.  If ``None``, uses CUDA when available,
        otherwise CPU.

    Returns
    -------
    h_proj : np.ndarray
        Projected Hamiltonian matrix, shape ``(n_basis, n_basis)``.
    s_proj : np.ndarray
        Overlap matrix, shape ``(n_basis, n_basis)``.  For an orthonormal
        computational-basis subset this is the identity, but we keep the
        general form for consistency with weighted / non-orthogonal bases.
    """
    if device is None:
        device = torch.device("cuda" if torch.cuda.is_available() else "cpu")

    n_basis = basis_configs.shape[0]
    s_proj = np.eye(n_basis, dtype=np.float64)

    configs_on_device = basis_configs.to(device)

    # Prefer the symmetric fast path when available
    if hasattr(hamiltonian, "matrix_elements_fast"):
        h_matrix = hamiltonian.matrix_elements_fast(configs_on_device)
    else:
        h_matrix = hamiltonian.matrix_elements(configs_on_device, configs_on_device)

    h_proj = h_matrix.detach().cpu().numpy().astype(np.float64)

    return h_proj, s_proj


def _solve_generalised_eigenproblem(
    h_proj: np.ndarray,
    s_proj: np.ndarray,
    num_eigenvalues: int,
    regularization: float,
    use_gpu: bool = True,
) -> tuple[np.ndarray, np.ndarray]:
    """Solve the generalized eigenvalue problem ``H v = E S v``.

    When a CUDA device is available and ``use_gpu`` is ``True``, the problem is
    reduced to a standard eigenvalue problem via Cholesky decomposition and
    solved with :func:`torch.linalg.eigh` on the GPU.  Otherwise, falls back
    to :func:`scipy.linalg.eigh` on the CPU.

    Parameters
    ----------
    h_proj : np.ndarray
        Projected Hamiltonian, shape ``(n, n)``.
    s_proj : np.ndarray
        Overlap matrix, shape ``(n, n)``.
    num_eigenvalues : int
        Number of lowest eigenvalues to return.
    regularization : float
        Tikhonov regularization added to the overlap diagonal.
    use_gpu : bool, optional
        If ``True`` (default), use GPU-accelerated ``torch.linalg.eigh``
        when CUDA is available.  If ``False``, always use scipy on CPU.

    Returns
    -------
    eigenvalues : np.ndarray
        Lowest ``num_eigenvalues`` eigenvalues, shape ``(num_eigenvalues,)``.
    eigenvectors : np.ndarray
        Corresponding eigenvectors, shape ``(n, num_eigenvalues)``.
    """
    n = h_proj.shape[0]
    s_reg = s_proj + regularization * np.eye(n, dtype=np.float64)

    # Symmetrise to guard against floating-point asymmetry
    h_sym = 0.5 * (h_proj + h_proj.T)
    s_sym = 0.5 * (s_reg + s_reg.T)

    if use_gpu and torch.cuda.is_available():
        # GPU path: reduce generalised eigenproblem to standard form via
        # Cholesky decomposition  L L^T = S,  then solve
        # L^{-1} H L^{-T} y = E y,  with x = L^{-T} y.
        device = torch.device("cuda")
        h_t = torch.tensor(h_sym, dtype=torch.float64, device=device)
        s_t = torch.tensor(s_sym, dtype=torch.float64, device=device)

        l_chol = torch.linalg.cholesky(s_t)
        l_inv = torch.linalg.inv(l_chol)
        h_standard = l_inv @ h_t @ l_inv.T

        # Symmetrise to remove numerical noise from the transformation
        h_standard = 0.5 * (h_standard + h_standard.T)

        evals, evecs_y = torch.linalg.eigh(h_standard)

        # Transform eigenvectors back: x = L^{-T} y
        evecs_x = l_inv.T @ evecs_y

        eigenvalues = evals.cpu().numpy()
        eigenvectors = evecs_x.cpu().numpy()
    else:
        # CPU path: scipy generalised eigensolver
        eigenvalues, eigenvectors = scipy_eigh(h_sym, s_sym)

    k = min(num_eigenvalues, len(eigenvalues))
    return eigenvalues[:k], eigenvectors[:, :k]


# ---------------------------------------------------------------------------
# ClassicalKrylovDiagonalization
# ---------------------------------------------------------------------------



[docs]
class ClassicalKrylovDiagonalization:
    r"""Classical Krylov subspace diagonalization via exact time evolution.

    Constructs Krylov states
    :math:`|\psi_k\rangle = (e^{-iH\Delta t})^k |\psi_0\rangle`
    using exact matrix exponentiation (no Trotter decomposition),
    samples computational-basis configurations from each via Born-rule
    sampling, and solves a projected generalized eigenvalue problem.

    For molecular Hamiltonians the algorithm restricts to the
    particle-number-conserving subspace.  For spin Hamiltonians the full
    Hilbert space is used.

    Parameters
    ----------
    hamiltonian : Hamiltonian
        The system Hamiltonian.
    config : SKQDConfig
        Algorithm hyperparameters.
    initial_state : np.ndarray or None, optional
        Initial state vector in the full (or subspace) Hilbert space.
        If ``None``, a default Hartree--Fock-like state is constructed.

    Attributes
    ----------
    hamiltonian : Hamiltonian
        The Hamiltonian instance.
    config : SKQDConfig
        The configuration dataclass.
    h_dense : np.ndarray
        Dense Hamiltonian matrix (in the relevant subspace).
    subspace_configs : torch.Tensor or None
        Particle-conserving configurations, if applicable.

    Examples
    --------
    >>> skqd = ClassicalKrylovDiagonalization(hamiltonian, SKQDConfig())
    >>> eigenvalues, info = skqd.run()
    >>> info["krylov_dim"]
    10
    """

    def __init__(
        self,
        hamiltonian: Hamiltonian,
        config: SKQDConfig,
        initial_state: np.ndarray | None = None,
    ) -> None:
        self.hamiltonian = hamiltonian
        self.config = config

        # Detect molecular Hamiltonian
        self._is_molecular = hasattr(hamiltonian, "integrals")

        if self._is_molecular:
            self.subspace_configs = self._setup_particle_conserving_subspace()
            self.subspace_dim = self.subspace_configs.shape[0]
            logger.info(
                "Particle-conserving subspace: %d configurations", self.subspace_dim
            )
            # Build dense H in the subspace
            h_torch = hamiltonian.matrix_elements(
                self.subspace_configs, self.subspace_configs
            )
            self.h_dense = h_torch.detach().cpu().numpy().astype(np.float64)
        else:
            self.subspace_configs = None
            self.subspace_dim = hamiltonian.hilbert_dim
            h_torch = hamiltonian.to_dense()
            self.h_dense = h_torch.detach().cpu().numpy().astype(np.float64)

        # Build hash→index mapping for fast submatrix extraction
        self._subspace_hash_to_idx = self._build_subspace_index()

        # Precompute GPU matrix exponential for Krylov time evolution
        self._exp_dt_gpu: torch.Tensor | None = None
        self._initial_state_gpu: torch.Tensor | None = None

        # Initial state
        if initial_state is not None:
            if initial_state.shape[0] != self.subspace_dim:
                raise ValueError(
                    f"initial_state dimension ({initial_state.shape[0]}) does "
                    f"not match subspace dimension ({self.subspace_dim})"
                )
            self._initial_state = initial_state.astype(np.complex128)
        else:
            self._initial_state = self._default_initial_state()

    # ------------------------------------------------------------------
    # Private helpers
    # ------------------------------------------------------------------

    def _default_initial_state(self) -> np.ndarray:
        """Construct a default initial state (first basis vector).

        Returns
        -------
        np.ndarray
            State vector of shape ``(subspace_dim,)``.
        """
        state = np.zeros(self.subspace_dim, dtype=np.complex128)
        state[0] = 1.0
        return state

    def _build_subspace_index(self) -> dict[int, int]:
        """Build a hash→index mapping for the subspace configurations.

        Uses the Hamiltonian's ``_config_hash_batch`` when available for
        vectorised hashing, otherwise falls back to a powers-of-2 hash.

        Returns
        -------
        dict
            Mapping from integer config hash to subspace index.
        """
        if self.subspace_configs is None:
            return {}

        configs = self.subspace_configs
        n = configs.shape[0]
        num_sites = configs.shape[1]

        # Use Hamiltonian's batch hash if available
        if hasattr(self.hamiltonian, "_config_hash_batch"):
            hashes = self.hamiltonian._config_hash_batch(configs)
        else:
            powers = torch.tensor(
                [1 << k for k in range(num_sites - 1, -1, -1)],
                dtype=torch.int64,
                device=configs.device,
            )
            hashes = (configs.to(torch.int64) * powers.unsqueeze(0)).sum(dim=-1)

        return {int(hashes[i].item()): i for i in range(n)}

    def _precompute_gpu_time_evolution(self) -> None:
        """Precompute exp(-iH*dt) on GPU for fast Krylov state generation.

        Called lazily on the first ``_compute_krylov_state`` call when
        CUDA is available.  Stores the precomputed matrix exponential
        and the initial state on GPU.
        """
        if not torch.cuda.is_available():
            return

        device = torch.device("cuda")
        h_gpu = torch.tensor(
            -1j * self.h_dense * self.config.time_step,
            dtype=torch.complex128,
            device=device,
        )
        self._exp_dt_gpu = torch.matrix_exp(h_gpu)
        self._initial_state_gpu = torch.tensor(
            self._initial_state, dtype=torch.complex128, device=device
        )
        logger.info("Precomputed GPU matrix exponential: dim=%d", self.subspace_dim)


[docs]
    def extract_projected_submatrix(
        self, configs: torch.Tensor
    ) -> tuple[np.ndarray, np.ndarray]:
        """Extract projected H and S from the precomputed dense Hamiltonian.

        Maps each configuration in *configs* to its index in the full
        particle-conserving subspace and extracts the corresponding
        submatrix of ``self.h_dense``.  Falls back to
        :func:`_build_projected_matrices` if any configuration is not
        found in the subspace.

        Parameters
        ----------
        configs : torch.Tensor
            Basis configurations, shape ``(n_basis, num_sites)``.

        Returns
        -------
        h_proj : np.ndarray
            Projected Hamiltonian, shape ``(n_basis, n_basis)``.
        s_proj : np.ndarray
            Overlap matrix (identity), shape ``(n_basis, n_basis)``.
        """
        if not self._subspace_hash_to_idx:
            return _build_projected_matrices(self.hamiltonian, configs)

        n = configs.shape[0]

        # Compute hashes for the requested configs
        if hasattr(self.hamiltonian, "_config_hash_batch"):
            hashes = self.hamiltonian._config_hash_batch(configs.cpu())
        else:
            num_sites = configs.shape[1]
            powers = torch.tensor(
                [1 << k for k in range(num_sites - 1, -1, -1)],
                dtype=torch.int64,
            )
            hashes = (configs.cpu().to(torch.int64) * powers.unsqueeze(0)).sum(dim=-1)

        # Map each config to its subspace index
        indices = np.empty(n, dtype=np.intp)
        for i in range(n):
            h = int(hashes[i].item())
            idx = self._subspace_hash_to_idx.get(h)
            if idx is None:
                # Config not in precomputed subspace — fall back
                logger.debug(
                    "Config %d not in subspace index, falling back to full build", i
                )
                return _build_projected_matrices(self.hamiltonian, configs)
            indices[i] = idx

        h_proj = self.h_dense[np.ix_(indices, indices)].copy()
        s_proj = np.eye(n, dtype=np.float64)
        return h_proj, s_proj


    def _setup_particle_conserving_subspace(self) -> torch.Tensor:
        """Generate all valid particle-conserving configurations.

        For a molecular Hamiltonian with ``n_alpha`` spin-up and ``n_beta``
        spin-down electrons distributed across ``n_orb`` spatial orbitals
        (mapped to ``2 * n_orb`` qubits via Jordan--Wigner), enumerate all
        configurations that satisfy the particle-number constraints.

        Returns
        -------
        torch.Tensor
            All valid configurations, shape ``(n_configs, num_sites)``.
        """
        integrals = self.hamiltonian.integrals  # type: ignore[attr-defined]
        n_orb = integrals.n_orbitals
        n_alpha = integrals.n_alpha
        n_beta = integrals.n_beta
        num_qubits = 2 * n_orb

        configs: list[list[int]] = []

        # Alpha orbitals: qubits [0, n_orb)
        # Beta orbitals: qubits [n_orb, 2*n_orb)
        for alpha_occ in combinations(range(n_orb), n_alpha):
            for beta_occ in combinations(range(n_orb), n_beta):
                config = [0] * num_qubits
                for a in alpha_occ:
                    config[a] = 1
                for b in beta_occ:
                    config[n_orb + b] = 1
                configs.append(config)

        return torch.tensor(configs, dtype=torch.int64)

    def _compute_krylov_state(self, k: int) -> np.ndarray:
        r"""Compute the *k*-th Krylov state via matrix exponentiation.

        Evaluates :math:`|\psi_k\rangle = (e^{-iH\Delta t})^k |\psi_0\rangle`.

        When CUDA is available, uses a precomputed GPU matrix exponential
        ``U = e^{-iH\Delta t}`` and applies *k* matrix-vector products on
        the GPU.  Otherwise falls back to
        :func:`scipy.sparse.linalg.expm_multiply` on the CPU.

        Parameters
        ----------
        k : int
            Krylov power index (``k = 0`` returns the initial state).

        Returns
        -------
        np.ndarray
            State vector of shape ``(subspace_dim,)`` with dtype
            ``complex128``.
        """
        if k == 0:
            return self._initial_state.copy()

        # Lazy GPU precomputation
        if self._exp_dt_gpu is None and torch.cuda.is_available():
            self._precompute_gpu_time_evolution()

        # GPU path: repeated matrix-vector products
        if self._exp_dt_gpu is not None:
            state = self._initial_state_gpu.clone()
            for _ in range(k):
                state = self._exp_dt_gpu @ state
            return state.cpu().numpy()

        # CPU fallback: scipy expm_multiply
        total_time = k * self.config.time_step
        state = expm_multiply(
            -1j * self.h_dense,
            self._initial_state,
            start=0.0,
            stop=total_time,
            num=2,
            endpoint=True,
        )
        # expm_multiply returns shape (num, dim); take the last row
        return state[-1]

    def _sample_from_state(
        self, state_vector: np.ndarray, n_samples: int
    ) -> torch.Tensor:
        """Sample computational-basis configurations from a state vector.

        Parameters
        ----------
        state_vector : np.ndarray
            State vector of shape ``(subspace_dim,)`` with complex amplitudes.
        n_samples : int
            Number of configurations to sample.

        Returns
        -------
        torch.Tensor
            Unique sampled configurations, shape ``(n_unique, num_sites)``.
        """
        probabilities = np.abs(state_vector) ** 2
        prob_sum = probabilities.sum()
        if prob_sum < 1e-15:
            raise RuntimeError(
                "State vector has near-zero norm; cannot sample configurations."
            )
        probabilities = probabilities / prob_sum

        rng = np.random.default_rng()
        indices = rng.choice(len(probabilities), size=n_samples, p=probabilities)
        unique_indices = np.unique(indices)

        if self.subspace_configs is not None:
            sampled = self.subspace_configs[unique_indices]
        else:
            # Full Hilbert space: convert indices to binary configs
            num_sites = self.hamiltonian.num_sites
            configs_list = []
            for idx in unique_indices:
                config = self.hamiltonian._index_to_config(int(idx))
                configs_list.append(config)
            sampled = torch.stack(configs_list)

        return sampled

    # ------------------------------------------------------------------
    # Public API
    # ------------------------------------------------------------------


[docs]
    def run(self) -> tuple[np.ndarray, dict[str, Any]]:
        """Execute the full SKQD algorithm.

        Constructs Krylov states iteratively, samples configurations from
        each, builds projected Hamiltonian and overlap matrices in the
        sampled basis, and solves the generalized eigenvalue problem.

        Returns
        -------
        eigenvalues : np.ndarray
            Lowest eigenvalues from the projected problem,
            shape ``(num_eigenvalues,)``.
        info : dict
            Diagnostic information with keys:

            - ``"basis_size"`` : int — final number of basis configurations.
            - ``"krylov_dim"`` : int — number of Krylov vectors constructed.
            - ``"energies_per_step"`` : list of float — ground-state energy
              estimate after each Krylov expansion step.
            - ``"basis_configs"`` : torch.Tensor — final basis configurations.
        """
        all_configs: torch.Tensor | None = None
        energies_per_step: list[float] = []

        for k in range(self.config.max_krylov_dim):
            logger.info("Computing Krylov state k=%d", k)

            krylov_state = self._compute_krylov_state(k)
            sampled = self._sample_from_state(
                krylov_state, self.config.shots_per_krylov
            )

            if self.config.use_cumulative_basis and all_configs is not None:
                # Union of existing and new configs (deduplicated)
                combined = torch.cat([all_configs, sampled], dim=0)
                all_configs = torch.unique(combined, dim=0)
            else:
                all_configs = sampled

            # Build and solve projected problem (use submatrix extraction)
            h_proj, s_proj = self.extract_projected_submatrix(all_configs)
            eigenvalues, _ = _solve_generalised_eigenproblem(
                h_proj,
                s_proj,
                self.config.num_eigenvalues,
                self.config.regularization,
            )
            energies_per_step.append(float(eigenvalues[0]))
            logger.info(
                "Step k=%d: basis_size=%d, E0=%.10f",
                k,
                all_configs.shape[0],
                eigenvalues[0],
            )

        # Final solve
        assert all_configs is not None
        h_proj, s_proj = self.extract_projected_submatrix(all_configs)
        eigenvalues, eigenvectors = _solve_generalised_eigenproblem(
            h_proj,
            s_proj,
            self.config.num_eigenvalues,
            self.config.regularization,
        )

        info: dict[str, Any] = {
            "basis_size": all_configs.shape[0],
            "krylov_dim": self.config.max_krylov_dim,
            "energies_per_step": energies_per_step,
            "basis_configs": all_configs,
        }

        return eigenvalues, info




# Deprecated alias: handled by module-level __getattr__ with DeprecationWarning