Source code for pythtb.tbmodel

from collections.abc import Mapping
import copy
import logging
import warnings
import numpy as np
import inspect
from itertools import product
from typing import Callable
from .visualization import plot_bands, plot_tbmodel, plot_tbmodel_3d
from .utils import (
    _offdiag_approximation_warning_and_stop,
    is_Hermitian,
    deprecated,
    copydoc,
    finite_difference,
    levi_civita,
)
from .lattice import Lattice
from .hoptable import HoppingTable

# set up logging
logger = logging.getLogger(__name__)

# what is exported when "from pythtb import *" is used
__all__ = ["TBModel", "tb_model"]

# Pauli matrices
SIGMA0 = np.array([[1, 0], [0, 1]], dtype=complex)
SIGMAX = np.array([[0, 1], [1, 0]], dtype=complex)
SIGMAY = np.array([[0, -1j], [1j, 0]], dtype=complex)
SIGMAZ = np.array([[1, 0], [0, -1]], dtype=complex)


def _iter_params_of_callable(f):
    """Yield explicit parameter names (ignore *args/**kwargs)."""
    sig = inspect.signature(f)
    for name, param in sig.parameters.items():
        if param.kind in (param.POSITIONAL_OR_KEYWORD, param.KEYWORD_ONLY):
            if param.default is inspect._empty:  # user must supply
                yield name


def _call_provider(prov, params):
    """Call a provider with only the kwargs it actually declares (unless it has **kwargs)."""
    if not callable(prov):
        raise TypeError("Provider is not callable.")
    sig = inspect.signature(prov)
    if any(p.kind == p.VAR_KEYWORD for p in sig.parameters.values()):
        return prov(**params)  # accepts anything
    kwargs = {k: params[k] for k in _iter_params_of_callable(prov) if k in params}
    return prov(**kwargs)


def _describe_provider(provider):
    if isinstance(provider, str):
        return f"'{provider}'"
    if callable(provider):
        try:
            src = inspect.getsource(provider).strip()
            return src
        except (OSError, TypeError, AttributeError):
            name = getattr(
                provider, "__qualname__", getattr(provider, "__name__", repr(provider))
            )
            return f"callable {name} (source unavailable)"
    return repr(provider)



[docs]
class TBModel:
    r"""Build, parametrize, and solve tight-binding Hamiltonians.

    A tight-binding (TB) model describes single-particle dynamics in a discrete
    orbital basis (e.g., Wannier functions, atomic-like orbitals) placed on sites
    of a lattice. The Hamiltonian is specified by on-site and hopping terms between
    orbitals.

    This class supports

    - **Periodic systems** (one or more reciprocal-space dimensions),
    - **Finite real-space systems** (open boundaries), or
    - **Mixed geometries** (some periodic, some open; e.g. ribbons or slabs).

    .. versionremoved:: 2.0.0
        Parameters ``dim_r`` and ``dim_k`` were removed. Real- and reciprocal-space
        dimensions are inferred from :class:`Lattice`.

    Parameters
    ----------
    lattice : :class:`Lattice`
        Lattice and basis specification. This object defines the lattice vectors,
        the positions of the localized orbitals (basis functions) within the unit
        cell, and which lattice directions are treated as periodic. The orbital
        positions are given in reduced (fractional) coordinates relative to the
        lattice vectors. The periodic directions are a list of indices into the
        lattice vectors.

        .. versionchanged:: 2.0.0
            Replaced constructor arguments ``dim_k``, ``dim_r``, ``lat``, ``orb``,
            and ``per`` with a single :class:`~pythtb.Lattice` argument.
            Real- and reciprocal-space dimensionalities
            are inferred from the lattice definition. For example, code that previously used
            ``TBModel(dim_r=2, dim_k=1, lat=..., orb=..., per=[1])`` should now use
            ``TBModel(lattice=Lattice(lat_vecs=..., orb_vecs=..., periodic_dirs=[1]))``.

    spinful : bool, optional
        If True, each orbital carries two spin components (spin-1/2), and the
        Hamiltonian includes a 2x2 matrix structure for each orbital pair. If
        False, the model is spinless. Default is False.

        .. versionchanged:: 2.0.0
            Renamed from ``nspin`` to ``spinful`` and changed type to ``bool``.
            Instead of specifying the number of spin components (1 or 2), now
            specify whether the model is spinful (True) or spinless (False).

    Notes
    -----
    - The lattice geometry (primitive vectors, orbital positions, and periodic
      directions) is specified through a :class:`Lattice` object. Periodic
      directions are treated in reciprocal space. :class:`Lattice` also provides
      methods for constructing a finite model from a periodic one
      (e.g. ribbons, slabs, etc.).

    - Both spinless and spinful models are supported; spin-orbit effects may be encoded
      directly in the hopping matrices.

    - Beyond constructing and diagonalizing the Hamiltonian, this class provides
      methods for computing topological and quantum-geometric observables, including:

      - Quantum geometric tensor (QGT) (in ≥ 2D periodic systems)
      - Berry curvature and quantum metric (in ≥ 2D periodic systems)
      - Chern number (in ≥ 2D periodic systems)
      - Axion angle (in 3D periodic models + 1 varying parameter)
      - Bianco-Resta local Chern marker (in 2D finite systems)

    - Hamiltonians may depend on external parameters (e.g. strain, adiabatic
      parameters), and can be registered by setting onsite or hopping terms
      with strings or callable functions that take parameter names as keyword
      arguments. Supply these values as keyword arguments when calling downstream
      methods and the class will automatically evaluate the Hamiltonian with the
      specified parameters.

    Examples
    --------
    Create a ribbon-like model: two real-space directions but only one periodic axis.
    The first lattice vector is ``[1, 1/2]`` and the second is ``[0, 2]``; only the
    second direction is periodic, so we model a strip that repeats along
    :math:`\mathbf{a}_2`. Three orbitals sit at fractional coordinates inside
    the unit cell.

    >>> from pythtb import TBModel, Lattice
    >>> lat = Lattice(
    ...    lat_vecs=[[1, 1/2], [0, 2]],
    ...    orb_vecs=[[0.2, 0.3], [0.1, 0.1], [0.2, 0.2]],
    ...    periodic_dirs=[1],
    ... )
    >>> tb = TBModel(lattice=lat, spinful=False)

    Define on-site terms and a few hoppings (home cell hop plus one along the
    periodic direction):

    >>> tb.set_onsite([0.0, 1.0, 0.5])  # onsite energies for all three orbitals
    >>> tb.set_hop(1.0, 0, 1, [0, 0])   # 0 <-> 1 within home unit cell
    >>> tb.set_hop(-0.8, 1, 2, [0, 0])  # 1 <-> 2 within home unit cell
    >>> tb.set_hop(0.3, 2, 0, [0, 1])   # 2 <-> 0 shifted by one cell along periodic axis

    Introduce parameters with strings or callables; the parameter names are
    remembered and must be supplied later:

    >>> tb.set_onsite("U", ind_i=0)  # onsite energy for orbital 0 is parameter 'U'
    >>> tb.set_onsite(lambda U: np.cos(U), ind_i=2)  # onsite energy for orbital 2 is parameter 'U'
    >>> tb.set_hop(lambda t: t**2, 1, 2, [0, 0])  # hopping from orbital 1 to 2 is parameter 't'

    Evaluate the Bloch Hamiltonian at a range of reduced momenta for specific
    parameter values:

    >>> H = tb.hamiltonian(k_pts=np.linspace(0,1,10), return_eigvecs=True, U=0.4, t=0.7)
    >>> H.shape
    (10, 3, 3)

    Diagonalize the Bloch Hamiltonian for a range of momenta and parameter values,

    >>> U_vals = np.linspace(0, 2*np.pi, 11)
    >>> t_vals = np.linspace(0, 1, 12)
    >>> evals, evecs = tb.solve_ham(k_pts=np.linspace(0,1,10), return_eigvecs=True, U=U_vals, t=t_vals)
    >>> evals.shape
    (10, 11, 12, 3)
    >>> evecs.shape
    (10, 11, 12, 3, 3)

    This pattern of setting parameters by name and supplying their values extends to all other
    methods that depend on the Hamiltonian, such as Berry curvature, quantum metric, etc.
    """

    def __init__(self, lattice: Lattice, spinful: bool = False):
        self._lattice = lattice
        self._spinful = spinful
        self._nspin = 2 if spinful else 1

        # By default, assume model did not come from w90 object and that
        # position operator is diagonal
        self.assume_position_operator_diagonal = True
        self._from_w90 = False

        # Initialize onsite energies to zero
        if not spinful:
            self._site_energies = np.zeros((self.norb), dtype=float)
        else:
            self._site_energies = np.zeros((self.norb, 2, 2), dtype=complex)

        # The onsite energies and hoppings are not specified
        # when creating a 'TBModel' object.  They are speficied
        # subsequently by separate function calls defined below.

        # remember which onsite energies user has specified
        self._site_energies_specified = np.zeros(self.norb, dtype=bool)
        self._site_energies_specified[:] = False

        # Initialize hoppings container
        self._hoptable = HoppingTable(self.dim_r, spinful=spinful)

        self._onsite_param_terms = {}
        self._hopping_param_terms = {}

    def __repr__(self):
        r"""Return a concise representation of the model.

        Returns
        -------
        str
            A string like ``"pythtb.TBModel(dim_r=..., dim_k=..., norb=..., spinful=...)"``.
        """
        return (
            f"pythtb.TBModel(dim_r={self.dim_r}, dim_k={self.dim_k}, "
            f"norb={self.norb}, spinful={self.spinful})"
        )

    def __str__(self):
        r"""Return a human‑readable summary string.

        Returns
        -------
        str
            Same text as :meth:`info` with ``show=False``.
        """
        return self.info(show=False)

    # Property decorators for read-only access to model attributes

    @property
    def lattice(self) -> Lattice:
        """The :class:`Lattice` object associated with the model.

        .. versionadded:: 2.0.0

        Returns
        -------
        Lattice
            A copy of the :class:`Lattice` object associated with the model.
        """
        return copy.copy(self._lattice)

    @property
    def dim_r(self) -> int:
        """Dimensionality of real space.

        .. versionadded:: 2.0.0

        Returns
        -------
        int
            Number of Cartesian real-space directions.
        """
        return self.lattice.dim_r

    @property
    def dim_k(self) -> int:
        """Dimensionality of reciprocal space (number of periodic directions).

        .. versionadded:: 2.0.0

        Returns
        -------
        int
            Number of periodic directions.
        """
        return self.lattice.dim_k

    @property
    def nspin(self) -> int:
        """Number of spin components (1 for spinless, 2 for spinful).

        .. versionadded:: 2.0.0

        Returns
        -------
        int
            Number of spin components (1 for spinless, 2 for spinful).
        """
        return self._nspin

    @property
    def spinful(self) -> bool:
        """Whether the model includes spin degrees of freedom.

        .. versionadded:: 2.0.0

        Returns
        -------
        bool
            Whether the model includes spin degrees of freedom.
        """
        return self._spinful

    @property
    def periodic_dirs(self) -> list[int]:
        """Periodic directions as indices into the lattice vectors.

        .. versionadded:: 2.0.0

        Returns
        -------
        list[int]
            Indices of periodic directions (length equals :attr:`dim_k`).
        """
        return self.lattice.periodic_dirs

    @property
    def norb(self) -> int:
        """Number of tight-binding orbitals per unit cell.

        .. versionadded:: 2.0.0

        Returns
        -------
        int
            Number of tight-binding orbitals per unit cell.
        """
        return self.lattice.norb

    @property
    def nstate(self) -> int:
        """Total number of electronic states (``norb * nspin``).

        .. versionadded:: 2.0.0

        Returns
        -------
        int
            Total number of electronic states (``norb * nspin``).
        """
        return self.norb * self.nspin

    @property
    def orb_vecs(self) -> np.ndarray:
        """Orbital positions in reduced coordinates.

        .. versionadded:: 2.0.0

        Returns
        -------
        np.ndarray
            A copy of the orbital positions in reduced coordinates.
            Shape is ``(norb, dim_r)``.
        """
        return self.lattice.orb_vecs.copy()

    @property
    def lat_vecs(self) -> np.ndarray:
        """Lattice vectors in Cartesian coordinates.

        .. versionadded:: 2.0.0

        Returns
        -------
        np.ndarray
            A copy of the lattice vectors in Cartesian coordinates.
            Shape is ``(dim_r, dim_r)``.
        """
        return self.lattice.lat_vecs.copy()

    @property
    def recip_lat_vecs(self) -> np.ndarray:
        """Reciprocal lattice vectors in inverse Cartesian units.

        .. versionadded:: 2.0.0

        Returns
        -------
        np.ndarray
            A copy of the reciprocal lattice vectors in inverse Cartesian units.
            Shape is ``(dim_k, dim_r)``.
        """
        return self.lattice.recip_lat_vecs.copy()

    @property
    def recip_volume(self) -> float:
        """Volume of the reciprocal unit cell in inverse Cartesian units.

        .. versionadded:: 2.0.0

        Returns
        -------
        float
            Volume of the reciprocal unit cell in inverse Cartesian units.
        """
        return copy.copy(self.lattice.recip_volume)

    @property
    def cell_volume(self) -> float:
        """Volume of the real-space unit cell in Cartesian units.

        .. versionadded:: 2.0.0

        Returns
        -------
        float
            Volume of the real-space unit cell in Cartesian units.
        """
        return copy.copy(self.lattice.cell_volume)

    @property
    def onsite(self) -> np.ndarray:
        """On-site energies for each orbital.

        .. versionadded:: 2.0.0

        Returns
        -------
        np.ndarray
            A copy of the on-site energies for each orbital.
            Shape is ``(norb,)`` for spinless models,
            ``(norb, 2, 2)`` for spinful models.
        """
        return self._site_energies.copy()

    @property
    def hoppings(self) -> list[dict]:
        """Hopping terms defined in the model.

        .. versionadded:: 2.0.0

        Returns
        -------
        list[dict]
            One dictionary per hopping with keys:

            - ``"amplitude"`` : hopping amplitude (complex or 2x2 numpy.ndarray for spinful)
            - ``"from_orbital"``: index of starting orbital (int)
            - ``"to_orbital"``: index of ending orbital (int)
            - ``"lattice_vector"``: lattice vector displacement for ``"to_orbital"`` (list of int)
        """
        amps, i_idx, j_idx, R_vecs = self._hoptable.components()
        formatted: list[dict] = []
        for hop_idx in range(self.nhops):
            amp = amps[hop_idx]
            if self.spinful:
                amplitude = np.asarray(amp).copy()
            else:
                amplitude = complex(amp)
            entry = {
                "amplitude": amplitude,
                "from_orbital": int(i_idx[hop_idx]),
                "to_orbital": int(j_idx[hop_idx]),
            }
            R_vec = R_vecs[hop_idx]
            if np.any(R_vec):
                entry["lattice_vector"] = R_vec.tolist()
            formatted.append(entry)
        return formatted

    @property
    def nhops(self) -> int:
        """Number of hoppings defined in the model.

        .. versionadded:: 2.0.0

        Returns
        -------
        int
            Number of hoppings defined in the model.
        """
        return len(self._hoptable)

    @property
    def parameters(self):
        """Parameter providers registered on on‑site and hopping terms.

        Returns
        -------
        list[dict]
            Each entry describes a provider with the following fields:

            - ``kind``: ``"onsite"`` or ``"hopping"``
            - ``orbitals``: index (onsite) or ``(i, j)`` tuple (hopping)
            - ``R``: lattice-vector tuple for hoppings
            - ``names``: list[str] of parameter names required by the provider
            - ``source`` (optional): best-effort textual description of the callable
            - ``function`` (optional): the callable itself
        """
        out = []
        for idx, provider in getattr(self, "_onsite_param_terms", {}).items():
            if provider is None:
                continue
            names = self._provider_names(provider, ctx=f"onsite[{idx}]")
            desc = {"kind": "onsite", "orbitals": int(idx), "names": names}
            if callable(provider):
                desc["source"] = _describe_provider(provider)
                desc["function"] = provider
            out.append(desc)

        for (i, j, R), provider in getattr(self, "_hopping_param_terms", {}).items():
            if provider is None:
                continue
            names = self._provider_names(provider, ctx=f"hopping[{i},{j},{tuple(R)}]")
            desc = {
                "kind": "hopping",
                "orbitals": (i, j),
                "R": tuple(R),
                "names": names,
            }
            if callable(provider):
                desc["source"] = _describe_provider(provider)
                desc["function"] = provider
            out.append(desc)

        return out

    @property
    def from_w90(self) -> bool:
        """Whether the model was constructed from :class:`W90`.

        .. versionadded:: 2.0.0

        Returns
        -------
        bool
            Whether the model was constructed from :class:`W90` and
            comes from a Wannier90 calculation.
        """
        return self._from_w90

    @property
    def assume_position_operator_diagonal(self) -> bool:
        """Whether the position operator is assumed to be diagonal in the orbital basis.

        Returns
        -------
        bool
            Whether the position operator is assumed to be diagonal in the orbital basis.
        """
        return self._assume_position_operator_diagonal

    @assume_position_operator_diagonal.setter
    def assume_position_operator_diagonal(self, value: bool):
        if not isinstance(value, bool):
            raise ValueError("assume_position_operator_diagonal must be a boolean.")
        self._assume_position_operator_diagonal = value


[docs]
    @deprecated(
        "The 'display()' method is deprecated and will be removed in a future release. "
        "Use 'print(model)' or 'model.info(show=True)' instead."
    )
    def display(self):
        r"""
        .. deprecated:: 2.0.0
            Use ``print(model)`` or :meth:`info` instead.
        """
        return self.info(show=True)



[docs]
    def info(self, show: bool = True, short: bool = False):
        r"""Print or return a textual report describing the model.

        Parameters
        ----------
        show : bool, optional
            If True, print to stdout and return ``None``.
            If False, return the string without printing.
            Default is True.

            .. versionadded:: 2.0.0

        short : bool, optional
            If True, include only a lattice summary.
            If False, also include site-energies and hopping information.
            Default is False.

            .. versionadded:: 2.0.0

        Returns
        -------
        str or None
            The report string if ``show`` is False; otherwise ``None``.

        Notes
        -----
        The report includes lattice vectors, orbital positions, spin information,
        site energies, hopping terms, and hopping distances (when available).

        Examples
        --------
        >>> text = tb.info(show=False, short=True)
        >>> isinstance(text, str)
        True
        """
        output = []
        header = (
            "----------------------------------------\n"
            "       Tight-binding model report       \n"
            "----------------------------------------"
        )
        output.append(header)
        lat_report = self.lattice._report_list()
        lat_report.pop(0)  # remove header
        lat_report.insert(3, f"spinful                     = {self.spinful}")
        lat_report.insert(4, f"number of spin components   = {self.nspin}")
        lat_report.insert(5, f"number of electronic states = {self.nstate}")
        output.extend(lat_report)

        if not short:
            # Print Site Energies
            output.append("Site energies:")
            onsite_params = getattr(self, "_onsite_param_terms", {})

            for i, site in enumerate(self._site_energies):
                onsite_param_term = onsite_params.get(i)
                if onsite_param_term:
                    output.append(
                        f"  <{i:^3}| H |{i:^3}> = {_describe_provider(onsite_param_term)}"
                    )
                    continue

                if not self.spinful:
                    energy_str = f"{site:^7.3f}"
                else:
                    energy_str = str(site).replace("\n", " ")

                output.append(f"  <{i:^3}| H |{i:^3}> = {energy_str}")

            amps, i_idx, j_idx, R_vecs = self._hoptable.components()

            output.append("Hoppings:")
            for hop_idx in range(self.nhops):
                hop_from = int(i_idx[hop_idx])
                hop_to = int(j_idx[hop_idx])
                R_vec = R_vecs[hop_idx]

                coords = ", ".join(f"{value:^5.1f}" for value in R_vec)
                disp = f" + [{coords}] " if self.dim_k else ""
                out_str = f"  <{hop_from:^3}| H |{hop_to:^3}{disp}> = "

                amp = amps[hop_idx]
                if self.spinful:
                    amp_str = str(np.asarray(amp).round(4)).replace("\n", " ")
                else:
                    amp_str = f"{complex(amp):^7.4f}"

                out_str += amp_str
                output.append(out_str)

            param_hops = getattr(self, "_hopping_param_terms", {})
            if param_hops:
                for (hop_from, hop_to, R_tup), provider in param_hops.items():
                    coords = (
                        ", ".join(f"{value:^5.1f}" for value in R_tup)
                        if len(R_tup)
                        else ""
                    )
                    disp = f" + [{coords}] " if (coords and self.dim_k) else ""
                    output.append(
                        f"  <{hop_from:^3}| H |{hop_to:^3}{disp}> = {_describe_provider(provider)}"
                    )

            output.append("Hopping distances:")
            orb_cart = self.get_orb_vecs(cartesian=True)
            lat_vecs = np.asarray(self.lat_vecs, dtype=float)

            if self.nhops:
                for hop_idx in range(self.nhops):
                    hop_from = int(i_idx[hop_idx])
                    hop_to = int(j_idx[hop_idx])
                    R_vec = R_vecs[hop_idx]

                    pos_i = orb_cart[hop_from]
                    pos_j = orb_cart[hop_to] + R_vec @ lat_vecs

                    coords = ", ".join(f"{value:^5.1f}" for value in R_vec)
                    disp = f" + [{coords}]" if self.dim_k else ""
                    distance = np.linalg.norm(pos_j - pos_i)

                    output.append(
                        f"  | pos({hop_from:^3}) - pos({hop_to:^3}){disp} | = {distance:7.3f}"
                    )

            for (hop_from, hop_to, R_tup), _ in param_hops.items():
                R_vec = np.asarray(R_tup, dtype=float)

                pos_i = orb_cart[hop_from]
                pos_j = orb_cart[hop_to] + R_vec @ lat_vecs

                coords = ", ".join(f"{value:^5.1f}" for value in R_vec)
                disp = f" + [{coords}]" if self.dim_k else ""
                distance = np.linalg.norm(pos_j - pos_i)

                output.append(
                    f"  | pos({hop_from:^3}) - pos({hop_to:^3}){disp} | = {distance:7.3f} (param)"
                )

        if show:
            print("\n".join(output))
        else:
            return "\n".join(output)



[docs]
    def copy(self) -> "TBModel":
        """Return a deep copy of the model.

        .. versionadded:: 2.0.0

        Returns
        -------
        TBModel
            Independent copy of ``self``.

        Examples
        --------
        >>> tb2 = tb.copy()
        >>> tb2 is tb
        False
        """
        return copy.deepcopy(self)



[docs]
    def clear_hoppings(self):
        """Remove all hopping terms from the model.

        .. versionadded:: 2.0.0

        Notes
        -----
        Useful for resetting the model to a state without any hoppings.
        """
        self._hoptable.clear()
        logger.info("Cleared all hoppings.")



[docs]
    def clear_onsite(self):
        """Reset all on-site energies to zero.

        .. versionadded:: 2.0.0

        Notes
        -----
        Also clears the internal flags that track which sites were explicitly set.
        """
        self._site_energies.fill(0)
        self._site_energies_specified.fill(False)
        logger.info("Cleared all on-site energies.")



[docs]
    @deprecated("Use 'norb' property instead.")
    def get_num_orbitals(self):
        """
        .. deprecated:: 2.0.0
           Use :attr:`norb` instead.
        """
        return self.norb



[docs]
    @deprecated("Use 'get_orb_vecs' instead.")
    def get_orb(self):
        """
        .. deprecated:: 2.0.0
           Use :meth:`get_orb_vecs` instead.
        """
        return self.get_orb_vecs(cartesian=False)



[docs]
    def get_orb_vecs(self, cartesian=False):
        """Return orbital positions.

        .. versionchanged:: 2.0.0
            The name was changed from `get_orb` to `get_orb_vecs`.

        Parameters
        ----------
        cartesian : bool, optional
            If True, returns orbital positions in Cartesian coordinates.
            If False, returns reduced coordinates (default).

            .. versionadded:: 2.0.0

        Returns
        -------
        np.ndarray
            Array of orbital positions, shape (norb, dim_r).
        """
        return self.lattice.get_orb_vecs(cartesian=cartesian)



[docs]
    @copydoc(Lattice.nn_bonds)
    def nn_bonds(self, n_shells: int, report: bool = False):
        return self.lattice.nn_bonds(n_shells, report=report)



[docs]
    @deprecated("Use 'get_lat_vecs' instead.")
    def get_lat(self):
        """
        .. deprecated:: 2.0.0
           Use :meth:`get_lat_vecs` instead.
        """
        return self.get_lat_vecs()



[docs]
    def get_lat_vecs(self):
        """Return lattice vectors in Cartesian coordinates.

        .. versionchanged:: 2.0.0
            The name was changed from `get_lat` to `get_lat_vecs`.

        Returns
        -------
        np.ndarray
            Lattice vectors, shape ``(dim_r, dim_r)``.
        """
        return self.lattice.get_lat_vecs()



[docs]
    def set_onsite(
        self,
        onsite_en: float | list | np.ndarray | str | Callable,
        ind_i: int = None,
        mode: str = "set",
    ):
        r"""Define on-site energies for tight-binding orbitals.

        This assigns on-site matrix elements

        .. math::
            H_{ii}(\mathbf{0}) = \langle \phi_{\mathbf{0}i} | H | \phi_{\mathbf{0}i} \rangle 
            
        for orbital :math:`i` in the home unit cell. 

        Parameters
        ----------
        onsite_en : float, array_like, (2, 2) numpy.ndarray, str, callable
            The on-site energy or parameter provider to set.

            .. versionadded:: 2.0.0
                Symbolic expressions and callables for onsite energies.

            Valid formats depend on whether ``spinful`` is True or False, and
            whether a single orbital index ``ind_i`` is specified or all orbitals
            are being set at once.

            - **Spinless models**  (``spinful=False``)

              - Real scalar.

            - **Spinful models**  (``spinful=True``)

              - **Scalar** ``a`` -> :math:`a I_2` (same value for both spins).
              - **4-vector** ``[a, b, c, d]`` -> :math:`a I_2 + b \sigma_x + c \sigma_y + d \sigma_z`
              
                Explicitly, a 4-vector produces

                .. math::
                  \begin{pmatrix}
                  a+d & b - i c \\
                  b + i c & a-d
                  \end{pmatrix}.

              - **2x2 matrix** (Hermitian ndarray).
            
            - **Symbolic definitions**

              - String: symbolic expression in user-defined parameters.
              - Callable: ``f(param)`` returning any of the above forms.

            If ``ind_i is None``, this must be a length-:attr:`norb` sequence of
            values, one per orbital.

        ind_i : int, optional
            Orbital index to update. 
            If omitted, update *all* orbitals; in that case ``onsite_en`` must be
            a sequence of length :attr:`norb`.

        mode : {'set', 'add'}, optional
            Operation mode.

            - ``'set'``: replace existing on-site value(s). (Default)
            - ``'add'``: add to existing value(s).

            .. deprecated:: 2.0.0
                ``mode="reset"`` is deprecated. Use ``mode="set"`` instead.

        See Also
        --------
        set_hop : Define hopping amplitudes between orbitals.
        set_parameters : Register parameter values 
        with_parameters : Return a new :class:`TBModel` with specified parameters.

        Notes
        -----
        - When ``mode='add'`` the new value is added to the existing entry.
        - Symbolic and callable inputs automatically register their parameter names. 
          For callables with multiple parameters, each parameter is registered.
        - Parameter evaluation is **scalar only**. Spinful on-site blocks
          must then be set with callables so that the returned values match 
          the expected spinful structure. 
        
          Example:

          .. code-block:: python

              # Spinful on-site via 4-vector with one parameter 'mA'
              tb.set_onsite(lambda mA: [mA, 0.2, 0.0, -0.1], ind_i=0) 

              # Spinful on-site via full 2x2 matrix with two parameters 'mA' and 'mB'
              tb.set_onsite(
                  lambda mA, mB: np.array([[mA + mB, 0.1 - 0.2j],
                                           [0.1 + 0.2j, mA - mB]]),
                  ind_i=1
              )
        
          Parameters values must later be supplied as scalars or 1D arrays to methods 
          such as :meth:`set_parameters`, :meth:`hamiltonian`, :meth:`velocity`, 
          :meth:`solve_ham`, etc., via keyword arguments. 
        - Providing parameter values to downstream observables such as :meth:`hamiltonian`,
          :meth:`velocity`, :meth:`solve_ham`, etc., does **not** permanently store them in
          the model; they are used only for that evaluation. To persist parameter values on
          the model, use :meth:`set_parameters`.

        Examples
        --------
        Set all on-site energies:

        >>> tb.set_onsite([0.0, 1.0, 2.0]) 

        Add to a single orbital:

        >>> tb.set_onsite(100.0, ind_i=1, mode="add")  

        Overwrite a single orbital:

        >>> tb.set_onsite(0.0, ind_i=1, mode="set")

        Spinful on-site via 4-vector:

        >>> tb.set_onsite([1.0, 0.2, 0.0, -0.1], ind_i=0)

        Symbolic parameter:

        >>> tb.set_onsite("mA", ind_i=0)

        Callable parameter:

        >>> tb.set_onsite(lambda mA: mA**2, ind_i=0)

        Callable list over all orbitals with the same parameter but different
        functional forms:

        >>> tb.set_onsite([lambda mA: mA, lambda mA: 2*mA, lambda mA: 3*mA])

        Later usage:

        >>> H = tb.hamiltonian(k_pts, mA=1.2)
        >>> H = tb.hamiltonian(k_pts, mA=np.linspace(0, 2, 5))
        """
        # Handle deprecated 'reset' mode
        mode = mode.lower()
        if mode == "reset":
            logger.warning(
                "The 'reset' mode is deprecated as of v2.0. Use 'set' instead to set the onsite energy."
                "This will be removed in a future version."
            )
            mode = "set"

        def _process_single(val):
            # Accept callables (e.g., lambdas) – defer checks to evaluation time
            if callable(val):
                return ("callable", val)

            # Back-compat string path
            if isinstance(val, str):
                return ("expr", val)

            # Numeric/array/matrix path – convert to canonical onsite block now
            block = self._val_to_block(val)
            if self.nspin == 2 and not is_Hermitian(block):
                raise ValueError(
                    "Onsite terms should be real, or Hermitian for spinful models."
                )
            return ("block", block)

        # prechecks
        if ind_i is None:
            # when ind_i is not specified, onsite_en should be a list or array
            if not isinstance(onsite_en, (list, np.ndarray)):
                raise TypeError(
                    "When ind_i is not specified, onsite_en must be a list or array."
                )
            # the number of onsite energies must match the number of orbitals,
            if len(onsite_en) != self.norb:
                raise ValueError(
                    "List of onsite energies must include a value for every orbital."
                )

            items = list(onsite_en)
            indices = np.arange(self.norb)
        else:
            if not (0 <= ind_i < self.norb):
                raise ValueError(
                    "Index ind_i is not within the range of number of orbitals."
                )

            items = [onsite_en]
            indices = [ind_i]

        processed = [_process_single(v) for v in items]

        if mode == "set":
            for idx, (kind, payload) in zip(indices, processed):
                if self._site_energies_specified[idx]:
                    logger.warning(
                        f"Onsite energy for site {idx} was already set; resetting to the specified values."
                    )

                if kind == "block":
                    self._site_energies[idx] = payload
                    self._site_energies_specified[idx] = True
                    # Clear any previous param providers
                    self._onsite_param_terms[idx] = None
                else:
                    # callable/expr -> store for later evaluation
                    self._site_energies[idx] = (
                        0  # numeric placeholder, unused at build time
                    )
                    self._site_energies_specified[idx] = False
                    self._onsite_param_terms[idx] = (
                        payload  # payload is callable or str
                    )

        elif mode == "add":
            for idx, (kind, payload) in zip(indices, processed):
                if kind == "block":
                    self._site_energies[idx] += payload
                    self._site_energies_specified[idx] = True
                    # 'add' with a concrete block keeps any prior callable/expr ignored at build time
                    self._onsite_param_terms[idx] = None
                else:
                    # Adding a callable/expr: we interpret as "replace provider" (cannot 'add' unevaluated safely).
                    logger.warning(
                        f"'add' with a callable/string provider on site {idx} replaces the previous provider."
                    )
                    self._site_energies[idx] = 0
                    self._site_energies_specified[idx] = False
                    self._onsite_param_terms[idx] = payload
        else:
            raise ValueError("Mode should be either 'set' or 'add'.")


    def _get_flattened_indices(self):
        return self._hoptable.flatten_cache(self.norb)


[docs]
    def set_hop(
        self,
        hop_amp: float | complex | list | np.ndarray | str | Callable,
        ind_i: int,
        ind_j: int,
        ind_R=None,
        mode: str = "set",
        allow_conjugate_pair=False,
    ):
        r"""
        Define hopping amplitudes between tight-binding orbitals.

        This assigns matrix elements

        .. math::
            H_{ij}(\mathbf{R}) = \langle \phi_{0,i} | H | \phi_{\mathbf{R},j} \rangle

        between orbital ``i`` in the home cell and orbital ``j`` in the cell displaced
        by integer lattice vector :math:`\mathbf{R}` (in reduced coordinates).
        For periodic directions, hoppings contribute to the Bloch Hamiltonian with
        phase factors :math:`e^{i\mathbf{k}\cdot\mathbf{R}}`.

        Parameters
        ----------
        hop_amp : scalar, array_like, (2,2) ndarray, str, or callable
            Hopping amplitude specification.

            .. versionadded:: 2.0.0
                Symbolic expressions and callables are supported.

            Valid formats depend on whether ``spinful`` is True or False, and
            whether a single orbital index ``ind_i`` is specified or all orbitals
            are being set at once.

            - **Spinless models**  (``spinful=False``)

              - Complex scalar.

            - **Spinful models**  (``spinful=True``)

              - **Scalar** ``a`` -> :math:`a I_2` (same value for both spins).
              - **4-vector** ``[a, b, c, d]`` -> :math:`a I_2 + b \sigma_x + c \sigma_y + d \sigma_z`
              
                Explicitly, a 4-vector produces

                .. math::
                  \begin{pmatrix}
                  a+d & b - i c \\
                  b + i c & a-d
                  \end{pmatrix}.

              - **2x2 matrix** (Hermitian ndarray).
            
            - **Symbolic definitions**

              - String: symbolic expression in user-defined parameters.
              - Callable: ``f(param)`` returning any of the above forms.

        ind_i : int
            Index of the bra orbital (home cell).
        ind_j : int
            Index of the ket orbital (shifted cell).
        ind_R : array_like of int, optional
            Integer reduced-coordinate lattice vector specifying the cell of orbital ``j``.
            Components along non-periodic directions **must be zero**.  Attempting to hop
            across an open direction raises :class:`ValueError`. 
            If omitted, defaults to the zero vector.
        mode : {'set', 'add'}, optional
            Operation mode:

            - ``'set'``: replace the hopping value (default)
            - ``'add'``: add to existing value

            .. deprecated:: 2.0.0
                ``mode="reset"`` is deprecated. Use ``mode="set"`` instead.

        allow_conjugate_pair : bool, optional
            If ``False`` (default), the Hermitian conjugate term is automatically handled
            and specifying the opposite hopping is disallowed.  If ``True``, both entries
            may be set explicitly.

        See Also
        --------
        set_onsite : Define on-site terms.
        set_parameters : Permanently register parameter values.
        with_parameters : Return a new :class:`TBModel` with specified parameters.

        Notes
        -----
        - Only individual hopping terms may be defined; bulk hopping assignment is not supported.
        - Hermiticity is automatically enforced:

          .. math::
              H_{ji}(-\mathbf{R}) = \left[ H_{ij}(\mathbf{R}) \right]^* .

          Therefore, it is unnecessary to define both directions unless
          ``allow_conjugate_pair=True``.

        - When ``mode='add'`` the new value accumulates.
        - ``ind_R`` may only carry non-zero values along :attr:`periodic_dirs`.
        - Symbolic and callable inputs automatically register their parameter names. 
          For callables with multiple parameters, each parameter is registered.
        - Parameter evaluation is **scalar only**. Spinful on-site blocks
          must then be then be set with callables so that the returned values match 
          the expected spinful structure. 
        
          Example:

          .. code-block:: python

              # Spinful on-site via 4-vector with one parameter 'mA'
              tb.set_hop(lambda mA: [mA, 0.2, 0.0, -0.1], ind_i=0, ind_j=1, ind_R=[0,1]) 

              # Spinful on-site via full 2x2 matrix with two parameters 'mA' and 'mB'
              tb.set_hop(
                  lambda mA, mB: np.array([[mA + mB, 0.1 - 0.2j],
                                           [0.1 + 0.2j, mA - mB]]),
                  ind_i=1,
                  ind_j=1,
                  ind_R=[0,0]
              )

              # Calling Hamiltonian later with parameter values, for example:
              H = tb.hamiltonian(k_pts, mA=0.5, mB=[0, 1, 2, 3, 4])

              # Setting the parameters later:
              tb.set_parameters(mA=0.5, mB=1.0)
        
          Parameters values must later be supplied as scalars or 1D arrays to methods 
          such as :meth:`set_parameters`, :meth:`hamiltonian`, :meth:`velocity`, 
          :meth:`solve_ham`, etc., via keyword arguments. 
        - Providing parameter values to downstream observables such as :meth:`hamiltonian`,
          :meth:`velocity`, :meth:`solve_ham`, etc., does **not** permanently store them in
          the model; they are used only for that evaluation. To persist parameter values on
          the model, use :meth:`set_parameters`.

        Examples
        --------
        Hopping between orbital 0 (home cell) and orbital 2 in cell ``R=[0,1]``:

        >>> tb.set_hop(0.3+0.4j, 0, 2, [0, 1])

        Add to an existing hopping:

        >>> tb.set_hop(100.0, 0, 2, [0, 1], mode="add")

        Spinful hopping via 4-vector:

        >>> tb.set_hop([0.1, 0.0, 0.2, -0.1], 0, 1, [1, 0])

        Symbolic hopping:

        >>> tb.set_hop("t1", 0, 1, [1, 0])

        Callable hopping:

        >>> tb.set_hop(lambda t1: t1**2, 0, 1, [1, 0])

        Parametric hopping in spinful model via full 2x2 matrix:

        >>> tb.set_hop(
        ...     lambda t1, t2: np.array([[t1, 0.1 - 0.2j],
        ...                              [0.1 + 0.2j, t2]]),
        ...     0, 1, [1, 0]
        ... )

        Later usage:

        >>> H = tb.hamiltonian(k_pts, t1=0.5, t2=1.0)
        >>> H = tb.hamiltonian(k_pts, t1=np.linspace(0,1,5), t2=1.0)

        Attempting to hop along a non-periodic axis:

        >>> tb.set_hop(0.5, 0, 1, [0, 1, 0])
        Traceback (most recent call last):
            ...
        ValueError: ind_R may only have non-zero components along periodic directions ...
        """
        #### Prechecks and formatting ####
        mode = mode.lower()
        if mode == "reset":
            logger.warning(
                "The 'reset' mode is deprecated as of v2.0. Use 'set' instead to set the hopping term."
                "This will be removed in a future version."
            )
            mode = "set"

        table = self._hoptable

        ind_i, ind_j, R_vec = table.normalize_entry(
            ind_i,
            ind_j,
            ind_R,
            norb=self.norb,
            dim_k=self.dim_k,
            periodic_dirs=self.periodic_dirs,
        )

        # Do not allow onsite hoppings to be specified here
        if ind_i == ind_j and (self.dim_k == 0 or bool(np.all(R_vec == 0))):
            raise ValueError(
                "Do not use set_hop for onsite terms. Use set_onsite instead."
            )

        key = (ind_i, ind_j, tuple(R_vec.tolist()))
        existing_idx = table.find(ind_i, ind_j, R_vec)

        def _process_amp(val):
            # Accept callables (e.g., lambdas) – defer evaluation to build time
            if callable(val):
                return ("callable", val)
            # string
            if isinstance(val, str):
                return ("expr", val)
            # Numeric / array / matrix -> convert now
            block = self._val_to_block(
                val
            )  # may be complex; no Hermitian requirement for offsite
            return ("block", block)

        kind, payload = _process_amp(hop_amp)

        if not allow_conjugate_pair:
            conj_key = (ind_j, ind_i, tuple((-R_vec).tolist()))
            conj_idx = table.find(ind_j, ind_i, -R_vec)
            conj_in_providers = conj_key in getattr(self, "_hopping_param_terms", {})
            if conj_idx is not None or conj_in_providers:
                # If we're updating the exact same entry, allow it; otherwise error
                if existing_idx is None and key != conj_key:
                    raise ValueError(
                        f"Conjugate element already specified for i={ind_i}, j={ind_j}, R={R_vec.tolist()}. "
                        "Either avoid double entry or set allow_conjugate_pair=True."
                    )

        # Ensure provider dict exists
        if not hasattr(self, "_hopping_param_terms"):
            self._hopping_param_terms = {}

        if kind in ("callable", "expr"):
            # Provider path (deferred evaluation). We don't mix numeric state with parameters.
            if mode == "add":
                raise NotImplementedError(
                    "Adding parametric hopping terms is currently not supported."
                )
            # Remove any prior numeric or provider entry for this key
            if existing_idx is not None:
                table.remove(existing_idx)
            self._hopping_param_terms[key] = payload  # callable or str
            return

        # Numeric/matrix path
        hop_use = payload  # already canonicalized by _val_to_block

        # If a provider existed at this key, numeric input overrides it
        if key in self._hopping_param_terms:
            logger.warning(
                f"Overriding existing param-dependent hopping at {key} with a numeric block."
            )
            self._hopping_param_terms.pop(key, None)

        if mode == "set":
            if existing_idx is not None:
                table.update(existing_idx, amplitude=hop_use, R=R_vec)
            else:
                table.append(hop_use, ind_i, ind_j, R_vec)
        elif mode == "add":
            if existing_idx is not None:
                table.add(existing_idx, hop_use)
            else:
                table.append(hop_use, ind_i, ind_j, R_vec)
        else:
            raise ValueError(
                "Wrong value of mode parameter. Should be either `set` or `add`."
            )



[docs]
    def set_shell_hops(self, shell_hops: dict, mode="set"):
        r"""
        Set hopping amplitudes for entire nearest-neighbor shells.

        This assigns :math:`H_{ij}(\mathbf{R})` for **all** orbital pairs
        whose spatial separation lies in a given nearest-neighbor *shell*.
        Shells are numbered by increasing distance:
        shell 1 = nearest neighbors, shell 2 = next-nearest neighbors, etc.
        All hoppings within the same shell are assigned the same amplitude.

        Shell topology and distances are determined from the orbital positions
        :math:`\boldsymbol{\tau}_i` in the lattice.  Each key in ``shell_hops`` labels
        a shell index, and the associated amplitude is applied uniformly to every
        bond belonging to that shell.

        .. versionadded:: 2.0.0

        Parameters
        ----------
        shell_hops : dict[int, scalar | array_like | (2,2) ndarray | str | callable]
            Mapping ``shell`` -> ``amplitude``.  Keys are positive integers labeling
            neighbor shells. Values specify hopping strength. For spinful models,
            amplitudes may be

            - **scalar** ``a``  → :math:`a I_2`
            - **4-vector** ``[a,b,c,d]`` → :math:`a I + b\sigma_x + c\sigma_y + d\sigma_z`
            - **2×2 Hermitian ndarray**

            Symbolic strings or callables can also be supplied; in that case, parameter
            names are registered automatically and later passed as keyword arguments to
            :meth:`hamiltonian`, :meth:`solve_ham`, etc.

        mode : {'set', 'add'}, default='set'
            Operation mode:

            - ``'set'``: replace existing hopping values
            - ``'add'``: add to existing values

        Notes
        -----
        - All hopping terms in the same shell receive *exactly* the same amplitude.
        - Shell identification is based purely on distance; degeneracies or direction
          are not distinguished.
        - Parameterized (symbolic/callable) shell amplitudes follow the same rules as
          in :meth:`set_hop`. Callables receive parameters exclusively as keyword
          arguments.
        - Parameter values supplied to :meth:`hamiltonian` (etc.) are not permanently
          stored in the model; use :meth:`set_parameters` to persist them.

        Examples
        --------
        Nearest- and next-nearest-neighbor hopping:

        >>> tb.set_shell_hops({1: 1.0, 2: 0.5})

        Only nearest‐neighbor hopping:

        >>> tb.set_shell_hops({1: 1.0})

        Spinful shell assignment via 4-vector:

        >>> tb.set_shell_hops({1: [1.0, 0.1, 0.0, -0.1]})

        Symbolic parameterized NN hopping:

        >>> tb.set_shell_hops({1: "t"})

        Callable hopping:

        >>> tb.set_shell_hops({1: lambda t: 0.2 * np.cos(t)})

        Evaluate later:

        >>> evals = tb.solve_ham(k_pts, t=0.3)

        """
        if not isinstance(shell_hops, dict):
            raise TypeError(
                "shell_hops must be a dictionary mapping shell index to hopping amplitude."
            )

        nn_shells = list(shell_hops.keys())
        if len(nn_shells) == 0:
            raise ValueError("shell_hops must have at least one element.")
        if not all(isinstance(shell, int) and shell > 0 for shell in nn_shells):
            raise ValueError("Each element in nn_shells must be a positive integer.")

        max_shell = max(nn_shells)
        shell_bonds = self.nn_bonds(max_shell)[1]

        for shell_idx, shell in enumerate(shell_bonds):
            amp = shell_hops.get(shell_idx + 1, None)
            if amp is None:
                continue
            for bond in shell:
                i, j, R = bond
                self.set_hop(amp, i, j, R, mode=mode, allow_conjugate_pair=True)


    def _append_hops(self, hop_amps, i_idx, j_idx, R_vecs):
        hop_amps = np.asarray(hop_amps)
        i_idx = np.asarray(i_idx, dtype=int)
        j_idx = np.asarray(j_idx, dtype=int)
        R_vecs = np.asarray(R_vecs, dtype=int).reshape(len(i_idx), self.dim_r)

        blocks = [self._val_to_block(val) for val in hop_amps]
        self._hoptable.extend(
            blocks,
            i_idx.tolist(),
            j_idx.tolist(),
            R_vecs.tolist(),
        )

    def _val_to_block(self, val):
        r"""
        Convert input value to appropriate matrix block for onsite or hopping.

        For spinful=False, returns the value (should be real or complex scalar).
        For spinful=True:
            - Scalar: returns a 2 x 2 matrix proportional to the identity.
            - Array with up to four elements: returns a 2 x 2 matrix as
              :math:`a I + b \sigma_x + c \sigma_y + d \sigma_z`.
            - 2 x 2 matrix: returns the matrix as is.

        Parameters
        ----------
        val : float, complex, list, np.ndarray
            Value to convert.

        Returns
        -------
        float, complex, or np.ndarray
            Matrix block for onsite or hopping.
        """
        # spinless case
        if not self.spinful:
            if not isinstance(
                val, (int, np.integer, np.floating, float, complex, np.complexfloating)
            ):
                raise TypeError("For spinless case, value must be a scalar.")
            return val

        # spinful case: construct 2x2 matrix
        coeffs = np.array(val, dtype=complex)
        paulis = [SIGMA0, SIGMAX, SIGMAY, SIGMAZ]
        if coeffs.shape == ():
            # scalar -> identity
            return coeffs * SIGMA0
        elif coeffs.shape == (4,):
            block = sum([val * paulis[i] for i, val in enumerate(coeffs)])
        elif coeffs.shape == (2, 2):
            block = coeffs
        else:
            raise TypeError(
                "For spinful models, value should be a scalar, length-4 iterable, or 2x2 array."
            )
        return block

    def _clear_param_terms(self, onsite_idx=None, hop_key=None):
        if onsite_idx is not None:
            self._onsite_param_terms.pop(onsite_idx, None)
        if hop_key is not None:
            canonical = tuple(hop_key) if len(hop_key) == 3 else hop_key
            self._hopping_param_terms.pop(canonical, None)

    def _provider_names(self, provider, *, ctx):
        if callable(provider):
            params = tuple(_iter_params_of_callable(provider))
            if not params:
                raise ValueError(f"{ctx} callable must declare at least one parameter.")
            return params
        if isinstance(provider, str):
            return (provider,)
        raise TypeError(f"Unsupported {ctx} provider type: {type(provider)}")

    def _check_missing_parameters(self, params: dict):
        """Check for missing parameters in the provided dictionary."""
        required = {name for entry in self.parameters for name in entry["names"]}
        provided = set(params.keys())

        unknown = provided - required
        if unknown:
            raise ValueError("Unknown parameter name(s): " + ", ".join(sorted(unknown)))

        missing = required - provided
        if missing:
            raise ValueError(
                "Missing parameter value(s): " + ", ".join(sorted(missing))
            )

    def _params_to_sweep(self, params: dict):
        """Partition parameters into scalars and sweeps."""
        # Partition params into scalars vs sweeps (1D arrays/lists)
        sweep_names: list[str] = []
        sweep_values: list[
            list[object]
        ] = []  # list of per-parameter lists of scalar values
        scalars: dict[str, object] = {}

        for name, raw in params.items():
            # Treat 1D arrays / lists / tuples as sweep axes; everything else as scalar
            if isinstance(raw, (list, tuple, np.ndarray)):
                raw = np.asarray(raw)

                if raw.ndim == 0:
                    # 0D array -> scalar
                    scalars[name] = raw.item()
                    continue
                elif raw.ndim == 1:
                    # keep raw values as-is so lambdas see original dtype (float/complex/etc.)
                    values = (
                        list(raw)
                        if not isinstance(raw, np.ndarray)
                        else [raw[i] for i in range(raw.shape[0])]
                    )
                    if len(values) == 0:
                        raise ValueError(
                            f"Parameter sweep '{name}' must provide at least one value."
                        )
                    sweep_names.append(name)
                    sweep_values.append(values)
                elif raw.ndim == 2:
                    # Single-row array -> single value sweep
                    if raw.shape[0] == 1:
                        scalars[name] = raw[0, :].copy()
                    # Single-column array -> scalar sweep
                    elif raw.shape[1] == 1:
                        scalars[name] = raw[:, 0].copy()
                    # Full 2x2 matrix
                    elif raw.shape == (2, 2):
                        if not self.spinful:
                            raise ValueError(
                                f"Parameter '{name}' is a 2x2 array, but the model is spinless."
                            )
                        scalars[name] = raw.copy()
                    # Pauli 4-vector
                    elif raw.shape[1] == 4:
                        if not self.spinful:
                            raise ValueError(
                                f"Parameter '{name}' has shape {raw.shape}, but the model is spinless."
                            )
                        sweep_names.append(name)
                        sweep_values.append(
                            [raw[i, :].copy() for i in range(raw.shape[0])]
                        )

            elif isinstance(raw, (int, float, complex)):
                # single scalar value
                scalars[name] = raw
            else:
                raise TypeError(
                    f"Parameter '{name}' has unsupported type {type(raw)}. "
                    "Expected scalar, list, tuple, or numpy.ndarray."
                )

        return scalars, sweep_names, sweep_values

    def _evaluate_params(self, assignments: dict):
        """Evaluate the model with given parameter assignments.

        Parameters
        ----------
        assignments : dict
            Dictionary mapping parameter names to their values.
            The form is expected to match the parameters used in
            the symbolic expressions or callables defined in the model.
            For example, if the model has a parameter 't', then
            assignments should include an entry like {'t': 1.0}.

        Returns
        -------
        hop_amps : np.ndarray
            Hopping amplitudes after evaluation.
        i_idx : np.ndarray
            Indices of the 'from' orbitals.
        j_idx : np.ndarray
            Indices of the 'to' orbitals.
        R_vecs : np.ndarray
            Lattice vectors for each hopping.
        site : np.ndarray
            On-site energies after evaluation.
        """
        # ---- copy base hops and onsite (immutable per evaluation) ----
        base_hop_amps, base_i_idx, base_j_idx, base_R_vecs = self._hoptable.components()

        hop_amps = np.array(base_hop_amps, copy=True)  # copy!
        i_idx = np.array(base_i_idx, copy=True)
        j_idx = np.array(base_j_idx, copy=True)
        R_vecs = np.array(base_R_vecs, copy=True)

        site = np.asarray(self._site_energies, dtype=complex).copy()  # copy!
        # ---- onsite providers ----
        for idx, term in getattr(self, "_onsite_param_terms", {}).items():
            if term is None:
                continue
            if callable(term):
                val = _call_provider(term, assignments)
                block = self._val_to_block(val)
            elif isinstance(term, str):
                block = self._eval_expr_to_block(term, **assignments)
            else:
                raise TypeError("Unsupported onsite provider type.")
            if self.nspin == 2 and not is_Hermitian(block):
                raise ValueError(
                    f"Onsite callable for site {idx} returned non-Hermitian 2×2."
                )
            site[idx] = np.asarray(block, dtype=complex)

        # collect param-dependent hops without mutating arrays in-place
        dyn_blocks = []
        dyn_i = []
        dyn_j = []
        dyn_R = []

        for key, term in getattr(self, "_hopping_param_terms", {}).items():
            if callable(term):
                val = _call_provider(term, assignments)
                block = self._val_to_block(val)
            elif isinstance(term, str):
                block = self._eval_expr_to_block(term, **assignments)
            else:
                raise TypeError("Unsupported hopping provider type.")
            dyn_blocks.append(np.asarray(block, dtype=complex)[None, ...])
            dyn_i.append(key[0])
            dyn_j.append(key[1])
            dyn_R.append(list(key[2]) if len(key) > 2 else [0] * self.dim_k)

        if dyn_blocks:
            hop_amps = np.concatenate([hop_amps] + dyn_blocks, axis=0)
            i_idx = np.concatenate([i_idx, np.asarray(dyn_i, dtype=i_idx.dtype)])
            j_idx = np.concatenate([j_idx, np.asarray(dyn_j, dtype=j_idx.dtype)])
            R_vecs = np.concatenate(
                [R_vecs, np.asarray(dyn_R, dtype=R_vecs.dtype)], axis=0
            )

        return hop_amps, i_idx, j_idx, R_vecs, site

    def _normalize_parameter_axis(self, values, *, name, period=None):
        """
        Normalize a 1D parameter sweep and report metadata for finite differences.

        Returns
        -------
        values_unique : np.ndarray
            Copy of the input with any duplicated endpoint removed.
        step : float
            Uniform spacing between samples (computed before trimming so the “true” step is kept).
        is_periodic : bool
            True if the sweep spans a full cycle.
        trimmed : bool
            True when the final element was dropped because it duplicated the first.
        """
        arr = np.asarray(values, dtype=float)
        if arr.ndim != 1 or arr.size < 2:
            raise ValueError(
                f"Parameter '{name}' must be one-dimensional with at least two samples."
            )

        diffs = np.diff(arr)
        if not np.allclose(diffs, diffs[0]):
            raise ValueError(f"Parameter '{name}' must be uniformly spaced.")
        step = float(diffs[0])

        periodic = False
        trimmed = False
        if period is not None:
            period = float(period)
            span = arr[-1] - arr[0]
            if np.isclose(span, period):
                arr = arr[:-1]
                periodic = True
                trimmed = True
            elif np.isclose(step * arr.size, period):
                periodic = True
        else:
            if np.isclose(arr[-1], arr[0]):
                arr = arr[:-1]
                periodic = True
                trimmed = True

        return arr.copy(), step, periodic, trimmed

    def _eval_expr_to_block(self, expr: str, **assignments):
        """Evaluate a string expression with the given parameter values and cast it to a block."""
        env = {"np": np, "numpy": np, "pi": np.pi, "complex": complex, "float": float}
        env.update(assignments)
        try:
            value = eval(expr, {"__builtins__": {}}, env)
        except NameError as exc:
            missing = exc.args[0].split("'")[1]
            raise ValueError(
                f"Expression '{expr}' needs a value for parameter '{missing}'."
            ) from None
        except Exception as exc:
            raise ValueError(f"Could not evaluate expression '{expr}': {exc}") from exc
        return self._val_to_block(value)


[docs]
    def set_parameters(self, params=None, /, **kwargs):
        r"""
        Materialize parameterized on-site and hopping terms at fixed scalar values.

        Any entries previously defined via :meth:`set_onsite` or :meth:`set_hop` with
        a **string** or **callable** provider are evaluated using the supplied parameter
        values. The resulting numerics are then written back through the same APIs so
        all standard validation (Hermiticity, conjugate handling, shape checks) applies.

        Parameters
        ----------
        params : Mapping[str, Any], optional
            Dictionary mapping parameter names to **scalar** values. Use this when
            a name is not a valid Python identifier (e.g. contains spaces or ``-``).
            If both ``params`` and ``kwargs`` are given, values in ``kwargs`` **override**
            those from ``params``.
        **kwargs
            Additional ``name=value`` overrides for parameters whose names are valid
            identifiers (e.g. ``tb.set_parameters(beta=0.3)``).

        See Also
        --------
        with_parameters : Create a new TBModel instance with parameter-dependent terms evaluated.
            leaving the original unchanged.
        set_onsite : Define on-site terms (may be symbolic/callable).
        set_hop : Define hopping terms (may be symbolic/callable).

        Notes
        -----
        - Values must be Python scalars; 0-D NumPy scalars are
          unwrapped via ``.item()``. Use keyword parameters to :meth:`hamiltonian`,
          :meth:`solve_ham`, etc., for **array sweeps** (those are ephemeral).
        - Providers whose full parameter lists are not covered
          by the supplied values are left as-is; you can freeze parameters
          incrementally across calls.
        - After a provider is fully evaluated, it is **removed** and
          replaced by its numeric value; subsequent Hamiltonian builds no longer
          depend on external parameter kwargs.
        - When both ``params`` and ``kwargs`` specify the same name,
          the value from ``kwargs`` wins.

        Examples
        --------
        Freeze two parameters at once:

        >>> tb.set_onsite(lambda m: [m, -m], ind_i=None)
        >>> tb.set_hop(lambda t: t * np.eye(2), 0, 1, [0, 0])
        >>> tb.set_parameters(m=0.4, t=1.2)  # providers removed, numeric values stored

        Use a dict for a non-identifier name, override via kwargs:

        >>> tb.set_onsite(lambda m_A: m_A, ind_i=0)
        >>> tb.set_parameters({"m-A": 0.1, "m_A": 0.2}, m_A=0.3)  # m_A=0.3 overrides

        Keep one parameter symbolic (partial freeze):

        >>> tb.set_hop(lambda t, phi: t * np.exp(1j*phi), 0, 2, [1, 0])
        >>> tb.set_parameters(t=0.5)  # still depends on 'phi'
        """
        merged = {}
        if params is not None:
            if not isinstance(params, Mapping):
                raise TypeError(
                    "params must be a mapping of parameter names to values."
                )
            merged.update(params)
        merged.update(kwargs)
        if not merged:
            return

        cleaned = {}
        for name, value in merged.items():
            if isinstance(value, np.ndarray):
                if value.ndim != 0:
                    raise TypeError(f"Parameter '{name}' must be a scalar.")
                value = value.item()
            if not np.isscalar(value):
                raise TypeError(f"Parameter '{name}' must be a scalar.")
            cleaned[name] = value

        # onsite
        for idx, provider in list(getattr(self, "_onsite_param_terms", {}).items()):
            if provider is None:
                continue
            names = self._provider_names(provider, ctx=f"onsite[{idx}]")
            if any(name not in cleaned for name in names):
                continue
            if callable(provider):
                block = _call_provider(
                    provider, {name: cleaned[name] for name in names}
                )
            else:
                block = cleaned[names[0]]
            self.set_onsite(block, ind_i=idx, mode="set")  # reuse existing validation

        # hoppings
        for key, provider in list(getattr(self, "_hopping_param_terms", {}).items()):
            if provider is None:
                continue
            i, j, R = key
            names = self._provider_names(provider, ctx=f"hopping[{i},{j},{tuple(R)}]")
            if any(name not in cleaned for name in names):
                continue
            if callable(provider):
                block = _call_provider(
                    provider, {name: cleaned[name] for name in names}
                )
            else:
                block = cleaned[names[0]]

            if self.dim_k == 0:
                self.set_hop(block, i, j, mode="set", allow_conjugate_pair=True)
            else:
                self.set_hop(
                    block, i, j, list(R), mode="set", allow_conjugate_pair=True
                )



[docs]
    def with_parameters(self, params=None, /, **kwargs) -> "TBModel":
        r"""
        Create a new TBModel instance with parameter-dependent terms evaluated
        at the supplied scalar values.

        This function is similar to `set_parameters`, but instead of modifying
        the current model in place, it returns a new model instance where all
        parameter-dependent onsite and hopping terms have been evaluated at
        the provided values.

        .. versionadded:: 2.0.0

        Parameters
        ----------
        params : Mapping[str, Any], optional
            Dictionary mapping parameter names to **scalar** values. Use this when
            a name is not a valid Python identifier (e.g. contains spaces or ``-``).
            If both ``params`` and ``kwargs`` are given, values in ``kwargs`` **override**
            those from ``params``.
        **kwargs
            Additional ``name=value`` overrides for parameters whose names are valid
            identifiers (e.g. ``tb.set_parameters(beta=0.3)``).

        Returns
        -------
        new_model : TBModel
            A new TBModel instance with parameter-dependent terms evaluated.

        See Also
        --------
        set_parameters : Evaluate parameter-dependent terms in place.
        """
        merged = {}
        if params is not None:
            if not isinstance(params, Mapping):
                raise TypeError(
                    "params must be a mapping of parameter names to values."
                )
            merged.update(params)
        merged.update(kwargs)

        if not merged:
            return self.copy()

        cleaned = {}
        for name, value in merged.items():
            if isinstance(value, np.ndarray):
                if value.ndim != 0:
                    raise TypeError(f"Parameter '{name}' must be a scalar.")
                value = value.item()
            if not np.isscalar(value):
                raise TypeError(f"Parameter '{name}' must be a scalar.")
            cleaned[name] = value

        new_model = self.copy()
        new_model.set_parameters(cleaned)
        return new_model


    ###### Lattice manipulation #########


[docs]
    def add_orb(self, orb_pos):
        """Adds a new orbital to the model with the specified coordinates.

        The orbital coordinate must be given in reduced
        coordinates, i.e. in units of the real-space lattice vectors
        of the model. The new orbital is added at the end of the list
        of orbitals, and the orbital index is set to the next available
        index.

        .. versionadded:: 2.0.0

        Parameters
        ----------
        orb_pos : array_like, float
            The reduced coordinates of the new orbital of length ``dim_r``. If
            ``orb_pos`` is a single float or int, it will be converted to a 1D array
            (``dim_r`` must be 1).
        """

        # Append orbital position
        self._lattice.add_orb(orb_pos)

        # Append default site energy and specified flag
        if not self.spinful:
            self._site_energies = np.append(self._site_energies, 0.0)
        else:
            new_block = np.zeros((1, 2, 2), dtype=complex)
            self._site_energies = np.vstack([self._site_energies, new_block])
        self._site_energies_specified = np.append(self._site_energies_specified, False)

        # No hoppings are added by default


[docs]
    def remove_orb(self, to_remove):
        r"""Removes specified orbitals from the model.

        Parameters
        ----------
        to_remove : array-like or int
            List of orbital indices to be removed, or index of single orbital to be removed

        Notes
        -----
        Removing orbitals will reindex the orbitals with indices higher
        than those that are removed. For example, if model has 6 orbitals
        and you remove the 2nd orbital, then the orbitals 3-6 will be
        reindexed to 2-5 (Python counting). Indices of first two orbitals (0 and 1)
        are unaffected.

        Examples
        --------
        If original_model has say 10 orbitals then returned small_model will
        have only 8 orbitals.

        >>> small_model = original_model.remove_orb([2,5])

        """
        if isinstance(to_remove, int):
            indices = [to_remove]
        elif isinstance(to_remove, (list, np.ndarray)):
            indices = list(to_remove)
        else:
            raise TypeError("to_remove must be an integer or a list of integers.")

        for index in indices:
            if not isinstance(index, int):
                raise TypeError("All indices in to_remove must be integers.")
            if index < 0 or index >= self.norb:
                raise ValueError("Index out of bounds.")

        # check that all indices are unique
        if len(indices) != len(set(indices)):
            raise ValueError("All indices in to_remove must be unique.")

        # put the orbitals to be removed in descending order
        orb_index = sorted(indices, reverse=True)

        self._lattice.remove_orb(orb_index)

        # remove indices one by one
        for _, orb_ind in enumerate(orb_index):
            self._site_energies = np.delete(self._site_energies, orb_ind, 0)
            self._site_energies_specified = np.delete(
                self._site_energies_specified, orb_ind
            )

        self._hoptable.remove_orbitals(orb_index)



[docs]
    def cut_piece(self, num_cells, periodic_dir, glue_edges=False) -> "TBModel":
        r"""Cut a (d-1)-dimensional piece out of a d-dimensional tight-binding model.

        Constructs a (d-1)-dimensional tight-binding model out of a
        d-dimensional one by repeating the unit cell a given number of
        times along one of the periodic lattice vectors.

        Parameters
        ----------
        num_cells : int
            How many times to repeat the unit cell.

            .. versionchanged:: 2.0.0
                Renamed from ``num`` for clarity.

        periodic_dir : int
            Index of the periodic lattice vector along which to make the system finite.

            .. versionchanged:: 2.0.0
                Renamed from ``fin_dir`` for clarity.

        glue_edges : bool, optional
            If True, allow hoppings from one edge to the other of a cut model.

        Returns
        -------
        cut_model : TBModel
            Object of type :class:`pythtb.TBModel` representing a cutout
            tight-binding model.

        See Also
        --------
        :ref:`cubic-slab-hwf-nb` : For an example
        :ref:`three-site-thouless-nb` : For an example

        Notes
        -----
        - Orbitals in ``cut_model`` are numbered so that the `i`-th orbital of the `n`-th unit
          cell has index ``i + norb * n`` (here `norb` is the number of orbitals in the original model).
        - The real-space lattice vectors of the returned model are the same as those of
          the original model; only the dimensionality of reciprocal space
          is reduced.

        Examples
        --------
        Construct two-dimensional model B out of three-dimensional model A
        by repeating model along second lattice vector ten times


        >>> A = TBModel(Lattice([[1.0, 0.0, 0.0],
        ...                      [0.0, 1.0, 0.0],
        ...                      [0.0, 0.0, 1.0]], ...))
        >>> B = A.cut_piece(10, 1)

        Further cut two-dimensional model B into one-dimensional model
        A by repeating unit cell twenty times along third lattice
        vector and allow hoppings from one edge to the other

        >>> C = B.cut_piece(20, 2, glue_edges=True)

        """
        if not isinstance(num_cells, int) or num_cells < 1:
            raise ValueError("num_cells must be a positive integer.")
        if not isinstance(periodic_dir, int) or periodic_dir not in self.periodic_dirs:
            raise ValueError(
                "periodic_dir must be an integer corresponding to one of the periodic directions."
            )
        if not isinstance(glue_edges, bool):
            raise ValueError("glue_edges must be a boolean.")
        if self.dim_k == 0:
            raise ValueError("Can't cut a piece out of a finite sample.")

        # TODO: Why can't num_cells be 1 if glue_edges is False?
        if num_cells == 1 and glue_edges:
            raise ValueError("Can't have `num=1` and gluing of the edges!")

        lat_fin = self.lattice.cut_piece(num_cells, periodic_dir)
        cut_model = TBModel(lat_fin, spinful=self.spinful)

        onsite = []  # store onsite energies
        for _ in range(num_cells):  # go over all cells in finite direction
            for j in range(self.norb):  # go over all orbitals in one cell
                # do the onsite energies at the same time
                onsite.append(self._site_energies[j])
        onsite = np.array(onsite)
        cut_model.set_onsite(onsite, mode="set")

        # replicate parameterised onsite providers
        onsite_providers = getattr(self, "_onsite_param_terms", {})
        if onsite_providers:
            for c in range(num_cells):
                base = c * self.norb
                for idx, provider in onsite_providers.items():
                    if provider:
                        cut_model.set_onsite(provider, ind_i=base + idx, mode="set")

        # remember if came from w90
        cut_model.assume_position_operator_diagonal = (
            self.assume_position_operator_diagonal
        )
        cut_model._from_w90 = self._from_w90

        amps, from_idx, to_idx, R_vecs = self._hoptable.components()
        for c in range(num_cells):
            for amp, ind_i, ind_j, ind_R in zip(
                amps, from_idx, to_idx, R_vecs, strict=True
            ):
                hop_amp = amp.copy() if self.spinful else complex(amp)
                R_vec = ind_R.copy()
                jump_fin = int(R_vec[periodic_dir])

                hi = int(ind_i) + c * self.norb
                hj = int(ind_j) + (c + jump_fin) * self.norb

                if cut_model.dim_k != 0:
                    R_vec[periodic_dir] = 0
                    R_arg = R_vec
                else:
                    R_arg = None

                to_add = True
                if not glue_edges:
                    if hj < 0 or hj >= self.norb * num_cells:
                        to_add = False
                else:
                    hj = int(hj) % int(self.norb * num_cells)

                if to_add:
                    cut_model.set_hop(
                        hop_amp,
                        hi,
                        hj,
                        R_arg,
                        mode="add",
                        allow_conjugate_pair=True,
                    )

        # replicate parameterised hoppings
        param_hops = getattr(self, "_hopping_param_terms", {})
        if param_hops:
            for c in range(num_cells):
                base = c * self.norb
                for (ind_i, ind_j, R_tuple), provider in param_hops.items():
                    R_vec = np.array(R_tuple, dtype=int)
                    jump_fin = int(R_vec[periodic_dir])

                    hi = int(ind_i) + base
                    hj = int(ind_j) + (c + jump_fin) * self.norb

                    if cut_model.dim_k != 0:
                        R_copy = R_vec.copy()
                        R_copy[periodic_dir] = 0
                        R_arg = R_copy
                    else:
                        R_arg = None

                    if not glue_edges:
                        if hj < 0 or hj >= self.norb * num_cells:
                            continue
                    else:
                        hj = hj % (self.norb * num_cells)

                    cut_model.set_hop(
                        provider,
                        hi,
                        hj,
                        R_arg,
                        mode="set",
                        allow_conjugate_pair=True,
                    )

        return cut_model



[docs]
    def make_finite(
        self,
        periodic_dirs: list[int],
        num_cells: list[int],
        glue_edges: list[bool] = None,
    ) -> "TBModel":
        r"""Returns a finite model.

        This function constructs a finite tight-binding model by removing periodicity
        along specified directions. The resulting model has open boundary conditions
        along those directions, with the option to glue edges together.

        .. versionadded:: 2.0.0

        Parameters
        ----------
        periodic_dirs : list[int]
            List of indices of periodic directions along which
            you wish to make the model finite.
        num_cells : list[int]
            Number of unit cells of the sample along each periodic direction.
        glue_edges : list[bool], optional
            If True, allow hoppings from one edge to the other of a cut model
            along the corresponding direction. If None (default), no edge gluing
            is performed along any direction and we have open boundary conditions.

        Returns
        -------
        finite : :class:`pythtb.TBModel`
            A model whose periodic hoppings have been removed (OBC model).

        See Also
        --------
        :meth:`cut_piece` : Cut a lower-dimensional piece out of a higher-dimensional model.
        :ref:`haldane-nb` : For an example
        :ref:`haldane-edge-nb` : For an example
        :ref:`fkm-nb` : For an example
        :ref:`local-chern-nb` : For an example

        Notes
        -----
        - This function applies :meth:`cut_piece` iteratively along each specified direction.
          The order of directions in `dirs` determines the sequence of cuts.
        - Orbitals in the returned model are numbered so that the `i`-th orbital of the `n`-th unit
          cell along the first direction in `dirs`, the `m`-th unit cell along the second direction in `dirs`, etc.,
          has index ``i + norb * (n + m * num_cells[0] + ...)`` (here `norb` is the number of orbitals in the original model).
        - The real-space lattice vectors of the returned model are the same as those of
          the original model; only the dimensionality of reciprocal space
          is reduced.

        Examples
        --------
        Construct a two-dimensional finite model by removing periodicity
        along both lattice vectors of a two-dimensional model
        >>> lat = Lattice([[1.0, 0.0], [0.0, 1.0]], [[0.0, 0.0]], periodic_dirs=[0,1])
        >>> tb = TBModel(lat)
        >>> fin_tb = tb.make_finite(periodic_dirs=[0, 1], num_cells=[10, 5])
        >>> fin_tb.dim_k
        0
        >>> fin_tb.norb
        50
        """
        if self.dim_k == 0:
            raise ValueError("Model is already finite!")
        if not all(d in self.periodic_dirs for d in periodic_dirs):
            raise ValueError("All directions in `periodic_dirs` must be periodic.")
        if len(periodic_dirs) != len(set(periodic_dirs)):
            raise ValueError("All directions in `periodic_dirs` must be unique.")
        if len(periodic_dirs) != len(num_cells):
            raise ValueError(
                "Length of `periodic_dirs` must match length of `num_cells`."
            )
        if not all(n_cell > 0 for n_cell in num_cells):
            raise ValueError(
                "Number of sites along finite direction must be greater than 0"
            )

        if glue_edges is not None:
            if len(glue_edges) != len(num_cells):
                raise ValueError(
                    "Length of `glue_edges` must match number of periodic directions."
                )
        else:
            glue_edges = [False] * self.dim_k

        cut = self
        for idx, n_cell in enumerate(num_cells):
            cut = cut.cut_piece(
                num_cells=n_cell,
                periodic_dir=periodic_dirs[idx],
                glue_edges=glue_edges[idx],
            )

        return cut


    # This function is being deprecated. The preferred way to reduce dimensionality
    # is to use `make_finite` with `num_cells=1` along the desired directions.
    # This approach is more general and can handle multiple directions at once.
    # If the intention is to keep periodicity along all directions while keeping some
    # k-values fixed, this can be achieved by using the `hamiltonian` method passing the
    # desired k-values. Explicit manipulation of k-space sampling in the model is discouraged. k-space
    # sampling is managed by 'Mesh' and 'WFArray' classes.

[docs]
    @deprecated(
        "use `make_finite` or `cut_piece` with ``num_cells=1`` along the desired directions instead (since v2.0).",
        category=FutureWarning,
    )
    def reduce_dim(self) -> "TBModel":
        r"""
        .. deprecated:: 2.0.0
            Use :meth:`make_finite` or :meth:`cut_piece` with ``num_cells=1`` along the desired
            directions instead.
            If the intention is to keep periodicity along all directions while keeping some
            k-values fixed, this can be achieved by using the :meth:`hamiltonian` method
            passing the desired k-values.
        """
        pass



[docs]
    def change_nonperiodic_vector(
        self,
        fin_dir: int,
        new_latt_vec: np.ndarray = None,
        to_home: bool = True,
    ):
        """Change non-periodic lattice vector

        Changes one of the non-periodic "lattice vectors". Non-periodic lattice vectors
        are those that are *not* listed as periodic in the :attr:`periodic_dirs` parameter.
        The orbital vectors are modified accordingly so that the actual (Cartesian) coordinates of
        orbitals remain unchanged.

        .. versionremoved:: 2.0.0
            Parameter `to_home_supress_warning` has been removed.

        Parameters
        ----------
        fin_dir : int
            Index of non-periodic lattice vector to change.

            .. versionchanged:: 2.0.0
                Renamed from ``np_dir`` for clarity and consistency.

        new_latt_vec : array_like, optional
            The new non-periodic lattice vector. If None (default), the new
            non-periodic lattice vector is constructed to be orthogonal to all periodic
            vectors and to have the same length as the original non-periodic vector.

        to_home : bool, optional
            If ``True`` (default), shift all orbitals to the home cell along
            periodic directions. Default behavior is to shift orbitals
            to the home cell.

            .. versionchanged:: 2.0.0
                This parameter was previously not working as intended and is now fixed.

        See Also
        --------
        :ref:`boron-nitride-nb` : For an example.

        Notes
        -----
        - This function is especially useful after using function cut_piece to create slabs,
          rods, or ribbons.
        - By default, the new non-periodic vector is constructed
          from the original by removing all components in the periodic
          space. This ensures that the Berry phases computed in the
          periodic space correspond to the usual expectations.
        - For example, after this change, the Berry phase computed for a
          ribbon depends only on the location of the Wannier center
          in the extended direction, not on its location in the
          transverse direction. Alternatively, the new non-periodic
          vector can be set explicitly via the ``new_latt_vec`` parameter.

        Examples
        --------
        Modify slab model so that non-periodic third vector is perpendicular to the slab

        >>> tb.change_nonperiodic_vector(2)
        """
        self._lattice.change_nonperiodic_vector(fin_dir, new_latt_vec)

        if to_home:
            self._shift_hop_to_home()
            self._lattice._shift_orb_to_home()



[docs]
    def make_supercell(
        self,
        sc_red_lat,
        return_sc_vectors: bool = False,
        to_home: bool = True,
    ) -> "TBModel":
        """Make model on a super-cell.

        Constructs a :class:`pythtb.TBModel` representing a super-cell
        of the current object. This function can be used together with :func:`cut_piece`
        in order to create slabs with arbitrary surfaces.

        By default all orbitals will be shifted to the home cell after
        unit cell has been created. That way all orbitals will have
        reduced coordinates between 0 and 1. If you wish to avoid this
        behavior, you need to set, *to_home* argument to *False*.

        .. versionremoved:: 2.0.0
            Parameter `to_home_supress_warning` has been removed.

        Parameters
        ----------
        sc_red_lat : array-like
          Super-cell lattice vectors in terms of reduced coordinates
          of the original tight-binding model. Shape must be
          ``(dim_r, dim_r)``. First index in the array specifies super-cell vector,
          while second index specifies coordinate of that super-cell vector.

          If `dim_k` < `dim_r` then still need to specify full array with
          size ``(dim_r, dim_r)`` for consistency, but non-periodic
          directions must have 0 on off-diagonal elements and 1 on
          diagonal.

        return_sc_vectors : bool, optional
            Default value is ``False``. If ``True`` returns also lattice vectors
            inside the super-cell. Internally, super-cell tight-binding model will
            have orbitals repeated in the same order in which these
            super-cell vectors are given, but if argument `to_home`
            is set ``True`` (which it is by default) then additionally,
            orbitals will be shifted to the home cell.

        to_home : bool, optional
            Default value is ``True``. If ``True`` will shift all orbitals
            to the home cell along periodic directions.

        Returns
        -------
        sc_tb : :class:`pythtb.TBModel`
            Tight-binding model in a super-cell.

        sc_vectors : :class:`numpy.ndarray`, optional
          Super-cell vectors, returned only if
          `return_sc_vectors` is set to ``True`` (default value is
          ``False``).

        Notes
        -----
        The super-cell is constructed by repeating the original unit cell
        according to the specified super-cell lattice vectors. The resulting
        model will have a larger Brillouin zone and may exhibit different
        electronic properties compared to the original model.

        Examples
        --------
        Create super-cell out of 2d tight-binding model ``tb``

        >>> sc_tb = tb.make_supercell([[2, 1], [-1, 2]])
        """
        geom = self._lattice._prepare_supercell_geometry(sc_red_lat)

        # get super-cell vectors in cartesian coordinates
        sc_vec = geom["translations"]
        num_sc = sc_vec.shape[0]

        lat = Lattice(geom["lat_vecs"], geom["orb_vecs"], self.periodic_dirs)
        sc_tb = TBModel(lat, spinful=self.spinful)
        sc_tb.assume_position_operator_diagonal = self.assume_position_operator_diagonal

        for offset in range(num_sc):
            base = offset * self.norb
            for orb_idx, onsite in enumerate(self._site_energies):
                sc_tb.set_onsite(onsite, base + orb_idx)

        sc_index = {tuple(vec.tolist()): idx for idx, vec in enumerate(sc_vec)}
        sc_red_lat = geom["sc_red_lat"]
        red_transform = geom["red_transform"]
        eps = 1e-8

        amps, ind_is, ind_js, R_vecs = self._hoptable.components()

        for offset, cur_sc_vec in enumerate(sc_vec):
            base = offset * self.norb
            for amp, ind_i, ind_j, ind_R in zip(
                amps, ind_is, ind_js, R_vecs, strict=True
            ):
                R_vec = ind_R.copy()
                total_disp = cur_sc_vec + R_vec
                red_disp = total_disp @ red_transform
                sc_part = np.floor(red_disp + eps).astype(int)
                orig_part = total_disp - sc_part @ sc_red_lat
                pair_idx = sc_index.get(tuple(orig_part.tolist()))
                if pair_idx is None:
                    raise Exception("Did not find super cell vector!")

                hi = int(ind_i) + base
                hj = int(ind_j) + pair_idx * self.norb

                if self.spinful:
                    amp_use = amp.copy()
                else:
                    amp_use = complex(amp)

                sc_tb.set_hop(
                    amp_use, hi, hj, sc_part, mode="add", allow_conjugate_pair=True
                )

        param_hops = getattr(self, "_hopping_param_terms", {})
        if param_hops:
            for offset, cur_sc_vec in enumerate(sc_vec):
                base = offset * self.norb
                for (ind_i, ind_j, R_tuple), provider in param_hops.items():
                    R_vec = np.array(R_tuple, dtype=float)
                    total_disp = cur_sc_vec + R_vec
                    red_disp = total_disp @ red_transform
                    sc_part = np.floor(red_disp + eps).astype(int)
                    orig_part = total_disp - sc_part @ sc_red_lat
                    pair_idx = sc_index.get(tuple(orig_part.tolist()))
                    if pair_idx is None:
                        raise RuntimeError(
                            "Supercell vector not found for parameterised hopping."
                        )

                    hi = int(ind_i) + base
                    hj = int(ind_j) + pair_idx * self.norb

                    sc_tb.set_hop(
                        provider,
                        hi,
                        hj,
                        sc_part,
                        mode="set",
                        allow_conjugate_pair=True,
                    )

        if to_home:
            # NOTE: These two functions must be called in this order!
            # First shift hoppings, then orbitals. The hoppings
            # depend on the orbital positions.

            sc_tb._shift_hop_to_home()
            sc_tb._lattice._shift_orb_to_home()

        return sc_tb if not return_sc_vectors else (sc_tb, sc_vec.copy())


    def _shift_hop_to_home(self):
        """Shifts orbital coordinates (along periodic directions) to the home
        unit cell.

        After this function is called reduced coordinates
        (along periodic directions) of orbitals will be between 0 and
        1.

        .. versionchanged:: 1.7.2
            Versions < 1.7.2 shifted orbitals to the home cell even
            along even nonperiodic directions. In later versions, this is
            no longer allowed, as this might produce
            counterintuitive results. Shifting orbitals along nonperiodic
            directions changes physical nature of the tight-binding model.
            This behavior might be especially non-intuitive for
            tight-binding models that came from the `cut_piece` function.

        """

        for i in range(self.norb):
            disp_vec = np.zeros(self.dim_r, dtype=int)
            for k in range(self.dim_r):
                shift = int(np.floor(self.orb_vecs[i, k]))
                if k in self.periodic_dirs:
                    disp_vec[k] = shift
                elif shift != 0:
                    logger.warning(
                        f"Orbital {i} has reduced coordinate {self.orb_vecs[i, k]:.4f} along non-periodic direction {k}. "
                        "This orbital will not be shifted to the home cell along this direction."
                    )

            if self.dim_k != 0 and np.any(disp_vec):
                self._hoptable.shift_orbital(i, disp_vec)


[docs]
    @copydoc(Lattice.k_uniform_mesh)
    def k_uniform_mesh(
        self, mesh_size, *, gamma_centered: bool = False, include_endpoints: bool = True
    ):
        return self._lattice.k_uniform_mesh(
            mesh_size,
            gamma_centered=gamma_centered,
            include_endpoints=include_endpoints,
        )



[docs]
    @copydoc(Lattice.k_path)
    def k_path(self, k_nodes, nk: int, report: bool = False):
        return self._lattice.k_path(k_nodes, nk, report)


    ############### Observables ####################

    def _normalize_kpoints(
        self, k_pts, *, allow_none_for_finite: bool = False
    ) -> np.ndarray | None:
        """Validate and reshape user-provided k-points."""
        dim_k = self.dim_k
        if dim_k == 0:
            if k_pts is None:
                return None
            elif allow_none_for_finite:
                return None
            raise ValueError(
                "k_pts should not be specified for finite (dim_k=0) models."
            )

        elif k_pts is None:
            raise ValueError("Must supply k_pts for periodic systems (dim_k > 0).")

        k_arr = np.asarray(k_pts, dtype=float)

        # scalar -> treat as a single point in # of dimensions dim_k
        if k_arr.ndim == 0:
            # e.g. dim_k == 1 and user passed scalar
            if dim_k == 1:
                return k_arr.reshape(1, 1)
            raise ValueError("Scalar k_pts is only valid when dim_k == 1.")

        if k_arr.ndim == 1:
            if dim_k == 1:
                # 1D sweep, keep all entries as a column vector
                return k_arr.reshape(-1, 1)
            if k_arr.size == dim_k:
                # single k-point in higher dimensions
                return k_arr.reshape(1, dim_k)
            raise ValueError(
                f"k_pts must have shape ({dim_k},) for a single point or (Nk,) only when dim_k == 1."
            )

        if k_arr.ndim == 2 and k_arr.shape[1] == dim_k:
            return k_arr

        raise ValueError(f"k_pts must have shape (Nk, {dim_k}) or ({dim_k},).")

    def _H_to_per_gauge(self, H_flat, k_vals):
        r"""
        Transform Hamiltonian to periodic gauge so that :math:`H(\mathbf{k}+\mathbf{G}) = H(\mathbf{k})`.

        If ``nspin = 2``, ``H_flat`` should only be flat along `k` and _NOT_ spin.

        Parameters
        ----------
        H_flat : np.ndarray
            Hamiltonian flattened along the k-direction, shape (Nk, nstate, nstate[, nspin]).
        k_vals : np.ndarray
            Array of k-point values, shape (Nk, dim_k).

        Returns
        -------
        np.ndarray
            Hamiltonian in periodic gauge, shape (Nk, nstate, nstate[, nspin]).

        Notes
        -----
        The transformation applies phase factors to ensure periodicity in reciprocal space.
        """
        if k_vals.ndim != 2:
            raise ValueError(
                f"Invalid k_vals shape: {k_vals.shape}. Expected (Nk, dim_k)."
            )
        if k_vals.shape[1] != self.dim_k:
            raise ValueError(
                f"Invalid k_vals shape: {k_vals.shape}. Expected (Nk, {self.dim_k})."
            )

        if self.dim_k == 0:
            logger.warning(
                "No periodic directions in k-space. Returning H_flat unchanged."
            )
            return H_flat

        orb_vecs = self._orb_vecs  # reduced units
        orb_vec_diff = orb_vecs[:, None, :] - orb_vecs[None, :, :]
        orb_vec_diff = orb_vec_diff[..., self.periodic_dirs]
        orb_phase = np.exp(
            1j * 2 * np.pi * np.matmul(orb_vec_diff, k_vals.T)
        ).transpose(2, 0, 1)
        H_per_flat = H_flat * orb_phase
        return H_per_flat

    def _hamiltonian_finite(
        self, hop_amps, i_idx, j_idx, site_energies, *, flatten_spin: bool
    ):
        norb = self.norb

        if not self.spinful:
            hop_amps = hop_amps.astype(complex)
            ham = np.zeros((norb, norb), dtype=complex)
            if hop_amps.size:
                np.add.at(ham, (i_idx, j_idx), hop_amps)
                np.add.at(ham, (j_idx, i_idx), hop_amps.conj())
            np.fill_diagonal(ham, site_energies)
            return ham

        # spinful
        nspin = self.nspin
        dim_block = norb * nspin  # full matrix dimension after flattening spins
        hop_amps = np.asarray(hop_amps, dtype=complex)

        ham = np.zeros((dim_block, dim_block), dtype=complex)
        if hop_amps.size:
            # For every hopping we have a 2×2 spin block. Pre-compute the spin-pair indices
            # so we can add all blocks in a single vectorised pass.
            hop_blocks = hop_amps.reshape(hop_amps.shape[0], -1)  # (n_hops, nspin^2)
            spin_out = np.repeat(np.arange(nspin), nspin)  # s_out varies slowest
            spin_in = np.tile(np.arange(nspin), nspin)  # s_in varies fastest

            rows = (i_idx[:, None] * nspin + spin_out[None, :]).reshape(-1)
            cols = (j_idx[:, None] * nspin + spin_in[None, :]).reshape(-1)
            contrib = hop_blocks.reshape(-1)

            flat_idx = rows * dim_block + cols
            ham_flat = ham.reshape(-1)
            np.add.at(ham_flat, flat_idx, contrib)

            # Hermiticity: add the conjugate only on the opposite off-diagonal entries
            offdiag = rows != cols
            if np.any(offdiag):
                conj_idx = cols[offdiag] * dim_block + rows[offdiag]
                np.add.at(ham_flat, conj_idx, contrib[offdiag].conj())

        # On-site energies already come as 2×2 spin blocks.  Broadcast them onto the diagonal.
        ham_view = ham.reshape(norb, nspin, norb, nspin)
        diag_orbs = np.arange(norb)
        ham_view[diag_orbs, :, diag_orbs, :] += site_energies

        if flatten_spin:
            return ham
        return ham_view

    def _hamiltonian_periodic(
        self,
        k_vecs: np.ndarray,
        hop_amps,
        i_idx,
        j_idx,
        R_vecs,
        site_energies,
        *,
        flatten_spin: bool,
    ):
        norb = self.norb
        per = np.asarray(self.periodic_dirs)
        orb_red = np.asarray(self.orb_vecs)

        n_kpts = k_vecs.shape[0]
        n_hops = hop_amps.shape[0]

        i_idx = i_idx.astype(int)
        j_idx = j_idx.astype(int)
        R_vecs = R_vecs.astype(float)

        orb_i = orb_red[i_idx]
        orb_j = orb_red[j_idx]
        delta_r = R_vecs - orb_i + orb_j
        delta_r_per = delta_r[:, per]

        if n_hops:
            k_dot_r = k_vecs @ delta_r_per.T
            phases = np.exp(1j * 2 * np.pi * k_dot_r)
        else:
            phases = None

        if not self.spinful:
            hop_amps = hop_amps.astype(complex)
            ham = np.zeros((n_kpts, norb, norb), dtype=complex)
            if n_hops:
                cache = self._get_flattened_indices()
                order = cache["order"]
                starts = cache["starts"]
                uniq = cache["uniq"]
                cols_transposed = cache["cols_transposed"]

                ham_flat = ham.reshape(n_kpts, -1)
                contrib = phases[:, order] * hop_amps[order]
                sums = np.add.reduceat(contrib, starts, axis=1)
                ham_flat[:, uniq] += sums
                ham_flat[:, cols_transposed] += sums.conj()

            diag = np.arange(norb)
            ham[:, diag, diag] += site_energies
            return ham

        # spinful
        nspin = self.nspin
        M = norb * nspin
        hop_blocks = np.asarray(hop_amps, dtype=complex).reshape(n_hops, -1)

        ham = np.zeros((n_kpts, M, M), dtype=complex)
        if n_hops:
            # flattened indices for every spin pair
            spin_out = np.repeat(np.arange(nspin), nspin)  # [0, 0, 1, 1]
            spin_in = np.tile(np.arange(nspin), nspin)  # [0, 1, 0, 1]

            row_flat = (i_idx[:, None] * nspin + spin_out[None, :]).reshape(-1)
            col_flat = (j_idx[:, None] * nspin + spin_in[None, :]).reshape(-1)

            pair_flat = row_flat * M + col_flat
            order = np.argsort(pair_flat, kind="stable")
            uniq, starts = np.unique(pair_flat[order], return_index=True)
            cols_transposed = (uniq % M) * M + (uniq // M)

            ham_flat = ham.reshape(n_kpts, -1)
            contrib = (phases[:, :, None] * hop_blocks[None, :, :]).reshape(n_kpts, -1)
            contrib = contrib[:, order]

            sums = np.add.reduceat(contrib, starts, axis=1)
            ham_flat[:, uniq] += sums
            ham_flat[:, cols_transposed] += sums.conj()

        rows = np.arange(norb * nspin).reshape(norb, nspin)
        ham[:, rows[:, :, None], rows[:, None, :]] += site_energies[None, :, :, :]

        if not flatten_spin:
            ham = ham.reshape(n_kpts, norb, nspin, norb, nspin)
        return ham


[docs]
    def hamiltonian(
        self,
        k_pts: list | np.ndarray | None = None,
        flatten_spin_axis: bool = False,
        **params,
    ) -> np.ndarray:
        r"""Generate the Bloch Hamiltonian of the tight-binding model.

        The Hamiltonian is computed in tight-binding convention I, which includes phase factors
        associated with orbital positions in the hopping terms:

        .. math::

            H_{ij}(k) = \sum_{\mathbf{R}} t_{ij}(\mathbf{R}) \exp[i \mathbf{k} \cdot (\mathbf{r}_i - \mathbf{r}_j + \mathbf{R})]

        where :math:`t_{ij}(R)` is the hopping amplitude from orbital j to i through lattice vector :math:`\mathbf{R}`.

        .. versionadded:: 2.0.0

        Parameters
        ----------
        k_pts : (Nk, dim_k) list or numpy.ndarray of floats or None, optional
            Array of k-points in reduced coordinates. Shape must be ``(Nk, dim_k)``.
            If `None`, the Hamiltonian is computed at a single point (`dim_k = 0`),
            corresponding to a finite sample.
        flatten_spin_axis : bool, optional
            If True, the spin indices are flattened into the orbital indices.
            This results in a Hamiltonian of shape ``(..., norb*nspin, norb*nspin)``.
            If False (default), the Hamiltonian has shape ``(..., norb, nspin, norb, nspin)``.
        **params :
            Keyword arguments mapping parameter names to value(s). Each value can be a scalar
            or a 1D array of values. If any values are array-like,
            the Hamiltonian is evaluated at all combinations of parameter values,
            and the final array is stacked with the k-axis leading, followed by each
            parameter axis in the order of given parameter names.

        Returns
        -------
        ham : numpy.ndarray
            Array of Bloch-Hamiltonian matrices defined on the specified k-points. The Hamiltonian is Hermitian by construction.
            The shape of the returned array depends on the presence of k-points and spin:

            - Spinless models: ``(..., norb, norb)``
            - Spinful models: ``(..., norb, nspin, norb, nspin)`` if ``flatten_spin_axis=False``,
              or ``(..., norb*nspin, norb*nspin)`` if ``flatten_spin_axis=True``.
            - ``dim_k > 0``: ``(n_kpts, ...)``
            - ``dim_k = 0``: no k-point axis.
            - Parameter sweeps: ``(n_kpts, n_param1, n_param2, ...)`` parameter axes are added after the k-point axis (if present).

        See Also
        --------
        velocity : Compute the derivatives of the Hamiltonian with respect to k and parameters.
        k_uniform_mesh : Generate a uniform k-point mesh for periodic systems.
        k_path : Generate a k-point path for band structure calculations.

        Notes
        -----
        - In convention I, the Hamiltonian satisfies:

          .. math::
            H(k) \neq H(k + G), \quad \text{but instead} \quad H(k) = U H(k + G) U^{\dagger}

          where :math:`G` is a reciprocal lattice vector and :math:`U` is a unitary transformation
          relating the two.

        Examples
        --------
        Compute Hamiltonian at a single k-point for a finite model:

        >>> ham = tb_model.hamiltonian()

        Compute Hamiltonian at multiple k-points for a periodic model:

        >>> k_points = tb_model.k_uniform_mesh([10, 10])
        >>> ham_k = tb_model.hamiltonian(k_pts=k_points)

        Compute Hamiltonian while sweeping over a parameter:

        >>> model = TBModel(lattice, spinful=False)
        >>> model.set_hop(-1.0, 0, 1, [0, 0], param_name='t1')
        >>> k_points = model.k_uniform_mesh([5, 5])
        >>> ham_param = tb_model.hamiltonian(k_pts=k_points, t1= [0.0, 1.0, 2.0])
        """

        # Check params includes all parameters
        if params is not None:
            self._check_missing_parameters(params)

        # Normalize k-points
        if self.dim_k == 0:
            k_arr = None
        else:
            if k_pts is None:
                raise ValueError(
                    "k_pts must be specified for periodic systems (dim_k > 0)."
                )
            else:
                k_arr = self._normalize_kpoints(k_pts)

        # Partition params into scalars vs sweeps (1D arrays/lists)
        # scalars: dict of param_name -> scalar value
        # sweep_names: list of param names to sweep over
        # sweep_values: list of arrays/lists of values to sweep over
        scalars, sweep_names, sweep_values = self._params_to_sweep(params)

        # No sweep axes, resolve scalar parameters only
        if not sweep_values:
            hop_amps, i_idx, j_idx, R_vecs, site = self._evaluate_params(scalars)
            if self.dim_k == 0:
                H = self._hamiltonian_finite(
                    hop_amps, i_idx, j_idx, site, flatten_spin=flatten_spin_axis
                )
            else:
                H = self._hamiltonian_periodic(
                    k_arr,
                    hop_amps,
                    i_idx,
                    j_idx,
                    R_vecs,
                    site,
                    flatten_spin=flatten_spin_axis,
                )
            return H

        # param sweeps: cartesian product, then reshape with lambda at the end
        axis_lengths = [len(ax) for ax in sweep_values]
        blocks, base_shape = [], None
        for multi in product(*[range(n) for n in axis_lengths]):
            assign = scalars.copy()
            for a, name in enumerate(sweep_names):
                assign[name] = sweep_values[a][multi[a]]

            # ---- assemble H from immutable arrays ----
            hop_amps, i_idx, j_idx, R_vecs, site = self._evaluate_params(assign)
            if self.dim_k == 0:
                H = self._hamiltonian_finite(
                    hop_amps, i_idx, j_idx, site, flatten_spin=flatten_spin_axis
                )
            else:
                H = self._hamiltonian_periodic(
                    k_arr,
                    hop_amps,
                    i_idx,
                    j_idx,
                    R_vecs,
                    site,
                    flatten_spin=flatten_spin_axis,
                )

            if base_shape is None:
                base_shape = H.shape
            blocks.append(H[np.newaxis, ...])

        stacked = np.concatenate(blocks, axis=0)  # (*shape_params, *base_shape)
        stacked = stacked.reshape(*axis_lengths, *base_shape)

        if axis_lengths and self.dim_k != 0:
            p = len(axis_lengths)
            b = len(base_shape)  # typically (Nk, nstate, nstate)
            perm = (p,) + tuple(range(p)) + tuple(range(p + 1, p + b))
            stacked = np.transpose(stacked, perm)

        self._H = stacked

        return stacked


    def _sol_ham(
        self,
        ham,
        return_eigvecs=False,
        flatten_spin_axis=False,
        use_tensorflow=False,
        use_32_bit=False,
    ):
        """Solves Hamiltonian and returns eigenvectors, eigenvalues"""
        # NOTE: this function is separate so that it can be jit-compiled if needed

        if not np.allclose(ham, ham.swapaxes(-1, -2).conj()):
            raise ValueError("Hamiltonian matrix is not Hermitian.")

        if use_tensorflow:
            try:
                import tensorflow as tf
            except ImportError as e:
                raise ImportError(
                    "TensorFlow is not installed. Please install TensorFlow or set use_tensorflow=False."
                ) from e

            if use_32_bit:
                ham_tf = tf.convert_to_tensor(ham, dtype=tf.complex64)
            else:
                ham_tf = tf.convert_to_tensor(ham, dtype=tf.complex128)

            evals_tf, evecs_tf = tf.linalg.eigh(ham_tf)

            if return_eigvecs:
                # return later
                eval, evec = evals_tf.numpy(), evecs_tf.numpy()
            else:
                return evals_tf.numpy()

        else:
            if use_32_bit:
                ham_use = ham.astype(np.complex64)
            else:
                ham_use = ham.astype(np.complex128)
            if return_eigvecs:
                # return later
                eval, evec = np.linalg.eigh(ham_use)
            else:
                return np.linalg.eigvalsh(ham_use)

        if return_eigvecs:
            if self.nspin == 1:
                shape_evecs = (*ham.shape[:-2],) + (self.norb, self.norb)
            elif self.nspin == 2:
                shape_evecs = (*ham.shape[:-2],) + (
                    self.nstate,
                    self.norb,
                    self.nspin,
                )

            # transpose matrix eig since otherwise it is confusing
            # now eig[i,:] is eigenvector for eval[i]-th eigenvalue
            evec = evec.swapaxes(-1, -2)
            if not flatten_spin_axis and self.nspin == 2:
                evec = evec.reshape(*shape_evecs)
            return eval, evec


[docs]
    def solve_ham(
        self,
        k_pts: list | np.ndarray | None = None,
        return_eigvecs: bool = False,
        flatten_spin_axis: bool = True,
        use_tensorflow: bool = False,
        **params,
    ) -> tuple[np.ndarray, np.ndarray] | np.ndarray:
        r"""Diagonalize the Hamiltonian

        Solve for eigenvalues and optionally eigenvectors of the tight-binding model
        at a list of one-dimensional k-vectors.

        .. versionadded:: 2.0.0
            Merged :func:`solve_all` and :func:`solve_one` into :func:`solve_ham`.
            This function will equivalently handle both a single k-point and
            multiple k-points.

        Parameters
        ----------
        k_pts : (Nk, dim_k) list or numpy.ndarray or None, optional
            One-dimensional list or array of k-vectors, each given in reduced coordinates.
            Shape should be ``(Nk, dim_k)``, where ``dim_k`` is the number of periodic directions.
            Should not be specified for systems with zero-dimensional reciprocal space.

            .. versionchanged:: 2.0.0
                Renamed from ``k_list``.

        return_eigvecs : bool, optional
            If True, both eigenvalues and eigenvectors are returned.
            If False (default), only eigenvalues are returned.

            .. versionchanged:: 2.0.0
                Renamed from ``eig_vectors``.

        flatten_spin_axis : bool, optional
            If True (default), the spin axes are flattened into the orbital axes.
            If False, the spin axes are kept separate. This affects the
            shape of the returned eigenvectors for spinful models.

            .. versionadded:: 2.0.0

        use_tensorflow : bool, optional
            If True, use TensorFlow to accelerate the diagonalization.
            This requires TensorFlow to be installed. Default is False.

            .. versionadded:: 2.0.0

        **params :
            Keyword arguments mapping parameter names to value(s). Each value can be a scalar
            or a 1D array of values. If any values are array-like,
            the Hamiltonian is evaluated at all combinations of parameter values,
            and the final array is stacked with the k-axis leading, followed by each
            parameter axis in the order of given parameter names.

            .. versionadded:: 2.0.0

        Returns
        -------
        eval : np.ndarray
            Array of eigenvalues. Shape is:

            - ``(Nk, nstates)`` for periodic systems
            - ``(nstates,)`` for zero-dimensional (molecular) systems
            - ``(Nk, n_param1, n_param2, ..., nstates)`` if parameter sweeps are performed,
              with parameter axes added after the k-point axis.

        evec : np.ndarray, optional
            Array of eigenvectors (if ``return_eigvecs=True``). The ordering of bands matches that in ``eval``.

            For spinless models the shape is:

            - ``(Nk, nstates, norb)``: periodic systems
            - ``(nstates, norb)``: zero-dimensional systems
            - ``(nstates, norb)``: If only one k-point is provided, the redundant k-axis is removed.

            For spinful models the shape is (``nstates = norb * 2``):

            - ``(..., nstates, norb, 2)``: If ``flatten_spin_axis=False``, an additional spin axis of size 2 is appended at the end.
            - ``(..., nstates, nstates)``: If ``flatten_spin_axis=True``, the spin axes are flattened into the orbital axes.

            If parameter sweeps are performed, parameter axes are added after the k-point axis.

            - ``(Nk, n_param1, n_param2, ..., nstates, norb[, 2])`` or
              ``(Nk, n_param1, n_param2, ..., nstates, nstates)`` depending on ``flatten_spin_axis``.

        Notes
        -----
        - This function uses the convention described in section 3.1 of the
          :ref:`formalism`.
        - The returned wavefunctions correspond to the cell-periodic part
          :math:`u_{n \mathbf{k}}(\mathbf{r})` and not the full Bloch function
          :math:`\psi_{n \mathbf{k}}(\mathbf{r})`.
        - In many cases, using the :class:`WFArray` class offers a more
          elegant interface for handling eigenstates on a mesh of k and parameter points.
          This class will automatically manage the periodic gauge of the wavefunctions
          and provide additional methods for computing observables such as the Berry curvature.

        Examples
        --------
        Solve for eigenvalues at several k-points:

        >>> eval = tb.solve_ham([[0.0, 0.0], [0.0, 0.2], [0.0, 0.5]])

        Solve for eigenvalues and eigenvectors:

        >>> eval, evec = tb.solve_ham([[0.0, 0.0], [0.0, 0.2]], return_eigvecs=True)
        """
        logger.debug("Initializing Hamiltonian...")
        ham = self.hamiltonian(k_pts, flatten_spin_axis=True, **params)

        logger.debug("Diagonalizing Hamiltonian...")
        if return_eigvecs:
            eigvals, eigvecs = self._sol_ham(
                ham,
                return_eigvecs=return_eigvecs,
                flatten_spin_axis=flatten_spin_axis,
                use_tensorflow=use_tensorflow,
            )
            if self.dim_k != 0:
                # if only one k_point, remove that redundant axis (reproduces solve_one)
                if eigvals.shape[0] == 1:
                    eigvals = eigvals[0]
                    eigvecs = eigvecs[0]

            return eigvals, eigvecs
        else:
            eigvals = self._sol_ham(ham, return_eigvecs=return_eigvecs)

            if self.dim_k != 0:
                # if only one k_point, remove that redundant axis (reproduces solve_one)
                if eigvals.shape[0] == 1:
                    eigvals = eigvals[0]
            return eigvals



[docs]
    @deprecated("use .solve_ham() instead (since v2.0).", category=FutureWarning)
    def solve_one(self, k_list=None, eig_vectors=False):
        """
        .. deprecated:: 2.0.0
            Use :meth:`solve_ham` instead.
        """
        return self.solve_ham(
            k_list=k_list, return_eigvecs=eig_vectors, flatten_spin_axis=False
        )



[docs]
    @deprecated("use .solve_ham() instead (since v2.0).", category=FutureWarning)
    def solve_all(self, k_list=None, eig_vectors=False):
        """
        .. deprecated:: 2.0.0
            Use :meth:`solve_ham` instead.
        """
        return self.solve_ham(
            k_list=k_list, return_eigvecs=eig_vectors, flatten_spin_axis=False
        )


    def _velocity_k(
        self,
        k_arr: np.ndarray,
        hop_amps: np.ndarray,
        i_indices: np.ndarray,
        j_indices: np.ndarray,
        R_vecs: np.ndarray,
        site_energies: np.ndarray = None,
        *,
        cartesian: bool = False,
        flatten_spin_axis: bool = False,
        return_ham: bool = False,
    ) -> np.ndarray:
        r"""Compute velocity operator dH/dk at given k-points.

        The velocity operator is computed as the derivative of the Bloch Hamiltonian
        with respect to the k-vector:

        .. math::
            \hat{v}_\alpha(\mathbf{k}) = \frac{\partial H(\mathbf{k})}{\partial k_\alpha}
            = \sum_{\mathbf{R}} t_{ij}(\mathbf{R}) \, (i R_\alpha) \,
            \exp[i \mathbf{k} \cdot (\mathbf{r}_i - \mathbf{r}_j + \mathbf{R})]

        Parameters
        ----------
        k_arr : np.ndarray
            Array of k-points in reduced coordinates, shape (Nk, dim_k).
        hop_amps : np.ndarray
            Array of hopping amplitudes, shape (n_hops, ) for spinless models,
            or (n_hops, nspin, nspin) for spinful models.
        i_indices : np.ndarray
            Array of initial orbital indices for each hopping, shape (n_hops, ).
        j_indices : np.ndarray
            Array of final orbital indices for each hopping, shape (n_hops, ).
        R_vecs : np.ndarray
            Array of lattice vectors for each hopping in reduced coordinates, shape (n_hops, dim_r).
        site_energies : np.ndarray, optional
            Array of on-site energies, shape (norb, ) for spinless models,
            or (norb, nspin, nspin) for spinful models. Required if `return_ham` is True.
        cartesian : bool, optional
            If True, compute velocity in Cartesian coordinates.
            If False (default), compute in reduced coordinates.
        flatten_spin_axis : bool, optional
            If True, flatten the spin axis in the output.
        return_ham : bool, optional
            If True, also return the Hamiltonian matrix at the given k-points.

        Returns
        -------
        vel : np.ndarray
            Velocity operator dH/dk at the given k-points. Shape is (dim_k, Nk, norb, norb) for spinless models,
            or (dim_k, Nk, norb*nspin, norb*nspin) for spinful models if `flatten_spin_axis` is True,
            or (dim_k, Nk, norb, nspin, norb, nspin) if `flatten_spin_axis` is False.
        ham : np.ndarray, optional
            Hamiltonian matrix at the given k-points, returned only if `return_ham` is True. Shapes
            match those described for `vel`, without the leading `dim_k` axis.

        Notes
        -----
        - The Hamiltonian and velocity are constructed in tight-binding convention I, which includes
          phase factors associated with orbital positions in the hopping terms.
        - The construction of the velocity uses efficient summation techniques to handle large numbers
          of hoppings. This ensures that the computation remains tractable even for complex models. The
          steps are roughly as follows:
            1. Compute phase factors for each hopping at all k-points.
            2. Compute the derivative of the phase factors with respect to k.
            3. Accumulate contributions to the velocity operator using these derivatives
              and the hopping amplitudes
            4. (Optional) Accumulate contributions to the Hamiltonian if requested.
          The matrices are built using flattened indices and `np.add.reduceat` for efficiency.
        """

        dim_k = self.dim_k
        norb = self.norb

        i_indices = i_indices.astype(int)
        j_indices = j_indices.astype(int)
        R_vecs = R_vecs.astype(float)

        n_hops = i_indices.size
        per = np.asarray(self.periodic_dirs)
        orb_red = np.asarray(self.orb_vecs)
        orb_i = orb_red[i_indices]
        orb_j = orb_red[j_indices]
        delta_r = R_vecs - orb_i + orb_j
        delta_r_per = delta_r[:, per]

        if n_hops:
            k_dot_r = k_arr @ delta_r_per.T
            phases = np.exp(1j * 2 * np.pi * k_dot_r)
        else:
            phases = np.zeros((k_arr.shape[0], 0), dtype=complex)

        if cartesian:
            lattice = self.get_lat_vecs()[self.periodic_dirs, :]
            coeff = (1j * delta_r_per @ lattice).T[:, None, :]
        else:
            coeff = (1j * 2 * np.pi * delta_r_per).T[:, None, :]

        deriv_phase = coeff * phases[None, ...] if n_hops else coeff[:, :, :0]

        if not self.spinful:
            amps_use = np.asarray(hop_amps, dtype=complex)
            vel = np.zeros((dim_k, k_arr.shape[0], norb, norb), dtype=complex)
            if n_hops:
                cache = self._get_flattened_indices()
                order = cache["order"]
                starts = cache["starts"]
                uniq = cache["uniq"]
                cols_transposed = cache["cols_transposed"]

                vel_flat = vel.reshape(dim_k, k_arr.shape[0], -1)

                if return_ham:
                    ham = np.zeros((k_arr.shape[0], norb, norb), dtype=complex)
                    ham_flat = ham.reshape(k_arr.shape[0], -1)
                    contrib_ham = phases[:, order] * amps_use[order]
                    sums_ham = np.add.reduceat(contrib_ham, starts, axis=1)
                    ham_flat[:, uniq] += sums_ham
                    ham_flat[:, cols_transposed] += sums_ham.conj()

                contrib_sorted = deriv_phase[:, :, order] * amps_use[order]
                sums = np.add.reduceat(contrib_sorted, starts, axis=2)
                vel_flat[..., uniq] += sums
                vel_flat[..., cols_transposed] += sums.conj()

            if return_ham:
                diag = np.arange(norb)
                ham[:, diag, diag] += site_energies
                return vel, ham
            return vel

        n_kpts = k_arr.shape[0]
        nspin = self.nspin
        M = norb * nspin

        # Flatten spin blocks (n_hops, nspin, nspin) -> (n_hops, nspin^2)
        # For spin pair index s in [0, ..., nspin^2-1]:
        #   s_out = s // nspin
        #   s_in  = s % nspin
        hop_blocks = np.asarray(hop_amps, dtype=complex).reshape(n_hops, -1)

        vel = np.zeros((dim_k, k_arr.shape[0], M, M), dtype=complex)
        if n_hops:
            # spin_out, spin_in shape: (nspin^2,)
            # Creates all (s_out, s_in) pairs in a fixed order
            spin_out = np.repeat(np.arange(nspin), nspin)  # [0,0,1,1] for nspin=2
            spin_in = np.tile(np.arange(nspin), nspin)  # [0,1,0,1] for nspin=2

            # For hop h and spin pair (s_out, s_in), the big M×M index is
            #   row = s_out*norb + i_indices[h]
            #   col = s_in *norb + j_indices[h]
            # Build them as (n_hops * nspin^2,) arrays, then flatten to 1D of
            # length n_hops*nspin^2
            row_flat = (i_indices[:, None] * nspin + spin_out[None, :]).reshape(-1)
            col_flat = (j_indices[:, None] * nspin + spin_in[None, :]).reshape(-1)

            # Convert (row, col) to a single flat index in [0 .. M*M-1].
            # pair_flat uniquely identifies each matrix element touched by a hop×spin pair.
            pair_flat = row_flat * M + col_flat
            # Sorting by pair_flat lets us use reduceat to sum contiguous groups efficiently.
            order = np.argsort(pair_flat, kind="stable")

            # uniq: the unique flat matrix positions; starts: the start indices of each group.
            uniq, starts = np.unique(pair_flat[order], return_index=True)
            # Hermitian partner flat positions (swap row/col): (r,c) -> (c,r)
            cols_transposed = (uniq % M) * M + (uniq // M)

            if return_ham:
                ham = np.zeros((k_arr.shape[0], M, M), dtype=complex)
                ham_flat = ham.reshape(k_arr.shape[0], -1)

                # Broadcast multiply to get contribution per (hop, spin): shape (Nk, n_hops, S)
                contrib_ham = phases[:, :, None] * hop_blocks[None, :, :]
                # Flatten the last two axes to match pair_flat ordering, then reorder by 'order'
                contrib_ham = contrib_ham.reshape(n_kpts, -1)  # (Nk, n_hops*nspin^2)
                contrib_ham = contrib_ham[:, order]  # align with pair_sorted

                # Sum within each group of identical matrix elements
                sums_ham = np.add.reduceat(
                    contrib_ham, starts, axis=1
                )  # (Nk, len(uniq))

                # Scatter once per unique element (and its Hermitian partner)
                ham_flat[:, uniq] += sums_ham
                ham_flat[:, cols_transposed] += sums_ham.conj()

            # Broadcast multiply to get contribution per (hop, spin): shape (dim_k, Nk, n_hops, S)
            terms = deriv_phase[:, :, :, None] * hop_blocks[None, None, :, :]
            # Flatten the last two axes to match pair_flat ordering, then reorder by 'order'
            terms = terms.reshape(dim_k, n_kpts, -1)  # (dim_k, Nk, n_hops*nspin^2)
            terms = terms[..., order]  # align with pair_sorted

            # Sum within each group of identical matrix elements
            sums = np.add.reduceat(terms, starts, axis=2)  # (dim_k, Nk, len(uniq))

            # Scatter once per unique element (and its Hermitian partner)
            vel_flat = vel.reshape(
                dim_k, n_kpts, -1
            )  # flatten (M,M) -> M*M as last axis
            vel_flat[:, :, uniq] += sums
            vel_flat[:, :, cols_transposed] += sums.conj()

        if return_ham:
            rows = np.arange(norb * nspin).reshape(norb, nspin)
            ham[:, rows[:, :, None], rows[:, None, :]] += site_energies[None, :, :, :]

            if not flatten_spin_axis:
                ham = ham.reshape(n_kpts, norb, nspin, norb, nspin)
                vel = vel.reshape(dim_k, n_kpts, norb, nspin, norb, nspin)

            return vel, ham

        if not flatten_spin_axis:
            vel = vel.reshape(dim_k, n_kpts, norb, nspin, norb, nspin)
        return vel

    def _velocity(
        self,
        k_pts: np.ndarray,
        cartesian: bool = False,
        flatten_spin_axis: bool = False,
        *,
        param_periods: dict[str, float] | None = None,
        diff_scheme: str = "central",
        diff_order: int = 2,
        _return_ham: bool = False,
        **params,
    ) -> np.ndarray:
        """Compute velocity operator dH/dk and dH/dλ at given k-points.

        Private method called by .velocity(). Allows returning Hamiltonian for internal use.
        See .velocity() for full docstring.

        Notes
        -----
        - The velocity operator with respect to k is computed analytically using ._velocity_k().
        - The velocity operator with respect to parameters is computed via finite differences.
        - The finite difference function dynamically uses central, forward, or backward schemes
          depending on the periodicty and position within the parameter axis. If the parameters
          are not periodic and the point is at the edge of the axis, forward or backward differences
          are used as appropriate.
        - Parameter sweeps that are detected as cyclic (either because
          ``param_periods[name]`` is provided or because the first and last samples
          of the sweep coincide) have their duplicated endpoint removed internally
          by :meth:`_normalize_parameter_axis` before the finite-difference stencil
          is built. The returned velocity tensor is re-expanded onto the original
          grid, so the parameter axes seen by the caller keep the user-supplied
          length even though the derivative itself is computed from the trimmed set.
          Trim the endpoint yourself if you need the unique samples for post-processing.
        """

        # Check params
        if params is not None:
            params = dict(params)
            self._check_missing_parameters(params)
        else:
            params = {}

        # Normalize k-points to correct shape
        if self.dim_k == 0:
            raise NotImplementedError(
                "Velocity operator is not defined for systems with dim_k=0."
            )
        else:
            k_arr = self._normalize_kpoints(k_pts)

        # Partition params into scalars vs sweeps (1D arrays/lists)
        # scalars: dict of param_name -> scalar value
        # sweep_names: list of param names to sweep over
        # sweep_values: list of arrays/lists of values to sweep over
        scalars, sweep_names, sweep_values = self._params_to_sweep(params)

        param_periods = dict(param_periods or {})

        raw_axes: list[list[float]] = []
        sweep_meta: dict[str, tuple[float, bool, bool, list[float]]] = {}
        for idx, name in enumerate(sweep_names):
            axis_array = np.asarray(sweep_values[idx], dtype=float)
            raw_axes.append(axis_array.tolist())  # preserve the user’s grid
            if axis_array.ndim != 1 or axis_array.size < 2:
                continue

            normalized, step, periodic, trimmed = self._normalize_parameter_axis(
                axis_array,
                name=name,
                period=param_periods.get(name),
            )
            sweep_meta[name] = (step, periodic, trimmed, normalized.tolist())

        # Determine if we need to compute Hamiltonian for lambda derivatives
        needs_ham = _return_ham or bool(sweep_meta)

        # No sweeps: just evaluate in place
        if not sweep_values:
            hop_amps, i_idx, j_idx, R_vecs, site_energies = self._evaluate_params(
                scalars
            )
            v = self._velocity_k(
                k_arr,
                hop_amps,
                i_idx,
                j_idx,
                R_vecs,
                site_energies=site_energies,
                cartesian=cartesian,
                flatten_spin_axis=flatten_spin_axis,
                return_ham=needs_ham,
            )
            if needs_ham:
                vel, ham = v
                return (vel, ham) if _return_ham else vel
            return v

        # Parameter sweeps: cartesian product,
        # then reshape to (*param_shape, dim_k, Nk, norb, norb) at end
        axis_lengths = [len(ax) for ax in sweep_values]
        vel_blocks, base_shape = [], None
        ham_blocks, ham_shape = [], None

        for multi in product(*[range(n) for n in axis_lengths]):
            assign = scalars.copy()  # copy str -> scalar mappings
            for a, name in enumerate(sweep_names):
                # Evaluate velocity on user grid, not normalized grid
                assign[name] = raw_axes[a][multi[a]]

            # Retrive hoppings, orbital indices, R-vectors
            # for this parameter combination
            hop_amps, i_idx, j_idx, R_vecs, site_energies = self._evaluate_params(
                assign
            )

            # Build velocity operator
            v = self._velocity_k(
                k_arr,
                hop_amps,
                i_idx,
                j_idx,
                R_vecs,
                site_energies=site_energies,
                cartesian=cartesian,
                flatten_spin_axis=flatten_spin_axis,
                return_ham=needs_ham,
            )

            # Unpack velocity and Hamiltonian if needed
            if needs_ham:
                vel, ham = v
                if ham_shape is None:
                    ham_shape = ham.shape
                ham_blocks.append(ham[np.newaxis, ...])
            else:
                vel = v

            # Record base shape first time e.g. (dim_k, Nk, norb, norb)
            if base_shape is None:
                base_shape = vel.shape

            # Append with new leading axis for stacking later
            vel_blocks.append(vel[np.newaxis, ...])

        # Stack all velocity blocks along new leading axis: (*param_shapes, *base_shape)
        stacked = np.concatenate(vel_blocks, axis=0).reshape(*axis_lengths, *base_shape)
        # Move param axes to be after k-axis
        if axis_lengths:
            p = len(axis_lengths)  # number of param axes
            b = len(base_shape)  # e.g. 4 when base is (dim_k, Nk, norb, norb)
            perm = (
                p,  # dim_k
                p + 1,  # Nk
                *range(p),  # all param axes in original order
                *range(p + 2, p + b),  # remaining matrix axes (e.g. norb, norb)
            )
            stacked = np.transpose(stacked, perm)

        # Final velocity array with shape (dim_k, Nk, l1, ..., norb, norb)
        # where l1, ... are parameter sweep axes
        vel_k = stacked

        # Stack Hamiltonian blocks if needed
        ham = None
        if needs_ham:
            # Stack all hamiltonian blocks along new leading axis: (*param_shapes, *ham_shape)
            ham_stacked = np.concatenate(ham_blocks, axis=0).reshape(
                *axis_lengths, *ham_shape
            )
            # Move param axes to be after k-axis
            if axis_lengths:
                p = len(axis_lengths)  # number of param axes
                b = len(ham_shape)  # e.g. 3 when base is (Nk, norb, norb)
                perm = (p,) + tuple(range(p)) + tuple(range(p + 1, p + b))
                ham_stacked = np.transpose(ham_stacked, perm)

            # Final hamiltonian array
            ham = ham_stacked

        # If no param derivatives needed, return now
        if not sweep_meta:
            return (vel_k, ham) if _return_ham else vel_k

        ######### Compute parameter derivatives via finite differences #########

        # The velocity output currently has shape (dim_k, Nk, l1, ..., norb, norb).
        # Append parameter-derivatives after the existing k components.
        vel_components = [vel_k]
        for idx, name in enumerate(sweep_names):
            meta = sweep_meta.get(name)
            if meta is None:
                continue  # non-numeric sweep; skip

            step, periodic, trimmed, _ = meta
            # Axis of Hamiltonian corresponding to this parameter sweep
            sweep_axis = 1 + idx  # axis 0 is Nk, axis 1 begins the param sweeps

            if trimmed:
                logger.debug(
                    "velocity: Endpoint detected on periodic parameter"
                    f"Trimming last '{name}' before differentiating Hamiltonian."
                )
                # drop the repeated endpoint before taking finite differences
                slicer = [slice(None)] * ham.ndim
                slicer[sweep_axis] = slice(0, -1)
                ham_fd = ham[tuple(slicer)]
            else:
                ham_fd = ham

            dH = finite_difference(
                ham_fd,
                axis=sweep_axis,
                delta=step,
                order=diff_order,
                mode=diff_scheme,
                periodic=periodic,
            )

            # Re-append the first slice so the derivative array matches the user grid
            # Derivative at the endpoint is same as at the start for periodic params
            if trimmed and periodic:
                first_slice = np.take(dH, indices=0, axis=sweep_axis)
                first_slice = np.expand_dims(first_slice, axis=sweep_axis)
                dH = np.concatenate([dH, first_slice], axis=sweep_axis)

            vel_components.append(dH[np.newaxis, ...])  # prepend new derivative axis

        vel_full = np.concatenate(vel_components, axis=0)
        return (vel_full, ham) if _return_ham else vel_full


[docs]
    def velocity(
        self,
        k_pts: np.ndarray,
        cartesian: bool = False,
        flatten_spin_axis: bool = False,
        *,
        param_periods: dict[str, float] | None = None,
        diff_scheme: str = "central",
        diff_order: int = 2,
        **params,
    ) -> np.ndarray:
        r"""Generate the velocity operator in the orbital basis.

        The velocity operator is related to the derivative of the Hamiltonian
        with respect to each reciprocal lattice direction, i.e.,

        .. math::
            v_{\mu}(k) = \hbar \frac{\partial H(k)}{\partial k_{\mu}}

        When passing parameter sweeps via ``**params``, the generalized velocity
        operator is computed by appending finite-difference derivatives of the
        Hamiltonian with respect to the swept parameters.

        .. versionadded:: 2.0.0

        Parameters
        ----------
        k_pts : (Nk, dim_k) numpy.ndarray
            Reduced k-points where the velocity operator is evaluated.
            Must be a 2D array of shape ``(Nk, dim_k)``, where ``dim_k`` is the number
            of periodic directions in the model.
        cartesian : bool, optional
            If True, use Cartesian coordinates for the velocity operator,
            otherwise derivatives are taken with respect to reduced coordinates.
        flatten_spin_axis : bool, optional
            If True, the spin indices are flattened into the orbital indices.
            This results in a velocity operator of shape ``(..., norb*nspin, norb*nspin)``.
            If False (default), the velocity operator has shape ``(..., norb, nspin, norb, nspin)``.
        param_periods : dict[str, float], optional
            Optional map ``{param_name: period}`` for swept parameters. When supplied,
            assumes the parameter is cyclic and trims any duplicated endpoints, or endpoints
            equal to the start plus the given period, before building finite-difference stencils.
            This can improve numerical accuracy by using centered differences throughout the parameter
            range. Otherwise, the function will use a backward difference at the endpoint and a forward
            difference at the start.
        diff_scheme : str, optional
            Finite difference scheme to use for parameter derivatives.
            Options are "central" (default) or "forward".
            This parameter is only relevant when passing varying parameters.
        diff_order : int, optional
            Order of accuracy for finite difference lambda derivatives.
            Must be an even integer for "central" scheme (default is ``4``),
            and a positive integer for "forward" scheme.
            This parameter is only relevant when passing varying parameters.
        **params :
            Parameter assignments. Scalars are applied directly; any 1D array/list
            is treated as a sweep and *automatically* adds a finite-difference derivative
            :math:`\partial_{\lambda} H` for that parameter. The velocity operator is
            evaluated at all combinations of parameter values.

        Returns
        -------
        vel : numpy.ndarray
            Velocity operator in the orbital basis. First axis indexes the cartesian direction
            if ``cartesian=True``. Otherwise, it indexes the reduced direction. If
            ``include_lambda=True``, the lambda (parameter) derivatives are appended
            after the k-directions along the first axis.

            Shape is:

            - ``(n_dir, Nk, *param_shape, norb, norb)`` for spinless models,
            - ``(n_dir, Nk, *param_shape, norb, 2, norb, 2)`` for spinful models.
            - ``(..., norb*nspin, norb*nspin)`` if ``flatten_spin_axis=True``.

            where ``n_dir = dim_k + n_params``, where ``n_params`` is
            the number of parameters being swept over.

        Notes
        -----
        - We use units where :math:`\hbar = 1`, and thus the velocity operator is simply defined as
          the gradient of the Hamiltonian with respect to :math:`\mathbf{k}` or :math:`\boldsymbol{\lambda}`.
        - The velocity operator is computed in tight-binding convention I, which includes phase factors
          associated with orbital positions in the hopping terms.
        - For the k-derivatives, if ``cartesian=True``, the velocity operator
          is given by the derivative with respect to Cartesian :math:`\mathbf{k}`-coordinates:

          .. math::
            v_\alpha(\mathbf{k}) = \frac{\partial H(\mathbf{k})}{\partial k_\alpha}
            = \sum_{\mathbf{R}} t_{ij}(\mathbf{R}) \,
            i(\mathbf{r}_i - \mathbf{r}_j + \mathbf{R})_{\alpha} \,
            \exp[i \mathbf{k} \cdot (\mathbf{r}_i - \mathbf{r}_j + \mathbf{R})]

          where :math:`t_{ij}(\mathbf{R})` are the hopping amplitudes,
          :math:`\mathbf{r}_i` and :math:`\mathbf{r}_j` are the orbital positions in
          Cartesian coordinates, and :math:`\mathbf{R}` are the lattice vectors in
          Cartesian coordinates.

        - For the k-derivatives, if ``cartesian=False``, the velocity operator is given by
          the derivative with respect to reduced :math:`\mathbf{\kappa}`-coordinates:

          .. math::
            v_\alpha(\mathbf{\kappa})
            = \frac{\partial H(\mathbf{\kappa})}{\partial \kappa_\alpha}
            = \sum_{\mathbf{R}} t_{ij}(\mathbf{R}) \,
            i 2 \pi (\boldsymbol{\tau_i} - \boldsymbol{\tau_j} + \mathbf{R})_{\alpha} \,
            \exp[i 2 \pi \mathbf{\kappa} \cdot
            (\boldsymbol{\tau_i}- \boldsymbol{\tau_j} + \mathbf{R})]

          where :math:`\boldsymbol{\tau_i}` and :math:`\boldsymbol{\tau_j}` are the orbital
          positions in reduced coordinates, :math:`\mathbf{\kappa}` are the k-points in
          reduced coordinates, and :math:`\mathbf{R}` are the lattice vectors in reduced coordinates.

        - Passing a list/array for a parameter means you want derivatives with respect to that
          parameter. If the intent is simply to evaluate at a specific value, resolve the
          symbol first via :meth:`set_parameters`, or simply pass a scalar value with ``**params``.
        - When passing a list/array for a parameter, the finite difference derivatives are computed
          explicitly as

          .. math::
            \frac{\partial H}{\partial \lambda} \approx
            \sum_{m} c_m H(\lambda + m \Delta \lambda)

          where the coefficients :math:`c_m` depend on the finite difference scheme and order.

        Examples
        --------
        Compute the velocity operator at the Gamma point:

        >>> vel = tb.velocity(np.array([[0.0, 0.0]]))

        Compute the velocity operator at several k-points with a parameter sweep. This
        will compute the velocity operator at all values of ``mA = 0.0, 1.0, 2.0`` and
        the first axis will have length equal to ``dim_k + 1``, with the last slice
        corresponding to the finite-difference derivative with respect to ``mA``.

        >>> vel = tb.velocity(
        ... np.array([[0.0, 0.0], [0.5, 0.5]]),
        ... mA=np.linspace(0, np.pi, 10, endpoint=False)
        ... )

        If ``mA`` is a periodic parameter with period ``2*pi``, and ``2*pi`` is included
        in the parameter list, we can inform the velocity function to trim the duplicated
        endpoint before building the finite-difference stencil. This can improve numerical accuracy
        by using centered differences throughout the parameter range. Otherwise, the function
        will use a backward difference at the endpoint and a forward difference at the start.

        Specify this by passing a dictionary to the ``param_periods`` argument:

        >>> vel = tb.velocity(
        ... np.array([[0.0, 0.0]]),
        ... mA=np.linspace(0, 2*np.pi, 10, endpoint=True),
        ... param_periods={"mA": 2*np.pi}
        ... )
        """
        return self._velocity(
            k_pts,
            cartesian=cartesian,
            flatten_spin_axis=flatten_spin_axis,
            param_periods=param_periods,
            diff_scheme=diff_scheme,
            diff_order=diff_order,
            **params,
        )


    def _quantum_geometric_tensor(
        self,
        v: np.ndarray,
        eigvals: np.ndarray,
        eigvecs: np.ndarray,
        plane: tuple[int, int] = None,
        occ_idxs: np.ndarray | None = None,
        non_abelian: bool = False,
        use_tensorflow: bool = False,
    ) -> np.ndarray:
        r"""Compute the quantum geometric tensor Q from the velocity operator.

        This function computes the quantum geometric tensor (QGT) from the velocity operator
        and the eigenvalues and eigenvectors of the Hamiltonian.
        """
        if self.dim_k != 0:
            # if only one k_point, remove that redundant axis
            if eigvals.shape[0] == 1:
                eigvals = eigvals[0]
                eigvecs = eigvecs[0]

        # Identify occupied bands
        n_eigs = eigvecs.shape[-2]
        if occ_idxs is None:
            occ_idxs = np.arange(n_eigs // 2)
        else:
            occ_idxs = np.array(occ_idxs)
        # Identify conduction bands as remainder of band indices (assumes gapped)
        cond_idxs = np.setdiff1d(np.arange(n_eigs), occ_idxs)

        if use_tensorflow:
            try:
                import tensorflow as tf
            except ImportError as e:
                raise ImportError(
                    "TensorFlow is not installed. Please install TensorFlow to use this feature."
                ) from e

            v_tf = tf.constant(v, dtype=tf.complex64)
            evals_tf = tf.constant(eigvals, dtype=tf.complex64)
            evecs_tf = tf.constant(eigvecs, dtype=tf.complex64)

            # Transpose eigenvectors for matmul
            r = tf.rank(evecs_tf)  # number of axes
            # Transpose last two axes
            evecs_T_tf = tf.transpose(
                evecs_tf, tf.concat([tf.range(r - 2), [r - 1, r - 2]], 0)
            )
            # Conjugate eigenvectors
            evecs_conj_tf = tf.math.conj(evecs_tf)

            E_occ = tf.gather(evals_tf, occ_idxs, axis=-1)
            E_cond = tf.gather(evals_tf, cond_idxs, axis=-1)

            # Delta_{nm} = E_n - E_m (occ - cond)
            delta_occ_cond = E_occ[..., :, None] - E_cond[..., None, :]

            # Degeneracy guard: abort if any denominator is (near) zero
            tol = tf.constant(1e-12, dtype=delta_occ_cond.dtype.real_dtype)
            if tf.reduce_any(tf.math.abs(delta_occ_cond) < tol).numpy():
                raise ZeroDivisionError(
                    "Degenerate occupied/conduction bands encountered."
                )

            inv_delta_occ_cond = tf.math.reciprocal(delta_occ_cond)

            # reuse the same denominators for the conjugate block by swapping the last axes
            rank = inv_delta_occ_cond.shape.rank
            perm = list(range(rank))
            perm[-2], perm[-1] = perm[-1], perm[-2]
            inv_delta_cond_occ = tf.transpose(inv_delta_occ_cond, perm=perm)

            # Rotate velocity operators to energy eigenbasis
            v_rot_tf = tf.matmul(
                evecs_conj_tf[None, ...],  # (1, n_kpts, n_beta, n_state, n_state)
                tf.matmul(
                    v_tf,  # (dim_k+n_param, n_kpts, n_beta, n_state, n_state)
                    evecs_T_tf[None, ...],  # (1, n_kpts, n_beta, n_state, n_state)
                ),
            )  # (dim_k+n_param, n_kpts, n_beta, n_state, n_state)

            # Extract relevant submatrices
            v_occ_cond_tf = tf.gather(
                tf.gather(v_rot_tf, occ_idxs, axis=-2), cond_idxs, axis=-1
            )
            v_cond_occ_tf = tf.gather(
                tf.gather(v_rot_tf, cond_idxs, axis=-2), occ_idxs, axis=-1
            )

            # premultiply by energy denominators
            v_occ_cond_tf *= inv_delta_occ_cond
            v_cond_occ_tf *= inv_delta_cond_occ

            # Compute Berry curvature
            # newaxis for Cartesian direction
            # shape (dim_k+n_param, dim_k+n_param, nk, *shape_sweeps, n_occ, n_occ)
            Q = tf.matmul(v_occ_cond_tf[:, None], v_cond_occ_tf[None, :])

            # Convert final result to NumPy
            Q = Q.numpy()
        else:
            # Occupied and conduction energies
            E_occ = np.take(eigvals, occ_idxs, axis=-1)
            E_cond = np.take(eigvals, cond_idxs, axis=-1)

            # Delta_{nm} = E_n - E_m (occ - cond)
            delta_occ_cond = E_occ[..., np.newaxis] - E_cond[..., np.newaxis, :]
            if np.any(np.isclose(delta_occ_cond, 0.0)):
                raise ZeroDivisionError(
                    "Degenerate occupied/conduction bands encountered."
                )
            inv_delta_occ_cond = np.divide(1.0, delta_occ_cond)  # (..., n_occ, n_cond)
            inv_delta_cond_occ = np.swapaxes(
                inv_delta_occ_cond, -2, -1
            )  # (..., n_cond, n_occ)

            # newaxis for Cartesian direction
            evecs_conj = eigvecs.conj()[np.newaxis, ...]
            # transpose for matmul
            evecs_T = eigvecs.swapaxes(-2, -1)[np.newaxis, ...]
            v_evecT = np.matmul(v, evecs_T)  # intermediate array
            # Project vk into energy eigenbasis
            v_rot = np.matmul(
                evecs_conj, v_evecT
            )  # (dim_k, n_kpts, n_states, n_states)

            # Extract relevant submatrices
            v_occ_cond = v_rot[..., occ_idxs, :][
                ..., :, cond_idxs
            ]  # shape (dim_k, Nk, n_occ, n_con)
            v_cond_occ = v_rot[..., cond_idxs, :][
                ..., :, occ_idxs
            ]  # shape (dim_k, Nk, n_con, n_occ)

            # premultiply by energy denominators
            v_occ_cond *= inv_delta_occ_cond
            v_cond_occ *= inv_delta_cond_occ

            Q = np.matmul(v_occ_cond[:, None], v_cond_occ[None, :])

        if not non_abelian:
            Q = np.trace(Q, axis1=-1, axis2=-2)
        if plane is None:
            return Q
        else:
            if not (isinstance(plane, tuple) and len(plane) == 2):
                raise ValueError("plane must be a tuple of length 2.")
            return Q[plane]


[docs]
    def quantum_geometric_tensor(
        self,
        k_pts,
        occ_idxs: list[int] = None,
        plane: tuple[int, int] = None,
        *,
        cartesian: bool = False,
        non_abelian: bool = False,
        param_periods: dict[str, float] | None = None,
        diff_scheme: str = "central",
        diff_order: int = 2,
        use_tensorflow: bool = False,
        **params,
    ):
        r"""Quantum geometric tensor at a list of k-points via Kubo formula.

        The quantum geometric tensor is computed from the derivatives of the
        Bloch Hamiltonian :math:`\partial_\mu H_k`, where :math:`\mu` is the
        direction in k-space, and is given by (when ``non_abelian=True``):

        .. math::

            Q_{\mu \nu;\ mn}(k) = \sum_{l \notin \text{occ}}
            \frac{
                \langle u_{mk} | \partial_{\mu} H_k | u_{lk} \rangle
                \langle u_{lk} | \partial_{\nu} H_k | u_{nk} \rangle
            }{
                (E_{mk} - E_{lk})(E_{nk} - E_{lk})
            }

        The Abelian quantum geometric tensor (when ``non_abelian=False``)
        is obtained by taking the trace
        over occupied bands:

        .. math::

            Q_{\mu \nu}(k) = \sum_{m \in \text{occ}} Q_{\mu \nu;\ mm}(k)

        By specifying the ``plane`` parameter, we choose a particular :math:`(\mu, \nu)` pair
        of the quantum geometric tensor to return.

        .. versionadded:: 2.0.0

        Parameters
        ----------
        k_pts : (Nk, dim_k) array-like
            Array of k-points with shape (Nk, dim_k), where Nk is the number of points
            and dim_k is the dimensionality of the k-space.
        occ_idxs : 1D array, optional
            Indices of the occupied bands. Defaults to the first half of the states.
        plane : tuple of int, optional
            Tuple of two integers specifying the plane in k-space for which to compute
            the curvature. If None (default),
            computes all components of the Berry curvature tensor. This
            will affect the shape of the returned array.
        cartesian : bool, optional
            If True, computes the velocity operator in Cartesian coordinates.
            Default is False (reduced coordinates).
        non_abelian : bool, optional
            If True, returns the full tensor (non-abelian case).
            If False, returns the band-trace of the tensor (abelian case).
            Default is False. This will affect the shape of the returned array.
        param_periods : dict[str, float], optional
            Optional map ``{param_name: period}`` for swept parameters. When supplied,
            assumes the parameter is cyclic and trims any duplicated endpoints, or endpoints
            equal to the start plus the given period, before building finite-difference stencils.
            This can improve numerical accuracy by using centered differences throughout the parameter
            range. Otherwise, the function will use a backward difference at the endpoint and a forward
            difference at the start.
        diff_scheme : str, optional
            Finite difference scheme to use for parameter derivatives.
            Options are "central" (default) or "forward".
            This parameter is only relevant when passing varying parameters.
        diff_order : int, optional
            Order of accuracy for finite difference lambda derivatives.
            Must be an even integer for "central" scheme (default is ``4``),
            and a positive integer for "forward" scheme.
            This parameter is only relevant when passing varying parameters.
        use_tensorflow: bool, optional
            If True, will use TensorFlow to speed up linear algebra routines.
            Requires TensorFlow to be installed. Default is False.
        **params :
            Keyword arguments mapping parameter names to value(s). Each value can be a scalar
            or a 1D array of values. If any values are array-like,
            the QGT is evaluated at all combinations of parameter values,
            and the final array is stacked with the k-axis leading, followed by each
            parameter axis in the order of given parameter names.

        Returns
        -------
        Q : array
            Quantum geometric tensor. Full shape is
            ``(dim_tot, dim_tot, Nk, Nparam1, Nparam2, ..., n_orb, n_orb)``,
            where ``dim_tot = dim_k + n_params`` is the total number of
            independent coordinates (crystal momenta plus varying parameters). If ``plane``
            is specified, the first two axes are indexed by the specified directions, and the
            shape is ``(Nk, Nparam1, Nparam2, ..., n_orb, n_orb)``. If ``non_abelian=False``,
            the returned array is the band-trace of the full tensor and the last
            two dimensions are contracted. The order of the parameter axes follows the order
            of the parameter names in ``**params``.

        See Also
        --------
        velocity : Computes the velocity operator used in the Kubo formula.
        berry_curvature : Computes the Berry curvature from the quantum geometric tensor.
        quantum_metric : Computes the quantum metric from the quantum geometric tensor.
        :ref:`quantum-geom-tens-nb` : Jupyter notebook tutorial on quantum geometric tensor.

        Notes
        -----
        - The quantum geometric tensor captures both the Berry curvature (imaginary part)
          and the quantum metric (real part) of the occupied bands.
        - The plane indices use the combined coordinate ordering of k-space
          dimensions followed by swept parameters
          :math:`[k_0, ..., k_{\text{dim_k}}, \lambda_0, \lambda_1, ...]`.
          For example, in a 2D model with one swept parameter, the valid plane indices
          are ``0``, ``1``, and ``2``, where ``0`` and ``1`` refer to the two k-space
          dimensions, and ``2`` refers to the swept parameter axis. Swept parameters
          are those provided as array-like values in ``**params``. The order of
          swept parameters is determined by the order in which they appear
          in the ``**params`` keyword arguments.

        .. warning::
            - This requires a global energy gap between occupied and unoccupied bands.
            - The quantum geometric tensor is defined only when the total number of independent
              coordinates (crystal momenta plus varying parameters) is at least two,
              i.e. ``dim_k + n_params >= 2`` where ``n_params`` is the number of varying parameters
              set with lists of values.

        """
        v, ham = self._velocity(
            k_pts,
            cartesian=cartesian,
            flatten_spin_axis=True,
            param_periods=param_periods,
            diff_scheme=diff_scheme,
            diff_order=diff_order,
            _return_ham=True,
            **params,
        )  # (dim_k + dim_lam , Nk, *lam_shape, nstate, nstate)

        if v.shape[0] < 2:
            raise ValueError(
                "Quantum geometric tensor requires at least two independent "
                "coordinates (crystal momenta and/or varying parameters)."
            )

        eigvals, eigvecs = self._sol_ham(
            ham,
            return_eigvecs=True,
            flatten_spin_axis=True,
            use_tensorflow=use_tensorflow,
        )

        return self._quantum_geometric_tensor(
            v,
            eigvals,
            eigvecs,
            plane=plane,
            occ_idxs=occ_idxs,
            non_abelian=non_abelian,
            use_tensorflow=use_tensorflow,
        )



[docs]
    def berry_curvature(
        self,
        k_pts,
        occ_idxs: list[int] = None,
        plane: tuple[int, int] = None,
        *,
        cartesian: bool = False,
        non_abelian: bool = False,
        param_periods: dict[str, float] | None = None,
        diff_scheme: str = "central",
        diff_order: int = 2,
        use_tensorflow: bool = False,
        **params,
    ):
        r"""Compute the Berry curvature in energy eigenbasis via Kubo formula.

        The Berry curvature is computed as the anti-Hermitian part of the quantum
        geometric tensor :math:`Q_{\mu \nu}(k)` from :meth:`quantum_geometric_tensor`,
        i.e., in the non-Abelian case (``non_abelian=True``):

        .. math::

            \Omega_{\mu \nu;\ mn}(k) =  i \left( Q_{\mu \nu;\ mn}(k) - Q_{\mu \nu;\ nm}^*(k) \right)

        In the Abelian case (``non_abelian=False``), the Berry curvature is given by the
        band-trace of the above quantity. This reduces to the well-known expression for the
        Berry curvature in terms of the quantum geometric tensor.

        .. math::

           \Omega_{\mu \nu}(k) = -2 \mathrm{Im} \, Q_{\mu \nu}(k),

        By specifying the ``plane`` parameter, we choose a particular :math:`(\mu, \nu)` pair
        of the Berry curvature tensor to return.

        .. versionadded:: 2.0.0

        Parameters
        ----------
        k_pts : (Nk, dim_k) array-like
            Array of k-points with shape ``(Nk, dim_k)``, where ``Nk`` is the number of points
            and ``dim_k`` is the dimensionality of the k-space.
        occ_idxs : 1D array, optional
            Indices of the occupied bands. Defaults to the first half of the states.
        plane : tuple of int, optional
            Tuple of two integers specifying the plane in k-space for which to compute
            the curvature. If None (default), computes all components of the Berry
            curvature tensor. This will affect the shape of the returned array.
        cartesian : bool, optional
            If True, computes the velocity operator in Cartesian coordinates.
            Default is False (reduced coordinates). See :meth:`velocity` for details.
        non_abelian : bool, optional
            If True, returns the full Berry curvature tensor (non-abelian case).
            If False, returns the band-trace of the Berry curvature tensor (abelian case).
            Default is False. This will affect the shape of the returned array.
        param_periods : dict[str, float], optional
            Optional map ``{param_name: period}`` for swept parameters. When supplied,
            assumes the parameter is cyclic and trims any duplicated endpoints, or endpoints
            equal to the start plus the given period, before building finite-difference stencils.
            This can improve numerical accuracy by using centered differences throughout the parameter
            range. Otherwise, the function will use a backward difference at the endpoint and a forward
            difference at the start.
        diff_scheme : str, optional
            Finite difference scheme to use for parameter derivatives.
            Options are "central" (default) or "forward".
            This parameter is only relevant when passing varying parameters.
        diff_order : int, optional
            Order of accuracy for finite difference lambda derivatives.
            Must be an even integer for "central" scheme (default is ``4``),
            and a positive integer for "forward" scheme.
            This parameter is only relevant when passing varying parameters.
        use_tensorflow: bool, optional
            If True, will use TensorFlow to speed up linear algebra routines.
            Requires TensorFlow to be installed. Default is False.
        **params :
            Keyword arguments mapping parameter names to value(s). Each value can be a scalar
            or a 1D array of values. If any values are array-like,
            the Berry curvature is evaluated at all combinations of parameter values,
            and the final array is stacked with the k-axis leading, followed by each
            parameter axis in the order of given parameter names.

        Returns
        -------
        b_curv : np.ndarray
            Berry curvature tensor. Full shape is
            ``(dim_tot, dim_tot, Nk, Nparam1, Nparam2, ..., n_orb, n_orb)``,
            where ``dim_tot = dim_k + n_params`` is the total number of
            independent coordinates (crystal momenta plus varying parameters). If ``plane``
            is specified, the first two axes are indexed by the specified directions, and the
            shape is ``(Nk, Nparam1, Nparam2, ..., n_orb, n_orb)``. If ``non_abelian=False``,
            the returned array is the band-trace of the full tensor and the last
            two dimensions are contracted. The order of the parameter axes follows the order
            of the parameter names in ``**params``.

        See Also
        --------
        quantum_geometric_tensor : Computes the quantum geometric tensor.
        quantum_metric : Computes the quantum metric tensor.
        velocity : Computes the velocity operator used in the Kubo formula.
        :ref:`quantum-geom-tens-nb` : Jupyter notebook tutorial on quantum geometric tensor.

        Notes
        -----
        - The Berry curvature is computed using the Kubo formula, which
          requires knowledge of :math:`\partial_\mu H_k`. This operator
          is computed using the gradient of the Hamiltonian provided by :func:`velocity`.
        - Specifically, for :math:`(m,n) \in \text{occ}`, the non-Abelian Berry curvature tensor
          is given by (when ``non_abelian=True``):

          .. math::

            \Omega_{\mu \nu;\ mn}(k) =  i\sum_{l \notin \text{occ}}
            \frac{
                \langle u_{mk} | \partial_{\mu} H_k | u_{lk} \rangle
                \langle u_{lk} | \partial_{\nu} H_k | u_{nk} \rangle
                -
                m \leftrightarrow n
            }{
                (E_{nk} - E_{lk})(E_{mk} - E_{lk})
            }
        - This quantity is anti-symmetric under :math:`\mu \leftrightarrow \nu`.
        - When using parameter sweeps via ``params``, the Berry curvature is computed
          at all combinations of parameter values, and the resulting array has
          parameter axes added after the k-point axis in the output.
        - The plane indices use the combined coordinate ordering of k-space
          dimensions followed by swept parameters
          :math:`[k_0, ..., k_{\text{dim_k}}, \lambda_0, \lambda_1, ...]`.
          For example, in a 2D model with one swept parameter, the valid plane indices
          are ``0``, ``1``, and ``2``, where ``0`` and ``1`` refer to the two k-space
          dimensions, and ``2`` refers to the swept parameter axis. Swept parameters
          are those provided as array-like values in ``**params``. The order of
          swept parameters is determined by the order in which they appear
          in the ``**params`` keyword arguments.

        .. warning::
            - This requires a global energy gap between occupied and unoccupied bands.
            - The Berry curvature is defined only when the total number of independent
              coordinates (crystal momenta plus varying parameters) is at least two,
              i.e. ``dim_k + n_params >= 2`` where ``n_params`` is the number of varying parameters
              set with lists of values.
        """
        Q = self.quantum_geometric_tensor(
            k_pts,
            occ_idxs=occ_idxs,
            cartesian=cartesian,
            non_abelian=non_abelian,
            param_periods=param_periods,
            diff_scheme=diff_scheme,
            diff_order=diff_order,
            use_tensorflow=use_tensorflow,
            **params,
        )
        # Berry curvature is the anti-symmetric part of the quantum geometric tensor
        if non_abelian:
            Omega = 1j * (Q - np.swapaxes(Q, -1, -2).conj())
        else:
            Omega = -2 * Q.imag

        if plane is not None:
            # Restrict to specified plane
            mu, nu = plane
            Omega = Omega[mu, nu]
        return Omega



[docs]
    def quantum_metric(
        self,
        k_pts,
        occ_idxs: list[int] = None,
        plane: tuple[int, int] = None,
        *,
        cartesian: bool = False,
        non_abelian: bool = False,
        param_periods: dict[str, float] | None = None,
        diff_scheme: str = "central",
        diff_order: int = 2,
        use_tensorflow: bool = False,
        **params,
    ):
        r"""Quantum metric in the energy eigenbasis computed via Kubo formula.

        The quantum metric is computed as the Hermitian part of the quantum
        geometric tensor :math:`Q_{\mu \nu}(k)` from :meth:`quantum_geometric_tensor`,
        i.e., in the non-Abelian case (``non_abelian=True``):

        .. math::

            g_{\mu \nu;\ mn}(k) =  \frac{1}{2} \left( Q_{\mu \nu;\ mn}(k)  + Q_{\mu \nu;\ nm}^*(k) \right)

        In the Abelian case (``non_abelian=False``), the quantum metric is given by the
        band-trace of the above quantity. This reduces to the well-known expression for the
        quantum metric in terms of the quantum geometric tensor.

        .. math::

           g_{\mu \nu}(k) = \mathrm{Re} \, Q_{\mu \nu}(k),

        By specifying the ``plane`` parameter, we choose a particular :math:`(\mu, \nu)` pair
        of the Berry curvature tensor to return.

        .. versionadded:: 2.0.0

        Parameters
        ----------
        k_pts : (nk, dim_k) array-like
            Array of k-points with shape ``(nk, dim_k)``, where ``nk`` is the number of points
            and dim_k is the dimensionality of the k-space.
        occ_idxs : 1D array, optional
            Indices of the occupied bands. Defaults to the first half of the states.
        plane : tuple of int, optional
            Tuple of two integers specifying the plane in k-space for which to compute
            the curvature. If None (default),
            computes all components of the Berry curvature tensor. This
            will affect the shape of the returned array.
        cartesian : bool, optional
            If True, computes the velocity operator in Cartesian coordinates.
            Default is False (reduced coordinates).
        non_abelian : bool, optional
            If True, returns the full Berry curvature tensor (non-abelian case).
            If False, returns the band-trace of the Berry curvature tensor (abelian case).
            Default is False. This will affect the shape of the returned array.
        param_periods : dict[str, float], optional
            Optional map ``{param_name: period}`` for swept parameters. When supplied,
            assumes the parameter is cyclic and trims any duplicated endpoints, or endpoints
            equal to the start plus the given period, before building finite-difference stencils.
            This can improve numerical accuracy by using centered differences throughout the parameter
            range. Otherwise, the function will use a backward difference at the endpoint and a forward
            difference at the start.
        diff_scheme : str, optional
            Finite difference scheme to use for parameter derivatives.
            Options are "central" (default) or "forward".
            This parameter is only relevant when passing varying parameters.
        diff_order : int, optional
            Order of accuracy for finite difference lambda derivatives.
            Must be an even integer for "central" scheme (default is ``4``),
            and a positive integer for "forward" scheme.
            This parameter is only relevant when passing varying parameters.
        use_tensorflow: bool, optional
            If True, will use TensorFlow to speed up linear algebra routines.
            Requires TensorFlow to be installed. Default is False.
        **params :
            Keyword arguments mapping parameter names to value(s). Each value can be a scalar
            or a 1D array of values. If any values are array-like,
            the quantum metric is evaluated at all combinations of parameter values,
            and the final array is stacked with the k-axis leading, followed by each
            parameter axis in the order of given parameter names.

        Returns
        -------
        g : np.ndarray
            Quantum metric tensor. Full shape is
            ``(dim_tot, dim_tot, Nk, Nparam1, Nparam2, ..., n_orb, n_orb)``,
            where ``dim_tot = dim_k + n_params`` is the total number of
            independent coordinates (crystal momenta plus varying parameters). If ``plane``
            is specified, the first two axes are indexed by the specified directions, and the
            shape is ``(Nk, Nparam1, Nparam2, ..., n_orb, n_orb)``. If ``non_abelian=False``,
            the returned array is the band-trace of the full tensor and the last
            two dimensions are contracted. The order of the parameter axes follows the order
            of the parameter names in ``**params``.

        See Also
        --------
        quantum_geometric_tensor
        berry_curvature
        velocity
        :ref:`quantum-geom-tens-nb` : Jupyter notebook tutorial on quantum geometric tensor.

        Notes
        -----
        - The quantum metric is computed using the Kubo formula, which
          requires knowledge of :math:`\partial_\mu H_k`. This operator
          is computed using the gradient of the Hamiltonian provided by :func:`velocity`.
        - Specifically, for :math:`(m,n) \in \text{occ}`, the non-Abelian quantum metric tensor
          is given by (when ``non_abelian=True``):

          .. math::

            g_{\mu \nu;\ mn}(k) =  \frac{1}{2} \sum_{l \notin \text{occ}}
            \frac{
                \langle u_{mk} | \partial_{\mu} H_k | u_{lk} \rangle
                \langle u_{lk} | \partial_{\nu} H_k | u_{nk} \rangle
                +
                m \leftrightarrow n
            }{
                (E_{nk} - E_{lk})(E_{mk} - E_{lk})
            }

        - This quantity is symmetric under :math:`\mu \leftrightarrow \nu`.
        - When using parameter sweeps via ``params``, the quantum metric is computed
          at all combinations of parameter values, and the resulting array has
          parameter axes added after the k-point axis in the output.
        - The plane indices use the combined coordinate ordering of k-space
          dimensions followed by swept parameters
          :math:`[k_0, ..., k_{\text{dim_k}}, \lambda_0, \lambda_1, ...]`.
          For example, in a 2D model with one swept parameter, the valid plane indices
          are ``0``, ``1``, and ``2``, where ``0`` and ``1`` refer to the two k-space
          dimensions, and ``2`` refers to the swept parameter axis. Swept parameters
          are those provided as array-like values in ``**params``. The order of
          swept parameters is determined by the order in which they appear
          in the ``**params`` keyword arguments.

        .. warning::
            - This requires a global energy gap between occupied and unoccupied bands.
            - The quantum metric is defined only when the total number of independent
              coordinates (crystal momenta plus varying parameters) is at least two,
              i.e. ``dim_k + n_params >= 2`` where ``n_params`` is the number of varying parameters
              set with lists of values.
        """
        Q = self.quantum_geometric_tensor(
            k_pts,
            occ_idxs=occ_idxs,
            cartesian=cartesian,
            non_abelian=non_abelian,
            param_periods=param_periods,
            diff_scheme=diff_scheme,
            diff_order=diff_order,
            use_tensorflow=use_tensorflow,
            **params,
        )

        if non_abelian:
            # Quantum metric is the symmetric part of the quantum geometric tensor
            g = (1 / 2) * (Q + Q.swapaxes(-1, -2))
        else:
            g = Q.real
        if plane is not None:
            mu, nu = plane
            g = g[mu, nu]
        return g



[docs]
    def axion_angle(
        self,
        nks: tuple[int, int, int] = (20, 20, 20),
        occ_idxs=None,
        return_second_chern: bool = False,
        *,
        param_periods: dict[str, float] | None = None,
        diff_scheme: str = "central",
        diff_order: int = 4,
        use_tensorflow: bool = False,
        **params,
    ):
        r"""Axion angle via the second Chern form.

        Computes the axion angle for a 3D bulk model that depends
        on a single adiabatic parameter :math:`\lambda`. This is computed
        using the gauge-invariant 4-curvature formulation:

        .. math::
            \theta(\lambda) = \frac{1}{16\pi} \int_0^{\lambda} d\lambda'
            \int_{\text{BZ}} d^3k \,
            \epsilon^{\mu\nu\rho\sigma} \mathrm{Tr} \left[
                \Omega_{\mu\nu}(\mathbf{k}, \lambda')
                \Omega_{\rho\sigma}(\mathbf{k}, \lambda')
            \right]

        where :math:`\mu, \nu, \rho, \sigma` run over the three reciprocal-space
        directions and the adiabatic parameter :math:`\lambda`, and
        :math:`\Omega_{\mu\nu}` is the non-Abelian Berry curvature
        tensor over the occupied states.

        When the parameter :math:`\lambda` is cyclic (e.g., an angle variable),
        the change in :math:`\theta` over one full cycle is quantized
        in units of :math:`2\pi`, with the integer multiple given by the
        second Chern number :math:`C_2`:

        .. math::
            \Delta \theta = \theta(\lambda + P) - \theta(\lambda)
            = 2\pi C_2,

        where :math:`P` is the period of :math:`\lambda`.

        .. versionadded:: 2.0.0

        Parameters
        ----------
        nks : tuple[int, int, int], optional
            Number of reduced k-points along each reciprocal axis.  All axes are treated
            as periodic and sampled uniformly in ``[0, 1)``.
        occ_idxs : array_like, optional
            Explicit list of occupied band indices.  If omitted, all bands below the gap
            are used, consistent with other bulk invariants.
        return_second_chern : bool, optional
            If ``True``, return the second Chern number :math:`C_2` alongside :math:`\theta(\lambda)`.
            This corresponds to the integer winding number of the axion angle over a full
            cycle of the adiabatic parameter.
        param_periods : dict[str, float], optional
            Optional map ``{param_name: period}`` for swept parameters. When supplied,
            assumes the parameter is cyclic and trims any duplicated endpoints, or endpoints
            equal to the start plus the given period, before building finite-difference stencils.
            This can improve numerical accuracy by using centered differences throughout the parameter
            range. Otherwise, the function will use a backward difference at the endpoint and a forward
            difference at the start.
        diff_scheme : {"central", "forward"}, optional
            Finite-difference stencil for the adiabatic derivative passed to
            :meth:`berry_curvature`.  Defaults to ``"central"``.
        diff_order : int, optional
            Order of the finite-difference scheme (must be even for ``"central"`` stencils).
        use_tensorflow : bool, optional
            Forwarded to :meth:`berry_curvature`; set ``True`` to accelerate large grids on
            GPU if TensorFlow is installed.
        **params :
            Keyword arguments mapping parameter names to value(s). Exactly one parameter
            must be supplied with an array of values to sweep the adiabatic parameter
            :math:`\lambda`. All other parameters must be scalar-valued.

        Returns
        -------
        lambdas : np.ndarray
            The :math:`\lambda` samples (including the closing point).
        theta : float
            Axion angle :math:`\theta(\lambda)` wrapped into :math:`[0, 2\pi)`.
        c2 : float, optional
            Second Chern number. Only returned when ``return_second_chern=True``.

        See Also
        --------
        berry_curvature : Computes the Berry curvature tensor used in the integrand.
        :ref:`axion-fkm-nb` : Example notebook demonstrating axion angle calculation.

        Notes
        -----
        - Requires a fully periodic three-dimensional model (``dim_k == 3``).
        - The adiabatic parameter sweep must be one-dimensional (exactly one parameter
          supplied with an array of values).
        - The k-grid is constructed uniformly in reduced coordinates over the
          full Brillouin zone.
        - The axion angle is computed using the gauge-invariant 4-curvature formulation,
          which doesn't require fixing a smooth gauge like the Chern-Simons 3-form approach.
        - The plane indices use the combined coordinate ordering of k-space
          dimensions followed by swept parameters
          :math:`[k_0, ..., k_{\text{dim_k}}, \lambda_0, \lambda_1, ...]`.
          For example, in a 2D model with one swept parameter, the valid plane indices
          are ``0``, ``1``, and ``2``, where ``0`` and ``1`` refer to the two k-space
          dimensions, and ``2`` refers to the swept parameter axis. Swept parameters
          are those provided as array-like values in ``**params``. The order of
          swept parameters is determined by the order in which they appear
          in the ``**params`` keyword arguments.
        """
        if self.dim_k != 3:
            raise ValueError(
                "axion_angle requires a three-dimensional periodic model (dim_k == 3)."
            )

        if not params:
            raise ValueError(
                "axion_angle requires sweeping a single adiabatic parameter; supply param and lambda_values."
            )

        params = dict(params)
        self._check_missing_parameters(params)

        scalars, sweep_names, sweep_values = self._params_to_sweep(params)

        # Take first and only swept parameter as adiabatic axis
        if len(sweep_names) != 1:
            raise ValueError(
                "axion_angle expects exactly one swept (array-valued) parameter."
            )
        sweep_name = sweep_names[0]
        lambda_vals_raw = np.asarray(sweep_values[0], dtype=float)

        # Trim end points if they duplicate the start (periodic)
        period_dict = param_periods or {}
        logger.debug(
            "axion_angle: normalizing adiabatic parameter axis '%s'.", sweep_name
        )
        lambda_vals, step_lambda, is_cyclic, trimmed = self._normalize_parameter_axis(
            lambda_vals_raw,
            name=sweep_name,
            period=period_dict.get(sweep_name, None),
        )
        sweep_values[0] = list(lambda_vals)

        nkx, nky, nkz = map(int, nks)
        if min(nkx, nky, nkz) < 2:
            raise ValueError("Each k-axis must contain at least two points.")

        # Build uniform reduced k-grid in [0, 1)
        k_axes = [np.linspace(0.0, 1.0, n, endpoint=False) for n in (nkx, nky, nkz)]
        k_grid = np.stack(np.meshgrid(*k_axes, indexing="ij"), axis=-1).reshape(
            -1, self.dim_k
        )

        # Assemble kwargs for berry_curvature (scalars + the sweep)
        bc_kwargs = {name: value for name, value in scalars.items()}
        bc_kwargs[sweep_name] = lambda_vals

        # evaluate the non-Abelian 4D Berry curvature
        logger.debug(
            "axion_angle: computing Berry curvature on %d x %d x %d x %d grid",
            nkx,
            nky,
            nkz,
            lambda_vals.size,
        )
        curvature = self.berry_curvature(
            k_grid,
            occ_idxs=occ_idxs,
            non_abelian=True,
            param_periods=param_periods,
            diff_scheme=diff_scheme,
            diff_order=diff_order,
            use_tensorflow=use_tensorflow,
            **bc_kwargs,
        )

        epsilon = levi_civita(4, 4).astype(curvature.dtype, copy=False)
        c2_density = np.einsum(
            "ijkl,ij...mn,kl...nm->...", epsilon, curvature, curvature
        ).real
        c2_density = c2_density.reshape(nkx, nky, nkz, lambda_vals.size)

        # sum over the k-space slab to obtain per-lambda slices
        d_lambda = c2_density.sum(axis=(0, 1, 2))

        # integration weights
        delta_k = 1.0 / (nkx * nky * nkz)
        # 4-volume element: (1/Nk)^3 * delta_lambda (k sampled in reduced units)
        volume_element = delta_k * step_lambda

        # second Chern number from full integral over closed 4D manifold
        # NOTE: shouldn't include endpoints (trimmed already)
        c2 = (volume_element / (32.0 * np.pi**2)) * d_lambda.sum()

        # cumulative trapezoid along parameter
        pref = volume_element / (16.0 * np.pi)
        cumulative = np.empty_like(d_lambda, dtype=float)
        cumulative[0] = 0.0
        if d_lambda.size > 1:
            mids = 0.5 * (d_lambda[:-1] + d_lambda[1:])
            cumulative[1:] = np.cumsum(mids) * pref

        if is_cyclic and trimmed:
            logger.debug(
                "axion_angle: Appending endpoint to axion angle for trimmed cyclic parameter sweep."
            )
            theta_ep = cumulative[-1] + pref * 0.5 * (d_lambda[-1] + d_lambda[0])
            lambdas_total = np.append(
                lambda_vals, lambda_vals[0] + step_lambda * lambda_vals.size
            )
            theta_total = np.append(cumulative, theta_ep)
        else:
            lambdas_total = lambda_vals.copy()
            theta_total = cumulative

        # wrap theta into [0, 2*pi)
        thetas_wrapped = np.unwrap(theta_total, period=2.0 * np.pi)

        outputs = [lambdas_total, thetas_wrapped]
        if return_second_chern:
            outputs.append(c2.real)

        return outputs[0] if len(outputs) == 1 else tuple(outputs)



[docs]
    def chern_number(
        self,
        plane: tuple[int, int],
        nks: tuple[int, ...],
        occ_idxs: list[int] = None,
        *,
        param_periods: dict[str, float] | None = None,
        diff_scheme: str = "central",
        diff_order: int = 4,
        use_tensorflow: bool = False,
        **params,
    ):
        r"""Compute the Chern number on the specified plane.

        The Chern number is computed by integrating the Berry curvature
        over a surface defined by ``plane`` parameter.
        The Chern number is given by

        .. math::
            C_{\mu\nu} = \frac{1}{2\pi} \int_{\mathcal{S}_{\mu\nu}}
            \Omega_{\mu\nu}(\boldsymbol{\kappa}) \,
            d\kappa_\mu\, d\kappa_\nu

        where :math:`\mathcal{S}_{\mu\nu}` denotes the two-dimensional plane in
        the combined k/parameter space, and :math:`\boldsymbol{\kappa}` is the combined
        coordinate vector including both crystal momenta and swept parameters.
        Here, :math:`\Omega_{\mu\nu}(\boldsymbol{\kappa})` is the trace of the
        Berry curvature tensor over the occupied bands.

        .. versionadded:: 2.0.0

        Parameters
        ----------
        plane : tuple[int, int]
            Two distinct indices identifying the directions to integrate.
            Indices below ``dim_k`` refer to k-space axes, higher indices refer
            to swept parameters supplied via ``**params``.
        nks : tuple[int, int]
            Number of k samples along each periodic direction. Length must
            equal ``dim_k``. If the any k-directions are spectators, meaning
            they are not part of the ``plane``, they are still sampled
            uniformly in ``[0, 1)`` but the number of samples does not affect
            the Chern number result. The returned array will the Chern number
            for each spectator k-point and/or swept parameter combination.
        occ_idxs : array-like, optional
            Occupied-band indices used in the Berry-curvature calculation.
            Defaults to the lower half of the spectrum.
        param_periods : dict[str, float], optional
            Optional map ``{param_name: period}`` for swept parameters. When supplied,
            assumes the parameter is cyclic and trims any duplicated endpoints, or endpoints
            equal to the start plus the given period, before building finite-difference stencils.
            This can improve numerical accuracy by using centered differences throughout the parameter
            range. Otherwise, the function will use a backward difference at the endpoint and a forward
            difference at the start.
        diff_scheme : {'central', 'forward'}, optional
            Finite-difference stencil passed through to :meth:`berry_curvature`.
        diff_order : int, optional
            Accuracy order for the finite-difference stencil (even for
            ``'central'`` schemes). Default is 4.
        use_tensorflow: bool, optional
            Forwarded to :meth:`berry_curvature`; enables GPU evaluation if
            TensorFlow is available.
        **params :
            Parameter assignments. Scalars fix a parameter value; 1D arrays
            define sweeps. Swept axes appear as spectator dimensions in the
            returned array unless they are part of the integration plane.

        Returns
        -------
        float or np.ndarray
            Chern number(s) evaluated on the spectator grid. A scalar is
            returned when no spectator axes remain; otherwise the array shape
            matches the Cartesian product of the spectator coordinates.

        See Also
        --------
        berry_curvature : Computes the Berry curvature used in the integrand.

        Notes
        -----
        - The plane indices use the combined coordinate ordering of k-space
          dimensions followed by swept parameters
          :math:`[k_0, ..., k_{\text{dim_k}}, \lambda_0, \lambda_1, ...]`.
          For example, in a 2D model with one swept parameter, the valid plane indices
          are ``0``, ``1``, and ``2``, where ``0`` and ``1`` refer to the two k-space
          dimensions, and ``2`` refers to the swept parameter axis. Swept parameters
          are those provided as array-like values in ``**params``. The order of
          swept parameters is determined by the order in which they appear
          in the ``**params`` keyword arguments.
        - The routine reuses :meth:`berry_curvature` to obtain
          :math:`\Omega_{\mu\nu}` and performs the discrete integral for the
          selected plane. The occupied manifold must stay gapped over the entire
          integration region for the result to converge to an (approximate) integer.
        - The Chern number is only defined when the total number of independent
          coordinates (crystal momenta plus varying parameters) is at least two,
          i.e. ``dim_k + n_params >= 2`` where ``n_params`` is the number of
          parameters set with lists of values.
        - The Chern number is only guaranteed to be an integer in the limit
          of dense k-meshes and when the plane of integration forms a closed
          manifold (e.g., a Brillouin zone or a periodic parameter).
        """
        if len(nks) != self.dim_k:
            raise ValueError("nks must provide one entry per periodic direction.")
        if not (isinstance(plane, tuple) and len(plane) == 2):
            raise ValueError("plane must be a tuple of two axis indices.")
        mu, nu = plane
        if mu == nu:
            raise ValueError("Chern number plane indices must be different.")

        params = dict(params)
        self._check_missing_parameters(params)
        scalars, sweep_names, sweep_axes = self._params_to_sweep(params)
        param_periods = dict(param_periods or {})

        param_steps: list[float] = []
        param_lengths: list[int] = []
        param_trimmed: list[bool] = []
        eval_kwargs = scalars.copy()

        # Inspect each parameter sweep. _normalize_parameter_axis returns the unique
        # grid (trimmed if cyclic) plus the uniform spacing. We call it to obtain
        # spacing metadata, but we still evaluate the curvature on the *raw* grid
        # so "spectator" axes (not integrated) see exactly the points they requested.
        for name, axis_vals in zip(sweep_names, sweep_axes, strict=True):
            values = np.asarray(axis_vals, dtype=float)
            if values.ndim != 1 or values.size < 2:
                raise ValueError(
                    f"Swept parameter '{name}' must be a 1D array with at least two samples."
                )
            normalized, step, periodic, trimmed = self._normalize_parameter_axis(
                values,
                name=name,
                period=param_periods.get(name),
            )
            eval_kwargs[name] = values
            param_steps.append(step)
            param_lengths.append(values.size)
            param_trimmed.append(bool(periodic and trimmed))

        # Build a uniform k-mesh without endpoints so the BZ wrap is not double-counted.
        k_grid = self.k_uniform_mesh(nks, include_endpoints=False)

        # Berry curvature gives us Omega_{mu, nu}(k, p1, ...) for every pair mu,nu. We ask for the
        # full tensor (plane=None) because we may integrate over any combination later.
        curvature = self.berry_curvature(
            k_pts=k_grid,
            occ_idxs=occ_idxs,
            plane=None,
            cartesian=False,
            non_abelian=False,
            param_periods=param_periods,
            diff_scheme=diff_scheme,
            diff_order=diff_order,
            use_tensorflow=use_tensorflow,
            **eval_kwargs,
        )

        curvature = np.asarray(curvature, dtype=float)
        dim_total = curvature.shape[0]
        if any(idx < 0 or idx >= dim_total for idx in (mu, nu)):
            raise ValueError(
                f"plane indices {plane} exceed available coordinate directions ({dim_total})."
            )

        axis_lengths = [int(n) for n in nks] + param_lengths
        # Reshape curvature to (dim_total, dim_total, nk1, nk2, ..., param1, param2, ...)
        curvature = curvature.reshape(dim_total, dim_total, *axis_lengths)

        # Extract the (mu, nu) component to integrate
        component = curvature[mu, nu]
        # Move mu, nu to leading axes for easier integration
        component = np.moveaxis(component, (mu, nu), (0, 1))

        len_mu = axis_lengths[mu]
        len_nu = axis_lengths[nu]

        # If a parameter axis is being integrated and the sweep
        # was cyclic, drop the duplicated endpoint before summing. Spectator axes
        # keep their full length so the return matches the caller’s grid.
        if mu >= self.dim_k and param_trimmed[mu - self.dim_k]:
            component = component[:-1, ...]
            len_mu -= 1
        if nu >= self.dim_k and param_trimmed[nu - self.dim_k]:
            component = component[:, :-1, ...]
            len_nu -= 1

        spectator_axes = [ax for ax in range(len(axis_lengths)) if ax not in (mu, nu)]
        spectator_lengths = [axis_lengths[ax] for ax in spectator_axes]
        component = component.reshape(len_mu, len_nu, *spectator_lengths)

        # Plaquette area in each direction: k-axes are spaced by 1/nk (reduced units).
        def _step(idx: int) -> float:
            if idx < self.dim_k:
                return 1.0 / nks[idx]
            return param_steps[idx - self.dim_k]

        area = _step(mu) * _step(nu) / (2.0 * np.pi)
        integrated = component.sum(axis=(0, 1)) * area

        if spectator_lengths:
            return np.real_if_close(integrated.reshape(spectator_lengths))
        return float(np.real_if_close(integrated))


    @staticmethod
    def _permutation_sign(indices: list[int]) -> int:
        perm = list(indices)
        sign = 1
        for i in range(len(perm)):
            for j in range(i + 1, len(perm)):
                if perm[i] > perm[j]:
                    perm[i], perm[j] = perm[j], perm[i]
                    sign *= -1
        return sign

    # TODO: Handle params lists

[docs]
    def local_chern_marker(
        self,
        occ_idxs=None,
        return_bulk_avg: bool = False,
        trim_cells: int = 4,
        **params,
    ):
        r"""Bianco-Resta local Chern marker.

        The local Chern marker is a real-space diagnostic of topology,
        assigning to each orbital/site a scalar quantity that reflects the
        topological character of the occupied bands. It is defined as

        .. math::
            C(\boldsymbol{\tau}_i) = \frac{4\pi}{{A_\text{cell}}}\,
            \mathrm{Im} \; \langle \phi_i |
            \mathcal{P} \left[ X,\mathcal{P} \right]\left[Y,\mathcal{P}\right]
            | \phi_i \rangle ,

        where :math:`\mathcal{P}` is the projector onto the occupied subspace,
        :math:`X,Y` are the single-particle position operators and
        :math:`|\phi_i\rangle` is the orbital basis state at site
        :math:`\boldsymbol{\tau}_i`.

        This quantity is intensive: when normalized by the unit-cell volume,
        its spatial average converges to the total Chern number of the occupied
        manifold in the crystalline case [1]_.

        .. versionadded:: 2.0.0

        Parameters
        ----------
        occ_idxs : array-like, optional
            Indices of the occupied bands. If none are provided,
            the lower half bands are considered occupied.
        return_bulk_avg : bool, optional
            If True, also returns the bulk-averaged Chern number
            computed from the local Chern marker. Default is False.
        trim_cells : int, optional
            Number of unit cells to trim from each edge when computing
            the bulk-averaged Chern number. Default is 4.

        Returns
        -------
        C_local : np.ndarray of shape (norb,)
            Per-site local Chern marker.
        C_bulk_avg : float, optional
            Bulk-averaged Chern number computed from local Chern marker.
            Returned only if `return_bulk_avg` is True.

        See Also
        --------
        chern_number : Computes the total Chern number via Berry curvature integration.
        :ref:`local-chern-nb` : Jupyter notebook tutorial on local Chern marker.

        References
        ----------
        .. [1] R. Bianco and R. Resta, "Mapping topological order in coordinate space",
               Phys. Rev. B 84, 241106(R) (2011).
        """
        if self.dim_k != 0:
            raise ValueError(
                "Local Chern marker is only defined for real-space models (dim_k=0)."
            )
        if self.dim_r != 2:
            raise NotImplementedError(
                "Local Chern marker is only defined for 2D models (dim_r=2)."
            )

        H = self.hamiltonian(flatten_spin_axis=True, **params)  # (..., N, N) dense
        N = H.shape[-1]
        r_cart = self.get_orb_vecs(cartesian=True)  # (N, 2)
        if r_cart.ndim != 2 or r_cart.shape[1] != 2 or r_cart.shape[0] != N:
            raise ValueError("Could not get orbital coordinates in Cartesian basis.")
        x = r_cart[:, 0]
        y = r_cart[:, 1]

        # Dense eigensolve and projector
        _, evecs = np.linalg.eigh(H)  # returns sorted ascending
        if occ_idxs is None:
            # Default to half filling (robust for particle-hole symmetric models like Haldane).
            occ_idxs = np.arange(N // 2)
        else:
            occ_idxs = np.asarray(occ_idxs, int)

        Uocc = evecs[..., occ_idxs]  # (N, k_occ)
        P = Uocc @ Uocc.conj().T  # (N,N) dense projector

        DX = x[:, None] - x[None, :]
        DY = y[:, None] - y[None, :]
        CX = DX * P
        CY = DY * P

        # A = P [X,P][Y,P]
        A = P @ (CX @ CY)

        # Local marker from diagonal of A
        A_cell = self.cell_volume
        C_local = (4 * np.pi / A_cell) * np.imag(np.diag(A))

        if not return_bulk_avg:
            return C_local

        Lx = self.lattice.nsuper[0]
        Ly = self.lattice.nsuper[1]

        # number of orbitals per Bravais cell (handles spin implicitly via N)
        if N % (Lx * Ly) != 0:
            raise ValueError(
                f"N={N} not divisible by Lx*Ly={Lx * Ly}; "
                "cannot aggregate per-cell markers."
            )

        # Per-cell marker by summing orbitals belonging to the same cell
        # (use fractional positions to infer integer cell index robustly)
        r_frac = self.get_orb_vecs(cartesian=False)  # (N, 2)

        # Per-cell fractional centers (average over orbitals of each cell)
        # We don't assume any orbitals ordering; we infer cell indices by rounding.
        # Compute approximate cell indices using fractional coords:
        # Step 1: reshape a best-guess to estimate the internal offset
        # If ordering is arbitrary, estimate offset from all orbitals:
        offset = np.mod(r_frac, 1.0).mean(axis=0)
        ij_float = r_frac - offset  # ~ integers (ix, iy) per orbital
        ij = np.rint(ij_float).astype(int)
        ix = np.mod(ij[:, 0], Lx)
        iy = np.mod(ij[:, 1], Ly)
        lin = ix + Lx * iy  # linear cell index in C-order (ix fastest)

        # Aggregate per-cell local marker
        marker_cell = np.zeros(Lx * Ly, dtype=C_local.dtype)
        np.add.at(marker_cell, lin, C_local)

        # Normalize trim argument
        if isinstance(trim_cells, int):
            tx = ty = int(trim_cells)
        else:
            tx, ty = map(int, trim_cells)
        tx = max(0, tx)
        ty = max(0, ty)
        if 2 * tx >= Lx or 2 * ty >= Ly:
            raise ValueError(f"trim_cells={trim_cells} too large for grid {(Lx, Ly)}")

        # Build mask over interior cells (C-order indexing)
        IX, IY = np.meshgrid(np.arange(Lx), np.arange(Ly), indexing="xy")
        mask = (
            (IX.ravel() >= tx)
            & (IX.ravel() < Lx - tx)
            & (IY.ravel() >= ty)
            & (IY.ravel() < Ly - ty)
        )

        C_bulk_avg = marker_cell[mask].mean()

        return C_local, C_bulk_avg



[docs]
    def position_matrix(self, evecs: np.ndarray, pos_dir: int):
        r"""Position operator matrix elements

        Returns matrix elements of the position operator along
        direction ``pos_dir`` for eigenvectors ``evecs`` at a single k-point.
        Position operator is defined in reduced coordinates.

        The returned object :math:`X` is

        .. math::

          X_{m n {\bf k}}^{\alpha} = \langle u_{m {\bf k}} \vert
          r^{\alpha} \vert u_{n {\bf k}} \rangle

        Here :math:`r^{\alpha}` is the position operator along direction
        :math:`\alpha` that is selected by ``pos_dir``.

        Parameters
        ----------
        evecs : np.ndarray
            Eigenvectors for which we are computing matrix
            elements of the position operator.  The shape of this array
            is ``evecs[band, orbital]`` if ``spinful=False`` and
            ``evecs[band, orbital, spin]`` if ``spinful=True``.

            .. versionchanged:: 2.0.0
                Parameter ``evec`` renamed to ``evecs`` to clarify that multiple
                eigenvectors can be passed at once.

        pos_dir : int
            Direction along which we are computing the center.
            This integer must not be one of the periodic directions
            since position operator matrix element in that case is not
            well defined.

            .. versionchanged:: 2.0.0
                Parameter ``dir`` renamed to ``pos_dir`` to avoid conflict
                with built-in function ``dir()``.

        Returns
        -------
        pos_mat : np.ndarray
            Position operator matrix :math:`X_{m n}` as defined above.
            This is a square matrix with size determined by number of bands
            given in `evec` input array.  First index of `pos_mat` corresponds to
            bra vector (:math:`m`) and second index to ket (:math:`n`).

        See Also
        --------
        :ref:`haldane-hwf-nb` : For an example.

        Examples
        --------
        Diagonalizes Hamiltonian at some k-points

        >>> (evals, evecs) = my_model.solve_ham(k_vec, return_eigvecs=True)

        Computes position operator matrix elements for 3-rd kpoint
        and bottom five bands along first coordinate

        >>> pos_mat = my_model.position_matrix(evecs[2, :5], 0)

        """

        # make sure specified direction is not periodic!
        if pos_dir in self.periodic_dirs:
            raise ValueError(
                "Can not compute position matrix elements along periodic direction!"
            )
        # make sure direction is not out of range
        if pos_dir < 0 or pos_dir >= self.dim_r:
            raise ValueError("Direction out of range!")

        # check if model came from w90
        if not self.assume_position_operator_diagonal:
            _offdiag_approximation_warning_and_stop()

        # check shape of evec
        if not isinstance(evecs, np.ndarray):
            raise TypeError("evec must be a numpy array.")
        # check number of dimensions of evec
        if not self.spinful:
            if evecs.ndim != 2:
                raise ValueError(
                    "evec must be a 2D array with shape (band, orbital) for spinless models."
                )
        elif self.spinful:
            if evecs.ndim != 3:
                raise ValueError(
                    "evec must be a 3D array with shape (band, orbital, spin) for spinful models."
                )

        # get coordinates of orbitals along the specified direction
        pos_tmp = self.orb_vecs[:, pos_dir]
        # reshape arrays in the case of spinful calculation
        if self.spinful:
            # tile along spin direction if needed
            pos_use = np.tile(pos_tmp, (2, 1)).transpose().flatten()
            evec_use = evecs.reshape(evecs.shape[0], -1)  # flatten spin index
        else:
            pos_use = pos_tmp
            evec_use = evecs

        # <u_i | r | u_j> = sum_orb r_orb u_i*(orb) u_j(orb)
        pos_mat = np.einsum("im,m,jm->ij", evec_use.conj(), pos_use, evec_use)

        # make sure matrix is Hermitian
        if not np.allclose(pos_mat, pos_mat.T.conj()):
            raise ValueError("Position matrix is not Hermitian.")

        return pos_mat



[docs]
    def position_expectation(self, evecs: np.ndarray, pos_dir: int):
        r"""Returns diagonal matrix elements of the position operator.

        These elements :math:`X_{n n}` can be interpreted as an
        average position of n-th Bloch state ``evec[n]`` along
        direction `dir`.

        Parameters
        ----------
        evecs : np.ndarray
            Eigenvectors for which we are computing matrix
            elements of the position operator. The shape of this array
            is ``evecs[band, orbital]`` if ``spinful=True`` and
            ``evecs[band, orbital, spin]`` if ``spinful=False``.

            .. versionchanged:: 2.0.0
                Parameter ```evec`` renamed to ``evecs`` to clarify that multiple
                eigenvectors can be passed at once.

        pos_dir : int
            Direction along which we are computing matrix
            elements. This integer must *not* be one of the periodic
            directions since position operator matrix element in that
            case is not well defined.

            .. versionchanged:: 2.0.0
                Parameter ``dir`` renamed to ``pos_dir`` to avoid conflict
                with built-in function ``dir()``.

        Returns
        -------
        pos_exp : np.ndarray
            Diagonal elements of the position operator matrix :math:`X`.
            Length of this vector is determined by number of bands given in *evec* input
            array.

        See Also
        --------
        :ref:`haldane-hwf-nb` : For an example.
        position_matrix : For definition of matrix :math:`X`.

        Notes
        -----
        Generally speaking these centers are _not_
        hybrid Wannier function centers (which are instead
        returned by :func:`TBModel.position_hwf`).

        Examples
        --------
        Diagonalizes Hamiltonian at some k-points

        >>> (evals, evecs) = my_model.solve_ham(k_vec, return_eigvecs=True)

        Computes average position for 3-rd kpoint
        and bottom five bands along first coordinate

        >>> pos_exp = my_model.position_expectation(evecs[2, :5], 0)

        """

        # check if model came from w90
        if not self.assume_position_operator_diagonal:
            _offdiag_approximation_warning_and_stop()

        pos_exp = self.position_matrix(evecs=evecs, pos_dir=pos_dir).diagonal()
        return np.array(np.real(pos_exp), dtype=float)



[docs]
    def position_hwf(
        self, evecs: np.ndarray, pos_dir: int, hwf_evec=False, basis="orbital"
    ):
        r"""Eigenvalues and eigenvectors of the position operator

        Returns eigenvalues and optionally eigenvectors of the
        position operator matrix :math:`X` in basis of the orbitals
        or, optionally, of the input wave functions (typically Bloch
        functions). The returned eigenvectors can be interpreted as
        linear combinations of the input states ``evec`` that have
        minimal extent (or spread :math:`\Omega` in the sense of
        maximally localized Wannier functions) along direction
        ``dir``. The eigenvalues are average positions of these
        localized states.

        Parameters
        ----------
        evecs : np.ndarray
            Eigenvectors for which we are computing matrix
            elements of the position operator. The shape of this array
            is ``evecs[band, orbital]`` if ``spinful=True`` and
            ``evecs[band, orbital, spin]`` if ``spinful=False``.

            .. versionchanged:: 2.0.0
                Parameter ``evec`` renamed to ``evecs`` to clarify that multiple
                eigenvectors can be passed at once.

        pos_dir : int
            Direction along which we are computing matrix
            elements. This integer must not be one of the periodic
            directions since position operator matrix element in that
            case is not well defined.

            .. versionchanged:: 2.0.0
                Parameter ``dir`` renamed to ``pos_dir`` to avoid conflict
                with built-in function ``dir()``.

        hwf_evec : bool, optional
            Default is ``False``. If set to ``True`` this function will
            return not only eigenvalues but also eigenvectors of :math:`X`.
        basis : {"orbital", "wavefunction", "bloch"}, optional
            Default is "orbital". If ``basis="wavefunction"`` or ``basis="bloch"``, the hybrid
            Wannier function `hwf` is returned in the basis of the input
            wave functions. That is, the elements of ``hwf[i, j]`` give the amplitudes
            of the i-th hybrid Wannier function on the j-th input state.
            If ``basis="orbital"``, the elements of ``hwf[i, orb]`` (or ``hwf[i, orb, spin]``
            if ``spinful=True``) give the amplitudes of the i-th hybrid Wannier function on
            the specified basis function.

        Returns
        -------
        hwfc : np.ndarray
            Eigenvalues of the position operator matrix :math:`X`
            (also called hybrid Wannier function centers).
            Length of this vector equals number of bands given in ``evecs``
            input array. Hybrid Wannier function centers are ordered in ascending order.
            Note that in general `n`-th hwfc does not correspond to `n`-th
            state in ``evecs``.
        hwf : np.ndarray
            Eigenvectors of the position operator matrix :math:`X`.
            (also called hybrid Wannier functions).  These are returned only if
            parameter ``hwf_evec = True``.

            The shape of this array is ``[h,x]`` or ``[h,x,s]`` depending on value of
            ``basis`` and ``spinful``.

            - If ``basis`` is "bloch" then ``x`` refers to indices of
              Bloch states.
            - If ``basis`` is "orbital" then ``x`` (or ``x`` and ``s``)
              correspond to orbital index (or orbital and spin index if ``spinful=True``).

        See Also
        --------
        :ref:`haldane-hwf-nb` : For an example.
        position_matrix : For the definition of the matrix :math:`X`.
        position_expectation : For the position expectation value.

        Notes
        -----
        Note that these eigenvectors are not maximally localized
        Wannier functions in the usual sense because they are
        localized only along one direction. They are also not the
        average positions of the Bloch states ``evecs``, which are
        instead computed by :func:`position_expectation`.

        See Fig. 3 in [1]_ for a discussion of the hybrid Wannier function centers in the
        context of a Chern insulator.

        References
        ----------
        .. [1] \ S. Coh, D. Vanderbilt, *Phys. Rev. Lett.* **102**, 107603 (2009).

        Examples
        --------
        Diagonalizes Hamiltonian at some k-points

        >>> evals, evecs = my_model.solve_ham(k_vec, return_eigvecs=True)

        Computes hybrid Wannier centers (and functions) for 3-rd kpoint
        and bottom five bands along first coordinate

        >>> hwfc, hwf = my_model.position_hwf(evecs[2, :5], 0, hwf_evec=True, basis="orbital")
        """
        # check if model came from w90
        if not self.assume_position_operator_diagonal:
            _offdiag_approximation_warning_and_stop()

        # get position matrix
        pos_mat = self.position_matrix(evecs=evecs, pos_dir=pos_dir)

        # diagonalize
        if not hwf_evec:
            hwfc = np.linalg.eigvalsh(pos_mat)
            return hwfc
        else:  # find eigenvalues and eigenvectors
            (hwfc, hwf) = np.linalg.eigh(pos_mat)
            # transpose matrix eig since otherwise it is confusing
            # now eig[i,:] is eigenvector for eval[i]-th eigenvalue
            hwf = hwf.T
            # convert to right basis
            if basis.lower().strip() in ["wavefunction", "bloch"]:
                return (hwfc, hwf)
            elif basis.lower().strip() == "orbital":
                if not self.spinful:
                    ret_hwf = np.zeros((hwf.shape[0], self.norb), dtype=complex)
                    # sum over bloch states to get hwf in orbital basis
                    for i in range(ret_hwf.shape[0]):
                        ret_hwf[i] = np.dot(hwf[i], evecs)
                    hwf = ret_hwf
                else:
                    ret_hwf = np.zeros((hwf.shape[0], self.norb * 2), dtype=complex)
                    # get rid of spin indices
                    evec_use = evecs.reshape([hwf.shape[0], self.norb * 2])
                    # sum over states
                    for i in range(ret_hwf.shape[0]):
                        ret_hwf[i] = np.dot(hwf[i], evec_use)
                    # restore spin indices
                    hwf = ret_hwf.reshape([hwf.shape[0], self.norb, 2])
                return (hwfc, hwf)
            else:
                raise ValueError(
                    "Basis must be either 'wavefunction', 'bloch', or 'orbital'"
                )


    ##### Plotting functions #####
    # These plotting functions are wrappers to the functions in plotting.py


[docs]
    @copydoc(plot_tbmodel)
    def visualize(
        self,
        proj_plane=None,
        eig_dr=None,
        draw_hoppings=True,
        annotate_onsite=False,
        ph_color="black",
    ):
        return plot_tbmodel(
            self, proj_plane, eig_dr, draw_hoppings, annotate_onsite, ph_color
        )



[docs]
    @copydoc(plot_tbmodel_3d)
    def visualize_3d(
        self,
        draw_hoppings=True,
        show_model_info=True,
        site_colors=None,
        site_names=None,
        show=True,
    ):
        return plot_tbmodel_3d(
            self,
            draw_hoppings=draw_hoppings,
            show_model_info=show_model_info,
            site_colors=site_colors,
            site_names=site_names,
            show=show,
        )



[docs]
    @copydoc(plot_bands)
    def plot_bands(
        self,
        k_nodes,
        k_node_labels=None,
        nk=101,
        fig=None,
        ax=None,
        proj_orb_idx=None,
        proj_spin=False,
        bands_label=None,
        scat_size=3,
        lw=2,
        lc="b",
        ls="solid",
        cmap="plasma",
        cbar=True,
    ):
        return plot_bands(
            self,
            k_nodes,
            nk=nk,
            ktick_labels=k_node_labels,
            bands_label=bands_label,
            proj_orb_idx=proj_orb_idx,
            proj_spin=proj_spin,
            fig=fig,
            ax=ax,
            scat_size=scat_size,
            lw=lw,
            lc=lc,
            ls=ls,
            cmap=cmap,
            cbar=cbar,
        )




# Backward-compatibility for legacy tb_model constructor
class tb_model(TBModel):
    """Deprecated alias for backward-compatibility with PythTB <= 1.8.

    This class preserves the old constructor signature:
        ``tb_model(dim_k, dim_r, lat=None, orb=None, per=None, nspin=1)``

    Use ``TBModel(lattice, spinful)`` going forward.
    """

    def __init__(self, dim_k, dim_r, lat=None, orb=None, per=None, nspin=1):
        warnings.warn(
            "pythtb.tb_model is deprecated and will be removed in a future release. "
            "Use TBModel instead.",
            DeprecationWarning,
            stacklevel=2,
        )
        # Build a Lattice from v1-style arguments
        if not isinstance(dim_k, int):
            raise TypeError("dim_k must be an int in tb_model-compatible constructor")
        if not isinstance(dim_r, int):
            raise TypeError("dim_r must be an int in tb_model-compatible constructor")
        if dim_k < 0 or dim_k > 4:
            raise ValueError("dim_k must be between 0 and 4")
        if dim_r < dim_k or dim_r > 4:
            raise ValueError("dim_r must satisfy dim_r >= dim_k and <= 4")

        # Lattice vectors
        if (isinstance(lat, str) and lat == "unit") or lat is None:
            lat_vecs = np.identity(dim_r, float)
        else:
            lat_vecs = np.array(lat, dtype=float)
            if lat_vecs.shape != (dim_r, dim_r):
                raise ValueError("lat must have shape (dim_r, dim_r)")
            det = np.linalg.det(lat_vecs)
            if abs(det) < 1.0e-12:
                raise ValueError("lattice vectors have near-zero volume")

        # Orbital positions (reduced coordinates)
        if (isinstance(orb, str) and orb == "bravais") or orb is None:
            orb_vecs = np.zeros((1, dim_r), dtype=float)
        elif isinstance(orb, (int, np.integer)):
            orb_vecs = np.zeros((int(orb), dim_r), dtype=float)
        else:
            orb_vecs = np.array(orb, dtype=float)
            if orb_vecs.ndim != 2 or orb_vecs.shape[1] != dim_r:
                raise ValueError("orb must be (norb, dim_r) in reduced coords")

        # Periodic directions
        if per is None:
            periodic_dirs = list(range(dim_k))
        else:
            periodic_dirs = list(per)
            if len(periodic_dirs) != dim_k:
                raise ValueError("len(per) must equal dim_k")

        # Construct new-style Lattice and delegate to TBModel
        lat_obj = Lattice(lat_vecs, orb_vecs, periodic_dirs=periodic_dirs)
        spinful = nspin == 2
        super().__init__(lattice=lat_obj, spinful=spinful)