Source code for halomod.tools

"""
Modules defining a series of utility functions to perform hankel transformation
and Fourier transformation from correlation function to power spectrum.
"""

from __future__ import annotations

import logging
import time
import warnings
from functools import lru_cache

import numpy as np
import scipy.integrate as intg
from scipy.interpolate import InterpolatedUnivariateSpline as spline
from scipy.interpolate import UnivariateSpline as uspline
from scipy.stats import poisson

from .hod import HOD
from .profiles import Profile

try:
    from pathos import multiprocessing as mp

    HAVE_POOL = True
except ImportError:
    HAVE_POOL = False

logger = logging.getLogger(__name__)


@lru_cache(maxsize=25)
def _get_sumspace(h: float, nmin: int, nmax: int):
    r"""Function used in hankel transformation to get the parts of the integral sum."""
    roots = np.arange(nmin, nmax)
    t = h * roots
    s = np.pi * np.sinh(t)
    x = np.pi * roots * np.tanh(s / 2)

    dpsi = 1 + np.cosh(s)
    dpsi[dpsi != 0] = (np.pi * t * np.cosh(t) + np.sinh(s)) / dpsi[dpsi != 0]
    sumparts = np.pi * np.sin(x) * dpsi * x

    return x, sumparts



[docs]
def hankel_transform(
    f: [callable, list[callable]],
    trns_var: np.ndarray,
    trns_var_name: str,
    h=0.005,
    chunksize=100,
    atol=1e-8,
    rtol=1e-8,
):
    r"""Function to do the hankel tranformation."""
    if trns_var_name not in "kr":
        raise ValueError("trns_var_name must be either 'k' or 'r'.")

    # Optimal value of nmax, given h.
    nmax = int(3.2 / h)

    out = np.zeros(len(trns_var))

    for ir, rr in enumerate(trns_var):
        nn = 1
        prev_res = 100
        res = 0
        p = f[ir] if hasattr(f, "__len__") else f
        while not np.isclose(prev_res, res, atol=atol, rtol=rtol) and nn < nmax:
            prev_res = res

            x, sumparts = _get_sumspace(h, nn, nn + chunksize)

            kk = x / rr
            pk = p(kk)

            pk[np.isnan(pk)] = 0

            res = prev_res + np.sum(sumparts * pk)
            nn += chunksize

        out[ir] = res

    if trns_var_name == "r":
        return out / (2 * np.pi**2 * trns_var**3)
    else:
        return out * 4 * np.pi / trns_var**3




[docs]
def power_to_corr_ogata(
    power: np.ndarray,
    k: np.ndarray,
    r: np.ndarray,
    h=0.005,
    power_pos=(True, True),
    rtol=1e-3,
    atol=1e-15,
    _reverse=False,
):
    """
    Convert a 3D power spectrum to a correlation function.

    Uses Ogata's method (Ogata 2005) for Hankel Transforms in 3D.

    Parameters
    ----------
    power : np.ndarray
        The power spectrum to convert -- either 1D or 2D. If 1D, it is the power as a
        function of k. If 2D, the first dimension should be ``len(r)``, and the power
        to integrate is considered to be different for each ``r``.
    k : np.ndarray
        Array of same length as the last axis of ``power``, giving the fourier-space
        co-ordinates.
    r : np.ndarray
        The real-space co-ordinates to which to transform.
    h : int, optional
        Controls the spacing of the intervals (note the intervals are not equispaced).
        Smaller numbers give smaller intervals.
    power_pos : tuple of bool, optional
        Whether 'power' is definitely positive, at either end. If so, a slightly better
        extrapolation can be achieved.

    Notes
    -----
    See the `hankel <https://hankel.readthedocs.io>`_ documentation for details on the
    implementation here. This particular function is restricted to a spherical transform.
    """
    v = "kr"
    if _reverse:
        v = v[::-1]

    func = "corr" if _reverse else "power"

    # Optimal value of nmax, given h.
    nmax = int(3.2 / h)

    lnk = np.log(k)
    roots = np.arange(1, nmax + 1)
    t = h * roots
    s = np.pi * np.sinh(t)
    x = np.pi * roots * np.tanh(s / 2)

    dpsi = 1 + np.cosh(s)
    dpsi[dpsi != 0] = (np.pi * t * np.cosh(t) + np.sinh(s)) / dpsi[dpsi != 0]
    sumparts = np.pi * np.sin(x) * dpsi * x

    if power_pos[0] and not np.all(power.T[:2] > 0):
        power_pos = (False, power_pos[1])

    if power_pos[1] and not np.all(power.T[-2:] > 0):
        power_pos = (power_pos[0], False)

    def pfunc(logk, p):
        """An interpolation function for masked p(k)."""
        spl = spline(lnk, p, k=3)
        result = np.zeros_like(logk)
        inner_mask = (lnk.min() <= logk) & (logk <= lnk.max())
        result[inner_mask] = spl(logk[inner_mask])

        lower_mask = logk < lnk.min()
        if power_pos[0]:
            result[lower_mask] = np.exp(
                (np.log(p[1]) - np.log(p[0])) * (logk[lower_mask] - lnk[0]) / (lnk[1] - lnk[0])
                + np.log(p[0])
            )
        else:
            result[lower_mask] = (p[1] - p[0]) * (logk[lower_mask] - lnk[0]) / (
                lnk[1] - lnk[0]
            ) + p[0]

        upper_mask = logk > lnk.max()
        if power_pos[1]:
            if p[-1] <= 0 or p[-2] <= 0:
                raise ValueError("Something went horribly wrong")
            result[upper_mask] = np.exp(
                (np.log(p[-1]) - np.log(p[-2])) * (logk[upper_mask] - lnk[-1]) / (lnk[-1] - lnk[-2])
                + np.log(p[-1])
            )
        else:
            result[upper_mask] = (p[-1] - p[-2]) * (logk[upper_mask] - lnk[-1]) / (
                lnk[-1] - lnk[-2]
            ) + p[-1]

        return result

    out = np.zeros(len(r))

    warn_upper = True
    warn_lower = True
    warn_conv = True
    for ir, rr in enumerate(r):
        kk = x / rr

        summand = sumparts * pfunc(np.log(kk), power[ir] if power.ndim == 2 else power)
        cumsum = np.cumsum(summand)

        if kk.min() < k.min() and warn_lower:
            warnings.warn(
                f"In hankel transform, {func} at {v[1]}={rr:.2e} was extrapolated to "
                f"{v[0]}={kk.min():.2e}. Minimum provided was {k.min():.2e}. "
                f"Lowest value required is {x.min() / r.max():.2e}",
                stacklevel=2,
            )
            warn_lower = False

        # If all k values accessed weren't interpolated, just return it.
        if kk.max() <= k.max():
            out[ir] = cumsum[-1]
        else:
            # Check whether we have convergence at k.max
            indx = np.where(kk > k.max())[0][0]

            if np.isclose(cumsum[indx], cumsum[indx - 1], atol=atol, rtol=rtol):
                # If it converged in the non-extrapolated part, return that.
                out[ir] = cumsum[indx]
            else:
                # Otherwise, warn the user, and just return the full sum.
                if warn_upper:
                    warnings.warn(
                        f"In hankel transform, {func} at {v[1]}={rr:.2e} was extrapolated to "
                        f"{v[0]}={kk.max():.2e}. Maximum provided was {k.max():.2e}. ",
                        stacklevel=2,
                    )
                    warn_upper = False

                if not np.isclose(cumsum[-1], cumsum[-2], atol=atol, rtol=rtol) and warn_conv:
                    warnings.warn(
                        f"Hankel transform of {func} did not converge for {v[1]}={rr:.2e}. "
                        f"It is likely that higher {v[1]} will also not converge. "
                        f"Absolute error estimate = {cumsum[-1] - cumsum[-2]:.2e}. "
                        f"Relative error estimate = {cumsum[-1] / cumsum[-2] - 1:.2e}",
                        stacklevel=2,
                    )
                    warn_conv = False

                out[ir] = cumsum[-1]

    return out / (2 * np.pi**2 * r**3)




[docs]
def corr_to_power_ogata(corr, r, k, h=0.005, power_pos=(True, False), atol=1e-15, rtol=1e-3):
    """
    Convert an isotropic 3D correlation function to a power spectrum.

    Uses Ogata's method (Ogata 2005) for Hankel Transforms in 3D.

    Parameters
    ----------
    corr : np.ndarray
        The correlation function to convert as a function of ``r``.
    r : np.ndarray
        Array of same length as ``corr``, giving the real-space co-ordinates.
    k : np.ndarray
        The fourier-space co-ordinates to which to transform.
    n : int, optional
        The number of subdivisions in the integral.
    h : int, optional
        Controls the spacing of the intervals (note the intervals are not equispaced).
        Smaller numbers give smaller intervals.

    Notes
    -----
    See the `hankel <https://hankel.readthedocs.io>`_ documentation for details on the
    implementation here. This particular function is restricted to a spherical transform.
    """
    return (
        8
        * np.pi**3
        * power_to_corr_ogata(
            corr, r, k, h, power_pos=power_pos, atol=atol, rtol=rtol, _reverse=True
        )
    )




[docs]
def power_to_corr(power_func: callable, r: np.ndarray) -> np.ndarray:
    """
    Calculate the isotropic 3D correlation function given an isotropic power spectrum.

    Parameters
    ----------
    power_func : callable
        A callable function which returns the natural log of power given lnk
    r : array_like
        The values of separation/scale to calculate the correlation at.

    Notes
    -----
    This uses standard Simpson's Rule integration, but in which the number of subdivisions
    is chosen with some care to ensure that zeros of the Bessel function are captured.

    See Also
    --------
    power_to_corr_ogata :
        A faster, smarter algorithm for doing the same thing.
    """
    if not np.iterable(r):
        r = [r]

    corr = np.zeros_like(r)

    # the number of steps to fit into a half-period at high-k. 6 is better than 1e-4.
    minsteps = 8

    # set min_k, 1e-6 should be good enough
    mink = 1e-6

    temp_min_k = 1.0

    for i, rr in enumerate(r):
        # getting maxk here is the important part. It must be a half multiple of
        # pi/r to be at a "zero", it must be >1 AND it must have a number of half
        # cycles > 38 (for 1E-5 precision).

        min_k = (2 * np.ceil((temp_min_k * rr / np.pi - 1) / 2) + 0.5) * np.pi / rr
        maxk = max(501.5 * np.pi / rr, min_k)

        # Now we calculate the requisite number of steps to have a good dk at hi-k.
        nk = np.ceil(np.log(maxk / mink) / np.log(maxk / (maxk - np.pi / (minsteps * rr))))

        lnk, dlnk = np.linspace(np.log(mink), np.log(maxk), int(nk), retstep=True)
        P = power_func(lnk)
        integ = P * np.exp(lnk) ** 2 * np.sin(np.exp(lnk) * rr) / rr

        corr[i] = (0.5 / np.pi**2) * intg.simpson(integ, dx=dlnk)

    return corr




[docs]
def exclusion_window(k: np.ndarray, r: float) -> np.ndarray:
    """Fourier-space top-hat window function.

    Parameters
    ----------
    k : np.ndarray
        The fourier-space wavenumbers
    r : float
        The size of the top-hat window.

    Returns
    -------
    W : np.ndarray
        The top-hat window function in fourier space.
    """
    x = k * r
    return 3 * (np.sin(x) - x * np.cos(x)) / x**3




[docs]
def populate(
    centres: np.ndarray,
    masses: np.ndarray,
    halomodel=None,
    profile: Profile | None = None,
    hodmod: HOD | None = None,
    edges: np.ndarray | None = None,
    rng=None,
):
    """
    Populate a series of DM halos with a tracer, given a HOD model.

    Parameters
    ----------
    centres : (N,3)-array
        The cartesian co-ordinates of the centres of the halos
    masses : array_like
        The masses (in M_sun/h) of the halos
    halomodel : type :class:`halomod.HaloModel`
        A HaloModel object. One can either use this, or *both* `halo_profile` and
        `hodmod` arguments.
    profile : type :class:`halo_profile.Profile`, optional
        A density halo_profile to use. Only required if ``halomodel`` not given.
    hodmod : object of type :class:`hod.HOD`, optional
        A HOD model to use to populate the dark matter. Only required if ``halomodel``
        not given.
    edges : float, len(2) iterable, or (2,3)-array
        Periodic box edges. If float, defines the upper limit of cube, with lower limit at zero.
        If len(2) iterable, defines edges of cube.
        If (2,3)-array, specifies edges of arbitrary rectangular prism.

    Returns
    -------
    pos : array
        (N,3)-array of positions of galaxies.
    halo : array
        (N)-array of associated haloes (by index)
    H : int
        Number of central galaxies. The first H galaxies in pos/halo correspond to centrals.
    """
    if halomodel is not None:
        profile = halomodel.halo_profile
        hodmod = halomodel.hod

    masses = np.array(masses)

    if rng is None:
        rng = np.random.default_rng()

    # Define which halos have central galaxies.
    cgal = rng.binomial(1, hodmod.central_occupation(masses))
    cmask = cgal > 0
    central_halos = np.arange(len(masses))[cmask]

    if hodmod._central:
        masses = masses[cmask]
        centres = centres[cmask]

    # Calculate the number of satellite galaxies in halos
    # Using ns gives the correct answer for both central condition and not.
    # Note that other parts of the algorithm also need to be changed if central condition
    # is not true.
    sgal = poisson.rvs(hodmod.ns(masses), random_state=rng)

    # Get an array ready, hopefully speeds things up a bit
    ncen = np.sum(cgal)
    nsat = np.sum(sgal)

    pos = np.empty((ncen + nsat, 3))
    halo = np.empty(ncen + nsat)

    # Assign central galaxy positions
    halo[:ncen] = central_halos
    if hodmod._central:
        pos[:ncen, :] = centres
    else:
        pos[:ncen, :] = centres[cmask]

    smask = sgal > 0
    # if hodmod._central:
    #     sat_halos = central_halos[np.arange(len(masses[cmask]))[smask]]
    # else:
    if hodmod._central:
        sat_halos = central_halos[np.arange(len(masses))[smask]]
    else:
        sat_halos = np.arange(len(masses))[smask]

    sgal = sgal[smask]
    centres = centres[smask]
    masses = masses[smask]

    # Now go through each halo and calculate galaxy positions
    start = time.time()
    halo[ncen:] = np.repeat(sat_halos, sgal)
    indx = np.concatenate(([0], np.cumsum(sgal))) + ncen

    def fill_array(i):
        r"""Function to populate the field with ith tracer."""
        m, n, ctr = masses[i], sgal[i], centres[i]
        pos[indx[i] : indx[i + 1], :] = profile.populate(n, m, centre=ctr, rng=rng)

    if HAVE_POOL:
        mp.ProcessingPool(mp.cpu_count()).map(fill_array, list(range(len(masses))))
    else:
        for i in range(len(masses)):
            fill_array(i)

    nhalos_with_gal = len(set(central_halos.tolist() + sat_halos.tolist()))

    logger.info(
        f"Took {time.time() - start} seconds, or "
        f"{(time.time() - start) / nhalos_with_gal} each halo."
    )
    logger.info(
        f"NhalosWithGal: {nhalos_with_gal}, Ncentrals: {ncen}, NumGal: {len(halo)}, "
        f"MeanGal: {float(len(halo)) / nhalos_with_gal}, "
        f"MostGal: {sgal.max() + 1 if len(sgal) > 0 else 1}"
    )

    if edges is not None:
        if np.isscalar(edges):
            edges = np.array([[0, 0, 0], [edges, edges, edges]])
        elif np.array(edges).shape == (2,):
            edges = np.array([[edges[0]] * 3, [edges[1]] * 3])

        for j in range(3):
            d = pos[:, j] - edges[0][j]
            pos[d < 0, j] = edges[1][j] + d[d < 0]
            d = pos[:, j] - edges[1][j]
            pos[d > 0, j] = edges[0][j] + d[d > 0]

    return pos, halo.astype("int"), ncen




[docs]
class ExtendedSpline:
    """Generate a function from data x,y with arbitrary behaviour below and above limit."""

    def __init__(
        self,
        x: np.ndarray,
        y: np.ndarray,
        lower_func: callable | None | str = None,
        upper_func: callable | None | str = None,
        match_lower: bool = True,
        match_upper: bool = True,
        domain=(-np.inf, np.inf),
        k: int = 3,
        lower_power_law_n=10,
        upper_power_law_n=10,
    ):
        if x.min() < domain[0] or x.max() > domain[1]:
            raise ValueError("x is outside domain")

        self.xmin = x.min()
        self.xmax = x.max()

        self._spl = spline(x, y, k=k, ext="extrapolate")

        self.lfunc = self._get_extension_func(
            lower_func,
            x[:lower_power_law_n],
            y[:lower_power_law_n],
            match_lower,
            self.xmin,
        )
        self.ufunc = self._get_extension_func(
            upper_func,
            x[-upper_power_law_n:],
            y[-upper_power_law_n:],
            match_upper,
            self.xmax,
        )

    def _get_extension_func(self, fnc, x, y, match, match_x):
        """Function to generate the extended spline."""
        if callable(fnc):
            if not match:
                return fnc
            ff = fnc(match_x)
            if ff == 0:
                return fnc
            norm = self._spl(match_x) / ff
            return _NormedCallable(fnc, norm)
        elif fnc == "power_law":
            assert np.all(x > 0), "to use a power-law, x must be >= 0"
            if not np.all(y > 0) or np.all(y < 0):
                warnings.warn(
                    "to use a power-law, y must be all positive or negative. "
                    "Switching to zero extrapolation.",
                    stacklevel=2,
                )
                return _zero
            neg = y[0] < 0

            spl = uspline(np.log(x), np.log(y * (-1 if neg else 1)), k=1)

            return _PowerLawExtension(spl, neg)
        elif fnc == "boundary":
            return _BoundaryExtension(self._spl, match_x)
        elif fnc is None:
            return self._spl
        else:
            raise ValueError("Invalid choice for lower or upper func")

    def __call__(self, x):
        """Function to call the output."""
        if np.isscalar(x):
            if x < self.xmin:
                return self.lfunc(x)
            elif x > self.xmax:
                return self.ufunc(x)
            else:
                return self._spl(x)
        else:
            x = np.array(x)
            out = np.zeros_like(x)
            lmask = x < self.xmin
            umask = x > self.xmax
            mmask = ~(lmask | umask)

            xlo = x[lmask]
            xhi = x[umask]
            xmid = x[mmask]

            # print(out.shape, x.shape, lmask, xlo, self.lfunc, self.ufunc)
            out[lmask] = self.lfunc(xlo)
            out[umask] = self.ufunc(xhi)
            out[mmask] = self._spl(xmid)

            return out



def _zero(x):
    """Simple function that returns zeros."""
    if np.isscalar(x):
        return 0
    else:
        return np.zeros_like(x)


class _NormedCallable:
    """Callable that scales another callable by a fixed normalization factor."""

    def __init__(self, fnc: callable, norm: float):
        self.fnc = fnc
        self.norm = norm

    def __call__(self, xx: np.ndarray) -> np.ndarray:
        return self.fnc(xx) * self.norm


class _PowerLawExtension:
    """Callable for power-law extrapolation based on a log-log spline."""

    def __init__(self, spl: callable, neg: bool):
        self.spl = spl
        self.neg = neg

    def __call__(self, xx: np.ndarray) -> np.ndarray:
        return np.exp(self.spl(np.log(xx))) * (-1 if self.neg else 1)


class _BoundaryExtension:
    """Callable that returns a constant value equal to a spline at a boundary point."""

    def __init__(self, spl: callable, match_x: float):
        self.spl = spl
        self.match_x = match_x

    def __call__(self, xx: np.ndarray) -> np.ndarray:
        return np.ones_like(xx) * self.spl(self.match_x)


class _PowerLawK:
    """Callable that returns k**n, used as a lower-bound extension for power spectra."""

    def __init__(self, n: float):
        self.n = n

    def __call__(self, k: np.ndarray) -> np.ndarray:
        return k**self.n


class _SumCallable:
    """Callable that returns the sum of two callables, with an optional constant offset."""

    def __init__(self, fnc1: callable, fnc2: callable, offset: float = 0):
        self.fnc1 = fnc1
        self.fnc2 = fnc2
        self.offset = offset

    def __call__(self, x: np.ndarray) -> np.ndarray:
        return self.fnc1(x) + self.fnc2(x) + self.offset



[docs]
def spline_integral(
    x: np.ndarray,
    f: np.ndarray,
    xmin: [None, float] = None,
    xmax: [None, float] = None,
    log: bool = True,
) -> float:
    """
    Perform an integral using a spline function over a vector of data.

    The purpose of this function is to do robust integration when the bounds of integration
    don't necessarily fall on a particular x co-ordinate. It falls back to integrating
    over all ``x`` if no explicit ``xmin`` is given.

    Parameters
    ----------
    x
        The co-ordinates of the integral
    f
        The integrand at ``x`` (same shape as ``x``).
    xmin
        The lower bound of the integral.
    xmax
        The upper bound of the integral.
    log
        Whether to interpolate the integrand in log space.

    Returns
    -------
    integral
        The integral from ``xmin`` to ``xmax``.
    """
    if xmin and xmin < x.min():
        warnings.warn(
            f"Extrapolation occurs in integral! xmin={xmin} while x.min() ={x.min()}",
            stacklevel=2,
        )
    if xmax and xmax > x.max():
        warnings.warn(
            f"Extrapolation occurs in integral! xmax={xmax} while x.max() ={x.max()}",
            stacklevel=2,
        )

    if log:
        spl = spline(np.log(x), x * f)
        return spl.integral(
            np.log(xmin) if xmin is not None else np.log(x.min()),
            np.log(xmax) if xmax is not None else np.log(x.max()),
        )
    else:
        spl = spline(x, f)
        return spl.integral(xmin or x.min(), xmax or x.max())




[docs]
def norm_warn(self):
    """Emit a warning when either the HMF or the HMF/bias pair are not normalized."""
    if not self.hmf.normalized:
        warnings.warn(
            f"You are using an un-normalized mass function "
            f"({self.hmf_model.__name__}). Matter correlations are not "
            "well-defined.",
            stacklevel=2,
        )

    if self.hmf_model not in self.bias.pair_hmf:
        warnings.warn(
            f"You are using an un-normalized mass function and bias function pair."
            f"Bias {self.bias_model.__name__} has the following paired HMF model: "
            f"{self.bias_model.pair_hmf}. Matter correlations are not "
            "well-defined.",
            stacklevel=2,
        )