Source code for kliff.uq.mcmc_utils

from typing import Optional, Tuple, Union

import numpy as np

from kliff.error import report_import_error

try:
    import emcee

    emcee_avail = True
except ImportError:
    emcee_avail = False


# Estimate the burn-in time

[docs]
def mser(
    chain: np.ndarray,
    dmin: Optional[int] = 1,
    dstep: Optional[int] = 10,
    dmax: Optional[int] = -1,
    full_output: Optional[bool] = False,
) -> Union[int, dict]:
    """Estimate the equilibration time using marginal standard error rule (MSER).

    This is done by calculating the standard error (square) of ``chain_d``, where
    ``chain_d`` contains the last :math:`n-d` element of the chain (n is the total number
    of iterations for each chain), for progresively larger d values, starting from
    ``dmin`` upto ``dmax``, incremented by ``dstep``. The SE values are stored in a list.
    Then we search the minimum element in the list and return the index of that element.

    Args:
        chain: (nsteps,) Array containing the time series.
        dmin: Index where to start the search in the time series.
        dstep: How much to increment the search is done.
        dmax: Index where to stop the search in the time series.
        full_output: A flag to return the list of squared standard error.

    Returns:
        Estimate of the equilibration time using MSER. If ``full_output=True``, then a
        dictionary containing the estimated equilibration time and the list of squared
        standard errors will be returned.
    """
    length = len(chain)  # Chain length

    # Compute the SE square
    SE2_list = [
        _standard_error_squared(chain[dd:]) for dd in range(length)[dmin:dmax:dstep]
    ]

    # Get the estimate of the equilibration time, wrt the original time series
    dest = np.argmin(SE2_list)
    dstar = min([dmin + (dest + 1) * dstep, length])

    if full_output:
        return {"dstar": dstar, "SE2": SE2_list}
    else:
        return dstar



# Estimate autocorrelation length

[docs]
def autocorr(chain: np.ndarray, *args, **kwargs) -> np.ndarray:
    """Use ``emcee`` package to estimate the autocorrelation length.

    Args:
        chain: (nwalkers, nsteps, ndim,) Chains from the MCMC simulation. Note that the
            burn-in time needs to be discarded prior to this calculation
        args, kwargs: Additional positional and keyword arguments of ``emcee.autocorr.integrated_time``.

    Returns:
        Estimate of the autocorrelation length for each parameter.
    """
    if emcee_avail:
        chain = np.swapaxes(chain, 0, 1)
        return emcee.autocorr.integrated_time(chain, *args, **kwargs)
    else:
        report_import_error("emcee")



# Assess convergence

[docs]
def rhat(
    chain: np.ndarray, time_axis: Optional[int] = 1, return_WB: Optional[bool] = False
) -> Union[float, Tuple[float, np.ndarray, np.ndarray]]:
    """Compute the value of :math:`\\hat{r}` proposed by Brooks and Gelman [BrooksGelman1998]_.

    If the samples come from PTMCMC simulation, then the chain needs to be from one of
    the temperature only.

    Args:
        chain: The MCMC chain as a ndarray, preferrably with the shape
            (nwalkers, nsteps, ndim,). However, the shape can also be
            (nsteps, nwalkers, ndim,), but the argument time_axis needs to be set to 0.
        time_axis: Axis in which the time series is stored (0 or 1). For emcee results,
            the time series is stored in axis 0, but for ptemcee for a given temperature,
            the time axis is 1.
        return_WB: A flag to return covariance matrices within and between chains.

    Returns:
        The value of rhat. if ``return_WB=True``, also returns matrices of
        covariance within and between the chains.

    References:
        .. [BrooksGelman1998]
           Brooks, S.P., Gelman, A., 1998. General Methods for Monitoring Convergence of
           Iterative Simulations. Journal of Computational and Graphical Statistics 7,
           434455. https://doi.org/10.1080/10618600.1998.10474787
    """
    if time_axis == 1:
        # Reshape the chain so that the time axis is in axis 1
        temp = np.swapaxes(chain, 0, 1)
        chain = temp

    m, n, _ = chain.shape
    lambda1, W, B = _lambda1(chain)
    r = 1 - 1 / n + (1 + 1 / m) * lambda1

    if return_WB:
        toreturn = (r, W, B)
    else:
        toreturn = r

    return toreturn



def _standard_error_squared(chain: np.ndarray) -> float:
    """Compute the square of the standard error."""
    nn = len(chain)
    se2 = np.var(chain) / nn
    return se2


def _lambda1(chain):
    """Compute the largest eigenvalue of :math:`W^{-1} B/n`."""
    W = _W(chain)
    B_over_n = _B_over_n(chain)
    V = np.linalg.lstsq(W, B_over_n, rcond=-1)[0]
    s = np.linalg.svd(V, compute_uv=False)
    return np.max(s), W, B_over_n


def _B_over_n(chain):
    """Compute covariance matrix between the chains."""
    return np.cov(np.mean(chain, axis=1), rowvar=False, ddof=1)


def _W(chain):
    """Compute the mean of the covariance matrix within each chain."""
    m, n, nparams = chain.shape
    Wm = np.empty((m, nparams, nparams))
    for walker in range(m):
        Wm[walker] = np.cov((chain[walker]), rowvar=False, ddof=1)
    return np.mean(Wm, axis=0)