Source code for spectral_connectivity.statistics

"""Common statistical procedures used with frequency domain measures."""

import numpy as np
from scipy.stats import chi2, norm

np.seterr(invalid="ignore")



[docs]
def Benjamini_Hochberg_procedure(p_values, alpha=0.05):
    """Corrects for multiple comparisons and returns the significant
    p-values by controlling the false discovery rate at level `alpha`
    using the Benjamani-Hochberg procedure.

    Parameters
    ----------
    p_values : array_like
    alpha : float, optional
        The expected proportion of false positive tests.
    Returns
    -------
    is_significant : boolean nd-array
        A boolean array the same shape as `p_values` indicating whether the
        null hypothesis has been rejected (True) or failed to reject
        (False).
    """
    p_values = np.array(p_values)
    threshold_line = np.linspace(0, alpha, num=p_values.size + 1, endpoint=True)[1:]
    sorted_p_values = np.sort(p_values.flatten())
    try:
        threshold_ind = np.max(np.where(sorted_p_values <= threshold_line)[0])
        threshold = sorted_p_values[threshold_ind]
    except ValueError:  # There are no values below threshold
        threshold = -1
    return p_values <= threshold




[docs]
def Bonferroni_correction(p_values: np.ndarray, alpha: float = 0.05):
    """Corrects for multiple comparisons and returns the significant
    p-values by controlling the false discovery rate at level `alpha`
    using the Bonferroni procedure.

    Parameters
    ----------
    p_values : np.ndarray, shape (n_p_values,)
    alpha : float, optional
        critical threshold, by default 0.05

    Returns
    -------
    is_significant : np.ndarray, shape (n_p_values,)

    """
    p_values = np.asarray(p_values)
    return p_values <= alpha / p_values.size



MULTIPLE_COMPARISONS = dict(
    Benjamini_Hochberg_procedure=Benjamini_Hochberg_procedure,
    Bonferroni_correction=Bonferroni_correction,
)



[docs]
def adjust_for_multiple_comparisons(
    p_values, alpha=0.05, method="Benjamini_Hochberg_procedure"
):
    """Corrects for multiple comparisons and returns the significant
    p-values.

    Parameters
    ----------
    p_values : array_like
    alpha : float, optional
        The expected proportion of false positive tests.
    method : string, optional
        Name of the method to use to correct for multiple comparisons.
        Options are "Benjamini_Hochberg_procedure", "Bonferroni_correction"
    Returns
    -------
    is_significant : boolean nd-array
        A boolean array the same shape as `p_values` indicating whether the
        null hypothesis has been rejected (True) or failed to reject
        (False).

    """
    # TODO: add axis keyword?
    return MULTIPLE_COMPARISONS[method](p_values, alpha=alpha)




[docs]
def fisher_z_transform(coherency1, bias1, coherency2=0, bias2=0):
    """Transform the coherence magnitude to an approximately normal
    distribution.

    If two coherencies are provided, then the function returns the
    fisher z transform of the difference of the coherencies with
    `coherency1` - `coherency2`.

    Parameters
    ----------
    coherency1 : complex array
        The complex coherency between signals
    bias1 : float
        The bias from independent estimates of the frequency domain.
    coherency2 : complex array, optional
    bias2 : float, optional
        The bias from independent estimates of the frequency domain.

    Returns
    -------
    fisher_z_transform : real array
        Either the difference from 0 mean or, if another coherency is
        provided, the difference from that coherency.

    """
    coherence_magnitude1 = np.abs(coherency1)
    coherence_magnitude1[coherence_magnitude1 >= 1] = 1 - np.finfo(float).eps

    coherence_magnitude2 = np.array(np.abs(coherency2))
    coherence_magnitude2[coherence_magnitude2 >= 1] = 1 - np.finfo(float).eps

    z1 = np.arctanh(coherence_magnitude1) - bias1
    z2 = np.arctanh(coherence_magnitude2) - bias2
    return (z1 - z2) / np.sqrt(bias1 + bias2)




[docs]
def get_normal_distribution_p_values(data, mean=0, std_deviation=1):
    """Given data, returns the probability the data was generated from
    a normal distribution with `mean` and `std_deviation`
    """
    try:
        return 1 - norm.cdf(data, loc=mean, scale=std_deviation)
    except TypeError:
        return 1 - norm.cdf(data.get(), loc=mean, scale=std_deviation)




[docs]
def coherence_bias(n_observations):
    """Estimates of coherence are biased by sample size [1,2]. This estimates the degree of bias
    so that estimates can be corrected.

    Parameters
    ----------
    n_observations : int
        Number of observations.

    Returns
    -------
    bias : float

    References
    ---------
    .. [1] Enochson, L.D., and Goodman, N.R. (1965). Gaussian approximations to the distribution
           of sample coherence (Measurement analysis corp Los Angeles CA).
    .. [2] Bokil, H., Purpura, K., Schoffelen, J.-M., Thomson, D., and Mitra, P. (2007). Comparing
           spectra and coherences for groups of unequal size. Journal of Neuroscience Methods 159,
           337–345. 10.1016/j.jneumeth.2006.07.011.


    """
    degrees_of_freedom = 2 * n_observations
    return 1.0 / (degrees_of_freedom - 2)




[docs]
def coherence_rate_adjustment(
    firing_rate_condition1,
    firing_rate_condition2,
    spike_power_spectrum,
    homogeneous_poisson_noise=0,
    dt=1,
):
    """Correction for the spike-field or spike-spike coherence when the
    conditions have different firing rates.

    When comparing the coherence of two conditions, a change in firing rate
    results in a change in coherence without an increase in coupling.
    This adjustment modifies the coherence of one of the conditions, so
    that a difference in coherence between conditions indicates a change
    in coupling, not firing rate. See [1] for details.

    If using to compare spike-spike coherence, not that the coherence
    adjustment must be applied twice, once for each spike train.

    Adjusts `firing_rate_condition1` to `firing_rate_condition2`.

    Parameters
    ----------
    firing_rate_condition1, firing_rate_condition2 : float
        Average firing rates for each condition.
    spike_power_spectrum : ndarray, shape (n_frequencies,)
        Power spectrum of the spike train in condition 1.
    homogeneous_poisson_noise : float, optional
        Beta in [1].
    dt : float, optional
        Size of time step.

    Returns
    -------
    rate_adjustment_factor : ndarray, shape (n_frequencies,)

    References
    ----------
    .. [1] Aoi, M.C., Lepage, K.Q., Kramer, M.A., and Eden, U.T. (2015).
           Rate-adjusted spike-LFP coherence comparisons from spike-train
           statistics. Journal of Neuroscience Methods 240, 141-153.

    """
    # alpha in [1]
    firing_rate_ratio = firing_rate_condition2 / firing_rate_condition1
    adjusted_firing_rate = (
        (1 / firing_rate_ratio - 1) * firing_rate_condition1
        + homogeneous_poisson_noise / firing_rate_ratio**2
    ) * dt**2
    return 1 / np.sqrt(1 + (adjusted_firing_rate / spike_power_spectrum))




[docs]
def power_confidence_intervals(n_tapers, power=1, ci=0.95):
    """Confidence intervals for the power spectrum.

    Parameters
    ----------
    n_tapers : int
        Number of tapers
    power : np.ndarray, optional
        Multitaper spectrum
    ci : float
        Confidence level. Range [0.5, 1]

    Returns
    -------
    lower_bound, upper_bound : float


    References
    ----------
    .. [1] Kramer, M.A., and Eden, U.T. (2016). Case studies in neural
           data analysis: a guide for the practicing neuroscientist (MIT Press).

    """
    upper_bound = 2 * n_tapers / chi2.ppf(1 - ci, 2 * n_tapers) * power
    lower_bound = 2 * n_tapers / chi2.ppf(ci, 2 * n_tapers) * power

    return lower_bound, upper_bound