# Source code for aopy.analysis.base

# base.py
#
# Code for neural data analysis; functions here should return interpretable results such as
# firing rates, success rates, direction tuning, etc.

import math
import warnings

import numpy as np
from matplotlib import pyplot as plt
from sklearn.decomposition import PCA, FactorAnalysis
from sklearn.cluster import KMeans
from sklearn import model_selection
from sklearn.discriminant_analysis import LinearDiscriminantAnalysis
from sklearn.linear_model import LinearRegression
from sklearn.metrics import confusion_matrix, accuracy_score
import scipy
from scipy import stats, signal
from scipy import interpolate
from scipy.stats import wilcoxon
from statsmodels.stats.multitest import fdrcorrection
import nitime.algorithms as tsa
import pywt
import multiprocessing as mp
from tqdm.auto import tqdm
from functools import partial

from .. import visualization
from .. import utils
from .. import preproc
from .. import postproc
from .. import precondition
from . import tuning

'''
Correlation / dimensionality analysis
'''
def factor_analysis_dimensionality_score(data_in, dimensions, nfold, maxiter=1000, verbose=False):
    '''
    Fit factor analysis (FA) models with several candidate numbers of latent dimensions
    and score each one, optionally with k-fold cross validation. Comparing the returned
    scores across dimensions gives an estimate of the latent dimensionality of the data.

    Note:
        ``data_in`` is transposed before it is passed to the FA model, and the cross
        validation folds are taken along the second axis of ``data_in``.

    Args:
        data_in (nt, nch): Time series data in
        dimensions (ndim): 1D Array of dimensions to compute FA for
        nfold (int): Number of cross validation folds to compute. Must be >= 1. When nfold
            is 1 each model is fit and scored on the same (complete) data and a warning is issued.
        maxiter (int): Maximum number of FA iterations to compute if there is no convergence. Defaults to 1000.
        verbose (bool): Display % of dimensions completed. Defaults to False

    Returns:
        tuple: Tuple containing:
            | **log_likelihood_score (ndim, nfold):** FA score of each dimension for each fold
            | **iterations_required (ndim, nfold):** Number of FA iterations used by each fit
    '''
    n_models = np.max(np.shape(dimensions))
    log_likelihood_score = np.zeros((n_models, nfold))
    iterations_required = np.zeros((n_models, nfold))

    if verbose == True:
        print('Cross validating and fitting ...')

    for dim_idx, n_components in enumerate(dimensions):
        if nfold == 1:
            # No cross validation: the model is evaluated on the data it was fit to
            model = FactorAnalysis(n_components=n_components, max_iter=maxiter).fit(data_in.T)
            log_likelihood_score[dim_idx, 0] = model.score(data_in.T)
            iterations_required[dim_idx, 0] = model.n_iter_
            warnings.warn("Without cross validation the highest dimensional model will always fit best.")
        else:
            # Fit on the training columns, score on the held-out columns of every fold
            folds = model_selection.KFold(n_splits=nfold).split(data_in.T)
            for fold_idx, (train_cols, test_cols) in enumerate(folds):
                model = FactorAnalysis(n_components=n_components, max_iter=maxiter)
                model = model.fit(data_in[:, train_cols].T)
                log_likelihood_score[dim_idx, fold_idx] = model.score(data_in[:, test_cols].T)
                iterations_required[dim_idx, fold_idx] = model.n_iter_

        if verbose == True:
            print(str((100 * (dim_idx + 1)) // len(dimensions)) + "% Complete")

    return log_likelihood_score, iterations_required

def get_pca_dimensions(data, max_dims=None, VAF=0.9, project_data=False):
    """
    Use PCA to estimate the dimensionality required to account for the variance in the given data. If requested it also projects the data onto those dimensions.

    The number of dimensions is the smallest number of leading principal components whose
    cumulative explained variance ratio is strictly greater than ``VAF``. If the cumulative
    ratio never exceeds ``VAF`` (for example ``VAF=1.0``), all components are used.

    Args:
        data (nt, nch): time series data where each channel is considered a 'feature' (nt=n_samples, nch=n_features)
        max_dims (int): (default None) the maximum number of dimensions to reduce data onto.
        VAF (float): (default 0.9) variance accounted for (VAF)
        project_data (bool): (default False). If the function should project the high dimensional input data onto the calculated number of dimensions

    Returns:
        tuple: Tuple containing:
            | **explained_variance (list, one entry per principal component):** fraction of variance accounted for by each principal component
            | **num_dims (int):** number of principal components required to account for variance (capped at max_dims when given)
            | **projected_data (nt, ndims):** Data projected onto the dimensions required to explain the input variance fraction. If the input 'project_data=False', the function will return 'projected_data=None'
    """
    pca = PCA()
    pca.fit(data)
    explained_variance = pca.explained_variance_ratio_
    total_explained_variance = np.cumsum(explained_variance)

    # Indices of the components at which the cumulative variance exceeds the threshold
    above_threshold = np.where(total_explained_variance > VAF)[0]
    if above_threshold.size > 0:
        num_dims = above_threshold[0] + 1
    else:
        # Threshold is never exceeded: every component is needed
        num_dims = len(total_explained_variance)

    if max_dims is not None:
        num_dims = np.min([max_dims, num_dims])

    projected_data = None
    if project_data:
        projected_data = pca.transform(data)[:, :num_dims]

    return list(explained_variance), num_dims, projected_data


def interpolate_extremum_poly2(extremum_idx, data, extrap_peaks=False):
    '''
    Refine the location of an extremum by fitting a second order (lagrange) polynomial
    through three neighbouring samples and evaluating the vertex of that parabola.

    For an index inside the data the three samples are the index itself and its two
    neighbours. For an index on the first or last sample the three samples closest to
    that edge are used; the vertex of that fit is only reported when 'extrap_peaks' is
    set, otherwise the input index and the data value at that index are returned.
    Note: the extrapolated vertex may fall inside the range of the input data.

    Args:
        extremum_idx (int): Current extremum index
        data (n): data used to interpolate (or extrapolate) with
        extrap_peaks (bool): If the extremum_idx is at the start or end of the data, indicate if the closest 3 points
                                should be used to extrapolate a peak index.

    Returns:
        tuple: A tuple containing
            | **extremum_time (float):** Interpolated (or extrapolated) peak time, in units of samples
            | **extremum_value (float):** Approximated peak value.
            | **f (np.poly):** Polynomial used to calculate peak time
    '''
    # Pick the first sample of the 3-point window used for the fit
    if extremum_idx == 0:
        window_start = extremum_idx
        on_edge = True
    elif extremum_idx == len(data)-1:
        window_start = extremum_idx-2
        on_edge = True
    else:
        window_start = extremum_idx-1
        on_edge = False

    xpts = np.arange(window_start, window_start+3, 1)
    ypts = data[window_start:window_start+3]

    # Vertex of the parabola c2*x^2 + c1*x + c0
    f = interpolate.lagrange(xpts, ypts)
    c2, c1, c0 = f[2], f[1], f[0]
    extremum_time = -c1/(2*c2)
    extremum_value = (c2*(extremum_time**2)) + (c1*extremum_time) + c0

    # Edge samples fall back to the raw sample unless extrapolation was requested
    if extrap_peaks==False and on_edge:
        return extremum_idx, data[extremum_idx], f

    return extremum_time, extremum_value, f

def calc_task_rel_dims(neural_data, kin_data, conc_proj_data=False):
    '''
    Calculates the task relevant dimensions by regressing neural activity against kinematic data using least squares.
    If the input neural data is a list of trials, all trials will be concatenated to calculate the subspace.
    Calculation is based on the approach used in Sun et al. 2022 https://doi.org/10.1038/s41586-021-04329-x

    .. math::

        R \\in \\mathbb{R}^{nt \\times nch}

    .. math::

        M \\in \\mathbb{R}^{nt \\times ndim}

    .. math::

        \\beta \\in \\mathbb{R}^{nch \\times ndim}

    .. math::

        R = M\\beta^T

    .. math::

        [\\beta_0 \\beta_x \\beta_y]^T = (M^T M)^{-1} M^T R

    The neural data are mean-centered (ignoring NaN) before the regression, and a column of
    ones is prepended to the kinematic data to model the intercept. The projection is applied
    to the neural data as passed in (not the centered copy).

    Args:
        neural_data ((nt, nch) or list of (nt, nch)): Input neural data (:math:`R`) to regress against kinematic activity.
        kin_data ((nt, ndim) or list of (nt, ndim)): Kinematic variables (:math:`M`), commonly position or instantaneous velocity. 'ndims' refers to the number of physical dimensions that define the kinematic data (i.e. X and Y)
        conc_proj_data (bool): If the projected neural data should be concatenated.

    Returns:
        tuple: Tuple containing:
            | **(nch, ndim+1):** Subspace (:math:`\\beta`) that best predicts kinematic variables. Note the first column represents the intercept, then the next dimensions represent the behavioral variables
            | **(list of (nt, ndim+1), or (nt_total, ndim+1) if conc_proj_data):** Neural data projected onto task relevant subspace. A single (non-list) input yields a list with one element.

    '''
    # Treat a single array as one trial so both input forms share the same code path
    if isinstance(neural_data, list):
        trials = neural_data
        stacked_neural = np.vstack(neural_data) # (nt, nch)
        stacked_kin = np.vstack(kin_data)
    else:
        trials = [neural_data]
        stacked_neural = neural_data
        stacked_kin = kin_data

    # Float copy so that centering never modifies the caller's data
    centered_neural = stacked_neural.astype(float)
    centered_neural -= np.nanmean(centered_neural, axis=0)

    # Design matrix: intercept column followed by the kinematic variables
    ntime = centered_neural.shape[0]
    design = np.ones((ntime, stacked_kin.shape[1]+1))
    design[:,1:] = stacked_kin

    # Least-squares solution, shape (ndim+1, nch)
    task_subspace = np.linalg.pinv(design.T @ design) @ design.T @ centered_neural

    # The pseudo-inverse is the same for every trial, so compute it once.
    # NOTE(review): because the neural data are centered, the intercept row of
    # task_subspace looks linearly dependent on the kinematic rows, so this result
    # relies on pinv's singular-value cutoff - confirm this is intended.
    projector = np.linalg.pinv(task_subspace)
    projected_data = [trial @ projector for trial in trials]

    if conc_proj_data:
        return task_subspace.T, np.vstack(projected_data)
    return task_subspace.T, projected_data

'''
METRIC CALCULATIONS
'''
def calc_rms(signal, remove_offset=True):
    '''
    Compute the root mean square (RMS) of a signal along its first (time) axis.

    Args:
        signal (nt, ...): voltage along time, other dimensions will be preserved
        remove_offset (bool): if true, subtract the mean (over time) before calculating RMS

    Returns:
        float array: rms of the signal along the first axis. output dimensions will be the same non-time dimensions as the input signal
    '''
    offset = np.mean(signal, axis=0) if remove_offset else 0
    mean_square = np.mean(np.square(signal - offset), axis=0)
    return np.sqrt(mean_square)

def find_outliers(data, std_threshold):
    '''
    Use kmeans clustering (with a single cluster) to find the center point of a dataset and
    the distance from each data point to that center point. Data points whose distance is not
    below 'std_threshold' times the root-mean-square distance are labeled as outliers.
    This is particularily useful for high dimensional data

    Note: This function only uses the kmeans function to calculate centerpoint distances but does
    not output any useful information about data clusters.

    Example::

        >>> data = np.array([[0.5,0.5], [0.75,0.75], [1,1], [10,10]])
        >>> outliers_labels, distance = aopy.analysis.find_outliers(data, 1.5)
        >>> print(outliers_labels, distance)
        [True, True, True, False] [3.6239, 3.2703, 2.9168, 9.8111]

    In this example the root-mean-square distance is about 5.67, so a threshold of 1.5
    (cutoff of about 8.5) flags only the last point; a threshold of 2 would flag none.

    Args:
        data (n, nfeatures): Input data to plot in an nfeature dimensional space and compute outliers
        std_threshold (float): Number of standard deviations away a data point is required to be to be classified as an outlier

    Returns:
        tuple: Tuple containing:
            | **good_data_idx (n):** Labels each data point if it is an outlier (True = good, False = outlier)
            | **distances (n):** Distance of each data point from center
    '''
    # With one cluster, transform() gives the distance of every point to the single center, shape (n, 1)
    kmeans_model = KMeans(n_clusters = 1).fit(data)
    distances = kmeans_model.transform(data)

    # Spread of the data: root-mean-square of the distances to the center
    dist_std = np.sqrt(np.sum(distances**2)/len(distances))
    good_data_idx = (distances < (dist_std*std_threshold))

    return good_data_idx.flatten(), distances.flatten()

def fit_linear_regression(X:np.ndarray, Y:np.ndarray, coefficient_coeff_warning_level:float = 0.5) -> tuple:
    """
    Function that fits a linear regression to each matching column of X and Y arrays.

    Args:
        X [np.ndarray]: number of data points by number of columns. columns of independant vars.
        Y [np.ndarray]: number of data points by number of columns. columns of dependant vars
        coefficient_coeff_warning_level (float): if the absolute correlation coefficient of any column
            is at or below this level, a warning is issued for that column. Default 0.5.

    Returns:
        tuple: tuple containing:
            | **slope (n_columns):** slope of each fit
            | **intercept (n_columns):** intercept of each fit
            | **corr_coefficient (n_columns):** corr_coefficient of each fit
    """

    # Columns are paired by position, so both inputs must have the same shape
    assert X.shape == Y.shape

    n_columns = X.shape[1]

    slope = np.zeros((n_columns,))
    intercept = np.zeros((n_columns,))
    corr_coeff = np.zeros((n_columns,))

    for i in range(n_columns):
        # linregress returns (slope, intercept, rvalue, ...); only the first three are kept
        slope[i], intercept[i], corr_coeff[i], *_ = scipy.stats.linregress(X[:,i], Y[:,i])

        if abs(corr_coeff[i]) <= coefficient_coeff_warning_level:
            warnings.warn(f'when fitting column number {i}, the correlation coefficient is {corr_coeff[i]}, less than {coefficient_coeff_warning_level} ')

    return slope, intercept, corr_coeff

def calc_freq_domain_values(data, samplerate):
    '''
    Decompose time series data into the frequency domain with an FFT along the time axis
    and return the one-sided (non-negative frequency) spectrum. Values are normalized by
    the number of samples, and every component except DC is doubled to account for the
    half of the amplitude that sits at the matching negative frequency.
    For math details, see: https://www.sjsu.edu/people/burford.furman/docs/me120/FFT_tutorial_NI.pdf

    Args:
        data (nt, nch): timeseries data, can be a single channel vector
        samplerate (float): sampling rate of the data

    Returns:
        tuple: Tuple containing:
            | **freqs (nt/2):** array of frequencies (essentially the x axis of a spectrogram)
            | **freqvalues (nt/2, nch):** array of complex numbers at the above frequencies (each containing magnitude and phase)
    '''
    # A single channel vector is treated as one column
    if np.ndim(data) < 2:
        data = np.expand_dims(data, 1)

    spectrum = np.fft.fft(data, axis=0)
    n_samples = np.shape(spectrum)[0]
    all_freqs = np.fft.fftfreq(n_samples, d=1./samplerate)

    # Keep the DC and positive-frequency bins only
    keep = all_freqs>=0
    one_sided = spectrum[keep,:]/complex(n_samples,0)
    one_sided[1:,:] = one_sided[1:,:]*2
    return all_freqs[keep], one_sided

def calc_freq_domain_amplitude(data, samplerate, rms=False):
    '''
    Amplitude spectrum of time series data: the magnitude of the one-sided spectrum
    returned by :func:`calc_freq_domain_values`, optionally converted from peak
    amplitude to root-mean-square amplitude.

    Args:
        data (nt, nch): timeseries data, can be a single channel vector
        samplerate (float): sampling rate of the data
        rms (bool, optional): compute root-mean square amplitude instead of peak amplitude

    Returns:
        tuple: Tuple containing:
            | **freqs (nt/2):** array of frequencies (essentially the x axis of a spectrogram)
            | **amplitudes (nt/2, nch):** array of amplitudes at the above frequencies (the y axis)
    '''
    freqs, freq_values = calc_freq_domain_values(data, samplerate)
    amplitudes = np.abs(freq_values)

    # Peak -> RMS conversion applies to every component except DC (the first row)
    if rms:
        amplitudes[1:,:] /= np.sqrt(2)
    return freqs, amplitudes

def calc_ISI(data, fs, bin_width, hist_width, plot_flag = False):
    '''
    Builds an inter-spike interval (ISI) histogram for every unit. The input is sampled,
    thresholded spike data, in which every non-zero sample counts as a spike.

    Example:
        >>> data = np.array([[0, 1, 0, 0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 0, 1],[1, 1, 1, 0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 1, 1, 0, 1, 0]])
        >>> data_T = data.T
        >>> fs = 100
        >>> bin_width = 0.01
        >>> hist_width = 0.1
        >>> ISI_hist, hist_bins = analysis.calc_ISI(data_T, fs, bin_width, hist_width)
        >>> print(ISI_hist)
            [[0. 0.]
            [2. 3.]
            [2. 1.]
            [2. 1.]
            [1. 2.]
            [0. 0.]
            [0. 0.]
            [0. 0.]
            [0. 0.]]

    Args:
        data (nt, n_unit): time series spike data with multiple units.
        fs (float): sampling rate of data [Hz]
        bin_width (float): bin_width to compute histogram [s]
        hist_width (float): determines bin edge (0 < t < histo_width) [s]
        plot_flag (bool, optional): display histogram. In plotting, number of intervals is summed across units.

    Returns:
        tuple: tuple containing:
            | **ISI_hist (n_bins, n_unit):** number of intervals
            | **hist_bins (n_bins):** center of each histogram bin [s]
    '''
    n_unit = data.shape[1]
    sample_period = 1/fs
    bin_edges = np.arange(0, hist_width, bin_width)

    ISI_hist = np.zeros((len(bin_edges)-1, n_unit))
    for unit in range(n_unit):
        # Sample indices of the spikes -> intervals between consecutive spikes in seconds
        spike_samples = np.where( data[:,unit] )
        intervals = np.diff(spike_samples)*sample_period
        ISI_hist[:,unit] = np.histogram(intervals, bin_edges)[0]

    # Report the bin centers rather than the bin edges
    hist_bins = bin_edges[:-1] + np.diff(bin_edges)/2

    if plot_flag:
        # x axis is multiplied by 1000 to rescale from [s] to [ms]
        plt.bar(hist_bins*1000, np.sum(ISI_hist,axis=1), width = bin_width*1000, edgecolor="black")
        plt.xlabel('Interspike interval (ms)')
        plt.ylabel('Number of intervals')

    return ISI_hist, hist_bins

def calc_sem(data, axis=None):
    '''
    Standard error of the mean (SEM) of the input data, computed as shown below where
    :math:`\\sigma` is the standard deviation and :math:`n` is the number of samples.
    NaN values are ignored, both in the standard deviation and in the count :math:`n`.
    Without an axis argument the SEM is calculated across the entire input array.

    .. math::

        SEM = \\frac{\\sigma}{\\sqrt{n}}


    Args:
        data (nd array): Input data matrix of any dimension
        axis (int or tuple): Axis to perform SEM calculation on

    Returns:
        nd array: SEM value(s).
    '''
    is_valid = np.logical_not(np.isnan(data))
    n_valid = np.sum(is_valid, axis=axis)
    spread = np.nanstd(data, axis=axis)
    return spread/np.sqrt(n_valid)

def calc_rolling_average(data, window_size=11, mode='copy'):
    """
    Computes the rolling average of a 1- or 2-D array using a convolutional kernel.
    The rolling average is always applied along the first axis of the array.
    If mode is 'nan', the ends of the array where an incomplete rolling average
    occurs is replaced with np.nan. If mode is 'copy' (the default), the first and
    last valid datapoint (fully overlapping with the kernel) are copied backwards
    and forwards, respectively. The size of the output will always be the same as
    the size of the input data. A window of size 1 has no incomplete edges, so the
    data is returned unchanged (as a new array) in either mode.

    Args:
        data (nt, nch): The array of data to compute the rolling average for.
        window_size (int): The size of the kernel in number of samples. Must be odd.
        mode (str): Either 'copy' or 'nan', determines what happens on the edges
            where the kernel doesn't fully overlap the data

    Raises:
        ValueError: if mode is neither 'copy' nor 'nan'

    Returns:
        array with the same shape as data: The rolling average of the input data.
    """
    assert window_size % 2 == 1, "Kernel size must be odd."
    if mode not in ('copy', 'nan'):
        raise ValueError(f"Invalid mode: {mode}. Choose from 'copy' or 'nan'.")

    data = np.array(data)
    # Normalize by the number of samples that can actually overlap the kernel
    kernel = np.ones(window_size) / min(window_size, data.shape[0])
    data_convolved = np.apply_along_axis(
        lambda d: np.convolve(d, kernel, mode='same'), 0, data)

    # Number of samples at each end where the kernel hangs over the edge.
    # Guard against 0: a slice of [-0:] would select (and overwrite) the whole array.
    half_window = window_size // 2
    if half_window > 0:
        if mode == 'nan':
            data_convolved[:half_window] = np.nan
            data_convolved[-half_window:] = np.nan
        else:
            data_convolved[:half_window] = data_convolved[half_window]
            data_convolved[-half_window:] = data_convolved[-(half_window+1)]

    # Fix shape if window is bigger than data
    if data_convolved.shape[0] > data.shape[0]:
        data_convolved = data_convolved[0]*np.ones(data.shape)
    return data_convolved

def calc_corr_over_elec_distance(elec_data, elec_pos, bins=20, method='spearman', exclude_zero_dist=True):
    '''
    Calculates mean absolute correlation between elec_data across channels with the same distance between them.

    Args:
        elec_data (nt, nelec): electrode data with nelec corresponding to elec_pos
        elec_pos (nelec, 2): x, y position of each electrode
        bins (int or array): input into scipy.stats.binned_statistic, can be a number or a set of bins
        method (str, optional): correlation method to use ('pearson' or 'spearman')
        exclude_zero_dist (bool, optional): whether to exclude distances that are equal to zero. default True

    Raises:
        ValueError: if method is not 'spearman' or 'pearson'

    Returns:
        tuple: tuple containing:
            | **dist (nbins):** electrode distance at the center of each bin
            | **corr (nbins):** mean absolute correlation at each bin

    Updated:
        2024-03-13 (LRS): Changed input from acq_data and acq_ch to elec_data.
    '''
    assert elec_data.shape[1] == elec_pos.shape[0], "Number of electrodes don't match!"
    # presumably an (nelec, nelec) matrix of pairwise distances; verify against utils
    dist = utils.calc_euclid_dist_mat(elec_pos)
    if method == 'spearman':
        c, _ = stats.spearmanr(elec_data, axis=0)
    elif method == 'pearson':
        c = np.corrcoef(elec_data.T)
    else:
        raise ValueError(f"Unknown correlation method {method}")

    # spearmanr returns a single coefficient instead of a matrix when given exactly
    # two columns; expand it so it can be masked and flattened alongside dist
    c = np.asarray(c)
    if c.ndim == 0:
        rho = float(c)
        c = np.array([[1., rho], [rho, 1.]])

    if exclude_zero_dist:
        # Drops every pair at zero distance, which includes each electrode with itself
        zero_dist = dist == 0
        dist = dist[~zero_dist]
        c = c[~zero_dist]

    corr, edges, _ = stats.binned_statistic(dist.flatten(), np.abs(c.flatten()), statistic='mean', bins=bins)
    dist = (edges[:-1] + edges[1:]) / 2

    return dist, corr

def calc_stat_over_dist_from_pos(elec_data, elec_pos, pos, statistic='mean', bins=20):
    '''
    Bins spatial data by the euclidean distance from each electrode to a given position,
    then computes a statistic on the electrode data within each distance bin.

    Args:
        elec_data (nelec): electrode data
        elec_pos (nelec, 2): x, y position of each electrode
        pos (2,): x, y position to calculate distance from
        statistic (str): statistic to calculate ('mean', 'std', 'median', 'max', 'min'). See scipy.stats.binned_statistic. Default 'mean'.
        bins (int or array): number of bins or bin edges for binned_statistic. Default 20.

    Returns:
        tuple: tuple containing:
            | **dist (nbins):** electrode distance at the center of each bin
            | **stat (nbins):** statistic at each bin

    Example:

        .. code-block:: python

            nelec = 100
            elec_data = np.arange(nelec)
            elec_pos = [[idx, 1] for idx in range(nelec)]
            pos = [0,1]
            dist, mean = aopy.analysis.calc_stat_over_dist_from_pos(elec_data, elec_pos, pos)

            plt.figure()
            plt.plot(dist, mean)
            plt.xlabel('Distance')
            plt.ylabel('Mean')
            plt.title('Increasing statistic with distance')

        .. image:: _images/increasing_statistic_with_distance.png
    '''
    assert len(pos) == 2, "Position must be a 2D point"
    assert len(elec_data) == len(elec_pos), "Number of electrodes don't match!"
    assert np.shape(elec_pos)[1] == 2, "Electrode positions must be 2D"

    reference = np.array(pos)
    offsets = (np.array(electrode) - reference for electrode in elec_pos)
    distances = [np.linalg.norm(offset) for offset in offsets]

    stat, bin_edges, _ = stats.binned_statistic(distances, elec_data, statistic=statistic, bins=bins)
    bin_centers = (bin_edges[:-1] + bin_edges[1:]) / 2
    return bin_centers, stat

def calc_stat_over_angle_from_pos(elec_data, elec_pos, origin, statistic='mean', bins=20):
    '''
    Groups spatial data by the angle of each electrode as seen from the origin
    (computed with arctan2), then evaluates a statistic on the electrode data that
    falls into each angular bin.

    Args:
        elec_data (nelec): electrode data
        elec_pos (nelec, 2): x, y position of each electrode
        origin (2,): x, y position to calculate angle from
        statistic (str): statistic to calculate ('mean', 'std', 'median', 'max', 'min'). See scipy.stats.binned_statistic. Default 'mean'.
        bins (int or array): number of angular bins or bin edges for binned_statistic. Default 20.

    Returns:
        tuple: tuple containing:
            | **angle (nbins):** angle (in radians) to origin at the center of each bin
            | **stat (nbins):** statistic at each bin

    Example:

        .. code-block:: python

            # Create a circle of electrodes
            nelec = 100
            elec_data = np.arange(nelec)
            elec_pos = [[np.cos(idx/nelec*2*np.pi), np.sin(idx/nelec*2*np.pi)] for idx in range(nelec)]
            origin1 = [0,0]
            origin2 = [0,1]

            plt.figure()
            plt.subplot(1,2,1)
            plt.scatter(*np.array(elec_pos).T, c=elec_data)
            plt.scatter(*origin1, color='b')
            plt.scatter(*origin2, color='r')
            plt.axis('equal')

            angle, mean = aopy.analysis.calc_stat_over_angle_from_pos(elec_data, elec_pos, origin1)
            plt.subplot(1,2,2)
            plt.plot(angle, mean, color='b')
            angle, mean = aopy.analysis.calc_stat_over_angle_from_pos(elec_data, elec_pos, origin2)
            plt.plot(angle, mean, color='r')
            plt.xlabel('Angle (rad)')
            plt.ylabel('Mean')

        .. image:: _images/angle_versus_position.png
    '''
    assert len(origin) == 2, "Origin must be a 2D point"
    assert len(elec_data) == len(elec_pos), "Number of electrodes don't match!"
    assert np.shape(elec_pos)[1] == 2, "Electrode positions must be 2D"

    origin = np.array(origin)
    origin_x = origin[0]
    origin_y = origin[1]
    angles = [np.arctan2(y - origin_y, x - origin_x) for x, y in elec_pos]

    stat, bin_edges, _ = stats.binned_statistic(angles, elec_data, statistic=statistic, bins=bins)
    bin_centers = (bin_edges[:-1] + bin_edges[1:]) / 2
    return bin_centers, stat

def subtract_erp_baseline(erp, time, t0, t1):
    '''
    Subtract pre-trigger activity from trial-aligned data. The baseline is the mean over
    the samples whose time falls in [t0, t1), computed separately for every channel and
    trial. NaN values inside the baseline window propagate to the result.

    Args:
        erp (nt, nch, ntr): trial-aligned evoked responses
        time (nt): time axis (in seconds) of the erp, in the same reference frame as t0 and t1.
            Must be sorted in ascending order.
        t0 (float): start of the baseline window (in seconds)
        t1 (float): end of the baseline window (in seconds)

    Raises:
        ValueError: if the baseline window times (t0, t1) are in the wrong order

    Returns:
        (nt, nch, ntr): erp after baseline subtraction
    '''
    if t1 <= t0:
        raise ValueError("t1 must be greater than t0")

    # Sample range of the baseline window
    s0 = np.searchsorted(time, t0)
    s1 = np.searchsorted(time, t1)

    # keepdims leaves a length-1 time axis so the baseline broadcasts over every
    # sample without building an nt-times larger copy
    baseline = np.mean(erp[s0:s1], axis=0, keepdims=True)
    return erp - baseline

def calc_erp(data, event_times, time_before, time_after, samplerate, subtract_baseline=True, baseline_window=None):
    '''
    Calculates the event-related potential (ERP) for the given timeseries data.

    Args:
        data (nt, nch): timeseries data across channels
        event_times (ntrial): list of event times
        time_before (float): number of seconds to include before each event
        time_after (float): number of seconds to include after each event
        samplerate (float): sampling rate of the data
        subtract_baseline (bool, optional): if True, subtract the mean of the aligned data during
            the baseline window from each trial. Must supply a positive time_before. Default True
        baseline_window ((2,) float, optional): range of time (t0, t1) to compute baseline, in seconds
            measured from the first sample of the aligned data. May be a tuple, list or array.
            Default is (0, time_before).

    Raises:
        ValueError: if subtract_baseline is requested with a non-positive time_before, or if
            baseline_window is not of the form (t0, t1) with t1 greater than t0

    Returns:
        (nt, nch, ntr): array of event-aligned responses for each channel during the given time periods

    '''
    if subtract_baseline and time_before <= 0:
        raise ValueError("Input time_before must be positive in order to calculate baseline")

    # Align the data to the given event times (shape is [nt, nch, ntrial])
    aligned_data = preproc.trial_align_data(data, event_times, time_before, time_after, samplerate)
    if not subtract_baseline:
        return aligned_data

    # Arrays cannot be tested for truth directly, so check their size explicitly
    if isinstance(baseline_window, np.ndarray):
        window_given = baseline_window.size > 0
    else:
        window_given = bool(baseline_window)

    if not window_given:
        baseline_window = (0, time_before)
    elif len(baseline_window) < 2 or baseline_window[1] <= baseline_window[0]:
        raise ValueError("baseline_window must be in the form (t0, t1) where \
                t1 is greater than t0")

    # Time axis of the aligned data, starting at 0 on its first sample
    time = np.arange(len(aligned_data))/samplerate
    return subtract_erp_baseline(aligned_data, time, baseline_window[0], baseline_window[1])

def get_max_erp(erp, time_before, time_after, samplerate, max_search_window=None, trial_average=False):
    '''
    Finds the value with the largest magnitude (across time) for the given trial-aligned data or
    event-related potential (ERP), optionally after averaging across trials. The returned values
    keep their sign. Identical to :func:`~aopy.analysis.calc_max_erp` except this function
    takes trial-aligned data as input instead of timeseries data.

    Args:
        erp ((nt, nch, ntr) array): trial-aligned data
        time_before (float): number of seconds to include before each event
        time_after (float): number of seconds to include after each event
        samplerate (float): sampling rate of the data
        max_search_window ((2,) float, optional): range of time to search for maximum value (in seconds
            after event). May be a tuple, list or array. Default is the entire time_after period.
        trial_average (bool, optional): if True, average across trials before calculating max (using nanmean). Default False.

    Raises:
        ValueError: if erp is not 3-dimensional, or if max_search_window is not of the
            form (t0, t1)

    Returns:
        (nch, ntr): array of maximum ERP for each channel and trial during the given time periods,
        or (nch,) array of maximum trial-averaged ERP if trial_average is True
    '''
    if np.ndim(erp) != 3:
        raise ValueError("ERP must be in the form (nt, nch, ntr)")
    erp = np.asarray(erp)
    if trial_average:
        erp = np.nanmean(erp, axis=2, keepdims=True)

    # Arrays cannot be tested for truth directly, so check their size explicitly
    if isinstance(max_search_window, np.ndarray):
        window_given = max_search_window.size > 0
    else:
        window_given = bool(max_search_window)

    # Limit the search to the given window (sample indices relative to the event)
    start_idx = int(time_before*samplerate)
    end_idx = start_idx + int(time_after*samplerate)
    if window_given:
        if len(max_search_window) < 2 or max_search_window[1] < max_search_window[0]:
            raise ValueError("max_search_window must be in the form (t0, t1) where \
                t1 is greater than t0")
        end_idx = start_idx + int(max_search_window[1]*samplerate)
        start_idx += int(max_search_window[0]*samplerate)

    # Find the indices of the maximum absolute values, shape (nch, ntr)
    erp_window = erp[start_idx:end_idx]
    idx_max_erp = start_idx + np.argmax(np.abs(erp_window), axis=0)

    # Use the indices to obtain the actual signed values
    ch_idx = np.arange(erp.shape[1])[:, None]
    tr_idx = np.arange(erp.shape[2])
    max_erp = erp[idx_max_erp, ch_idx, tr_idx]

    if trial_average:
        # Drop the length-1 trial axis left by the trial average
        max_erp = max_erp[:,0]

    return max_erp

def calc_max_erp(data, event_times, time_before, time_after, samplerate, subtract_baseline=True, 
                 baseline_window=None, max_search_window=None, trial_average=True):
    '''
    Computes the event-related potential (ERP) from timeseries data and returns its largest-magnitude 
    value across time. This is a convenience wrapper: the data is first passed through 
    :func:`~aopy.analysis.base.calc_erp` and the result is handed to :func:`~aopy.analysis.get_max_erp`. 
    If you already have trial-aligned data (e.g. from :func:`~aopy.analysis.base.calc_erp`), call 
    :func:`~aopy.analysis.get_max_erp` directly instead.
    
    Args:
        data (nt, nch): timeseries data across channels
        event_times (ntrial): list of event times
        time_before (float): number of seconds to include before each event
        time_after (float): number of seconds to include after each event
        samplerate (float): sampling rate of the data
        subtract_baseline (bool, optional): if True, subtract the mean of the aligned data during
            the time_before period preceding each event. Must supply a positive time_before. Default True
        baseline_window ((2,) float, optional): range of time to compute baseline (in seconds before event)
            Default is the entire time_before period.
        max_search_window ((2,) float, optional): range of time to search for maximum value (in seconds 
            after event). Default is the entire time_after period.
        trial_average (bool, optional): if True (the default here), average across trials before 
            calculating the max
        
    Returns:
        (nch,) array of the maximum of the trial-averaged ERP for each channel when trial_average is 
        True, otherwise an (nch, ntr) array with one maximum per channel and trial
    '''
    # Step 1: trial-align (and optionally baseline-correct) the continuous data
    aligned_erp = calc_erp(
        data, event_times, time_before, time_after, samplerate, subtract_baseline, baseline_window
    )

    # Step 2: search the aligned data for the largest-magnitude value
    max_erp = get_max_erp(
        aligned_erp, time_before, time_after, samplerate, max_search_window, trial_average
    )
    return max_erp
    
    
'''
MODEL FITTING
'''
def linear_fit_analysis2D(xdata, ydata, weights=None, fit_intercept=True):
    '''
    Fits a straight line to (xdata, ydata) with (optionally weighted) linear regression and evaluates 
    that line at every input x value. Also reports the coefficient of determination of the fit and 
    Pearson's correlation coefficient between xdata and ydata.

    Linear regression fit is calculated using:
    https://scikit-learn.org/stable/modules/generated/sklearn.linear_model.LinearRegression.html
    
    Pearson correlation coefficient is calculated using:
    https://docs.scipy.org/doc/scipy/reference/generated/scipy.stats.pearsonr.html

    Args:
        xdata (npts): independent variable (numpy array)
        ydata (npts): dependent variable (numpy array)
        weights (npts, optional): per-sample weights passed to the regression fit. Default None.
        fit_intercept (bool, optional): whether the regression should estimate an intercept. Default True.

    Returns:
        tuple: Tuple containing:
            | **linear_fit (npts):** Y value of the linear fit corresponding to each point in the input xdata.
            | **linear_fit_score (float):** Coefficient of determination for linear fit
            | **pcc (float):** Pearson's correlation coefficient
            | **pcc_pvalue (float):** Two tailed p-value corresponding to PCC calculation. Measures the significance of the relationship between xdata and ydata.
            | **reg_fit (sklearn.linear_model._base.LinearRegression):** Linear regression parameters
    '''
    # The regression expects column vectors
    x_col = xdata.reshape(-1, 1)
    y_col = ydata.reshape(-1, 1)

    model = LinearRegression(fit_intercept=fit_intercept)
    reg_fit = model.fit(x_col, y_col, sample_weight=weights)
    linear_fit_score = reg_fit.score(x_col, y_col)

    # Correlation is computed on the flattened (unweighted) samples
    pcc, pcc_pvalue = stats.pearsonr(x_col.flatten(), y_col.flatten())

    # Evaluate the fitted line at each input x
    slope = reg_fit.coef_[0][0]
    linear_fit = slope*x_col.flatten() + reg_fit.intercept_

    return linear_fit, linear_fit_score, pcc, pcc_pvalue, reg_fit

def classify_by_lda(X_train_lda, y_class_train, 
                    n_splits=5,
                    n_repeats=3, 
                    random_state=1):
    """
    Cross-validates a linear discriminant analysis (LDA) classifier on the given examples and labels 
    using repeated stratified k-fold splitting, and summarises the accuracy obtained on the held-out 
    folds.

    Args:
        X_train_lda (n_examples, n_features): 2d training data. first dimension is the number of examples, second dimension is the size of each example
        y_class_train (n_examples): class to which each example belongs
        n_splits (int, optional): number of partitions to split the data into. Defaults to 5.
        n_repeats (int, optional): number of times the k-fold split is repeated. Defaults to 3.
        random_state (int, optional): random state for data splitting. Defaults to 1.

    Returns:
        tuple: Tuple containing:
            **accuracy (float):** mean accuracy over all folds and repeats.
            **std (float):** standard deviation of the accuracy over all folds and repeats.
    """

    # one label per example
    assert X_train_lda.shape[0] == len(y_class_train)

    lda = LinearDiscriminantAnalysis()

    # n_splits folds, repeated n_repeats times with different randomisation
    splitter = model_selection.RepeatedStratifiedKFold(
        n_splits=n_splits, n_repeats=n_repeats, random_state=random_state)

    # one accuracy score per held-out fold; n_jobs=-1 uses all available processors
    fold_scores = model_selection.cross_val_score(
        lda, X_train_lda, y_class_train, scoring='accuracy', cv=splitter, n_jobs=-1)

    return np.mean(fold_scores), np.std(fold_scores)

def get_random_timestamps(nshuffled_points, max_time, min_time=0, time_samplerate=None):
    '''
    This calculates random timestamps either within a range or from a discrete time axis.

    Args:
        nshuffled_points (int): How many randomly selected time points to return
        max_time (float): Max of time range to draw samples from. Returned timestamps never exceed this value.
        min_time (float): Min of time range to draw samples from. Defaults to 0
        time_samplerate (int): Samplerate [samples/s] for the time range. Defaults to None. If None, random 
            times are drawn from a continuous uniform distribution. If a value is input, the random samples 
            are drawn (without replacement) from the grid min_time + k/time_samplerate that lies within 
            [min_time, max_time].

    Returns:
        shuffled_timestamps (nshuffled_points): Ordered random timestamps. None is returned (after a 
        warning) if time_samplerate is given and there are not enough grid points to draw from.
    '''
    if time_samplerate is None:
        random_timestamps = np.random.uniform(min_time, max_time, size=nshuffled_points)
        return np.sort(random_timestamps)

    # Check that that there are enough sample points to randomly select from
    n_intervals = (max_time - min_time)*time_samplerate
    if nshuffled_points > n_intervals:
        warnings.warn('There are not enough possible sample points to randomly select from.')
        return

    # Build the axis from integer sample indices. A float-step np.arange up to max_time + 1/fs can 
    # emit a grid point beyond max_time when the range is not a whole number of samples (or because 
    # of floating point error). Rounding first keeps a grid point that lands on max_time up to float 
    # error.
    n_steps = int(np.floor(np.round(n_intervals, 6)))
    time_axis = min_time + np.arange(n_steps + 1)/time_samplerate
    time_axis = np.minimum(time_axis, max_time) # guard against overshoot by floating point error
    random_timestamps = np.random.choice(time_axis, size=nshuffled_points, replace=False)
    
    return np.sort(random_timestamps)
    
def get_empirical_pvalue(data_distribution, data_sample, test_type='two_sided', assume_gaussian=False, nbins=None):
    '''
    Calculates the cumulative density function (CDF) from the input data distribution, then calculates the 
    probability (p-value) that a data sample is part of that distribution.

    Args:
        data_distribution (npts): Distribution of empirically determined data points
        data_sample (float or (nsamples,) array): Data sample(s) to get pvalue of 
        test_type (str): 'two_sided', 'lower', or 'upper'.
        assume_gaussian (bool): Assumes the data represents a gaussian distribution when calculating the pvalue
        nbins (int): Number of histogram bins used to estimate the empirical CDF (only used if assume_gaussian 
            is False). Default is len(data_distribution) if input is None.
        
    Returns:
        significance (float or (nsamples,) array): pvalue of the input data_sample based the parameters of 
        the input data_distribution. None is returned (after a warning) if test_type is not recognised.
    '''
    data_mean = np.nanmean(data_distribution)

    # Assume input data is a gaussian distribution
    if assume_gaussian:
        data_std = np.nanstd(data_distribution)
        z_value = (data_sample - data_mean)/data_std
        cdf_sample = scipy.stats.norm.cdf(z_value)
    
    # Get CDF from input data distribution
    else: 
        if nbins is None:
            # NOTE(review): an earlier docstring advertised len(data_distribution)/100 but the code has 
            # always used one bin per data point; that behavior is kept so results do not change.
            nbins = len(data_distribution)
        count, bin_edges = np.histogram(data_distribution, bins=nbins)
        bin_centers = bin_edges[:-1] + (bin_edges[1] - bin_edges[0])/2 # Use center of bins
        cdf = np.cumsum(count)/np.sum(count) # last value is exactly 1

        # Index of the first bin whose center lies above the sample. Samples beyond the last bin 
        # center are clamped to the final CDF value instead of indexing out of bounds.
        idx_bin = np.searchsorted(bin_centers, data_sample, side='right')
        cdf_sample = cdf[np.minimum(idx_bin, len(cdf) - 1)]

    if test_type == 'two_sided':
        # Use the tail on the same side of the mean as the sample
        if np.isscalar(data_sample):
            if data_sample > data_mean:
                return 2*(1-cdf_sample)
            else: 
                return 2*cdf_sample
        else:
            above_mean = np.asarray(data_sample) > data_mean
            return 2*np.where(above_mean, 1 - cdf_sample, cdf_sample)
        
    elif test_type == 'lower':
        return cdf_sample
    elif test_type == 'upper':
        return 1 - cdf_sample
    else:
        warnings.warn('Please enter a valid test_type. Must be either two_sided, upper, or lower')
        return


'''
Spectral Estimation and Analysis
'''
def calc_cwt_tfr(data, freqs, samplerate, fb=1.5, f0_norm=1.0, method='fft', complex_output=False, verbose=False):
    '''
    Compute a time-frequency representation of the data by continuous wavelet transform with 
    complex Morlet wavelets (via pywt).
    
    Args:
        data (nt, nch): time series data. 1D input is treated as a single channel.
        freqs (nfreq): frequencies to decompose, in Hz
        samplerate (float): sampling rate of the data
        fb (float, optional): time-decay parameter, inverse relationship with bandwidth 
            of the wavelets; setting a higher number results in narrower frequency resolution
        f0_norm (float, optional): center frequency of the wavelets, normalized to the sampling 
            rate. Default to 1.0, or the same frequency as the sampling rate.
        method (str, optional): either 'fft', or 'conv', which can be faster for shorter data. 
            Defaults to 'fft'.
        complex_output (bool, optional): return the complex coefficients instead of their magnitude. 
            Default False.
        verbose (bool, optional): print out information about the wavelets

    Returns:
        tuple: tuple containing:
            | **freqs (nfreq):** frequency axis in Hz (the input freqs, unchanged)
            | **time (nt):** time axis in seconds
            | **spec (nfreq, nt, nch):** tfr representation for each channel. Trailing axes of 
                length 1 are removed.

    Examples:
        
        .. code-block:: python

            from analyze/tests/analysis_tests import HelperFunctions
            fb = 10.
            f0_norm = 2.
            freqs = np.linspace(1,50,50)
            tfr_fun = lambda data, fs: aopy.analysis.calc_cwt_tfr(data, freqs, fs, fb=fb, f0_norm=f0_norm, verbose=True)
            HelperFunctions.test_tfr_sines(tfr_fun)
            
        .. image:: _images/tfr_cwt_sines.png
        
        .. code-block:: python

            freqs = np.linspace(1,500,500)
            tfr_fun = lambda data, fs: aopy.analysis.calc_cwt_tfr(data, freqs, fs, fb=fb, f0_norm=f0_norm, verbose=True)
            HelperFunctions.test_tfr_chirp(tfr_fun)

        .. image:: _images/tfr_cwt_chirp.png

        .. code-block:: python

            freqs = np.linspace(1,200,200)
            tfr_fun = lambda data, fs: aopy.analysis.calc_cwt_tfr(data, freqs, fs, fb=fb, f0_norm=f0_norm, verbose=True)
            HelperFunctions.test_tfr_lfp(tfr_fun)

        .. image:: _images/tfr_cwt_lfp.png

    '''
    if data.ndim < 2:
        data = data[:, None] # single channel -> (nt, 1)
    time = np.arange(data.shape[0])/samplerate

    # Frequencies are handed to pywt reversed and normalized by the sampling rate; the 
    # coefficients are flipped back before returning so they line up with the input freqs.
    norm_freqs_rev = np.flip(freqs)/samplerate

    # 'cmorB-C' names a complex Morlet wavelet with time-decay B and center frequency C
    wavelet = pywt.ContinuousWavelet(f'cmor{fb}-{f0_norm}')
    scales = pywt.frequency2scale(wavelet, norm_freqs_rev)
    if verbose:
        print(wavelet.bandwidth_frequency)
        print(f"Wavelet ({wavelet.lower_bound}, {wavelet.upper_bound})")
        print(f"Scale ({scales[0]}, {scales[-1]})")
        print(f"Freqs ({norm_freqs_rev[0]}, {norm_freqs_rev[-1]})")
    coef = pywt.cwt(data, scales, wavelet, method=method, axis=0)[0]
    
    # Strip trailing axes with length 1
    n_keep = coef.ndim
    while n_keep > 0 and coef.shape[n_keep - 1] == 1:
        n_keep -= 1
    coef = coef.reshape(coef.shape[:n_keep])

    if not complex_output:
        coef = np.abs(coef)
    return freqs, time, np.flip(coef, axis=0)

def calc_ft_tfr(data, samplerate, win_t, step, f_max=None, pad=2, window=None, 
                 detrend='constant', complex_output=False):
    '''
    Short-time fourier transform. Makes use of scipy.signal.spectrogram to compute
    a fast spectrogram. 

    Args:
        data (nt, nch): timeseries data. Lists are converted to arrays and 1D input is treated as 
            a single channel.
        samplerate (float): sampling rate of the data.
        win_t (float): window size in seconds.
        step (float): step size in seconds. Must be smaller than win_t.
        f_max (float): frequency range to return in Hz ([0, f_max]). Defaults to samplerate/2.
        pad (int):  padding factor for the FFT. This should be 1 or a multiple of 2.
                    For N=500, if pad=1, we pad the FFT to 512 points.
                    If pad=2, we pad the FFT to 1024 points. 
                    If pad=4, we pad the FFT to 2048 points.
                    The FFT length is never smaller than 256 points.
        window (tuple, optional): see scipy documentation. Defaults to None, in which 
            case ('tukey', 0.25) is used.
        detrend (str, optional): see scipy documentation. Defaults to 'constant'.
        complex_output (bool): if True, return the complex signal instead of magnitude.
                               Default False.

    Returns:
        tuple: Tuple containing:
            | **f (n_freq):** frequency axis for spectrogram
            | **t (n_time):** time axis for spectrogram
            | **spec (n_freq,n_time,nch):** short-time fourier spectrogram estimate. Trailing axes 
                of length 1 are removed.

    Raises:
        AssertionError: if the step is not smaller than the window

    Examples:
        
        .. code-block:: python

            from analyze/tests/analysis_tests import HelperFunctions
            win_t = 0.5
            step = 0.01
            f_max = 50
            tfr_fun = lambda data, fs: aopy.analysis.calc_ft_tfr(data, fs, win_t, step, f_max, pad=3, window=('tukey', 0.5))
            HelperFunctions.test_tfr_sines(tfr_fun)
        
        .. image:: _images/tfr_ft_sines.png
            
        .. code-block:: python

            f_max = 500
            tfr_fun = lambda data, fs: aopy.analysis.calc_ft_tfr(data, fs, win_t, step, f_max, pad=3, window=('tukey', 0.5))
            HelperFunctions.test_tfr_chirp(tfr_fun)
            
        .. image:: _images/tfr_ft_chirp.png
        
        .. code-block:: python

            f_max = 200
            tfr_fun = lambda data, fs: aopy.analysis.calc_ft_tfr(data, fs, win_t, step, f_max, pad=3, window=('tukey', 0.5))
            HelperFunctions.test_tfr_lfp(tfr_fun)
            
        .. image:: _images/tfr_ft_lfp.png
    '''
    if isinstance(data, list): 
        data = np.array(data)
    if data.ndim == 1:
        data = data[:, np.newaxis]

    win_size = int(samplerate * win_t)
    overlap_size = win_size - int(samplerate * step)
    assert overlap_size > 0, "Step size exceeds window size"

    nfft = np.max([256, pad * 2**utils.nextpow2(win_size + 1)]) # 0 padding for efficient computation in FFT
    if f_max is None:
        f_max = samplerate/2
    nfk = int(np.floor(f_max/samplerate*nfft)) # number of data points in frequency axis

    if window is None:
        window = ('tukey', 0.25)

    freqs, time, spec = scipy.signal.spectrogram(
        data, fs=samplerate, window=window, nperseg=win_size, noverlap=overlap_size, nfft=nfft, 
        detrend=detrend, scaling='spectrum', axis=0, mode='complex')
    
    # Swap the last two axes so that time precedes channels
    spec = spec.transpose(0,2,1)
    shape = spec.shape
    while shape and shape[-1] == 1:
        shape = shape[:-1] # remove trailing axes with length 1
    spec = spec.reshape(shape)

    # Only the first nfk frequency bins (up to f_max) are returned
    if complex_output:
        return freqs[:nfk], time, spec[:nfk]
    else:
        return freqs[:nfk], time, np.abs(spec[:nfk])


def calc_mt_tfr(ts_data, n, p, k, fs, step=None, fk=None, pad=2, ref=True, complex_output=False, dtype='float64', nonnegative_freqs=True):
    '''
    Compute multitaper time-frequency estimate from multichannel signal input. 
    This code is adapted from the Pesaran lab `tfspec`.    
    
    Args:
        ts_data (nt, [nch, ntr]): time series array. If nch=1, the second dimension can be omitted.
            If ntr=1, the third dimension can be omitted. Output spectrogram dimensions
            (n_freq, n_time, [nch, ntr]) will also be reduced accordingly.
        n (float): window length in seconds
        p (float): standardized half bandwidth in hz
        k (int): number of DPSS tapers to use
        fs (float): sampling rate
        step (float): window step. Defaults to step = n/10.
        fk (float): frequency range to return in Hz ([0, fk]). Defaults to fs/2.
        pad (int):  padding factor for the FFT. This should be 1 or a multiple of 2.
                    For N=500, if pad=1, we pad the FFT to 512 points.
                    If pad=2, we pad the FFT to 1024 points. 
                    If pad=4, we pad the FFT to 2048 points.
                    The FFT length is never smaller than 256 points.
        ref (bool): referencing flag. If True, mean of neural signals across electrodes 
                    for each time window is subtracted to remove common noise
                    so that you can get spacially-localized signals.
                    Referencing is automatically disabled for single channel data.
                    This paper discuss referencing scheme
                    https://iopscience.iop.org/article/10.1088/1741-2552/abce3c
        complex_output (bool): if True, return the complex signal (averaged across tapers) instead 
                               of the magnitude. Default False.
        dtype (str): dtype of the output. Default 'float64'. If complex_output is True and a 
                     non-complex dtype is given, it is promoted to the matching complex dtype so 
                     that the imaginary part is not discarded.
        nonnegative_freqs (bool): if True, only include non-negative frequencies in the output.
                                       Default True.
                       
    Returns:
        tuple: Tuple containing:
            | **f (n_freq):** frequency axis for spectrogram
            | **t (n_time):** time axis for spectrogram
            | **spec (n_freq,n_time,nch,ntr):** multitaper spectrogram estimate. Trailing axes of 
                length 1 are removed.
        
    Examples:
        
        .. code-block:: python

            from analyze/tests/analysis_tests import HelperFunctions
            NW = 0.3
            BW = 10
            step = 0.01
            fk = 50
            n, p, k = aopy.precondition.convert_taper_parameters(NW, BW)
            print(f"using {k} tapers length {n} half-bandwidth {p}")
            tfr_fun = lambda data, fs: aopy.analysis.calc_mt_tfr(data, n, p, k, fs, step=step, fk=fk, pad=2, ref=False)
            HelperFunctions.test_tfr_sines(tfr_fun)
                        
        .. image:: _images/tfspec.png
            
        .. code-block:: python
        
            fk = 500
            tfr_fun = lambda data, fs: aopy.analysis.calc_mt_tfr(data, n, p, k, fs, step=step, fk=fk, pad=2, ref=False)
            HelperFunctions.test_tfr_chirp(tfr_fun)
            
        .. image:: _images/tfr_mt_chirp.png
        
        .. code-block:: python

            fk = 200
            tfr_fun = lambda data, fs: aopy.analysis.calc_mt_tfr(data, n, p, k, fs, step=step, fk=fk, pad=2, ref=False, dtype='int16')
            HelperFunctions.test_tfr_lfp(tfr_fun)
            
        .. image:: _images/tfr_mt_lfp.png
        
    See Also:
        :func:`~aopy.analysis.calc_cwt_tfr`

    Note:
        The time axis returned by calc_mt_tfr corresponds to the center of the sliding window (`n` seconds). 
        To move the time axis so that the spectrogram bins are aligned to the right edge of each window, do 
        `time += n/2`.

        .. image:: _images/tfr_mt_alignment.png

    Modified September 2023 to return magnitude instead of magnitude squared power.
    '''  
    if isinstance(ts_data, list): 
        ts_data = np.array(ts_data)
    if ts_data.ndim == 1:
        ts_data = ts_data[:, np.newaxis]
    if ts_data.ndim == 2:
        ts_data = ts_data[:, :, np.newaxis]
    if ts_data.shape[1] == 1:
        ref = False # nothing to reference against with a single channel
    if step is None:
        step = n/10
    if fk is None:
        fk = fs/2

    # Writing complex values into a real-valued buffer would silently drop the imaginary part
    out_dtype = np.dtype(dtype)
    if complex_output and out_dtype.kind != 'c':
        out_dtype = np.result_type(out_dtype, np.complex64)
        
    ts_data = ts_data.transpose(1, 0, 2)  # (nch, nt, ntr)
    nch, nt, ntr = ts_data.shape
    fk = np.array([0, fk])
    tapers, _ = precondition.dpsschk(int(n * fs), p, k) # round down
    
    win_size = tapers.shape[0]  # window size (data points of tapers)
    step_size = int(step * fs) # step size
    nf = np.max([256, pad * 2 ** utils.nextpow2(win_size + 1)])  # 0 padding for efficient computation in FFT
    nwin = 1 + int(np.floor((nt - win_size) / step_size))  # number of windows
    nfk = np.floor(fk / fs * nf)  # number of data points in frequency axis
    if nonnegative_freqs:
        f = np.linspace(fk[0], fk[1], int(nfk[1] - nfk[0]))  # frequency axis for spectrogram
    else:
        # Work in fftshift-ed order (negative to positive) and keep a band centered on 0 Hz
        f = np.fft.fftfreq(nf, d=1/fs)
        f = np.fft.fftshift(f)
        nfk = [int(nf/2)-int(nfk[1]), int(nf/2)+int(nfk[1])]
        f = f[nfk[0]:nfk[1]]

    idx_lo, idx_hi = int(nfk[0]), int(nfk[1])
    tapers_ik = tapers[:, :, np.newaxis, np.newaxis]  # Shape: (win_size, k, 1, 1); same for every window

    spec = np.zeros((idx_hi - idx_lo, nwin, nch, ntr), dtype=out_dtype)
    for iwin in range(nwin):
        start = step_size * iwin
        win_data = ts_data[:, start:start + win_size, :]
        if ref:
            m_data = np.sum(win_data, axis=0) / nch  # Mean across channels for that window
            win_data = win_data - m_data  # Subtract mean from data
        win_data = win_data.transpose(1, 0, 2)  # (win_size, nch, ntr)
        
        # Compute the spectrum for each taper
        win_data_reshaped = win_data[:, np.newaxis, :, :]  # Shape: (win_size, 1, nch, ntr)
        fk_data = np.fft.fft(tapers_ik * win_data_reshaped, nf, axis=0)  # Shape: (nf, k, nch, ntr)
        if not nonnegative_freqs:
            fk_data = np.fft.fftshift(fk_data, axes=0)

        # Average across tapers
        if complex_output:
            spec[:, iwin, :, :] = np.mean(fk_data[idx_lo:idx_hi, :, :, :], axis=1)
        else:
            spec[:, iwin, :, :] = np.mean(np.abs(fk_data[idx_lo:idx_hi, :, :, :]), axis=1)

    if not nonnegative_freqs:
        # Return to the standard FFT ordering (0 Hz first)
        f = np.fft.ifftshift(f)
        spec = np.fft.ifftshift(spec, axes=0)

    t = np.arange(nwin) * step + n / 2  # Center of each window is time axis

    shape = spec.shape
    while shape and shape[-1] == 1:
        shape = shape[:-1] # remove trailing axes with length 1
    spec = spec.reshape(shape)

    return f, t, spec

def calc_tsa_mt_tfr(data, fs, win_t, step_t, bw=None, f_max=None, pad=2, jackknife=False, adaptive=False, sides='onesided'):
    """
    Compute multitaper time-frequency power estimate from multichannel signal input. 
    This code uses nitime time-series analysis below. In comparison to :func:`~aopy.analysis.calc_mt_tfr` this
    function is very slow.

    Args:
        data (nt, nch): nd array of input neural data (multichannel). 1D input is treated as a 
            single channel.
        fs (int): sampling rate
        win_t (float): spectrogram window length (in seconds)
        step_t (float): step size between spectrogram windows (in seconds)
        bw (float, optional): spectrogram frequency bin bandwidth. Defaults to None.
        f_max (float): frequency range to return in Hz ([0, f_max]). Defaults to fs/2.
        pad (int):  padding factor for the FFT. This should be 1 or a multiple of 2.
                    For N=500, if pad=1, we pad the FFT to 512 points.
                    If pad=2, we pad the FFT to 1024 points. 
                    If pad=4, we pad the FFT to 2048 points.
                    The FFT length is never smaller than 256 points.
        jackknife (bool, optional): forwarded to :func:`~aopy.analysis.calc_mt_psd`. Defaults to False.
        adaptive (bool, optional): adaptive taper weighting. Defaults to False.
        sides (str, optional): forwarded to :func:`~aopy.analysis.calc_mt_psd`. The output buffer is 
            sized for a one-sided spectrum (nfft // 2 + 1 frequencies). Defaults to 'onesided'.
        
    Returns:
        tuple: Tuple containing:
            | **freqs (nfreq,):** spectrogram frequency array, truncated at f_max
            | **time (nt,):** spectrogram time array holding the start time of each window 
                (length int((len(data)/fs - win_t)/step_t))
            | **spec (nfreq, nt, nch):** multitaper spectrogram estimate. Last dimension squeezed for 1-d inputs.

    Raises:
        AssertionError: if data has more than 2 dimensions or is too short to fit a single window

    Examples:
        
        .. code-block:: python

            from analyze/tests/analysis_tests import HelperFunctions
            win_t = 0.3
            step_t = 0.01
            bw = 20
            fk = 50
            tfr_fun = lambda data, fs: aopy.analysis.calc_tsa_mt_tfr(data, fs, win_t, step_t, bw=bw, f_max=fk)
            HelperFunctions.test_tfr_sines(tfr_fun)
                        
        .. image:: _images/tfr_mt_tsa_sines.png
            
        .. code-block:: python

            fk = 500
            tfr_fun = lambda data, fs: aopy.analysis.calc_tsa_mt_tfr(data, fs, win_t, step_t, bw=bw, f_max=fk)
            HelperFunctions.test_tfr_chirp(tfr_fun)
            
        .. image:: _images/tfr_mt_tsa_chirp.png
        
        .. code-block:: python
            
            fk = 200
            tfr_fun = lambda data, fs: aopy.analysis.calc_tsa_mt_tfr(data, fs, win_t, step_t, bw=bw, f_max=fk)
            HelperFunctions.test_tfr_lfp(tfr_fun)
            
        .. image:: _images/tfr_mt_tsa_lfp.png
    """
    if len(data.shape) < 2:
        data = data[:,None]
    assert len(data.shape) < 3, f"only 1- or 2-dim data arrays accepted - {data.shape}-dim input given"
    (n_sample, n_ch) = data.shape
    total_t = n_sample/fs
    n_window = int((total_t-win_t)/step_t)
    assert n_window > 0
    window_len = int(win_t*fs)
    step_len = int(step_t*fs)
    if f_max is None:
        f_max = fs/2
    nfft = np.max([256, pad * 2**utils.nextpow2(window_len+1)]) # 0 padding for efficient computation in FFT
    nfreqs = nfft // 2 + 1
    nfk = int(np.floor(f_max/fs*nfft)) # number of data points in frequency axis

    time = np.arange(n_window)*step_t # window start time
    spec = np.zeros((nfreqs,n_window,n_ch))

    data = interp_nans(data)

    # One PSD estimate per sliding window
    for idx_window in range(n_window):
        window_sample_range = np.arange(window_len) + step_len*idx_window
        win_data = data[window_sample_range,:]
        freqs, _win_psd, _ = calc_mt_psd(win_data, fs, bw, nfft, adaptive, jackknife, sides)
        spec[:,idx_window,...] = _win_psd

    shape = spec.shape
    while shape and shape[-1] == 1:
        shape = shape[:-1] # remove trailing axes with length 1
    spec = spec.reshape(shape)

    return freqs[:nfk], time, spec[:nfk]

def calc_mt_psd(data, fs, bw=None, nfft=None, adaptive=False, jackknife=True, sides='default'):
    '''
    Computes power spectral density using Multitaper functions from nitime. 

    Args:
        data (nt, nch): time series data with time on the first axis (it is transposed internally 
            because nitime expects time on the last axis)
        fs (float): sampling rate of the signal
        bw (float): sampling bandwidth of the data tapers in Hz
        nfft (int): FFT length passed to nitime as NFFT. Defaults to None.
        adaptive (bool): Use an adaptive weighting routine to combine the PSD estimates of different tapers.
        jackknife (bool): Use the jackknife method to make an estimate of the PSD variance at each point.
        sides (str): This determines which sides of the spectrum to return.

    Returns:
        tuple: Tuple containing:
            | **f (nfft):** Frequency points vector
            | **psd_est (nfft, nch):** estimated power spectral density (PSD)
            | **nu (nfft, nch):** if jackknife = True; estimated variance of the log-psd. 
                If Jackknife = False; degrees of freedom in a chi square model of how the estimated 
                psd is distributed wrt true log - PSD
    '''
    data = data.T # move time to the last axis
    # Keyword arguments are used on purpose: in nitime's signature `low_bias` sits between 
    # `jackknife` and `sides`, so passing `sides` positionally would land in the wrong parameter.
    f, psd_mt, nu = tsa.multi_taper_psd(data, Fs=fs, NW=None, BW=bw, adaptive=adaptive, 
                                        jackknife=jackknife, sides=sides, NFFT=nfft)
    return f, psd_mt.T, nu.T

def calc_welch_psd(data, fs, n_freq=None):
    '''
    Spectral estimate using Welch's method. Welch's method divides the data into overlapping 
    segments, computes a modified periodogram for each segment and then averages the periodograms. 
    Here the periodograms are averaged using the median, the 'spectrum' scaling is used, and the 
    square root of the result is returned.

    Args:
        data (nt, ...): time series data.
        fs (float): sampling rate
        n_freq (int): no. of frequency points expected. If given, segments of length 2*n_freq 
            are used; otherwise the scipy default segment length is used.

    Returns:
        tuple: Tuple containing:
            | **f (nfft):** frequency points vector
            | **psd_est (nfft, ...):** square root of the estimated power spectrum
    '''
    # nperseg=None lets scipy fall back to its default segment length
    segment_len = 2*n_freq if n_freq else None
    f, power = signal.welch(data, fs, average='median', scaling='spectrum', nperseg=segment_len, axis=0)
    return f, np.sqrt(power)

def get_tfr_feats(freqs, spec, bands, log=False, epsilon=1e-9):
    '''
    Average a spectrogram within each requested frequency band, preserving the other dimensions.

    Args:
        freqs (nfreq,): Frequency points vector
        spec (nfreq, nt, nch): spectrogram of data. A 1D input is treated as (nfreq,) and a 2D 
            input as (nfreq, nch).
        bands (list of tuples): frequency bands of interest in Hz, e.g. [(0, 10), (10, 20), (130, 140)]. 
            Each band includes its lower edge and excludes its upper edge.
        log (bool, optional): if True, average log10(spec + epsilon) instead of spec
        epsilon (float, optional): small number added before taking the log to avoid log of zero. 
            Default 1e-9.
        
    Returns:
        lfp_power (n_features, nt, nch): band power features at each timepoint for each channel, 
        with axes of length 1 squeezed out
    '''
    # Bring the input to (nfreq, nt, nch)
    if spec.ndim == 1:
        spec = np.expand_dims(spec, [1, 2])
    if spec.ndim == 2:
        spec = spec[:, np.newaxis, :] # insert time axis

    freq_axis = np.asarray(freqs)
    feats = np.zeros((len(bands), spec.shape[1], spec.shape[2]), like=spec)
    for idx, band in enumerate(bands):
        f_lo, f_hi = band[0], band[1]
        in_band = np.flatnonzero((freq_axis >= f_lo) & (freq_axis < f_hi))

        band_spec = spec[in_band]
        if log:
            band_spec = np.log10(band_spec + epsilon)
        feats[idx] = np.mean(band_spec, axis=0)

    return np.squeeze(feats)

def calc_tfr_mean(freqs, time, spec, band=(0, 1e16), window=(-1e16, 1e16)):
    """
    Average a spectrogram over a frequency band and a time window, ignoring NaNs.
    
    Args:
        freqs (nfreq,): Frequency values in Hz.
        time (nt,): Time values in seconds.
        spec (nfreq, nt, nch): Time-frequency spectrogram data.
        band (tuple): Frequency band (low, high) in Hz; low is included, high is excluded. 
            Defaults to (0, 1e16), i.e. effectively all non-negative frequencies.
        window (tuple, optional): Time window (start, end) in seconds; start is included, end is 
            excluded. Defaults to (-1e16, 1e16), i.e. effectively all times.

    Returns:
        (nch,): Mean spectral value within the specified band and time window for each channel.
    """
    band_lo, band_hi = band[0], band[1]
    win_start, win_end = window[0], window[1]

    in_band = (freqs >= band_lo) & (freqs < band_hi)
    in_window = (time >= win_start) & (time < win_end)

    # Select the band along the frequency axis, then the window along the time axis
    selected = spec[in_band][:, in_window]
    
    return np.nanmean(selected, axis=(0, 1))

def calc_tfr_mean_fdrc_ranktest(freqs, time, spec, null_specs, band=(0,1e16), window=(-1e16, 1e16),
                                alternative='greater', nan_policy='raise', alpha=0.05):
    """
    Compute band-specific Wilcoxon sign-rank test with false discovery-rate correction. Used for comparing 
    coherence maps against null distributions. Spectrograms must be multi-channel.

    The observed spectrogram and each null spectrogram are first reduced to a per-channel mean with 
    :func:`~aopy.analysis.calc_tfr_mean`; the comparison itself is delegated to ``calc_fdrc_ranktest``.
    
    Args:
        freqs (nfreq,): Frequency axis in Hz.
        time (nt,): Time axis in seconds.
        spec (nfreq, nt, nch): Observed spectrogram.
        null_specs (n_null, nfreq, nt, nch): Distribution of null spectrograms.
        band (tuple, optional): Frequency band (low, high) in Hz. Defaults to (0, 1e16).
        window (tuple, optional): Time window (start, end) in seconds. Defaults to (-1e16, 1e16).
        alternative (str, optional): Hypothesis test alternative, forwarded to ``calc_fdrc_ranktest``. 
            Defaults to 'greater'.
        nan_policy (str, optional): Handling of NaN values, forwarded to ``calc_fdrc_ranktest``. 
            Defaults to 'raise'.
        alpha (float, optional): Significance level. Defaults to 0.05.
    
    Returns:
        tuple: tuple containing:
            - diff (nch,): Effect size at each channel.
            - p_fdrc (nch,): Adjusted p-values at each channel.
    """  
    observed_mean = calc_tfr_mean(freqs, time, spec, band, window)

    # One row of per-channel means for every null spectrogram
    null_means = np.array([
        calc_tfr_mean(freqs, time, null_spec, band, window) for null_spec in null_specs
    ])
    
    effect, p_adjusted = calc_fdrc_ranktest(
        observed_mean, null_means, alternative=alternative, nan_policy=nan_policy, alpha=alpha)
    return effect, p_adjusted

def get_bandpower_feats(data, samplerate, bands, method='mt', log=False, epsilon=0, **kwargs):
    '''
    Wrapper around get_tfr_feats and calc_mt_tfr. Computes a time-frequency representation 
    of the data and reduces it to band power features.

    Args:
        data (nt, ...): time series data.
        samplerate (float): sampling rate of the data.
        bands (list of tuples): frequency bands of interest in Hz, e.g. [(0, 10), (10, 20), (130, 140)]
        method (str): time-frequency method to use. Only 'mt' (multitaper) is implemented. Default 'mt'.
        log (bool): boolean to select whether band power should be in log scale or not
        epsilon (float): small number, e.g. 1e-10 to add to power before averaging in case there are 
            zero values. Default 0.
        kwargs (dict, optional): keyword arguments for the calc_tfr function of choice (see Note).

    Raises:
        ValueError: if the requested method is not valid
        KeyError: if method is 'mt' and any of the required keyword arguments `n`, `p`, `k` is missing

    Returns:
        tuple: tuple containing:
            | **time (nstep):** the resulting time axis for the features
            | **feats (nfeatures, nstep, nch):** band power features

    Note:
        For method 'mt', you must pass the following keyword arguments:
            | **n (float):** window length in seconds
            | **p (float):** standardized half bandwidth in hz
            | **k (int):** number of DPSS tapers to use
        Optionally you may also pass:
            | **step (float):** window step. Defaults to step = n/10.
            | **fk (float):** frequency range to return in Hz ([0, fk]). Defaults to samplerate/2.
            | **pad (int):** padding factor for the FFT. This should be 1 or a multiple of 2. Default 2.
            | **ref (bool):** referencing flag. If True, mean of neural signals across electrodes 
                is subtracted (see calc_mt_tfr). Default True.
            | **dtype (str):** dtype of the output. Default 'float64'
    '''
    if method != 'mt':
        raise ValueError(f"Method {method} not implemented.")

    # Required multitaper parameters (a KeyError is raised if any is missing)
    n = kwargs.pop('n')
    p = kwargs.pop('p')
    k = kwargs.pop('k')

    # Optional parameters. `step` and `fk` previously raised KeyError when omitted even 
    # though they are documented as optional, so the documented defaults are applied here.
    step = kwargs.pop('step', n/10)
    fk = kwargs.pop('fk', samplerate/2)
    pad = kwargs.pop('pad', 2)
    ref = kwargs.pop('ref', True)
    dtype = kwargs.pop('dtype', 'float64')

    freqs, time, spec = calc_mt_tfr(data, n, p, k, samplerate, 
                                    step=step, fk=fk, pad=pad, ref=ref, dtype=dtype)

    return time, get_tfr_feats(freqs, spec, bands, log=log, epsilon=epsilon)

def interp_nans(x):
    """
    Interpolate NaN values from multichannel data using linear interpolation. Each channel 
    is interpolated independently along the sample (first) axis, so missing samples are 
    filled from the neighboring valid samples of the same channel. NaNs before the first or 
    after the last valid sample of a channel take the value of the nearest valid sample 
    (the behavior of `numpy.interp` outside its sample range).

    Note:
        The input array is modified in place and also returned. Pass a copy if the original 
        data must be preserved. Channels that contain no valid samples are left as NaN.

    Args:
        x (n_sample, n_ch): input data array containing nan-valued missing entries. 
            1D (n_sample,) input is also accepted.

    Returns:
        x_interp (n_sample, n_ch): interpolated data, uses `numpy.interp` method.
    """
    nan_mask = np.isnan(x)
    if not nan_mask.any():
        return x

    sample_idx = np.arange(x.shape[0])

    # Iterate over every trailing index (i.e. every channel). For 1D input this 
    # yields a single empty index, so the whole vector is treated as one channel.
    for ch in np.ndindex(x.shape[1:]):
        column = (slice(None),) + ch
        missing = nan_mask[column]
        if not missing.any():
            continue
        valid = ~missing
        if not valid.any():
            continue # nothing to interpolate from, leave this channel as NaN

        channel_data = x[column] # basic indexing returns a view, so writes land in x
        channel_data[missing] = np.interp(sample_idx[missing], sample_idx[valid], channel_data[valid])

    return x

def calc_mt_tfcoh(data, ch, n, p, k, fs, step, fk=None, pad=2, ref=False, imaginary=False, 
                  return_angle=False, dtype='float64', workers=None):
    '''
    Computes moving window time-frequency coherence averaged across trials between selected channels.
    This is loosely based on pesaran lab code, modified to be more compatible with :func:`~aopy.analysis.calc_mt_tfr`.
    The coherence computations are from https://doi.org/10.7551/mitpress/9609.001.0001
    
    Given analytical signals Xk1 and Xk2, coherence is computed as:
    
    .. code-block:: python
    
        # Compute power and cross-spectral power
        S1 = np.sum(Xk1*Xk1.conj(), axis=1) # sum across tapers and trials
        S2 = np.sum(Xk2*Xk2.conj(), axis=1) # sum across tapers and trials 
        S12 = np.sum(Xk1*Xk2.conj(), axis=1) # sum across tapers and trials
    
        # Coherence
        coh = np.abs(S12/np.sqrt(S1*S2))**2

        # Imaginary coherence
        coh = np.abs(np.imag(S12/np.sqrt(S1*S2)))

    Args:
        data ((nt,nch,ntr) array): evoked potential across all channels and trials. 1D (nt,) and 
            2D (nt,nch) inputs are expanded with singleton channel/trial axes.
        ch ((2,) tuple): the two channel indices between which coherence will be computed
        n (float): window length in seconds
        p (float): standardized half bandwidth in hz
        k (int): number of DPSS tapers to use
        fs (float): sampling rate in Hz.
        step (float): window step size in seconds.
        fk (float, optional): frequency range to return in Hz ([0, fk]). Default is fs/2.
        pad (int, optional): padding factor for the FFT. This should be 1 or a multiple of 2.
            For nt=500, if pad=1, we pad the FFT to 512 points.
            If pad=2, we pad the FFT to 1024 points. 
            If pad=4, we pad the FFT to 2048 points.
            Default is 2.
        ref (bool, optional): referencing flag. If True, mean of neural signals across electrodes 
            for each time window is subtracted to remove common noise so that you can get 
            spatially-localized signals. If you only analyze single channel data, this has 
            to be False (it is forced to False when the data has a single channel). This paper 
            discusses referencing schemes
            https://iopscience.iop.org/article/10.1088/1741-2552/abce3c
            Default is False.
        imaginary (bool, optional): if True, compute imaginary coherence.
        return_angle (bool, optional): if True, also return the phase difference between 
            the two channels. For example if ch = [ch1, ch0], angles correspond to phase differences 
            from ch1 to ch0 (i.e. angle ≈ phase(ch1) - phase(ch0)). Default is False.
        dtype (str, optional): dtype of the output. Default 'float64'
        workers (int, optional): Number of workers argument to pass to scipy.fft.fft. 
            Default None. 
                       
    Returns:
        tuple: tuple containing:
            | **f (n_freq):** frequency axis
            | **t (n_time):** time axis
            | **coh (n_freq,n_time):** magnitude squared coherence or imaginary coherence (0 <= coh <= 1)
            | **angle (n_freq,n_time):** phase difference between the two channels in radians 
                (optional output, -pi <= angle <= pi)

    Raises:
        AssertionError: if the data is too short to fit a single window of length `n`

    See also: 
        :func:`~aopy.analysis.calc_mt_tfr`

    Examples:

        .. code-block:: python

            fs = 1000
            N = 1e5
            T = N/fs
            amp = 20
            noise_power = 0.001 * fs / 2
            time = np.arange(N) / fs

        Generate two test signals with common low-frequency signals, except at a given freq (100 Hz)

        .. code-block:: python

            rng = np.random.default_rng(seed=0)
            signal1 = rng.normal(scale=np.sqrt(noise_power), size=time.shape)

            b, a = scipy.signal.butter(2, 0.25, 'low')
            signal2 = scipy.signal.lfilter(b, a, signal1)
            signal2 += rng.normal(scale=0.1*np.sqrt(noise_power), size=time.shape)

            # Add a 100 hz sine wave only to signal 1
            freq = 100.0
            signal1[time > T/2] += amp*np.sin(2*np.pi*freq*time[time > T/2])

            # Add a 400 hz sine wave to both signals
            freq = 400.0
            signal1[time < T/2] += amp*np.sin(2*np.pi*freq*time[time < T/2])
            signal2[time < T/2] += amp*np.sin(2*np.pi*freq*time[time < T/2])
                    
            # Add a 200 hz sine wave to both signals but with phase modulated by a 0.05 hz sine wave
            freq = 200.0
            freq2 = 0.05
            signal1 += amp*np.sin(2*np.pi*freq*time)
            signal2 += amp*np.sin(2*np.pi*freq*time + np.pi*np.sin(2*np.pi*freq2*time))

        Calculate coherence, imaginary coherence, and compare to `scipy.signal.coherence()`

        .. code-block:: python

            n = 1
            w = 2
            n, p, k = aopy.precondition.convert_taper_parameters(n, w)
            fk = fs / 2  # Maximum frequency of interest
            step = n # no overlap
            signal_combined = np.stack((signal1, signal2), axis=1)

            # Calculate spectrograms for each signal
            f, t, spec1 = aopy.analysis.calc_mt_tfr(signal1, n, p, k, fs, step, fk=fk,
                                                                ref=False)
            f, t, spec2 = aopy.analysis.calc_mt_tfr(signal2, n, p, k, fs, step, fk=fk,
                                                                ref=False)

            # And coherence
            f, t, coh = aopy.analysis.calc_mt_tfcoh(signal_combined, [0,1], n, p, k, fs, step, fk=fk,
                                                                ref=False)
            f, t, coh_im, angle = aopy.analysis.calc_mt_tfcoh(signal_combined, [0,1], n, p, k, fs, step, fk=fk,
                                                                ref=False, imaginary=True, return_angle=True)
            f_scipy, coh_scipy = scipy.signal.coherence(signal1, signal2, fs=fs, nperseg=2048, noverlap=0, axis=0)

        Plot coherence

        .. code-block:: python

            # Plot the coherence over time
            plt.figure(figsize=(10, 15))
            plt.subplot(5, 1, 1)
            im = aopy.visualization.plot_tfr(spec1[:,:,0], t, f)
            plt.colorbar(im, orientation='horizontal', location='top', label='Signal 1')
            im.set_clim(0,3)

            plt.subplot(5, 1, 2)
            im = aopy.visualization.plot_tfr(spec2[:,:,0], t, f)
            plt.colorbar(im, orientation='horizontal', location='top', label='Signal 2')
            im.set_clim(0,3)

            plt.subplot(5, 1, 3)
            im = aopy.visualization.plot_tfr(coh, t, f)
            plt.colorbar(im, orientation='horizontal', location='top', label='Coherence')
            im.set_clim(0,1)

            # Plot the average coherence across windows
            plt.subplot(5, 1, 4)
            plt.plot(f, np.mean(coh, axis=1))
            plt.plot(f, np.mean(coh_im, axis=1))
            plt.plot(f_scipy, coh_scipy)
            plt.title('Average coherence across time')
            plt.xlabel('Frequency (Hz)')
            plt.ylabel('Coherency')
            plt.legend(['coh', 'imag coh', 'scipy'])

            # Also plot the phase difference
            plt.subplot(5, 1, 5)
            im = aopy.visualization.plot_tfr(angle, t, f, cmap='bwr')
            plt.colorbar(im, orientation='horizontal', location='top', label='Phase difference (rad)')
            im.set_clim(-np.pi,np.pi)

        .. image:: _images/coherency.png
    '''
    # Expand to (nt, nch, ntr)
    if data.ndim == 1:
        data = data[:,np.newaxis,np.newaxis]
    elif data.ndim == 2:
        data = data[:,:,np.newaxis]
    if data.shape[1] == 1:
        ref = False # subtracting the across-channel mean of a single channel would zero the data
    if fk is None:
        fk = fs/2

    nt,_,ntr = data.shape
    fk = np.array([0,fk])    
    win_size = int(n*fs) # window length in samples
    dn = int(np.floor(step*fs)) # window step in samples
    nf = np.max([256,pad*2**utils.nextpow2(win_size+1)]) # FFT length
    nfk = np.floor(fk/fs*nf) # FFT bin limits of the requested frequency range
    lo_bin, hi_bin = int(nfk[0]), int(nfk[1])
    n_freq = hi_bin - lo_bin
    nwin = 1 + int(np.floor((nt-win_size)/dn))
    f = np.linspace(fk[0],fk[1],n_freq)

    assert nwin > 0, "Not enough data for the given `n` and `step`"
   
    tapers, _ = precondition.dpsschk(win_size, p, k)
    tapers_3d = tapers[:,:,np.newaxis] # (N, k, 1) so tapers broadcast across trials

    # For now we only allow two channel. In the future we could expand to multiple pairs of channels
    ch1 = ch[0]
    ch2 = ch[1]

    def _tapered_spectrum(segment, ch_idx):
        # Taper one channel of a (N, nch, ntr) segment and return its spectrum
        # restricted to the requested bins, shape (n_freq, k*ntr)
        tapered = np.reshape(tapers_3d*segment[:,[ch_idx],:], (win_size, k*ntr)) # trials and tapers together
        spectrum = scipy.fft.fft(tapered.T, nf, axis=-1, overwrite_x=True, workers=workers).T # looping over the last axis is faster
        return spectrum[lo_bin:hi_bin] # filter desired frequency range
        
    coh = np.zeros((nwin,n_freq), dtype=dtype)
    angle = np.zeros((nwin,n_freq), dtype=dtype)
    for win in range(nwin):
        segment = data[dn*win:dn*win+win_size] # shape (N, nch, ntr)
        if ref:
            # Subtract the mean across channels for that window
            segment = segment - np.mean(segment, axis=1, keepdims=True)

        # Power for each channel, summed across tapers and trials
        Xk1 = _tapered_spectrum(segment, ch1)
        Xk2 = _tapered_spectrum(segment, ch2)
        S1 = np.sum(Xk1*Xk1.conj(), axis=1) # note: Xk*Xk.conj() is equivalent to abs(Xk)**2
        S2 = np.sum(Xk2*Xk2.conj(), axis=1)

        # Cross spectral power
        S12 = np.sum(Xk1*Xk2.conj(), axis=1)
    
        # Coherence
        if imaginary:
            coh[win,:] = np.abs(np.imag(S12/np.sqrt(S1*S2)))
        else:
            coh[win,:] = np.abs(S12/np.sqrt(S1*S2))**2
            
        # Phase difference angle
        angle[win,:] = np.angle(S12)

    coh = coh.T
    angle = angle.T
    t = np.arange(nwin)*step + n/2 # Center of each window is time axis
    
    if return_angle:
        return f, t, coh, angle
    else:
        return f, t, coh
    
def calc_itpc(analytical_signals):
    '''
    Computes inter-trial phase clustering (ITPC) from analytical signals of evoked potentials.
    Each complex sample is first reduced to a unit-length phasor (its amplitude is divided out), 
    the phasors are averaged across trials at each timepoint, and the length of that average 
    vector is returned. This captures the similarity of phases across trials. ITPC ranges from 
    0 to 1, where 0 indicates uniformly random phases and 1 indicates perfect phase alignment.

    From Cohen, M. X. (2014). Analyzing neural time series data: theory and practice. MIT press.

    .. math:: 

        ITPC = \\frac{1}{N} |\\sum_{k=1}^{N} e^{i\\theta_k}|

    Args:
        analytical_signals (nt, nch, ntr): analytical signal of the evoked potential (np.complex128)

    Returns:
        (nt, nch): itpc values for each channel (ranges from 0 to 1)

    Examples:

        Generate two channels of data with different phase distributions across trials

        .. code-block:: python

            fs = 1000
            nt = fs * 2
            ntr = 100
            t = np.arange(nt)/fs
            data = np.zeros((t.shape[0],2,ntr)) # 2 channels

            # 10 Hz sine with gaussian phase distribution across trials
            for tr in range(ntr):
                data[:,0,tr] = np.sin(2*np.pi*10*t + np.random.normal(np.pi/4, np.pi/8)) 

            # 10 Hz sine with uniform random phase distribution across trials
            for tr in range(ntr):
                data[:,1,tr] = np.sin(2*np.pi*10*t + np.random.uniform(-np.pi, np.pi)) 

        Calculate an analytical signal using hilbert transform, then apply ITPC
        
        .. code-block:: python
        
            im_data = signal.hilbert(data, axis=0)
            itpc = aopy.analysis.calc_itpc(im_data)

            plt.figure()

            # Plot the data
            plt.subplot(3,1,1)
            aopy.visualization.plot_timeseries(np.mean(data, axis=2), fs)
            plt.legend(['Channel 1', 'Channel 2'])
            plt.ylabel('amplitude (a.u.)')
            plt.title('Trial averaged data')

            # Plot the angles at the first timepoint
            angles = np.angle(im_data[0])
            plt.subplot(3,2,3, projection= 'polar')
            aopy.visualization.plot_angles(angles[0,:], color='tab:blue', alpha=0.5, linewidth=0.75)
            plt.subplot(3,2,4, projection= 'polar')
            aopy.visualization.plot_angles(angles[1,:], color='tab:orange', alpha=0.5, linewidth=0.75)

            # Plot ITPC
            plt.subplot(3,1,3)
            aopy.visualization.plot_timeseries(itpc, fs)
            plt.ylabel('ITPC')
            plt.title('ITPC')

        .. image:: _images/itpc.png
    '''
    # Keep only the phase of each sample by dividing out its amplitude
    amplitudes = np.abs(analytical_signals)
    unit_phasors = analytical_signals/amplitudes

    # Vector average across trials (last axis), then take its length
    mean_phasor = np.mean(unit_phasors, axis=2)
    return np.abs(mean_phasor)


'''
Statistics
'''
def align_spatial_maps(data1, data2):
    '''
    Align two input maps by finding the location of the peak of the 2D correlation function.
    Note, if these shifts are unexpectedly high, there is likely not high enough correlation between the maps
    and the alignment should not be used. NaN values are treated as 0 when computing the correlation and 
    0-padding is used for all edge conditions. The input arrays themselves are not modified; the returned 
    aligned map has its NaN values replaced with 0 and is shifted circularly (using `numpy.roll`).

    Args:
        data1 (nrow, ncol): First input data array, used as baseline map.
        data2 (nrow, ncol): Second input data array, will be shifted to match the baseline map.

    Returns:
        tuple: tuple containing:
            | **data2_align (nrow, ncol):** aligned version of data2
            | **shifts (tuple):** contains (row_shifts, col_shifts)
    '''
    # Work on copies so the caller's arrays keep their NaN values
    baseline = np.array(data1)
    moving = np.array(data2)

    # Replace NaNs with 0s so correlation doesn't output NaN
    baseline[np.isnan(baseline)] = 0
    moving[np.isnan(moving)] = 0
    
    # Correlate the magnitude-normalized maps
    corr = scipy.signal.correlate2d(baseline/np.linalg.norm(baseline), moving/np.linalg.norm(moving), 
                                    boundary='fill', mode='same')

    # The offset of the correlation peak from the center of the map is the shift to apply
    irow, icol = np.unravel_index(np.argmax(corr), corr.shape)
    row_shift = int(irow - (baseline.shape[0]-1)/2)
    col_shift = int(icol - (baseline.shape[1]-1)/2)

    data2_align = np.roll(moving, row_shift, axis=0)
    data2_align = np.roll(data2_align, col_shift, axis=1)
    shifts = (row_shift, col_shift)
    return data2_align, shifts

def calc_corr2_map(data1, data2, knlsz=15, align_maps=False):
    '''
    This function creates a map showing the local correlation between two input datamaps. If specified, it also aligns the input
    maps by finding the location of the peak of the 2D correlation function. Note, if these shifts are unexpectedly high, there
    is likely not high enough correlation between the datamaps and alignment should not be used. This function uses 0-padding for all
    edge conditions and treats input NaN values as 0 to calculate the correlation map. After the correlation map is calculated,
    all locations that were NaN in data1 are again set to NaN. If a window of data has all 0's, the NCC is set to nan. 
    Note, the worst correlation in the example image is not at the edge of the image because of zero padding.

    The value at each location is the zero-lag normalized correlation of the two (knlsz, knlsz) windows centered 
    on that location, i.e. ``sum(w1*w2) / (norm(w1)*norm(w2))``. The input arrays are not modified.

    .. image:: _images/calc_corr2_map.png

    Args:
        data1 (nrow, ncol): First input data array. Used as baseline if map alignment is required.
        data2 (nrow, ncol): Second input data array. Shifted to match the baseline if map alignment is required
        knlsz (int): Length of the kernel window in units of data points. The kernel is a square so each side will have 
            the length specified here. This value should always be odd. An even value triggers a warning and 
            is effectively treated as knlsz-1.
        align_maps (bool): Whether or not to align maps.

    Returns:
        tuple: Tuple containing:
            | **NCC (nrow, ncol):** Spatial correlation map (NCC: normalized correlation coefficient)
            | **shifts (tuple):** Contains (row_shifts, col_shifts)
    '''
    # Make sure knlsz is odd
    if knlsz % 2 == 0:
        warnings.warn('Kernel size (knlsz) is even in calc_corr2_map')

    # Remember where the baseline map is NaN so those locations can be restored at the end
    nan_idx1 = np.isnan(data1)

    # Work on float copies with NaNs replaced by 0s, so the correlation doesn't output NaN
    # and the caller's arrays are left untouched
    map1 = np.array(data1, dtype=float)
    map2 = np.array(data2, dtype=float)
    map1[nan_idx1] = 0
    map2[np.isnan(map2)] = 0
    
    # Shift the second map onto the first if requested
    if align_maps:
        map2, shifts = align_spatial_maps(map1, map2)
    else:
        shifts = (0,0)
    
    # Zero-pad so that a full window exists around every map location
    half = int((knlsz-1)/2)
    win = 2*half + 1
    pad1 = np.pad(map1, half, mode='constant')
    pad2 = np.pad(map2, half, mode='constant')

    nrow, ncol = map1.shape
    NCC = np.full((nrow, ncol), np.nan)
    for irow in range(nrow):
        for icol in range(ncol):
            # Windows are read-only views of the padded maps; they must not be normalized 
            # in place because neighboring windows overlap them
            window1 = pad1[irow:irow+win, icol:icol+win]
            window2 = pad2[irow:irow+win, icol:icol+win]
            norm1 = np.linalg.norm(window1)
            norm2 = np.linalg.norm(window2)

            # If either window is all 0's the NCC is undefined and stays NaN
            if norm1 == 0 or norm2 == 0:
                continue
            NCC[irow, icol] = np.sum(window1*window2)/(norm1*norm2)
    
    # Replace NaNs in correlation map
    NCC[nan_idx1] = np.nan
    return NCC, shifts

def calc_spatial_map_correlation(data_maps, align_maps=False):
    '''
    Generate a correlation matrix between all pairs of input data maps. If specified, it also 
    aligns the input maps. Alignment is done using :func:`~aopy.analysis.align_spatial_maps` which 
    finds the location of the peak of the 2D correlation function. Here, we calculate the 1D
    correlation between flattened versions of the input data maps. This function removes datapoints
    along the second axis if any map contains NaN values at that location (a warning reports how 
    many were removed). Data maps are normalized by their magnitude prior to computing correlation.
    The input maps are copied before use.

    Note: 
        If shifts are unexpectedly high, there is likely not high enough correlation between the 
        datamaps and alignment should not be used.

    Args:
        data_maps ((nmaps,) list): list of (ncol, nrow) spatial data arrays
        align_maps (bool): Whether or not to align maps. Always aligns to the first map. Default False.

    Returns:
        tuple: tuple containing:
            | **NCC (nmaps, nmaps):** normalized correlation coefficients
            | **shifts ((nmaps,) list):** list of (row_shifts, col_shifts) for each map

    Examples:

        Generate a noisy map and two copies with known change and shift

        .. code-block:: python

            data1 = np.random.normal(0,1,(nrows,ncols))
            data2 = data1.copy()
            NCC, _ = aopy.analysis.calc_spatial_map_correlation([data1, data2], False)
            self.assertAlmostEqual(NCC[1,0], 1)

            nrows_changed = 5
            ncols_changed = 3
            for irow in range(nrows_changed):
                data2[irow,:ncols_changed] = 1

            data3 = data2.copy()
            data3 = np.roll(data3, 2, axis=0)

            NCC, shifts = aopy.analysis.calc_spatial_map_correlation([data1, data2, data3], True)

        Plot the maps and correlation coefficients against the reference map
            
        .. code-block:: python

            fig, [ax1, ax2, ax3] = plt.subplots(1,3, figsize=(8,3))
            im1 = ax1.pcolor(data1)
            ax1.set(title='Reference')
            plt.colorbar(im1, ax=ax1)
            
            im2 = ax2.pcolor(data2)
            ax2.set(title=f'R^2={np.round(NCC[1,0],3)}')
            plt.colorbar(im2, ax=ax2)
            
            im3 = ax3.pcolor(data3)
            ax3.set(title=f'R^2={np.round(NCC[2,0],3)}')
            plt.colorbar(im3, ax=ax3)

        .. image:: _images/calc_spatial_map_correlation.png
    '''
    # Flatten every map, aligning it to the first one when requested
    shifts = []
    flat_maps = []
    reference_map = None
    for idx, source_map in enumerate(data_maps):
        current_map = source_map.copy()
        shift = (0,0)
        if align_maps:
            if idx == 0:
                # The first map is the alignment target and is itself never shifted
                reference_map = data_maps[0].copy()
            else:
                current_map, shift = align_spatial_maps(reference_map, current_map)
        shifts.append(shift)
        flat_maps.append(current_map.ravel())
            
    # Drop every location where at least one map is NaN so correlation doesn't output NaN
    has_nan = np.isnan(flat_maps).any(axis=0)
    n_removed = np.sum(has_nan)
    if n_removed > 0:
        warnings.warn(f'Removing {n_removed} NaN values in data maps')
        flat_maps = np.array(flat_maps)[:,~has_nan]

    # Scale each flattened map to unit magnitude, then correlate all pairs
    magnitudes = np.linalg.norm(flat_maps, axis=1, keepdims=True)
    unit_maps = np.asarray(flat_maps)/magnitudes
    NCC = np.corrcoef(unit_maps)

    return NCC, shifts   

def calc_spatial_data_correlation(elec_data, elec_pos, interp=False, grid_size=None, 
                                  interp_method='cubic', align_maps=False):
    '''
    Wrapper around :func:`~aopy.analysis.calc_spatial_map_correlation` that first arranges each 
    set of electrode data into a 2D map (optionally interpolated) and then computes the 
    correlation between all pairs of maps.

    Args:
        elec_data ((nmaps,) list): list of (nch,) spatial data arrays
        elec_pos ((nch, 2) array): electrode positions for each channel
        interp (bool): whether or not to interpolate data maps. Default False.
        grid_size ((2,) tuple, optional): map size for interpolation, e.g. (16,16) for a 16x16 grid.
            Only used when interp is True.
        interp_method (str): interpolation method to use. Only used when interp is True. Default 'cubic'
        align_maps (bool): Whether or not to align maps. Default False.

    Returns:
        tuple: tuple containing:
            | **NCC (nmaps, nmaps):** normalized correlation coefficients
            | **shifts ((nmaps,) list):** list of (row_shifts, col_shifts) for each map
    '''
    def _to_map(channel_values):
        # Arrange one (nch,) data vector into a 2D map using the electrode positions
        if interp:
            interp_map, _ = visualization.calc_data_map(channel_values, elec_pos[:,0], elec_pos[:,1], 
                                                        grid_size, interp_method=interp_method)
            return interp_map
        return visualization.get_data_map(channel_values, elec_pos[:,0], elec_pos[:,1])

    data_maps = [_to_map(channel_values) for channel_values in elec_data]

    return calc_spatial_map_correlation(data_maps, align_maps)

def calc_spatial_tf_data_correlation(freqs, time, tf_elec_data, elec_pos, null_tf_elec_data=None,
                                     band=(12,150), window=(0,1), alternative='greater', 
                                     nan_policy='propagate', alpha=0.05, interp=False, 
                                     grid_size=None, interp_method='cubic', align_maps=False):
    '''
    Wrapper around :func:`~aopy.analysis.calc_spatial_data_correlation` that averages over a given 
    time-window and frequency-band, then maps the data onto a 2D map before computing correlation.
    When null data is supplied, each band average is replaced by its effect size relative to the 
    null distribution (see :func:`~aopy.analysis.calc_tfr_mean_fdrc_ranktest`) and channels whose 
    adjusted p-value exceeds alpha are set to NaN.
    
    Args:
        freqs (nfreq): frequency axis
        time (nt): time axis
        tf_elec_data (list of (nfreq, nt, nch)): time-frequency data arrays
        elec_pos ((nch, 2) array): electrode positions for each channel
        null_tf_elec_data ((n_null, nfreq, nt, nch), optional): time-frequency null data arrays to
            compute significance. The same null data is used for every entry of tf_elec_data. 
            If None, no significance testing is performed.
        band (tuple): frequency band of interest, e.g. (12, 150), in Hz
        window (tuple): time window of interest, e.g. (0, 1), in seconds
        alternative (str, optional): Hypothesis test alternative ('greater', 'less', 'two-sided'). Defaults to 'greater'.
        nan_policy (str, optional): Handling of NaN values. Defaults to 'propagate'.
        alpha (float, optional): Significance level. Defaults to 0.05.
        interp (bool): whether or not to interpolate data maps. Default False.
        grid_size ((2,) tuple, optional): map size for interpolation, e.g. (16,16) for a 16x16 grid
        interp_method (str): interpolation method to use. Default 'cubic'
        align_maps (bool): Whether or not to align maps. Default False.

    Returns:
        tuple: tuple containing:
            | **NCC (nmaps, nmaps):** normalized correlation coefficients
            | **shifts ((nmaps,) list):** list of (row_shifts, col_shifts) for each map
    '''
    if null_tf_elec_data is None:
        # No significance testing: plain band/window average per channel
        band_data = [calc_tfr_mean(freqs, time, tf_data, band=band, window=window)
                     for tf_data in tf_elec_data]
    else:
        band_data = []
        for tf_data in tf_elec_data:
            effect, p_adjusted = calc_tfr_mean_fdrc_ranktest(
                freqs, time, tf_data, null_tf_elec_data, band=band, window=window,
                alternative=alternative, nan_policy=nan_policy, alpha=alpha)
            # Mask out channels that are not significant
            effect[p_adjusted > alpha] = np.nan
            band_data.append(effect)
    
    return calc_spatial_data_correlation(band_data, elec_pos, interp=interp, grid_size=grid_size,
                                         interp_method=interp_method, align_maps=align_maps)

def get_confidence_interval(sample, hist_bins, alpha=0.025, ax=None, **kwarg):
    '''
    Compute a confidence interval from samples, not the mean of samples
    If you want to compute it for the mean of samples, use scipy.stats.t.interval.

    The interval is read off the empirical cdf of a histogram of the samples: the lower bound 
    is the center of the first bin whose cdf exceeds alpha, and the upper bound is the center 
    of the last bin whose cdf is below 1-alpha. Bin centers are the midpoints of consecutive 
    bin edges, so non-uniform bin edges are supported.
    
    Args:
        sample (nsamples): data samples
        hist_bins (int or sequence of scalars): the number of bins or array of bin edges
        alpha (float): significance level to define a confidence interval. Defaults to 0.025
        ax (pyplot.Axes, optional): axis on which to plot data histogram and confidence interval. Defaults to None.
        kwarg (dict): additional keyword arguments to pass to ax.hist()
        
    Returns:
        (list): lower and upper bounds in the confidence interval
    '''
    
    # Compute cdf from histogram in samples
    count, bin_edges = np.histogram(sample, bins=hist_bins)
    bin_centers = (bin_edges[:-1] + bin_edges[1:])/2 # midpoint of each bin, valid for any bin widths
    pdf = count / np.sum(count)
    cdf = np.cumsum(pdf)
    
    # Compute lower and upper bound
    lower_bound = bin_centers[np.where(cdf>alpha)[0][0]]
    upper_bound = bin_centers[np.where(cdf<1-alpha)[0][-1]]
    
    # Plot histogram and confidence interval
    if ax is not None:
        ax.hist(sample,**kwarg)
        ax.axvline(lower_bound, color='r', linestyle='--')
        ax.axvline(upper_bound, color='r', linestyle='--')
        ax.set(ylabel='# count')
        
        # Overlay the cdf on a secondary y-axis
        ax2 = ax.twinx()
        ax2.plot(bin_centers, cdf, 'k')
        ax2.set(ylabel='cdf')
        
    return [lower_bound, upper_bound]

def calc_confidence_interval_overlap(CI1, CI2):
    '''
    Calculate how much two confidence intervals overlap, expressed as a fraction of the 
    narrower of the two intervals.

    Args:
        CI1 (tuple or list): Tuple containing the lower and upper bounds of the first confidence interval.
        CI2 (tuple or list): Tuple containing the lower and upper bounds of the second confidence interval.

    Returns:
        (float): Overlap ratio (0 to 1) between the two confidence intervals.
    '''
    lo_a, hi_a = CI1
    lo_b, hi_b = CI2

    # The shared region runs from the larger lower bound to the smaller upper bound
    shared_width = min(hi_a, hi_b) - max(lo_a, lo_b)
    if not shared_width > 0:
        shared_width = 0 # disjoint (or merely touching) intervals do not overlap

    # Normalize by the width of the narrower interval
    narrowest = min(hi_a - lo_a, hi_b - lo_b)
    return shared_width / narrowest

def calc_fdrc_ranktest(altdata, nulldata_dist, alternative='greater', nan_policy='raise', alpha=0.05):
    """
    Compute statistical significance using the Wilcoxon signed-rank test with FDR correction.
    The test is applied, separately for each channel, to the differences between the observed 
    value and every sample of the null distribution. The resulting p-values are then corrected 
    across channels.
    
    Args:
        altdata (nch): Observed data values.
        nulldata_dist (n_null, nch): Null distribution for comparison.
        alternative (str, optional): Hypothesis test alternative ('greater', 'less', 'two-sided'). Defaults to 'greater'.
        nan_policy (str, optional): Handling of NaN values. Defaults to 'raise'.
        alpha (float, optional): Significance level. Defaults to 0.05.
    
    Returns:
        tuple: tuple containing:
            | **effect_size (nch):** NaN-ignoring mean difference between the alternative and null data, 
                set to 0 where the adjusted p-value exceeds alpha
            | **p_fdrc (nch):** Adjusted p-values for each alternative hypothesis test.
    """
    # One difference per null sample and channel
    deltas = altdata - nulldata_dist

    # Signed-rank test down the null-sample axis, then FDR-correct across channels
    p_uncorrected = wilcoxon(deltas, axis=0, alternative=alternative, nan_policy=nan_policy).pvalue
    _, p_fdrc = fdrcorrection(p_uncorrected, alpha=alpha)
    
    # Report the mean difference only where it is significant
    effect_size = np.nanmean(deltas, axis=0)
    not_significant = p_fdrc > alpha
    effect_size[not_significant] = 0
    
    return effect_size, p_fdrc

def windowed_xval_lda_wrapper(data, labels, samplerate, lags=3, nfolds=5, regularization='auto', lda_model=None, return_weights=False, return_confusion_matrix=False):
    """
    Perform cross-validation with Linear Discriminant Analysis (LDA) to estimate decoding accuracy at each time point.

    This function performs an n-fold cross-validation LDA analysis on time-series data to compute the decoding accuracy 
    across time windows defined by `lags`. Optionally, it can return the weights of the LDA classifier and/or confusion matrices 
    for each fold.

    Args:
        data (numpy.ndarray): The input data array with shape (ntime, nch, ntrials), where `ntime` is the number of time points,
                               `nch` is the number of channels, and `ntrials` is the number of trials.
        labels (numpy.ndarray): Array of shape (ntrials,) containing the labels for each trial.
        samplerate (float or int): Samplerate of data. Used to compute the timeaxis.
        lags (int, optional): The number of time lags to include in the analysis (default is 3). To only use a single timepoint set lags=0
        nfolds (int, optional): The number of folds for cross-validation (default is 5).
        regularization (str or float, optional): If regularization should be included when building the LDA model. Input into the shrinkage parameter of the sklearn 
                                LDA function. Can either be None, 'auto', or a float between 0 and 1. 
        lda_model (sklearn LDA class, optional): User-defined LDA model from sklearn.discriminant_analysis.LinearDiscriminantAnalysis. If None, this function will initialize the model.
        return_weights (bool, optional): Whether to return the LDA weights (default is False).
        return_confusion_matrix (bool, optional): Whether to return the confusion matrix for each fold (default is False).

    Returns:
        tuple: Tuple containing:
            | **accuracy (ntime-lags, nfolds):** The decoding accuracy for each window and fold. The fold axis has length 1 when `nfolds < 2`.
            | **time_axis (ntime-lags):** The time-axis of the output data. When lags>0, each time-point corresponds to the right edge of the window. This is the time point corresponding to the latest data used in decoding.
            | **(Optional) LDA Weights (ntime-lags, nlabels, nfeatures, nfolds):** The LDA weights for each window and fold if `return_weights=True`. Note: nfeatures will include lagged features if lags are used.
            | **(Optional) Confusion Matrix (ntime-lags, nlabels, nlabels, nfolds):** The confusion matrix for each window and fold if `return_confusion_matrix=True`. 

    Raises:
        ValueError: If `data` is not 3-dimensional.

    Notes:      
        If `nfolds < 2`, no cross-validation is performed: the model is fit and scored on the entire dataset
        and the confusion matrix contains raw counts.
        If `nfolds >= 2`, shuffled k-fold cross-validation is performed, decoding accuracy is calculated for each fold,
        and the confusion matrix is normalized over the true labels (rows).
        Windows containing any NaN are skipped and left as NaN in every output.
    """
    ntime, nch, ntrials = data.shape
    labels = np.asarray(labels)
    unique_labels = np.unique(labels)
    nlabels = len(unique_labels)
    nwind = ntime - lags

    # Always keep at least one fold slot so the non-cross-validated path has somewhere to write
    nfold_slots = max(nfolds, 1)

    # Outputs start as NaN; windows that are skipped simply stay NaN
    decoding_accuracy = np.full((nwind, nfold_slots), np.nan)
    weights = np.full((nwind, nlabels, (1+lags)*nch, nfold_slots), np.nan) # (ntime, ntargets, nfeatures, nfolds)
    cm = np.full((nwind, nlabels, nlabels, nfold_slots), np.nan)
    time_axis = (np.arange(nwind)+lags)/samplerate

    for iwind in range(nwind):
        window = data[iwind:iwind+lags+1]

        # If there are nans in this window, leave nan in all outputs
        if np.isnan(window).any():
            continue

        if lda_model is None:
            lda = LinearDiscriminantAnalysis(solver='eigen', shrinkage=regularization)
        else:
            lda = lda_model

        # Stack the lagged timepoints along the feature axis: (ntrials, (lags+1)*nch)
        X = window.reshape(-1, ntrials).T

        # If not cross validated
        if nfolds < 2:
            X_centered = X - np.mean(X, axis=0)
            lda.fit(X_centered, labels)
            decoding_accuracy[iwind] = lda.score(X_centered, labels)
            if return_weights:
                weights[iwind,:,:,0] = lda.coef_
            if return_confusion_matrix:
                cm[iwind,:,:,0] = confusion_matrix(labels, lda.predict(X_centered), labels=unique_labels)

        # If cross validated
        else:
            kf = model_selection.KFold(n_splits=nfolds, shuffle=True, random_state=None)
            for ifold, (train_idx, test_idx) in enumerate(kf.split(X)):
                # Center both partitions with the training mean so no test information leaks into the fit
                train_mean = np.mean(X[train_idx], axis=0)
                X_train = X[train_idx] - train_mean
                X_test = X[test_idx] - train_mean

                lda.fit(X_train, labels[train_idx])
                decoding_accuracy[iwind, ifold] = lda.score(X_test, labels[test_idx])
                if return_weights:
                    weights[iwind,:,:,ifold] = lda.coef_
                if return_confusion_matrix:
                    # Passing the full label set keeps the matrix (nlabels, nlabels) even
                    # when a test fold happens to be missing one of the classes
                    cm[iwind,:,:,ifold] = confusion_matrix(labels[test_idx], lda.predict(X_test),
                                                           labels=unique_labels, normalize='true')

    results = [decoding_accuracy, time_axis]
    if return_weights:
        results.append(weights)
    if return_confusion_matrix:
        results.append(cm)
    return tuple(results)

def xval_lda_subsample_wrapper(data, labels, min_trial, cond_mask=None, single_decoding=True, min_unit=None, shuffle_labels=False,
        nfolds=5, replacement=False, regularization='auto', lda_model=None, return_labels=False, return_weights=False, seed=None):
    '''
    Perform an n-fold cross-validation with Linear Discriminant Analysis (LDA) using a single unit or multiple units.
    This function extracts trials and/or units randomly based on the random seed with/without replacement.
    The number of trials per target is controlled to be the same across targets.
    You can repeatedly perform this function by changing random seed to estimate the resampling distribution.

    Args:
        data (nunit, ntr) or (nunit, nfeatures, ntr): neural data. 2 different shapes are allowed. 
        labels (ntr): the labels for each trial.
        min_trial (int): the minimum number of trials for each label to be extracted
                                if this is 20, 20*(the number of unique labels) trials are extracted
        cond_mask (ntr): a boolean array. This is a mask to extract trials that satisfy a certain condition
                                (ex. movement onset is more than a certain threshold)
        single_decoding (bool, optional): If True, LDA is performed using single unit activity separately (default is True)
        min_unit (int, optional): the number of units used for decoding. This is used only when single_decoding is False.
                                if min_unit is None, decoding is performed using all units (default is None)
        shuffle_labels (bool, optional): whether to shuffle the labels of the extracted trials, breaking the
                                association between data and labels (default is False)
        nfolds (int, optional): the number of folds for cross-validation (default is 5)
        replacement (bool, optional): whether to choose trials (and units, when min_unit is given) with replacement or without replacement
        regularization (str or float, optional): If regularization should be included when building the LDA model
                                Input into the shrinkage parameter of the sklearn LDA function
                                Can either be None, 'auto', or a float between 0 and 1. 
        lda_model (sklearn LDA class, optional): User-defined LDA model from sklearn.discriminant_analysis.LinearDiscriminantAnalysis. If None, this function will initialize the model.
        return_labels (bool, optional): Whether to return true and predicted labels (default is False).
        return_weights (bool, optional): Whether to return the LDA weights (default is False).
        seed (int, optional): random seed. If given, numpy's global random state is seeded with it.

    Returns:
        tuple: Tuple containing:
            | **accuracy (nch) or (float):** the decoding accuracy. If single_decoding is False, this is a single value.
            | **(Optional) true_Y (nch,ntr) or (ntr):** a list of true labels. If single_decoding is False, its shape becomes (ntr).
            | **(Optional) pred_Y (nch,ntr) or (ntr):** a list of predicted labels. If single_decoding is False, its shape becomes (ntr).
            | **(Optional) LDA Weights (nlabels,nch,nfolds) or (nlabels,nch,nfeatures,nfolds):** The LDA weights if return_weights is True. Singleton axes are squeezed out.

        If neither return_labels nor return_weights is set, only the accuracy is returned (not wrapped in a tuple).

    Raises:
        ValueError: If data is not 2- or 3-dimensional.

    Examples:
        
        .. code-block:: python

            "This is an example of this function using multiprocessing to get a resampling distribution"
            
            import multiprocessing as mp

            single_decoding = True
            min_unit = None
            shuffle_labels = False
            n_fold = 5
            replacement = False
            regularization = 'auto'
            lda_model = None
            return_labels = True
            return_weights = False
            n_resample = 100 # the number of resampling
            n_processes = 20 # the number of cpus used for the computation

            pool = mp.Pool(n_processes)
            result_objects = [pool.apply_async(xval_lda_subsample_wrapper,\
                args=(data, target_idx, min_trials, trial_mask, single_decoding, min_unit, shuffle_labels, n_fold, \
                    replacement, regularization, lda_model, return_labels, return_weights, ibs)) for ibs in range(n_resample)]
            pool.close()

            # Organize results (labels are returned as true labels first, then predicted labels)
            results = [r.get() for r in result_objects]
            accuracy, true_labels_resample, pred_labels_resample = zip(*results)
            accuracy = np.array(accuracy)
            true_labels_resample = np.array(true_labels_resample, int)
            pred_labels_resample = np.array(pred_labels_resample, int)

    See Also:
        :func:`~aopy.analysis.base.windowed_xval_lda_wrapper`

    '''

    if data.ndim == 2:
        # (nunit, ntr) -> (nunit, 1, ntr)
        data = data[:, np.newaxis, :]
    elif data.ndim != 3:
        raise ValueError("data must have shape (nunit, ntr) or (nunit, nfeatures, ntr)")
    
    nunit, nfeatures, _ = data.shape
    nlabels = len(np.unique(labels))
    kf = model_selection.KFold(n_splits=nfolds)

    if seed is not None:
        np.random.seed(seed)

    if lda_model is None:
        lda = LinearDiscriminantAnalysis(solver='eigen', shrinkage=regularization)
    else:
        lda = lda_model

    # Choose trials randomly so that the number of trials per target can be the same across targets.
    trial_mask = postproc.get_conditioned_trials_per_target(labels, min_trial, cond_mask=cond_mask, replacement=replacement, seed=seed)
        
    # Extract trials
    data_trial = data[:,:,trial_mask]
    Y = labels[trial_mask]

    # Shuffle only after the trials are extracted so the per-target trial counts stay balanced
    if shuffle_labels:
        Y = np.random.permutation(Y)

    pred_Y = []
    true_Y = []

    # Perform LDA using single unit activity separately
    if single_decoding:

        if return_weights:
            weights = np.full((nlabels, nunit, nfeatures, nfolds), np.nan)
    
        accuracy = []
        for iunit in range(data_trial.shape[0]):
            X = data_trial[iunit].T  # shape (ntr, nfeatures)
            
            pred_Y_ch = []
            true_Y_ch = []

            # k-fold cross-validation
            for ifold, (train_idx, test_idx) in enumerate(kf.split(X)):
    
                Xtrain, Xtest = X[train_idx,:], X[test_idx,:]
                Ytrain, Ytest = Y[train_idx], Y[test_idx]

                # Center both partitions with the training mean only
                train_mean = np.mean(Xtrain, axis=0)
                lda.fit(Xtrain - train_mean, Ytrain)
    
                pred_Y_ch.extend(lda.predict(Xtest - train_mean))
                true_Y_ch.extend(Ytest)

                if return_weights:
                    weights[:,iunit,:,ifold] = lda.coef_
                    
            accuracy.append(accuracy_score(true_Y_ch, pred_Y_ch))
            true_Y.append(true_Y_ch)
            pred_Y.append(pred_Y_ch)

        accuracy = np.array(accuracy)

    # Perform LDA using multiple unit activity together
    else:
        # Subsample units for decoding, or use all units when min_unit is None
        if min_unit is not None:
            unit_mask = np.random.choice(nunit, size=min_unit, replace=replacement) # randomly choose units
            data_units = data_trial[unit_mask]
        else:
            data_units = data_trial

        # Flatten (unit, feature) into a single feature axis: (ntr, n_used*nfeatures)
        n_used = data_units.shape[0]
        X = data_units.reshape(n_used*nfeatures, -1).T
        if return_weights:
            weights = np.full((nlabels, n_used, nfeatures, nfolds), np.nan)

        # k-fold cross-validation
        for ifold, (train_idx, test_idx) in enumerate(kf.split(X)):

            Xtrain, Xtest = X[train_idx,:], X[test_idx,:]
            Ytrain, Ytest = Y[train_idx], Y[test_idx]

            # Center both partitions with the training mean only
            train_mean = np.mean(Xtrain, axis=0)
            lda.fit(Xtrain - train_mean, Ytrain)

            true_Y.extend(Ytest)
            pred_Y.extend(lda.predict(Xtest - train_mean))
            
            if return_weights:
                # coef_ has a single row for two-class problems, so keep its own leading
                # dimension and let the assignment broadcast across the label axis
                weights[:,:,:,ifold] = lda.coef_.reshape(lda.coef_.shape[0], -1, nfeatures)

        accuracy = accuracy_score(true_Y, pred_Y)

    # Organize results
    results = [accuracy]
    if return_labels:
        results.append(np.array(true_Y))
        results.append(np.array(pred_Y))
    if return_weights:
        results.append(np.squeeze(weights))

    if len(results) == 1:
        return results[0]
    else:
        return tuple(results)

def simulate_ideal_trajectories(targets, origin=None, resolution=1000):
    """
    Simulates straight reach trajectories from a given origin to a list of target points in space.
    A fixed number of samples is used for each reach (i.e. time to target is constant.)

    Args:
        targets (numpy.ndarray or list of lists/tuples): A list or array of target coordinates
            in space, shape (num_targets, num_dims).
        origin (list or tuple, optional): The origin point from which the trajectories
            are simulated. Default is None, which uses zeros in all dimensions of the targets.
        resolution (int, optional): The number of points per unit of distance. Every trajectory 
            is rendered with `int(max_dist * resolution)` points, where `max_dist` is the largest 
            absolute coordinate displacement between the origin and any target. Default is 1000.

    Returns:
        (num_targets, num_points, num_dims) numpy.ndarray: An array of simulated trajectories, each being a series of points
            from the origin to the corresponding target.

    Examples:

        .. code-block:: python

            subject = 'MCP015'
            entries = db.lookup_mc_sessions(subject=subject)
            subjects, ids, dates = db.list_entry_details(entries)
            df = aopy.data.tabulate_behavior_data_center_out(preproc_dir, subjects, ids, dates, 
                                                            metadata=['target_radius', 'session'])
            target_radius = df['target_radius'][0]
            target_indices = np.unique(df['target_idx'])
            target_locations = aopy.data.bmi3d.get_target_locations(preproc_dir, subject,
                                                                    te_id, dates[0], target_indices)

            ideal_trajectories = simulate_ideal_trajectories(target_locations[1:], target_locations[0])
            
            fig = plt.figure()
            ax = fig.add_subplot(111, projection='3d')
            aopy.visualization.color_trajectories(ideal_trajectories, target_idx, colors)
            
        .. image:: _images/simulate_ideal_trajectories.png

    """
    # Convert up front so that list inputs support the arithmetic below
    targets = np.asarray(targets, dtype=float)
    if origin is None:
        origin = np.zeros(targets.shape[-1])
    else:
        origin = np.asarray(origin, dtype=float)

    # Use the magnitude of the displacement so that targets lying in negative
    # directions still produce a positive number of points
    max_dist = np.max(np.abs(targets - origin))
    num_points = int(max_dist * resolution)

    return np.array([np.linspace(origin, target, num_points) for target in targets])

def calc_statistic_random_trials(data, n_trials=300, 
                                 statistic=partial(np.mean, axis=0),
                                 rng=None):
    '''
    Shuffle the trials, split them into as many non-overlapping groups of `n_trials` as
    will fit, and evaluate a statistic on each group. Trials left over after the last
    full group are not used.

    Args:
        data (ntrials, nch): data to calculate the statistic on. Also accepts a pandas DataFrame of
            shape (ntrials, ...) if the statistic can be calculated on a DataFrame.
        n_trials (int): number of trials in each group
        statistic (function): function to calculate the statistic on the data. Should
            take the form `f(x) = y` where `x` is a 2D array of shape (n_trials, nch)
            and `y` is a 1D array of shape (nch). Default is np.mean(x, axis=0).
        rng (numpy.random.Generator, optional): Random number generator to use for shuffling trials.
            If None, uses the default random number generator. Default is None.
            
    Returns:
        (len(data)//n_trials, nch) array: distributions of the statistic across divisions of the data.

    Raises:
        ValueError: If data has fewer than `n_trials` trials.

    Examples:

        .. code-block:: python

            elec_pos, _, _ = aopy.data.load_chmap()
            n_elec = len(elec_pos)
            total_trials = 1600
            n_trials = 50
            np.random.seed()
            data = 0.5*np.ones((total_trials,n_elec))
            data += np.random.normal(0.5, size=(total_trials,n_elec))
            data[:,n_elec//4:n_elec//2] += 0.1

            dists = aopy.analysis.calc_statistic_random_trials(data, n_trials=n_trials)
            assert np.shape(dists) == (len(data)//n_trials, n_elec)

            # The distribution means should be close to the original data mean
            mean = np.mean(data, axis=0)
            dists_mean = np.mean(dists, axis=0)
            dists_std = np.std(dists, axis=0)
            clim = (np.min(dists_mean), np.max(dists_mean))

            plt.figure(figsize=(5,2), dpi=300)
            plt.subplot(1,3,1)
            im = aopy.visualization.plot_spatial_drive_map(mean, 
                                            elec_data=True, cmap='Grays')
            im.set_clim(*clim)
            plt.axis('off')
            plt.colorbar(im, shrink=0.5)
            plt.title('data mean')

            plt.subplot(1,3,2)
            im = aopy.visualization.plot_spatial_drive_map(dists_mean, 
                                            elec_data=True, cmap='Grays')
            im.set_clim(*clim)
            plt.axis('off')
            plt.colorbar(im, shrink=0.5)
            plt.title('dist means')

            plt.subplot(1,3,3)
            im = aopy.visualization.plot_spatial_drive_map(dists_std, 
                                            elec_data=True, cmap='Grays')
            plt.axis('off')
            plt.colorbar(im, shrink=0.5)
            plt.title('dist std')

        .. image:: _images/calc_statistic_random_trials.png
    '''
    generator = np.random.default_rng() if rng is None else rng

    # Random ordering of every trial index
    shuffled = np.arange(len(data))
    generator.shuffle(shuffled)

    n_groups = len(data)//n_trials
    if n_groups < 1:
        raise ValueError(f"Not enough trials in data ({len(data)}) to perform the calculation with n_trials ({n_trials}).")

    # One row of trial indices per group; leftover trials are dropped
    groups = shuffled[:n_groups*n_trials].reshape(n_groups, n_trials)

    def _evaluate(trial_idx):
        # Plain indexing works for arrays; a DataFrame raises KeyError and needs positional indexing
        try:
            return statistic(data[trial_idx])
        except KeyError:
            return statistic(data.iloc[trial_idx].reset_index(drop=True))

    return np.array([_evaluate(trial_idx) for trial_idx in groups])

def _calc_statistic_random_trials(args):
    '''
    Call :func:`calc_statistic_random_trials` with a single tuple of positional
    arguments, so it can be mapped over a list of argument tuples by a worker pool.

    Args:
        args (tuple): positional arguments forwarded unchanged to calc_statistic_random_trials

    Returns:
        The return value of calc_statistic_random_trials for those arguments.
    '''
    result = calc_statistic_random_trials(*args)
    return result

def calc_trial_bootstraps(data, n_trials=300, n_bootstraps=30, 
                          statistic=partial(np.mean, axis=0), 
                          rng=None, parallel=False, verbose=True):
    '''
    Repeatedly call :func:`~aopy.analysis.calc_statistic_random_trials` to generate
    statistics over randomly sampled trials. Each bootstrap draws random groups of 
    trials, each of size `n_trials`, without replacement, until there aren't enough
    trials to make another full size group. The statistic is then calculated on each 
    group, resulting in `n_bootstraps * len(data)//n_trials` values.

    Args:
        data (ntrials, nch): data to calculate the statistic on
        n_trials (int): number of trials to use in each bootstrap
        n_bootstraps (int): number of bootstrap trials to perform
        statistic (function): function to calculate the statistic on the data. Should
            take the form `f(x) = y` where `x` is a 2D array of shape (n_trials, nch)
            and `y` is a 1D array of shape (nch). Default is np.mean(x, axis=0).
        rng (numpy.random.Generator, optional): Random number generator used to seed the bootstraps.
            One child generator is spawned from it for every bootstrap, so each bootstrap
            shuffles with its own generator. If None, a new default random number generator 
            is created. Default is None.
        parallel (bool or mp.pool.Pool, optional): Whether to run the bootstraps in parallel.
            If True, creates a multiprocessing pool using half of the available cores (at least
            one worker) and shuts it down before returning. If a Pool is provided,
            it will use that pool instead. The pool will not be closed. If False, 
            runs the bootstraps sequentially. A single bootstrap is always run sequentially.
        verbose (bool, optional): Whether to print progress bars. Default is True.
            
    Returns:
        (n_bootstraps, len(data)//n_trials, nch) array: multiple bootstraps of distributions
            of the statistic applied to divisions of the data.

    Raises:
        AssertionError: If n_bootstraps or n_trials is not positive, data has fewer
            than n_trials trials, or statistic is not callable.
    '''
    # `mp.pool` only exists as an attribute once the submodule has been imported
    from multiprocessing.pool import Pool

    assert n_bootstraps > 0, "must have at least 1 bootstrap"
    assert n_trials > 0, "must have at least 1 trial"
    assert len(data) >= n_trials, "data must have at least as many trials as n_trials"
    assert callable(statistic), "statistic must be a callable function"

    if rng is None:
        rng = np.random.default_rng()
    args_list = [(data, n_trials, statistic, child_rng) for child_rng in rng.spawn(n_bootstraps)]

    # A single bootstrap never needs a pool, so return before one could be created
    if n_bootstraps == 1:
        return np.array([calc_statistic_random_trials(*args_list[0])])

    owns_pool = parallel is True
    if owns_pool:
        pool = mp.Pool(max(1, mp.cpu_count() // 2))  # use half of the available cores
    elif isinstance(parallel, Pool):  # use an existing pool
        pool = parallel
    else:
        pool = None

    if pool is None:
        iterator = tqdm(args_list, desc="Bootstraps") if verbose else args_list
        results = [calc_statistic_random_trials(*args) for args in iterator]
    else:
        try:
            jobs = pool.imap(_calc_statistic_random_trials, args_list)
            if verbose:
                jobs = tqdm(jobs, total=n_bootstraps, desc="Bootstraps")
            results = list(jobs)
        finally:
            # Only shut down a pool created here; a caller-supplied pool is left open
            if owns_pool:
                pool.close()
                pool.join()

    return np.array(results)

def _compare_conditions_bootstrap_spatial_corr_worker(
        data, elec_pos, labels, n_trials=300, n_bootstraps=30, 
        statistics=partial(np.mean, axis=0), rng=None, parallel=False):
    '''
    Compare multiple conditions using bootstrapping. Two comparisons are made:
        1. The spatial correlation of the distributions of the statistic across conditions.
        2. The d-prime value for each channel pooled across bootstraps and comparing
           across conditions.

    Args:
        data (ntrials, nch): data to calculate the statistic on. Also accepts a pandas DataFrame of
            shape (ntrials, ...) if the statistic can be calculated on a DataFrame.
        elec_pos ((nch, 2) array): electrode positions for each channel
        labels (ntrials,): labels for each trial, used to group trials by condition
        n_trials (int): number of trials to use in each bootstrap
        n_bootstraps (int): number of bootstrap trials to perform
        rng (numpy.random.Generator, optional): Random number generator to use for shuffling trials.
            Be careful when using this with parallel processing, as it may lead to
            duplicate results if the same random number generator is used across processes.
            If None, uses a new default random number generator on each bootstrap.
            Default is None.
        statistics (function or list of functions): function(s) to calculate the statistic on the data. 
            If more than one is supplied, they will be applied per condition 

    Returns:
        tuple: tuple containing:
            | **cond_dists (n_cond, n_bootstraps, len(data)//n_trials, nch):** bootstraps distributions for each condition
            | **conditions (n_cond):** unique conditions in the labels
            | **corr_mats (n_bootstraps, n_cond*n_cond, n_cond*n_cond, nch):** list of spatial correlation matrices for each bootstrap
            | **dprime (nch):** d-prime value for each channel pooled across bootstraps and comparing across conditions
    '''
    conditions = np.unique(labels)
    if len(conditions) < 2:
        raise ValueError("At least two conditions are required for comparison")
    if callable(statistics):
        statistics=[statistics] * len(conditions)

    cond_dists = []
    for idx, cond in enumerate(conditions):
        try:
            data_cond = data[labels == cond]
        except KeyError:
            data_cond = data.iloc[labels == cond].reset_index(drop=True)

        if len(data_cond) < n_trials:
            raise ValueError(f"Condition {cond} has less than {n_trials} trials")

        dist = calc_trial_bootstraps(data_cond, n_trials=n_trials, n_bootstraps=n_bootstraps,
                                     statistic=statistics[idx], rng=rng, parallel=parallel)
        
        cond_dists.append(dist)

    # Compare spatial correlation
    corr_mats = []
    for i in range(n_bootstraps):
        dists = [cd[i] for cd in cond_dists]
        cmp = calc_spatial_data_correlation(np.concatenate(dists), 
                                            elec_pos, interp=False)[0]
        corr_mats.append(cmp)

    # d-prime pooled across bootstraps
    dprime = tuning.calc_dprime(*[np.concatenate(cd) for cd in cond_dists])

    return cond_dists, conditions, corr_mats, dprime

def compare_conditions_bootstrap_spatial_corr(
        data, elec_pos, labels, n_trials=300, n_bootstraps=30, n_shuffle=0, 
        statistics=partial(np.mean, axis=0), rng=None, parallel=False):
    '''
    Compare multiple conditions using bootstrapping and shuffling. Each additional
    bootstrap draws random groups of trials, each of size `n_trials`, without replacement,
    until there aren't enough trials to make another full size group. The statistic is then
    calculated on each group, resulting in `n_bootstraps * len(data)//n_trials` values.
    The spatial correlation of the statistic across conditions is calculated within each
    bootstrap, and the d-prime is calculated for all statistics pooled across bootstraps.
    Finally, if `n_shuffle > 0`, the labels are shuffled `n_shuffle` times and the bootstrap
    procedure repeated to create a null distribution for the spatial correlation and d-prime values.

    Args:
        data (ntrials, nch): data to calculate the statistic on
        elec_pos ((nch, 2) array): electrode positions for each channel
        labels (ntrials,): labels for each trial, used to group trials by condition
        n_trials (int): number of trials to use in each bootstrap
        n_bootstraps (int): number of bootstrap trials to perform
        n_shuffle (int): number of times to shuffle the labels to create a null distribution
        statistics (function or list of functions): function(s) to calculate the statistic on the data. If more than one is supplied, they will be applied per condition 
        rng (numpy.random.Generator, optional): Random number generator to use for shuffling trials.
            Be careful when using this with parallel processing, as it may lead to
            duplicate results if the same random number generator is used across processes.
            If provided, it is also used to shuffle the labels for the null distribution. 
            If None, uses a new default random number generator on each bootstrap, and the
            labels are shuffled with the global `np.random` state (so `np.random.seed` still
            controls the label shuffles). Default is None.
        parallel (bool or mp.pool.Pool, optional): Whether to run the bootstraps in parallel.
            If True, a multiprocessing pool using half of the available CPU cores (at least
            one worker) is created for the duration of this call and released before returning.
            If a Pool is provided, it will use that pool instead. A provided pool will not be 
            closed. If False, runs the bootstraps sequentially. Default is False.
        
    Returns:
        tuple: tuple containing:
            | **observed_dists (n_cond, n_bootstraps, len(data)//n_trials, nch):** bootstraps distributions for each condition
            | **conditions (n_cond):** unique conditions in the labels
            | **observed_corr (n_bootstraps, n_cond*n_cond, n_cond*n_cond, nch):** list of spatial correlation matrices for each bootstrap
            | **observed_dprime (nch):** d-prime value for each channel pooled across bootstraps and comparing across conditions
        
        if n_shuffle > 0:
            | **shuff_dists_dist (n_shuffle, n_cond, n_bootstraps, len(data)//n_trials, nch):** shuffled distributions for each condition
            | **shuff_corr_dist (n_shuffle, n_bootstraps, n_cond*n_cond, n_cond*n_cond, nch):** shuffled spatial correlation matrices
            | **shuff_dprime_dist (n_shuffle, nch):** shuffled d-prime  

    Raises:
        ValueError: if `labels` contains fewer than two unique conditions.

    Examples:

        .. code-block:: python

            elec_pos, _, _ = aopy.data.load_chmap()
            n_elec = len(elec_pos)
            total_trials = 1600
            n_trials = 200
            n_bootstraps = 50

            # Test null distribution
            np.random.seed(0)
            data = 0.5*np.ones((total_trials,n_elec))
            data += np.random.normal(0.5, size=(total_trials,n_elec))
            data[:,n_elec//4:n_elec//2] += 0.1
            labels = np.zeros((total_trials,))
            labels[total_trials//2:] = 1

            def plot_result(means, corr_mat, dprime, row):

                mean12 = np.concatenate(means)
                clim = (np.min(mean12),np.max(mean12))

                plt.subplot(3,4,(4*(row-1))+1)
                im = aopy.visualization.plot_spatial_drive_map(means[0], 
                                                elec_data=True, cmap='Grays')
                im.set_clim(*clim)
                plt.colorbar(im, shrink=0.5)
                plt.axis('off')
                plt.title('Condition 1')

                plt.subplot(3,4,(4*(row-1))+2)
                im = aopy.visualization.plot_spatial_drive_map(means[1], 
                                                elec_data=True, cmap='Grays')
                im.set_clim(*clim)
                plt.colorbar(im, shrink=0.5)
                plt.axis('off')
                plt.title('Condition 2')

                plt.subplot(3,4,(4*(row-1))+3)
                im = plt.imshow(np.nanmean(corr_mat, axis=0), cmap='Grays', vmin=0, vmax=1, origin='lower')
                plt.colorbar(im, shrink=0.5)
                sz = len(corr_mat[0])//2
                plt.xticks(range(sz*2), labels=['1']*sz + ['2']*sz)
                plt.yticks(range(sz*2), labels=['1']*sz + ['2']*sz)
                plt.xlabel('Condition')
                plt.ylabel('Condition')
                plt.title('Correlation')

                plt.subplot(3,4,(4*(row-1))+4)
                im = aopy.visualization.plot_spatial_drive_map(dprime, elec_data=True, cmap='turbo')
                im.set_clim(0,5)
                plt.axis('off')
                plt.colorbar(im, shrink=0.5)
                plt.title('dprime')

            fig = plt.figure(figsize=(8,6), dpi=300)

            means = [np.mean(data[labels == i,:], axis=0) for i in np.unique(labels)]
            dists, conditions, corr_mat, dprime = \
                aopy.analysis.compare_conditions_bootstrap_spatial_corr(
                    data, elec_pos, labels, n_trials=n_trials, n_bootstraps=n_bootstraps, parallel=False
                )
            plot_result(means, corr_mat, dprime, 1)
            fig.text(0.5, 1, "Null distribution", ha='center', va='top', fontsize=14)

            # Test difference
            data[labels == 1,:n_elec//8] += 0.2

            means = [np.mean(data[labels == i,:], axis=0) for i in np.unique(labels)]
            dists, conditions, corr_mat, dprime, shuff_dists, shuff_mat, shuff_dprime = \
                aopy.analysis.compare_conditions_bootstrap_spatial_corr(
                    data, elec_pos, labels, n_trials=n_trials, n_bootstraps=n_bootstraps, n_shuffle=1, parallel=False
                )
            plot_result(means, corr_mat, dprime, 2)
            fig.text(0.5, 0.65, "Difference", ha='center', va='top', fontsize=14)

            # Test shuffled
            plot_result(means, shuff_mat[0], shuff_dprime[0], 3)
            fig.text(0.5, 0.35, "Shuffled", ha='center', va='top', fontsize=14)

        .. image:: _images/compare_conditions_bootstrap_spatial_corr.png

        Sweep over increasing n_trials of the same data as above
        
        .. code-block:: python

            n_bootstraps = 10
            avg_coeff_1 = []
            avg_coeff_2 = []
            avg_dprime_1 = []
            avg_dprime_2 = []
            trial_sizes = range(10, 450, 50)
            for n_trials in trial_sizes:
                dists, conditions, corr_mat, dprime = \
                    aopy.analysis.compare_conditions_bootstrap_spatial_corr(
                        data, elec_pos, labels, n_trials=n_trials, n_bootstraps=n_bootstraps, parallel=False
                    )
                avg_corr_map = np.nanmean(corr_mat, axis=0)
                sz = avg_corr_map.shape[0]//2
                avg_coeff_1.append(np.nanmean(avg_corr_map[:sz,:sz]))
                avg_coeff_2.append(np.nanmean(avg_corr_map[sz:,:sz]))
                avg_dprime_1.append(np.mean(dprime[:n_elec//8]))
                avg_dprime_2.append(np.mean(dprime[-n_elec//8:]))

            plt.figure(figsize=(5,2), dpi=300)
            plt.subplot(1,2,1)
            plt.plot(trial_sizes, avg_coeff_1)
            plt.plot(trial_sizes, avg_coeff_2)
            plt.ylabel('map correlation')
            plt.xlabel('num trials in each map')
            plt.legend(['within', 'across'], bbox_to_anchor=[1,1], loc='upper left')

            plt.subplot(1,2,2)
            plt.plot(trial_sizes, avg_dprime_1)
            plt.plot(trial_sizes, avg_dprime_2)
            plt.ylabel('dprime')
            plt.xlabel('num trials in each map')
            plt.legend(['diff', 'same'], bbox_to_anchor=[1,1], loc='upper left')

            plt.tight_layout()

        .. image:: _images/compare_conditions_bootstrap_spatial_corr_sweep.png
    '''
    conditions = np.unique(labels)
    if len(conditions) < 2:
        raise ValueError("At least two conditions are required for comparison")

    # Only a pool created here is ours to release; a caller-supplied pool is left untouched.
    owned_pool = None
    if parallel is True:
        # Use half of the available cores, but never ask for zero workers (single-core hosts)
        owned_pool = mp.Pool(max(1, mp.cpu_count() // 2))
        parallel = owned_pool

    try:
        # Calculate observed distributions
        observed_dists, _, observed_corr, observed_dprime = \
            _compare_conditions_bootstrap_spatial_corr_worker(
                data, elec_pos, labels, n_trials=n_trials, n_bootstraps=n_bootstraps, 
                statistics=statistics, rng=rng, parallel=parallel
            )

        if n_shuffle == 0:
            return observed_dists, conditions, observed_corr, observed_dprime

        # Calculate shuffled distributions. The labels are shuffled in place on a private
        # copy, so each shuffle permutes the result of the previous one.
        shuff_labels = np.array(labels)
        # Honour the caller's generator for reproducibility; without one, keep using the
        # global numpy state so np.random.seed() continues to control the shuffles.
        shuffle_in_place = np.random.shuffle if rng is None else rng.shuffle
        shuff_dists_dist = []
        shuff_corr_dist = []
        shuff_dprime_dist = []
        for _ in tqdm(range(n_shuffle), desc="Shuffles"):
            shuffle_in_place(shuff_labels)
            shuff_dists, _, shuff_corr, shuff_dprime = \
                _compare_conditions_bootstrap_spatial_corr_worker(
                    data, elec_pos, shuff_labels, n_trials=n_trials, n_bootstraps=n_bootstraps, 
                    statistics=statistics, rng=rng, parallel=parallel
                )
            shuff_dists_dist.append(shuff_dists)
            shuff_corr_dist.append(shuff_corr)
            shuff_dprime_dist.append(shuff_dprime)

        return observed_dists, conditions, observed_corr, observed_dprime, \
            shuff_dists_dist, shuff_corr_dist, shuff_dprime_dist
    finally:
        # Release the worker processes we started, on success and on error alike
        if owned_pool is not None:
            owned_pool.terminate()
            owned_pool.join()