Source code for mne_connectivity.spectral.epochs

# Authors: Martin Luessi <mluessi@nmr.mgh.harvard.edu>
#          Denis A. Engemann <denis.engemann@gmail.com>
#          Adam Li <adam2392@gmail.com>
#          Thomas S. Binns <t.s.binns@outlook.com>
#
# License: BSD (3-clause)

import inspect
from functools import partial

import numpy as np
from mne.epochs import BaseEpochs
from mne.parallel import parallel_func
from mne.source_estimate import _BaseSourceEstimate
from mne.time_frequency.multitaper import (
    _compute_mt_params,
    _csd_from_mt,
    _mt_spectra,
    _psd_from_mt,
    _psd_from_mt_adaptive,
)
from mne.time_frequency.spectrum import (
    BaseSpectrum,
    EpochsSpectrum,
    EpochsSpectrumArray,
)
from mne.time_frequency.tfr import cwt, morlet
from mne.utils import _arange_div, _check_option, _time_mask, logger, verbose, warn

from ..base import SpectralConnectivity, SpectroTemporalConnectivity
from ..utils import _check_multivariate_indices, check_indices, fill_doc
from .epochs_bivariate import _CON_METHOD_MAP_BIVARIATE
from .epochs_multivariate import (
    _CON_METHOD_MAP_MULTIVARIATE,
    _check_n_components_input,
    _check_rank_input,
    _gc_methods,
    _multicomp_methods,
    _multivariate_methods,
)


def _check_times(data, sfreq, times, tmin, tmax):
    # get the data size and time scale
    n_signals, _, times_in, warn_times = _get_and_verify_data_sizes(
        data=data, sfreq=sfreq, times=times
    )
    n_times_in = len(times_in)  # XXX: Why not use times returned from above func?

    if tmin is not None and tmin < times_in[0]:
        warn(
            f"start time tmin={tmin:.2f} s outside of the time scope of the data "
            f"[{times_in[0]:.2f} s, {times_in[-1]:.2f} s]"
        )
    if tmax is not None and tmax > times_in[-1]:
        warn(
            f"stop time tmax={tmax:.2f} s outside of the time scope of the data "
            f"[{times_in[0]:.2f} s, {times_in[-1]:.2f} s]"
        )

    mask = _time_mask(times_in, tmin, tmax, sfreq=sfreq)
    tmin_idx, tmax_idx = np.where(mask)[0][[0, -1]]
    tmax_idx += 1
    tmin_true = times_in[tmin_idx]
    tmax_true = times_in[tmax_idx - 1]  # time of last point used

    times = times_in[tmin_idx:tmax_idx]
    n_times = len(times)

    logger.info(
        f"    using t={tmin_true:.3f}s..{tmax_true:.3f}s for estimation ({n_times} "
        "points)"
    )

    return (
        n_signals,
        times,
        n_times,
        times_in,
        n_times_in,
        tmin_idx,
        tmax_idx,
        warn_times,
    )


def _check_freqs(sfreq, fmin, n_times):
    # check that fmin corresponds to at least 5 cycles
    dur = float(n_times) / sfreq
    five_cycle_freq = 5.0 / dur
    if len(fmin) == 1 and fmin[0] == -np.inf:
        # we use the 5 cycle freq. as default
        fmin = np.array([five_cycle_freq])
    else:
        if np.any(fmin < five_cycle_freq):
            warn(
                f"fmin={np.min(fmin):.3f} Hz corresponds to {dur * np.min(fmin):.3f} < "
                f"5 cycles based on the epoch length {dur:.3f} sec, need at least "
                f"{5.0 / np.min(fmin):.3f} sec epochs or fmin={five_cycle_freq:.3f}. "
                "Spectrum estimate will be unreliable."
            )

    return fmin


def _compute_freqs(n_times, sfreq, cwt_freqs, mode):
    from scipy.fft import rfftfreq

    # get frequencies of interest for the different modes
    if mode in ("multitaper", "fourier"):
        # fmin fmax etc is only supported for these modes
        # decide which frequencies to keep
        freqs_all = rfftfreq(n_times, 1.0 / sfreq)
    elif mode == "cwt_morlet":
        # cwt_morlet mode
        if cwt_freqs is None:
            raise ValueError("define frequencies of interest using cwt_freqs")
        else:
            cwt_freqs = cwt_freqs.astype(np.float64)
        if any(cwt_freqs > (sfreq / 2.0)):
            raise ValueError(
                "entries in cwt_freqs cannot be larger than Nyquist (sfreq / 2)"
            )
        freqs_all = cwt_freqs
    else:
        raise ValueError("mode has an invalid value")

    return freqs_all


def _compute_freq_mask(freqs_all, fmin, fmax, fskip):
    # create a frequency mask for all bands
    freq_mask = np.zeros(len(freqs_all), dtype=bool)
    for f_lower, f_upper in zip(fmin, fmax):
        freq_mask |= (freqs_all >= f_lower) & (freqs_all <= f_upper)

    # possibly skip frequency points
    for pos in range(fskip):
        freq_mask[pos + 1 :: fskip + 1] = False
    return freq_mask


def _prepare_connectivity(
    epoch_block,
    times_in,
    tmin,
    tmax,
    fmin,
    fmax,
    sfreq,
    freqs,
    indices,
    method,
    mode,
    fskip,
    n_bands,
    cwt_freqs,
    faverage,
    spectrum_computed,
):
    """Check and precompute dimensions of results data."""
    first_epoch = epoch_block[0]

    # Sort times and freqs
    if spectrum_computed:
        n_signals = first_epoch[0].shape[0]
        times = None
        n_times = None
        times_in = None
        n_times_in = None
        tmin_idx = None
        tmax_idx = None
        warn_times = False
    else:
        (
            n_signals,
            times,
            n_times,
            times_in,
            n_times_in,
            tmin_idx,
            tmax_idx,
            warn_times,
        ) = _check_times(
            data=first_epoch, sfreq=sfreq, times=times_in, tmin=tmin, tmax=tmax
        )
        # check that fmin corresponds to at least 5 cycles
        fmin = _check_freqs(sfreq=sfreq, fmin=fmin, n_times=n_times)
        # compute frequencies to analyze based on number of samples, sampling rate,
        # specified wavelet frequencies, and mode
        freqs = _compute_freqs(n_times, sfreq, cwt_freqs, mode)

    # compute the mask based on specified min/max and decimation factor
    freq_mask = _compute_freq_mask(freqs, fmin, fmax, fskip)

    # the frequency points where we compute connectivity
    freqs = freqs[freq_mask]
    n_freqs = len(freqs)

    # get the freq. indices and points for each band
    freq_idx_bands = [
        np.where((freqs >= fl) & (freqs <= fu))[0] for fl, fu in zip(fmin, fmax)
    ]
    freqs_bands = [freqs[freq_idx] for freq_idx in freq_idx_bands]

    # make sure we don't have empty bands
    for i, n_f_band in enumerate([len(f) for f in freqs_bands]):
        if n_f_band == 0:
            raise ValueError(
                f"There are no frequency points between {fmin[i]:.1f}Hz and "
                f"{fmax[i]:.1f}Hz. Change the band specification (fmin, fmax) or the "
                "frequency resolution."
            )
    if n_bands == 1:
        logger.info(
            f"    frequencies: {freqs_bands[0][0]:.1f}Hz..{freqs_bands[0][-1]:.1f}Hz "
            f"({n_freqs} points)"
        )
    else:
        logger.info("    computing connectivity for the bands:")
        for i, bfreqs in enumerate(freqs_bands):
            logger.info(
                f"     band {i + 1}: {bfreqs[0]:.1f}Hz..{bfreqs[-1]:.1f}Hz "
                f"({len(bfreqs)} points)"
            )
    if faverage:
        logger.info("    connectivity scores will be averaged for each band")

    # Sort indices
    multivariate_con = any(
        this_method in _multivariate_methods for this_method in method
    )

    if indices is None:
        if multivariate_con:
            if any(this_method in _gc_methods for this_method in method):
                raise ValueError(
                    "indices must be specified when computing Granger causality, as "
                    "all-to-all connectivity is not supported"
                )
            logger.info("using all indices for multivariate connectivity")
            # indices expected to be a masked array, even if not ragged
            indices_use = (
                np.arange(n_signals, dtype=int)[np.newaxis, :],
                np.arange(n_signals, dtype=int)[np.newaxis, :],
            )
            indices_use = np.ma.masked_array(indices_use, mask=False, fill_value=-1)
        else:
            logger.info("only using indices for lower-triangular matrix")
            # only compute r for lower-triangular region
            indices_use = np.tril_indices(n_signals, -1)
    else:
        if multivariate_con:
            # pad ragged indices and mask the invalid entries
            indices_use = _check_multivariate_indices(indices, n_signals)
            if any(this_method in _gc_methods for this_method in method):
                for seed, target in zip(indices_use[0], indices_use[1]):
                    intersection = np.intersect1d(
                        seed.compressed(), target.compressed()
                    )
                    if intersection.size > 0:
                        raise ValueError(
                            "seed and target indices must not intersect when computing "
                            "Granger causality"
                        )
        else:
            indices_use = check_indices(indices)

    # number of connections to compute
    n_cons = len(indices_use[0])

    logger.info(f"    computing connectivity for {n_cons} connections")

    return (
        n_cons,
        times,
        n_times,
        times_in,
        n_times_in,
        tmin_idx,
        tmax_idx,
        n_freqs,
        freq_mask,
        freqs,
        freqs_bands,
        freq_idx_bands,
        n_signals,
        indices_use,
        warn_times,
    )


def _assemble_spectral_params(
    mode,
    n_times,
    mt_adaptive,
    mt_bandwidth,
    sfreq,
    mt_low_bias,
    cwt_n_cycles,
    cwt_freqs,
    freqs,
    freq_mask,
):
    """Prepare time-frequency decomposition."""
    spectral_params = dict(eigvals=None, window_fun=None, wavelets=None, weights=None)
    n_tapers = None
    n_times_spectrum = 0
    if mode == "multitaper":
        window_fun, eigvals, mt_adaptive = _compute_mt_params(
            n_times, sfreq, mt_bandwidth, mt_low_bias, mt_adaptive
        )
        spectral_params.update(window_fun=window_fun, eigvals=eigvals)
    elif mode == "fourier":
        logger.info("    using FFT with a Hanning window to estimate spectra")
        spectral_params.update(window_fun=np.hanning(n_times), eigvals=1.0)
    elif mode == "cwt_morlet":
        logger.info("    using CWT with Morlet wavelets to estimate spectra")

        # reformat cwt_n_cycles if we have removed some frequencies
        # using fmin, fmax, fskip
        cwt_n_cycles = np.array((cwt_n_cycles,), dtype=float).ravel()
        if len(cwt_n_cycles) > 1:
            if len(cwt_n_cycles) != len(cwt_freqs):
                raise ValueError(
                    "cwt_n_cycles must be float or an array with the same size as "
                    "cwt_freqs"
                )
            cwt_n_cycles = cwt_n_cycles[freq_mask]

        # get the Morlet wavelets
        spectral_params.update(
            wavelets=morlet(sfreq, freqs, n_cycles=cwt_n_cycles, zero_mean=True)
        )
        n_times_spectrum = n_times
    else:
        raise ValueError("mode has an invalid value")
    return spectral_params, mt_adaptive, n_times_spectrum, n_tapers


########################################################################
# Connectivity estimators base class


class _AbstractConEstBase:
    """ABC for connectivity estimators."""

    def start_epoch(self):
        raise NotImplementedError("start_epoch method not implemented")

    def accumulate(self, con_idx, csd_xy):
        raise NotImplementedError("accumulate method not implemented")

    def combine(self, other):
        raise NotImplementedError("combine method not implemented")

    def compute_con(self, con_idx, n_epochs):
        raise NotImplementedError("compute_con method not implemented")


########################################################################


def _compute_spectra(
    data,
    sfreq,
    mode,
    sig_idx,
    tmin_idx,
    tmax_idx,
    mt_adaptive,
    eigvals,
    wavelets,
    window_fun,
    freq_mask,
    accumulate_psd,
):
    x_t = list()
    this_psd = list()
    for this_data in data:
        if mode in ("multitaper", "fourier"):
            if isinstance(this_data, _BaseSourceEstimate):
                _mt_spectra_partial = partial(_mt_spectra, dpss=window_fun, sfreq=sfreq)
                this_x_t = this_data.transform_data(
                    _mt_spectra_partial,
                    idx=sig_idx,
                    tmin_idx=tmin_idx,
                    tmax_idx=tmax_idx,
                )
            else:
                this_x_t, _ = _mt_spectra(
                    this_data[sig_idx, tmin_idx:tmax_idx], window_fun, sfreq
                )

            if mt_adaptive:
                # compute PSD and adaptive weights
                _this_psd, weights = _psd_from_mt_adaptive(
                    this_x_t, eigvals, freq_mask, return_weights=True
                )

                # only keep freqs of interest
                this_x_t = this_x_t[:, :, freq_mask]
            else:
                # do not use adaptive weights
                this_x_t = this_x_t[:, :, freq_mask]
                if mode == "multitaper":
                    weights = np.sqrt(eigvals)[np.newaxis, :, np.newaxis]
                else:
                    # hack to so we can sum over axis=-2 (tapers dim)
                    weights = np.ones((1, 1, 1))

                if accumulate_psd:
                    _this_psd = _psd_from_mt(this_x_t, weights)
        else:  # mode == 'cwt_morlet'
            weights = None
            if isinstance(this_data, _BaseSourceEstimate):
                cwt_partial = partial(cwt, Ws=wavelets, use_fft=True, mode="same")
                this_x_t = this_data.transform_data(
                    cwt_partial, idx=sig_idx, tmin_idx=tmin_idx, tmax_idx=tmax_idx
                )
            else:
                this_x_t = cwt(
                    this_data[sig_idx, tmin_idx:tmax_idx],
                    wavelets,
                    use_fft=True,
                    mode="same",
                )
            _this_psd = (this_x_t * this_x_t.conj()).real

        x_t.append(this_x_t)
        if accumulate_psd:
            this_psd.append(_this_psd)

    return x_t, this_psd, weights


def _epoch_spectral_connectivity(
    data,
    sig_idx,
    tmin_idx,
    tmax_idx,
    sfreq,
    method,
    mode,
    window_fun,
    eigvals,
    weights,
    wavelets,
    freq_mask,
    mt_adaptive,
    idx_map,
    n_cons,
    block_size,
    psd,
    accumulate_psd,
    con_method_types,
    con_methods,
    n_signals,
    n_signals_use,
    n_times,
    gc_n_lags,
    n_components,
    spectrum_computed,
    accumulate_inplace=True,
):
    """Estimate connectivity for one epoch (see spectral_connectivity)."""
    if any(this_method in _multivariate_methods for this_method in method):
        n_con_signals = n_signals_use**2
    else:
        n_con_signals = n_cons

    if wavelets is not None:
        n_times_spectrum = n_times
        n_freqs = len(wavelets)
    else:
        n_times_spectrum = 0
        n_freqs = np.sum(freq_mask)

    if not accumulate_inplace:
        # instantiate methods only for this epoch (used in parallel mode)
        con_methods = []
        for mtype in con_method_types:
            method_params = list(inspect.signature(mtype).parameters)
            if "n_signals" in method_params:
                # if it's a multivariate connectivity method
                if "n_lags" in method_params:
                    # if it's a Granger causality method
                    con_methods.append(
                        mtype(
                            n_signals_use, n_cons, n_freqs, n_times_spectrum, gc_n_lags
                        )
                    )
                else:
                    # if it's a coherency-based method
                    con_methods.append(
                        mtype(
                            n_signals_use,
                            n_cons,
                            n_freqs,
                            n_times_spectrum,
                            n_components=n_components,
                        )
                    )
            else:
                con_methods.append(mtype(n_cons, n_freqs, n_times_spectrum))

    _check_option("mode", mode, ("cwt_morlet", "multitaper", "fourier"))
    if len(sig_idx) == n_signals:
        # we use all signals: use a slice for faster indexing
        sig_idx = slice(None, None)

    # compute tapered spectra
    if spectrum_computed:  # use existing spectral info
        # XXX: Will need to distinguish time-resolved spectra here if support added
        # Select signals & freqs of interest (flexible indexing for optional tapers dim)
        x_t = np.array(data)[:, sig_idx][..., freq_mask]  # split dims to avoid np.ix_
        if weights is None:  # also assumes no tapers dim
            x_t = np.expand_dims(x_t, axis=2)  # CSD construction expects a tapers dim
            weights = np.ones((1, 1, 1))
        if accumulate_psd:
            this_psd = _psd_from_mt(x_t, weights)
    else:  # compute spectral info from scratch
        x_t, this_psd, weights = _compute_spectra(
            data=data,
            sfreq=sfreq,
            mode=mode,
            sig_idx=sig_idx,
            tmin_idx=tmin_idx,
            tmax_idx=tmax_idx,
            mt_adaptive=mt_adaptive,
            eigvals=eigvals,
            wavelets=wavelets,
            window_fun=window_fun,
            freq_mask=freq_mask,
            accumulate_psd=accumulate_psd,
        )

    x_t = np.concatenate(x_t, axis=0)
    if accumulate_psd:
        this_psd = np.concatenate(this_psd, axis=0)

    # accumulate or return psd
    if accumulate_psd:
        if accumulate_inplace:
            psd += this_psd
        else:
            psd = this_psd
    else:
        psd = None

    # tell the methods that a new epoch starts
    for method in con_methods:
        method.start_epoch()

    # accumulate connectivity scores
    if mode in ["multitaper", "fourier"]:
        for i in range(0, n_con_signals, block_size):
            n_extra = max(0, i + block_size - n_con_signals)
            con_idx = slice(i, i + block_size - n_extra)
            if mt_adaptive:
                csd = _csd_from_mt(
                    x_t[idx_map[0][con_idx]],
                    x_t[idx_map[1][con_idx]],
                    weights[idx_map[0][con_idx]],
                    weights[idx_map[1][con_idx]],
                )
            else:
                csd = _csd_from_mt(
                    x_t[idx_map[0][con_idx]], x_t[idx_map[1][con_idx]], weights, weights
                )

            for method in con_methods:
                method.accumulate(con_idx, csd)
    else:  # mode == 'cwt_morlet'  # reminder to add alternative TFR methods
        for i in range(0, n_con_signals, block_size):
            n_extra = max(0, i + block_size - n_con_signals)
            con_idx = slice(i, i + block_size - n_extra)
            # this codes can be very slow
            csd = x_t[idx_map[0][con_idx]] * x_t[idx_map[1][con_idx]].conjugate()

            for method in con_methods:
                method.accumulate(con_idx, csd)
                # future estimator types need to be explicitly handled here

    return con_methods, psd


def _get_n_epochs(epochs, n):
    """Generate lists with at most n epochs."""
    epochs_out = list()
    for epoch in epochs:
        if not isinstance(epoch, list | tuple):
            epoch = (epoch,)
        epochs_out.append(epoch)
        if len(epochs_out) >= n:
            yield epochs_out
            epochs_out = list()
    if 0 < len(epochs_out) < n:
        yield epochs_out


def _check_method(method):
    """Test if a method implements the required interface."""
    interface_members = [
        m[0]
        for m in inspect.getmembers(_AbstractConEstBase)
        if not m[0].startswith("_")
    ]
    method_members = [
        m[0] for m in inspect.getmembers(method) if not m[0].startswith("_")
    ]

    for member in interface_members:
        if member not in method_members:
            return False, member
    return True, None


def _get_and_verify_data_sizes(
    data, sfreq, n_signals=None, n_times=None, times=None, warn_times=True
):
    """Get and/or verify the data sizes and time scales."""
    if not isinstance(data, list | tuple):
        raise ValueError("data has to be a list or tuple")
    n_signals_tot = 0
    # Sometimes data can be (ndarray, SourceEstimate) groups so in the case
    # where ndarray comes first, don't use it for times
    times_inferred = False
    for this_data in data:
        this_n_signals, this_n_times = this_data.shape
        if n_times is not None:
            if this_n_times != n_times:
                raise ValueError(
                    "all input time series must have the same number of time points"
                )
        else:
            n_times = this_n_times
        n_signals_tot += this_n_signals

        if hasattr(this_data, "times"):
            assert isinstance(this_data, _BaseSourceEstimate)
            this_times = this_data.times
            if times is not None and not times_inferred:
                if warn_times and not np.allclose(times, this_times):
                    with np.printoptions(threshold=4, linewidth=120):
                        warn(
                            "time scales of input time series do not match:\n"
                            f"{this_times}\n{times}"
                        )
                    warn_times = False
            else:
                times = this_times
        elif times is None:
            times_inferred = True
            times = _arange_div(n_times, sfreq)

    if n_signals is not None:
        if n_signals != n_signals_tot:
            raise ValueError(
                "the number of time series has to be the same in each epoch"
            )
    n_signals = n_signals_tot

    return n_signals, n_times, times, warn_times


# map names to estimator types
_CON_METHOD_MAP = {**_CON_METHOD_MAP_BIVARIATE, **_CON_METHOD_MAP_MULTIVARIATE}


def _check_estimators(method):
    """Check construction of connectivity estimators."""
    n_methods = len(method)
    con_method_types = list()
    for this_method in method:
        if this_method in _CON_METHOD_MAP:
            con_method_types.append(_CON_METHOD_MAP[this_method])
        elif isinstance(this_method, str):
            raise ValueError(f"{this_method} is not a valid connectivity method")
        else:
            # support for custom class
            method_valid, msg = _check_method(this_method)
            if not method_valid:
                raise ValueError(
                    f"The supplied connectivity method does not have the method {msg}"
                )
            con_method_types.append(this_method)

    # if none of the comp_con functions needs the PSD, we don't estimate it
    accumulate_psd = any(this_method.accumulate_psd for this_method in con_method_types)

    return con_method_types, n_methods, accumulate_psd


[docs] @verbose @fill_doc def spectral_connectivity_epochs( data, names=None, method="coh", indices=None, sfreq=None, mode="multitaper", fmin=None, fmax=np.inf, fskip=0, faverage=False, tmin=None, tmax=None, mt_bandwidth=None, mt_adaptive=False, mt_low_bias=True, cwt_freqs=None, cwt_n_cycles=7, gc_n_lags=40, rank=None, n_components=1, block_size=1000, n_jobs=1, verbose=None, ): r"""Compute frequency- and time-frequency-domain connectivity measures. The connectivity method(s) are specified using the "method" parameter. All methods are based on estimates of the cross- and power spectral densities (CSD/PSD) Sxy and Sxx, Syy. Parameters ---------- data : array-like, shape=(n_epochs, n_signals, n_times) | Epochs | ~mne.time_frequency.EpochsSpectrum The data from which to compute connectivity. Can be epoched timeseries data as an :term:`array-like` or :class:`~mne.Epochs` object, or Fourier coefficients for each epoch as an :class:`~mne.time_frequency.EpochsSpectrum` object. If timeseries data, the spectral information will be computed according to the spectral estimation mode (see the ``mode`` parameter). If an :class:`~mne.time_frequency.EpochsSpectrum` object, this spectral information will be used and the ``mode`` parameter will be ignored. Note that it is also possible to combine multiple timeseries signals by providing a list of tuples, e.g.: :: data = [(arr_0, stc_0), (arr_1, stc_1), (arr_2, stc_2)] which corresponds to 3 epochs where ``arr_*`` is an array with the same number of time points as ``stc_*``. Data can also be a :class:`list`/:term:`generator` of arrays, ``shape (n_signals, n_times)``, or a :class:`list`/:term:`generator` of :class:`~mne.SourceEstimate` or :class:`~mne.VolSourceEstimate` objects. .. versionchanged:: 0.8 Fourier coefficients stored in an :class:`~mne.time_frequency.EpochsSpectrum` or :class:`~mne.time_frequency.EpochsSpectrumArray` object can also be passed in as data. Storing Fourier coefficients requires ``mne >= 1.8``. %(names)s method : str | list of str Connectivity measure(s) to compute. These can be ``['coh', 'cohy', 'imcoh', 'cacoh', 'mic', 'mim', 'plv', 'ciplv', 'ppc', 'pli', 'dpli', 'wpli', 'wpli2_debiased', 'gc', 'gc_tr']``. These are: * %(coh)s * %(cohy)s * %(imcoh)s * %(cacoh)s * %(mic)s * %(mim)s * %(plv)s * %(ciplv)s * %(ppc)s * %(pli)s * %(pli2_unbiased)s * %(dpli)s * %(wpli)s * %(wpli2_debiased)s * %(gc)s * %(gc_tr)s Multivariate methods (``['cacoh', 'mic', 'mim', 'gc', 'gc_tr']``) cannot be called with the other methods. indices : tuple of array | None Two arrays with indices of connections for which to compute connectivity. If a bivariate method is called, each array for the seeds and targets should contain the channel indices for each bivariate connection. If a multivariate method is called, each array for the seeds and targets should consist of nested arrays containing the channel indices for each multivariate connection. If ``None``, connections between all channels are computed, unless a Granger causality method is called, in which case an error is raised. sfreq : float The sampling frequency. Required if data is an :term:`array-like`. mode : str Spectrum estimation mode can be either: 'multitaper', 'fourier', or 'cwt_morlet'. Ignored if ``data`` is an :class:`~mne.time_frequency.EpochsSpectrum` object. fmin : float | tuple of float | None The lower frequency of interest. Multiple bands are defined using a tuple, e.g., (8., 20.) for two bands with 8 Hz and 20 Hz lower freq. If ``None``, the frequency corresponding to 5 cycles based on the epoch length is used. For example, with an epoch length of 1 sec, the lower frequency would be 5 / 1 sec = 5 Hz. fmax : float | tuple of float The upper frequency of interest. Multiple bands are defined using a tuple, e.g. (13., 30.) for two band with 13 Hz and 30 Hz upper freq. fskip : int Omit every "(fskip + 1)-th" frequency bin to decimate in frequency domain. faverage : bool Average connectivity scores for each frequency band. If True, the output freqs will be a list with arrays of the frequencies that were averaged. tmin : float | None Time to start connectivity estimation. Note: when ``data`` is an :term:`array-like`, the first sample is assumed to be at time 0. For :class:`~mne.Epochs`, the time information contained in the object is used to compute the time indices. Ignored if ``data`` is an :class:`~mne.time_frequency.EpochsSpectrum` object. tmax : float | None Time to end connectivity estimation. Note: when ``data`` is an :term:`array-like`, the first sample is assumed to be at time 0. For :class:`~mne.Epochs`, the time information contained in the object is used to compute the time indices. Ignored if ``data`` is an :class:`~mne.time_frequency.EpochsSpectrum` object. mt_bandwidth : float | None The bandwidth of the multitaper windowing function in Hz. Only used in 'multitaper' mode. Ignored if ``data`` is an :class:`~mne.time_frequency.EpochsSpectrum` object. mt_adaptive : bool Use adaptive weights to combine the tapered spectra into PSD. Only used in 'multitaper' mode. Ignored if ``data`` is an :class:`~mne.time_frequency.EpochsSpectrum` object. mt_low_bias : bool Only use tapers with more than 90 percent spectral concentration within bandwidth. Only used in 'multitaper' mode. Ignored if ``data`` is an :class:`~mne.time_frequency.EpochsSpectrum` object. cwt_freqs : array Array of frequencies of interest. Only used in 'cwt_morlet' mode. Only the frequencies within the range specified by ``fmin`` and ``fmax`` are used. Ignored if ``data`` is an :class:`~mne.time_frequency.EpochsSpectrum` object. cwt_n_cycles : float | array of float Number of cycles. Fixed number or one per frequency. Only used in 'cwt_morlet' mode. Ignored if ``data`` is an :class:`~mne.time_frequency.EpochsSpectrum` object. gc_n_lags : int Number of lags to use for the vector autoregressive model when computing Granger causality. Higher values increase computational cost, but reduce the degree of spectral smoothing in the results. Only used if ``method`` contains any of ``['gc', 'gc_tr']``. rank : tuple of array | None Two arrays with the rank to project the seed and target data to, respectively, using singular value decomposition. If None, the rank of the data is computed and projected to. Only used if ``method`` contains any of ``['cacoh', 'mic', 'mim', 'gc', 'gc_tr']``. n_components : int Number of connectivity components to extract from the data. If an `int`, the number of components must be <= the minimum rank of the seeds and targets. E.g. if the seed channels had a rank of 5 and the target channels had a rank of 3, ``n_components`` must be <= 3. If `None`, the number of components equal to the minimum rank of the seeds and targets is extracted (see the ``rank`` parameter). Only used if ``method`` contains any of ``['cacoh', 'mic']``. .. versionadded:: 0.8 block_size : int How many connections to compute at once (higher numbers are faster but require more memory). n_jobs : int How many samples to process in parallel. %(verbose)s Returns ------- con : instance of SpectralConnectivity or SpectroTemporalConnectivity | list Computed connectivity measure(s). An instance of :class:`SpectralConnectivity`, :class:`SpectroTemporalConnectivity`, or a list of instances corresponding to connectivity measures if several connectivity measures are specified. The shape of the connectivity result will be: - ``(n_cons, n_freqs)`` for multitaper or fourier modes - ``(n_cons, n_freqs, n_times)`` for cwt_morlet mode - ``(n_cons, n_comps, n_freqs (, n_times))`` for valid multivariate methods if ``n_components > 1`` - ``n_cons = n_signals ** 2`` for bivariate methods with ``indices=None`` - ``n_cons = 1`` for multivariate methods with ``indices=None`` - ``n_cons = len(indices[0])`` for bivariate and multivariate methods when indices is supplied See Also -------- mne_connectivity.spectral_connectivity_time mne_connectivity.SpectralConnectivity mne_connectivity.SpectroTemporalConnectivity Notes ----- Please note that the interpretation of the measures in this function depends on the data and underlying assumptions and does not necessarily reflect a causal relationship between brain regions. These measures are not to be interpreted over time. Each Epoch passed into the dataset is interpreted as an independent sample of the same connectivity structure. Within each Epoch, it is assumed that the spectral measure is stationary. The spectral measures implemented in this function are computed across Epochs. **Thus, spectral measures computed with only one Epoch will result in errorful values and spectral measures computed with few Epochs will be unreliable.** Please see :func:`spectral_connectivity_time` for time-resolved connectivity estimation. The spectral densities can be estimated using a multitaper method with digital prolate spheroidal sequence (DPSS) windows, a discrete Fourier transform with Hanning windows, or a continuous wavelet transform using Morlet wavelets. The spectral estimation mode is specified using the "mode" parameter. By default, the connectivity between all signals is computed (only connections corresponding to the lower-triangular part of the connectivity matrix). If one is only interested in the connectivity between some signals, the "indices" parameter can be used. For example, to compute the connectivity between the signal with index 0 and signals "2, 3, 4" (a total of 3 connections) one can use the following:: indices = (np.array([0, 0, 0]), # row indices np.array([2, 3, 4])) # col indices con = spectral_connectivity_epochs(data, method='coh', indices=indices, ...) In this case con.get_data().shape = (3, n_freqs). The connectivity scores are in the same order as defined indices. For multivariate methods, this is handled differently. If "indices" is None, connectivity between all signals will be computed and a single connectivity spectrum will be returned (this is not possible if a Granger causality method is called). If "indices" is specified, seed and target indices for each connection should be specified as nested array-likes. For example, to compute the connectivity between signals (0, 1) -> (2, 3) and (0, 1) -> (4, 5), indices should be specified as:: indices = (np.array([[0, 1], [0, 1]]), # seeds np.array([[2, 3], [4, 5]])) # targets More information on working with multivariate indices and handling connections where the number of seeds and targets are not equal can be found in the :doc:`../auto_examples/handling_ragged_arrays` example. **Supported Connectivity Measures** The connectivity method(s) is specified using the "method" parameter. The following methods are supported (note: ``E[]`` denotes average over epochs). Multiple measures can be computed at once by using a list/tuple, e.g., ``['coh', 'pli']`` to compute coherence and PLI. 'coh' : Coherence given by:: | E[Sxy] | C = --------------------- sqrt(E[Sxx] * E[Syy]) 'cohy' : Coherency given by:: E[Sxy] C = --------------------- sqrt(E[Sxx] * E[Syy]) 'imcoh' : Imaginary coherence :footcite:`NolteEtAl2004` given by:: Im(E[Sxy]) C = ---------------------- sqrt(E[Sxx] * E[Syy]) 'cacoh' : Canonical Coherency (CaCoh) :footcite:`VidaurreEtAl2019` given by: :math:`\textrm{CaCoh}=\Large{\frac{\boldsymbol{a}^T\boldsymbol{D} (\Phi)\boldsymbol{b}}{\sqrt{\boldsymbol{a}^T\boldsymbol{a} \boldsymbol{b}^T\boldsymbol{b}}}}` where: :math:`\boldsymbol{D}(\Phi)` is the cross-spectral density between seeds and targets transformed for a given phase angle :math:`\Phi`; and :math:`\boldsymbol{a}` and :math:`\boldsymbol{b}` are eigenvectors for the seeds and targets, such that :math:`\boldsymbol{a}^T\boldsymbol{D}(\Phi)\boldsymbol{b}` maximises coherency between the seeds and targets. Taking the absolute value of the results gives maximised coherence. 'mic' : Maximised Imaginary part of Coherency (MIC) :footcite:`EwaldEtAl2012` given by: :math:`\textrm{MIC}=\Large{\frac{\boldsymbol{\alpha}^T \boldsymbol{E \beta}}{\parallel\boldsymbol{\alpha}\parallel \parallel\boldsymbol{\beta}\parallel}}` where: :math:`\boldsymbol{E}` is the imaginary part of the transformed cross-spectral density between seeds and targets; and :math:`\boldsymbol{\alpha}` and :math:`\boldsymbol{\beta}` are eigenvectors for the seeds and targets, such that :math:`\boldsymbol{\alpha}^T \boldsymbol{E \beta}` maximises the imaginary part of coherency between the seeds and targets. 'mim' : Multivariate Interaction Measure (MIM) :footcite:`EwaldEtAl2012` given by: :math:`\textrm{MIM}=tr(\boldsymbol{EE}^T)` where :math:`\boldsymbol{E}` is the imaginary part of the transformed cross-spectral density between seeds and targets. 'plv' : Phase-Locking Value (PLV) :footcite:`LachauxEtAl1999` given by:: PLV = |E[Sxy/|Sxy|]| 'ciplv' : corrected imaginary PLV (ciPLV) :footcite:`BrunaEtAl2018` given by:: |E[Im(Sxy/|Sxy|)]| ciPLV = ------------------------------------ sqrt(1 - |E[real(Sxy/|Sxy|)]| ** 2) 'ppc' : Pairwise Phase Consistency (PPC), an unbiased estimator of squared PLV :footcite:`VinckEtAl2010`. 'pli' : Phase Lag Index (PLI) :footcite:`StamEtAl2007` given by:: PLI = |E[sign(Im(Sxy))]| 'pli2_unbiased' : Unbiased estimator of squared PLI :footcite:`VinckEtAl2011`. 'dpli' : Directed Phase Lag Index (DPLI) :footcite:`StamEtAl2012` given by (where H is the Heaviside function):: DPLI = E[H(Im(Sxy))] 'wpli' : Weighted Phase Lag Index (WPLI) :footcite:`VinckEtAl2011` given by:: |E[Im(Sxy)]| WPLI = ------------------ E[|Im(Sxy)|] 'wpli2_debiased' : Debiased estimator of squared WPLI :footcite:`VinckEtAl2011`. 'gc' : State-space Granger Causality (GC) :footcite:`BarnettSeth2015` given by: :math:`GC = ln\Large{(\frac{\lvert\boldsymbol{S}_{tt}\rvert}{\lvert \boldsymbol{S}_{tt}-\boldsymbol{H}_{ts}\boldsymbol{\Sigma}_{ss \lvert t}\boldsymbol{H}_{ts}^*\rvert}})` where: :math:`s` and :math:`t` represent the seeds and targets, respectively; :math:`\boldsymbol{H}` is the spectral transfer function; :math:`\boldsymbol{\Sigma}` is the residuals matrix of the autoregressive model; and :math:`\boldsymbol{S}` is :math:`\boldsymbol{\Sigma}` transformed by :math:`\boldsymbol{H}`. 'gc_tr' : State-space GC on time-reversed signals :footcite:`BarnettSeth2015,WinklerEtAl2016` given by the same equation as for 'gc', but where the autocovariance sequence from which the autoregressive model is produced is transposed to mimic the reversal of the original signal in time :footcite:`HaufeEtAl2012`. References ---------- .. footbibliography:: """ # noqa: E501 if n_jobs != 1: parallel, my_epoch_spectral_connectivity, n_jobs = parallel_func( _epoch_spectral_connectivity, n_jobs, verbose=verbose ) # format fmin and fmax and check inputs if fmin is None: fmin = -np.inf # set it to -inf, so we can adjust it later fmin = np.array((fmin,), dtype=float).ravel() fmax = np.array((fmax,), dtype=float).ravel() if len(fmin) != len(fmax): raise ValueError("fmin and fmax must have the same length") if np.any(fmin > fmax): raise ValueError("fmax must be larger than fmin") n_bands = len(fmin) # assign names to connectivity methods if not isinstance(method, list | tuple): method = [method] # make it a list so we can iterate over it if n_bands != 1 and any(this_method in _gc_methods for this_method in method): raise ValueError( "computing Granger causality on multiple frequency bands is not yet " "supported" ) if any(this_method in _multivariate_methods for this_method in method): if not all(this_method in _multivariate_methods for this_method in method): raise ValueError( "bivariate and multivariate connectivity methods cannot be used in the " "same function call" ) multivariate_con = True else: multivariate_con = False # handle connectivity estimators (con_method_types, n_methods, accumulate_psd) = _check_estimators(method) times_in = None events = None event_id = None freqs = None weights = None metadata = None spectrum_computed = False if isinstance(data, BaseEpochs | EpochsSpectrum | EpochsSpectrumArray): names = data.ch_names sfreq = data.info["sfreq"] events = data.events event_id = data.event_id # Extract metadata from the Epochs data structure. # Make Annotations persist through by adding them to the metadata. metadata = data.metadata if metadata is None: annots_in_metadata = False else: annots_in_metadata = all( name not in metadata.columns for name in ["annot_onset", "annot_duration", "annot_description"] ) if hasattr(data, "annotations") and not annots_in_metadata: data.add_annotations_to_metadata(overwrite=True) metadata = data.metadata if isinstance(data, EpochsSpectrum | EpochsSpectrumArray): # XXX: Will need to be updated if new Spectrum methods are added if not np.iscomplexobj(data.get_data()): raise TypeError( "if `data` is an EpochsSpectrum object, it must contain " "complex-valued Fourier coefficients, such as that returned from " "Epochs.compute_psd(output='complex')" ) if "segment" in data._dims: raise ValueError( "`data` cannot contain Fourier coefficients for individual segments" ) if isinstance(data, EpochsSpectrum): # mode can be read mode from Spectrum mode = data.method mode = "fourier" if mode == "welch" else mode else: # spectral method is "unknown", so take mode from data dimensions # Currently, actual mode doesn't matter as long as we handle tapers and # their weights in the same way as for multitaper spectra mode = "multitaper" if "taper" in data._dims else "fourier" spectrum_computed = True freqs = data.freqs weights = data.weights else: times_in = data.times # input times for Epochs input type elif sfreq is None: raise ValueError("Sampling frequency (sfreq) is required with array input.") # loop over data; it could be a generator that returns # (n_signals x n_times) arrays or SourceEstimates epoch_idx = 0 logger.info("Connectivity computation...") warn_times = True for epoch_block in _get_n_epochs(data, n_jobs): if epoch_idx == 0: # initialize everything times and frequencies ( n_cons, times, n_times, times_in, n_times_in, tmin_idx, tmax_idx, n_freqs, freq_mask, freqs, freqs_bands, freq_idx_bands, n_signals, indices_use, warn_times, ) = _prepare_connectivity( epoch_block=epoch_block, times_in=times_in, tmin=tmin, tmax=tmax, fmin=fmin, fmax=fmax, sfreq=sfreq, freqs=freqs, indices=indices, method=method, mode=mode, fskip=fskip, n_bands=n_bands, cwt_freqs=cwt_freqs, faverage=faverage, spectrum_computed=spectrum_computed, ) # check rank input and compute data ranks if necessary if multivariate_con: rank = _check_rank_input(rank, data, indices_use) n_components = _check_n_components_input(n_components, rank) if n_components == 1: # n_components=0 means space for a components dimension is not # allocated in the results, similar to how n_times_spectrum=0 is # used to indicate that time is not a dimension in the results n_components = 0 else: rank = None n_components = 0 gc_n_lags = None # make sure padded indices are stored in the connectivity object if multivariate_con and indices is not None: # create a copy so that `indices_use` can be modified indices = (indices_use[0].copy(), indices_use[1].copy()) # get the window function, wavelets, etc for different modes if not spectrum_computed: spectral_params, mt_adaptive, n_times_spectrum, n_tapers = ( _assemble_spectral_params( mode=mode, n_times=n_times, mt_adaptive=mt_adaptive, mt_bandwidth=mt_bandwidth, sfreq=sfreq, mt_low_bias=mt_low_bias, cwt_n_cycles=cwt_n_cycles, cwt_freqs=cwt_freqs, freqs=freqs, freq_mask=freq_mask, ) ) else: spectral_params = dict( eigvals=None, window_fun=None, wavelets=None, weights=weights ) n_times_spectrum = 0 n_tapers = None if weights is None else weights.size # unique signals for which we actually need to compute PSD etc. if multivariate_con: sig_idx = np.unique(indices_use.compressed()) remapping = {ch_i: sig_i for sig_i, ch_i in enumerate(sig_idx)} remapped_inds = indices_use.copy() for idx in sig_idx: remapped_inds[indices_use == idx] = remapping[idx] remapped_sig = np.unique(remapped_inds.compressed()) else: sig_idx = np.unique(np.r_[indices_use[0], indices_use[1]]) n_signals_use = len(sig_idx) # map indices to unique indices if multivariate_con: indices_use = remapped_inds # use remapped seeds & targets idx_map = [ np.sort(np.repeat(remapped_sig, len(sig_idx))), np.tile(remapped_sig, len(sig_idx)), ] else: idx_map = [np.searchsorted(sig_idx, ind) for ind in indices_use] # allocate space to accumulate PSD if accumulate_psd: if n_times_spectrum == 0: psd_shape = (n_signals_use, n_freqs) else: psd_shape = (n_signals_use, n_freqs, n_times_spectrum) psd = np.zeros(psd_shape) else: psd = None # create instances of the connectivity estimators con_methods = [] for mtype_i, mtype in enumerate(con_method_types): method_params = dict( n_cons=n_cons, n_freqs=n_freqs, n_times=n_times_spectrum ) if method[mtype_i] in _multivariate_methods: method_params.update(dict(n_signals=n_signals_use, n_jobs=n_jobs)) if method[mtype_i] in _multicomp_methods: method_params.update(dict(n_components=n_components)) if method[mtype_i] in _gc_methods: method_params.update(dict(n_lags=gc_n_lags)) con_methods.append(mtype(**method_params)) sep = ", " metrics_str = sep.join([meth.name for meth in con_methods]) logger.info(f" the following metrics will be computed: {metrics_str}") # check dimensions and time scale if not spectrum_computed: # XXX: Can we assume upstream checks sufficient? for this_epoch in epoch_block: _, _, _, warn_times = _get_and_verify_data_sizes( this_epoch, sfreq, n_signals, n_times_in, times_in, warn_times=warn_times, ) call_params = dict( sig_idx=sig_idx, tmin_idx=tmin_idx, tmax_idx=tmax_idx, sfreq=sfreq, method=method, mode=mode, freq_mask=freq_mask, idx_map=idx_map, n_cons=n_cons, block_size=block_size, psd=psd, accumulate_psd=accumulate_psd, mt_adaptive=mt_adaptive, con_method_types=con_method_types, con_methods=con_methods if n_jobs == 1 else None, n_signals=n_signals, n_signals_use=n_signals_use, n_times=n_times, gc_n_lags=gc_n_lags, n_components=n_components, spectrum_computed=spectrum_computed, accumulate_inplace=True if n_jobs == 1 else False, ) call_params.update(**spectral_params) if n_jobs == 1: # no parallel processing for this_epoch in epoch_block: logger.info( f" computing cross-spectral density for epoch {epoch_idx + 1}" ) # con methods and psd are updated inplace _epoch_spectral_connectivity(data=this_epoch, **call_params) epoch_idx += 1 else: # process epochs in parallel logger.info( f" computing cross-spectral density for epochs {epoch_idx + 1}.." f"{epoch_idx + len(epoch_block)}" ) out = parallel( my_epoch_spectral_connectivity(data=this_epoch, **call_params) for this_epoch in epoch_block ) # do the accumulation for this_out in out: for _method, parallel_method in zip(con_methods, this_out[0]): _method.combine(parallel_method) if accumulate_psd: psd += this_out[1] epoch_idx += len(epoch_block) # normalize n_epochs = epoch_idx if accumulate_psd: psd /= n_epochs # compute final connectivity scores con = list() patterns = list() for method_i, conn_method in enumerate(con_methods): # future estimators will need to be handled here if conn_method.accumulate_psd: # compute scores block-wise to save memory for i in range(0, n_cons, block_size): con_idx = slice(i, i + block_size) psd_xx = psd[idx_map[0][con_idx]] psd_yy = psd[idx_map[1][con_idx]] conn_method.compute_con(con_idx, n_epochs, psd_xx, psd_yy) else: # compute all scores at once if method[method_i] in _multivariate_methods: conn_method.compute_con(indices_use, rank, n_epochs) else: conn_method.compute_con(slice(0, n_cons), n_epochs) # get the connectivity scores this_con = conn_method.con_scores this_patterns = conn_method.patterns if this_con.shape[0] != n_cons: raise RuntimeError( "first dimension of connectivity scores does not match the number of " "connections; please contact the mne-connectivity developers" ) if faverage: if n_components != 0 and method[method_i] in _multicomp_methods: this_con = np.moveaxis(this_con, 2, 1) # make freqs the 2nd dimension if this_con.shape[1] != n_freqs: raise RuntimeError( "second dimension of connectivity scores does not match the number " "of frequencies; please contact the mne-connectivity developers" ) con_shape = (n_cons, n_bands) + this_con.shape[2:] this_con_bands = np.empty(con_shape, dtype=this_con.dtype) for band_idx in range(n_bands): this_con_bands[:, band_idx] = np.mean( this_con[:, freq_idx_bands[band_idx]], axis=1 ) this_con = this_con_bands if n_components != 0 and method[method_i] in _multicomp_methods: this_con = np.moveaxis(this_con, 1, 2) # return comps to 2nd dimension if this_patterns is not None: if n_components != 0: # make freqs the 4th dimension this_patterns = np.moveaxis(this_patterns, 4, 3) patterns_shape = list(this_patterns.shape) patterns_shape[3] = n_bands this_patterns_bands = np.empty( patterns_shape, dtype=this_patterns.dtype ) for band_idx in range(n_bands): this_patterns_bands[:, :, :, band_idx] = np.mean( this_patterns[:, :, :, freq_idx_bands[band_idx]], axis=3 ) this_patterns = this_patterns_bands if n_components != 0: # return comps to 4th dimension this_patterns = np.moveaxis(this_patterns, 3, 4) con.append(this_con) patterns.append(this_patterns) freqs_used = freqs if faverage: # for each band we return the frequencies that were averaged freqs = [np.mean(x) for x in freqs_bands] # make sure freq_bands is a list of equal-length lists # XXX: we lose information on which frequency points went into the # computation. If h5netcdf supports numpy objects in the future, then # we can change the min/max to just make it a list of lists. freqs_used = freqs_bands freqs_used = [[np.min(band), np.max(band)] for band in freqs_used] if indices is None and not multivariate_con: # return all-to-all connectivity matrices # raveled into a 1D array logger.info(" assembling connectivity matrix") con_flat = con con = list() for this_con_flat in con_flat: this_con = np.zeros( (n_signals, n_signals) + this_con_flat.shape[1:], dtype=this_con_flat.dtype, ) this_con[indices_use] = this_con_flat # ravel 2D connectivity into a 1D array # while keeping other dimensions this_con = this_con.reshape((n_signals**2,) + this_con_flat.shape[1:]) con.append(this_con) # number of nodes in the original data n_nodes = n_signals # create a list of connectivity containers conn_list = [] for _con, _patterns, _method in zip(con, patterns, method): kwargs = dict( data=_con, patterns=_patterns, names=names, freqs=freqs, method=_method, n_nodes=n_nodes, spec_method=mode if not isinstance(data, BaseSpectrum) else data.method, indices=indices, n_epochs_used=n_epochs, freqs_used=freqs_used, times_used=times, n_tapers=n_tapers, metadata=metadata, events=events, event_id=event_id, rank=rank, n_lags=gc_n_lags if _method in _gc_methods else None, ) if n_components and _method in _multicomp_methods: kwargs.update(components=np.arange(n_components) + 1) # create the connectivity container if mode in ["multitaper", "fourier"]: klass = SpectralConnectivity else: assert mode == "cwt_morlet" klass = SpectroTemporalConnectivity kwargs.update(times=times) conn_list.append(klass(**kwargs)) logger.info("[Connectivity computation done]") if n_methods == 1: # for a single method return connectivity directly conn_list = conn_list[0] return conn_list