braindecode 0.8.1__py3-none-any.whl → 1.0.0__py3-none-any.whl

This diff shows the content changes between two publicly released versions of the package, as they appear in their public registry. It is provided for informational purposes only.

Files changed (108)
  1. braindecode/__init__.py +1 -2
  2. braindecode/augmentation/__init__.py +39 -19
  3. braindecode/augmentation/base.py +25 -28
  4. braindecode/augmentation/functional.py +237 -100
  5. braindecode/augmentation/transforms.py +326 -158
  6. braindecode/classifier.py +26 -24
  7. braindecode/datasets/__init__.py +28 -10
  8. braindecode/datasets/base.py +220 -134
  9. braindecode/datasets/bbci.py +43 -52
  10. braindecode/datasets/bcicomp.py +47 -32
  11. braindecode/datasets/bids.py +245 -0
  12. braindecode/datasets/mne.py +45 -24
  13. braindecode/datasets/moabb.py +87 -27
  14. braindecode/datasets/nmt.py +311 -0
  15. braindecode/datasets/sleep_physio_challe_18.py +412 -0
  16. braindecode/datasets/sleep_physionet.py +43 -26
  17. braindecode/datasets/tuh.py +324 -140
  18. braindecode/datasets/xy.py +27 -12
  19. braindecode/datautil/__init__.py +34 -18
  20. braindecode/datautil/serialization.py +98 -71
  21. braindecode/eegneuralnet.py +63 -47
  22. braindecode/functional/__init__.py +10 -0
  23. braindecode/functional/functions.py +251 -0
  24. braindecode/functional/initialization.py +47 -0
  25. braindecode/models/__init__.py +36 -14
  26. braindecode/models/atcnet.py +153 -159
  27. braindecode/models/attentionbasenet.py +550 -0
  28. braindecode/models/base.py +86 -102
  29. braindecode/models/biot.py +483 -0
  30. braindecode/models/contrawr.py +296 -0
  31. braindecode/models/ctnet.py +450 -0
  32. braindecode/models/deep4.py +64 -75
  33. braindecode/models/deepsleepnet.py +149 -119
  34. braindecode/models/eegconformer.py +111 -171
  35. braindecode/models/eeginception_erp.py +109 -118
  36. braindecode/models/eeginception_mi.py +155 -97
  37. braindecode/models/eegitnet.py +215 -151
  38. braindecode/models/eegminer.py +255 -0
  39. braindecode/models/eegnet.py +229 -161
  40. braindecode/models/eegnex.py +247 -0
  41. braindecode/models/eegresnet.py +234 -152
  42. braindecode/models/eegsimpleconv.py +199 -0
  43. braindecode/models/eegtcnet.py +335 -0
  44. braindecode/models/fbcnet.py +221 -0
  45. braindecode/models/fblightconvnet.py +313 -0
  46. braindecode/models/fbmsnet.py +325 -0
  47. braindecode/models/hybrid.py +52 -71
  48. braindecode/models/ifnet.py +441 -0
  49. braindecode/models/labram.py +1166 -0
  50. braindecode/models/msvtnet.py +375 -0
  51. braindecode/models/sccnet.py +182 -0
  52. braindecode/models/shallow_fbcsp.py +50 -56
  53. braindecode/models/signal_jepa.py +1012 -0
  54. braindecode/models/sinc_shallow.py +337 -0
  55. braindecode/models/sleep_stager_blanco_2020.py +55 -46
  56. braindecode/models/sleep_stager_chambon_2018.py +54 -53
  57. braindecode/models/sleep_stager_eldele_2021.py +248 -141
  58. braindecode/models/sparcnet.py +378 -0
  59. braindecode/models/summary.csv +41 -0
  60. braindecode/models/syncnet.py +232 -0
  61. braindecode/models/tcn.py +158 -88
  62. braindecode/models/tidnet.py +280 -167
  63. braindecode/models/tsinception.py +258 -0
  64. braindecode/models/usleep.py +190 -177
  65. braindecode/models/util.py +109 -141
  66. braindecode/modules/__init__.py +38 -0
  67. braindecode/modules/activation.py +60 -0
  68. braindecode/modules/attention.py +757 -0
  69. braindecode/modules/blocks.py +108 -0
  70. braindecode/modules/convolution.py +274 -0
  71. braindecode/modules/filter.py +632 -0
  72. braindecode/modules/layers.py +133 -0
  73. braindecode/modules/linear.py +50 -0
  74. braindecode/modules/parametrization.py +38 -0
  75. braindecode/modules/stats.py +77 -0
  76. braindecode/modules/util.py +77 -0
  77. braindecode/modules/wrapper.py +75 -0
  78. braindecode/preprocessing/__init__.py +36 -11
  79. braindecode/preprocessing/mne_preprocess.py +13 -7
  80. braindecode/preprocessing/preprocess.py +139 -75
  81. braindecode/preprocessing/windowers.py +576 -187
  82. braindecode/regressor.py +23 -12
  83. braindecode/samplers/__init__.py +16 -8
  84. braindecode/samplers/base.py +148 -32
  85. braindecode/samplers/ssl.py +162 -17
  86. braindecode/training/__init__.py +18 -10
  87. braindecode/training/callbacks.py +2 -4
  88. braindecode/training/losses.py +3 -8
  89. braindecode/training/scoring.py +76 -68
  90. braindecode/util.py +55 -59
  91. braindecode/version.py +1 -1
  92. braindecode/visualization/__init__.py +2 -3
  93. braindecode/visualization/confusion_matrices.py +117 -73
  94. braindecode/visualization/gradients.py +14 -10
  95. {braindecode-0.8.1.dist-info → braindecode-1.0.0.dist-info}/METADATA +39 -55
  96. braindecode-1.0.0.dist-info/RECORD +101 -0
  97. {braindecode-0.8.1.dist-info → braindecode-1.0.0.dist-info}/WHEEL +1 -1
  98. {braindecode-0.8.1.dist-info → braindecode-1.0.0.dist-info/licenses}/LICENSE.txt +1 -1
  99. braindecode-1.0.0.dist-info/licenses/NOTICE.txt +20 -0
  100. braindecode/datautil/mne.py +0 -9
  101. braindecode/datautil/preprocess.py +0 -12
  102. braindecode/datautil/windowers.py +0 -6
  103. braindecode/datautil/xy.py +0 -9
  104. braindecode/models/eeginception.py +0 -317
  105. braindecode/models/functions.py +0 -47
  106. braindecode/models/modules.py +0 -358
  107. braindecode-0.8.1.dist-info/RECORD +0 -68
  108. {braindecode-0.8.1.dist-info → braindecode-1.0.0.dist-info}/top_level.txt +0 -0
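The only file-level diff reproduced below is braindecode/preprocessing/windowers.py (entry 81 above, +576 -187). Beyond a wholesale black-style reformatting of the module (double quotes, wrapped argument lists), it adds type annotations, an explicit use_mne_epochs argument on create_windows_from_events, and an experimental lazy_metadata option on create_fixed_length_windows backed by the new _LazyDataFrame helper. A minimal usage sketch of the two new options, based only on the signatures visible in the diff; the dataset name, subject id, and window sizes are illustrative assumptions, not taken from this diff:

from braindecode.datasets import MOABBDataset
from braindecode.preprocessing import (
    create_fixed_length_windows,
    create_windows_from_events,
)

# Illustrative dataset; any BaseConcatDataset of raw recordings works.
dataset = MOABBDataset(dataset_name="BNCI2014_001", subject_ids=[1])

# use_mne_epochs is now an explicit argument: False forces the faster
# EEGWindowsDataset path, and raises if reject/picks/flat would require
# mne.Epochs (see _get_use_mne_epochs in the diff below).
windows = create_windows_from_events(
    dataset,
    trial_start_offset_samples=0,
    trial_stop_offset_samples=0,
    use_mne_epochs=False,
)

# lazy_metadata defers per-window metadata to the _LazyDataFrame helper;
# the argument checks in the diff require drop_last_window=True in that case.
lazy_windows = create_fixed_length_windows(
    dataset,
    window_size_samples=500,
    window_stride_samples=500,
    drop_last_window=True,
    lazy_metadata=True,
)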
braindecode/preprocessing/windowers.py

@@ -1,5 +1,4 @@
-"""Get epochs from mne.Raw
-"""
+"""Get epochs from mne.Raw"""
 
 # Authors: Hubert Banville <hubert.jbanville@gmail.com>
 #          Lukas Gemein <l.gemein@gmail.com>
@@ -15,23 +14,199 @@
 #
 # License: BSD (3-clause)
 
+from __future__ import annotations
+
 import warnings
+from typing import Any, Callable
 
-import numpy as np
 import mne
+import numpy as np
 import pandas as pd
 from joblib import Parallel, delayed
+from numpy.typing import ArrayLike
 
-from ..datasets.base import WindowsDataset, BaseConcatDataset, EEGWindowsDataset
+from ..datasets.base import BaseConcatDataset, EEGWindowsDataset, WindowsDataset
+
+
+class _LazyDataFrame:
+    """
+    DataFrame-like object that lazily computes values (experimental).
+
+    This class emulates some features of a pandas DataFrame, but computes
+    the values on-the-fly when they are accessed. This is useful for
+    very long DataFrames with repetitive values.
+    Only the methods used by EEGWindowsDataset on its metadata are implemented.
+
+    Parameters:
+    -----------
+    length: int
+        The length of the dataframe.
+    functions: dict[str, Callable[[int], Any]]
+        A dictionary mapping column names to functions that take an index and
+        return the value of the column at that index.
+    columns: list[str]
+        The names of the columns in the dataframe.
+    series: bool
+        Whether the object should emulate a series or a dataframe.
+    """
+
+    def __init__(
+        self,
+        length: int,
+        functions: dict[str, Callable[[int], Any]],
+        columns: list[str],
+        series: bool = False,
+    ):
+        if not (isinstance(length, int) and length >= 0):
+            raise ValueError("Length must be a positive integer.")
+        if not all(c in functions for c in columns):
+            raise ValueError("All columns must have a corresponding function.")
+        if series and len(columns) != 1:
+            raise ValueError("Series must have exactly one column.")
+        self.length = length
+        self.functions = functions
+        self.columns = columns
+        self.series = series
+
+    @property
+    def loc(self):
+        return self
+
+    def __len__(self):
+        return self.length
+
+    def __getitem__(self, key):
+        if not isinstance(key, tuple):
+            key = (key, self.columns)
+        if len(key) == 1:
+            key = (key[0], self.columns)
+        if not len(key) == 2:
+            raise IndexError(
+                f"index must be either [row] or [row, column], got [{', '.join(map(str, key))}]."
+            )
+        row, col = key
+        if col == slice(None):  # all columns (i.e., call to df[row, :])
+            col = self.columns
+        one_col = False
+        if isinstance(col, str):  # one column
+            one_col = True
+            col = [col]
+        else:  # multiple columns
+            col = list(col)
+        if not all(c in self.columns for c in col):
+            raise IndexError(
+                f"All columns must be present in the dataframe with columns {self.columns}. Got {col}."
+            )
+        if row == slice(None):  # all rows (i.e., call to df[:] or df[:, col])
+            return _LazyDataFrame(self.length, self.functions, col)
+        if not isinstance(row, int):
+            raise NotImplementedError(
+                "Row indexing only supports either a single integer or a null slice (i.e., df[:])."
+            )
+        if not (0 <= row < self.length):
+            raise IndexError(f"Row index {row} is out of bounds.")
+        if self.series or one_col:
+            return self.functions[col[0]](row)
+        return pd.Series({c: self.functions[c](row) for c in col})
+
+    def to_numpy(self):
+        return _LazyDataFrame(
+            length=self.length,
+            functions=self.functions,
+            columns=self.columns,
+            series=len(self.columns) == 1,
+        )
+
+    def to_list(self):
+        return self.to_numpy()
+
+
+class _FixedLengthWindowFunctions:
+    """Class defining functions for lazy metadata generation in fixed length windowing
+    to be used in combination with _LazyDataFrame (experimental)."""
+
+    def __init__(
+        self,
+        start_offset_samples: int,
+        last_potential_start: int,
+        window_stride_samples: int,
+        window_size_samples: int,
+        target: Any,
+    ):
+        self.start_offset_samples = start_offset_samples
+        self.last_potential_start = last_potential_start
+        self.window_stride_samples = window_stride_samples
+        self.window_size_samples = window_size_samples
+        self.target_val = target
+
+    @property
+    def length(self) -> int:
+        return int(
+            np.ceil(
+                (self.last_potential_start + 1 - self.start_offset_samples)
+                / self.window_stride_samples
+            )
+        )
+
+    def i_window_in_trial(self, i: int) -> int:
+        return i
+
+    def i_start_in_trial(self, i: int) -> int:
+        return self.start_offset_samples + i * self.window_stride_samples
+
+    def i_stop_in_trial(self, i: int) -> int:
+        return (
+            self.start_offset_samples
+            + i * self.window_stride_samples
+            + self.window_size_samples
+        )
+
+    def target(self, i: int) -> Any:
+        return self.target_val
+
+
+def _get_use_mne_epochs(use_mne_epochs, reject, picks, flat, drop_bad_windows):
+    should_use_mne_epochs = (
+        (reject is not None)
+        or (picks is not None)
+        or (flat is not None)
+        or (drop_bad_windows is True)
+    )
+    if use_mne_epochs is None:
+        if should_use_mne_epochs:
+            warnings.warn(
+                "Using reject or picks or flat or dropping bad windows means "
+                "mne Epochs are created, "
+                "which will be substantially slower and may be deprecated in the future."
+            )
+        return should_use_mne_epochs
+    if not use_mne_epochs and should_use_mne_epochs:
+        raise ValueError(
+            "Cannot set use_mne_epochs=False when using reject, picks, flat, or dropping bad windows."
+        )
+    return use_mne_epochs
 
 
 # XXX it's called concat_ds...
 def create_windows_from_events(
-        concat_ds, trial_start_offset_samples=0, trial_stop_offset_samples=0,
-        window_size_samples=None, window_stride_samples=None,
-        drop_last_window=False, mapping=None, preload=False,
-        drop_bad_windows=None, picks=None, reject=None, flat=None,
-        on_missing='error', accepted_bads_ratio=0.0, n_jobs=1, verbose='error'):
+    concat_ds: BaseConcatDataset,
+    trial_start_offset_samples: int = 0,
+    trial_stop_offset_samples: int = 0,
+    window_size_samples: int | None = None,
+    window_stride_samples: int | None = None,
+    drop_last_window: bool = False,
+    mapping: dict[str, int] | None = None,
+    preload: bool = False,
+    drop_bad_windows: bool | None = None,
+    picks: str | ArrayLike | slice | None = None,
+    reject: dict[str, float] | None = None,
+    flat: dict[str, float] | None = None,
+    on_missing: str = "error",
+    accepted_bads_ratio: float = 0.0,
+    use_mne_epochs: bool | None = None,
+    n_jobs: int = 1,
+    verbose: bool | str | int | None = "error",
+):
     """Create windows based on events in mne.Raw.
 
     This function extracts windows of size window_size_samples in the interval
@@ -100,6 +275,10 @@ def create_windows_from_events(
        smaller than this, then only the corresponding trials are dropped, but
        the computation continues. Otherwise, an error is raised. Defaults to
        0.0 (raise an error).
+    use_mne_epochs: bool
+        If False, return EEGWindowsDataset objects.
+        If True, return mne.Epochs objects encapsulated in WindowsDataset objects,
+        which is substantially slower that EEGWindowsDataset.
     n_jobs: int
        Number of jobs to use to parallelize the windowing.
     verbose: bool | str | int | None
@@ -111,8 +290,11 @@ def create_windows_from_events(
        Concatenated datasets of WindowsDataset containing the extracted windows.
     """
     _check_windowing_arguments(
-        trial_start_offset_samples, trial_stop_offset_samples,
-        window_size_samples, window_stride_samples)
+        trial_start_offset_samples,
+        trial_stop_offset_samples,
+        window_size_samples,
+        window_stride_samples,
+    )
 
     # If user did not specify mapping, we extract all events from all datasets
     # and map them to increasing integers starting from 0
@@ -121,34 +303,62 @@ def create_windows_from_events(
     infer_window_size_stride = window_size_samples is None
 
     if drop_bad_windows is not None:
-        warnings.warn('Drop bad windows only has an effect if mne epochs are created, '
-                      'and this argument may be removed in the future.')
+        warnings.warn(
+            "Drop bad windows only has an effect if mne epochs are created, "
+            "and this argument may be removed in the future."
+        )
 
-    use_mne_epochs = (reject is not None) or (picks is not None) or (flat is not None) or (
-        drop_bad_windows is True)
-    if use_mne_epochs:
-        warnings.warn('Using reject or picks or flat or dropping bad windows means '
-                      'mne Epochs are created, '
-                      'which will be substantially slower and may be deprecated in the future.')
-        if drop_bad_windows is None:
-            drop_bad_windows = True
+    use_mne_epochs = _get_use_mne_epochs(
+        use_mne_epochs, reject, picks, flat, drop_bad_windows
+    )
+    if use_mne_epochs and drop_bad_windows is None:
+        drop_bad_windows = True
 
     list_of_windows_ds = Parallel(n_jobs=n_jobs)(
         delayed(_create_windows_from_events)(
-            ds, infer_mapping, infer_window_size_stride,
-            trial_start_offset_samples, trial_stop_offset_samples,
-            window_size_samples, window_stride_samples, drop_last_window,
-            mapping, preload, drop_bad_windows, picks, reject, flat,
-            on_missing, accepted_bads_ratio, verbose, use_mne_epochs) for ds in concat_ds.datasets)
+            ds,
+            infer_mapping,
+            infer_window_size_stride,
+            trial_start_offset_samples,
+            trial_stop_offset_samples,
+            window_size_samples,
+            window_stride_samples,
+            drop_last_window,
+            mapping,
+            preload,
+            drop_bad_windows,
+            picks,
+            reject,
+            flat,
+            on_missing,
+            accepted_bads_ratio,
+            verbose,
+            use_mne_epochs,
+        )
+        for ds in concat_ds.datasets
+    )
     return BaseConcatDataset(list_of_windows_ds)
 
 
 def create_fixed_length_windows(
-        concat_ds, start_offset_samples=0, stop_offset_samples=None,
-        window_size_samples=None, window_stride_samples=None, drop_last_window=None,
-        mapping=None, preload=False, picks=None,
-        reject=None, flat=None, targets_from='metadata', last_target_only=True,
-        on_missing='error', n_jobs=1, verbose='error'):
+    concat_ds: BaseConcatDataset,
+    start_offset_samples: int = 0,
+    stop_offset_samples: int | None = None,
+    window_size_samples: int | None = None,
+    window_stride_samples: int | None = None,
+    drop_last_window: bool | None = None,
+    mapping: dict[str, int] | None = None,
+    preload: bool = False,
+    picks: str | ArrayLike | slice | None = None,
+    reject: dict[str, float] | None = None,
+    flat: dict[str, float] | None = None,
+    targets_from: str = "metadata",
+    last_target_only: bool = True,
+    lazy_metadata: bool = False,
+    on_missing: str = "error",
+    n_jobs: int = 1,
+    verbose: bool | str | int | None = "error",
+):
     """Windower that creates sliding windows.
 
     Parameters
@@ -183,6 +393,9 @@ def create_fixed_length_windows(
     flat: dict | None
        Epoch rejection parameters based on flatness of signals. If None, no
        rejection based on flatness is done. See mne.Epochs.
+    lazy_metadata: bool
+        If True, metadata is not computed immediately, but only when accessed
+        by using the _LazyDataFrame (experimental).
     on_missing: str
        What to do if one or several event ids are not found in the recording.
        Valid keys are ‘error’ | ‘warning’ | ‘ignore’. See mne.Epochs.
@@ -196,35 +409,70 @@ def create_fixed_length_windows(
     windows_datasets: BaseConcatDataset
        Concatenated datasets of WindowsDataset containing the extracted windows.
     """
-    stop_offset_samples, drop_last_window = _check_and_set_fixed_length_window_arguments(
-        start_offset_samples, stop_offset_samples, window_size_samples, window_stride_samples,
-        drop_last_window)
+    stop_offset_samples, drop_last_window = (
+        _check_and_set_fixed_length_window_arguments(
+            start_offset_samples,
+            stop_offset_samples,
+            window_size_samples,
+            window_stride_samples,
+            drop_last_window,
+            lazy_metadata,
+        )
+    )
 
     # check if recordings are of different lengths
     lengths = np.array([ds.raw.n_times for ds in concat_ds.datasets])
     if (np.diff(lengths) != 0).any() and window_size_samples is None:
-        warnings.warn('Recordings have different lengths, they will not be batch-able!')
+        warnings.warn("Recordings have different lengths, they will not be batch-able!")
     if (window_size_samples is not None) and any(window_size_samples > lengths):
-        raise ValueError(f'Window size {window_size_samples} exceeds trial '
-                         f'duration {lengths.min()}.')
+        raise ValueError(
+            f"Window size {window_size_samples} exceeds trial duration {lengths.min()}."
+        )
 
     list_of_windows_ds = Parallel(n_jobs=n_jobs)(
        delayed(_create_fixed_length_windows)(
-            ds, start_offset_samples, stop_offset_samples, window_size_samples,
-            window_stride_samples, drop_last_window, mapping, preload,
-            picks, reject, flat, targets_from, last_target_only,
-            on_missing, verbose) for ds in concat_ds.datasets)
+            ds,
+            start_offset_samples,
+            stop_offset_samples,
+            window_size_samples,
+            window_stride_samples,
+            drop_last_window,
+            mapping,
+            preload,
+            picks,
+            reject,
+            flat,
+            targets_from,
+            last_target_only,
+            lazy_metadata,
+            on_missing,
+            verbose,
+        )
+        for ds in concat_ds.datasets
+    )
     return BaseConcatDataset(list_of_windows_ds)
 
 
 def _create_windows_from_events(
-        ds, infer_mapping, infer_window_size_stride,
-        trial_start_offset_samples, trial_stop_offset_samples,
-        window_size_samples=None, window_stride_samples=None,
-        drop_last_window=False, mapping=None, preload=False,
-        drop_bad_windows=True, picks=None, reject=None, flat=None,
-        on_missing='error', accepted_bads_ratio=0.0, verbose='error',
-        use_mne_epochs=False):
+    ds,
+    infer_mapping,
+    infer_window_size_stride,
+    trial_start_offset_samples,
+    trial_stop_offset_samples,
+    window_size_samples=None,
+    window_stride_samples=None,
+    drop_last_window=False,
+    mapping=None,
+    preload=False,
+    drop_bad_windows=True,
+    picks=None,
+    reject=None,
+    flat=None,
+    on_missing="error",
+    accepted_bads_ratio=0.0,
+    verbose="error",
+    use_mne_epochs=False,
+):
     """Create WindowsDataset from BaseDataset based on events.
 
     Parameters
@@ -254,47 +502,61 @@ def _create_windows_from_events(
        new_unique_events = [x for x in unique_events if x not in mapping]
        # mapping event descriptions to integers from 0 on
        max_id_existing_mapping = len(mapping)
-        mapping.update({
+        mapping.update(
+            {
                event_name: i_event_type + max_id_existing_mapping
                for i_event_type, event_name in enumerate(new_unique_events)
-        })
+            }
+        )
 
     events, events_id = mne.events_from_annotations(ds.raw, mapping)
     onsets = events[:, 0]
     # Onsets are relative to the beginning of the recording
-    filtered_durations = np.array([
-        a['duration'] for a in ds.raw.annotations
-        if a['description'] in events_id
-    ])
+    filtered_durations = np.array(
+        [a["duration"] for a in ds.raw.annotations if a["description"] in events_id]
+    )
 
-    stops = onsets + (filtered_durations * ds.raw.info['sfreq']).astype(int)
+    stops = onsets + (filtered_durations * ds.raw.info["sfreq"]).astype(int)
     # XXX This could probably be simplified by using chunk_duration in
     # `events_from_annotations`
 
-    last_samp = ds.raw.first_samp + ds.raw.n_times
-    if stops[-1] + trial_stop_offset_samples > last_samp:
+    last_samp = ds.raw.first_samp + ds.raw.n_times - 1
+    # `stops` is used exclusively (i.e. `start:stop`), so add back 1
+    if stops[-1] + trial_stop_offset_samples > last_samp + 1:
        raise ValueError(
            '"trial_stop_offset_samples" too large. Stop of last trial '
            f'({stops[-1]}) + "trial_stop_offset_samples" '
-            f'({trial_stop_offset_samples}) must be smaller than length of'
-            f' recording ({len(ds)}).')
+            f"({trial_stop_offset_samples}) must be smaller than length of"
+            f" recording ({len(ds)})."
+        )
 
     if infer_window_size_stride:
        # window size is trial size
        if window_size_samples is None:
-            window_size_samples = stops[0] + trial_stop_offset_samples - (
-                onsets[0] + trial_start_offset_samples)
+            window_size_samples = (
+                stops[0]
+                + trial_stop_offset_samples
+                - (onsets[0] + trial_start_offset_samples)
+            )
            window_stride_samples = window_size_samples
        this_trial_sizes = (stops + trial_stop_offset_samples) - (
-            onsets + trial_start_offset_samples)
+            onsets + trial_start_offset_samples
+        )
        # Maybe actually this is not necessary?
        # We could also just say we just assume window size=trial size
        # in case not given, without this condition...
        # but then would have to change functions overall
-        # to deal with varying window sizes hmmhmh
-        assert np.all(this_trial_sizes == window_size_samples), (
-            'All trial sizes should be the same if you do not supply a window '
-            'size.')
+        checker_trials_size = this_trial_sizes == window_size_samples
+
+        if not np.all(checker_trials_size):
+            trials_drops = int(len(this_trial_sizes) - sum(checker_trials_size))
+            warnings.warn(
+                f"Dropping trials with different windows size {trials_drops}",
+            )
+            bads_size_trials = checker_trials_size
+            events = events[checker_trials_size]
+            onsets = onsets[checker_trials_size]
+            stops = stops[checker_trials_size]
 
     description = events[:, -1]

@@ -302,51 +564,90 @@ def _create_windows_from_events(
     onsets = onsets - ds.raw.first_samp
     stops = stops - ds.raw.first_samp
     i_trials, i_window_in_trials, starts, stops = _compute_window_inds(
-        onsets, stops, trial_start_offset_samples,
-        trial_stop_offset_samples, window_size_samples,
-        window_stride_samples, drop_last_window, accepted_bads_ratio)
+        onsets,
+        stops,
+        trial_start_offset_samples,
+        trial_stop_offset_samples,
+        window_size_samples,
+        window_stride_samples,
+        drop_last_window,
+        accepted_bads_ratio,
+    )
 
     if any(np.diff(starts) <= 0):
-        raise NotImplementedError('Trial overlap not implemented.')
+        raise NotImplementedError("Trial overlap not implemented.")
 
-    events = [[start, window_size_samples, description[i_trials[i_start]]]
-              for i_start, start in enumerate(starts)]
+    events = [
+        [start, window_size_samples, description[i_trials[i_start]]]
+        for i_start, start in enumerate(starts)
+    ]
     events = np.array(events)
 
     description = events[:, -1]
 
-    metadata = pd.DataFrame({
-        'i_window_in_trial': i_window_in_trials,
-        'i_start_in_trial': starts,
-        'i_stop_in_trial': stops,
-        'target': description
-    })
+    metadata = pd.DataFrame(
+        {
+            "i_window_in_trial": i_window_in_trials,
+            "i_start_in_trial": starts,
+            "i_stop_in_trial": stops,
+            "target": description,
+        }
+    )
     if use_mne_epochs:
        # window size - 1, since tmax is inclusive
        mne_epochs = mne.Epochs(
-            ds.raw, events, events_id, baseline=None, tmin=0,
-            tmax=(window_size_samples - 1) / ds.raw.info['sfreq'],
-            metadata=metadata, preload=preload, picks=picks, reject=reject,
-            flat=flat, on_missing=on_missing, verbose=verbose)
+            ds.raw,
+            events,
+            events_id,
+            baseline=None,
+            tmin=0,
+            tmax=(window_size_samples - 1) / ds.raw.info["sfreq"],
+            metadata=metadata,
+            preload=preload,
+            picks=picks,
+            reject=reject,
+            flat=flat,
+            on_missing=on_missing,
+            verbose=verbose,
+        )
        if drop_bad_windows:
            mne_epochs.drop_bad()
-        windows_ds = WindowsDataset(mne_epochs, ds.description,)
+        windows_ds = WindowsDataset(
+            mne_epochs,
+            ds.description,
+        )
     else:
        windows_ds = EEGWindowsDataset(
-            ds.raw, metadata=metadata, description=ds.description,)
+            ds.raw,
+            metadata=metadata,
+            description=ds.description,
+        )
     # add window_kwargs and raw_preproc_kwargs to windows dataset
-    setattr(windows_ds, 'window_kwargs', window_kwargs)
-    kwargs_name = 'raw_preproc_kwargs'
+    setattr(windows_ds, "window_kwargs", window_kwargs)
+    kwargs_name = "raw_preproc_kwargs"
     if hasattr(ds, kwargs_name):
        setattr(windows_ds, kwargs_name, getattr(ds, kwargs_name))
     return windows_ds
 
 
 def _create_fixed_length_windows(
-        ds, start_offset_samples, stop_offset_samples, window_size_samples,
-        window_stride_samples, drop_last_window, mapping=None, preload=False,
-        picks=None, reject=None, flat=None, targets_from='metadata',
-        last_target_only=True, on_missing='error', verbose='error'):
+    ds,
+    start_offset_samples,
+    stop_offset_samples,
+    window_size_samples,
+    window_stride_samples,
+    drop_last_window,
+    mapping=None,
+    preload=False,
+    picks=None,
+    reject=None,
+    flat=None,
+    targets_from="metadata",
+    last_target_only=True,
+    lazy_metadata=False,
+    on_missing="error",
+    verbose="error",
+):
     """Create WindowsDataset from BaseDataset with sliding windows.
 
     Parameters
@@ -365,8 +666,7 @@ def _create_fixed_length_windows(
     window_kwargs = [
        (create_fixed_length_windows.__name__, _get_windowing_kwargs(locals())),
     ]
-    stop = ds.raw.n_times\
-        if stop_offset_samples is None else stop_offset_samples
+    stop = ds.raw.n_times if stop_offset_samples is None else stop_offset_samples
 
     # assume window should be whole recording
     if window_size_samples is None:
@@ -375,15 +675,6 @@ def _create_fixed_length_windows(
        window_stride_samples = window_size_samples
 
     last_potential_start = stop - window_size_samples
-    # already includes last incomplete window start
-    starts = np.arange(
-        start_offset_samples,
-        last_potential_start + 1,
-        window_stride_samples)
-
-    if not drop_last_window and starts[-1] < last_potential_start:
-        # if last window does not end at trial stop, make it stop there
-        starts = np.append(starts, last_potential_start)
 
     # get targets from dataset description if they exist
     target = -1 if ds.target_name is None else ds.description[ds.target_name]
@@ -395,18 +686,53 @@ def _create_fixed_length_windows(
        else:
            target = mapping[target]
 
-    metadata = pd.DataFrame({
-        'i_window_in_trial': np.arange(len(starts)),
-        'i_start_in_trial': starts,
-        'i_stop_in_trial': starts + window_size_samples,
-        'target': len(starts) * [target]
-    })
+    if lazy_metadata:
+        factory = _FixedLengthWindowFunctions(
+            start_offset_samples,
+            last_potential_start,
+            window_stride_samples,
+            window_size_samples,
+            target,
+        )
+        metadata = _LazyDataFrame(
+            length=factory.length,
+            functions={
+                "i_window_in_trial": factory.i_window_in_trial,
+                "i_start_in_trial": factory.i_start_in_trial,
+                "i_stop_in_trial": factory.i_stop_in_trial,
+                "target": factory.target,
+            },
+            columns=[
+                "i_window_in_trial",
+                "i_start_in_trial",
+                "i_stop_in_trial",
+                "target",
+            ],
+        )
+    else:
+        # already includes last incomplete window start
+        starts = np.arange(
+            start_offset_samples, last_potential_start + 1, window_stride_samples
+        )
+
+        if not drop_last_window and starts[-1] < last_potential_start:
+            # if last window does not end at trial stop, make it stop there
+            starts = np.append(starts, last_potential_start)
+
+        metadata = pd.DataFrame(
+            {
+                "i_window_in_trial": np.arange(len(starts)),
+                "i_start_in_trial": starts,
+                "i_stop_in_trial": starts + window_size_samples,
+                "target": len(starts) * [target],
+            }
+        )
 
     window_kwargs.append(
-        (EEGWindowsDataset.__name__, {
-            'targets_from': targets_from,
-            'last_target_only': last_target_only
-        })
+        (
+            EEGWindowsDataset.__name__,
+            {"targets_from": targets_from, "last_target_only": last_target_only},
+        )
     )
     windows_ds = EEGWindowsDataset(
        ds.raw,
@@ -416,28 +742,52 @@ def _create_fixed_length_windows(
        last_target_only=last_target_only,
     )
     # add window_kwargs and raw_preproc_kwargs to windows dataset
-    setattr(windows_ds, 'window_kwargs', window_kwargs)
-    kwargs_name = 'raw_preproc_kwargs'
+    setattr(windows_ds, "window_kwargs", window_kwargs)
+    kwargs_name = "raw_preproc_kwargs"
     if hasattr(ds, kwargs_name):
        setattr(windows_ds, kwargs_name, getattr(ds, kwargs_name))
     return windows_ds
 
 
 def create_windows_from_target_channels(
-        concat_ds, window_size_samples=None, preload=False,
-        picks=None, reject=None, flat=None, n_jobs=1, last_target_only=True,
-        verbose='error'):
+    concat_ds,
+    window_size_samples=None,
+    preload=False,
+    picks=None,
+    reject=None,
+    flat=None,
+    n_jobs=1,
+    last_target_only=True,
+    verbose="error",
+):
     list_of_windows_ds = Parallel(n_jobs=n_jobs)(
        delayed(_create_windows_from_target_channels)(
-            ds, window_size_samples, preload, picks, reject,
-            flat, last_target_only, 'error', verbose) for ds in concat_ds.datasets)
+            ds,
+            window_size_samples,
+            preload,
+            picks,
+            reject,
+            flat,
+            last_target_only,
+            "error",
+            verbose,
+        )
+        for ds in concat_ds.datasets
+    )
     return BaseConcatDataset(list_of_windows_ds)
 
 
 def _create_windows_from_target_channels(
-        ds, window_size_samples, preload=False, picks=None,
-        reject=None, flat=None, last_target_only=True, on_missing='error',
-        verbose='error'):
+    ds,
+    window_size_samples,
+    preload=False,
+    picks=None,
+    reject=None,
+    flat=None,
+    last_target_only=True,
+    on_missing="error",
+    verbose="error",
+):
     """Create WindowsDataset from BaseDataset using targets `misc` channels from mne.Raw.
 
     Parameters
@@ -457,24 +807,26 @@ def _create_windows_from_target_channels(
     ]
     stop = ds.raw.n_times + ds.raw.first_samp
 
-    target = ds.raw.get_data(picks='misc')
+    target = ds.raw.get_data(picks="misc")
     # TODO: handle multi targets present only for some events
     stops = np.nonzero((~np.isnan(target[0, :])))[0] + 1
     stops = stops[(stops < stop) & (stops >= window_size_samples)]
     stops = stops.astype(int)
-    metadata = pd.DataFrame({
-        'i_window_in_trial': np.arange(len(stops)),
-        'i_start_in_trial': stops - window_size_samples,
-        'i_stop_in_trial': stops,
-        'target': len(stops) * [target]
-    })
-
-    targets_from = 'channels'
+    metadata = pd.DataFrame(
+        {
+            "i_window_in_trial": np.arange(len(stops)),
+            "i_start_in_trial": stops - window_size_samples,
+            "i_stop_in_trial": stops,
+            "target": len(stops) * [target],
+        }
+    )
+
+    targets_from = "channels"
     window_kwargs.append(
-        (EEGWindowsDataset.__name__, {
-            'targets_from': targets_from,
-            'last_target_only': last_target_only
-        })
+        (
+            EEGWindowsDataset.__name__,
+            {"targets_from": targets_from, "last_target_only": last_target_only},
+        )
     )
     windows_ds = EEGWindowsDataset(
        ds.raw,
@@ -483,16 +835,23 @@ def _create_windows_from_target_channels(
        targets_from=targets_from,
        last_target_only=last_target_only,
     )
-    setattr(windows_ds, 'window_kwargs', window_kwargs)
-    kwargs_name = 'raw_preproc_kwargs'
+    setattr(windows_ds, "window_kwargs", window_kwargs)
+    kwargs_name = "raw_preproc_kwargs"
     if hasattr(ds, kwargs_name):
        setattr(windows_ds, kwargs_name, getattr(ds, kwargs_name))
     return windows_ds
 
 
 def _compute_window_inds(
-        starts, stops, start_offset, stop_offset, size, stride,
-        drop_last_window, accepted_bads_ratio):
+    starts,
+    stops,
+    start_offset,
+    stop_offset,
+    size,
+    stride,
+    drop_last_window,
+    accepted_bads_ratio,
+):
     """Compute window start and stop indices.
 
     Create window starts from trial onsets (shifted by start_offset) to trial
@@ -531,27 +890,31 @@ def _compute_window_inds(
 
     starts += start_offset
     stops += stop_offset
-    if any(size > (stops-starts)):
-        bads_mask = size > (stops-starts)
-        min_duration = (stops-starts).min()
+    if any(size > (stops - starts)):
+        bads_mask = size > (stops - starts)
+        min_duration = (stops - starts).min()
        if sum(bads_mask) <= accepted_bads_ratio * len(starts):
            starts = starts[np.logical_not(bads_mask)]
            stops = stops[np.logical_not(bads_mask)]
            warnings.warn(
-                f'Trials {np.where(bads_mask)[0]} are being dropped as the '
-                f'window size ({size}) exceeds their duration {min_duration}.')
+                f"Trials {np.where(bads_mask)[0]} are being dropped as the "
+                f"window size ({size}) exceeds their duration {min_duration}."
+            )
        else:
            current_ratio = sum(bads_mask) / len(starts)
-            raise ValueError(f'Window size {size} exceeds trial duration '
-                             f'({min_duration}) for too many trials '
-                             f'({current_ratio * 100}%). Set '
-                             f'accepted_bads_ratio to at least {current_ratio}'
-                             'and restart training to be able to continue.')
+            raise ValueError(
+                f"Window size {size} exceeds trial duration "
+                f"({min_duration}) for too many trials "
+                f"({current_ratio * 100}%). Set "
+                f"accepted_bads_ratio to at least {current_ratio}"
+                "and restart training to be able to continue."
+            )
 
     i_window_in_trials, i_trials, window_starts = [], [], []
     for start_i, (start, stop) in enumerate(zip(starts, stops)):
-        # Generate possible window starts with given stride between original
-        # trial onsets (shifted by start_offset) and stops
+        # Generate possible window starts, with given stride, between original
+        # trial onsets and stops (shifted by start_offset and stop_offset,
+        # respectively)
        possible_starts = np.arange(start, stop, stride)
 
        # Possible window start is actually a start, if window size fits in
@@ -571,72 +934,98 @@ def _compute_window_inds(
            i_window_in_trials.append(i_window_in_trials[-1] + 1)
            i_trials.append(start_i)
 
-    # Update stops to now be event stops instead of trial stops
+    # Set window stops to be event stops (rather than trial stops)
     window_stops = np.array(window_starts) + size
     if not (len(i_window_in_trials) == len(window_starts) == len(window_stops)):
-        raise ValueError(f'{len(i_window_in_trials)} == '
-                         f'{len(window_starts)} == {len(window_stops)}')
+        raise ValueError(
+            f"{len(i_window_in_trials)} == {len(window_starts)} == {len(window_stops)}"
+        )
 
     return i_trials, i_window_in_trials, window_starts, window_stops
 
 
 def _check_windowing_arguments(
-        trial_start_offset_samples, trial_stop_offset_samples,
-        window_size_samples, window_stride_samples):
+    trial_start_offset_samples,
+    trial_stop_offset_samples,
+    window_size_samples,
+    window_stride_samples,
+):
     assert isinstance(trial_start_offset_samples, (int, np.integer))
-    assert (isinstance(trial_stop_offset_samples, (int, np.integer)) or
-            (trial_stop_offset_samples is None))
+    assert isinstance(trial_stop_offset_samples, (int, np.integer)) or (
+        trial_stop_offset_samples is None
+    )
     assert isinstance(window_size_samples, (int, np.integer, type(None)))
     assert isinstance(window_stride_samples, (int, np.integer, type(None)))
     assert (window_size_samples is None) == (window_stride_samples is None)
     if window_size_samples is not None:
-        assert window_size_samples > 0, (
-            "window size has to be larger than 0")
-        assert window_stride_samples > 0, (
-            "window stride has to be larger than 0")
+        assert window_size_samples > 0, "window size has to be larger than 0"
+        assert window_stride_samples > 0, "window stride has to be larger than 0"
 
 
-def _check_and_set_fixed_length_window_arguments(start_offset_samples, stop_offset_samples,
-                                                 window_size_samples, window_stride_samples,
-                                                 drop_last_window):
+def _check_and_set_fixed_length_window_arguments(
+    start_offset_samples,
+    stop_offset_samples,
+    window_size_samples,
+    window_stride_samples,
+    drop_last_window,
+    lazy_metadata,
+):
     """Raises warnings for incorrect input arguments and will set correct default values for
     stop_offset_samples & drop_last_window, if necessary.
     """
     _check_windowing_arguments(
-        start_offset_samples, stop_offset_samples,
-        window_size_samples, window_stride_samples)
+        start_offset_samples,
+        stop_offset_samples,
+        window_size_samples,
+        window_stride_samples,
+    )
 
     if stop_offset_samples == 0:
        warnings.warn(
-            'Meaning of `trial_stop_offset_samples`=0 has changed, use `None` '
-            'to indicate end of trial/recording. Using `None`.')
+            "Meaning of `trial_stop_offset_samples`=0 has changed, use `None` "
+            "to indicate end of trial/recording. Using `None`."
+        )
        stop_offset_samples = None
 
     if start_offset_samples != 0 or stop_offset_samples is not None:
-        warnings.warn('Usage of offset_sample args in create_fixed_length_windows is deprecated and'
-                      ' will be removed in future versions. Please use '
-                      'braindecode.preprocessing.preprocess.Preprocessor("crop", tmin, tmax)'
-                      ' instead.')
-
-    if window_size_samples is not None and window_stride_samples is not None and \
-            drop_last_window is None:
-        raise ValueError('drop_last_window must be set if both window_size_samples &'
-                         ' window_stride_samples have also been set')
-    elif window_size_samples is None and\
-            window_stride_samples is None and\
-            drop_last_window is False:
+        warnings.warn(
+            "Usage of offset_sample args in create_fixed_length_windows is deprecated and"
+            " will be removed in future versions. Please use "
+            'braindecode.preprocessing.preprocess.Preprocessor("crop", tmin, tmax)'
+            " instead."
+        )
+
+    if (
+        window_size_samples is not None
+        and window_stride_samples is not None
+        and drop_last_window is None
+    ):
+        raise ValueError(
+            "drop_last_window must be set if both window_size_samples &"
+            " window_stride_samples have also been set"
+        )
+    elif (
+        window_size_samples is None
+        and window_stride_samples is None
+        and drop_last_window is False
+    ):
        # necessary for following assertion
        drop_last_window = None
 
-    assert (window_size_samples is None) == \
-           (window_stride_samples is None) == \
-           (drop_last_window is None)
-
+    assert (
+        (window_size_samples is None)
+        == (window_stride_samples is None)
+        == (drop_last_window is None)
+    )
+    if not drop_last_window and lazy_metadata:
+        raise ValueError(
+            "Cannot have drop_last_window=False and lazy_metadata=True at the same time."
+        )
     return stop_offset_samples, drop_last_window
 
 
 def _get_windowing_kwargs(windowing_func_locals):
     input_kwargs = windowing_func_locals
-    input_kwargs.pop('ds')
+    input_kwargs.pop("ds")
     windowing_kwargs = {k: v for k, v in input_kwargs.items()}
     return windowing_kwargs
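
One detail of the lazy path worth spelling out: with drop_last_window=True, the window count given in closed form by _FixedLengthWindowFunctions.length equals the length of the eager np.arange construction it replaces, and the i-th window starts at start_offset_samples + i * window_stride_samples. A quick sanity-check sketch with illustrative numbers (not taken from this diff):

import numpy as np

# Illustrative values: window starts allowed in [0, 999], one every 250 samples.
start_offset_samples, last_potential_start, window_stride_samples = 0, 999, 250

# Closed-form count, as in _FixedLengthWindowFunctions.length:
n_lazy = int(
    np.ceil((last_potential_start + 1 - start_offset_samples) / window_stride_samples)
)

# Eager count from the non-lazy path (drop_last_window=True, so no extra
# window is appended at last_potential_start):
starts = np.arange(
    start_offset_samples, last_potential_start + 1, window_stride_samples
)

assert n_lazy == len(starts) == 4  # starts == [0, 250, 500, 750]

This equivalence is presumably why _check_and_set_fixed_length_window_arguments rejects lazy_metadata=True together with drop_last_window=False: the extra window appended at last_potential_start on the eager path has an irregular start that the closed-form index arithmetic cannot represent.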