braindecode 0.8__py3-none-any.whl → 1.0.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.


Files changed (102)
  1. braindecode/__init__.py +1 -2
  2. braindecode/augmentation/__init__.py +50 -0
  3. braindecode/augmentation/base.py +222 -0
  4. braindecode/augmentation/functional.py +1096 -0
  5. braindecode/augmentation/transforms.py +1274 -0
  6. braindecode/classifier.py +26 -24
  7. braindecode/datasets/__init__.py +34 -0
  8. braindecode/datasets/base.py +840 -0
  9. braindecode/datasets/bbci.py +694 -0
  10. braindecode/datasets/bcicomp.py +194 -0
  11. braindecode/datasets/bids.py +245 -0
  12. braindecode/datasets/mne.py +172 -0
  13. braindecode/datasets/moabb.py +209 -0
  14. braindecode/datasets/nmt.py +311 -0
  15. braindecode/datasets/sleep_physio_challe_18.py +412 -0
  16. braindecode/datasets/sleep_physionet.py +125 -0
  17. braindecode/datasets/tuh.py +588 -0
  18. braindecode/datasets/xy.py +95 -0
  19. braindecode/datautil/__init__.py +49 -0
  20. braindecode/datautil/serialization.py +342 -0
  21. braindecode/datautil/util.py +41 -0
  22. braindecode/eegneuralnet.py +63 -47
  23. braindecode/functional/__init__.py +10 -0
  24. braindecode/functional/functions.py +251 -0
  25. braindecode/functional/initialization.py +47 -0
  26. braindecode/models/__init__.py +52 -0
  27. braindecode/models/atcnet.py +652 -0
  28. braindecode/models/attentionbasenet.py +550 -0
  29. braindecode/models/base.py +296 -0
  30. braindecode/models/biot.py +483 -0
  31. braindecode/models/contrawr.py +296 -0
  32. braindecode/models/ctnet.py +450 -0
  33. braindecode/models/deep4.py +322 -0
  34. braindecode/models/deepsleepnet.py +295 -0
  35. braindecode/models/eegconformer.py +372 -0
  36. braindecode/models/eeginception_erp.py +304 -0
  37. braindecode/models/eeginception_mi.py +371 -0
  38. braindecode/models/eegitnet.py +301 -0
  39. braindecode/models/eegminer.py +255 -0
  40. braindecode/models/eegnet.py +473 -0
  41. braindecode/models/eegnex.py +247 -0
  42. braindecode/models/eegresnet.py +362 -0
  43. braindecode/models/eegsimpleconv.py +199 -0
  44. braindecode/models/eegtcnet.py +335 -0
  45. braindecode/models/fbcnet.py +221 -0
  46. braindecode/models/fblightconvnet.py +313 -0
  47. braindecode/models/fbmsnet.py +325 -0
  48. braindecode/models/hybrid.py +126 -0
  49. braindecode/models/ifnet.py +441 -0
  50. braindecode/models/labram.py +1166 -0
  51. braindecode/models/msvtnet.py +375 -0
  52. braindecode/models/sccnet.py +182 -0
  53. braindecode/models/shallow_fbcsp.py +208 -0
  54. braindecode/models/signal_jepa.py +1012 -0
  55. braindecode/models/sinc_shallow.py +337 -0
  56. braindecode/models/sleep_stager_blanco_2020.py +167 -0
  57. braindecode/models/sleep_stager_chambon_2018.py +157 -0
  58. braindecode/models/sleep_stager_eldele_2021.py +536 -0
  59. braindecode/models/sparcnet.py +378 -0
  60. braindecode/models/summary.csv +41 -0
  61. braindecode/models/syncnet.py +232 -0
  62. braindecode/models/tcn.py +273 -0
  63. braindecode/models/tidnet.py +395 -0
  64. braindecode/models/tsinception.py +258 -0
  65. braindecode/models/usleep.py +340 -0
  66. braindecode/models/util.py +133 -0
  67. braindecode/modules/__init__.py +38 -0
  68. braindecode/modules/activation.py +60 -0
  69. braindecode/modules/attention.py +757 -0
  70. braindecode/modules/blocks.py +108 -0
  71. braindecode/modules/convolution.py +274 -0
  72. braindecode/modules/filter.py +632 -0
  73. braindecode/modules/layers.py +133 -0
  74. braindecode/modules/linear.py +50 -0
  75. braindecode/modules/parametrization.py +38 -0
  76. braindecode/modules/stats.py +77 -0
  77. braindecode/modules/util.py +77 -0
  78. braindecode/modules/wrapper.py +75 -0
  79. braindecode/preprocessing/__init__.py +37 -0
  80. braindecode/preprocessing/mne_preprocess.py +77 -0
  81. braindecode/preprocessing/preprocess.py +478 -0
  82. braindecode/preprocessing/windowers.py +1031 -0
  83. braindecode/regressor.py +23 -12
  84. braindecode/samplers/__init__.py +18 -0
  85. braindecode/samplers/base.py +401 -0
  86. braindecode/samplers/ssl.py +263 -0
  87. braindecode/training/__init__.py +23 -0
  88. braindecode/training/callbacks.py +23 -0
  89. braindecode/training/losses.py +105 -0
  90. braindecode/training/scoring.py +483 -0
  91. braindecode/util.py +55 -59
  92. braindecode/version.py +1 -1
  93. braindecode/visualization/__init__.py +8 -0
  94. braindecode/visualization/confusion_matrices.py +289 -0
  95. braindecode/visualization/gradients.py +57 -0
  96. {braindecode-0.8.dist-info → braindecode-1.0.0.dist-info}/METADATA +39 -55
  97. braindecode-1.0.0.dist-info/RECORD +101 -0
  98. {braindecode-0.8.dist-info → braindecode-1.0.0.dist-info}/WHEEL +1 -1
  99. {braindecode-0.8.dist-info → braindecode-1.0.0.dist-info/licenses}/LICENSE.txt +1 -1
  100. braindecode-1.0.0.dist-info/licenses/NOTICE.txt +20 -0
  101. braindecode-0.8.dist-info/RECORD +0 -11
  102. {braindecode-0.8.dist-info → braindecode-1.0.0.dist-info}/top_level.txt +0 -0
braindecode/datasets/base.py
@@ -0,0 +1,840 @@
+ """
+ Dataset classes.
+ """
+
+ # Authors: Hubert Banville <hubert.jbanville@gmail.com>
+ #          Lukas Gemein <l.gemein@gmail.com>
+ #          Simon Brandt <simonbrandt@protonmail.com>
+ #          David Sabbagh <dav.sabbagh@gmail.com>
+ #          Robin Schirrmeister <robintibor@gmail.com>
+ #
+ # License: BSD (3-clause)
+
+ from __future__ import annotations
+
+ import json
+ import os
+ import shutil
+ import warnings
+ from collections.abc import Callable
+ from glob import glob
+ from typing import Iterable, no_type_check
+
+ import mne.io
+ import numpy as np
+ import pandas as pd
+ from torch.utils.data import ConcatDataset, Dataset
+
+
+ def _create_description(description) -> pd.Series:
+     if description is not None:
+         if not isinstance(description, pd.Series) and not isinstance(description, dict):
+             raise ValueError(
+                 f"'{description}' has to be either a pandas.Series or a dict."
+             )
+         if isinstance(description, dict):
+             description = pd.Series(description)
+     return description
+
+
+ class BaseDataset(Dataset):
+     """Returns samples from an mne.io.Raw object along with a target.
+
+     Dataset which serves samples from an mne.io.Raw object along with a target.
+     The target is unique for the dataset, and is obtained through the
+     `description` attribute.
+
+     Parameters
+     ----------
+     raw : mne.io.Raw
+         Continuous data.
+     description : dict | pandas.Series | None
+         Holds additional description about the continuous signal / subject.
+     target_name : str | tuple | None
+         Name(s) of the index in `description` that should be used to provide the
+         target (e.g., to be used in a prediction task later on).
+     transform : callable | None
+         On-the-fly transform applied to the example before it is returned.
+     """
+
+     def __init__(
+         self,
+         raw: mne.io.BaseRaw,
+         description: dict | pd.Series | None = None,
+         target_name: str | tuple[str, ...] | None = None,
+         transform: Callable | None = None,
+     ):
+         self.raw = raw
+         self._description = _create_description(description)
+         self.transform = transform
+
+         # save target name for load/save later
+         self.target_name = self._target_name(target_name)
+
+     def __getitem__(self, index):
+         X = self.raw[:, index][0]
+         y = None
+         if self.target_name is not None:
+             y = self.description[self.target_name]
+             if isinstance(y, pd.Series):
+                 y = y.to_list()
+         if self.transform is not None:
+             X = self.transform(X)
+         return X, y
+
+     def __len__(self):
+         return len(self.raw)
+
+     @property
+     def transform(self):
+         return self._transform
+
+     @transform.setter
+     def transform(self, value):
+         if value is not None and not callable(value):
+             raise ValueError("Transform needs to be a callable.")
+         self._transform = value
+
+     @property
+     def description(self) -> pd.Series:
+         return self._description
+
+     def set_description(self, description: dict | pd.Series, overwrite: bool = False):
+         """Update (add or overwrite) the dataset description.
+
+         Parameters
+         ----------
+         description: dict | pd.Series
+             Description in the form key: value.
+         overwrite: bool
+             Has to be True if a key in description already exists in the
+             dataset description.
+         """
+         description = _create_description(description)
+         for key, value in description.items():
+             # if the key is already in the existing description, drop it
+             if self._description is not None and key in self._description:
+                 assert overwrite, (
+                     f"'{key}' already in description. Please "
+                     f"rename or set overwrite to True."
+                 )
+                 self._description.pop(key)
+         if self._description is None:
+             self._description = description
+         else:
+             self._description = pd.concat([self.description, description])
+
+     def _target_name(self, target_name):
+         if target_name is not None and not isinstance(target_name, (str, tuple, list)):
+             raise ValueError("target_name has to be None, str, tuple or list")
+         if target_name is None:
+             return target_name
+         else:
+             # convert tuple of names or single name to list
+             if isinstance(target_name, tuple):
+                 target_name = [name for name in target_name]
+             elif not isinstance(target_name, list):
+                 assert isinstance(target_name, str)
+                 target_name = [target_name]
+             assert isinstance(target_name, list)
+             # check if target name(s) can be read from description
+             for name in target_name:
+                 if self.description is None or name not in self.description:
+                     warnings.warn(
+                         f"'{name}' not in description. '__getitem__' "
+                         f"will fail unless an appropriate target is "
+                         f"added to description.",
+                         UserWarning,
+                     )
+             # return a list of str if there are multiple targets and a str otherwise
+             return target_name if len(target_name) > 1 else target_name[0]
+
+
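For orientation, a minimal usage sketch of the BaseDataset API added above (channel names, sampling rate and description values are made up for illustration):

    import mne
    import numpy as np

    from braindecode.datasets import BaseDataset

    info = mne.create_info(ch_names=["C3", "C4"], sfreq=100.0, ch_types="eeg")
    raw = mne.io.RawArray(np.random.randn(2, 1000), info)

    # target_name points at a key of the description
    ds = BaseDataset(raw, description={"subject": 1, "label": "left_hand"},
                     target_name="label")
    X, y = ds[:100]  # first 100 samples of every channel, plus the target
    assert y == "left_hand"

    ds.set_description({"session": "A"})                         # add a new key
    ds.set_description({"label": "right_hand"}, overwrite=True)  # replace one
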
+ class EEGWindowsDataset(BaseDataset):
+     """Returns windows from an mne.io.Raw object, their window indices, along with a target.
+
+     Dataset which serves windows from an mne.io.Raw object along with their
+     target and additional information. The `metadata` DataFrame passed at
+     construction must contain a column called `target`, which will be used to
+     return the target that corresponds to a window. Additional columns
+     `i_window_in_trial`, `i_start_in_trial`, `i_stop_in_trial` are also
+     required to serve information about the windowing (e.g., useful for cropped
+     training).
+     See `braindecode.preprocessing.windowers` to directly create a
+     `WindowsDataset` from a `BaseDataset` object.
+
+     Parameters
+     ----------
+     raw : mne.io.BaseRaw | mne.BaseEpochs
+         Continuous data from which windows are cut out on the fly (passing an
+         mne.Epochs object is also possible, but outdated).
+     metadata : pandas.DataFrame
+         DataFrame with the crop indices `i_window_in_trial`, `i_start_in_trial`
+         and `i_stop_in_trial` used to cut out windows, as well as the `target`
+         column.
+     description : dict | pandas.Series | None
+         Holds additional info about the windows.
+     transform : callable | None
+         On-the-fly transform applied to a window before it is returned.
+     targets_from : str
+         Defines whether targets will be extracted from metadata or from `misc`
+         channels (time series targets). It can be `metadata` (default) or `channels`.
+     last_target_only : bool
+         If targets are obtained from misc channels, whether only the last
+         target of the (compute) window is returned or all targets in it.
+     """
+
+     def __init__(
+         self,
+         raw: mne.io.BaseRaw | mne.BaseEpochs,
+         metadata: pd.DataFrame,
+         description: dict | pd.Series | None = None,
+         transform: Callable | None = None,
+         targets_from: str = "metadata",
+         last_target_only: bool = True,
+     ):
+         self.raw = raw
+         self.metadata = metadata
+         self._description = _create_description(description)
+
+         self.transform = transform
+         self.last_target_only = last_target_only
+         if targets_from not in ("metadata", "channels"):
+             raise ValueError("Wrong value for parameter `targets_from`.")
+         self.targets_from = targets_from
+         self.crop_inds = metadata.loc[
+             :, ["i_window_in_trial", "i_start_in_trial", "i_stop_in_trial"]
+         ].to_numpy()
+         if self.targets_from == "metadata":
+             self.y = metadata.loc[:, "target"].to_list()
+
+     def __getitem__(self, index: int):
+         """Get a window and its target.
+
+         Parameters
+         ----------
+         index : int
+             Index to the window (and target) to return.
+
+         Returns
+         -------
+         np.ndarray
+             Window of shape (n_channels, n_times).
+         int
+             Target for the window.
+         np.ndarray
+             Crop indices.
+         """
+
+         # necessary to cast as list to get list of three tensors from batch,
+         # otherwise get single 2d-tensor...
+         crop_inds = self.crop_inds[index].tolist()
+
+         i_window_in_trial, i_start, i_stop = crop_inds
+         X = self.raw._getitem((slice(None), slice(i_start, i_stop)), return_times=False)
+         X = X.astype("float32")
+         # ensure we don't give the user the option
+         # to accidentally modify the underlying array
+         X = X.copy()
+         if self.transform is not None:
+             X = self.transform(X)
+         if self.targets_from == "metadata":
+             y = self.y[index]
+         else:
+             misc_mask = np.array(self.raw.get_channel_types()) == "misc"
+             if self.last_target_only:
+                 y = X[misc_mask, -1]
+             else:
+                 y = X[misc_mask, :]
+             # ensure we don't give the user the option
+             # to accidentally modify the underlying array
+             y = y.copy()
+             # remove the target channels from raw
+             X = X[~misc_mask, :]
+         return X, y, crop_inds
+
+     def __len__(self):
+         return len(self.crop_inds)
+
+     @property
+     def transform(self):
+         return self._transform
+
+     @transform.setter
+     def transform(self, value):
+         if value is not None and not callable(value):
+             raise ValueError("Transform needs to be a callable.")
+         self._transform = value
+
+     @property
+     def description(self) -> pd.Series:
+         return self._description
+
+     def set_description(self, description: dict | pd.Series, overwrite: bool = False):
+         """Update (add or overwrite) the dataset description.
+
+         Parameters
+         ----------
+         description: dict | pd.Series
+             Description in the form key: value.
+         overwrite: bool
+             Has to be True if a key in description already exists in the
+             dataset description.
+         """
+         description = _create_description(description)
+         for key, value in description.items():
+             # if the key is already in the existing description, drop it
+             if key in self._description:
+                 assert overwrite, (
+                     f"'{key}' already in description. Please "
+                     f"rename or set overwrite to True."
+                 )
+                 self._description.pop(key)
+         self._description = pd.concat([self.description, description])
+
+
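For orientation, a sketch of direct EEGWindowsDataset use (in practice the metadata comes from the windowers in braindecode.preprocessing rather than being written by hand; `raw` is assumed to be a continuous recording as in the previous sketch):

    import pandas as pd

    from braindecode.datasets.base import EEGWindowsDataset

    # two hypothetical 500-sample windows with integer targets
    metadata = pd.DataFrame({
        "i_window_in_trial": [0, 1],
        "i_start_in_trial": [0, 500],
        "i_stop_in_trial": [500, 1000],
        "target": [0, 1],
    })
    win_ds = EEGWindowsDataset(raw, metadata=metadata, targets_from="metadata")
    X, y, crop_inds = win_ds[0]
    # X: float32 array of shape (n_channels, 500); y == 0;
    # crop_inds == [0, 0, 500], i.e. (i_window_in_trial, i_start, i_stop)
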
+ class WindowsDataset(BaseDataset):
+     """Returns windows from an mne.Epochs object along with a target.
+
+     Dataset which serves windows from an mne.Epochs object along with their
+     target and additional information. The `metadata` attribute of the Epochs
+     object must contain a column called `target`, which will be used to return
+     the target that corresponds to a window. Additional columns
+     `i_window_in_trial`, `i_start_in_trial`, `i_stop_in_trial` are also
+     required to serve information about the windowing (e.g., useful for cropped
+     training).
+     See `braindecode.preprocessing.windowers` to directly create a
+     `WindowsDataset` from a `BaseDataset` object.
+
+     Parameters
+     ----------
+     windows : mne.Epochs
+         Windows obtained through the application of a windower to a BaseDataset
+         (see `braindecode.preprocessing.windowers`).
+     description : dict | pandas.Series | None
+         Holds additional info about the windows.
+     transform : callable | None
+         On-the-fly transform applied to a window before it is returned.
+     targets_from : str
+         Defines whether targets will be extracted from mne.Epochs metadata or mne.Epochs `misc`
+         channels (time series targets). It can be `metadata` (default) or `channels`.
+     last_target_only : bool
+         If targets are obtained from misc channels, whether only the last
+         target of the window is returned or all targets in it.
+     """
+
+     def __init__(
+         self,
+         windows: mne.BaseEpochs,
+         description: dict | pd.Series | None = None,
+         transform: Callable | None = None,
+         targets_from: str = "metadata",
+         last_target_only: bool = True,
+     ):
+         self.windows = windows
+         self._description = _create_description(description)
+         self.transform = transform
+         self.last_target_only = last_target_only
+         if targets_from not in ("metadata", "channels"):
+             raise ValueError("Wrong value for parameter `targets_from`.")
+         self.targets_from = targets_from
+
+         self.crop_inds = self.windows.metadata.loc[
+             :, ["i_window_in_trial", "i_start_in_trial", "i_stop_in_trial"]
+         ].to_numpy()
+         if self.targets_from == "metadata":
+             self.y = self.windows.metadata.loc[:, "target"].to_list()
+
+     def __getitem__(self, index: int):
+         """Get a window and its target.
+
+         Parameters
+         ----------
+         index : int
+             Index to the window (and target) to return.
+
+         Returns
+         -------
+         np.ndarray
+             Window of shape (n_channels, n_times).
+         int
+             Target for the window.
+         np.ndarray
+             Crop indices.
+         """
+         X = self.windows.get_data(item=index)[0].astype("float32")
+         if self.transform is not None:
+             X = self.transform(X)
+         if self.targets_from == "metadata":
+             y = self.y[index]
+         else:
+             misc_mask = np.array(self.windows.get_channel_types()) == "misc"
+             if self.last_target_only:
+                 y = X[misc_mask, -1]
+             else:
+                 y = X[misc_mask, :]
+             # remove the target channels from raw
+             X = X[~misc_mask, :]
+         # necessary to cast as list to get list of three tensors from batch,
+         # otherwise get single 2d-tensor...
+         crop_inds = self.crop_inds[index].tolist()
+         return X, y, crop_inds
+
+     def __len__(self) -> int:
+         return len(self.windows.events)
+
+     @property
+     def transform(self):
+         return self._transform
+
+     @transform.setter
+     def transform(self, value):
+         if value is not None and not callable(value):
+             raise ValueError("Transform needs to be a callable.")
+         self._transform = value
+
+     @property
+     def description(self) -> pd.Series:
+         return self._description
+
+     def set_description(self, description: dict | pd.Series, overwrite: bool = False):
+         """Update (add or overwrite) the dataset description.
+
+         Parameters
+         ----------
+         description: dict | pd.Series
+             Description in the form key: value.
+         overwrite: bool
+             Has to be True if a key in description already exists in the
+             dataset description.
+         """
+         description = _create_description(description)
+         for key, value in description.items():
+             # if the key is already in the existing description, drop it
+             if key in self._description:
+                 assert overwrite, (
+                     f"'{key}' already in description. Please "
+                     f"rename or set overwrite to True."
+                 )
+                 self._description.pop(key)
+         self._description = pd.concat([self.description, description])
+
+
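WindowsDatasets are usually produced by a windower rather than constructed by hand; a sketch under that assumption, where `concat_ds` is a BaseConcatDataset of BaseDatasets whose raws carry event annotations:

    from braindecode.preprocessing import create_windows_from_events

    windows_ds = create_windows_from_events(
        concat_ds,
        trial_start_offset_samples=0,
        trial_stop_offset_samples=0,
    )
    X, y, crop_inds = windows_ds[0]  # one window, its target, crop indices
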
+ class BaseConcatDataset(ConcatDataset):
+     """A base class for concatenated datasets.
+
+     Holds either mne.Raw or mne.Epochs in self.datasets and has
+     a pandas DataFrame with additional description.
+
+     Parameters
+     ----------
+     list_of_ds : list
+         list of BaseDataset, BaseConcatDataset or WindowsDataset
+     target_transform : callable | None
+         Optional function to call on targets before returning them.
+     """
+
+     def __init__(
+         self,
+         list_of_ds: list[BaseDataset | BaseConcatDataset | WindowsDataset]
+         | None = None,
+         target_transform: Callable | None = None,
+     ):
+         # if we get a list of BaseConcatDataset, get all the individual datasets
+         if list_of_ds and isinstance(list_of_ds[0], BaseConcatDataset):
+             list_of_ds = [d for ds in list_of_ds for d in ds.datasets]
+         super().__init__(list_of_ds)
+
+         self.target_transform = target_transform
+
+     def _get_sequence(self, indices):
+         X, y = list(), list()
+         for ind in indices:
+             out_i = super().__getitem__(ind)
+             X.append(out_i[0])
+             y.append(out_i[1])
+
+         X = np.stack(X, axis=0)
+         y = np.array(y)
+
+         return X, y
+
+     def __getitem__(self, idx: int | list):
+         """
+         Parameters
+         ----------
+         idx : int | list
+             Index of window and target to return. If provided as a list of
+             ints, multiple windows and targets will be extracted and
+             concatenated. The target output can be modified on the
+             fly by the ``target_transform`` parameter.
+         """
+         if isinstance(idx, Iterable):  # Sample multiple windows
+             item = self._get_sequence(idx)
+         else:
+             item = super().__getitem__(idx)
+         if self.target_transform is not None:
+             item = item[:1] + (self.target_transform(item[1]),) + item[2:]
+         return item
+
+     @no_type_check  # TODO, it's a mess
+     def split(
+         self,
+         by: str | list[int] | list[list[int]] | dict[str, list[int]] | None = None,
+         property: str | None = None,
+         split_ids: list[int] | list[list[int]] | dict[str, list[int]] | None = None,
+     ) -> dict[str, BaseConcatDataset]:
+         """Split the dataset based on information listed in its description.
+
+         The splits can be defined based on a description DataFrame column or
+         on explicit indices.
+
+         Parameters
+         ----------
+         by : str | list | dict
+             If ``by`` is a string, splitting is performed based on the
+             description DataFrame column with this name.
+             If ``by`` is a (list of) list of integers, the position in the first
+             list corresponds to the split id and the integers to the
+             datapoints of that split.
+             If a dict then each key will be used in the returned
+             splits dict and each value should be a list of int.
+         property : str
+             Some property which is listed in the info DataFrame.
+         split_ids : list | dict
+             List of indices to be combined in a subset.
+             It can be a list of int or a list of list of int.
+
+         Returns
+         -------
+         splits : dict
+             A dictionary with the name of the split (a string) as key and the
+             dataset as value.
+         """
+
+         args_not_none = [by is not None, property is not None, split_ids is not None]
+         if sum(args_not_none) != 1:
+             raise ValueError("Splitting requires exactly one argument.")
+
+         if property is not None or split_ids is not None:
+             warnings.warn(
+                 "Keyword arguments `property` and `split_ids` "
+                 "are deprecated and will be removed in the future. "
+                 "Use `by` instead.",
+                 DeprecationWarning,
+             )
+             by = property if property is not None else split_ids
+         if isinstance(by, str):
+             split_ids = {
+                 k: list(v) for k, v in self.description.groupby(by).groups.items()
+             }
+         elif isinstance(by, dict):
+             split_ids = by
+         else:
+             # assume list(int)
+             if not isinstance(by[0], list):
+                 by = [by]
+             # assume list(list(int))
+             split_ids = {split_i: split for split_i, split in enumerate(by)}
+
+         return {
+             str(split_name): BaseConcatDataset(
+                 [self.datasets[ds_ind] for ds_ind in ds_inds],
+                 target_transform=self.target_transform,
+             )
+             for split_name, ds_inds in split_ids.items()
+         }
+
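A sketch of the two splitting modes (the description column "subject" is an assumption about the data at hand):

    # by description column: one split per unique value of "subject"
    splits = windows_ds.split("subject")

    # by explicit dataset indices: keys are the positions in the outer list
    splits = windows_ds.split([[0, 1, 2], [3]])
    train_set, valid_set = splits["0"], splits["1"]
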
+     def get_metadata(self) -> pd.DataFrame:
+         """Concatenate the metadata and description of the wrapped Epochs.
+
+         Returns
+         -------
+         metadata : pd.DataFrame
+             DataFrame containing as many rows as there are windows in the
+             BaseConcatDataset, with the metadata and description information
+             for each window.
+         """
+         if not all(
+             [
+                 isinstance(ds, (WindowsDataset, EEGWindowsDataset))
+                 for ds in self.datasets
+             ]
+         ):
+             raise TypeError(
+                 "Metadata dataframe can only be computed when all "
+                 "datasets are WindowsDataset or EEGWindowsDataset."
+             )
+
+         all_dfs = list()
+         for ds in self.datasets:
+             if hasattr(ds, "windows"):
+                 df = ds.windows.metadata
+             else:
+                 df = ds.metadata
+             for k, v in ds.description.items():
+                 df[k] = v
+             all_dfs.append(df)
+
+         return pd.concat(all_dfs)
+
+     @property
+     def transform(self):
+         return [ds.transform for ds in self.datasets]
+
+     @transform.setter
+     def transform(self, fn):
+         for i in range(len(self.datasets)):
+             self.datasets[i].transform = fn
+
+     @property
+     def target_transform(self):
+         return self._target_transform
+
+     @target_transform.setter
+     def target_transform(self, fn):
+         if not (callable(fn) or fn is None):
+             raise TypeError("target_transform must be a callable.")
+         self._target_transform = fn
+
+     def _outdated_save(self, path, overwrite=False):
+         """This is a copy of the old saving function, which had inconsistent
+         functionality for BaseDataset and WindowsDataset. It only exists to
+         ensure backwards compatibility by still being able to run the old tests.
+
+         Save dataset to files.
+
+         Parameters
+         ----------
+         path : str
+             Directory to which .fif / -epo.fif and .json files are stored.
+         overwrite : bool
+             Whether to delete old files (.json, .fif, -epo.fif) in specified
+             directory prior to saving.
+         """
+         warnings.warn(
+             "This function only exists for backwards compatibility "
+             "purposes. DO NOT USE!",
+             UserWarning,
+         )
+         if isinstance(self.datasets[0], EEGWindowsDataset):
+             raise NotImplementedError(
+                 "Outdated save not implemented for new window datasets."
+             )
+         if len(self.datasets) == 0:
+             raise ValueError("Expect at least one dataset")
+         if not (
+             hasattr(self.datasets[0], "raw") or hasattr(self.datasets[0], "windows")
+         ):
+             raise ValueError("dataset should have either raw or windows attribute")
+         file_name_templates = ["{}-raw.fif", "{}-epo.fif"]
+         description_file_name = os.path.join(path, "description.json")
+         target_file_name = os.path.join(path, "target_name.json")
+         if not overwrite:
+             from braindecode.datautil.serialization import (  # Import here to avoid circular import
+                 _check_save_dir_empty,
+             )
+
+             _check_save_dir_empty(path)
+         else:
+             for file_name_template in file_name_templates:
+                 file_names = glob(
+                     os.path.join(path, f"*{file_name_template.lstrip('{}')}")
+                 )
+                 _ = [os.remove(f) for f in file_names]
+             if os.path.isfile(target_file_name):
+                 os.remove(target_file_name)
+             if os.path.isfile(description_file_name):
+                 os.remove(description_file_name)
+             for kwarg_name in [
+                 "raw_preproc_kwargs",
+                 "window_kwargs",
+                 "window_preproc_kwargs",
+             ]:
+                 kwarg_path = os.path.join(path, ".".join([kwarg_name, "json"]))
+                 if os.path.exists(kwarg_path):
+                     os.remove(kwarg_path)
+
+         is_raw = hasattr(self.datasets[0], "raw")
+
+         if is_raw:
+             file_name_template = file_name_templates[0]
+         else:
+             file_name_template = file_name_templates[1]
+
+         for i_ds, ds in enumerate(self.datasets):
+             full_file_path = os.path.join(path, file_name_template.format(i_ds))
+             if is_raw:
+                 ds.raw.save(full_file_path, overwrite=overwrite)
+             else:
+                 ds.windows.save(full_file_path, overwrite=overwrite)
+
+         self.description.to_json(description_file_name)
+         for kwarg_name in [
+             "raw_preproc_kwargs",
+             "window_kwargs",
+             "window_preproc_kwargs",
+         ]:
+             if hasattr(self, kwarg_name):
+                 kwargs_path = os.path.join(path, ".".join([kwarg_name, "json"]))
+                 kwargs = getattr(self, kwarg_name)
+                 if kwargs is not None:
+                     json.dump(kwargs, open(kwargs_path, "w"))
+
+     @property
+     def description(self) -> pd.DataFrame:
+         df = pd.DataFrame([ds.description for ds in self.datasets])
+         df.reset_index(inplace=True, drop=True)
+         return df
+
+     def set_description(
+         self, description: dict | pd.DataFrame, overwrite: bool = False
+     ):
+         """Update (add or overwrite) the dataset description.
+
+         Parameters
+         ----------
+         description: dict | pd.DataFrame
+             Description in the form key: value where the length of the value
+             has to match the number of datasets.
+         overwrite: bool
+             Has to be True if a key in description already exists in the
+             dataset description.
+         """
+         description = pd.DataFrame(description)
+         for key, value in description.items():
+             for ds, value_ in zip(self.datasets, value):
+                 ds.set_description({key: value_}, overwrite=overwrite)
+
+     def save(self, path: str, overwrite: bool = False, offset: int = 0):
+         """Save datasets to files by creating one subdirectory for each dataset:
+
+         path/
+             0/
+                 0-raw.fif | 0-epo.fif
+                 description.json
+                 raw_preproc_kwargs.json (if raws were preprocessed)
+                 window_kwargs.json (if this is a windowed dataset)
+                 window_preproc_kwargs.json (if windows were preprocessed)
+                 target_name.json (if target_name is not None and dataset is raw)
+             1/
+                 1-raw.fif | 1-epo.fif
+                 description.json
+                 raw_preproc_kwargs.json (if raws were preprocessed)
+                 window_kwargs.json (if this is a windowed dataset)
+                 window_preproc_kwargs.json (if windows were preprocessed)
+                 target_name.json (if target_name is not None and dataset is raw)
+
+         Parameters
+         ----------
+         path : str
+             Directory in which subdirectories are created to store the
+             -raw.fif | -epo.fif and .json files.
+         overwrite : bool
+             Whether to delete old subdirectories that will be saved to in this
+             call.
+         offset : int
+             If provided, the integer is added to the id of the dataset in the
+             concat. This is useful in the setting of very large datasets, where
+             one dataset has to be processed and saved at a time to account for
+             its original position.
+         """
+         if len(self.datasets) == 0:
+             raise ValueError("Expect at least one dataset")
+         if not (
+             hasattr(self.datasets[0], "raw") or hasattr(self.datasets[0], "windows")
+         ):
+             raise ValueError("dataset should have either raw or windows attribute")
+         path_contents = os.listdir(path)
+         n_sub_dirs = len([os.path.isdir(e) for e in path_contents])
+         for i_ds, ds in enumerate(self.datasets):
+             # remove subdirectory from list of untouched files / subdirectories
+             if str(i_ds + offset) in path_contents:
+                 path_contents.remove(str(i_ds + offset))
+             # save_dir/i_ds/
+             sub_dir = os.path.join(path, str(i_ds + offset))
+             if os.path.exists(sub_dir):
+                 if overwrite:
+                     shutil.rmtree(sub_dir)
+                 else:
+                     raise FileExistsError(
+                         f"Subdirectory {sub_dir} already exists. Please select"
+                         f" a different directory, set overwrite=True, or "
+                         f"resolve manually."
+                     )
+             # save_dir/{i_ds+offset}/
+             os.makedirs(sub_dir)
+             # save_dir/{i_ds+offset}/{i_ds+offset}-{raw_or_epo}.fif
+             self._save_signals(sub_dir, ds, i_ds, offset)
+             # save_dir/{i_ds+offset}/metadata_df.pkl
+             self._save_metadata(sub_dir, ds)
+             # save_dir/{i_ds+offset}/description.json
+             self._save_description(sub_dir, ds.description)
+             # save_dir/{i_ds+offset}/raw_preproc_kwargs.json
+             # save_dir/{i_ds+offset}/window_kwargs.json
+             # save_dir/{i_ds+offset}/window_preproc_kwargs.json
+             self._save_kwargs(sub_dir, ds)
+             # save_dir/{i_ds+offset}/target_name.json
+             self._save_target_name(sub_dir, ds)
+         if overwrite:
+             # the following will be True for all datasets preprocessed and
+             # stored in parallel with braindecode.preprocessing.preprocess
+             if i_ds + 1 + offset < n_sub_dirs:
+                 warnings.warn(
+                     f"The number of saved datasets ({i_ds + 1 + offset}) "
+                     f"does not match the number of existing "
+                     f"subdirectories ({n_sub_dirs}). You may now "
+                     f"encounter a mix of differently preprocessed "
+                     f"datasets!",
+                     UserWarning,
+                 )
+         # if path contains files or directories that were not touched, raise
+         # warning
+         if path_contents:
+             warnings.warn(
+                 f"Chosen directory {path} contains other "
+                 f"subdirectories or files {path_contents}."
+             )
+
+     @staticmethod
+     def _save_signals(sub_dir, ds, i_ds, offset):
+         raw_or_epo = "raw" if hasattr(ds, "raw") else "epo"
+         fif_file_name = f"{i_ds + offset}-{raw_or_epo}.fif"
+         fif_file_path = os.path.join(sub_dir, fif_file_name)
+         raw_or_windows = "raw" if raw_or_epo == "raw" else "windows"
+
+         # The following appears to be necessary to avoid a CI failure when
+         # preprocessing WindowsDatasets with serialization enabled. The failure
+         # comes from `mne.epochs._check_consistency` which ensures the Epochs's
+         # object `times` attribute is not writeable.
+         getattr(ds, raw_or_windows).times.flags["WRITEABLE"] = False
+
+         getattr(ds, raw_or_windows).save(fif_file_path)
+
+     @staticmethod
+     def _save_metadata(sub_dir, ds):
+         if hasattr(ds, "metadata"):
+             metadata_file_path = os.path.join(sub_dir, "metadata_df.pkl")
+             ds.metadata.to_pickle(metadata_file_path)
+
+     @staticmethod
+     def _save_description(sub_dir, description):
+         description_file_path = os.path.join(sub_dir, "description.json")
+         description.to_json(description_file_path)
+
+     @staticmethod
+     def _save_kwargs(sub_dir, ds):
+         for kwargs_name in [
+             "raw_preproc_kwargs",
+             "window_kwargs",
+             "window_preproc_kwargs",
+         ]:
+             if hasattr(ds, kwargs_name):
+                 kwargs_file_name = ".".join([kwargs_name, "json"])
+                 kwargs_file_path = os.path.join(sub_dir, kwargs_file_name)
+                 kwargs = getattr(ds, kwargs_name)
+                 if kwargs is not None:
+                     with open(kwargs_file_path, "w") as f:
+                         json.dump(kwargs, f)
+
+     @staticmethod
+     def _save_target_name(sub_dir, ds):
+         if hasattr(ds, "target_name"):
+             target_file_path = os.path.join(sub_dir, "target_name.json")
+             with open(target_file_path, "w") as f:
+                 json.dump({"target_name": ds.target_name}, f)
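Finally, a sketch of round-tripping a dataset through save() and the loader in braindecode.datautil (the directory path is hypothetical; note that save() expects the target directory to exist already):

    import os

    from braindecode.datautil import load_concat_dataset

    os.makedirs("./saved_ds", exist_ok=True)
    windows_ds.save("./saved_ds", overwrite=True)
    restored = load_concat_dataset("./saved_ds", preload=False)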