PyPI - braindecode - Versions diffs - 1.3.0.dev180329405__py3-none-any.whl → 1.3.0.dev182330353__py3-none-any.whl - Mend

braindecode 1.3.0.dev180329405__py3-none-any.whl → 1.3.0.dev182330353__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (70)

braindecode/augmentation/base.py +1 -1
braindecode/datasets/__init__.py +12 -4
braindecode/datasets/base.py +115 -151
braindecode/datasets/bcicomp.py +4 -4
braindecode/datasets/bids.py +3 -3
braindecode/datasets/experimental.py +2 -2
braindecode/datasets/mne.py +3 -5
braindecode/datasets/moabb.py +17 -7
braindecode/datasets/nmt.py +2 -2
braindecode/datasets/sleep_physio_challe_18.py +2 -2
braindecode/datasets/sleep_physionet.py +2 -2
braindecode/datasets/tuh.py +2 -2
braindecode/datasets/xy.py +2 -2
braindecode/datautil/__init__.py +11 -1
braindecode/datautil/channel_utils.py +114 -0
braindecode/datautil/serialization.py +7 -7
braindecode/functional/functions.py +6 -2
braindecode/functional/initialization.py +2 -3
braindecode/models/__init__.py +6 -0
braindecode/models/atcnet.py +26 -27
braindecode/models/attentionbasenet.py +37 -32
braindecode/models/attn_sleep.py +2 -0
braindecode/models/base.py +280 -2
braindecode/models/bendr.py +469 -0
braindecode/models/biot.py +2 -0
braindecode/models/contrawr.py +2 -0
braindecode/models/ctnet.py +8 -3
braindecode/models/deepsleepnet.py +28 -19
braindecode/models/eegconformer.py +2 -2
braindecode/models/eeginception_erp.py +31 -25
braindecode/models/eegitnet.py +2 -0
braindecode/models/eegminer.py +2 -0
braindecode/models/eegnet.py +1 -1
braindecode/models/eegsym.py +917 -0
braindecode/models/eegtcnet.py +2 -0
braindecode/models/fbcnet.py +5 -1
braindecode/models/fblightconvnet.py +2 -0
braindecode/models/fbmsnet.py +20 -6
braindecode/models/ifnet.py +2 -0
braindecode/models/labram.py +33 -26
braindecode/models/medformer.py +758 -0
braindecode/models/msvtnet.py +2 -0
braindecode/models/patchedtransformer.py +1 -1
braindecode/models/signal_jepa.py +111 -27
braindecode/models/sinc_shallow.py +12 -9
braindecode/models/sstdpn.py +11 -11
braindecode/models/summary.csv +3 -0
braindecode/models/syncnet.py +2 -0
braindecode/models/tcn.py +2 -0
braindecode/models/usleep.py +26 -21
braindecode/models/util.py +3 -0
braindecode/modules/attention.py +10 -10
braindecode/modules/blocks.py +3 -3
braindecode/modules/filter.py +2 -9
braindecode/modules/layers.py +18 -17
braindecode/preprocessing/__init__.py +232 -3
braindecode/preprocessing/eegprep_preprocess.py +1202 -0
braindecode/preprocessing/mne_preprocess.py +142 -10
braindecode/preprocessing/preprocess.py +28 -18
braindecode/preprocessing/util.py +166 -0
braindecode/preprocessing/windowers.py +26 -20
braindecode/samplers/base.py +8 -8
braindecode/version.py +1 -1
{braindecode-1.3.0.dev180329405.dist-info → braindecode-1.3.0.dev182330353.dist-info}/METADATA +6 -2
braindecode-1.3.0.dev182330353.dist-info/RECORD +109 -0
braindecode-1.3.0.dev180329405.dist-info/RECORD +0 -103
{braindecode-1.3.0.dev180329405.dist-info → braindecode-1.3.0.dev182330353.dist-info}/WHEEL +0 -0
{braindecode-1.3.0.dev180329405.dist-info → braindecode-1.3.0.dev182330353.dist-info}/licenses/LICENSE.txt +0 -0
{braindecode-1.3.0.dev180329405.dist-info → braindecode-1.3.0.dev182330353.dist-info}/licenses/NOTICE.txt +0 -0
{braindecode-1.3.0.dev180329405.dist-info → braindecode-1.3.0.dev182330353.dist-info}/top_level.txt +0 -0

braindecode/datasets/xy.py CHANGED Viewed

@@ -12,7 +12,7 @@ import numpy as np
 import pandas as pd
 from numpy.typing import ArrayLike, NDArray
-from .base import BaseConcatDataset, BaseDataset
+from .base import BaseConcatDataset, RawDataset
 log = logging.getLogger(__name__)
@@ -69,7 +69,7 @@ def create_from_X_y(
         n_samples_per_x.append(x.shape[1])
         info = mne.create_info(ch_names=ch_names, sfreq=sfreq)
         raw = mne.io.RawArray(x, info)
-        base_dataset = BaseDataset(
+        base_dataset = RawDataset(
             raw, pd.Series({"target": target}), target_name="target"
         )
         base_datasets.append(base_dataset)

braindecode/datautil/__init__.py CHANGED Viewed

@@ -2,6 +2,10 @@
 Utilities for data manipulation.
 """
+from .channel_utils import (
+    division_channels_idx,
+    match_hemisphere_chans,
+)
 from .serialization import (
     _check_save_dir_empty,
     load_concat_dataset,
@@ -49,4 +53,10 @@ def __getattr__(name):
     raise AttributeError("No possible import named " + name)
-__all__ = ["load_concat_dataset", "save_concat_dataset", "_check_save_dir_empty"]
+__all__ = [
+    "load_concat_dataset",
+    "save_concat_dataset",
+    "_check_save_dir_empty",
+    "match_hemisphere_chans",
+    "division_channels_idx",
+]

braindecode/datautil/channel_utils.py ADDED Viewed

@@ -0,0 +1,114 @@
+"""
+Utilities for EEG channel manipulation and selection.
+This module provides functions for dividing and matching EEG channels,
+particularly for hemisphere-aware processing.
+"""
+import re
+from re import search
+def match_hemisphere_chans(left_chs, right_chs):
+    """
+    Match channels of the left and right hemispheres based on their names.
+    This function pairs channels from the left and right hemispheres by matching
+    their numeric identifiers. For a left channel with number N, it finds the
+    corresponding right channel with number N+1.
+    Parameters
+    ----------
+    left_chs : list of str
+        A list of channel names from the left hemisphere.
+    right_chs : list of str
+        A list of channel names from the right hemisphere.
+    Returns
+    -------
+    list of tuples
+        List of tuples with matched channel names from the left and right hemispheres.
+        Each tuple contains (left_channel, right_channel).
+    Raises
+    ------
+    ValueError
+        If the left and right channels do not match in length.
+    ValueError
+        If a channel name does not contain a number.
+    ValueError
+        If no matching right hemisphere channel is found for a left channel.
+    Examples
+    --------
+    >>> left = ['C3', 'F3']
+    >>> right = ['C4', 'F4']
+    >>> match_hemisphere_chans(left, right)
+    [('C3', 'C4'), ('F3', 'F4')]
+    """
+    if len(left_chs) != len(right_chs):
+        raise ValueError("Left and right channels do not match.")
+    right_chs = list(right_chs)
+    regexp = r"\d+"
+    out = []
+    for left in left_chs:
+        match = re.search(regexp, left)
+        if match is None:
+            raise ValueError(f"Channel '{left}' does not contain a number.")
+        chan_idx = 1 + int(match.group())
+        target_r = re.sub(regexp, str(chan_idx), left)
+        for right in right_chs:
+            if right == target_r:
+                out.append((left, right))
+                right_chs.remove(right)
+                break
+        else:
+            raise ValueError(
+                f"Found no right hemisphere matching channel for '{left}'."
+            )
+    return out
+def division_channels_idx(ch_names):
+    """
+    Divide EEG channel names into left, right, and middle based on numbering.
+    This function categorizes channels by their numeric suffix:
+    - Odd-numbered channels → left hemisphere
+    - Even-numbered channels → right hemisphere
+    - Channels without numbers → middle/midline
+    Parameters
+    ----------
+    ch_names : list of str
+        A list of EEG channel names to be divided based on their numbering.
+    Returns
+    -------
+    tuple of lists
+        Three lists containing the channel names:
+        - left: Odd-numbered channels (e.g., C3, F3, P3)
+        - right: Even-numbered channels (e.g., C4, F4, P4)
+        - middle: Channels without numbers (e.g., Cz, Fz, Pz)
+    Notes
+    -----
+    The function identifies channel numbers by searching for numeric characters
+    in the channel names. Standard 10-20 system EEG channel naming conventions
+    use odd numbers for left hemisphere and even numbers for right hemisphere.
+    Examples
+    --------
+    >>> channels = ['FP1', 'FP2', 'O1', 'O2', 'FZ']
+    >>> division_channels_idx(channels)
+    (['FP1', 'O1'], ['FP2', 'O2'], ['FZ'])
+    """
+    left, right, middle = [], [], []
+    for ch in ch_names:
+        number = search(r"\d+", ch)
+        if number is not None:
+            (left if int(number[0]) % 2 else right).append(ch)
+        else:
+            middle.append(ch)
+    return left, right, middle

braindecode/datautil/serialization.py CHANGED Viewed

@@ -19,8 +19,8 @@ from joblib import Parallel, delayed
 from ..datasets.base import (
     BaseConcatDataset,
-    BaseDataset,
     EEGWindowsDataset,
+    RawDataset,
     WindowsDataset,
 )
@@ -35,7 +35,7 @@ def save_concat_dataset(path, concat_dataset, overwrite=False):
 def _outdated_load_concat_dataset(path, preload, ids_to_load=None, target_name=None):
-    """Load a stored BaseConcatDataset of BaseDatasets or WindowsDatasets from
+    """Load a stored BaseConcatDataset from
     files.
     Parameters
@@ -52,7 +52,7 @@ def _outdated_load_concat_dataset(path, preload, ids_to_load=None, target_name=N
     Returns
     -------
-    concat_dataset: BaseConcatDataset of BaseDatasets or WindowsDatasets
+    concat_dataset: BaseConcatDataset
     """
     # assume we have a single concat dataset to load
     is_raw = (path / "0-raw.fif").is_file()
@@ -87,7 +87,7 @@ def _outdated_load_concat_dataset(path, preload, ids_to_load=None, target_name=N
         for i_signal, signal in enumerate(all_signals):
             if is_raw:
                 datasets.append(
-                    BaseDataset(
+                    RawDataset(
                         signal, description.iloc[i_signal], target_name=target_name
                     )
                 )
@@ -175,7 +175,7 @@ def _load_signals(fif_file, preload, is_raw):
 def load_concat_dataset(path, preload, ids_to_load=None, target_name=None, n_jobs=1):
-    """Load a stored BaseConcatDataset of BaseDatasets or WindowsDatasets from
+    """Load a stored BaseConcatDataset from
     files.
     Parameters
@@ -194,7 +194,7 @@ def load_concat_dataset(path, preload, ids_to_load=None, target_name=None, n_job
     Returns
     -------
-    concat_dataset: BaseConcatDataset of BaseDatasets or WindowsDatasets
+    concat_dataset: BaseConcatDataset
     """
     # Make sure we always work with a pathlib.Path
     path = Path(path)
@@ -266,7 +266,7 @@ def _load_parallel(path, i, preload, is_raw, has_stored_windows):
         target_name = json.load(open(target_file_path, "r"))["target_name"]
     if is_raw and (not has_stored_windows):
-        dataset = BaseDataset(signals, description, target_name)
+        dataset = RawDataset(signals, description, target_name)
     else:
         window_kwargs = _load_kwargs_json("window_kwargs", sub_dir)
         windows_ds_kwargs = [

braindecode/functional/functions.py CHANGED Viewed

@@ -181,20 +181,24 @@ def plv_time(x, forward_fourier=True, epsilon: float = 1e-6):
     The Phase Locking Value (PLV) is a measure of the synchronization between
     different channels by evaluating the consistency of phase differences
     over time. It ranges from 0 (no synchronization) to 1 (perfect
-    synchronization) [1]_.
+    synchronization) [Lachaux1999]_.
     Parameters
     ----------
     x : torch.Tensor
         Input tensor containing the signal data.
         - If `forward_fourier` is `True`, the shape should be `(..., channels, time)`.
         - If `forward_fourier` is `False`, the shape should be `(..., channels, freqs, 2)`,
           where the last dimension represents the real and imaginary parts.
     forward_fourier : bool, optional
         Specifies the format of the input tensor `x`.
         - If `True`, `x` is assumed to be in the time domain.
         - If `False`, `x` is assumed to be in the Fourier domain with separate real and
           imaginary components.
         Default is `True`.
     epsilon : float, default 1e-6
         Small numerical value to ensure positivity constraint on the complex part
@@ -207,7 +211,7 @@ def plv_time(x, forward_fourier=True, epsilon: float = 1e-6):
     References
     ----------
-    [1] Lachaux, J. P., Rodriguez, E., Martinerie, J., & Varela, F. J. (1999).
+    .. [Lachaux1999] Lachaux, J. P., Rodriguez, E., Martinerie, J., & Varela, F. J. (1999).
         Measuring phase synchrony in brain signals. Human brain mapping,
         8(4), 194-208.
     """

braindecode/functional/initialization.py CHANGED Viewed

@@ -5,9 +5,8 @@ from torch import nn
 def glorot_weight_zero_bias(model):
     """Initialize parameters of all modules by initializing weights with
-    glorot
-     uniform/xavier initialization, and setting biases to zero. Weights from
-     batch norm layers are set to 1.
+    glorot uniform/xavier initialization, and setting biases to zero. Weights from
+    batch norm layers are set to 1.
     Parameters
     ----------

braindecode/models/__init__.py CHANGED Viewed

@@ -6,6 +6,7 @@ from .atcnet import ATCNet
 from .attentionbasenet import AttentionBaseNet
 from .attn_sleep import AttnSleep
 from .base import EEGModuleMixin
+from .bendr import BENDR
 from .biot import BIOT
 from .contrawr import ContraWR
 from .ctnet import CTNet
@@ -19,6 +20,7 @@ from .eegminer import EEGMiner
 from .eegnet import EEGNet, EEGNetv4
 from .eegnex import EEGNeX
 from .eegsimpleconv import EEGSimpleConv
+from .eegsym import EEGSym
 from .eegtcnet import EEGTCNet
 from .fbcnet import FBCNet
 from .fblightconvnet import FBLightConvNet
@@ -26,6 +28,7 @@ from .fbmsnet import FBMSNet
 from .hybrid import HybridNet
 from .ifnet import IFNet
 from .labram import Labram
+from .medformer import MEDFormer
 from .msvtnet import MSVTNet
 from .patchedtransformer import PBT
 from .sccnet import SCCNet
@@ -58,6 +61,7 @@ __all__ = [
     "AttentionBaseNet",
     "EEGModuleMixin",
     "BIOT",
+    "BENDR",
     "ContraWR",
     "CTNet",
     "Deep4Net",
@@ -70,6 +74,7 @@ __all__ = [
     "EEGNet",
     "EEGNetv4",
     "EEGNeX",
+    "EEGSym",
     "EEGSimpleConv",
     "EEGTCNet",
     "FBCNet",
@@ -78,6 +83,7 @@ __all__ = [
     "HybridNet",
     "IFNet",
     "Labram",
+    "MEDFormer",
     "MSVTNet",
     "PBT",
     "SCCNet",

braindecode/models/atcnet.py CHANGED Viewed

@@ -15,7 +15,7 @@ from braindecode.modules import CausalConv1d, Ensure4d, MaxNormLinear
 class ATCNet(EEGModuleMixin, nn.Module):
     """ATCNet from Altaheri et al. (2022) [1]_.
-    :bdg-success:`Convolution` :bdg-info:`Small Attention`
+    :bdg-success:`Convolution` :bdg-secondary:`Recurrent` :bdg-info:`Small Attention`
     .. figure:: https://user-images.githubusercontent.com/25565236/185449791-e8539453-d4fa-41e1-865a-2cf7e91f60ef.png
         :align: center
@@ -50,7 +50,7 @@ class ATCNet(EEGModuleMixin, nn.Module):
         - **Temporal conv** (:class:`torch.nn.Conv2d`) with kernel ``(L_t, 1)`` builds a
             FIR-like filter bank (``F1`` maps).
         - **Depthwise spatial conv** (:class:`torch.nn.Conv2d`, ``groups=F1``) with kernel
-          ``(1, n_chans)`` learns per-filter spatial projections (akin to EEGNet’s CSP-like step).
+          ``(1, n_chans)`` learns per-filter spatial projections (akin to EEGNet's CSP-like step).
         - **BN → ELU → AvgPool → Dropout** to stabilize and condense activations.
         - **Refining temporal conv** (:class:`torch.nn.Conv2d`) with kernel ``(L_r, 1)`` +
           **BN → ELU → AvgPool → Dropout**.
@@ -62,13 +62,15 @@ class ATCNet(EEGModuleMixin, nn.Module):
     - **Sliding-Window Sequencer**
-      From the condensed time axis (length ``T_c``), ATCNet forms ``n`` overlapping windows
-      of width ``T_w = T_c - n + 1`` (one start per index). Each window produces a sequence
-      ``(B, F2, T_w)`` forwarded to its own attention–TCN branch. This creates *parallel*
-      encoders over shifted contexts and is key to robustness on nonstationary EEG.
+        From the condensed time axis (length ``T_c``), ATCNet forms ``n`` overlapping windows
+        of width ``T_w = T_c - n + 1`` (one start per index). Each window produces a sequence
+        ``(B, F2, T_w)`` forwarded to its own attention-TCN branch. This creates *parallel*
+        encoders over shifted contexts and is key to robustness on nonstationary EEG.
     - :class:`_AttentionBlock` **(small MHA on temporal positions)**
+        Attention here is *local to a window* and purely temporal.
         - *Operations.*
         - Rearrange to ``(B, T_w, F2)``,
         - Normalization :class:`torch.nn.LayerNorm`
@@ -76,11 +78,8 @@ class ATCNet(EEGModuleMixin, nn.Module):
         - Dropout :class:`torch.nn.Dropout`
         - Rearrange back to ``(B, F2, T_w)``.
-    **Note**: Attention is *local to a window* and purely temporal.
-    *Role.* Re-weights evidence across the window, letting the model emphasize informative
-    segments (onsets, bursts) before causal convolutions aggregate history.
+        *Role.* Re-weights evidence across the window, letting the model emphasize informative
+        segments (onsets, bursts) before causal convolutions aggregate history.
     - :class:`_TCNResidualBlock` **(causal dilated temporal CNN)**
@@ -90,8 +89,8 @@ class ATCNet(EEGModuleMixin, nn.Module):
           a residual (identity or 1x1 mapping).
         - The final feature used per window is the *last* causal step ``[..., -1]`` (forecast-style).
-    *Role.* Efficient long-range temporal integration with stable gradients; the dilated
-    receptive field complements attention’s soft selection.
+        *Role.* Efficient long-range temporal integration with stable gradients; the dilated
+        receptive field complements attention's soft selection.
     - **Aggregation & Classifier**
@@ -104,16 +103,16 @@ class ATCNet(EEGModuleMixin, nn.Module):
     .. rubric:: Convolutional Details
     - **Temporal.** Temporal structure is learned in three places:
-        - (1) the stem’s wide ``(L_t, 1)`` conv (learned filter bank),
+        - (1) the stem's wide ``(L_t, 1)`` conv (learned filter bank),
         - (2) the refining ``(L_r, 1)`` conv after pooling (short-term dynamics), and
-        - (3) the TCN’s causal 1-D convolutions with exponentially increasing dilation
+        - (3) the TCN's causal 1-D convolutions with exponentially increasing dilation
           (long-range dependencies). The minimum sequence length required by the TCN stack is
           ``(K_t - 1)·2^{L-1} + 1``; the implementation *auto-scales* kernels/pools/windows
           when inputs are shorter to preserve feasibility.
     - **Spatial.** A depthwise spatial conv spans the **full montage** (kernel ``(1, n_chans)``),
         producing *per-temporal-filter* spatial projections (no cross-filter mixing at this step).
-        This mirrors EEGNet’s interpretability: each temporal filter has its own spatial pattern.
+        This mirrors EEGNet's interpretability: each temporal filter has its own spatial pattern.
     .. rubric:: Attention / Sequential Modules
@@ -137,17 +136,17 @@ class ATCNet(EEGModuleMixin, nn.Module):
     .. rubric:: Usage and Configuration
-        - ``conv_block_n_filters (F1)``, ``conv_block_depth_mult (D)`` → capacity of the stem
-        (with ``F2 = F1·D`` feeding attention/TCN), dimensions aligned to ``F2``, like :class:`EEGNet`.
-        - Pool sizes ``P1,P2`` trade temporal resolution for stability/compute; they set
-        ``T_c = T/(P1·P2)`` and thus window width ``T_w``.
-        - ``n_windows`` controls the ensemble over shifts (compute ∝ windows).
-        - ``att_num_heads``, ``att_head_dim`` set attention capacity; keep ``H·d_h ≈ F2``.
-        - ``tcn_depth``, ``tcn_kernel_size`` govern receptive field; larger values demand
-        longer inputs (see minimum length above). The implementation warns and *rescales*
-        kernels/pools/windows if inputs are too short.
-        - **Aggregation choice.** ``concat=False`` (default, average of per-window logits) matches
-        the official code; ``concat=True`` mirrors the paper’s concatenation variant.
+    - ``conv_block_n_filters (F1)``, ``conv_block_depth_mult (D)`` → capacity of the stem
+      (with ``F2 = F1·D`` feeding attention/TCN), dimensions aligned to ``F2``, like :class:`EEGNet`.
+    - Pool sizes ``P1,P2`` trade temporal resolution for stability/compute; they set
+      ``T_c = T/(P1·P2)`` and thus window width ``T_w``.
+    - ``n_windows`` controls the ensemble over shifts (compute ∝ windows).
+    - ``att_num_heads``, ``att_head_dim`` set attention capacity; keep ``H·d_h ≈ F2``.
+    - ``tcn_depth``, ``tcn_kernel_size`` govern receptive field; larger values demand
+      longer inputs (see minimum length above). The implementation warns and *rescales*
+      kernels/pools/windows if inputs are too short.
+    - **Aggregation choice.** ``concat=False`` (default, average of per-window logits) matches
+      the official code; ``concat=True`` mirrors the paper's concatenation variant.
     Notes

braindecode/models/attentionbasenet.py CHANGED Viewed

@@ -97,7 +97,7 @@ class AttentionBaseNet(EEGModuleMixin, nn.Module):
     - **Temporal (where time-domain patterns are learned).**
         Wide kernels in the stem (``(1, L_t)``) act as a learned filter bank for oscillatory
-        bands/transients; the attention block’s depthwise temporal conv (``(1, L_a)``) sharpens
+        bands/transients; the attention block's depthwise temporal conv (``(1, L_a)``) sharpens
         short-term dynamics after downsampling. Pool sizes/strides (``P₁,S₁`` then ``P₂,S₂``)
         set the token rate and effective temporal resolution.
@@ -127,23 +127,24 @@ class AttentionBaseNet(EEGModuleMixin, nn.Module):
     .. rubric:: Additional Mechanisms
-        - **Attention variants at a glance.**
-        - ``"se"``: Squeeze-and-Excitation (global pooling → bottleneck → gates).
-        - ``"gsop"``: Global second-order pooling (covariance-aware channel weights).
-        - ``"fca"``: Frequency Channel Attention (DCT summary; uses ``seq_len`` and ``freq_idx``).
-        - ``"encnet"``: EncNet with learned codewords (uses ``n_codewords``).
-        - ``"eca"``: Efficient Channel Attention (local 1-D conv over channel descriptor; uses ``kernel_size``).
-        - ``"ge"``: Gather–Excite (context pooling with optional MLP; can use ``extra_params``).
-        - ``"gct"``: Gated Channel Transformation (global context normalization + gating).
-        - ``"srm"``: Style-based recalibration (mean–std descriptors; optional MLP).
-        - ``"cbam"``: Channel then temporal attention (uses ``kernel_size``).
-        - ``"cat"`` / ``"catlite"``: Collaborative (channel ± temporal) attention; *lite* omits temporal.
-        - **Auto-compatibility on short inputs.**
+    **Attention variants at a glance:**
-    If the input duration is too short for the configured kernels/pools, the implementation
-    **automatically rescales** temporal lengths/strides downward (with a warning) to keep
-    shapes valid and preserve the pipeline semantics.
+    - ``"se"``: Squeeze-and-Excitation (global pooling → bottleneck → gates).
+    - ``"gsop"``: Global second-order pooling (covariance-aware channel weights).
+    - ``"fca"``: Frequency Channel Attention (DCT summary; uses ``seq_len`` and ``freq_idx``).
+    - ``"encnet"``: EncNet with learned codewords (uses ``n_codewords``).
+    - ``"eca"``: Efficient Channel Attention (local 1-D conv over channel descriptor; uses ``kernel_size``).
+    - ``"ge"``: Gather–Excite (context pooling with optional MLP; can use ``extra_params``).
+    - ``"gct"``: Gated Channel Transformation (global context normalization + gating).
+    - ``"srm"``: Style-based recalibration (mean–std descriptors; optional MLP).
+    - ``"cbam"``: Channel then temporal attention (uses ``kernel_size``).
+    - ``"cat"`` / ``"catlite"``: Collaborative (channel ± temporal) attention; *lite* omits temporal.
+    **Auto-compatibility on short inputs:**
+        If the input duration is too short for the configured kernels/pools, the implementation
+        **automatically rescales** temporal lengths/strides downward (with a warning) to keep
+        shapes valid and preserve the pipeline semantics.
     .. rubric:: Usage and Configuration
@@ -158,9 +159,9 @@ class AttentionBaseNet(EEGModuleMixin, nn.Module):
     - ``drop_prob_inp`` and ``drop_prob_attn``: regularize stem and attention stages.
     - **Training tips.**
-    Start with moderate pooling (e.g., ``P₁=75,S₁=15``) and ELU activations; enable attention
-    only after the stem learns stable filters. For small datasets, prefer simpler modes
-    (``"se"``, ``"eca"``) before heavier ones (``"gsop"``, ``"encnet"``).
+        Start with moderate pooling (e.g., ``P₁=75,S₁=15``) and ELU activations; enable attention
+        only after the stem learns stable filters. For small datasets, prefer simpler modes
+        (``"se"``, ``"eca"``) before heavier ones (``"gsop"``, ``"encnet"``).
     Notes
     -----
@@ -170,6 +171,7 @@ class AttentionBaseNet(EEGModuleMixin, nn.Module):
       specific variants (CBAM/CAT).
     - The paper and original code with more details about the methodological
       choices are available at the [Martin2023]_ and [MartinCode]_.
     .. versionadded:: 0.9
     Parameters
@@ -198,19 +200,21 @@ class AttentionBaseNet(EEGModuleMixin, nn.Module):
         the depth of the network after the initial layer. Default is 16.
     attention_mode : str, optional
         The type of attention mechanism to apply. If `None`, no attention is applied.
-            - "se" for Squeeze-and-excitation network
-            - "gsop" for Global Second-Order Pooling
-            - "fca" for Frequency Channel Attention Network
-            - "encnet" for context encoding module
-            - "eca" for Efficient channel attention for deep convolutional neural networks
-            - "ge" for Gather-Excite
-            - "gct" for Gated Channel Transformation
-            - "srm" for Style-based Recalibration Module
-            - "cbam" for Convolutional Block Attention Module
-            - "cat" for Learning to collaborate channel and temporal attention
-            from multi-information fusion
-            - "catlite" for Learning to collaborate channel attention
-        from multi-information fusion (lite version, cat w/o temporal attention)
+        - "se" for Squeeze-and-excitation network
+        - "gsop" for Global Second-Order Pooling
+        - "fca" for Frequency Channel Attention Network
+        - "encnet" for context encoding module
+        - "eca" for Efficient channel attention for deep convolutional neural networks
+        - "ge" for Gather-Excite
+        - "gct" for Gated Channel Transformation
+        - "srm" for Style-based Recalibration Module
+        - "cbam" for Convolutional Block Attention Module
+        - "cat" for Learning to collaborate channel and temporal attention
+          from multi-information fusion
+        - "catlite" for Learning to collaborate channel attention
+          from multi-information fusion (lite version, cat w/o temporal attention)
     pool_length : int, default=8
         The length of the window for the average pooling operation.
     pool_stride : int, default=8
@@ -499,6 +503,7 @@ class _ChannelAttentionBlock(nn.Module):
     ----------
     attention_mode : str, optional
         The type of attention mechanism to apply. If `None`, no attention is applied.
         - "se" for Squeeze-and-excitation network
         - "gsop" for Global Second-Order Pooling
         - "fca" for Frequency Channel Attention Network

braindecode/models/attn_sleep.py CHANGED Viewed

@@ -18,6 +18,8 @@ from braindecode.modules import CausalConv1d
 class AttnSleep(EEGModuleMixin, nn.Module):
     """Sleep Staging Architecture from Eldele et al. (2021) [Eldele2021]_.
+    :bdg-success:`Convolution` :bdg-info:`Small Attention`
     .. figure:: https://raw.githubusercontent.com/emadeldeen24/AttnSleep/refs/heads/main/imgs/AttnSleep.png
         :align: center
         :alt: AttnSleep Architecture

braindecode 1.3.0.dev180329405__py3-none-any.whl → 1.3.0.dev182330353__py3-none-any.whl

braindecode 1.3.0.dev180329405__py3-none-any.whl → 1.3.0.dev182330353__py3-none-any.whl