PyPI - eegdash - Versions diffs - 0.3.9.dev182388821__py3-none-any.whl → 0.4.0.dev132__py3-none-any.whl - Mend

eegdash 0.3.9.dev182388821__py3-none-any.whl → 0.4.0.dev132__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of eegdash might be problematic. Click here for more details.

Files changed (15) hide show

eegdash/__init__.py +1 -1
eegdash/api.py +68 -145
eegdash/bids_eeg_metadata.py +149 -27
eegdash/data_utils.py +63 -254
eegdash/dataset/dataset.py +27 -21
eegdash/downloader.py +176 -0
eegdash/features/datasets.py +4 -3
eegdash/hbn/preprocessing.py +1 -3
eegdash/hbn/windows.py +0 -2
eegdash/logging.py +23 -0
{eegdash-0.3.9.dev182388821.dist-info → eegdash-0.4.0.dev132.dist-info}/METADATA +5 -56
{eegdash-0.3.9.dev182388821.dist-info → eegdash-0.4.0.dev132.dist-info}/RECORD +15 -13
{eegdash-0.3.9.dev182388821.dist-info → eegdash-0.4.0.dev132.dist-info}/WHEEL +0 -0
{eegdash-0.3.9.dev182388821.dist-info → eegdash-0.4.0.dev132.dist-info}/licenses/LICENSE +0 -0
{eegdash-0.3.9.dev182388821.dist-info → eegdash-0.4.0.dev132.dist-info}/top_level.txt +0 -0

eegdash/data_utils.py CHANGED Viewed

@@ -1,10 +1,8 @@
 import io
 import json
-import logging
 import os
 import re
 import traceback
-import warnings
 from contextlib import redirect_stderr
 from pathlib import Path
 from typing import Any
@@ -13,9 +11,7 @@ import mne
 import mne_bids
 import numpy as np
 import pandas as pd
-import s3fs
 from bids import BIDSLayout
-from fsspec.callbacks import TqdmCallback
 from joblib import Parallel, delayed
 from mne._fiff.utils import _read_segments_file
 from mne.io import BaseRaw
@@ -23,10 +19,11 @@ from mne_bids import BIDSPath
 from braindecode.datasets import BaseDataset
+from . import downloader
+from .bids_eeg_metadata import enrich_from_participants
+from .logging import logger
 from .paths import get_default_cache_dir
-logger = logging.getLogger("eegdash")
 class EEGDashBaseDataset(BaseDataset):
     """A single EEG recording hosted on AWS S3 and cached locally upon first access.
@@ -73,6 +70,7 @@ class EEGDashBaseDataset(BaseDataset):
         # Compute a dataset folder name under cache_dir that encodes preprocessing
         # (e.g., bdf, mini) to avoid overlapping with the original dataset cache.
         self.dataset_folder = record.get("dataset", "")
+        # TODO: remove this hack when competition is over
         if s3_bucket:
             suffixes: list[str] = []
             bucket_lower = str(s3_bucket).lower()
@@ -91,6 +89,7 @@ class EEGDashBaseDataset(BaseDataset):
             rel = Path(self.dataset_folder) / rel
         self.filecache = self.cache_dir / rel
         self.bids_root = self.cache_dir / self.dataset_folder
         self.bidspath = BIDSPath(
             root=self.bids_root,
             datatype="eeg",
@@ -98,113 +97,18 @@ class EEGDashBaseDataset(BaseDataset):
             **self.bids_kwargs,
         )
-        self.s3file = self._get_s3path(record["bidspath"])
+        self.s3file = downloader.get_s3path(self.s3_bucket, record["bidspath"])
         self.bids_dependencies = record["bidsdependencies"]
-        # Temporary fix for BIDS dependencies path
-        # just to release to the competition
+        self.bids_dependencies_original = record["bidsdependencies"]
+        # TODO: remove this temporary fix for the BIDS dependencies path
+        # once the competition is over and the dataset is digested properly
         if not self.s3_open_neuro:
-            self.bids_dependencies_original = self.bids_dependencies
             self.bids_dependencies = [
                 dep.split("/", 1)[1] for dep in self.bids_dependencies
             ]
         self._raw = None
-    def _get_s3path(self, filepath: str) -> str:
-        """Helper to form an AWS S3 URI for the given relative filepath."""
-        return f"{self.s3_bucket}/{filepath}"
-    def _download_s3(self) -> None:
-        """Download function that gets the raw EEG data from S3."""
-        filesystem = s3fs.S3FileSystem(
-            anon=True, client_kwargs={"region_name": "us-east-2"}
-        )
-        if not self.s3_open_neuro:
-            self.s3file = re.sub(r"(^|/)ds\d{6}/", r"\1", self.s3file, count=1)
-            if self.s3file.endswith(".set"):
-                self.s3file = self.s3file[:-4] + ".bdf"
-                self.filecache = self.filecache.with_suffix(".bdf")
-        self.filecache.parent.mkdir(parents=True, exist_ok=True)
-        info = filesystem.info(self.s3file)
-        size = info.get("size") or info.get("Size")
-        callback = TqdmCallback(
-            size=size,
-            tqdm_kwargs=dict(
-                desc=f"Downloading {Path(self.s3file).name}",
-                unit="B",
-                unit_scale=True,
-                unit_divisor=1024,
-                dynamic_ncols=True,
-                leave=True,
-                mininterval=0.2,
-                smoothing=0.1,
-                miniters=1,
-                bar_format="{desc}: {percentage:3.0f}%|{bar}| {n_fmt}/{total_fmt} "
-                "[{elapsed}<{remaining}, {rate_fmt}]",
-            ),
-        )
-        filesystem.get(self.s3file, self.filecache, callback=callback)
-        self.filenames = [self.filecache]
-    def _download_dependencies(self) -> None:
-        """Download all BIDS dependency files (metadata files, recording sidecar files)
-        from S3 and cache them locally.
-        """
-        filesystem = s3fs.S3FileSystem(
-            anon=True, client_kwargs={"region_name": "us-east-2"}
-        )
-        for i, dep in enumerate(self.bids_dependencies):
-            if not self.s3_open_neuro:
-                # fix this when our bucket is integrated into the
-                # mongodb
-                # if the file have ".set" replace to ".bdf"
-                if dep.endswith(".set"):
-                    dep = dep[:-4] + ".bdf"
-            s3path = self._get_s3path(dep)
-            if not self.s3_open_neuro:
-                dep = self.bids_dependencies_original[i]
-            dep_path = Path(dep)
-            if dep_path.parts and dep_path.parts[0] == self.record.get("dataset"):
-                dep_local = Path(self.dataset_folder, *dep_path.parts[1:])
-            else:
-                dep_local = Path(self.dataset_folder) / dep_path
-            filepath = self.cache_dir / dep_local
-            if not self.s3_open_neuro:
-                if filepath.suffix == ".set":
-                    filepath = filepath.with_suffix(".bdf")
-                if self.filecache.suffix == ".set":
-                    self.filecache = self.filecache.with_suffix(".bdf")
-            # here, we download the dependency and it is fine
-            # in the case of the competition.
-            if not filepath.exists():
-                filepath.parent.mkdir(parents=True, exist_ok=True)
-                info = filesystem.info(s3path)
-                size = info.get("size") or info.get("Size")
-                callback = TqdmCallback(
-                    size=size,
-                    tqdm_kwargs=dict(
-                        desc=f"Downloading {Path(s3path).name}",
-                        unit="B",
-                        unit_scale=True,
-                        unit_divisor=1024,
-                        dynamic_ncols=True,
-                        leave=True,
-                        mininterval=0.2,
-                        smoothing=0.1,
-                        miniters=1,
-                        bar_format="{desc}: {percentage:3.0f}%|{bar}| {n_fmt}/{total_fmt} "
-                        "[{elapsed}<{remaining}, {rate_fmt}]",
-                    ),
-                )
-                filesystem.get(s3path, filepath, callback=callback)
     def _get_raw_bids_args(self) -> dict[str, Any]:
         """Helper to restrict the metadata record to the fields needed to locate a BIDS
         recording.
@@ -222,130 +126,43 @@ class EEGDashBaseDataset(BaseDataset):
         if not os.path.exists(self.filecache):  # not preload
             if self.bids_dependencies:
-                self._download_dependencies()
-            self._download_s3()
+                downloader.download_dependencies(
+                    s3_bucket=self.s3_bucket,
+                    bids_dependencies=self.bids_dependencies,
+                    bids_dependencies_original=self.bids_dependencies_original,
+                    cache_dir=self.cache_dir,
+                    dataset_folder=self.dataset_folder,
+                    record=self.record,
+                    s3_open_neuro=self.s3_open_neuro,
+                )
+            self.filecache = downloader.download_s3_file(
+                self.s3file, self.filecache, self.s3_open_neuro
+            )
+            self.filenames = [self.filecache]
         if self._raw is None:
-            # capturing any warnings
-            # to-do: remove this once is fixed on the mne-bids side.
-            with warnings.catch_warnings(record=True) as w:
-                # Ensure all warnings are captured into 'w' and not shown to users
-                warnings.simplefilter("always")
-                try:
-                    # mne-bids emits RuntimeWarnings to stderr; silence stderr during read
-                    _stderr_buffer = io.StringIO()
-                    with redirect_stderr(_stderr_buffer):
-                        self._raw = mne_bids.read_raw_bids(
-                            bids_path=self.bidspath, verbose="ERROR"
-                        )
-                    # Parse unmapped participants.tsv fields reported by mne-bids and
-                    # inject them into Raw.info and the dataset description generically.
-                    extras = self._extract_unmapped_participants_from_warnings(w)
-                    if extras:
-                        # 1) Attach to Raw.info under subject_info.participants_extras
-                        try:
-                            subject_info = self._raw.info.get("subject_info") or {}
-                            if not isinstance(subject_info, dict):
-                                subject_info = {}
-                            pe = subject_info.get("participants_extras") or {}
-                            if not isinstance(pe, dict):
-                                pe = {}
-                            # Merge without overwriting
-                            for k, v in extras.items():
-                                pe.setdefault(k, v)
-                            subject_info["participants_extras"] = pe
-                            self._raw.info["subject_info"] = subject_info
-                        except Exception:
-                            # Non-fatal; continue
-                            pass
-                        # 2) Also add to this dataset's description, if possible, so
-                        #    targets can be selected later without naming specifics.
-                        try:
-                            if isinstance(self.description, dict):
-                                for k, v in extras.items():
-                                    self.description.setdefault(k, v)
-                            elif isinstance(self.description, pd.Series):
-                                for k, v in extras.items():
-                                    if k not in self.description.index:
-                                        self.description.loc[k] = v
-                        except Exception:
-                            pass
-                except Exception as e:
-                    logger.error(
-                        f"Error while reading BIDS file: {self.bidspath}\n"
-                        "This may be due to a missing or corrupted file.\n"
-                        "Please check the file and try again."
-                    )
-                    logger.error(f"Exception: {e}")
-                    logger.error(traceback.format_exc())
-                    raise e
-                # Filter noisy mapping notices from mne-bids; surface others
-                for captured_warning in w:
-                    try:
-                        msg = str(captured_warning.message)
-                    except Exception:
-                        continue
-                    # Suppress verbose participants mapping messages
-                    if "Unable to map the following column" in msg and "MNE" in msg:
-                        logger.debug(
-                            "Suppressed mne-bids mapping warning while reading BIDS file: %s",
-                            msg,
-                        )
-                        continue
-    def _extract_unmapped_participants_from_warnings(
-        self, warnings_list: list[Any]
-    ) -> dict[str, Any]:
-        """Scan captured warnings from mne-bids and extract unmapped participants.tsv
-        entries in a generic way.
-        Optionally, the column name can carry a note in parentheses that we ignore
-        for key/value extraction. Returns a mapping of column name -> raw value.
-        """
-        extras: dict[str, Any] = {}
-        header = "Unable to map the following column(s) to MNE:"
-        for wr in warnings_list:
-            try:
-                msg = str(wr.message)
-            except Exception:
-                continue
-            if header not in msg:
-                continue
-            lines = msg.splitlines()
-            # Find the header line, then parse subsequent lines as entries
             try:
-                idx = next(i for i, ln in enumerate(lines) if header in ln)
-            except StopIteration:
-                idx = -1
-            for line in lines[idx + 1 :]:
-                line = line.strip()
-                if not line:
-                    continue
-                # Pattern:  <col>(optional note): <value>
-                # Examples: "gender: F", "Ethnicity: Indian", "foo (ignored): bar"
-                m = re.match(r"^([^:]+?)(?:\s*\([^)]*\))?\s*:\s*(.*)$", line)
-                if not m:
-                    continue
-                col = m.group(1).strip()
-                val = m.group(2).strip()
-                # Keep original column names as provided to stay agnostic
-                if col and col not in extras:
-                    extras[col] = val
-        return extras
-    # === BaseDataset and PyTorch Dataset interface ===
-    def __getitem__(self, index):
-        """Main function to access a sample from the dataset."""
-        X = self.raw[:, index][0]
-        y = None
-        if self.target_name is not None:
-            y = self.description[self.target_name]
-        if isinstance(y, pd.Series):
-            y = y.to_list()
-        if self.transform is not None:
-            X = self.transform(X)
-        return X, y
+                # mne-bids can emit noisy warnings to stderr; keep user logs clean
+                _stderr_buffer = io.StringIO()
+                with redirect_stderr(_stderr_buffer):
+                    self._raw = mne_bids.read_raw_bids(
+                        bids_path=self.bidspath, verbose="ERROR"
+                    )
+                # Enrich Raw.info and description with participants.tsv extras
+                enrich_from_participants(
+                    self.bids_root, self.bidspath, self._raw, self.description
+                )
+            except Exception as e:
+                logger.error(
+                    f"Error while reading BIDS file: {self.bidspath}\n"
+                    "This may be due to a missing or corrupted file.\n"
+                    "Please check the file and try again.\n"
+                    "Usually erasing the local cache and re-downloading helps.\n"
+                    f"`rm {self.bidspath}`"
+                )
+                logger.error(f"Exception: {e}")
+                logger.error(traceback.format_exc())
+                raise e
     def __len__(self) -> int:
         """Return the number of samples in the dataset."""
@@ -426,13 +243,16 @@ class EEGDashBaseRaw(BaseRaw):
             ch_types.append(chtype)
         info = mne.create_info(ch_names=ch_names, sfreq=sfreq, ch_types=ch_types)
-        self.s3file = self._get_s3path(input_fname)
+        self.s3file = downloader.get_s3path(self._AWS_BUCKET, input_fname)
         self.cache_dir = Path(cache_dir) if cache_dir else get_default_cache_dir()
         self.filecache = self.cache_dir / input_fname
         self.bids_dependencies = bids_dependencies
         if preload and not os.path.exists(self.filecache):
-            self._download_s3()
+            self.filecache = downloader.download_s3_file(
+                self.s3file, self.filecache, self.s3_open_neuro
+            )
+            self.filenames = [self.filecache]
             preload = self.filecache
         super().__init__(
@@ -443,35 +263,24 @@ class EEGDashBaseRaw(BaseRaw):
             verbose=verbose,
         )
-    def _get_s3path(self, filepath):
-        return f"{self._AWS_BUCKET}/{filepath}"
-    def _download_s3(self) -> None:
-        self.filecache.parent.mkdir(parents=True, exist_ok=True)
-        filesystem = s3fs.S3FileSystem(
-            anon=True, client_kwargs={"region_name": "us-east-2"}
-        )
-        filesystem.download(self.s3file, self.filecache)
-        self.filenames = [self.filecache]
-    def _download_dependencies(self):
-        filesystem = s3fs.S3FileSystem(
-            anon=True, client_kwargs={"region_name": "us-east-2"}
-        )
-        for dep in self.bids_dependencies:
-            s3path = self._get_s3path(dep)
-            filepath = self.cache_dir / dep
-            if not filepath.exists():
-                filepath.parent.mkdir(parents=True, exist_ok=True)
-                filesystem.download(s3path, filepath)
     def _read_segment(
         self, start=0, stop=None, sel=None, data_buffer=None, *, verbose=None
     ):
         if not os.path.exists(self.filecache):  # not preload
-            if self.bids_dependencies:
-                self._download_dependencies()
-            self._download_s3()
+            if self.bids_dependencies:  # this is use only to sidecars for now
+                downloader.download_dependencies(
+                    s3_bucket=self._AWS_BUCKET,
+                    bids_dependencies=self.bids_dependencies,
+                    bids_dependencies_original=None,
+                    cache_dir=self.cache_dir,
+                    dataset_folder=self.filecache,
+                    record={},
+                    s3_open_neuro=self.s3_open_neuro,
+                )
+            self.filecache = downloader.download_s3_file(
+                self.s3file, self.filecache, self.s3_open_neuro
+            )
+            self.filenames = [self.filecache]
         else:  # not preload and file is not cached
             self.filenames = [self.filecache]
         return super()._read_segment(start, stop, sel, data_buffer, verbose=verbose)

eegdash/dataset/dataset.py CHANGED Viewed

@@ -1,15 +1,15 @@
-import logging
 from pathlib import Path
-from mne.utils import warn
+from rich.console import Console
+from rich.panel import Panel
+from rich.text import Text
 from ..api import EEGDashDataset
 from ..bids_eeg_metadata import build_query_from_kwargs
 from ..const import RELEASE_TO_OPENNEURO_DATASET_MAP, SUBJECT_MINI_RELEASE_MAP
+from ..logging import logger
 from .registry import register_openneuro_datasets
-logger = logging.getLogger("eegdash")
 class EEGChallengeDataset(EEGDashDataset):
     """EEG 2025 Challenge dataset helper.
@@ -23,8 +23,6 @@ class EEGChallengeDataset(EEGDashDataset):
     ----------
     release : str
         Release name. One of ["R1", ..., "R11"].
-    cache_dir : str
-        Local cache directory for data files.
     mini : bool, default True
         If True, restrict subjects to the challenge mini subset.
     query : dict | None
@@ -123,24 +121,32 @@ class EEGChallengeDataset(EEGDashDataset):
         else:
             s3_bucket = f"{s3_bucket}/{release}_L100_bdf"
-        warn(
-            "\n\n"
-            "[EEGChallengeDataset] EEG 2025 Competition Data Notice:\n"
-            "-------------------------------------------------------\n"
+        message_text = Text.from_markup(
             "This object loads the HBN dataset that has been preprocessed for the EEG Challenge:\n"
-            "  - Downsampled from 500Hz to 100Hz\n"
-            "  - Bandpass filtered (0.5–50 Hz)\n"
-            "\n"
-            "For full preprocessing details, see:\n"
-            "  https://github.com/eeg2025/downsample-datasets\n"
-            "\n"
-            "IMPORTANT: The data accessed via `EEGChallengeDataset` is NOT identical to what you get from `EEGDashDataset` directly.\n"
-            "If you are participating in the competition, always use `EEGChallengeDataset` to ensure consistency with the challenge data.\n"
-            "\n",
-            UserWarning,
-            module="eegdash",
+            "  * Downsampled from 500Hz to 100Hz\n"
+            "  * Bandpass filtered (0.5-50 Hz)\n\n"
+            "For full preprocessing applied for competition details, see:\n"
+            "  [link=https://github.com/eeg2025/downsample-datasets]https://github.com/eeg2025/downsample-datasets[/link]\n\n"
+            "The HBN dataset have some preprocessing applied by the HBN team:\n"
+            "  * Re-reference (Cz Channel)\n\n"
+            "[bold red]IMPORTANT[/bold red]: The data accessed via `EEGChallengeDataset` is [u]NOT[/u] identical to what you get from [link=https://github.com/sccn/EEGDash/blob/develop/eegdash/api.py]EEGDashDataset[/link] directly.\n"
+            "If you are participating in the competition, always use `EEGChallengeDataset` to ensure consistency with the challenge data."
+        )
+        warning_panel = Panel(
+            message_text,
+            title="[yellow]EEG 2025 Competition Data Notice[/yellow]",
+            subtitle="[cyan]Source: EEGChallengeDataset[/cyan]",
+            border_style="yellow",
         )
+        # Render the panel directly to the console so it displays in IPython/terminals
+        try:
+            Console().print(warning_panel)
+        except Exception:
+            warning_message = str(message_text)
+            logger.warning(warning_message)
         super().__init__(
             dataset=RELEASE_TO_OPENNEURO_DATASET_MAP[release],
             query=query,

eegdash/downloader.py ADDED Viewed

@@ -0,0 +1,176 @@
+import re
+import tempfile
+from pathlib import Path
+from typing import Any
+from urllib.parse import urlsplit
+import mne
+import numpy as np
+import s3fs
+import xarray as xr
+from fsspec.callbacks import TqdmCallback
+def get_s3_filesystem():
+    """Build the anonymous ``s3fs.S3FileSystem`` client used by this module.
+    The client is created with ``anon=True`` and the region pinned to
+    ``us-east-2``.
+    """
+    client_options = {"region_name": "us-east-2"}
+    return s3fs.S3FileSystem(anon=True, client_kwargs=client_options)
+def get_s3path(s3_bucket: str, filepath: str) -> str:
+    """Join a bucket prefix and a relative file path with a single ``/``.
+    Both parts are inserted verbatim; no slash normalisation is performed.
+    """
+    return "{}/{}".format(s3_bucket, filepath)
+def download_s3_file(s3_path: str, local_path: Path, s3_open_neuro: bool):
+    """Fetch one recording from S3 and return the local path it was written to.
+    When ``s3_open_neuro`` is false the remote key is rewritten first: the
+    first ``dsNNNNNN/`` path component is removed and a ``.set`` key is
+    replaced by its ``.bdf`` counterpart, in which case the returned local
+    path carries the ``.bdf`` suffix as well. The parent directory of the
+    local path is created if needed.
+    """
+    fs = get_s3_filesystem()
+    remote, target = s3_path, local_path
+    if not s3_open_neuro:
+        # Strip only the first "dsNNNNNN/" component of the key.
+        remote = re.sub(r"(^|/)ds\d{6}/", r"\1", remote, count=1)
+        # TODO: remove this hack when competition is over
+        if remote.endswith(".set"):
+            remote = remote[: -len(".set")] + ".bdf"
+            target = target.with_suffix(".bdf")
+    target.parent.mkdir(parents=True, exist_ok=True)
+    _filesystem_get(filesystem=fs, s3path=remote, filepath=target)
+    return target
+def download_dependencies(
+    s3_bucket: str,
+    bids_dependencies: list[str],
+    bids_dependencies_original: "list[str] | None",
+    cache_dir: Path,
+    dataset_folder: Path,
+    record: dict[str, Any],
+    s3_open_neuro: bool,
+):
+    """Download all BIDS dependency files from S3 and cache them locally.
+    Parameters
+    ----------
+    s3_bucket : str
+        Bucket prefix each dependency key is appended to.
+    bids_dependencies : list of str
+        Dependency keys used to build the S3 paths.
+    bids_dependencies_original : list of str | None
+        Keys used to build the local cache paths when ``s3_open_neuro`` is
+        false, index-aligned with ``bids_dependencies``. ``None`` means
+        "same as ``bids_dependencies``".
+    cache_dir : Path
+        Root directory of the local cache.
+    dataset_folder : Path
+        Folder, relative to ``cache_dir``, that receives the files.
+    record : dict
+        Metadata record; only its ``"dataset"`` key is read, to drop a
+        leading dataset component from the local path.
+    s3_open_neuro : bool
+        When false, ``.set`` entries are fetched and stored as ``.bdf``.
+    """
+    filesystem = get_s3_filesystem()
+    # Some callers have no separate "original" listing and pass None; use the
+    # dependency list itself rather than failing on ``None[i]`` below.
+    if bids_dependencies_original is None:
+        bids_dependencies_original = bids_dependencies
+    for i, dep in enumerate(bids_dependencies):
+        if not s3_open_neuro:
+            # The non-OpenNeuro bucket is addressed with .bdf keys, not .set.
+            if dep.endswith(".set"):
+                dep = dep[:-4] + ".bdf"
+        s3path = get_s3path(s3_bucket, dep)
+        if not s3_open_neuro:
+            # The local layout is derived from the original (unstripped) key.
+            dep = bids_dependencies_original[i]
+        dep_path = Path(dep)
+        if dep_path.parts and dep_path.parts[0] == record.get("dataset"):
+            # Avoid repeating the dataset name: dataset_folder replaces it.
+            dep_local = Path(dataset_folder, *dep_path.parts[1:])
+        else:
+            dep_local = Path(dataset_folder) / dep_path
+        filepath = cache_dir / dep_local
+        if not s3_open_neuro:
+            if filepath.suffix == ".set":
+                filepath = filepath.with_suffix(".bdf")
+        # Files already present in the cache are not downloaded again.
+        if not filepath.exists():
+            filepath.parent.mkdir(parents=True, exist_ok=True)
+            _filesystem_get(filesystem=filesystem, s3path=s3path, filepath=filepath)
+def _filesystem_get(filesystem: s3fs.S3FileSystem, s3path: str, filepath: Path):
+    """Copy ``s3path`` to ``filepath`` with a tqdm progress bar; return ``filepath``."""
+    remote_info = filesystem.info(s3path)
+    # The object size is looked up under "size" first, then "Size".
+    total_bytes = remote_info.get("size") or remote_info.get("Size")
+    bar_options = {
+        "desc": f"Downloading {Path(s3path).name}",
+        "unit": "B",
+        "unit_scale": True,
+        "unit_divisor": 1024,
+        "dynamic_ncols": True,
+        "leave": True,
+        "mininterval": 0.2,
+        "smoothing": 0.1,
+        "miniters": 1,
+        "bar_format": "{desc}: {percentage:3.0f}%|{bar}| {n_fmt}/{total_fmt} "
+        "[{elapsed}<{remaining}, {rate_fmt}]",
+    }
+    progress = TqdmCallback(size=total_bytes, tqdm_kwargs=bar_options)
+    # The local destination is handed over as a plain string.
+    filesystem.get(s3path, str(filepath), callback=progress)
+    return filepath
+def load_eeg_from_s3(s3path: str):
+    """Load EEG data from an S3 URI into an ``xarray.DataArray``.
+    Preserves the original filename, downloads sidecar files when applicable
+    (e.g., ``.fdt`` for EEGLAB, ``.vmrk``/``.eeg`` for BrainVision), and reads
+    the local copy with ``mne.io.read_raw``.
+    Parameters
+    ----------
+    s3path : str
+        An S3 URI (should start with "s3://").
+    Returns
+    -------
+    xr.DataArray
+        EEG data with dimensions ``("channel", "time")``. The ``time``
+        coordinate is in seconds, with sample ``k`` located at ``k / sfreq``.
+    Raises
+    ------
+    ValueError
+        If the file extension is unsupported.
+    """
+    filesystem = get_s3_filesystem()
+    parsed = urlsplit(s3path)
+    s3_key = parsed.path  # e.g., "/dsXXXX/sub-.../..._eeg.set"
+    basename = Path(s3_key).name
+    ext = Path(basename).suffix.lower()
+    # Everything lands in one temp dir so sidecars sit next to the main file
+    with tempfile.TemporaryDirectory() as tmpdir:
+        # Keep the S3 base name so the reader can locate the sidecars
+        local_main = Path(tmpdir) / basename
+        _copy_s3_object(filesystem, s3path, local_main)
+        # Determine and fetch any required sidecars
+        sidecars: list[str] = []
+        if ext == ".set":  # EEGLAB
+            sidecars = [".fdt"]
+        elif ext == ".vhdr":  # BrainVision
+            sidecars = [".vmrk", ".eeg", ".dat", ".raw"]
+        for sc_ext in sidecars:
+            sc_key = s3_key[: -len(ext)] + sc_ext
+            sc_uri = f"s3://{parsed.netloc}{sc_key}"
+            try:
+                # If the sidecar exists, download it next to the main file
+                if filesystem.info(sc_uri):
+                    _copy_s3_object(
+                        filesystem, sc_uri, Path(tmpdir) / Path(sc_key).name
+                    )
+            except Exception:
+                # Deliberately best effort: an absent or unreadable sidecar
+                # is skipped without failing the whole load
+                continue
+        # preload=True pulls the samples into memory before tmpdir is removed
+        raw = mne.io.read_raw(str(local_main), preload=True, verbose=False)
+        data = raw.get_data()
+        fs = raw.info["sfreq"]
+        # Sample k sits at k / fs. An endpoint-inclusive linspace over
+        # [0, n / fs] would stretch the spacing to n / ((n - 1) * fs).
+        time_steps = np.arange(data.shape[1]) / fs
+        channel_names = raw.ch_names
+        return xr.DataArray(
+            data=data,
+            dims=["channel", "time"],
+            coords={"time": time_steps, "channel": channel_names},
+        )
+def _copy_s3_object(filesystem, s3_uri: str, local_file: Path, chunk_size: int = 1 << 20):
+    """Stream one S3 object to ``local_file`` in ``chunk_size``-byte pieces."""
+    with (
+        filesystem.open(s3_uri, mode="rb") as fsrc,
+        open(local_file, "wb") as fdst,
+    ):
+        # Chunked copy avoids holding the whole recording in memory at once
+        for chunk in iter(lambda: fsrc.read(chunk_size), b""):
+            fdst.write(chunk)

eegdash 0.3.9.dev182388821__py3-none-any.whl → 0.4.0.dev132__py3-none-any.whl

Potentially problematic release.

eegdash 0.3.9.dev182388821py3-none-any.whl → 0.4.0.dev132py3-none-any.whl