ezmsg-learn 1.1.0 (ezmsg_learn-1.1.0-py3-none-any.whl)

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (38)
  1. ezmsg/learn/__init__.py +2 -0
  2. ezmsg/learn/__version__.py +34 -0
  3. ezmsg/learn/dim_reduce/__init__.py +0 -0
  4. ezmsg/learn/dim_reduce/adaptive_decomp.py +274 -0
  5. ezmsg/learn/dim_reduce/incremental_decomp.py +173 -0
  6. ezmsg/learn/linear_model/__init__.py +1 -0
  7. ezmsg/learn/linear_model/adaptive_linear_regressor.py +12 -0
  8. ezmsg/learn/linear_model/cca.py +1 -0
  9. ezmsg/learn/linear_model/linear_regressor.py +9 -0
  10. ezmsg/learn/linear_model/sgd.py +9 -0
  11. ezmsg/learn/linear_model/slda.py +12 -0
  12. ezmsg/learn/model/__init__.py +0 -0
  13. ezmsg/learn/model/cca.py +122 -0
  14. ezmsg/learn/model/mlp.py +127 -0
  15. ezmsg/learn/model/mlp_old.py +49 -0
  16. ezmsg/learn/model/refit_kalman.py +369 -0
  17. ezmsg/learn/model/rnn.py +160 -0
  18. ezmsg/learn/model/transformer.py +175 -0
  19. ezmsg/learn/nlin_model/__init__.py +1 -0
  20. ezmsg/learn/nlin_model/mlp.py +10 -0
  21. ezmsg/learn/process/__init__.py +0 -0
  22. ezmsg/learn/process/adaptive_linear_regressor.py +142 -0
  23. ezmsg/learn/process/base.py +154 -0
  24. ezmsg/learn/process/linear_regressor.py +95 -0
  25. ezmsg/learn/process/mlp_old.py +188 -0
  26. ezmsg/learn/process/refit_kalman.py +403 -0
  27. ezmsg/learn/process/rnn.py +245 -0
  28. ezmsg/learn/process/sgd.py +117 -0
  29. ezmsg/learn/process/sklearn.py +241 -0
  30. ezmsg/learn/process/slda.py +110 -0
  31. ezmsg/learn/process/ssr.py +374 -0
  32. ezmsg/learn/process/torch.py +362 -0
  33. ezmsg/learn/process/transformer.py +215 -0
  34. ezmsg/learn/util.py +67 -0
  35. ezmsg_learn-1.1.0.dist-info/METADATA +30 -0
  36. ezmsg_learn-1.1.0.dist-info/RECORD +38 -0
  37. ezmsg_learn-1.1.0.dist-info/WHEEL +4 -0
  38. ezmsg_learn-1.1.0.dist-info/licenses/LICENSE +21 -0
ezmsg/learn/process/slda.py
@@ -0,0 +1,110 @@
+import typing
+
+import ezmsg.core as ez
+import numpy as np
+from ezmsg.baseproc import (
+    BaseStatefulTransformer,
+    BaseTransformerUnit,
+    processor_state,
+)
+from ezmsg.util.messages.axisarray import AxisArray
+from ezmsg.util.messages.util import replace
+from sklearn.discriminant_analysis import LinearDiscriminantAnalysis as LDA
+
+from ..util import ClassifierMessage
+
+
+class SLDASettings(ez.Settings):
+    settings_path: str
+    axis: str = "time"
+
+
+@processor_state
+class SLDAState:
+    lda: LDA
+    out_template: typing.Optional[ClassifierMessage] = None
+
+
+class SLDATransformer(BaseStatefulTransformer[SLDASettings, AxisArray, ClassifierMessage, SLDAState]):
+    def _reset_state(self, message: AxisArray) -> None:
+        if self.settings.settings_path[-4:] == ".mat":
+            # Expects a very specific format from a specific project. Not for general use.
+            import scipy.io as sio
+
+            matlab_sLDA = sio.loadmat(self.settings.settings_path, squeeze_me=True)
+            temp_weights = matlab_sLDA["weights"][1, 1:]
+            temp_intercept = matlab_sLDA["weights"][1, 0]
+
+            # Create weights and use zeros for channels we do not keep.
+            channels = matlab_sLDA["channels"] - 4
+            channels -= channels[0]  # Offsets are wrong somehow.
+            n_channels = message.data.shape[message.dims.index("ch")]
+            valid_indices = [ch for ch in channels if ch < n_channels]
+            full_weights = np.zeros(n_channels)
+            full_weights[valid_indices] = temp_weights[: len(valid_indices)]
+
+            lda = LDA(solver="lsqr", shrinkage="auto")
+            lda.classes_ = np.asarray([0, 1])
+            lda.coef_ = np.expand_dims(full_weights, axis=0)
+            lda.intercept_ = temp_intercept  # TODO: Is this supposed to be per-channel? Why the [1, 0]?
+            self.state.lda = lda
+            # mean = matlab_sLDA['mXtrain']
+            # std = matlab_sLDA['sXtrain']
+            # lags = matlab_sLDA['lags'] + 1
+        else:
+            import pickle
+
+            with open(self.settings.settings_path, "rb") as f:
+                self.state.lda = pickle.load(f)
+
+        # Create template ClassifierMessage using lda.classes_
+        out_labels = self.state.lda.classes_.tolist()
+        zero_shape = (0, len(out_labels))
+        self.state.out_template = ClassifierMessage(
+            data=np.zeros(zero_shape, dtype=message.data.dtype),
+            dims=[self.settings.axis, "classes"],
+            axes={
+                self.settings.axis: message.axes[self.settings.axis],
+                "classes": AxisArray.CoordinateAxis(data=np.array(out_labels), dims=["classes"]),
+            },
+            labels=out_labels,
+            key=message.key,
+        )
+
+    def _process(self, message: AxisArray) -> ClassifierMessage:
+        samp_ax_idx = message.dims.index(self.settings.axis)
+        X = np.moveaxis(message.data, samp_ax_idx, 0)
+
+        if X.shape[0]:
+            if isinstance(self.settings.settings_path, str) and self.settings.settings_path[-4:] == ".mat":
+                # Assumes F-contiguous weights
+                pred_probas = []
+                for samp in X:
+                    tmp = samp.flatten(order="F") * 1e-6
+                    tmp = np.expand_dims(tmp, axis=0)
+                    probas = self.state.lda.predict_proba(tmp)
+                    pred_probas.append(probas)
+                pred_probas = np.concatenate(pred_probas, axis=0)
+            else:
+                # This creates a copy.
+                X = X.reshape(X.shape[0], -1)
+                pred_probas = self.state.lda.predict_proba(X)
+
+            update_ax = self.state.out_template.axes[self.settings.axis]
+            update_ax.offset = message.axes[self.settings.axis].offset
+
+            return replace(
+                self.state.out_template,
+                data=pred_probas,
+                axes={
+                    **self.state.out_template.axes,
+                    # `replace` will copy the minimal set of fields
+                    self.settings.axis: replace(update_ax, offset=update_ax.offset),
+                },
+            )
+        else:
+            return self.state.out_template
+
+
+class SLDA(BaseTransformerUnit[SLDASettings, AxisArray, ClassifierMessage, SLDATransformer]):
+    SETTINGS = SLDASettings
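
For orientation, here is a minimal offline sketch of driving the SLDA transformer above. It assumes a fitted, pickled scikit-learn LDA at the hypothetical path ``my_lda.pkl``, and that ``BaseStatefulTransformer`` instances are callable with a message (the usual ezmsg-baseproc convention); treat it as illustration, not part of the package::

    import numpy as np
    from ezmsg.util.messages.axisarray import AxisArray

    from ezmsg.learn.process.slda import SLDASettings, SLDATransformer

    # Hypothetical model path; any pickled, fitted sklearn LDA with classes_ works.
    xf = SLDATransformer(settings=SLDASettings(settings_path="my_lda.pkl", axis="time"))

    msg = AxisArray(
        data=np.random.randn(10, 8),  # 10 time samples x 8 channels
        dims=["time", "ch"],
        axes={"time": AxisArray.TimeAxis(fs=100.0)},
        key="demo",
    )
    out = xf(msg)  # ClassifierMessage with (time, classes) probabilities
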
ezmsg/learn/process/ssr.py
@@ -0,0 +1,374 @@
+"""Self-supervised regression framework and LRR implementation.
+
+This module provides a general framework for self-supervised channel
+regression via :class:`SelfSupervisedRegressionTransformer`, and a
+concrete implementation — Linear Regression Rereferencing (LRR) — via
+:class:`LRRTransformer`.
+
+**Framework.** The base class accumulates the channel covariance
+``C = X^T X`` and solves per-cluster ridge regressions to obtain a weight
+matrix *W*. Subclasses define what to *do* with *W* by implementing
+:meth:`~SelfSupervisedRegressionTransformer._on_weights_updated` and
+:meth:`~SelfSupervisedRegressionTransformer._process`.
+
+**LRR.** For each channel *c*, predict it from the other channels in its
+cluster via ridge regression, then subtract the prediction::
+
+    y = X - X @ W = X @ (I - W)
+
+The effective weight matrix ``I - W`` is passed to
+:class:`~ezmsg.sigproc.affinetransform.AffineTransformTransformer`, which
+automatically exploits block-diagonal structure when ``channel_clusters``
+are provided.
+
+**Fitting.** Given data matrix *X* of shape ``(samples, channels)``, the
+sufficient statistic is the channel covariance ``C = X^T X``. When
+``incremental=True`` (default), *C* is accumulated across
+:meth:`~SelfSupervisedRegressionTransformer.partial_fit` calls.
+
+**Solving.** Within each cluster the weight matrix *W* is obtained from
+the inverse of the (ridge-regularised) cluster covariance
+``C_inv = (C_cluster + lambda * I)^{-1}`` using the block-inverse identity::
+
+    W[:, c] = -C_inv[:, c] / C_inv[c, c], diag(W) = 0
+
+This replaces the naive per-channel Cholesky loop with a single matrix
+inverse per cluster, keeping the linear algebra in the source array
+namespace so that GPU-backed arrays benefit from device-side computation.
+"""
+
+from __future__ import annotations
+
+import os
+import typing
+from abc import abstractmethod
+from pathlib import Path
+
+import ezmsg.core as ez
+import numpy as np
+from array_api_compat import get_namespace
+from ezmsg.baseproc import (
+    BaseAdaptiveTransformer,
+    BaseAdaptiveTransformerUnit,
+    processor_state,
+)
+from ezmsg.baseproc.protocols import SettingsType, StateType
+from ezmsg.sigproc.affinetransform import (
+    AffineTransformSettings,
+    AffineTransformTransformer,
+)
+from ezmsg.sigproc.util.array import array_device, xp_create
+from ezmsg.util.messages.axisarray import AxisArray
+
+# ---------------------------------------------------------------------------
+# Base: Self-supervised regression
+# ---------------------------------------------------------------------------
+
+
+class SelfSupervisedRegressionSettings(ez.Settings):
+    """Settings common to all self-supervised regression modes."""
+
+    weights: np.ndarray | str | Path | None = None
+    """Pre-calculated weight matrix *W* or path to a CSV file (``np.loadtxt``
+    compatible). If provided, the transformer is ready immediately."""
+
+    axis: str | None = None
+    """Channel axis name. ``None`` defaults to the last dimension."""
+
+    channel_clusters: list[list[int]] | None = None
+    """Per-cluster regression. ``None`` treats all channels as one cluster."""
+
+    ridge_lambda: float = 0.0
+    """Ridge (L2) regularisation parameter."""
+
+    incremental: bool = True
+    """When ``True``, accumulate ``X^T X`` across :meth:`partial_fit` calls.
+    When ``False``, each call replaces the previous statistics."""
+
+
+@processor_state
+class SelfSupervisedRegressionState:
+    cxx: object | None = None  # Array API; namespace matches source data.
+    n_samples: int = 0
+    weights: object | None = None  # Array API; namespace matches cxx.
+
+
+class SelfSupervisedRegressionTransformer(
+    BaseAdaptiveTransformer[SettingsType, AxisArray, AxisArray, StateType],
+    typing.Generic[SettingsType, StateType],
+):
+    """Abstract base for self-supervised regression transformers.
+
+    Subclasses must implement:
+
+    * :meth:`_on_weights_updated` — called whenever the weight matrix *W* is
+      (re)computed, so the subclass can build whatever internal transform it
+      needs (e.g. ``I - W`` for LRR).
+    * :meth:`_process` — the per-message transform step.
+    """
+
+    # -- message hash / state management ------------------------------------
+
+    def _hash_message(self, message: AxisArray) -> int:
+        axis = self.settings.axis or message.dims[-1]
+        axis_idx = message.get_axis_idx(axis)
+        return hash((message.key, message.data.shape[axis_idx]))
+
+    def _reset_state(self, message: AxisArray) -> None:
+        axis = self.settings.axis or message.dims[-1]
+        axis_idx = message.get_axis_idx(axis)
+        n_channels = message.data.shape[axis_idx]
+
+        self._validate_clusters(n_channels)
+        self._state.cxx = None
+        self._state.n_samples = 0
+        self._state.weights = None
+
+        # If pre-calculated weights are provided, load and go.
+        weights = self.settings.weights
+        if weights is not None:
+            if isinstance(weights, str):
+                weights = Path(os.path.abspath(os.path.expanduser(weights)))
+            if isinstance(weights, Path):
+                weights = np.loadtxt(weights, delimiter=",")
+            weights = np.asarray(weights, dtype=np.float64)
+            self._state.weights = weights
+            self._on_weights_updated()
+
+    # -- cluster validation --------------------------------------------------
+
+    def _validate_clusters(self, n_channels: int) -> None:
+        """Raise if any cluster index is out of range."""
+        clusters = self.settings.channel_clusters
+        if clusters is None:
+            return
+        all_indices = np.concatenate([np.asarray(g) for g in clusters])
+        if np.any((all_indices < 0) | (all_indices >= n_channels)):
+            raise ValueError(f"channel_clusters contains out-of-range indices (valid range: 0..{n_channels - 1})")
+
+    # -- weight solving ------------------------------------------------------
+
+    def _solve_weights(self, cxx):
+        """Solve all per-channel ridge regressions via matrix inverse.
+
+        Uses the block-inverse identity: for target channel *c* with
+        references *r*, ``w_c = -C_inv[r, c] / C_inv[c, c]`` where
+        ``C_inv = (C_cluster + λI)⁻¹``. This replaces the per-channel
+        Cholesky loop with one matrix inverse per cluster.
+
+        All computation stays in the source array namespace so that
+        GPU-backed arrays benefit from device-side execution. Cluster
+        results are scattered into the full matrix via a selection-matrix
+        multiply (``S @ W_cluster @ S^T``) to avoid numpy fancy indexing.
+
+        Returns weight matrix *W* in the same namespace as *cxx*, with
+        ``diag(W) == 0``.
+        """
+        xp = get_namespace(cxx)
+        dev = array_device(cxx)
+        n = cxx.shape[0]
+
+        clusters = self.settings.channel_clusters
+        if clusters is None:
+            clusters = [list(range(n))]
+
+        W = xp_create(xp.zeros, (n, n), dtype=cxx.dtype, device=dev)
+        eye_n = xp_create(xp.eye, n, dtype=cxx.dtype, device=dev)
+
+        for cluster in clusters:
+            k = len(cluster)
+            if k <= 1:
+                continue
+
+            idx_xp = xp.asarray(cluster) if dev is None else xp.asarray(cluster, device=dev)
+            eye_k = xp_create(xp.eye, k, dtype=cxx.dtype, device=dev)
+
+            # Extract cluster sub-covariance (stays on device)
+            sub = xp.take(xp.take(cxx, idx_xp, axis=0), idx_xp, axis=1)
+
+            if self.settings.ridge_lambda > 0:
+                sub = sub + self.settings.ridge_lambda * eye_k
+
+            # One inverse per cluster
+            try:
+                sub_inv = xp.linalg.inv(sub)
+            except Exception:
+                sub_inv = xp.linalg.pinv(sub)
+
+            # Diagonal via element-wise product with identity
+            diag_vals = xp.sum(sub_inv * eye_k, axis=0)
+
+            # w_c = -C_inv[:, c] / C_inv[c, c], vectorised over all c
+            W_cluster = -(sub_inv / xp.reshape(diag_vals, (1, k)))
+
+            # Zero the diagonal
+            W_cluster = W_cluster * (1.0 - eye_k)
+
+            # Scatter into full W
+            if k == n:
+                W = W + W_cluster
+            else:
+                # Selection matrix: columns of eye(n) at cluster indices
+                S = xp.take(eye_n, idx_xp, axis=1)  # (n, k)
+                W = W + xp.matmul(S, xp.matmul(W_cluster, xp.permute_dims(S, (1, 0))))
+
+        return W
+
+    # -- partial_fit (self-supervised, accepts AxisArray) --------------------
+
+    def partial_fit(self, message: AxisArray) -> None:  # type: ignore[override]
+        xp = get_namespace(message.data)
+
+        if xp.any(xp.isnan(message.data)):
+            return
+
+        # Hash check / state reset
+        msg_hash = self._hash_message(message)
+        if self._hash != msg_hash:
+            self._reset_state(message)
+            self._hash = msg_hash
+
+        axis = self.settings.axis or message.dims[-1]
+        axis_idx = message.get_axis_idx(axis)
+        data = message.data
+
+        # Move channel axis to last, flatten to 2-D
+        if axis_idx != data.ndim - 1:
+            perm = list(range(data.ndim))
+            perm.append(perm.pop(axis_idx))
+            data = xp.permute_dims(data, perm)
+
+        n_channels = data.shape[-1]
+        X = xp.reshape(data, (-1, n_channels))
+
+        # Covariance stays in the source namespace for accumulation.
+        cxx_new = xp.matmul(xp.permute_dims(X, (1, 0)), X)
+
+        if self.settings.incremental and self._state.cxx is not None:
+            self._state.cxx = self._state.cxx + cxx_new
+        else:
+            self._state.cxx = cxx_new
+        self._state.n_samples += int(X.shape[0])
+
+        self._state.weights = self._solve_weights(self._state.cxx)
+        self._on_weights_updated()
+
+    # -- convenience APIs ----------------------------------------------------
+
+    def fit(self, X: np.ndarray) -> None:
+        """Batch fit from a raw numpy array (samples x channels)."""
+        n_channels = X.shape[-1]
+        self._validate_clusters(n_channels)
+        X = np.asarray(X, dtype=np.float64).reshape(-1, n_channels)
+        self._state.cxx = X.T @ X
+        self._state.n_samples = X.shape[0]
+        self._state.weights = self._solve_weights(self._state.cxx)
+        self._on_weights_updated()
+
+    def fit_transform(self, message: AxisArray) -> AxisArray:
+        """Convenience: ``partial_fit`` then ``_process``."""
+        self.partial_fit(message)
+        return self._process(message)
+
+    # -- abstract hooks for subclasses ---------------------------------------
+
+    @abstractmethod
+    def _on_weights_updated(self) -> None:
+        """Called after ``self._state.weights`` has been set/updated.
+
+        Subclasses should build or refresh whatever internal transform
+        object they need for :meth:`_process`.
+        """
+        ...
+
+    @abstractmethod
+    def _process(self, message: AxisArray) -> AxisArray: ...
+
+
+# ---------------------------------------------------------------------------
+# Concrete: Linear Regression Rereferencing (LRR)
+# ---------------------------------------------------------------------------
+
+
+class LRRSettings(SelfSupervisedRegressionSettings):
+    """Settings for :class:`LRRTransformer`."""
+
+    min_cluster_size: int = 32
+    """Passed to :class:`AffineTransformTransformer` for the block-diagonal
+    merge threshold."""
+
+
+@processor_state
+class LRRState(SelfSupervisedRegressionState):
+    affine: AffineTransformTransformer | None = None
+
+
+class LRRTransformer(
+    SelfSupervisedRegressionTransformer[LRRSettings, LRRState],
+):
+    """Adaptive LRR transformer.
+
+    ``partial_fit`` accepts a plain :class:`AxisArray` (self-supervised),
+    and the transform step is delegated to an internal :class:`AffineTransformTransformer`.
+    """
+
+    # -- state management (clear own state, then delegate to base) ----------
+
+    def _reset_state(self, message: AxisArray) -> None:
+        self._state.affine = None
+        super()._reset_state(message)
+
+    # -- weights → affine transform -----------------------------------------
+
+    def _on_weights_updated(self) -> None:
+        xp = get_namespace(self._state.weights)
+        dev = array_device(self._state.weights)
+        n = self._state.weights.shape[0]
+        effective = xp_create(xp.eye, n, dtype=self._state.weights.dtype, device=dev) - self._state.weights
+
+        # Prefer in-place weight update when the affine transformer supports
+        # it (avoids a full _reset_state round-trip on every partial_fit).
+        if self._state.affine is not None:
+            self._state.affine.set_weights(effective)
+        else:
+            self._state.affine = AffineTransformTransformer(
+                AffineTransformSettings(
+                    weights=effective,
+                    axis=self.settings.axis,
+                    channel_clusters=self.settings.channel_clusters,
+                    min_cluster_size=self.settings.min_cluster_size,
+                )
+            )
+
+    # -- transform -----------------------------------------------------------
+
+    def _process(self, message: AxisArray) -> AxisArray:
+        if self._state.affine is None:
+            raise RuntimeError(
+                "LRRTransformer has not been fitted. Call partial_fit() or provide pre-calculated weights."
+            )
+        return self._state.affine(message)
+
+
+class LRRUnit(
+    BaseAdaptiveTransformerUnit[
+        LRRSettings,
+        AxisArray,
+        AxisArray,
+        LRRTransformer,
+    ],
+):
+    """ezmsg Unit wrapping :class:`LRRTransformer`.
+
+    Follows the :class:`BaseAdaptiveDecompUnit` pattern — accepts
+    :class:`AxisArray` (not :class:`SampleMessage`) for self-supervised
+    training via ``INPUT_SAMPLE``.
+    """
+
+    SETTINGS = LRRSettings
+
+    INPUT_SAMPLE = ez.InputStream(AxisArray)
+
+    @ez.subscriber(INPUT_SAMPLE)
+    async def on_sample(self, msg: AxisArray) -> None:
+        await self.processor.apartial_fit(msg)
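
To see why ``_solve_weights`` is valid, the block-inverse identity quoted in the module docstring can be checked against explicit per-channel ridge solves in plain NumPy. A standalone sketch with synthetic data and a single cluster (illustration only, not part of the package)::

    import numpy as np

    rng = np.random.default_rng(0)
    X = rng.standard_normal((1000, 6))  # (samples, channels)
    C = X.T @ X                         # channel covariance: the sufficient statistic
    lam = 1e-3                          # plays the role of ridge_lambda
    C_inv = np.linalg.inv(C + lam * np.eye(6))

    # Identity used by _solve_weights: W[:, c] = -C_inv[:, c] / C_inv[c, c], diag(W) = 0
    W = -(C_inv / np.diag(C_inv)[None, :])
    np.fill_diagonal(W, 0.0)

    # Explicit per-channel ridge: regress channel c on the remaining channels r.
    for c in range(6):
        r = [i for i in range(6) if i != c]
        w_c = np.linalg.solve(C[np.ix_(r, r)] + lam * np.eye(5), C[r, c])
        assert np.allclose(W[r, c], w_c)

    Y = X - X @ W  # LRR output: X @ (I - W)

The assertion holds because, for the partitioned matrix ``A = C + lam*I``, the column of ``A^{-1}`` belonging to channel *c* is proportional to the per-channel ridge solution, so one inverse per cluster recovers every channel's regression weights at once.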