PyPI - junifer - Versions diffs - 0.0.5.dev240__py3-none-any.whl → 0.0.6__py3-none-any.whl - Mend

junifer 0.0.5.dev240__py3-none-any.whl → 0.0.6__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (279)

junifer/__init__.py +2 -31
junifer/__init__.pyi +37 -0
junifer/_version.py +9 -4
junifer/api/__init__.py +3 -5
junifer/api/__init__.pyi +4 -0
junifer/api/decorators.py +14 -19
junifer/api/functions.py +165 -109
junifer/api/py.typed +0 -0
junifer/api/queue_context/__init__.py +2 -4
junifer/api/queue_context/__init__.pyi +5 -0
junifer/api/queue_context/gnu_parallel_local_adapter.py +22 -6
junifer/api/queue_context/htcondor_adapter.py +23 -6
junifer/api/queue_context/py.typed +0 -0
junifer/api/queue_context/tests/test_gnu_parallel_local_adapter.py +3 -3
junifer/api/queue_context/tests/test_htcondor_adapter.py +3 -3
junifer/api/tests/test_functions.py +168 -74
junifer/cli/__init__.py +24 -0
junifer/cli/__init__.pyi +3 -0
junifer/{api → cli}/cli.py +141 -125
junifer/cli/parser.py +235 -0
junifer/cli/py.typed +0 -0
junifer/{api → cli}/tests/test_cli.py +8 -8
junifer/{api/tests/test_api_utils.py → cli/tests/test_cli_utils.py} +5 -4
junifer/{api → cli}/tests/test_parser.py +2 -2
junifer/{api → cli}/utils.py +6 -16
junifer/configs/juseless/__init__.py +2 -2
junifer/configs/juseless/__init__.pyi +3 -0
junifer/configs/juseless/datagrabbers/__init__.py +2 -12
junifer/configs/juseless/datagrabbers/__init__.pyi +13 -0
junifer/configs/juseless/datagrabbers/ixi_vbm.py +2 -2
junifer/configs/juseless/datagrabbers/py.typed +0 -0
junifer/configs/juseless/datagrabbers/tests/test_ucla.py +2 -2
junifer/configs/juseless/datagrabbers/ucla.py +4 -4
junifer/configs/juseless/py.typed +0 -0
junifer/conftest.py +25 -0
junifer/data/__init__.py +2 -42
junifer/data/__init__.pyi +29 -0
junifer/data/_dispatch.py +248 -0
junifer/data/coordinates/__init__.py +9 -0
junifer/data/coordinates/__init__.pyi +5 -0
junifer/data/coordinates/_ants_coordinates_warper.py +104 -0
junifer/data/coordinates/_coordinates.py +385 -0
junifer/data/coordinates/_fsl_coordinates_warper.py +81 -0
junifer/data/{tests → coordinates/tests}/test_coordinates.py +26 -33
junifer/data/masks/__init__.py +9 -0
junifer/data/masks/__init__.pyi +6 -0
junifer/data/masks/_ants_mask_warper.py +177 -0
junifer/data/masks/_fsl_mask_warper.py +106 -0
junifer/data/masks/_masks.py +802 -0
junifer/data/{tests → masks/tests}/test_masks.py +67 -63
junifer/data/parcellations/__init__.py +9 -0
junifer/data/parcellations/__init__.pyi +6 -0
junifer/data/parcellations/_ants_parcellation_warper.py +166 -0
junifer/data/parcellations/_fsl_parcellation_warper.py +89 -0
junifer/data/parcellations/_parcellations.py +1388 -0
junifer/data/{tests → parcellations/tests}/test_parcellations.py +165 -295
junifer/data/pipeline_data_registry_base.py +76 -0
junifer/data/py.typed +0 -0
junifer/data/template_spaces.py +44 -79
junifer/data/tests/test_data_utils.py +1 -2
junifer/data/tests/test_template_spaces.py +8 -4
junifer/data/utils.py +109 -4
junifer/datagrabber/__init__.py +2 -26
junifer/datagrabber/__init__.pyi +27 -0
junifer/datagrabber/aomic/__init__.py +2 -4
junifer/datagrabber/aomic/__init__.pyi +5 -0
junifer/datagrabber/aomic/id1000.py +81 -52
junifer/datagrabber/aomic/piop1.py +83 -55
junifer/datagrabber/aomic/piop2.py +85 -56
junifer/datagrabber/aomic/py.typed +0 -0
junifer/datagrabber/aomic/tests/test_id1000.py +19 -12
junifer/datagrabber/aomic/tests/test_piop1.py +52 -18
junifer/datagrabber/aomic/tests/test_piop2.py +50 -17
junifer/datagrabber/base.py +22 -18
junifer/datagrabber/datalad_base.py +71 -34
junifer/datagrabber/dmcc13_benchmark.py +31 -18
junifer/datagrabber/hcp1200/__init__.py +2 -3
junifer/datagrabber/hcp1200/__init__.pyi +4 -0
junifer/datagrabber/hcp1200/datalad_hcp1200.py +3 -3
junifer/datagrabber/hcp1200/hcp1200.py +26 -15
junifer/datagrabber/hcp1200/py.typed +0 -0
junifer/datagrabber/hcp1200/tests/test_hcp1200.py +8 -2
junifer/datagrabber/multiple.py +14 -9
junifer/datagrabber/pattern.py +132 -96
junifer/datagrabber/pattern_validation_mixin.py +206 -94
junifer/datagrabber/py.typed +0 -0
junifer/datagrabber/tests/test_datalad_base.py +27 -12
junifer/datagrabber/tests/test_dmcc13_benchmark.py +28 -11
junifer/datagrabber/tests/test_multiple.py +48 -2
junifer/datagrabber/tests/test_pattern_datalad.py +1 -1
junifer/datagrabber/tests/test_pattern_validation_mixin.py +6 -6
junifer/datareader/__init__.py +2 -2
junifer/datareader/__init__.pyi +3 -0
junifer/datareader/default.py +6 -6
junifer/datareader/py.typed +0 -0
junifer/external/nilearn/__init__.py +2 -3
junifer/external/nilearn/__init__.pyi +4 -0
junifer/external/nilearn/junifer_connectivity_measure.py +25 -17
junifer/external/nilearn/junifer_nifti_spheres_masker.py +4 -4
junifer/external/nilearn/py.typed +0 -0
junifer/external/nilearn/tests/test_junifer_connectivity_measure.py +17 -16
junifer/external/nilearn/tests/test_junifer_nifti_spheres_masker.py +2 -3
junifer/markers/__init__.py +2 -38
junifer/markers/__init__.pyi +37 -0
junifer/markers/base.py +11 -14
junifer/markers/brainprint.py +12 -14
junifer/markers/complexity/__init__.py +2 -18
junifer/markers/complexity/__init__.pyi +17 -0
junifer/markers/complexity/complexity_base.py +9 -11
junifer/markers/complexity/hurst_exponent.py +7 -7
junifer/markers/complexity/multiscale_entropy_auc.py +7 -7
junifer/markers/complexity/perm_entropy.py +7 -7
junifer/markers/complexity/py.typed +0 -0
junifer/markers/complexity/range_entropy.py +7 -7
junifer/markers/complexity/range_entropy_auc.py +7 -7
junifer/markers/complexity/sample_entropy.py +7 -7
junifer/markers/complexity/tests/test_complexity_base.py +1 -1
junifer/markers/complexity/tests/test_hurst_exponent.py +5 -5
junifer/markers/complexity/tests/test_multiscale_entropy_auc.py +5 -5
junifer/markers/complexity/tests/test_perm_entropy.py +5 -5
junifer/markers/complexity/tests/test_range_entropy.py +5 -5
junifer/markers/complexity/tests/test_range_entropy_auc.py +5 -5
junifer/markers/complexity/tests/test_sample_entropy.py +5 -5
junifer/markers/complexity/tests/test_weighted_perm_entropy.py +5 -5
junifer/markers/complexity/weighted_perm_entropy.py +7 -7
junifer/markers/ets_rss.py +12 -11
junifer/markers/falff/__init__.py +2 -3
junifer/markers/falff/__init__.pyi +4 -0
junifer/markers/falff/_afni_falff.py +38 -45
junifer/markers/falff/_junifer_falff.py +16 -19
junifer/markers/falff/falff_base.py +7 -11
junifer/markers/falff/falff_parcels.py +9 -9
junifer/markers/falff/falff_spheres.py +8 -8
junifer/markers/falff/py.typed +0 -0
junifer/markers/falff/tests/test_falff_spheres.py +3 -1
junifer/markers/functional_connectivity/__init__.py +2 -12
junifer/markers/functional_connectivity/__init__.pyi +13 -0
junifer/markers/functional_connectivity/crossparcellation_functional_connectivity.py +9 -8
junifer/markers/functional_connectivity/edge_functional_connectivity_parcels.py +8 -8
junifer/markers/functional_connectivity/edge_functional_connectivity_spheres.py +7 -7
junifer/markers/functional_connectivity/functional_connectivity_base.py +13 -12
junifer/markers/functional_connectivity/functional_connectivity_parcels.py +8 -8
junifer/markers/functional_connectivity/functional_connectivity_spheres.py +7 -7
junifer/markers/functional_connectivity/py.typed +0 -0
junifer/markers/functional_connectivity/tests/test_edge_functional_connectivity_parcels.py +1 -2
junifer/markers/functional_connectivity/tests/test_edge_functional_connectivity_spheres.py +1 -2
junifer/markers/functional_connectivity/tests/test_functional_connectivity_parcels.py +6 -6
junifer/markers/functional_connectivity/tests/test_functional_connectivity_spheres.py +5 -5
junifer/markers/parcel_aggregation.py +22 -17
junifer/markers/py.typed +0 -0
junifer/markers/reho/__init__.py +2 -3
junifer/markers/reho/__init__.pyi +4 -0
junifer/markers/reho/_afni_reho.py +29 -35
junifer/markers/reho/_junifer_reho.py +13 -14
junifer/markers/reho/py.typed +0 -0
junifer/markers/reho/reho_base.py +7 -11
junifer/markers/reho/reho_parcels.py +10 -10
junifer/markers/reho/reho_spheres.py +9 -9
junifer/markers/sphere_aggregation.py +22 -17
junifer/markers/temporal_snr/__init__.py +2 -3
junifer/markers/temporal_snr/__init__.pyi +4 -0
junifer/markers/temporal_snr/py.typed +0 -0
junifer/markers/temporal_snr/temporal_snr_base.py +11 -10
junifer/markers/temporal_snr/temporal_snr_parcels.py +8 -8
junifer/markers/temporal_snr/temporal_snr_spheres.py +7 -7
junifer/markers/tests/test_ets_rss.py +3 -3
junifer/markers/tests/test_parcel_aggregation.py +24 -24
junifer/markers/tests/test_sphere_aggregation.py +6 -6
junifer/markers/utils.py +3 -3
junifer/onthefly/__init__.py +2 -1
junifer/onthefly/_brainprint.py +138 -0
junifer/onthefly/read_transform.py +5 -8
junifer/pipeline/__init__.py +2 -10
junifer/pipeline/__init__.pyi +13 -0
junifer/{markers/collection.py → pipeline/marker_collection.py} +8 -14
junifer/pipeline/pipeline_component_registry.py +294 -0
junifer/pipeline/pipeline_step_mixin.py +15 -11
junifer/pipeline/py.typed +0 -0
junifer/{markers/tests/test_collection.py → pipeline/tests/test_marker_collection.py} +2 -3
junifer/pipeline/tests/test_pipeline_component_registry.py +200 -0
junifer/pipeline/tests/test_pipeline_step_mixin.py +36 -37
junifer/pipeline/tests/test_update_meta_mixin.py +4 -4
junifer/pipeline/tests/test_workdir_manager.py +43 -0
junifer/pipeline/update_meta_mixin.py +21 -17
junifer/pipeline/utils.py +6 -6
junifer/pipeline/workdir_manager.py +19 -5
junifer/preprocess/__init__.py +2 -10
junifer/preprocess/__init__.pyi +11 -0
junifer/preprocess/base.py +10 -10
junifer/preprocess/confounds/__init__.py +2 -2
junifer/preprocess/confounds/__init__.pyi +3 -0
junifer/preprocess/confounds/fmriprep_confound_remover.py +243 -64
junifer/preprocess/confounds/py.typed +0 -0
junifer/preprocess/confounds/tests/test_fmriprep_confound_remover.py +121 -14
junifer/preprocess/py.typed +0 -0
junifer/preprocess/smoothing/__init__.py +2 -2
junifer/preprocess/smoothing/__init__.pyi +3 -0
junifer/preprocess/smoothing/_afni_smoothing.py +40 -40
junifer/preprocess/smoothing/_fsl_smoothing.py +22 -32
junifer/preprocess/smoothing/_nilearn_smoothing.py +35 -14
junifer/preprocess/smoothing/py.typed +0 -0
junifer/preprocess/smoothing/smoothing.py +11 -13
junifer/preprocess/warping/__init__.py +2 -2
junifer/preprocess/warping/__init__.pyi +3 -0
junifer/preprocess/warping/_ants_warper.py +136 -32
junifer/preprocess/warping/_fsl_warper.py +73 -22
junifer/preprocess/warping/py.typed +0 -0
junifer/preprocess/warping/space_warper.py +39 -11
junifer/preprocess/warping/tests/test_space_warper.py +5 -9
junifer/py.typed +0 -0
junifer/stats.py +5 -5
junifer/storage/__init__.py +2 -10
junifer/storage/__init__.pyi +11 -0
junifer/storage/base.py +47 -13
junifer/storage/hdf5.py +95 -33
junifer/storage/pandas_base.py +12 -11
junifer/storage/py.typed +0 -0
junifer/storage/sqlite.py +11 -11
junifer/storage/tests/test_hdf5.py +86 -4
junifer/storage/tests/test_sqlite.py +2 -2
junifer/storage/tests/test_storage_base.py +5 -2
junifer/storage/tests/test_utils.py +33 -7
junifer/storage/utils.py +95 -9
junifer/testing/__init__.py +2 -3
junifer/testing/__init__.pyi +4 -0
junifer/testing/datagrabbers.py +10 -11
junifer/testing/py.typed +0 -0
junifer/testing/registry.py +4 -7
junifer/testing/tests/test_testing_registry.py +9 -17
junifer/tests/test_stats.py +2 -2
junifer/typing/__init__.py +9 -0
junifer/typing/__init__.pyi +31 -0
junifer/typing/_typing.py +68 -0
junifer/utils/__init__.py +2 -12
junifer/utils/__init__.pyi +18 -0
junifer/utils/_config.py +110 -0
junifer/utils/_yaml.py +16 -0
junifer/utils/helpers.py +6 -6
junifer/utils/logging.py +117 -8
junifer/utils/py.typed +0 -0
junifer/{pipeline → utils}/singleton.py +19 -14
junifer/utils/tests/test_config.py +59 -0
{junifer-0.0.5.dev240.dist-info → junifer-0.0.6.dist-info}/METADATA +43 -38
junifer-0.0.6.dist-info/RECORD +350 -0
{junifer-0.0.5.dev240.dist-info → junifer-0.0.6.dist-info}/WHEEL +1 -1
junifer-0.0.6.dist-info/entry_points.txt +2 -0
junifer/api/parser.py +0 -118
junifer/data/coordinates.py +0 -408
junifer/data/masks.py +0 -670
junifer/data/parcellations.py +0 -1828
junifer/pipeline/registry.py +0 -177
junifer/pipeline/tests/test_registry.py +0 -150
junifer-0.0.5.dev240.dist-info/RECORD +0 -275
junifer-0.0.5.dev240.dist-info/entry_points.txt +0 -2
/junifer/{api → cli}/tests/data/gmd_mean.yaml +0 -0
/junifer/{api → cli}/tests/data/gmd_mean_htcondor.yaml +0 -0
/junifer/{api → cli}/tests/data/partly_cloudy_agg_mean_tian.yml +0 -0
/junifer/data/{VOIs → coordinates/VOIs}/meta/AutobiographicalMemory_VOIs.txt +0 -0
/junifer/data/{VOIs → coordinates/VOIs}/meta/CogAC_VOIs.txt +0 -0
/junifer/data/{VOIs → coordinates/VOIs}/meta/CogAR_VOIs.txt +0 -0
/junifer/data/{VOIs → coordinates/VOIs}/meta/DMNBuckner_VOIs.txt +0 -0
/junifer/data/{VOIs → coordinates/VOIs}/meta/Dosenbach2010_MNI_VOIs.txt +0 -0
/junifer/data/{VOIs → coordinates/VOIs}/meta/Empathy_VOIs.txt +0 -0
/junifer/data/{VOIs → coordinates/VOIs}/meta/Motor_VOIs.txt +0 -0
/junifer/data/{VOIs → coordinates/VOIs}/meta/MultiTask_VOIs.txt +0 -0
/junifer/data/{VOIs → coordinates/VOIs}/meta/PhysioStress_VOIs.txt +0 -0
/junifer/data/{VOIs → coordinates/VOIs}/meta/Power2011_MNI_VOIs.txt +0 -0
/junifer/data/{VOIs → coordinates/VOIs}/meta/Power2013_MNI_VOIs.tsv +0 -0
/junifer/data/{VOIs → coordinates/VOIs}/meta/Rew_VOIs.txt +0 -0
/junifer/data/{VOIs → coordinates/VOIs}/meta/Somatosensory_VOIs.txt +0 -0
/junifer/data/{VOIs → coordinates/VOIs}/meta/ToM_VOIs.txt +0 -0
/junifer/data/{VOIs → coordinates/VOIs}/meta/VigAtt_VOIs.txt +0 -0
/junifer/data/{VOIs → coordinates/VOIs}/meta/WM_VOIs.txt +0 -0
/junifer/data/{VOIs → coordinates/VOIs}/meta/eMDN_VOIs.txt +0 -0
/junifer/data/{VOIs → coordinates/VOIs}/meta/eSAD_VOIs.txt +0 -0
/junifer/data/{VOIs → coordinates/VOIs}/meta/extDMN_VOIs.txt +0 -0
{junifer-0.0.5.dev240.dist-info → junifer-0.0.6.dist-info/licenses}/AUTHORS.rst +0 -0
{junifer-0.0.5.dev240.dist-info → junifer-0.0.6.dist-info/licenses}/LICENSE.md +0 -0
{junifer-0.0.5.dev240.dist-info → junifer-0.0.6.dist-info}/top_level.txt +0 -0

junifer/storage/base.py CHANGED Viewed

@@ -5,8 +5,9 @@
 # License: AGPL
 from abc import ABC, abstractmethod
+from collections.abc import Iterable
 from pathlib import Path
-from typing import Any, Dict, Iterable, List, Optional, Union
+from typing import Any, Optional, Union
 import numpy as np
 import pandas as pd
@@ -43,7 +44,7 @@ class BaseFeatureStorage(ABC):
     def __init__(
         self,
         uri: Union[str, Path],
-        storage_types: Union[List[str], str],
+        storage_types: Union[list[str], str],
         single_output: bool = True,
     ) -> None:
         self.uri = uri
@@ -61,7 +62,7 @@ class BaseFeatureStorage(ABC):
         self._valid_inputs = storage_types
         self.single_output = single_output
-    def get_valid_inputs(self) -> List[str]:
+    def get_valid_inputs(self) -> list[str]:
         """Get valid storage types for input.
         Returns
@@ -76,7 +77,7 @@ class BaseFeatureStorage(ABC):
             klass=NotImplementedError,
         )
-    def validate(self, input_: List[str]) -> None:
+    def validate(self, input_: list[str]) -> None:
         """Validate the input to the pipeline step.
         Parameters
@@ -98,7 +99,7 @@ class BaseFeatureStorage(ABC):
             )
     @abstractmethod
-    def list_features(self) -> Dict[str, Dict[str, Any]]:
+    def list_features(self) -> dict[str, dict[str, Any]]:
         """List the features in the storage.
         Returns
@@ -119,8 +120,8 @@ class BaseFeatureStorage(ABC):
         self,
         feature_name: Optional[str] = None,
         feature_md5: Optional[str] = None,
-    ) -> Dict[
-        str, Union[str, List[Union[int, str, Dict[str, str]]], np.ndarray]
+    ) -> dict[
+        str, Union[str, list[Union[int, str, dict[str, str]]], np.ndarray]
     ]:
         """Read stored feature.
@@ -169,7 +170,7 @@ class BaseFeatureStorage(ABC):
         )
     @abstractmethod
-    def store_metadata(self, meta_md5: str, element: Dict, meta: Dict) -> None:
+    def store_metadata(self, meta_md5: str, element: dict, meta: dict) -> None:
         """Store metadata.
         Parameters
@@ -225,11 +226,15 @@ class BaseFeatureStorage(ABC):
             self.store_scalar_table(
                 meta_md5=meta_md5, element=t_element, **kwargs
             )
+        elif kind == "timeseries_2d":
+            self.store_timeseries_2d(
+                meta_md5=meta_md5, element=t_element, **kwargs
+            )
     def store_matrix(
         self,
         meta_md5: str,
-        element: Dict,
+        element: dict,
         data: np.ndarray,
         col_names: Optional[Iterable[str]] = None,
         row_names: Optional[Iterable[str]] = None,
@@ -271,8 +276,8 @@ class BaseFeatureStorage(ABC):
     def store_vector(
         self,
         meta_md5: str,
-        element: Dict,
-        data: Union[np.ndarray, List],
+        element: dict,
+        data: Union[np.ndarray, list],
         col_names: Optional[Iterable[str]] = None,
     ) -> None:
         """Store vector.
@@ -297,7 +302,7 @@ class BaseFeatureStorage(ABC):
     def store_timeseries(
         self,
         meta_md5: str,
-        element: Dict,
+        element: dict,
         data: np.ndarray,
         col_names: Optional[Iterable[str]] = None,
     ) -> None:
@@ -320,10 +325,39 @@ class BaseFeatureStorage(ABC):
             klass=NotImplementedError,
         )
+    def store_timeseries_2d(
+        self,
+        meta_md5: str,
+        element: dict,
+        data: np.ndarray,
+        col_names: Optional[Iterable[str]] = None,
+        row_names: Optional[Iterable[str]] = None,
+    ) -> None:
+        """Store 2D timeseries.
+        Parameters
+        ----------
+        meta_md5 : str
+            The metadata MD5 hash.
+        element : dict
+            The element as a dictionary.
+        data : numpy.ndarray
+            The timeseries data to store.
+        col_names : list or tuple of str, optional
+            The column labels (default None).
+        row_names : list or tuple of str, optional
+            The row labels (default None).
+        """
+        raise_error(
+            msg="Concrete classes need to implement store_timeseries_2d().",
+            klass=NotImplementedError,
+        )
     def store_scalar_table(
         self,
         meta_md5: str,
-        element: Dict,
+        element: dict,
         data: np.ndarray,
         col_names: Optional[Iterable[str]] = None,
         row_names: Optional[Iterable[str]] = None,

junifer/storage/hdf5.py CHANGED Viewed

@@ -4,10 +4,10 @@
 #          Federico Raimondo <f.raimondo@fz-juelich.de>
 # License: AGPL
 from collections import defaultdict
+from collections.abc import Iterable
 from pathlib import Path
-from typing import Any, Dict, Iterable, List, Optional, Union
+from typing import Any, Optional, Union
 import numpy as np
 import pandas as pd
@@ -23,14 +23,20 @@ from ..external.h5io.h5io import (
 )
 from ..utils import logger, raise_error
 from .base import BaseFeatureStorage
-from .utils import element_to_prefix, matrix_to_vector, store_matrix_checks
+from .utils import (
+    element_to_prefix,
+    matrix_to_vector,
+    store_matrix_checks,
+    store_timeseries_2d_checks,
+    timeseries2d_to_vector,
+)
 __all__ = ["HDF5FeatureStorage"]
 def _create_chunk(
-    chunk_data: List[np.ndarray],
+    chunk_data: list[np.ndarray],
     kind: str,
     element_count: int,
     chunk_size: int,
@@ -81,7 +87,7 @@ def _create_chunk(
             chunk_size=tuple(array_chunk_size),
             n_chunk=i_chunk,
         )
-    elif kind in ["timeseries", "scalar_table"]:
+    elif kind in ["timeseries", "scalar_table", "timeseries_2d"]:
         out = ChunkedList(
             data=chunk_data,
             size=element_count,
@@ -90,8 +96,8 @@ def _create_chunk(
     else:
         raise_error(
             f"Invalid kind: {kind}. "
-            "Must be one of ['vector', 'matrix', 'timeseries',"
-            "'scalar_table']."
+            "Must be one of ['vector', 'matrix', 'timeseries', "
+            "'timeseries_2d', 'scalar_table']."
         )
     return out
@@ -164,7 +170,7 @@ class HDF5FeatureStorage(BaseFeatureStorage):
         self.force_float32 = force_float32
         self.chunk_size = chunk_size
-    def get_valid_inputs(self) -> List[str]:
+    def get_valid_inputs(self) -> list[str]:
         """Get valid storage types for input.
         Returns
@@ -176,7 +182,7 @@ class HDF5FeatureStorage(BaseFeatureStorage):
         """
         return ["matrix", "vector", "timeseries", "scalar_table"]
-    def _fetch_correct_uri_for_io(self, element: Optional[Dict]) -> str:
+    def _fetch_correct_uri_for_io(self, element: Optional[dict]) -> str:
         """Return proper URI for I/O based on `element`.
         If `element` is None, will return `self.uri`.
@@ -195,8 +201,7 @@ class HDF5FeatureStorage(BaseFeatureStorage):
         if not self.single_output and not element:
             raise_error(
                 msg=(
-                    "`element` must be provided when `single_output` "
-                    "is False"
+                    "`element` must be provided when `single_output` is False"
                 ),
                 klass=RuntimeError,
             )
@@ -210,8 +215,8 @@ class HDF5FeatureStorage(BaseFeatureStorage):
         return f"{self.uri.parent}/{prefix}{self.uri.name}"  # type: ignore
     def _read_metadata(
-        self, element: Optional[Dict[str, str]] = None
-    ) -> Dict[str, Dict[str, Any]]:
+        self, element: Optional[dict[str, str]] = None
+    ) -> dict[str, dict[str, Any]]:
         """Read metadata (should not be called directly).
         Parameters
@@ -261,7 +266,7 @@ class HDF5FeatureStorage(BaseFeatureStorage):
         return metadata
-    def list_features(self) -> Dict[str, Dict[str, Any]]:
+    def list_features(self) -> dict[str, dict[str, Any]]:
         """List the features in the storage.
         Returns
@@ -281,8 +286,8 @@ class HDF5FeatureStorage(BaseFeatureStorage):
         return metadata
     def _read_data(
-        self, md5: str, element: Optional[Dict[str, str]] = None
-    ) -> Dict[str, Any]:
+        self, md5: str, element: Optional[dict[str, str]] = None
+    ) -> dict[str, Any]:
         """Read data (should not be called directly).
         Parameters
@@ -338,8 +343,8 @@ class HDF5FeatureStorage(BaseFeatureStorage):
         self,
         feature_name: Optional[str] = None,
         feature_md5: Optional[str] = None,
-    ) -> Dict[
-        str, Union[str, List[Union[int, str, Dict[str, str]]], np.ndarray]
+    ) -> dict[
+        str, Union[str, list[Union[int, str, dict[str, str]]], np.ndarray]
     ]:
         """Read stored feature.
@@ -513,6 +518,27 @@ class HDF5FeatureStorage(BaseFeatureStorage):
             columns = hdf_data["column_headers"]
             # Convert data from 3D to 2D
             reshaped_data = np.concatenate(all_data, axis=0)
+        elif hdf_data["kind"] == "timeseries_2d":
+            # Create dictionary for aggregating index data
+            element_idx = defaultdict(list)
+            all_data = []
+            for idx, element in enumerate(hdf_data["element"]):
+                # Get row count for the element
+                t_data = hdf_data["data"][idx]
+                flat_data, columns = timeseries2d_to_vector(
+                    data=t_data,
+                    col_names=hdf_data["column_headers"],
+                    row_names=hdf_data["row_headers"],
+                )
+                all_data.append(flat_data)
+                n_timepoints = flat_data.shape[0]
+                # Set rows for the index
+                for key, val in element.items():
+                    element_idx[key].extend([val] * n_timepoints)
+                # Add extra column for timepoints
+                element_idx["timepoint"].extend(np.arange(n_timepoints))
+            # Convert data from 3D to 2D
+            reshaped_data = np.concatenate(all_data, axis=0)
         elif hdf_data["kind"] == "scalar_table":
             # Create dictionary for aggregating index data
             element_idx = defaultdict(list)
@@ -562,7 +588,7 @@ class HDF5FeatureStorage(BaseFeatureStorage):
         return df
     def _write_processed_data(
-        self, fname: str, processed_data: Dict[str, Any], title: str
+        self, fname: str, processed_data: dict[str, Any], title: str
     ) -> None:
         """Write processed data to HDF5 (should not be called directly).
@@ -594,8 +620,8 @@ class HDF5FeatureStorage(BaseFeatureStorage):
     def store_metadata(
         self,
         meta_md5: str,
-        element: Dict[str, str],
-        meta: Dict[str, Any],
+        element: dict[str, str],
+        meta: dict[str, Any],
     ) -> None:
         """Store metadata.
@@ -655,7 +681,7 @@ class HDF5FeatureStorage(BaseFeatureStorage):
         self,
         kind: str,
         meta_md5: str,
-        element: List[Dict[str, str]],
+        element: list[dict[str, str]],
         data: np.ndarray,
         **kwargs: Any,
     ) -> None:
@@ -764,7 +790,7 @@ class HDF5FeatureStorage(BaseFeatureStorage):
             )
             t_data = stored_data["data"]
-            if kind in ["timeseries", "scalar_table"]:
+            if kind in ["timeseries", "scalar_table", "timeseries_2d"]:
                 t_data += data
             else:
                 t_data = np.concatenate((t_data, data), axis=-1)
@@ -797,7 +823,7 @@ class HDF5FeatureStorage(BaseFeatureStorage):
     def store_matrix(
         self,
         meta_md5: str,
-        element: Dict[str, str],
+        element: dict[str, str],
         data: np.ndarray,
         col_names: Optional[Iterable[str]] = None,
         row_names: Optional[Iterable[str]] = None,
@@ -876,8 +902,8 @@ class HDF5FeatureStorage(BaseFeatureStorage):
     def store_vector(
         self,
         meta_md5: str,
-        element: Dict[str, str],
-        data: Union[np.ndarray, List],
+        element: dict[str, str],
+        data: Union[np.ndarray, list],
         col_names: Optional[Iterable[str]] = None,
     ) -> None:
         """Store vector.
@@ -919,7 +945,7 @@ class HDF5FeatureStorage(BaseFeatureStorage):
     def store_timeseries(
         self,
         meta_md5: str,
-        element: Dict[str, str],
+        element: dict[str, str],
         data: np.ndarray,
         col_names: Optional[Iterable[str]] = None,
     ) -> None:
@@ -946,10 +972,48 @@ class HDF5FeatureStorage(BaseFeatureStorage):
             row_header_column_name="timepoint",
         )
+    def store_timeseries_2d(
+        self,
+        meta_md5: str,
+        element: dict[str, str],
+        data: np.ndarray,
+        col_names: Optional[Iterable[str]] = None,
+        row_names: Optional[Iterable[str]] = None,
+    ) -> None:
+        """Store a 2D timeseries.
+        Parameters
+        ----------
+        meta_md5 : str
+            The metadata MD5 hash.
+        element : dict
+            The element as dictionary.
+        data : numpy.ndarray
+            The 2D timeseries data to store.
+        col_names : list or tuple of str, optional
+            The column labels (default None).
+        row_names : list or tuple of str, optional
+            The row labels (default None).
+        """
+        store_timeseries_2d_checks(
+            data_shape=data.shape,
+            row_names_len=len(row_names),  # type: ignore
+            col_names_len=len(col_names),  # type: ignore
+        )
+        self._store_data(
+            kind="timeseries_2d",
+            meta_md5=meta_md5,
+            element=[element],  # convert to list
+            data=[data],  # convert to list
+            column_headers=col_names,
+            row_headers=row_names,
+        )
     def store_scalar_table(
         self,
         meta_md5: str,
-        element: Dict,
+        element: dict,
         data: np.ndarray,
         col_names: Optional[Iterable[str]] = None,
         row_names: Optional[Iterable[str]] = None,
@@ -1013,8 +1077,7 @@ class HDF5FeatureStorage(BaseFeatureStorage):
         # Run loop to collect metadata
         logger.info(
-            "Collecting metadata from "
-            f"{self.uri.parent}/*_{self.uri.name}"  # type: ignore
+            f"Collecting metadata from {self.uri.parent}/*_{self.uri.name}"  # type: ignore
         )
         # Collect element files per feature MD5
         elements_per_feature_md5 = defaultdict(list)
@@ -1045,8 +1108,7 @@ class HDF5FeatureStorage(BaseFeatureStorage):
         # Run loop to collect data per feature per file
         logger.info(
-            "Collecting data from "
-            f"{self.uri.parent}/*_{self.uri.name}"  # type: ignore
+            f"Collecting data from {self.uri.parent}/*_{self.uri.name}"  # type: ignore
         )
         logger.info(f"Will collect {len(elements_per_feature_md5)} features.")
@@ -1091,7 +1153,7 @@ class HDF5FeatureStorage(BaseFeatureStorage):
                     kind = static_data["kind"]
                 # Append the "dynamic" data
-                if kind in ["timeseries", "scalar_table"]:
+                if kind in ["timeseries", "scalar_table", "timeseries_2d"]:
                     chunk_data.extend(t_data["data"])
                 else:
                     chunk_data.append(t_data["data"])

junifer/storage/pandas_base.py CHANGED Viewed

@@ -5,8 +5,9 @@
 # License: AGPL
 import json
+from collections.abc import Iterable
 from pathlib import Path
-from typing import Dict, Iterable, List, Optional, Union
+from typing import Optional, Union
 import numpy as np
 import pandas as pd
@@ -44,7 +45,7 @@ class PandasBaseFeatureStorage(BaseFeatureStorage):
     ) -> None:
         super().__init__(uri=uri, single_output=single_output, **kwargs)
-    def get_valid_inputs(self) -> List[str]:
+    def get_valid_inputs(self) -> list[str]:
         """Get valid storage types for input.
         Returns
@@ -56,7 +57,7 @@ class PandasBaseFeatureStorage(BaseFeatureStorage):
         """
         return ["matrix", "vector", "timeseries"]
-    def _meta_row(self, meta: Dict, meta_md5: str) -> pd.DataFrame:
+    def _meta_row(self, meta: dict, meta_md5: str) -> pd.DataFrame:
         """Convert the metadata to a pandas DataFrame.
         Parameters
@@ -80,7 +81,7 @@ class PandasBaseFeatureStorage(BaseFeatureStorage):
     @staticmethod
     def element_to_index(
-        element: Dict, n_rows: int = 1, rows_col_name: Optional[str] = None
+        element: dict, n_rows: int = 1, rows_col_name: Optional[str] = None
     ) -> Union[pd.Index, pd.MultiIndex]:
         """Convert the element metadata to index.
@@ -101,7 +102,7 @@ class PandasBaseFeatureStorage(BaseFeatureStorage):
         """
         # Make mapping between element access keys and values
-        elem_idx: Dict[str, Iterable[str]] = {
+        elem_idx: dict[str, Iterable[str]] = {
             k: [v] * n_rows for k, v in element.items()
         }
@@ -129,7 +130,7 @@ class PandasBaseFeatureStorage(BaseFeatureStorage):
         return index
     def store_df(
-        self, meta_md5: str, element: Dict, df: Union[pd.DataFrame, pd.Series]
+        self, meta_md5: str, element: dict, df: Union[pd.DataFrame, pd.Series]
     ) -> None:
         """Implement pandas DataFrame storing.
@@ -157,8 +158,8 @@ class PandasBaseFeatureStorage(BaseFeatureStorage):
     def _store_2d(
         self,
         meta_md5: str,
-        element: Dict,
-        data: Union[np.ndarray, List],
+        element: dict,
+        data: Union[np.ndarray, list],
         col_names: Optional[Iterable[str]] = None,
         rows_col_name: Optional[str] = None,
     ) -> None:
@@ -194,8 +195,8 @@ class PandasBaseFeatureStorage(BaseFeatureStorage):
     def store_vector(
         self,
         meta_md5: str,
-        element: Dict,
-        data: Union[np.ndarray, List],
+        element: dict,
+        data: Union[np.ndarray, list],
         col_names: Optional[Iterable[str]] = None,
     ) -> None:
         """Store vector.
@@ -232,7 +233,7 @@ class PandasBaseFeatureStorage(BaseFeatureStorage):
     def store_timeseries(
         self,
         meta_md5: str,
-        element: Dict,
+        element: dict,
         data: np.ndarray,
         col_names: Optional[Iterable[str]] = None,
     ) -> None:

junifer/storage/py.typed ADDED Viewed

File without changes

junifer/storage/sqlite.py CHANGED Viewed

@@ -6,7 +6,7 @@
 import json
 from pathlib import Path
-from typing import TYPE_CHECKING, Any, Dict, List, Optional, Union
+from typing import TYPE_CHECKING, Any, Optional, Union
 import numpy as np
 import pandas as pd
@@ -92,7 +92,7 @@ class SQLiteFeatureStorage(PandasBaseFeatureStorage):
         # Set upsert
         self._upsert = upsert
-    def get_engine(self, element: Optional[Dict] = None) -> "Engine":
+    def get_engine(self, element: Optional[dict] = None) -> "Engine":
         """Get engine.
         Parameters
@@ -209,7 +209,7 @@ class SQLiteFeatureStorage(PandasBaseFeatureStorage):
                         msg=f"Invalid option {if_exists} for if_exists."
                     )
-    def list_features(self) -> Dict[str, Dict[str, Any]]:
+    def list_features(self) -> dict[str, dict[str, Any]]:
         """List the features in the storage.
         Returns
@@ -229,7 +229,7 @@ class SQLiteFeatureStorage(PandasBaseFeatureStorage):
         # Format index names for retrieved data
         meta_df.index = meta_df.index.str.replace(r"meta_", "")
         # Convert dataframe to dictionary
-        out: Dict[str, Dict[str, str]] = meta_df.to_dict(
+        out: dict[str, dict[str, str]] = meta_df.to_dict(
             orient="index"
         )  # type: ignore
         # Format output
@@ -242,8 +242,8 @@ class SQLiteFeatureStorage(PandasBaseFeatureStorage):
         self,
         feature_name: Optional[str] = None,
         feature_md5: Optional[str] = None,
-    ) -> Dict[
-        str, Union[str, List[Union[int, str, Dict[str, str]]], np.ndarray]
+    ) -> dict[
+        str, Union[str, list[Union[int, str, dict[str, str]]], np.ndarray]
     ]:
         """Read stored feature.
@@ -358,7 +358,7 @@ class SQLiteFeatureStorage(PandasBaseFeatureStorage):
         df = df.set_index(index_names)
         return df
-    def store_metadata(self, meta_md5: str, element: Dict, meta: Dict) -> None:
+    def store_metadata(self, meta_md5: str, element: dict, meta: dict) -> None:
         """Implement metadata storing in the storage.
         Parameters
@@ -381,7 +381,7 @@ class SQLiteFeatureStorage(PandasBaseFeatureStorage):
             self._save_upsert(meta_df, "meta", engine)
     def store_df(
-        self, meta_md5: str, element: Dict, df: Union[pd.DataFrame, pd.Series]
+        self, meta_md5: str, element: dict, df: Union[pd.DataFrame, pd.Series]
     ) -> None:
         """Implement pandas DataFrame storing.
@@ -434,10 +434,10 @@ class SQLiteFeatureStorage(PandasBaseFeatureStorage):
     def store_matrix(
         self,
         meta_md5: str,
-        element: Dict,
+        element: dict,
         data: np.ndarray,
-        col_names: Optional[List[str]] = None,
-        row_names: Optional[List[str]] = None,
+        col_names: Optional[list[str]] = None,
+        row_names: Optional[list[str]] = None,
         matrix_kind: str = "full",
         diagonal: bool = True,
     ) -> None:

junifer 0.0.5.dev240__py3-none-any.whl → 0.0.6__py3-none-any.whl

junifer 0.0.5.dev240__py3-none-any.whl → 0.0.6__py3-none-any.whl