PyPI - junifer - Versions diffs - 0.0.5.dev240__py3-none-any.whl → 0.0.6__py3-none-any.whl - Mend

junifer 0.0.5.dev240 (py3-none-any.whl) → 0.0.6 (py3-none-any.whl)

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (279)

junifer/__init__.py +2 -31
junifer/__init__.pyi +37 -0
junifer/_version.py +9 -4
junifer/api/__init__.py +3 -5
junifer/api/__init__.pyi +4 -0
junifer/api/decorators.py +14 -19
junifer/api/functions.py +165 -109
junifer/api/py.typed +0 -0
junifer/api/queue_context/__init__.py +2 -4
junifer/api/queue_context/__init__.pyi +5 -0
junifer/api/queue_context/gnu_parallel_local_adapter.py +22 -6
junifer/api/queue_context/htcondor_adapter.py +23 -6
junifer/api/queue_context/py.typed +0 -0
junifer/api/queue_context/tests/test_gnu_parallel_local_adapter.py +3 -3
junifer/api/queue_context/tests/test_htcondor_adapter.py +3 -3
junifer/api/tests/test_functions.py +168 -74
junifer/cli/__init__.py +24 -0
junifer/cli/__init__.pyi +3 -0
junifer/{api → cli}/cli.py +141 -125
junifer/cli/parser.py +235 -0
junifer/cli/py.typed +0 -0
junifer/{api → cli}/tests/test_cli.py +8 -8
junifer/{api/tests/test_api_utils.py → cli/tests/test_cli_utils.py} +5 -4
junifer/{api → cli}/tests/test_parser.py +2 -2
junifer/{api → cli}/utils.py +6 -16
junifer/configs/juseless/__init__.py +2 -2
junifer/configs/juseless/__init__.pyi +3 -0
junifer/configs/juseless/datagrabbers/__init__.py +2 -12
junifer/configs/juseless/datagrabbers/__init__.pyi +13 -0
junifer/configs/juseless/datagrabbers/ixi_vbm.py +2 -2
junifer/configs/juseless/datagrabbers/py.typed +0 -0
junifer/configs/juseless/datagrabbers/tests/test_ucla.py +2 -2
junifer/configs/juseless/datagrabbers/ucla.py +4 -4
junifer/configs/juseless/py.typed +0 -0
junifer/conftest.py +25 -0
junifer/data/__init__.py +2 -42
junifer/data/__init__.pyi +29 -0
junifer/data/_dispatch.py +248 -0
junifer/data/coordinates/__init__.py +9 -0
junifer/data/coordinates/__init__.pyi +5 -0
junifer/data/coordinates/_ants_coordinates_warper.py +104 -0
junifer/data/coordinates/_coordinates.py +385 -0
junifer/data/coordinates/_fsl_coordinates_warper.py +81 -0
junifer/data/{tests → coordinates/tests}/test_coordinates.py +26 -33
junifer/data/masks/__init__.py +9 -0
junifer/data/masks/__init__.pyi +6 -0
junifer/data/masks/_ants_mask_warper.py +177 -0
junifer/data/masks/_fsl_mask_warper.py +106 -0
junifer/data/masks/_masks.py +802 -0
junifer/data/{tests → masks/tests}/test_masks.py +67 -63
junifer/data/parcellations/__init__.py +9 -0
junifer/data/parcellations/__init__.pyi +6 -0
junifer/data/parcellations/_ants_parcellation_warper.py +166 -0
junifer/data/parcellations/_fsl_parcellation_warper.py +89 -0
junifer/data/parcellations/_parcellations.py +1388 -0
junifer/data/{tests → parcellations/tests}/test_parcellations.py +165 -295
junifer/data/pipeline_data_registry_base.py +76 -0
junifer/data/py.typed +0 -0
junifer/data/template_spaces.py +44 -79
junifer/data/tests/test_data_utils.py +1 -2
junifer/data/tests/test_template_spaces.py +8 -4
junifer/data/utils.py +109 -4
junifer/datagrabber/__init__.py +2 -26
junifer/datagrabber/__init__.pyi +27 -0
junifer/datagrabber/aomic/__init__.py +2 -4
junifer/datagrabber/aomic/__init__.pyi +5 -0
junifer/datagrabber/aomic/id1000.py +81 -52
junifer/datagrabber/aomic/piop1.py +83 -55
junifer/datagrabber/aomic/piop2.py +85 -56
junifer/datagrabber/aomic/py.typed +0 -0
junifer/datagrabber/aomic/tests/test_id1000.py +19 -12
junifer/datagrabber/aomic/tests/test_piop1.py +52 -18
junifer/datagrabber/aomic/tests/test_piop2.py +50 -17
junifer/datagrabber/base.py +22 -18
junifer/datagrabber/datalad_base.py +71 -34
junifer/datagrabber/dmcc13_benchmark.py +31 -18
junifer/datagrabber/hcp1200/__init__.py +2 -3
junifer/datagrabber/hcp1200/__init__.pyi +4 -0
junifer/datagrabber/hcp1200/datalad_hcp1200.py +3 -3
junifer/datagrabber/hcp1200/hcp1200.py +26 -15
junifer/datagrabber/hcp1200/py.typed +0 -0
junifer/datagrabber/hcp1200/tests/test_hcp1200.py +8 -2
junifer/datagrabber/multiple.py +14 -9
junifer/datagrabber/pattern.py +132 -96
junifer/datagrabber/pattern_validation_mixin.py +206 -94
junifer/datagrabber/py.typed +0 -0
junifer/datagrabber/tests/test_datalad_base.py +27 -12
junifer/datagrabber/tests/test_dmcc13_benchmark.py +28 -11
junifer/datagrabber/tests/test_multiple.py +48 -2
junifer/datagrabber/tests/test_pattern_datalad.py +1 -1
junifer/datagrabber/tests/test_pattern_validation_mixin.py +6 -6
junifer/datareader/__init__.py +2 -2
junifer/datareader/__init__.pyi +3 -0
junifer/datareader/default.py +6 -6
junifer/datareader/py.typed +0 -0
junifer/external/nilearn/__init__.py +2 -3
junifer/external/nilearn/__init__.pyi +4 -0
junifer/external/nilearn/junifer_connectivity_measure.py +25 -17
junifer/external/nilearn/junifer_nifti_spheres_masker.py +4 -4
junifer/external/nilearn/py.typed +0 -0
junifer/external/nilearn/tests/test_junifer_connectivity_measure.py +17 -16
junifer/external/nilearn/tests/test_junifer_nifti_spheres_masker.py +2 -3
junifer/markers/__init__.py +2 -38
junifer/markers/__init__.pyi +37 -0
junifer/markers/base.py +11 -14
junifer/markers/brainprint.py +12 -14
junifer/markers/complexity/__init__.py +2 -18
junifer/markers/complexity/__init__.pyi +17 -0
junifer/markers/complexity/complexity_base.py +9 -11
junifer/markers/complexity/hurst_exponent.py +7 -7
junifer/markers/complexity/multiscale_entropy_auc.py +7 -7
junifer/markers/complexity/perm_entropy.py +7 -7
junifer/markers/complexity/py.typed +0 -0
junifer/markers/complexity/range_entropy.py +7 -7
junifer/markers/complexity/range_entropy_auc.py +7 -7
junifer/markers/complexity/sample_entropy.py +7 -7
junifer/markers/complexity/tests/test_complexity_base.py +1 -1
junifer/markers/complexity/tests/test_hurst_exponent.py +5 -5
junifer/markers/complexity/tests/test_multiscale_entropy_auc.py +5 -5
junifer/markers/complexity/tests/test_perm_entropy.py +5 -5
junifer/markers/complexity/tests/test_range_entropy.py +5 -5
junifer/markers/complexity/tests/test_range_entropy_auc.py +5 -5
junifer/markers/complexity/tests/test_sample_entropy.py +5 -5
junifer/markers/complexity/tests/test_weighted_perm_entropy.py +5 -5
junifer/markers/complexity/weighted_perm_entropy.py +7 -7
junifer/markers/ets_rss.py +12 -11
junifer/markers/falff/__init__.py +2 -3
junifer/markers/falff/__init__.pyi +4 -0
junifer/markers/falff/_afni_falff.py +38 -45
junifer/markers/falff/_junifer_falff.py +16 -19
junifer/markers/falff/falff_base.py +7 -11
junifer/markers/falff/falff_parcels.py +9 -9
junifer/markers/falff/falff_spheres.py +8 -8
junifer/markers/falff/py.typed +0 -0
junifer/markers/falff/tests/test_falff_spheres.py +3 -1
junifer/markers/functional_connectivity/__init__.py +2 -12
junifer/markers/functional_connectivity/__init__.pyi +13 -0
junifer/markers/functional_connectivity/crossparcellation_functional_connectivity.py +9 -8
junifer/markers/functional_connectivity/edge_functional_connectivity_parcels.py +8 -8
junifer/markers/functional_connectivity/edge_functional_connectivity_spheres.py +7 -7
junifer/markers/functional_connectivity/functional_connectivity_base.py +13 -12
junifer/markers/functional_connectivity/functional_connectivity_parcels.py +8 -8
junifer/markers/functional_connectivity/functional_connectivity_spheres.py +7 -7
junifer/markers/functional_connectivity/py.typed +0 -0
junifer/markers/functional_connectivity/tests/test_edge_functional_connectivity_parcels.py +1 -2
junifer/markers/functional_connectivity/tests/test_edge_functional_connectivity_spheres.py +1 -2
junifer/markers/functional_connectivity/tests/test_functional_connectivity_parcels.py +6 -6
junifer/markers/functional_connectivity/tests/test_functional_connectivity_spheres.py +5 -5
junifer/markers/parcel_aggregation.py +22 -17
junifer/markers/py.typed +0 -0
junifer/markers/reho/__init__.py +2 -3
junifer/markers/reho/__init__.pyi +4 -0
junifer/markers/reho/_afni_reho.py +29 -35
junifer/markers/reho/_junifer_reho.py +13 -14
junifer/markers/reho/py.typed +0 -0
junifer/markers/reho/reho_base.py +7 -11
junifer/markers/reho/reho_parcels.py +10 -10
junifer/markers/reho/reho_spheres.py +9 -9
junifer/markers/sphere_aggregation.py +22 -17
junifer/markers/temporal_snr/__init__.py +2 -3
junifer/markers/temporal_snr/__init__.pyi +4 -0
junifer/markers/temporal_snr/py.typed +0 -0
junifer/markers/temporal_snr/temporal_snr_base.py +11 -10
junifer/markers/temporal_snr/temporal_snr_parcels.py +8 -8
junifer/markers/temporal_snr/temporal_snr_spheres.py +7 -7
junifer/markers/tests/test_ets_rss.py +3 -3
junifer/markers/tests/test_parcel_aggregation.py +24 -24
junifer/markers/tests/test_sphere_aggregation.py +6 -6
junifer/markers/utils.py +3 -3
junifer/onthefly/__init__.py +2 -1
junifer/onthefly/_brainprint.py +138 -0
junifer/onthefly/read_transform.py +5 -8
junifer/pipeline/__init__.py +2 -10
junifer/pipeline/__init__.pyi +13 -0
junifer/{markers/collection.py → pipeline/marker_collection.py} +8 -14
junifer/pipeline/pipeline_component_registry.py +294 -0
junifer/pipeline/pipeline_step_mixin.py +15 -11
junifer/pipeline/py.typed +0 -0
junifer/{markers/tests/test_collection.py → pipeline/tests/test_marker_collection.py} +2 -3
junifer/pipeline/tests/test_pipeline_component_registry.py +200 -0
junifer/pipeline/tests/test_pipeline_step_mixin.py +36 -37
junifer/pipeline/tests/test_update_meta_mixin.py +4 -4
junifer/pipeline/tests/test_workdir_manager.py +43 -0
junifer/pipeline/update_meta_mixin.py +21 -17
junifer/pipeline/utils.py +6 -6
junifer/pipeline/workdir_manager.py +19 -5
junifer/preprocess/__init__.py +2 -10
junifer/preprocess/__init__.pyi +11 -0
junifer/preprocess/base.py +10 -10
junifer/preprocess/confounds/__init__.py +2 -2
junifer/preprocess/confounds/__init__.pyi +3 -0
junifer/preprocess/confounds/fmriprep_confound_remover.py +243 -64
junifer/preprocess/confounds/py.typed +0 -0
junifer/preprocess/confounds/tests/test_fmriprep_confound_remover.py +121 -14
junifer/preprocess/py.typed +0 -0
junifer/preprocess/smoothing/__init__.py +2 -2
junifer/preprocess/smoothing/__init__.pyi +3 -0
junifer/preprocess/smoothing/_afni_smoothing.py +40 -40
junifer/preprocess/smoothing/_fsl_smoothing.py +22 -32
junifer/preprocess/smoothing/_nilearn_smoothing.py +35 -14
junifer/preprocess/smoothing/py.typed +0 -0
junifer/preprocess/smoothing/smoothing.py +11 -13
junifer/preprocess/warping/__init__.py +2 -2
junifer/preprocess/warping/__init__.pyi +3 -0
junifer/preprocess/warping/_ants_warper.py +136 -32
junifer/preprocess/warping/_fsl_warper.py +73 -22
junifer/preprocess/warping/py.typed +0 -0
junifer/preprocess/warping/space_warper.py +39 -11
junifer/preprocess/warping/tests/test_space_warper.py +5 -9
junifer/py.typed +0 -0
junifer/stats.py +5 -5
junifer/storage/__init__.py +2 -10
junifer/storage/__init__.pyi +11 -0
junifer/storage/base.py +47 -13
junifer/storage/hdf5.py +95 -33
junifer/storage/pandas_base.py +12 -11
junifer/storage/py.typed +0 -0
junifer/storage/sqlite.py +11 -11
junifer/storage/tests/test_hdf5.py +86 -4
junifer/storage/tests/test_sqlite.py +2 -2
junifer/storage/tests/test_storage_base.py +5 -2
junifer/storage/tests/test_utils.py +33 -7
junifer/storage/utils.py +95 -9
junifer/testing/__init__.py +2 -3
junifer/testing/__init__.pyi +4 -0
junifer/testing/datagrabbers.py +10 -11
junifer/testing/py.typed +0 -0
junifer/testing/registry.py +4 -7
junifer/testing/tests/test_testing_registry.py +9 -17
junifer/tests/test_stats.py +2 -2
junifer/typing/__init__.py +9 -0
junifer/typing/__init__.pyi +31 -0
junifer/typing/_typing.py +68 -0
junifer/utils/__init__.py +2 -12
junifer/utils/__init__.pyi +18 -0
junifer/utils/_config.py +110 -0
junifer/utils/_yaml.py +16 -0
junifer/utils/helpers.py +6 -6
junifer/utils/logging.py +117 -8
junifer/utils/py.typed +0 -0
junifer/{pipeline → utils}/singleton.py +19 -14
junifer/utils/tests/test_config.py +59 -0
{junifer-0.0.5.dev240.dist-info → junifer-0.0.6.dist-info}/METADATA +43 -38
junifer-0.0.6.dist-info/RECORD +350 -0
{junifer-0.0.5.dev240.dist-info → junifer-0.0.6.dist-info}/WHEEL +1 -1
junifer-0.0.6.dist-info/entry_points.txt +2 -0
junifer/api/parser.py +0 -118
junifer/data/coordinates.py +0 -408
junifer/data/masks.py +0 -670
junifer/data/parcellations.py +0 -1828
junifer/pipeline/registry.py +0 -177
junifer/pipeline/tests/test_registry.py +0 -150
junifer-0.0.5.dev240.dist-info/RECORD +0 -275
junifer-0.0.5.dev240.dist-info/entry_points.txt +0 -2
/junifer/{api → cli}/tests/data/gmd_mean.yaml +0 -0
/junifer/{api → cli}/tests/data/gmd_mean_htcondor.yaml +0 -0
/junifer/{api → cli}/tests/data/partly_cloudy_agg_mean_tian.yml +0 -0
/junifer/data/{VOIs → coordinates/VOIs}/meta/AutobiographicalMemory_VOIs.txt +0 -0
/junifer/data/{VOIs → coordinates/VOIs}/meta/CogAC_VOIs.txt +0 -0
/junifer/data/{VOIs → coordinates/VOIs}/meta/CogAR_VOIs.txt +0 -0
/junifer/data/{VOIs → coordinates/VOIs}/meta/DMNBuckner_VOIs.txt +0 -0
/junifer/data/{VOIs → coordinates/VOIs}/meta/Dosenbach2010_MNI_VOIs.txt +0 -0
/junifer/data/{VOIs → coordinates/VOIs}/meta/Empathy_VOIs.txt +0 -0
/junifer/data/{VOIs → coordinates/VOIs}/meta/Motor_VOIs.txt +0 -0
/junifer/data/{VOIs → coordinates/VOIs}/meta/MultiTask_VOIs.txt +0 -0
/junifer/data/{VOIs → coordinates/VOIs}/meta/PhysioStress_VOIs.txt +0 -0
/junifer/data/{VOIs → coordinates/VOIs}/meta/Power2011_MNI_VOIs.txt +0 -0
/junifer/data/{VOIs → coordinates/VOIs}/meta/Power2013_MNI_VOIs.tsv +0 -0
/junifer/data/{VOIs → coordinates/VOIs}/meta/Rew_VOIs.txt +0 -0
/junifer/data/{VOIs → coordinates/VOIs}/meta/Somatosensory_VOIs.txt +0 -0
/junifer/data/{VOIs → coordinates/VOIs}/meta/ToM_VOIs.txt +0 -0
/junifer/data/{VOIs → coordinates/VOIs}/meta/VigAtt_VOIs.txt +0 -0
/junifer/data/{VOIs → coordinates/VOIs}/meta/WM_VOIs.txt +0 -0
/junifer/data/{VOIs → coordinates/VOIs}/meta/eMDN_VOIs.txt +0 -0
/junifer/data/{VOIs → coordinates/VOIs}/meta/eSAD_VOIs.txt +0 -0
/junifer/data/{VOIs → coordinates/VOIs}/meta/extDMN_VOIs.txt +0 -0
{junifer-0.0.5.dev240.dist-info → junifer-0.0.6.dist-info/licenses}/AUTHORS.rst +0 -0
{junifer-0.0.5.dev240.dist-info → junifer-0.0.6.dist-info/licenses}/LICENSE.md +0 -0
{junifer-0.0.5.dev240.dist-info → junifer-0.0.6.dist-info}/top_level.txt +0 -0

junifer/datagrabber/pattern_validation_mixin.py CHANGED Viewed

@@ -3,8 +3,8 @@
 # Authors: Synchon Mandal <s.mandal@fz-juelich.de>
 # License: AGPL
-from typing import Dict, List
+from ..typing import DataGrabberPatterns
 from ..utils import logger, raise_error, warn_with_log
@@ -33,10 +33,12 @@ PATTERNS_SCHEMA = {
                 "mandatory": ["pattern", "format"],
                 "optional": ["mappings"],
             },
+            "reference": {"mandatory": ["pattern"], "optional": []},
+            "prewarp_space": {"mandatory": [], "optional": []},
         },
     },
     "Warp": {
-        "mandatory": ["pattern", "src", "dst"],
+        "mandatory": ["pattern", "src", "dst", "warper"],
         "optional": {},
     },
     "VBM_GM": {
@@ -72,7 +74,7 @@ PATTERNS_SCHEMA = {
 class PatternValidationMixin:
     """Mixin class for pattern validation."""
-    def _validate_types(self, types: List[str]) -> None:
+    def _validate_types(self, types: list[str]) -> None:
         """Validate the types.
         Parameters
@@ -95,8 +97,8 @@ class PatternValidationMixin:
     def _validate_replacements(
         self,
-        replacements: List[str],
-        patterns: Dict[str, Dict[str, str]],
+        replacements: list[str],
+        patterns: DataGrabberPatterns,
         partial_pattern_ok: bool,
     ) -> None:
         """Validate the replacements.
@@ -132,45 +134,57 @@ class PatternValidationMixin:
         if any(not isinstance(x, str) for x in replacements):
             raise_error(
-                msg="`replacements` must be a list of strings.",
+                msg="`replacements` must be a list of strings",
                 klass=TypeError,
             )
+        # Make a list of all patterns recursively
+        all_patterns = []
+        for dtype_val in patterns.values():
+            # Conditional for list dtype vals like Warp
+            if isinstance(dtype_val, list):
+                for entry in dtype_val:
+                    all_patterns.append(entry.get("pattern", ""))
+            else:
+                all_patterns.append(dtype_val.get("pattern", ""))
+        # Check for stray replacements
         for x in replacements:
-            if all(
-                x not in y
-                for y in [
-                    data_type_val.get("pattern", "")
-                    for data_type_val in patterns.values()
-                ]
-            ):
+            if all(x not in y for y in all_patterns):
                 if partial_pattern_ok:
                     warn_with_log(
                         f"Replacement: `{x}` is not part of any pattern, "
                         "things might not work as expected if you are unsure "
-                        "of what you are doing"
+                        "of what you are doing."
                     )
                 else:
                     raise_error(
-                        msg=f"Replacement: {x} is not part of any pattern."
+                        msg=f"Replacement: `{x}` is not part of any pattern"
                     )
         # Check that at least one pattern has all the replacements
         at_least_one = False
-        for data_type_val in patterns.values():
-            if all(
-                x in data_type_val.get("pattern", "") for x in replacements
-            ):
-                at_least_one = True
+        for dtype_val in patterns.values():
+            # Conditional for list dtype vals like Warp
+            if isinstance(dtype_val, list):
+                for entry in dtype_val:
+                    if all(
+                        x in entry.get("pattern", "") for x in replacements
+                    ):
+                        at_least_one = True
+            else:
+                if all(
+                    x in dtype_val.get("pattern", "") for x in replacements
+                ):
+                    at_least_one = True
         if not at_least_one and not partial_pattern_ok:
             raise_error(
-                msg="At least one pattern must contain all replacements."
+                msg="At least one pattern must contain all replacements"
             )
     def _validate_mandatory_keys(
         self,
-        keys: List[str],
-        schema: List[str],
+        keys: list[str],
+        schema: list[str],
         data_type: str,
         partial_pattern_ok: bool = False,
     ) -> None:
@@ -207,7 +221,7 @@ class PatternValidationMixin:
                     warn_with_log(
                         f"Mandatory key: `{key}` not found for {data_type}, "
                         "things might not work as expected if you are unsure "
-                        "of what you are doing"
+                        "of what you are doing."
                     )
                 else:
                     raise_error(
@@ -215,10 +229,10 @@ class PatternValidationMixin:
                         klass=KeyError,
                     )
             else:
-                logger.debug(f"Mandatory key: `{key}` found for {data_type}")
+                logger.debug(f"Mandatory key: `{key}` found for {data_type}.")
     def _identify_stray_keys(
-        self, keys: List[str], schema: List[str], data_type: str
+        self, keys: list[str], schema: list[str], data_type: str
     ) -> None:
         """Identify stray keys.
@@ -249,9 +263,9 @@ class PatternValidationMixin:
     def validate_patterns(
         self,
-        types: List[str],
-        replacements: List[str],
-        patterns: Dict[str, Dict[str, str]],
+        types: list[str],
+        replacements: list[str],
+        patterns: DataGrabberPatterns,
         partial_pattern_ok: bool = False,
     ) -> None:
         """Validate the patterns.
@@ -298,87 +312,185 @@ class PatternValidationMixin:
                 msg="`patterns` must contain all `types`", klass=ValueError
             )
         # Check against schema
-        for data_type_key, data_type_val in patterns.items():
+        for dtype_key, dtype_val in patterns.items():
             # Check if valid data type is provided
-            if data_type_key not in PATTERNS_SCHEMA:
+            if dtype_key not in PATTERNS_SCHEMA:
                 raise_error(
-                    f"Unknown data type: {data_type_key}, "
+                    f"Unknown data type: {dtype_key}, "
                     f"should be one of: {list(PATTERNS_SCHEMA.keys())}"
                 )
-            # Check mandatory keys for data type
-            self._validate_mandatory_keys(
-                keys=list(data_type_val),
-                schema=PATTERNS_SCHEMA[data_type_key]["mandatory"],
-                data_type=data_type_key,
-                partial_pattern_ok=partial_pattern_ok,
-            )
-            # Check optional keys for data type
-            for optional_key, optional_val in PATTERNS_SCHEMA[data_type_key][
-                "optional"
-            ].items():
-                if optional_key not in data_type_val:
-                    logger.debug(
-                        f"Optional key: `{optional_key}` missing for "
-                        f"{data_type_key}"
-                    )
-                else:
-                    logger.debug(
-                        f"Optional key: `{optional_key}` found for "
-                        f"{data_type_key}"
-                    )
-                    # Set nested type name for easier access
-                    nested_data_type = f"{data_type_key}.{optional_key}"
-                    nested_mandatory_keys_schema = PATTERNS_SCHEMA[
-                        data_type_key
-                    ]["optional"][optional_key]["mandatory"]
-                    nested_optional_keys_schema = PATTERNS_SCHEMA[
-                        data_type_key
-                    ]["optional"][optional_key]["optional"]
-                    # Check mandatory keys for nested type
+            # Conditional for list dtype vals like Warp
+            if isinstance(dtype_val, list):
+                for idx, entry in enumerate(dtype_val):
+                    # Check mandatory keys for data type
                     self._validate_mandatory_keys(
-                        keys=list(optional_val["mandatory"]),
-                        schema=nested_mandatory_keys_schema,
-                        data_type=nested_data_type,
+                        keys=list(entry),
+                        schema=PATTERNS_SCHEMA[dtype_key]["mandatory"],
+                        data_type=f"{dtype_key}.{idx}",
                         partial_pattern_ok=partial_pattern_ok,
                     )
-                    # Check optional keys for nested type
-                    for nested_optional_key in nested_optional_keys_schema:
-                        if nested_optional_key not in optional_val["optional"]:
+                    # Check optional keys for data type
+                    for optional_key, optional_val in PATTERNS_SCHEMA[
+                        dtype_key
+                    ]["optional"].items():
+                        if optional_key not in entry:
                             logger.debug(
-                                f"Optional key: `{nested_optional_key}` "
-                                f"missing for {nested_data_type}"
+                                f"Optional key: `{optional_key}` missing for "
+                                f"{dtype_key}.{idx}"
                             )
                         else:
                             logger.debug(
-                                f"Optional key: `{nested_optional_key}` found "
-                                f"for {nested_data_type}"
+                                f"Optional key: `{optional_key}` found for "
+                                f"{dtype_key}.{idx}"
+                            )
+                            # Set nested type name for easier access
+                            nested_dtype = f"{dtype_key}.{idx}.{optional_key}"
+                            nested_mandatory_keys_schema = PATTERNS_SCHEMA[
+                                dtype_key
+                            ]["optional"][optional_key]["mandatory"]
+                            nested_optional_keys_schema = PATTERNS_SCHEMA[
+                                dtype_key
+                            ]["optional"][optional_key]["optional"]
+                            # Check mandatory keys for nested type
+                            self._validate_mandatory_keys(
+                                keys=list(optional_val["mandatory"]),
+                                schema=nested_mandatory_keys_schema,
+                                data_type=nested_dtype,
+                                partial_pattern_ok=partial_pattern_ok,
+                            )
+                            # Check optional keys for nested type
+                            for (
+                                nested_optional_key
+                            ) in nested_optional_keys_schema:
+                                if (
+                                    nested_optional_key
+                                    not in optional_val["optional"]
+                                ):
+                                    logger.debug(
+                                        f"Optional key: "
+                                        f"`{nested_optional_key}` missing for "
+                                        f"{nested_dtype}"
+                                    )
+                                else:
+                                    logger.debug(
+                                        f"Optional key: "
+                                        f"`{nested_optional_key}` found for "
+                                        f"{nested_dtype}"
+                                    )
+                            # Check stray key for nested data type
+                            self._identify_stray_keys(
+                                keys=(
+                                    optional_val["mandatory"]
+                                    + optional_val["optional"]
+                                ),
+                                schema=(
+                                    nested_mandatory_keys_schema
+                                    + nested_optional_keys_schema
+                                ),
+                                data_type=nested_dtype,
                             )
-                    # Check stray key for nested data type
+                    # Check stray key for data type
                     self._identify_stray_keys(
-                        keys=optional_val["mandatory"]
-                        + optional_val["optional"],
-                        schema=nested_mandatory_keys_schema
-                        + nested_optional_keys_schema,
-                        data_type=nested_data_type,
+                        keys=list(entry.keys()),
+                        schema=(
+                            PATTERNS_SCHEMA[dtype_key]["mandatory"]
+                            + list(
+                                PATTERNS_SCHEMA[dtype_key]["optional"].keys()
+                            )
+                        ),
+                        data_type=dtype_key,
                     )
-            # Check stray key for data type
-            self._identify_stray_keys(
-                keys=list(data_type_val.keys()),
-                schema=(
-                    PATTERNS_SCHEMA[data_type_key]["mandatory"]
-                    + list(PATTERNS_SCHEMA[data_type_key]["optional"].keys())
-                ),
-                data_type=data_type_key,
-            )
-            # Wildcard check in patterns
-            if "}*" in data_type_val.get("pattern", ""):
-                raise_error(
-                    msg=(
-                        f"`{data_type_key}.pattern` must not contain `*` "
-                        "following a replacement"
+                    # Wildcard check in patterns
+                    if "}*" in entry.get("pattern", ""):
+                        raise_error(
+                            msg=(
+                                f"`{dtype_key}.pattern` must not contain `*` "
+                                "following a replacement"
+                            ),
+                            klass=ValueError,
+                        )
+            else:
+                # Check mandatory keys for data type
+                self._validate_mandatory_keys(
+                    keys=list(dtype_val),
+                    schema=PATTERNS_SCHEMA[dtype_key]["mandatory"],
+                    data_type=dtype_key,
+                    partial_pattern_ok=partial_pattern_ok,
+                )
+                # Check optional keys for data type
+                for optional_key, optional_val in PATTERNS_SCHEMA[dtype_key][
+                    "optional"
+                ].items():
+                    if optional_key not in dtype_val:
+                        logger.debug(
+                            f"Optional key: `{optional_key}` missing for "
+                            f"{dtype_key}."
+                        )
+                    else:
+                        logger.debug(
+                            f"Optional key: `{optional_key}` found for "
+                            f"{dtype_key}."
+                        )
+                        # Set nested type name for easier access
+                        nested_dtype = f"{dtype_key}.{optional_key}"
+                        nested_mandatory_keys_schema = PATTERNS_SCHEMA[
+                            dtype_key
+                        ]["optional"][optional_key]["mandatory"]
+                        nested_optional_keys_schema = PATTERNS_SCHEMA[
+                            dtype_key
+                        ]["optional"][optional_key]["optional"]
+                        # Check mandatory keys for nested type
+                        self._validate_mandatory_keys(
+                            keys=list(optional_val["mandatory"]),
+                            schema=nested_mandatory_keys_schema,
+                            data_type=nested_dtype,
+                            partial_pattern_ok=partial_pattern_ok,
+                        )
+                        # Check optional keys for nested type
+                        for nested_optional_key in nested_optional_keys_schema:
+                            if (
+                                nested_optional_key
+                                not in optional_val["optional"]
+                            ):
+                                logger.debug(
+                                    f"Optional key: `{nested_optional_key}` "
+                                    f"missing for {nested_dtype}"
+                                )
+                            else:
+                                logger.debug(
+                                    f"Optional key: `{nested_optional_key}` "
+                                    f"found for {nested_dtype}"
+                                )
+                        # Check stray key for nested data type
+                        self._identify_stray_keys(
+                            keys=(
+                                optional_val["mandatory"]
+                                + optional_val["optional"]
+                            ),
+                            schema=(
+                                nested_mandatory_keys_schema
+                                + nested_optional_keys_schema
+                            ),
+                            data_type=nested_dtype,
+                        )
+                # Check stray key for data type
+                self._identify_stray_keys(
+                    keys=list(dtype_val.keys()),
+                    schema=(
+                        PATTERNS_SCHEMA[dtype_key]["mandatory"]
+                        + list(PATTERNS_SCHEMA[dtype_key]["optional"].keys())
                     ),
-                    klass=ValueError,
+                    data_type=dtype_key,
                 )
+                # Wildcard check in patterns
+                if "}*" in dtype_val.get("pattern", ""):
+                    raise_error(
+                        msg=(
+                            f"`{dtype_key}.pattern` must not contain `*` "
+                            "following a replacement"
+                        ),
+                        klass=ValueError,
+                    )
         # Validate replacements
         self._validate_replacements(

junifer/datagrabber/py.typed ADDED Viewed

File without changes

junifer/datagrabber/tests/test_datalad_base.py CHANGED Viewed

@@ -3,20 +3,21 @@
 # Authors: Synchon Mandal <s.mandal@fz-juelich.de>
 # License: AGPL
+import warnings
 from pathlib import Path
-from typing import Type
 import datalad.api as dl
 import pytest
 from junifer.datagrabber import DataladDataGrabber
+from junifer.utils import config
 _testing_dataset = {
     "example_bids": {
         "uri": "https://gin.g-node.org/juaml/datalad-example-bids",
-        "commit": "b87897cbe51bf0ee5514becaa5c7dd76491db5ad",
-        "id": "8fddff30-6993-420a-9d1e-b5b028c59468",
+        "commit": "3f288c8725207ae0c9b3616e093e78cda192b570",
+        "id": "582b9696-f13f-42e4-9587-b4e62aa2a8e7",
     },
     "example_bids_ses": {
         "uri": "https://gin.g-node.org/juaml/datalad-example-bids-ses",
@@ -27,7 +28,7 @@ _testing_dataset = {
 @pytest.fixture
-def concrete_datagrabber() -> Type[DataladDataGrabber]:
+def concrete_datagrabber() -> type[DataladDataGrabber]:
     """Return a concrete datalad-based DataGrabber.
     Returns
@@ -69,7 +70,7 @@ def concrete_datagrabber() -> Type[DataladDataGrabber]:
 def test_DataladDataGrabber_install_errors(
-    tmp_path: Path, concrete_datagrabber: Type
+    tmp_path: Path, concrete_datagrabber: type
 ) -> None:
     """Test DataladDataGrabber install errors / warnings.
@@ -95,6 +96,12 @@ def test_DataladDataGrabber_install_errors(
     with pytest.raises(ValueError, match=r"different ID"):
         with dg:
             pass
+    # Set config to skip id check and test
+    config.set(key="datagrabber.skipidcheck", val=True)
+    with dg:
+        pass
+    # Reset config
+    config.delete("datagrabber.skipidcheck")
     elem1_t1w = datadir / "example_bids/sub-01/anat/sub-01_T1w.nii.gz"
     elem1_t1w.unlink()
@@ -105,10 +112,18 @@ def test_DataladDataGrabber_install_errors(
     with pytest.warns(RuntimeWarning, match=r"one file is not clean"):
         with dg:
             pass
+    # Set config to skip dirty check and test
+    with warnings.catch_warnings():
+        warnings.simplefilter("error")
+        config.set(key="datagrabber.skipdirtycheck", val=True)
+        with dg:
+            pass
+        # Reset config
+        config.delete("datagrabber.skipdirtycheck")
 def test_DataladDataGrabber_clone_cleanup(
-    tmp_path: Path, concrete_datagrabber: Type
+    tmp_path: Path, concrete_datagrabber: type
 ) -> None:
     """Test DataladDataGrabber clone and remove.
@@ -157,7 +172,7 @@ def test_DataladDataGrabber_clone_cleanup(
 def test_DataladDataGrabber_clone_create_cleanup(
-    concrete_datagrabber: Type,
+    concrete_datagrabber: type,
 ) -> None:
     """Test DataladDataGrabber tempdir clone and remove.
@@ -203,7 +218,7 @@ def test_DataladDataGrabber_clone_create_cleanup(
 def test_DataladDataGrabber_previously_cloned(
-    tmp_path: Path, concrete_datagrabber: Type
+    tmp_path: Path, concrete_datagrabber: type
 ) -> None:
     """Test DataladDataGrabber on cloned dataset.
@@ -247,7 +262,7 @@ def test_DataladDataGrabber_previously_cloned(
         meta = elem1["BOLD"]["meta"]
         assert "datagrabber" in meta
         assert "datalad_dirty" in meta["datagrabber"]
-        assert meta["datagrabber"]["datalad_dirty"] is False
+        assert meta["datagrabber"]["datalad_dirty"] is True
         assert "datalad_commit_id" in meta["datagrabber"]
         assert meta["datagrabber"]["datalad_commit_id"] == commit
         assert "datalad_id" in meta["datagrabber"]
@@ -272,7 +287,7 @@ def test_DataladDataGrabber_previously_cloned(
 def test_DataladDataGrabber_previously_cloned_and_get(
-    tmp_path: Path, concrete_datagrabber: Type
+    tmp_path: Path, concrete_datagrabber: type
 ) -> None:
     """Test DataladDataGrabber on cloned dataset with files present.
@@ -327,7 +342,7 @@ def test_DataladDataGrabber_previously_cloned_and_get(
         meta = elem1["BOLD"]["meta"]
         assert "datagrabber" in meta
         assert "datalad_dirty" in meta["datagrabber"]
-        assert meta["datagrabber"]["datalad_dirty"] is False
+        assert meta["datagrabber"]["datalad_dirty"] is True
         assert "datalad_commit_id" in meta["datagrabber"]
         assert meta["datagrabber"]["datalad_commit_id"] == commit
         assert "datalad_id" in meta["datagrabber"]
@@ -355,7 +370,7 @@ def test_DataladDataGrabber_previously_cloned_and_get(
 def test_DataladDataGrabber_previously_cloned_and_get_dirty(
-    tmp_path: Path, concrete_datagrabber: Type
+    tmp_path: Path, concrete_datagrabber: type
 ) -> None:
     """Test DataladDataGrabber on a dirty cloned dataset.

junifer/datagrabber/tests/test_dmcc13_benchmark.py CHANGED Viewed

@@ -3,7 +3,7 @@
 # Authors: Synchon Mandal <s.mandal@fz-juelich.de>
 # License: AGPL
-from typing import List, Optional, Union
+from typing import Optional, Union
 import pytest
@@ -116,7 +116,12 @@ def test_DMCC13Benchmark(
             data_file_names.extend(
                 [
                     "sub-01_desc-preproc_T1w.nii.gz",
-                    "sub-01_from-MNI152NLin2009cAsym_to-T1w_mode-image_xfm.h5",
+                    [
+                        "sub-01_from-MNI152NLin2009cAsym_to-T1w"
+                        "_mode-image_xfm.h5",
+                        "sub-01_from-T1w_to-MNI152NLin2009cAsym"
+                        "_mode-image_xfm.h5",
+                    ],
                 ]
             )
         else:
@@ -127,14 +132,26 @@ def test_DMCC13Benchmark(
         for data_type, data_file_name in zip(data_types, data_file_names):
             # Assert data type
             assert data_type in out
-            # Assert data file path exists
-            assert out[data_type]["path"].exists()
-            # Assert data file path is a file
-            assert out[data_type]["path"].is_file()
-            # Assert data file name
-            assert out[data_type]["path"].name == data_file_name
-            # Assert metadata
-            assert "meta" in out[data_type]
+            # Conditional for Warp
+            if data_type == "Warp":
+                for idx, fname in enumerate(data_file_name):
+                    # Assert data file path exists
+                    assert out[data_type][idx]["path"].exists()
+                    # Assert data file path is a file
+                    assert out[data_type][idx]["path"].is_file()
+                    # Assert data file name
+                    assert out[data_type][idx]["path"].name == fname
+                    # Assert metadata
+                    assert "meta" in out[data_type][idx]
+            else:
+                # Assert data file path exists
+                assert out[data_type]["path"].exists()
+                # Assert data file path is a file
+                assert out[data_type]["path"].is_file()
+                # Assert data file name
+                assert out[data_type]["path"].name == data_file_name
+                # Assert metadata
+                assert "meta" in out[data_type]
         # Check BOLD nested data types
         for type_, file_name in zip(
@@ -201,7 +218,7 @@ def test_DMCC13Benchmark(
     ],
 )
 def test_DMCC13Benchmark_partial_data_access(
-    types: Union[str, List[str]],
+    types: Union[str, list[str]],
     native_t1w: bool,
 ) -> None:
     """Test DMCC13Benchmark DataGrabber partial data access.

junifer 0.0.5.dev240__py3-none-any.whl → 0.0.6__py3-none-any.whl

junifer 0.0.5.dev240__py3-none-any.whl → 0.0.6__py3-none-any.whl