junifer 0.0.6.dev277__py3-none-any.whl → 0.0.6.dev285__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
junifer/_version.py CHANGED
@@ -12,5 +12,5 @@ __version__: str
12
12
  __version_tuple__: VERSION_TUPLE
13
13
  version_tuple: VERSION_TUPLE
14
14
 
15
- __version__ = version = '0.0.6.dev277'
16
- __version_tuple__ = version_tuple = (0, 0, 6, 'dev277')
15
+ __version__ = version = '0.0.6.dev285'
16
+ __version_tuple__ = version_tuple = (0, 0, 6, 'dev285')
@@ -17,7 +17,7 @@ from datalad.support.exceptions import IncompleteResultsError
17
17
  from datalad.support.gitrepo import GitRepo
18
18
 
19
19
  from ..pipeline import WorkDirManager
20
- from ..utils import logger, raise_error, warn_with_log
20
+ from ..utils import config, logger, raise_error, warn_with_log
21
21
  from .base import BaseDataGrabber
22
22
 
23
23
 
@@ -143,27 +143,49 @@ class DataladDataGrabber(BaseDataGrabber):
143
143
  """
144
144
  return super().datadir / self._rootdir
145
145
 
146
- def _get_dataset_id_remote(self) -> str:
146
+ def _get_dataset_id_remote(self) -> tuple[str, bool]:
147
147
  """Get the dataset ID from the remote.
148
148
 
149
149
  Returns
150
150
  -------
151
151
  str
152
152
  The dataset ID.
153
+ bool
154
+ Whether the dataset is dirty.
155
+
156
+ Raises
157
+ ------
158
+ ValueError
159
+ If the dataset ID cannot be obtained from the remote.
153
160
 
154
161
  """
155
162
  remote_id = None
163
+ is_dirty = False
156
164
  with tempfile.TemporaryDirectory() as tmpdir:
157
- logger.debug(f"Querying {self.uri} for dataset ID")
158
- repo = GitRepo.clone(
159
- self.uri, path=tmpdir, clone_options=["-n", "--depth=1"]
165
+ if not config.get("datagrabber.skipidcheck", False):
166
+ logger.debug(f"Querying {self.uri} for dataset ID")
167
+ repo = GitRepo.clone(
168
+ self.uri, path=tmpdir, clone_options=["-n", "--depth=1"]
169
+ )
170
+ repo.checkout(name=".datalad/config", options=["HEAD"])
171
+ remote_id = repo.config.get("datalad.dataset.id", None)
172
+ logger.debug(f"Got remote dataset ID = {remote_id}")
173
+
174
+ if not config.get("datagrabber.skipdirtycheck", False):
175
+ is_dirty = repo.dirty
176
+ else:
177
+ logger.debug("Skipping dirty check")
178
+ is_dirty = False
179
+ else:
180
+ logger.debug("Skipping dataset ID check")
181
+ remote_id = self._dataset.id
182
+ is_dirty = False
183
+ logger.debug(
184
+ f"Remote dataset is {'' if is_dirty else 'not'} dirty"
160
185
  )
161
- repo.checkout(name=".datalad/config", options=["HEAD"])
162
- remote_id = repo.config.get("datalad.dataset.id", None)
163
- logger.debug(f"Got remote dataset ID = {remote_id}")
164
186
  if remote_id is None:
165
187
  raise_error("Could not get dataset ID from remote")
166
- return remote_id
188
+ return remote_id, is_dirty
167
189
 
168
190
  def _dataset_get(self, out: dict) -> dict:
169
191
  """Get the dataset found from the path in ``out``.
@@ -178,6 +200,11 @@ class DataladDataGrabber(BaseDataGrabber):
178
200
  dict
179
201
  The unmodified input dictionary.
180
202
 
203
+ Raises
204
+ ------
205
+ datalad.support.exceptions.IncompleteResultsError
206
+ If there is a datalad-related problem while fetching data.
207
+
181
208
  """
182
209
  to_get = []
183
210
  for type_val in out.values():
@@ -230,6 +257,8 @@ class DataladDataGrabber(BaseDataGrabber):
230
257
  ------
231
258
  ValueError
232
259
  If the dataset is already installed but with a different ID.
260
+ datalad.support.exceptions.IncompleteResultsError
261
+ If there is a datalad-related problem while cloning dataset.
233
262
 
234
263
  """
235
264
  isinstalled = dl.Dataset(self._datadir).is_installed()
@@ -238,23 +267,23 @@ class DataladDataGrabber(BaseDataGrabber):
238
267
  self._got_files = []
239
268
  self._dataset: dl.Dataset = dl.Dataset(self._datadir)
240
269
 
241
- remote_id = self._get_dataset_id_remote()
270
+ # Check if dataset is already installed with a different ID
271
+ remote_id, is_dirty = self._get_dataset_id_remote()
242
272
  if remote_id != self._dataset.id:
243
273
  raise_error(
244
274
  "Dataset already installed but with a different "
245
275
  f"ID: {self._dataset.id} (local) != {remote_id} (remote)"
246
276
  )
247
277
 
248
- # Check for dirty datasets:
249
- status = self._dataset.status()
250
- if any(x["state"] != "clean" for x in status):
251
- self.datalad_dirty = True
278
+ # Conditional reporting on dataset dirtiness
279
+ self.datalad_dirty = is_dirty
280
+ if self.datalad_dirty:
252
281
  warn_with_log(
253
- "At least one file is not clean, Junifer will "
254
- "consider this dataset as dirty."
282
+ "At least one file is not clean, "
283
+ f"marking dataset (id: {self._dataset.id}) as dirty."
255
284
  )
256
285
  else:
257
- logger.debug("Dataset is clean")
286
+ logger.debug(f"Dataset (id: {self._dataset.id}) is clean")
258
287
 
259
288
  else:
260
289
  logger.debug(f"Installing dataset {self.uri} to {self._datadir}")
@@ -3,12 +3,14 @@
3
3
  # Authors: Synchon Mandal <s.mandal@fz-juelich.de>
4
4
  # License: AGPL
5
5
 
6
+ import warnings
6
7
  from pathlib import Path
7
8
 
8
9
  import datalad.api as dl
9
10
  import pytest
10
11
 
11
12
  from junifer.datagrabber import DataladDataGrabber
13
+ from junifer.utils import config
12
14
 
13
15
 
14
16
  _testing_dataset = {
@@ -94,6 +96,12 @@ def test_DataladDataGrabber_install_errors(
94
96
  with pytest.raises(ValueError, match=r"different ID"):
95
97
  with dg:
96
98
  pass
99
+ # Set config to skip id check and test
100
+ config.set(key="datagrabber.skipidcheck", val=True)
101
+ with dg:
102
+ pass
103
+ # Reset config
104
+ config.delete("datagrabber.skipidcheck")
97
105
 
98
106
  elem1_t1w = datadir / "example_bids/sub-01/anat/sub-01_T1w.nii.gz"
99
107
  elem1_t1w.unlink()
@@ -104,6 +112,14 @@ def test_DataladDataGrabber_install_errors(
104
112
  with pytest.warns(RuntimeWarning, match=r"one file is not clean"):
105
113
  with dg:
106
114
  pass
115
+ # Set config to skip dirty check and test
116
+ with warnings.catch_warnings():
117
+ warnings.simplefilter("error")
118
+ config.set(key="datagrabber.skipdirtycheck", val=True)
119
+ with dg:
120
+ pass
121
+ # Reset config
122
+ config.delete("datagrabber.skipdirtycheck")
107
123
 
108
124
 
109
125
  def test_DataladDataGrabber_clone_cleanup(
@@ -246,7 +262,7 @@ def test_DataladDataGrabber_previously_cloned(
246
262
  meta = elem1["BOLD"]["meta"]
247
263
  assert "datagrabber" in meta
248
264
  assert "datalad_dirty" in meta["datagrabber"]
249
- assert meta["datagrabber"]["datalad_dirty"] is False
265
+ assert meta["datagrabber"]["datalad_dirty"] is True
250
266
  assert "datalad_commit_id" in meta["datagrabber"]
251
267
  assert meta["datagrabber"]["datalad_commit_id"] == commit
252
268
  assert "datalad_id" in meta["datagrabber"]
@@ -326,7 +342,7 @@ def test_DataladDataGrabber_previously_cloned_and_get(
326
342
  meta = elem1["BOLD"]["meta"]
327
343
  assert "datagrabber" in meta
328
344
  assert "datalad_dirty" in meta["datagrabber"]
329
- assert meta["datagrabber"]["datalad_dirty"] is False
345
+ assert meta["datagrabber"]["datalad_dirty"] is True
330
346
  assert "datalad_commit_id" in meta["datagrabber"]
331
347
  assert meta["datagrabber"]["datalad_commit_id"] == commit
332
348
  assert "datalad_id" in meta["datagrabber"]
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: junifer
3
- Version: 0.0.6.dev277
3
+ Version: 0.0.6.dev285
4
4
  Summary: JUelich NeuroImaging FEature extractoR
5
5
  Author-email: Fede Raimondo <f.raimondo@fz-juelich.de>, Synchon Mandal <s.mandal@fz-juelich.de>
6
6
  Maintainer-email: Fede Raimondo <f.raimondo@fz-juelich.de>, Synchon Mandal <s.mandal@fz-juelich.de>
@@ -1,6 +1,6 @@
1
1
  junifer/__init__.py,sha256=2McgH1yNue6Z1V26-uN_mfMjbTcx4CLhym-DMBl5xA4,266
2
2
  junifer/__init__.pyi,sha256=SsTvgq2Dod6UqJN96GH1lCphH6hJQQurEJHGNhHjGUI,508
3
- junifer/_version.py,sha256=oxdSo7e4dHuWGJ6fcFCd_o22QGOenmAuWxLqOvENYXw,428
3
+ junifer/_version.py,sha256=VOqNBo1Uj5NzgtOfO88V2py3fLW1gPgO44Cm-fu8TeY,428
4
4
  junifer/conftest.py,sha256=PWYkkRDU8ly2lYwv7VBKMHje4et6HX7Yey3Md_I2KbA,613
5
5
  junifer/py.typed,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
6
6
  junifer/stats.py,sha256=e9aaagMGtgpRfW3Wdpz9ocpnYld1IWylCDcjFUgX9Mk,6225
@@ -123,7 +123,7 @@ junifer/data/tests/test_template_spaces.py,sha256=PJulN7xHpAcSOTY-UzTG_WPywZEBSl
123
123
  junifer/datagrabber/__init__.py,sha256=EHIK-lbjuvkt0V8ypFvLSt85OAAXSkaxBmVlCbNNz8M,323
124
124
  junifer/datagrabber/__init__.pyi,sha256=zOQE4TaCKXBTHnNqgmECtsszWIOHYiQ1CUEeXXFU9F4,832
125
125
  junifer/datagrabber/base.py,sha256=a3_fUZIN5Bqhq2f4ldpwk_eWeSVRDpDmx2QGIKzCtkg,6761
126
- junifer/datagrabber/datalad_base.py,sha256=2g-e_pLG0Legx4BvisrnGWYi1NCTyOkCi09QxbKX18M,11415
126
+ junifer/datagrabber/datalad_base.py,sha256=v_qGP66zk1-a-nU_u4qoSRNWYuh8YBdjhKkvzISgJWM,12586
127
127
  junifer/datagrabber/dmcc13_benchmark.py,sha256=VMyiwvkr4qSvzBICSksPPKOI2w_WVo06H89Url-hrNs,12819
128
128
  junifer/datagrabber/multiple.py,sha256=4tCOzojs3hoG7daHJJ7HUsx15atWR5nTmyP0S0__aig,6666
129
129
  junifer/datagrabber/pattern.py,sha256=UwJQ0MObBIS6eHH9FfoM_sBYuNM9n5NAX7DA0HdtL1A,18709
@@ -146,7 +146,7 @@ junifer/datagrabber/hcp1200/hcp1200.py,sha256=L_JTY0RYQ_Wst2La5EaGVDbya7IfSkTVkK
146
146
  junifer/datagrabber/hcp1200/py.typed,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
147
147
  junifer/datagrabber/hcp1200/tests/test_hcp1200.py,sha256=HeXlD6wjvDq0EyqlB_nPqfXSIhAzALYAYjSCAjNOGGg,10972
148
148
  junifer/datagrabber/tests/test_base.py,sha256=fZdVhNhvfht9lpTHrAUf5E6mAfNNUP7OTQ5KLaBQ1gI,3506
149
- junifer/datagrabber/tests/test_datalad_base.py,sha256=5QSgsloHROVjp0g1UxXlk-Zmk-vHsLHGn05DJmmNkTI,16261
149
+ junifer/datagrabber/tests/test_datalad_base.py,sha256=nPF_N2Q09tgPmd5TD0dI9KU8G8HHLmydFa3agamijI8,16790
150
150
  junifer/datagrabber/tests/test_dmcc13_benchmark.py,sha256=QSdYAAwAj1DoE1oLhoraIc4lAgUgIaJyrtcOs_witzM,9914
151
151
  junifer/datagrabber/tests/test_multiple.py,sha256=tZBQhlEiSE1PeQ5E3TtuVgsHENquna9t39p54AJ-O5w,9963
152
152
  junifer/datagrabber/tests/test_pattern.py,sha256=H55jYRPfT3rMsoIQOAnWJgw3nGrkU7m2xFa3-ed6NQE,9527
@@ -341,10 +341,10 @@ junifer/utils/tests/test_config.py,sha256=7ltIXuwb_W4Mv_1dxQWyiyM10XgUAfsWKV6D_i
341
341
  junifer/utils/tests/test_fs.py,sha256=WQS7cKlKEZ742CIuiOYYpueeAhY9PqlastfDVpVVtvE,923
342
342
  junifer/utils/tests/test_helpers.py,sha256=k5qqfxK8dFyuewTJyR1Qn6-nFaYNuVr0ysc18bfPjyU,929
343
343
  junifer/utils/tests/test_logging.py,sha256=duO4ou365hxwa_kwihFtKPLaL6LC5XHiyhOijrrngbA,8009
344
- junifer-0.0.6.dev277.dist-info/AUTHORS.rst,sha256=rmULKpchpSol4ExWFdm-qu4fkpSZPYqIESVJBZtGb6E,163
345
- junifer-0.0.6.dev277.dist-info/LICENSE.md,sha256=MqCnOBu8uXsEOzRZWh9EBVfVz-kE9NkXcLCrtGXo2yU,34354
346
- junifer-0.0.6.dev277.dist-info/METADATA,sha256=_f6DUBkVFhbhg_l8PQXSibG-3q9WIM6EP9PBvayajuA,8429
347
- junifer-0.0.6.dev277.dist-info/WHEEL,sha256=PZUExdf71Ui_so67QXpySuHtCi3-J3wvF4ORK6k_S8U,91
348
- junifer-0.0.6.dev277.dist-info/entry_points.txt,sha256=6O8ru0BP-SP7YMUZiizFNoaZ2HvJpadO2G7nKk4PwjI,48
349
- junifer-0.0.6.dev277.dist-info/top_level.txt,sha256=4bAq1R2QFQ4b3hohjys2JBvxrl0GKk5LNFzYvz9VGcA,8
350
- junifer-0.0.6.dev277.dist-info/RECORD,,
344
+ junifer-0.0.6.dev285.dist-info/AUTHORS.rst,sha256=rmULKpchpSol4ExWFdm-qu4fkpSZPYqIESVJBZtGb6E,163
345
+ junifer-0.0.6.dev285.dist-info/LICENSE.md,sha256=MqCnOBu8uXsEOzRZWh9EBVfVz-kE9NkXcLCrtGXo2yU,34354
346
+ junifer-0.0.6.dev285.dist-info/METADATA,sha256=fplMcovyUZPFi6ONcaA66A1mhJkxK4a3948mXRfW328,8429
347
+ junifer-0.0.6.dev285.dist-info/WHEEL,sha256=PZUExdf71Ui_so67QXpySuHtCi3-J3wvF4ORK6k_S8U,91
348
+ junifer-0.0.6.dev285.dist-info/entry_points.txt,sha256=6O8ru0BP-SP7YMUZiizFNoaZ2HvJpadO2G7nKk4PwjI,48
349
+ junifer-0.0.6.dev285.dist-info/top_level.txt,sha256=4bAq1R2QFQ4b3hohjys2JBvxrl0GKk5LNFzYvz9VGcA,8
350
+ junifer-0.0.6.dev285.dist-info/RECORD,,