PyPI - junifer - Versions diffs - 0.0.3.dev186__py3-none-any.whl → 0.0.4__py3-none-any.whl - Mend

junifer 0.0.3.dev186__py3-none-any.whl → 0.0.4__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (178) hide show

junifer/_version.py +14 -2
junifer/api/cli.py +162 -17
junifer/api/functions.py +87 -419
junifer/api/parser.py +24 -0
junifer/api/queue_context/__init__.py +8 -0
junifer/api/queue_context/gnu_parallel_local_adapter.py +258 -0
junifer/api/queue_context/htcondor_adapter.py +365 -0
junifer/api/queue_context/queue_context_adapter.py +60 -0
junifer/api/queue_context/tests/test_gnu_parallel_local_adapter.py +192 -0
junifer/api/queue_context/tests/test_htcondor_adapter.py +257 -0
junifer/api/res/afni/run_afni_docker.sh +6 -6
junifer/api/res/ants/ResampleImage +3 -0
junifer/api/res/ants/antsApplyTransforms +3 -0
junifer/api/res/ants/antsApplyTransformsToPoints +3 -0
junifer/api/res/ants/run_ants_docker.sh +39 -0
junifer/api/res/fsl/applywarp +3 -0
junifer/api/res/fsl/flirt +3 -0
junifer/api/res/fsl/img2imgcoord +3 -0
junifer/api/res/fsl/run_fsl_docker.sh +39 -0
junifer/api/res/fsl/std2imgcoord +3 -0
junifer/api/res/run_conda.sh +4 -4
junifer/api/res/run_venv.sh +22 -0
junifer/api/tests/data/partly_cloudy_agg_mean_tian.yml +16 -0
junifer/api/tests/test_api_utils.py +21 -3
junifer/api/tests/test_cli.py +232 -9
junifer/api/tests/test_functions.py +211 -439
junifer/api/tests/test_parser.py +1 -1
junifer/configs/juseless/datagrabbers/aomic_id1000_vbm.py +6 -1
junifer/configs/juseless/datagrabbers/camcan_vbm.py +6 -1
junifer/configs/juseless/datagrabbers/ixi_vbm.py +6 -1
junifer/configs/juseless/datagrabbers/tests/test_ucla.py +8 -8
junifer/configs/juseless/datagrabbers/ucla.py +44 -26
junifer/configs/juseless/datagrabbers/ukb_vbm.py +6 -1
junifer/data/VOIs/meta/AutobiographicalMemory_VOIs.txt +23 -0
junifer/data/VOIs/meta/Power2013_MNI_VOIs.tsv +264 -0
junifer/data/__init__.py +4 -0
junifer/data/coordinates.py +298 -31
junifer/data/masks.py +360 -28
junifer/data/parcellations.py +621 -188
junifer/data/template_spaces.py +190 -0
junifer/data/tests/test_coordinates.py +34 -3
junifer/data/tests/test_data_utils.py +1 -0
junifer/data/tests/test_masks.py +202 -86
junifer/data/tests/test_parcellations.py +266 -55
junifer/data/tests/test_template_spaces.py +104 -0
junifer/data/utils.py +4 -2
junifer/datagrabber/__init__.py +1 -0
junifer/datagrabber/aomic/id1000.py +111 -70
junifer/datagrabber/aomic/piop1.py +116 -53
junifer/datagrabber/aomic/piop2.py +116 -53
junifer/datagrabber/aomic/tests/test_id1000.py +27 -27
junifer/datagrabber/aomic/tests/test_piop1.py +27 -27
junifer/datagrabber/aomic/tests/test_piop2.py +27 -27
junifer/datagrabber/base.py +62 -10
junifer/datagrabber/datalad_base.py +0 -2
junifer/datagrabber/dmcc13_benchmark.py +372 -0
junifer/datagrabber/hcp1200/datalad_hcp1200.py +5 -0
junifer/datagrabber/hcp1200/hcp1200.py +30 -13
junifer/datagrabber/pattern.py +133 -27
junifer/datagrabber/pattern_datalad.py +111 -13
junifer/datagrabber/tests/test_base.py +57 -6
junifer/datagrabber/tests/test_datagrabber_utils.py +204 -76
junifer/datagrabber/tests/test_datalad_base.py +0 -6
junifer/datagrabber/tests/test_dmcc13_benchmark.py +256 -0
junifer/datagrabber/tests/test_multiple.py +43 -10
junifer/datagrabber/tests/test_pattern.py +125 -178
junifer/datagrabber/tests/test_pattern_datalad.py +44 -25
junifer/datagrabber/utils.py +151 -16
junifer/datareader/default.py +36 -10
junifer/external/nilearn/junifer_nifti_spheres_masker.py +6 -0
junifer/markers/base.py +25 -16
junifer/markers/collection.py +35 -16
junifer/markers/complexity/__init__.py +27 -0
junifer/markers/complexity/complexity_base.py +149 -0
junifer/markers/complexity/hurst_exponent.py +136 -0
junifer/markers/complexity/multiscale_entropy_auc.py +140 -0
junifer/markers/complexity/perm_entropy.py +132 -0
junifer/markers/complexity/range_entropy.py +136 -0
junifer/markers/complexity/range_entropy_auc.py +145 -0
junifer/markers/complexity/sample_entropy.py +134 -0
junifer/markers/complexity/tests/test_complexity_base.py +19 -0
junifer/markers/complexity/tests/test_hurst_exponent.py +69 -0
junifer/markers/complexity/tests/test_multiscale_entropy_auc.py +68 -0
junifer/markers/complexity/tests/test_perm_entropy.py +68 -0
junifer/markers/complexity/tests/test_range_entropy.py +69 -0
junifer/markers/complexity/tests/test_range_entropy_auc.py +69 -0
junifer/markers/complexity/tests/test_sample_entropy.py +68 -0
junifer/markers/complexity/tests/test_weighted_perm_entropy.py +68 -0
junifer/markers/complexity/weighted_perm_entropy.py +133 -0
junifer/markers/falff/_afni_falff.py +153 -0
junifer/markers/falff/_junifer_falff.py +142 -0
junifer/markers/falff/falff_base.py +91 -84
junifer/markers/falff/falff_parcels.py +61 -45
junifer/markers/falff/falff_spheres.py +64 -48
junifer/markers/falff/tests/test_falff_parcels.py +89 -121
junifer/markers/falff/tests/test_falff_spheres.py +92 -127
junifer/markers/functional_connectivity/crossparcellation_functional_connectivity.py +1 -0
junifer/markers/functional_connectivity/edge_functional_connectivity_parcels.py +1 -0
junifer/markers/functional_connectivity/functional_connectivity_base.py +1 -0
junifer/markers/functional_connectivity/tests/test_crossparcellation_functional_connectivity.py +46 -44
junifer/markers/functional_connectivity/tests/test_edge_functional_connectivity_parcels.py +34 -39
junifer/markers/functional_connectivity/tests/test_edge_functional_connectivity_spheres.py +40 -52
junifer/markers/functional_connectivity/tests/test_functional_connectivity_parcels.py +62 -70
junifer/markers/functional_connectivity/tests/test_functional_connectivity_spheres.py +99 -85
junifer/markers/parcel_aggregation.py +60 -38
junifer/markers/reho/_afni_reho.py +192 -0
junifer/markers/reho/_junifer_reho.py +281 -0
junifer/markers/reho/reho_base.py +69 -34
junifer/markers/reho/reho_parcels.py +26 -16
junifer/markers/reho/reho_spheres.py +23 -9
junifer/markers/reho/tests/test_reho_parcels.py +93 -92
junifer/markers/reho/tests/test_reho_spheres.py +88 -86
junifer/markers/sphere_aggregation.py +54 -9
junifer/markers/temporal_snr/temporal_snr_base.py +1 -0
junifer/markers/temporal_snr/tests/test_temporal_snr_parcels.py +38 -37
junifer/markers/temporal_snr/tests/test_temporal_snr_spheres.py +34 -38
junifer/markers/tests/test_collection.py +43 -42
junifer/markers/tests/test_ets_rss.py +29 -37
junifer/markers/tests/test_parcel_aggregation.py +587 -468
junifer/markers/tests/test_sphere_aggregation.py +209 -157
junifer/markers/utils.py +2 -40
junifer/onthefly/read_transform.py +13 -6
junifer/pipeline/__init__.py +1 -0
junifer/pipeline/pipeline_step_mixin.py +105 -41
junifer/pipeline/registry.py +17 -0
junifer/pipeline/singleton.py +45 -0
junifer/pipeline/tests/test_pipeline_step_mixin.py +139 -51
junifer/pipeline/tests/test_update_meta_mixin.py +1 -0
junifer/pipeline/tests/test_workdir_manager.py +104 -0
junifer/pipeline/update_meta_mixin.py +8 -2
junifer/pipeline/utils.py +154 -15
junifer/pipeline/workdir_manager.py +246 -0
junifer/preprocess/__init__.py +3 -0
junifer/preprocess/ants/__init__.py +4 -0
junifer/preprocess/ants/ants_apply_transforms_warper.py +185 -0
junifer/preprocess/ants/tests/test_ants_apply_transforms_warper.py +56 -0
junifer/preprocess/base.py +96 -69
junifer/preprocess/bold_warper.py +265 -0
junifer/preprocess/confounds/fmriprep_confound_remover.py +91 -134
junifer/preprocess/confounds/tests/test_fmriprep_confound_remover.py +106 -111
junifer/preprocess/fsl/__init__.py +4 -0
junifer/preprocess/fsl/apply_warper.py +179 -0
junifer/preprocess/fsl/tests/test_apply_warper.py +45 -0
junifer/preprocess/tests/test_bold_warper.py +159 -0
junifer/preprocess/tests/test_preprocess_base.py +6 -6
junifer/preprocess/warping/__init__.py +6 -0
junifer/preprocess/warping/_ants_warper.py +167 -0
junifer/preprocess/warping/_fsl_warper.py +109 -0
junifer/preprocess/warping/space_warper.py +213 -0
junifer/preprocess/warping/tests/test_space_warper.py +198 -0
junifer/stats.py +18 -4
junifer/storage/base.py +9 -1
junifer/storage/hdf5.py +8 -3
junifer/storage/pandas_base.py +2 -1
junifer/storage/sqlite.py +1 -0
junifer/storage/tests/test_hdf5.py +2 -1
junifer/storage/tests/test_sqlite.py +8 -8
junifer/storage/tests/test_utils.py +6 -6
junifer/storage/utils.py +1 -0
junifer/testing/datagrabbers.py +11 -7
junifer/testing/utils.py +1 -0
junifer/tests/test_stats.py +2 -0
junifer/utils/__init__.py +1 -0
junifer/utils/helpers.py +53 -0
junifer/utils/logging.py +14 -3
junifer/utils/tests/test_helpers.py +35 -0
{junifer-0.0.3.dev186.dist-info → junifer-0.0.4.dist-info}/METADATA +59 -28
junifer-0.0.4.dist-info/RECORD +257 -0
{junifer-0.0.3.dev186.dist-info → junifer-0.0.4.dist-info}/WHEEL +1 -1
junifer/markers/falff/falff_estimator.py +0 -334
junifer/markers/falff/tests/test_falff_estimator.py +0 -238
junifer/markers/reho/reho_estimator.py +0 -515
junifer/markers/reho/tests/test_reho_estimator.py +0 -260
junifer-0.0.3.dev186.dist-info/RECORD +0 -199
{junifer-0.0.3.dev186.dist-info → junifer-0.0.4.dist-info}/AUTHORS.rst +0 -0
{junifer-0.0.3.dev186.dist-info → junifer-0.0.4.dist-info}/LICENSE.md +0 -0
{junifer-0.0.3.dev186.dist-info → junifer-0.0.4.dist-info}/entry_points.txt +0 -0
{junifer-0.0.3.dev186.dist-info → junifer-0.0.4.dist-info}/top_level.txt +0 -0

junifer/api/functions.py CHANGED Viewed

@@ -6,8 +6,6 @@
 # License: AGPL
 import shutil
-import subprocess
-import textwrap
 import typing
 from pathlib import Path
 from typing import Dict, List, Optional, Tuple, Union
@@ -15,11 +13,12 @@ from typing import Dict, List, Optional, Tuple, Union
 from ..datagrabber.base import BaseDataGrabber
 from ..markers.base import BaseMarker
 from ..markers.collection import MarkerCollection
+from ..pipeline import WorkDirManager
 from ..pipeline.registry import build
 from ..preprocess.base import BasePreprocessor
 from ..storage.base import BaseFeatureStorage
 from ..utils import logger, raise_error
-from ..utils.fs import make_executable
+from .queue_context import GnuParallelLocalAdapter, HTCondorAdapter
 from .utils import yaml
@@ -80,7 +79,7 @@ def run(
     datagrabber: Dict,
     markers: List[Dict],
     storage: Dict,
-    preprocessor: Optional[Dict] = None,
+    preprocessors: Optional[List[Dict]] = None,
     elements: Union[str, List[Union[str, Tuple]], Tuple, None] = None,
 ) -> None:
     """Run the pipeline on the selected element.
@@ -103,10 +102,10 @@ def run(
         Storage to use. Must have a key ``kind`` with the kind of
         storage to use. All other keys are passed to the storage
         init function.
-    preprocessor : dict, optional
-        Preprocessor to use. Must have a key ``kind`` with the kind of
-        preprocessor to use. All other keys are passed to the preprocessor
-        init function (default None).
+    preprocessors : list of dict, optional
+        List of preprocessors to use. Each preprocessor is a dict with at
+        least a key ``kind`` specifying the preprocessor to use. All other keys
+        are passed to the preprocessor init function (default None).
     elements : str or tuple or list of str or tuple, optional
         Element(s) to process. Will be used to index the DataGrabber
         (default None).
@@ -115,6 +114,8 @@ def run(
     # Convert str to Path
     if isinstance(workdir, str):
         workdir = Path(workdir)
+    # Initiate working directory manager
+    WorkDirManager(workdir)
     if not isinstance(elements, list) and elements is not None:
         elements = [elements]
@@ -149,21 +150,29 @@ def run(
     storage_object = typing.cast(BaseFeatureStorage, storage_object)
     # Get preprocessor to use (if provided)
-    if preprocessor is not None:
-        preprocessor_object = _get_preprocessor(preprocessor)
+    if preprocessors is not None:
+        _preprocessors = [x.copy() for x in preprocessors]
+        built_preprocessors = []
+        for preprocessor in _preprocessors:
+            preprocessor_object = _get_preprocessor(preprocessor)
+            built_preprocessors.append(preprocessor_object)
     else:
-        preprocessor_object = None
+        built_preprocessors = None
     # Create new marker collection
     mc = MarkerCollection(
         markers=built_markers,
-        preprocessing=preprocessor_object,
+        preprocessors=built_preprocessors,
         storage=storage_object,
     )
+    mc.validate(datagrabber_object)
     # Fit elements
     with datagrabber_object:
         if elements is not None:
-            for t_element in elements:
+            for t_element in datagrabber_object.filter(
+                elements  # type: ignore
+            ):
                 mc.fit(datagrabber_object[t_element])
         else:
             for t_element in datagrabber_object:
@@ -213,7 +222,7 @@ def queue(
     ----------
     config : dict
         The configuration to be used for queueing the job.
-    kind : {"HTCondor", "SLURM"}
+    kind : {"HTCondor", "GNUParallelLocal"}
         The kind of job queue system to use.
     jobname : str, optional
         The name of the job (default "junifer_job").
@@ -228,13 +237,20 @@ def queue(
     Raises
     ------
     ValueError
-        If the value of ``kind`` is invalid.
+        If ``kind`` is invalid or
+        if the ``jobdir`` exists and ``overwrite = False``.
     """
+    valid_kind = ["HTCondor", "GNUParallelLocal"]
+    if kind not in valid_kind:
+        raise_error(
+            f"Invalid value for `kind`: {kind}, "
+            f"must be one of {valid_kind}"
+        )
     # Create a folder within the CWD to store the job files / config
-    cwd = Path.cwd()
-    jobdir = cwd / "junifer_jobs" / jobname
-    logger.info(f"Creating job in {jobdir.absolute()!s}")
+    jobdir = Path.cwd() / "junifer_jobs" / jobname
+    logger.info(f"Creating job directory at {jobdir.resolve()!s}")
     if jobdir.exists():
         if not overwrite:
             raise_error(
@@ -242,15 +258,16 @@ def queue(
                 "This error is raised to prevent overwriting job files "
                 "that might be scheduled but not yet executed. "
                 f"Either delete the directory {jobdir.absolute()!s} "
-                "or set overwrite=True."
+                "or set `overwrite=True.`"
             )
         else:
             logger.info(
-                f"Deleting existing job directory at {jobdir.absolute()!s}"
+                f"Deleting existing job directory at {jobdir.resolve()!s}"
             )
             shutil.rmtree(jobdir)
     jobdir.mkdir(exist_ok=True, parents=True)
+    # Load modules
     if "with" in config:
         to_load = config["with"]
         # If there is a list of files to load, copy and remove the path
@@ -260,15 +277,16 @@ def queue(
             to_load = [to_load]
         for item in to_load:
             if item.endswith(".py"):
-                logger.debug(f"Copying {item} to jobdir ({jobdir.absolute()})")
-                shutil.copy(item, jobdir)
+                logger.debug(f"Copying {item} to ({jobdir.resolve()!s})")
+                shutil.copy(src=item, dst=jobdir)
                 fixed_load.append(Path(item).name)
             else:
                 fixed_load.append(item)
         config["with"] = fixed_load
+    # Save YAML
     yaml_config = jobdir / "config.yaml"
-    logger.info(f"Writing YAML config to {yaml_config.absolute()!s}")
+    logger.info(f"Writing YAML config to {yaml_config.resolve()!s}")
     yaml.dump(config, stream=yaml_config)
     # Get list of elements
@@ -281,415 +299,65 @@ def queue(
             datagrabber = _get_datagrabber(config["datagrabber"])
             with datagrabber as dg:
                 elements = dg.get_elements()
-    # TODO: Fix typing of elements
+    # Listify elements
     if not isinstance(elements, list):
-        elements = [elements]  # type: ignore
-    typing.cast(List[Union[str, Tuple]], elements)
+        elements: List[Union[str, Tuple]] = [elements]
+    # Check job queueing system
+    adapter = None
     if kind == "HTCondor":
-        _queue_condor(
-            jobname=jobname,
-            jobdir=jobdir,
-            yaml_config=yaml_config,
-            elements=elements,  # type: ignore
-            config=config,
-            **kwargs,
+        adapter = HTCondorAdapter(
+            job_name=jobname,
+            job_dir=jobdir,
+            yaml_config_path=yaml_config,
+            elements=elements,
+            **kwargs,  # type: ignore
         )
-    elif kind == "SLURM":
-        _queue_slurm(
-            jobname=jobname,
-            jobdir=jobdir,
-            yaml_config=yaml_config,
-            elements=elements,  # type: ignore
-            config=config,
-            **kwargs,
+    elif kind == "GNUParallelLocal":
+        adapter = GnuParallelLocalAdapter(
+            job_name=jobname,
+            job_dir=jobdir,
+            yaml_config_path=yaml_config,
+            elements=elements,
+            **kwargs,  # type: ignore
         )
-    else:
-        raise_error(f"Unknown queue kind: {kind}")
+    adapter.prepare()  # type: ignore
     logger.info("Queue done")
-def _queue_condor(
-    jobname: str,
-    jobdir: Path,
-    yaml_config: Path,
-    elements: List[Union[str, Tuple]],
-    config: Dict,
-    env: Optional[Dict[str, str]] = None,
-    mem: str = "8G",
-    cpus: int = 1,
-    disk: str = "1G",
-    extra_preamble: str = "",
-    pre_run: Optional[str] = None,
-    verbose: str = "info",
-    collect: str = "yes",
-    submit: bool = False,
-) -> None:
-    """Submit job to HTCondor.
+def reset(config: Dict) -> None:
+    """Reset the storage and jobs directory.
     Parameters
     ----------
-    jobname : str
-        The name of the job.
-    jobdir : pathlib.Path
-        The path to the job directory.
-    yaml_config : pathlib.Path
-        The path to the YAML config file.
-    elements : list of str or tuple
-        Element(s) to process. Will be used to index the DataGrabber.
     config : dict
-        The configuration to be used for queueing the job.
-    env : dict, optional
-        The environment variables passed as dictionary (default None).
-    mem : str, optional
-        The size of memory (RAM) to use (default "8G").
-    cpus : int, optional
-        The number of CPU cores to use (default 1).
-    disk : str, optional
-        The size of disk (HDD or SSD) to use (default "1G").
-    extra_preamble : str, optional
-        Extra commands to pass to HTCondor (default "").
-    pre_run : str, optional
-        Extra bash commands to source before the job (default None).
-    verbose : str, optional
-        The level of verbosity (default "info").
-    collect : str, optional
-        Whether to submit "collect" task for junifer (default "yes").
-        Valid options are:
-            * "yes": Submit "collect" task and run even if some of the jobs
-                fail.
-            * "on_success_only": Submit "collect" task and run only if all jobs
-                succeed.
-            * "no": Do not submit "collect" task.
-    submit : bool, optional
-        Whether to submit the jobs. In any case, .dag files will be created
-        for submission (default False).
-    Raises
-    ------
-    ValueError
-        If the value of `env` is invalid.
+        The configuration to be used for resetting.
     """
-    logger.debug("Creating HTCondor job")
-    run_junifer_args = (
-        f"run {yaml_config.absolute()!s} "
-        f"--verbose {verbose} --element $(element)"
-    )
-    collect_junifer_args = (
-        f"collect {yaml_config.absolute()!s} --verbose {verbose} "
-    )
-    if not isinstance(collect, str):
-        raise_error("collect must be a string")
-    collect = collect.lower()
-    if collect not in ["yes", "no", "on_success_only"]:
-        raise_error(f"Invalid value for collect: {collect}")
-    # Set up the env_name, executable and arguments according to the
-    # environment type
-    if env is None:
-        env = {"kind": "local"}
-    if env["kind"] == "conda":
-        env_name = env["name"]
-        executable = "run_conda.sh"
-        arguments = f"{env_name} junifer"
-        exec_path = jobdir / executable
-        logger.info(f"Copying {executable} to {exec_path.absolute()!s}")
-        shutil.copy(Path(__file__).parent / "res" / executable, exec_path)
-        make_executable(exec_path)
-    elif env["kind"] == "venv":
-        env_name = env["name"]
-        executable = "run_venv.sh"
-        arguments = f"{env_name} junifer"
-        # TODO: Copy run_venv.sh to jobdir
-    elif env["kind"] == "local":
-        executable = "junifer"
-        arguments = ""
-    else:
-        raise ValueError(f'Unknown env kind: {env["kind"]}')
-    logger.info("Writing pre_run.sh to jobdir")
-    pre_run_fname = jobdir / "pre_run.sh"
-    with open(pre_run_fname, "w") as f:
-        f.write("#!/bin/bash\n\n")
-        f.write("# Force datalad to run in non-interactive mode\n")
-        f.write("DATALAD_UI_INTERACTIVE=false\n\n")
-        if pre_run is not None:
-            f.write(pre_run)
-    make_executable(pre_run_fname)
-    # Create log directory
-    log_dir = jobdir / "logs"
-    log_dir.mkdir(exist_ok=True, parents=True)
-    # Add preamble data
-    run_preamble = f"""
-        # The environment
-        universe = vanilla
-        getenv = True
-        # Resources
-        request_cpus = {cpus}
-        request_memory = {mem}
-        request_disk = {disk}
-        # Executable
-        initial_dir = {jobdir.absolute()!s}
-        executable = $(initial_dir)/{executable}
-        transfer_executable = False
-        arguments = {arguments} {run_junifer_args}
-        {extra_preamble}
-        # Logs
-        log = {log_dir.absolute()!s}/junifer_run_$(log_element).log
-        output = {log_dir.absolute()!s}/junifer_run_$(log_element).out
-        error = {log_dir.absolute()!s}/junifer_run_$(log_element).err
-        """
-    submit_run_fname = jobdir / f"run_{jobname}.submit"
-    submit_collect_fname = jobdir / f"collect_{jobname}.submit"
-    dag_fname = jobdir / f"{jobname}.dag"
-    # Write to run submit files
-    with open(submit_run_fname, "w") as submit_file:
-        submit_file.write(textwrap.dedent(run_preamble))
-        submit_file.write("queue\n")
-    collect_preamble = f"""
-        # The environment
-        universe = vanilla
-        getenv = True
-        # Resources
-        request_cpus = {cpus}
-        request_memory = {mem}
-        request_disk = {disk}
-        # Executable
-        initial_dir = {jobdir.absolute()!s}
-        executable = $(initial_dir)/{executable}
-        transfer_executable = False
-        arguments = {arguments} {collect_junifer_args}
-        {extra_preamble}
-        # Logs
-        log = {log_dir.absolute()!s}/junifer_collect.log
-        output = {log_dir.absolute()!s}/junifer_collect.out
-        error = {log_dir.absolute()!s}/junifer_collect.err
-        """
-    # Now create the collect submit file
-    with open(submit_collect_fname, "w") as submit_file:
-        submit_file.write(textwrap.dedent(collect_preamble))
-        submit_file.write("queue\n")
-    with open(dag_fname, "w") as dag_file:
-        # Get all subject and session names from file list
-        for i_job, t_elem in enumerate(elements):
-            str_elem = (
-                ",".join(t_elem) if isinstance(t_elem, tuple) else t_elem
-            )
-            log_elem = (
-                "_".join(t_elem) if isinstance(t_elem, tuple) else t_elem
-            )
-            dag_file.write(f"JOB run{i_job} {submit_run_fname}\n")
-            dag_file.write(
-                f'VARS run{i_job} element="{str_elem}" '
-                f'log_element="{log_elem}"\n\n'
-            )
-        if collect == "yes":
-            dag_file.write(f"FINAL collect {submit_collect_fname}\n")
-            collect_pre_fname = jobdir / "collect_pre.sh"
-            dag_file.write(
-                f"SCRIPT PRE collect {collect_pre_fname.as_posix()} "
-                "$DAG_STATUS\n"
-            )
-            with open(collect_pre_fname, "w") as pre_file:
-                pre_file.write("#!/bin/bash\n\n")
-                pre_file.write('if [ "${1}" == "4" ]; then\n')
-                pre_file.write("    exit 1\n")
-                pre_file.write("fi\n")
-            make_executable(collect_pre_fname)
-        elif collect == "on_success_only":
-            dag_file.write(f"JOB collect {submit_collect_fname}\n")
-            dag_file.write("PARENT ")
-            for i_job, _ in enumerate(elements):
-                dag_file.write(f"run{i_job} ")
-            dag_file.write("CHILD collect\n\n")
-    # Submit job(s)
-    if submit is True:
-        logger.info("Submitting HTCondor job")
-        subprocess.run(["condor_submit_dag", dag_fname])
-        logger.info("HTCondor job submitted")
-    else:
-        cmd = f"condor_submit_dag {dag_fname.absolute()!s}"
-        logger.info(
-            f"HTCondor job files created, to submit the job, run `{cmd}`"
+    # Fetch storage
+    storage = config["storage"]
+    storage_uri = Path(storage["uri"])
+    logger.info(f"Deleting {storage_uri.resolve()!s}")
+    # Delete storage; will be str
+    if storage_uri.exists():
+        # Delete files in the directory
+        for file in storage_uri.iterdir():
+            file.unlink(missing_ok=True)
+        # Remove directory
+        storage_uri.parent.rmdir()
+    # Fetch job name (if present)
+    if config.get("queue") is not None:
+        queue = config["queue"]
+        job_dir = (
+            Path.cwd()
+            / "junifer_jobs"
+            / (queue.get("jobname") or "junifer_job")
         )
-def _queue_slurm(
-    jobname: str,
-    jobdir: Path,
-    yaml_config: Path,
-    elements: List[Union[str, Tuple]],
-    config: Dict,
-) -> None:
-    """Submit job to SLURM.
-    Parameters
-    ----------
-    jobname : str
-        The name of the job.
-    jobdir : pathlib.Path
-        The path to the job directory.
-    yaml_config : pathlib.Path
-        The path to the YAML config file.
-    elements : str or tuple or list[str or tuple], optional
-        Element(s) to process. Will be used to index the DataGrabber
-        (default None).
-    config : dict
-        The configuration to be used for queueing the job.
-    """
-    pass
-    # logger.debug("Creating SLURM job")
-    # run_junifer_args = (
-    #     f"run {str(yaml_config.absolute())} "
-    #     f"--verbose {verbose} --element $(element)"
-    # )
-    # collect_junifer_args = \
-    #     f"collect {str(yaml_config.absolute())} --verbose {verbose} "
-    # # Set up the env_name, executable and arguments according to the
-    # # environment type
-    # if env is None:
-    #     env = {
-    #         "kind": "local",
-    #     }
-    # if env["kind"] == "conda":
-    #     env_name = env["name"]
-    #     executable = "run_conda.sh"
-    #     arguments = f"{env_name} junifer"
-    #     # TODO: Copy run_conda.sh to jobdir
-    #     exec_path = jobdir / executable
-    #     shutil.copy(Path(__file__).parent / "res" / executable, exec_path)
-    #     make_executable(exec_path)
-    # elif env["kind"] == "venv":
-    #     env_name = env["name"]
-    #     executable = "run_venv.sh"
-    #     arguments = f"{env_name} junifer"
-    #     # TODO: Copy run_venv.sh to jobdir
-    # elif env["kind"] == "local":
-    #     executable = "junifer"
-    #     arguments = ""
-    # else:
-    #     raise ValueError(f"Unknown env kind: {env['kind']}")
-    # # Create log directory
-    # log_dir = jobdir / 'logs'
-    # log_dir.mkdir(exist_ok=True, parents=True)
-    # # Add preamble data
-    # run_preamble = f"""
-    #     #!/bin/bash
-    #     #SBATCH --job-name={}
-    #     #SBATCH --account={}
-    #     #SBATCH --partition={}
-    #     #SBATCH --time={}
-    #     #SBATCH --ntasks={}
-    #     #SBATCH --cpus-per-task={cpus}
-    #     #SBATCH --mem-per-cpu={mem}
-    #     #SBATCH --mail-type={}
-    #     #SBATCH --mail-user={}
-    #     #SBATCH --output={}
-    #     #SBATCH --error={}
-    #     # Executable
-    #     initial_dir = {str(jobdir.absolute())}
-    #     executable = $(initial_dir)/{executable}
-    #     transfer_executable = False
-    #     arguments = {arguments} {run_junifer_args}
-    #     {extra_preamble}
-    #     # Logs
-    #     log = {str(log_dir.absolute())}/junifer_run_$(element).log
-    #     output = {str(log_dir.absolute())}/junifer_run_$(element).out
-    #     error = {str(log_dir.absolute())}/junifer_run_$(element).err
-    #     """
-    # submit_run_fname = jobdir / f'run_{jobname}.sh'
-    # submit_collect_fname = jobdir / f'collect_{jobname}.sh'
-    # # Write to run submit files
-    # with open(submit_run_fname, 'w') as submit_file:
-    #     submit_file.write(run_preamble)
-    #     submit_file.write('queue\n')
-    # collect_preamble = f"""
-    #     # The environment
-    #     universe = vanilla
-    #     getenv = True
-    #     # Resources
-    #     request_cpus = {cpus}
-    #     request_memory = {mem}
-    #     request_disk = {disk}
-    #     # Executable
-    #     initial_dir = {str(jobdir.absolute())}
-    #     executable = $(initial_dir)/{executable}
-    #     transfer_executable = False
-    #     arguments = {arguments} {collect_junifer_args}
-    #     {extra_preamble}
-    #     # Logs
-    #     log = {str(log_dir.absolute())}/junifer_collect.log
-    #     output = {str(log_dir.absolute())}/junifer_collect.out
-    #     error = {str(log_dir.absolute())}/junifer_collect.err
-    #     """
-    # # Now create the collect submit file
-    # with open(submit_collect_fname, 'w') as submit_file:
-    #     submit_file.write(collect_preamble)  # Eval preamble here
-    #     submit_file.write('queue\n')
-    # with open(dag_fname, 'w') as dag_file:
-    #     # Get all subject and session names from file list
-    #     for i_job, t_elem in enumerate(elements):
-    #         dag_file.write(f'JOB run{i_job} {submit_run_fname}\n')
-    #         dag_file.write(f'VARS run{i_job} element="{t_elem}"\n\n')
-    #     if collect is True:
-    #         dag_file.write(f'JOB collect {submit_collect_fname}\n')
-    #         dag_file.write('PARENT ')
-    #         for i_job, _t_elem in enumerate(elements):
-    #             dag_file.write(f'run{i_job} ')
-    #         dag_file.write('CHILD collect\n\n')
-    # # Submit job(s)
-    # if submit is True:
-    #     logger.info('Submitting SLURM job')
-    #     subprocess.run(['condor_submit_dag', dag_fname])
-    #     logger.info('HTCondor SLURM submitted')
-    # else:
-    #     cmd = f"condor_submit_dag {str(dag_fname.absolute())}"
-    #     logger.info(
-    #         f"SLURM job files created, to submit the job, run `{cmd}`"
-    #     )
+        logger.info(f"Deleting job directory at {job_dir.resolve()!s}")
+        if job_dir.exists():
+            # Remove files and directories
+            shutil.rmtree(job_dir)
+            # Remove directory
+            job_dir.parent.rmdir()

junifer/api/parser.py CHANGED Viewed

@@ -50,6 +50,8 @@ def parse_yaml(filepath: Union[str, Path]) -> Dict:
         # Convert load modules to list
         if not isinstance(to_load, list):
             to_load = [to_load]
+        # Initialize list to have absolute paths for custom modules
+        final_to_load = []
         for t_module in to_load:
             if t_module.endswith(".py"):
                 logger.debug(f"Importing file: {t_module}")
@@ -65,9 +67,18 @@ def parse_yaml(filepath: Union[str, Path]) -> Dict:
                 module = importlib.util.module_from_spec(spec)  # type: ignore
                 sys.modules[t_module] = module
                 spec.loader.exec_module(module)  # type: ignore
+                # Add absolute path to final list
+                final_to_load.append(str(file_path.resolve()))
             else:
                 logger.info(f"Importing module: {t_module}")
                 importlib.import_module(t_module)
+                # Add module to final list
+                final_to_load.append(t_module)
+        # Replace modules to be loaded so that custom modules will take the
+        # absolute path. This was not the case as found in #224. Similar thing
+        # is done with the storage URI below.
+        contents["with"] = final_to_load
     # Compute path for the URI parameter in storage files that are relative
     # This is a tricky thing that appeared in #127. The problem is that
@@ -88,4 +99,17 @@ def parse_yaml(filepath: Union[str, Path]) -> Dict:
                 contents["storage"]["uri"] = str(
                     (filepath.parent / uri_path).resolve()
                 )
+    # Allow relative path if queue env kind is venv; same motivation as above
+    if "queue" in contents:
+        if "env" in contents["queue"]:
+            if "venv" == contents["queue"]["env"]["kind"]:
+                # Check if the env name is relative
+                venv_path = Path(contents["queue"]["env"]["name"])
+                if not venv_path.is_absolute():
+                    # Compute the absolute path
+                    contents["queue"]["env"]["name"] = str(
+                        (filepath.parent / venv_path).resolve()
+                    )
     return contents

junifer/api/queue_context/__init__.py ADDED Viewed

@@ -0,0 +1,8 @@
+"""Provide imports for queue context sub-package."""
+# Authors: Synchon Mandal <s.mandal@fz-juelich.de>
+# License: AGPL
+from .queue_context_adapter import QueueContextAdapter
+from .htcondor_adapter import HTCondorAdapter
+from .gnu_parallel_local_adapter import GnuParallelLocalAdapter

junifer 0.0.3.dev186__py3-none-any.whl → 0.0.4__py3-none-any.whl

junifer 0.0.3.dev186__py3-none-any.whl → 0.0.4__py3-none-any.whl