parsl 2024.4.22__py3-none-any.whl → 2024.5.6__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (34)
  1. parsl/config.py +10 -1
  2. parsl/data_provider/zip.py +32 -0
  3. parsl/dataflow/dflow.py +34 -26
  4. parsl/executors/high_throughput/executor.py +7 -1
  5. parsl/executors/status_handling.py +0 -3
  6. parsl/executors/taskvine/executor.py +0 -31
  7. parsl/executors/workqueue/executor.py +0 -30
  8. parsl/jobs/job_status_poller.py +1 -3
  9. parsl/monitoring/monitoring.py +3 -0
  10. parsl/monitoring/radios.py +1 -1
  11. parsl/providers/kubernetes/kube.py +20 -1
  12. parsl/tests/configs/local_threads_checkpoint_periodic.py +8 -10
  13. parsl/tests/conftest.py +12 -1
  14. parsl/tests/test_bash_apps/test_std_uri.py +128 -0
  15. parsl/tests/test_checkpointing/test_periodic.py +20 -33
  16. parsl/tests/test_htex/test_basic.py +2 -2
  17. parsl/tests/test_htex/test_missing_worker.py +0 -4
  18. parsl/tests/test_mpi_apps/test_resource_spec.py +2 -8
  19. parsl/tests/test_staging/test_zip_in.py +42 -0
  20. parsl/tests/test_staging/test_zip_to_zip.py +44 -0
  21. parsl/tests/unit/__init__.py +0 -0
  22. parsl/tests/unit/test_file.py +99 -0
  23. parsl/usage_tracking/api.py +66 -0
  24. parsl/usage_tracking/usage.py +39 -26
  25. parsl/version.py +1 -1
  26. {parsl-2024.4.22.dist-info → parsl-2024.5.6.dist-info}/METADATA +2 -2
  27. {parsl-2024.4.22.dist-info → parsl-2024.5.6.dist-info}/RECORD +34 -28
  28. {parsl-2024.4.22.data → parsl-2024.5.6.data}/scripts/exec_parsl_function.py +0 -0
  29. {parsl-2024.4.22.data → parsl-2024.5.6.data}/scripts/parsl_coprocess.py +0 -0
  30. {parsl-2024.4.22.data → parsl-2024.5.6.data}/scripts/process_worker_pool.py +0 -0
  31. {parsl-2024.4.22.dist-info → parsl-2024.5.6.dist-info}/LICENSE +0 -0
  32. {parsl-2024.4.22.dist-info → parsl-2024.5.6.dist-info}/WHEEL +0 -0
  33. {parsl-2024.4.22.dist-info → parsl-2024.5.6.dist-info}/entry_points.txt +0 -0
  34. {parsl-2024.4.22.dist-info → parsl-2024.5.6.dist-info}/top_level.txt +0 -0
parsl/config.py CHANGED
@@ -10,11 +10,12 @@ from parsl.executors.threads import ThreadPoolExecutor
  from parsl.errors import ConfigurationError
  from parsl.dataflow.taskrecord import TaskRecord
  from parsl.monitoring import MonitoringHub
+ from parsl.usage_tracking.api import UsageInformation

  logger = logging.getLogger(__name__)


- class Config(RepresentationMixin):
+ class Config(RepresentationMixin, UsageInformation):
      """
      Specification of Parsl configuration options.

@@ -50,6 +51,9 @@ class Config(RepresentationMixin):
          of 1.
      run_dir : str, optional
          Path to run directory. Default is 'runinfo'.
+     std_autopath : function, optional
+         Sets the function used to generate stdout/stderr specifications when parsl.AUTO_LOGPATH is used. If no function
+         is specified, generates paths that look like: ``rundir/NNN/task_logs/X/task_{id}_{name}{label}.{out/err}``
      strategy : str, optional
          Strategy to use for scaling blocks according to workflow needs. Can be 'simple', 'htex_auto_scale', 'none'
          or `None`.
@@ -89,6 +93,7 @@ class Config(RepresentationMixin):
                   retries: int = 0,
                   retry_handler: Optional[Callable[[Exception, TaskRecord], float]] = None,
                   run_dir: str = 'runinfo',
+                  std_autopath: Optional[Callable] = None,
                   strategy: Optional[str] = 'simple',
                   strategy_period: Union[float, int] = 5,
                   max_idletime: float = 120.0,
@@ -129,6 +134,7 @@ class Config(RepresentationMixin):
          self.usage_tracking = usage_tracking
          self.initialize_logging = initialize_logging
          self.monitoring = monitoring
+         self.std_autopath: Optional[Callable] = std_autopath

      @property
      def executors(self) -> Sequence[ParslExecutor]:
@@ -144,3 +150,6 @@
          if len(duplicates) > 0:
              raise ConfigurationError('Executors must have unique labels ({})'.format(
                  ', '.join(['label={}'.format(repr(d)) for d in duplicates])))
+
+     def get_usage_information(self):
+         return {"executors_len": len(self.executors)}
parsl/data_provider/zip.py CHANGED
@@ -42,6 +42,12 @@ class ZipFileStaging(Staging):
      """

      def can_stage_out(self, file: File) -> bool:
+         return self.is_zip_url(file)
+
+     def can_stage_in(self, file: File) -> bool:
+         return self.is_zip_url(file)
+
+     def is_zip_url(self, file: File) -> bool:
          logger.debug("archive provider checking File {}".format(repr(file)))

          # First check if this is the scheme we care about
@@ -76,6 +82,20 @@ class ZipFileStaging(Staging):
          app_fut = stage_out_app(zip_path, inside_path, working_dir, inputs=[file], _parsl_staging_inhibit=True, parent_fut=parent_fut)
          return app_fut

+     def stage_in(self, dm, executor, file, parent_fut):
+         assert file.scheme == 'zip'
+
+         zip_path, inside_path = zip_path_split(file.path)
+
+         working_dir = dm.dfk.executors[executor].working_dir
+
+         if working_dir:
+             file.local_path = os.path.join(working_dir, inside_path)
+
+         stage_in_app = _zip_stage_in_app(dm)
+         app_fut = stage_in_app(zip_path, inside_path, working_dir, outputs=[file], _parsl_staging_inhibit=True, parent_fut=parent_fut)
+         return app_fut._outputs[0]
+

  def _zip_stage_out(zip_file, inside_path, working_dir, parent_fut=None, inputs=[], _parsl_staging_inhibit=True):
      file = inputs[0]
@@ -93,6 +113,18 @@ def _zip_stage_out_app(dm):
      return parsl.python_app(executors=['_parsl_internal'], data_flow_kernel=dm.dfk)(_zip_stage_out)


+ def _zip_stage_in(zip_file, inside_path, working_dir, *, parent_fut, outputs, _parsl_staging_inhibit=True):
+     with filelock.FileLock(zip_file + ".lock"):
+         with zipfile.ZipFile(zip_file, mode='r') as z:
+             content = z.read(inside_path)
+             with open(outputs[0], "wb") as of:
+                 of.write(content)
+
+
+ def _zip_stage_in_app(dm):
+     return parsl.python_app(executors=['_parsl_internal'], data_flow_kernel=dm.dfk)(_zip_stage_in)
+
+
  def zip_path_split(path: str) -> Tuple[str, str]:
      """Split zip: path into a zipfile name and a contained-file name.
      """
parsl/dataflow/dflow.py CHANGED
@@ -177,11 +177,9 @@ class DataFlowKernel:

          # this must be set before executors are added since add_executors calls
          # job_status_poller.add_executors.
-         radio = self.monitoring.radio if self.monitoring else None
          self.job_status_poller = JobStatusPoller(strategy=self.config.strategy,
                                                   strategy_period=self.config.strategy_period,
-                                                  max_idletime=self.config.max_idletime,
-                                                  monitoring=radio)
+                                                  max_idletime=self.config.max_idletime)

          self.executors: Dict[str, ParslExecutor] = {}

@@ -798,7 +796,6 @@ class DataFlowKernel:
          # be the original function wrapped with an in-task stageout wrapper), a
          # rewritten File object to be passed to task to be executed

-         @typechecked
          def stageout_one_file(file: File, rewritable_func: Callable):
              if not self.check_staging_inhibited(kwargs):
                  # replace a File with a DataFuture - either completing when the stageout
@@ -996,32 +993,16 @@ class DataFlowKernel:
          executor = random.choice(choices)
          logger.debug("Task {} will be sent to executor {}".format(task_id, executor))

-         # The below uses func.__name__ before it has been wrapped by any staging code.
-
-         label = app_kwargs.get('label')
-         for kw in ['stdout', 'stderr']:
-             if kw in app_kwargs:
-                 if app_kwargs[kw] == parsl.AUTO_LOGNAME:
-                     if kw not in ignore_for_cache:
-                         ignore_for_cache += [kw]
-                     app_kwargs[kw] = os.path.join(
-                         self.run_dir,
-                         'task_logs',
-                         str(int(task_id / 10000)).zfill(4),  # limit logs to 10k entries per directory
-                         'task_{}_{}{}.{}'.format(
-                             str(task_id).zfill(4),
-                             func.__name__,
-                             '' if label is None else '_{}'.format(label),
-                             kw)
-                     )
-
          resource_specification = app_kwargs.get('parsl_resource_specification', {})

          task_record: TaskRecord
-         task_record = {'depends': [],
+         task_record = {'args': app_args,
+                        'depends': [],
                         'dfk': self,
                         'executor': executor,
+                        'func': func,
                         'func_name': func.__name__,
+                        'kwargs': app_kwargs,
                         'memoize': cache,
                         'hashsum': None,
                         'exec_fu': None,
@@ -1043,18 +1024,30 @@ class DataFlowKernel:

          self.update_task_state(task_record, States.unsched)

+         for kw in ['stdout', 'stderr']:
+             if kw in app_kwargs:
+                 if app_kwargs[kw] == parsl.AUTO_LOGNAME:
+                     if kw not in ignore_for_cache:
+                         ignore_for_cache += [kw]
+                     if self.config.std_autopath is None:
+                         app_kwargs[kw] = self.default_std_autopath(task_record, kw)
+                     else:
+                         app_kwargs[kw] = self.config.std_autopath(task_record, kw)
+
          app_fu = AppFuture(task_record)
+         task_record['app_fu'] = app_fu

          # Transform remote input files to data futures
          app_args, app_kwargs, func = self._add_input_deps(executor, app_args, app_kwargs, func)

          func = self._add_output_deps(executor, app_args, app_kwargs, app_fu, func)

+         # Replace the function invocation in the TaskRecord with whatever file-staging
+         # substitutions have been made.
          task_record.update({
              'args': app_args,
              'func': func,
-             'kwargs': app_kwargs,
-             'app_fu': app_fu})
+             'kwargs': app_kwargs})

          assert task_id not in self.tasks

@@ -1245,8 +1238,10 @@ class DataFlowKernel:
              self._checkpoint_timer.close()

          # Send final stats
+         logger.info("Sending end message for usage tracking")
          self.usage_tracker.send_end_message()
          self.usage_tracker.close()
+         logger.info("Closed usage tracking")

          logger.info("Closing job status poller")
          self.job_status_poller.close()
@@ -1440,6 +1435,19 @@ class DataFlowKernel:
              log_std_stream("Standard out", task_record['app_fu'].stdout)
              log_std_stream("Standard error", task_record['app_fu'].stderr)

+     def default_std_autopath(self, taskrecord, kw):
+         label = taskrecord['kwargs'].get('label')
+         task_id = taskrecord['id']
+         return os.path.join(
+             self.run_dir,
+             'task_logs',
+             str(int(task_id / 10000)).zfill(4),  # limit logs to 10k entries per directory
+             'task_{}_{}{}.{}'.format(
+                 str(task_id).zfill(4),
+                 taskrecord['func_name'],
+                 '' if label is None else '_{}'.format(label),
+                 kw))
+

  class DataFlowKernelLoader:
      """Manage which DataFlowKernel is active.
parsl/executors/high_throughput/executor.py CHANGED
@@ -14,6 +14,7 @@ import math
  import warnings

  import parsl.launchers
+ from parsl.usage_tracking.api import UsageInformation
  from parsl.serialize import pack_res_spec_apply_message, deserialize
  from parsl.serialize.errors import SerializationError, DeserializationError
  from parsl.app.errors import RemoteExceptionWrapper
@@ -62,7 +63,7 @@ DEFAULT_LAUNCH_CMD = ("process_worker_pool.py {debug} {max_workers_per_node} "
                        "--available-accelerators {accelerators}")


- class HighThroughputExecutor(BlockProviderExecutor, RepresentationMixin):
+ class HighThroughputExecutor(BlockProviderExecutor, RepresentationMixin, UsageInformation):
      """Executor designed for cluster-scale

      The HighThroughputExecutor system has the following components:
@@ -818,4 +819,9 @@ class HighThroughputExecutor(BlockProviderExecutor, RepresentationMixin):
              logger.info("Unable to terminate Interchange process; sending SIGKILL")
              self.interchange_proc.kill()

+         self.interchange_proc.close()
+
          logger.info("Finished HighThroughputExecutor shutdown attempt")
+
+     def get_usage_information(self):
+         return {"mpi": self.enable_mpi_mode}
parsl/executors/status_handling.py CHANGED
@@ -43,9 +43,6 @@ class BlockProviderExecutor(ParslExecutor):
      invoking scale_out, but it will not initialize the blocks requested by
      any init_blocks parameter. Subclasses must implement that behaviour
      themselves.
-
-     BENC: TODO: block error handling: maybe I want this more user pluggable?
-     I'm not sure of use cases for switchability at the moment beyond "yes or no"
      """
      def __init__(self, *,
                   provider: Optional[ExecutionProvider],
parsl/executors/taskvine/executor.py CHANGED
@@ -4,7 +4,6 @@ high-throughput system for delegating Parsl tasks to thousands of remote machine
  """

  # Import Python built-in libraries
- import atexit
  import threading
  import multiprocessing
  import logging
@@ -180,24 +179,6 @@ class TaskVineExecutor(BlockProviderExecutor, putils.RepresentationMixin):
          else:
              self._poncho_available = True

-         # Register atexit handler to cleanup when Python shuts down
-         atexit.register(self.atexit_cleanup)
-
-         # Attribute indicating whether this executor was started to shut it down properly.
-         # This safeguards cases where an object of this executor is created but
-         # the executor never starts, so it shouldn't be shutdowned.
-         self._is_started = False
-
-         # Attribute indicating whether this executor was shutdown before.
-         # This safeguards cases where this object is automatically shut down (e.g.,
-         # via atexit) and the user also explicitly calls shut down. While this is
-         # permitted, the effect of an executor shutdown should happen only once.
-         self._is_shutdown = False
-
-     def atexit_cleanup(self):
-         # Calls this executor's shutdown method upon Python exiting the process.
-         self.shutdown()
-
      def _get_launch_command(self, block_id):
          # Implements BlockProviderExecutor's abstract method.
          # This executor uses different terminology for worker/launch
@@ -257,9 +238,6 @@ class TaskVineExecutor(BlockProviderExecutor, putils.RepresentationMixin):
          retrieve Parsl tasks within the TaskVine system.
          """

-         # Mark this executor object as started
-         self._is_started = True
-
          # Synchronize connection and communication settings between the manager and factory
          self.__synchronize_manager_factory_comm_settings()

@@ -618,14 +596,6 @@ class TaskVineExecutor(BlockProviderExecutor, putils.RepresentationMixin):
          """Shutdown the executor. Sets flag to cancel the submit process and
          collector thread, which shuts down the TaskVine system submission.
          """
-         if not self._is_started:
-             # Don't shutdown if the executor never starts.
-             return
-
-         if self._is_shutdown:
-             # Don't shutdown this executor again.
-             return
-
          logger.debug("TaskVine shutdown started")
          self._should_stop.set()

@@ -650,7 +620,6 @@ class TaskVineExecutor(BlockProviderExecutor, putils.RepresentationMixin):
          self._finished_task_queue.close()
          self._finished_task_queue.join_thread()

-         self._is_shutdown = True
          logger.debug("TaskVine shutdown completed")

      @wrap_with_logs
parsl/executors/workqueue/executor.py CHANGED
@@ -3,7 +3,6 @@ Cooperative Computing Lab (CCL) at Notre Dame to provide a fault-tolerant,
  high-throughput system for delegating Parsl tasks to thousands of remote machines
  """

- import atexit
  import threading
  import multiprocessing
  import logging
@@ -298,24 +297,6 @@ class WorkQueueExecutor(BlockProviderExecutor, putils.RepresentationMixin):
          if self.init_command != "":
              self.launch_cmd = self.init_command + "; " + self.launch_cmd

-         # register atexit handler to cleanup when Python shuts down
-         atexit.register(self.atexit_cleanup)
-
-         # Attribute indicating whether this executor was started to shut it down properly.
-         # This safeguards cases where an object of this executor is created but
-         # the executor never starts, so it shouldn't be shutdowned.
-         self.is_started = False
-
-         # Attribute indicating whether this executor was shutdown before.
-         # This safeguards cases where this object is automatically shut down (e.g.,
-         # via atexit) and the user also explicitly calls shut down. While this is
-         # permitted, the effect of an executor shutdown should happen only once.
-         self.is_shutdown = False
-
-     def atexit_cleanup(self):
-         # Calls this executor's shutdown method upon Python exiting the process.
-         self.shutdown()
-
      def _get_launch_command(self, block_id):
          # this executor uses different terminology for worker/launch
          # commands than in htex
@@ -325,8 +306,6 @@ class WorkQueueExecutor(BlockProviderExecutor, putils.RepresentationMixin):
          """Create submit process and collector thread to create, send, and
          retrieve Parsl tasks within the Work Queue system.
          """
-         # Mark this executor object as started
-         self.is_started = True
          self.tasks_lock = threading.Lock()

          # Create directories for data and results
@@ -713,14 +692,6 @@ class WorkQueueExecutor(BlockProviderExecutor, putils.RepresentationMixin):
          """Shutdown the executor. Sets flag to cancel the submit process and
          collector thread, which shuts down the Work Queue system submission.
          """
-         if not self.is_started:
-             # Don't shutdown if the executor never starts.
-             return
-
-         if self.is_shutdown:
-             # Don't shutdown this executor again.
-             return
-
          logger.debug("Work Queue shutdown started")
          self.should_stop.value = True

@@ -741,7 +712,6 @@ class WorkQueueExecutor(BlockProviderExecutor, putils.RepresentationMixin):
          self.collector_queue.close()
          self.collector_queue.join_thread()

-         self.is_shutdown = True
          logger.debug("Work Queue shutdown completed")

      @wrap_with_logs
parsl/jobs/job_status_poller.py CHANGED
@@ -1,5 +1,4 @@
  import logging
- import parsl
  from typing import List, Sequence, Optional, Union

  from parsl.jobs.strategy import Strategy
@@ -14,8 +13,7 @@ logger = logging.getLogger(__name__)

  class JobStatusPoller(Timer):
      def __init__(self, *, strategy: Optional[str], max_idletime: float,
-                  strategy_period: Union[float, int],
-                  monitoring: Optional["parsl.monitoring.radios.MonitoringRadio"] = None) -> None:
+                  strategy_period: Union[float, int]) -> None:
          self._executors = []  # type: List[BlockProviderExecutor]
          self._strategy = Strategy(strategy=strategy,
                                    max_idletime=max_idletime)
parsl/monitoring/monitoring.py CHANGED
@@ -244,6 +244,7 @@ class MonitoringHub(RepresentationMixin):
          self.router_exit_event.set()
          logger.info("Waiting for router to terminate")
          self.router_proc.join()
+         self.router_proc.close()
          logger.debug("Finished waiting for router termination")
          if len(exception_msgs) == 0:
              logger.debug("Sending STOP to DBM")
@@ -252,6 +253,7 @@
              logger.debug("Not sending STOP to DBM, because there were DBM exceptions")
          logger.debug("Waiting for DB termination")
          self.dbm_proc.join()
+         self.dbm_proc.close()
          logger.debug("Finished waiting for DBM termination")

          # should this be message based? it probably doesn't need to be if
@@ -259,6 +261,7 @@
          logger.info("Terminating filesystem radio receiver process")
          self.filesystem_proc.terminate()
          self.filesystem_proc.join()
+         self.filesystem_proc.close()

          logger.info("Closing monitoring multiprocessing queues")
          self.exception_q.close()
parsl/monitoring/radios.py CHANGED
@@ -177,7 +177,7 @@ class UDPRadio(MonitoringRadio):


  class MultiprocessingQueueRadio(MonitoringRadio):
-     """A monitoring radio intended which connects over a multiprocessing Queue.
+     """A monitoring radio which connects over a multiprocessing Queue.
      This radio is intended to be used on the submit side, where components
      in the submit process, or processes launched by multiprocessing, will have
      access to a Queue shared with the monitoring database code (bypassing the
parsl/providers/kubernetes/kube.py CHANGED
@@ -105,7 +105,26 @@ class KubernetesProvider(ExecutionProvider, RepresentationMixin):
          if not _kubernetes_enabled:
              raise OptionalModuleMissing(['kubernetes'],
                                          "Kubernetes provider requires kubernetes module and config.")
-         config.load_kube_config()
+         try:
+             config.load_kube_config()
+         except config.config_exception.ConfigException:
+             # `load_kube_config` assumes a local kube-config file, and fails if not
+             # present, raising:
+             #
+             #     kubernetes.config.config_exception.ConfigException: Invalid
+             #     kube-config file. No configuration found.
+             #
+             # Since running a parsl driver script on a kubernetes cluster is a common
+             # pattern to enable worker-interchange communication, this enables an
+             # in-cluster config to be loaded if a kube-config file isn't found.
+             #
+             # Based on: https://github.com/kubernetes-client/python/issues/1005
+             try:
+                 config.load_incluster_config()
+             except config.config_exception.ConfigException:
+                 raise config.config_exception.ConfigException(
+                     "Failed to load both kube-config file and in-cluster configuration."
+                 )

          self.namespace = namespace
          self.image = image
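The same fallback pattern, as a standalone sketch with the kubernetes Python client (load_kube_config, load_incluster_config and ConfigException are existing kubernetes-client APIs; the pod listing is just an illustrative follow-up):

    from kubernetes import client, config

    try:
        # Uses a local kube-config file (e.g. ~/.kube/config) when present.
        config.load_kube_config()
    except config.config_exception.ConfigException:
        # Falls back to the pod's service-account credentials when running in-cluster.
        config.load_incluster_config()

    pods = client.CoreV1Api().list_namespaced_pod("default")
    print(len(pods.items))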
parsl/tests/configs/local_threads_checkpoint_periodic.py CHANGED
@@ -1,13 +1,11 @@
  from parsl.config import Config
  from parsl.executors.threads import ThreadPoolExecutor

- config = Config(
-     executors=[
-         ThreadPoolExecutor(
-             label='local_threads_checkpoint_periodic',
-             max_threads=1
-         )
-     ],
-     checkpoint_mode='periodic',
-     checkpoint_period='00:00:05'
- )
+
+ def fresh_config():
+     tpe = ThreadPoolExecutor(label='local_threads_checkpoint_periodic', max_threads=1)
+     return Config(
+         executors=[tpe],
+         checkpoint_mode='periodic',
+         checkpoint_period='00:00:02'
+     )
parsl/tests/conftest.py CHANGED
@@ -3,8 +3,10 @@ import itertools
  import logging
  import os
  import pathlib
+ import random
  import re
  import shutil
+ import string
  import time
  import types
  import signal
@@ -139,7 +141,7 @@ def pytest_configure(config):
      )
      config.addinivalue_line(
          'markers',
-         'staging_required: Marks tests that require a staging provider, when there is no sharedFS)'
+         'staging_required: Marks tests that require a staging provider, when there is no sharedFS'
      )
      config.addinivalue_line(
          'markers',
@@ -245,6 +247,7 @@ def load_dfk_local_module(request, pytestconfig, tmpd_cwd_session):

          if callable(local_teardown):
              local_teardown()
+             assert DataFlowKernelLoader._dfk is None, "Expected teardown to clear DFK"

          if local_config:
              if parsl.dfk() != dfk:
@@ -421,3 +424,11 @@ def try_assert():
          raise AssertionError("Bad assert call: no attempts or timeout period")

      yield _impl
+
+
+ @pytest.fixture
+ def randomstring():
+     def func(length=5, alphabet=string.ascii_letters):
+         return "".join(random.choice(alphabet) for _ in range(length))
+
+     return func
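For illustration, a hypothetical test (not part of this diff) using the new randomstring fixture to build unique labels:

    import string

    def test_unique_executor_label(randomstring):
        label = "htex_" + randomstring(length=8, alphabet=string.ascii_lowercase)
        assert label.startswith("htex_") and len(label) == 13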
parsl/tests/test_bash_apps/test_std_uri.py ADDED
@@ -0,0 +1,128 @@
+ import logging
+ import parsl
+ import pytest
+ import zipfile
+
+ from functools import partial
+ from parsl.app.futures import DataFuture
+ from parsl.data_provider.files import File
+ from parsl.executors import ThreadPoolExecutor
+
+
+ @parsl.bash_app
+ def app_stdout(stdout=parsl.AUTO_LOGNAME):
+     return "echo hello"
+
+
+ def const_str(cpath, task_record, err_or_out):
+     return cpath
+
+
+ def const_with_cpath(autopath_specifier, content_path, caplog):
+     with parsl.load(parsl.Config(std_autopath=partial(const_str, autopath_specifier))):
+         fut = app_stdout()
+
+         # we don't have to wait for a result to check this attributes
+         assert fut.stdout is autopath_specifier
+
+         # there is no DataFuture to wait for in the str case: the model is that
+         # the stdout will be immediately available on task completion.
+         fut.result()
+
+     with open(content_path, "r") as file:
+         assert file.readlines() == ["hello\n"]
+
+     for record in caplog.records:
+         assert record.levelno < logging.ERROR
+
+     parsl.clear()
+
+
+ @pytest.mark.local
+ def test_std_autopath_const_str(caplog, tmpd_cwd):
+     """Tests str and tuple mode autopaths with constant autopath, which should
+     all be passed through unmodified.
+     """
+     cpath = str(tmpd_cwd / "CONST")
+     const_with_cpath(cpath, cpath, caplog)
+
+
+ @pytest.mark.local
+ def test_std_autopath_const_pathlike(caplog, tmpd_cwd):
+     cpath = tmpd_cwd / "CONST"
+     const_with_cpath(cpath, cpath, caplog)
+
+
+ @pytest.mark.local
+ def test_std_autopath_const_tuples(caplog, tmpd_cwd):
+     file = tmpd_cwd / "CONST"
+     cpath = (file, "w")
+     const_with_cpath(cpath, file, caplog)
+
+
+ class URIFailError(Exception):
+     pass
+
+
+ def fail_uri(task_record, err_or_out):
+     raise URIFailError("Deliberate failure in std stream filename generation")
+
+
+ @pytest.mark.local
+ def test_std_autopath_fail(caplog):
+     with parsl.load(parsl.Config(std_autopath=fail_uri)):
+         with pytest.raises(URIFailError):
+             app_stdout()
+
+     parsl.clear()
+
+
+ @parsl.bash_app
+ def app_both(stdout=parsl.AUTO_LOGNAME, stderr=parsl.AUTO_LOGNAME):
+     return "echo hello; echo goodbye >&2"
+
+
+ def zip_uri(base, task_record, err_or_out):
+     """Should generate Files in base.zip like app_both.0.out or app_both.123.err"""
+     zip_path = base / "base.zip"
+     file = f"{task_record['func_name']}.{task_record['id']}.{task_record['try_id']}.{err_or_out}"
+     return File(f"zip:{zip_path}/{file}")
+
+
+ @pytest.mark.local
+ def test_std_autopath_zip(caplog, tmpd_cwd):
+     with parsl.load(parsl.Config(run_dir=str(tmpd_cwd),
+                                  executors=[ThreadPoolExecutor(working_dir=str(tmpd_cwd))],
+                                  std_autopath=partial(zip_uri, tmpd_cwd))):
+         futs = []
+
+         for _ in range(10):
+             fut = app_both()
+
+             # assertions that should hold after submission
+             assert isinstance(fut.stdout, DataFuture)
+             assert fut.stdout.file_obj.url.startswith("zip")
+
+             futs.append(fut)
+
+         # Barrier for all the stageouts to complete so that we can
+         # poke at the zip file.
+         [(fut.stdout.result(), fut.stderr.result()) for fut in futs]
+
+         with zipfile.ZipFile(tmpd_cwd / "base.zip") as z:
+             for fut in futs:
+
+                 assert fut.done(), "AppFuture should be done if stageout is done"
+
+                 stdout_relative_path = f"app_both.{fut.tid}.0.stdout"
+                 with z.open(stdout_relative_path) as f:
+                     assert f.readlines() == [b'hello\n']
+
+                 stderr_relative_path = f"app_both.{fut.tid}.0.stderr"
+                 with z.open(stderr_relative_path) as f:
+                     assert f.readlines()[-1] == b'goodbye\n'
+
+     for record in caplog.records:
+         assert record.levelno < logging.ERROR
+
+     parsl.clear()