toil 6.1.0a1__py3-none-any.whl → 8.0.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (193)
  1. toil/__init__.py +122 -315
  2. toil/batchSystems/__init__.py +1 -0
  3. toil/batchSystems/abstractBatchSystem.py +173 -89
  4. toil/batchSystems/abstractGridEngineBatchSystem.py +272 -148
  5. toil/batchSystems/awsBatch.py +244 -135
  6. toil/batchSystems/cleanup_support.py +26 -16
  7. toil/batchSystems/contained_executor.py +31 -28
  8. toil/batchSystems/gridengine.py +86 -50
  9. toil/batchSystems/htcondor.py +166 -89
  10. toil/batchSystems/kubernetes.py +632 -382
  11. toil/batchSystems/local_support.py +20 -15
  12. toil/batchSystems/lsf.py +134 -81
  13. toil/batchSystems/lsfHelper.py +13 -11
  14. toil/batchSystems/mesos/__init__.py +41 -29
  15. toil/batchSystems/mesos/batchSystem.py +290 -151
  16. toil/batchSystems/mesos/executor.py +79 -50
  17. toil/batchSystems/mesos/test/__init__.py +31 -23
  18. toil/batchSystems/options.py +46 -28
  19. toil/batchSystems/registry.py +53 -19
  20. toil/batchSystems/singleMachine.py +296 -125
  21. toil/batchSystems/slurm.py +603 -138
  22. toil/batchSystems/torque.py +47 -33
  23. toil/bus.py +186 -76
  24. toil/common.py +664 -368
  25. toil/cwl/__init__.py +1 -1
  26. toil/cwl/cwltoil.py +1136 -483
  27. toil/cwl/utils.py +17 -22
  28. toil/deferred.py +63 -42
  29. toil/exceptions.py +5 -3
  30. toil/fileStores/__init__.py +5 -5
  31. toil/fileStores/abstractFileStore.py +140 -60
  32. toil/fileStores/cachingFileStore.py +717 -269
  33. toil/fileStores/nonCachingFileStore.py +116 -87
  34. toil/job.py +1225 -368
  35. toil/jobStores/abstractJobStore.py +416 -266
  36. toil/jobStores/aws/jobStore.py +863 -477
  37. toil/jobStores/aws/utils.py +201 -120
  38. toil/jobStores/conftest.py +3 -2
  39. toil/jobStores/fileJobStore.py +292 -154
  40. toil/jobStores/googleJobStore.py +140 -74
  41. toil/jobStores/utils.py +36 -15
  42. toil/leader.py +668 -272
  43. toil/lib/accelerators.py +115 -18
  44. toil/lib/aws/__init__.py +74 -31
  45. toil/lib/aws/ami.py +122 -87
  46. toil/lib/aws/iam.py +284 -108
  47. toil/lib/aws/s3.py +31 -0
  48. toil/lib/aws/session.py +214 -39
  49. toil/lib/aws/utils.py +287 -231
  50. toil/lib/bioio.py +13 -5
  51. toil/lib/compatibility.py +11 -6
  52. toil/lib/conversions.py +104 -47
  53. toil/lib/docker.py +131 -103
  54. toil/lib/ec2.py +361 -199
  55. toil/lib/ec2nodes.py +174 -106
  56. toil/lib/encryption/_dummy.py +5 -3
  57. toil/lib/encryption/_nacl.py +10 -6
  58. toil/lib/encryption/conftest.py +1 -0
  59. toil/lib/exceptions.py +26 -7
  60. toil/lib/expando.py +5 -3
  61. toil/lib/ftp_utils.py +217 -0
  62. toil/lib/generatedEC2Lists.py +127 -19
  63. toil/lib/humanize.py +6 -2
  64. toil/lib/integration.py +341 -0
  65. toil/lib/io.py +141 -15
  66. toil/lib/iterables.py +4 -2
  67. toil/lib/memoize.py +12 -8
  68. toil/lib/misc.py +66 -21
  69. toil/lib/objects.py +2 -2
  70. toil/lib/resources.py +68 -15
  71. toil/lib/retry.py +126 -81
  72. toil/lib/threading.py +299 -82
  73. toil/lib/throttle.py +16 -15
  74. toil/options/common.py +843 -409
  75. toil/options/cwl.py +175 -90
  76. toil/options/runner.py +50 -0
  77. toil/options/wdl.py +73 -17
  78. toil/provisioners/__init__.py +117 -46
  79. toil/provisioners/abstractProvisioner.py +332 -157
  80. toil/provisioners/aws/__init__.py +70 -33
  81. toil/provisioners/aws/awsProvisioner.py +1145 -715
  82. toil/provisioners/clusterScaler.py +541 -279
  83. toil/provisioners/gceProvisioner.py +282 -179
  84. toil/provisioners/node.py +155 -79
  85. toil/realtimeLogger.py +34 -22
  86. toil/resource.py +137 -75
  87. toil/server/app.py +128 -62
  88. toil/server/celery_app.py +3 -1
  89. toil/server/cli/wes_cwl_runner.py +82 -53
  90. toil/server/utils.py +54 -28
  91. toil/server/wes/abstract_backend.py +64 -26
  92. toil/server/wes/amazon_wes_utils.py +21 -15
  93. toil/server/wes/tasks.py +121 -63
  94. toil/server/wes/toil_backend.py +142 -107
  95. toil/server/wsgi_app.py +4 -3
  96. toil/serviceManager.py +58 -22
  97. toil/statsAndLogging.py +224 -70
  98. toil/test/__init__.py +282 -183
  99. toil/test/batchSystems/batchSystemTest.py +460 -210
  100. toil/test/batchSystems/batch_system_plugin_test.py +90 -0
  101. toil/test/batchSystems/test_gridengine.py +173 -0
  102. toil/test/batchSystems/test_lsf_helper.py +67 -58
  103. toil/test/batchSystems/test_slurm.py +110 -49
  104. toil/test/cactus/__init__.py +0 -0
  105. toil/test/cactus/test_cactus_integration.py +56 -0
  106. toil/test/cwl/cwlTest.py +496 -287
  107. toil/test/cwl/measure_default_memory.cwl +12 -0
  108. toil/test/cwl/not_run_required_input.cwl +29 -0
  109. toil/test/cwl/scatter_duplicate_outputs.cwl +40 -0
  110. toil/test/cwl/seqtk_seq.cwl +1 -1
  111. toil/test/docs/scriptsTest.py +69 -46
  112. toil/test/jobStores/jobStoreTest.py +427 -264
  113. toil/test/lib/aws/test_iam.py +118 -50
  114. toil/test/lib/aws/test_s3.py +16 -9
  115. toil/test/lib/aws/test_utils.py +5 -6
  116. toil/test/lib/dockerTest.py +118 -141
  117. toil/test/lib/test_conversions.py +113 -115
  118. toil/test/lib/test_ec2.py +58 -50
  119. toil/test/lib/test_integration.py +104 -0
  120. toil/test/lib/test_misc.py +12 -5
  121. toil/test/mesos/MesosDataStructuresTest.py +23 -10
  122. toil/test/mesos/helloWorld.py +7 -6
  123. toil/test/mesos/stress.py +25 -20
  124. toil/test/options/__init__.py +13 -0
  125. toil/test/options/options.py +42 -0
  126. toil/test/provisioners/aws/awsProvisionerTest.py +320 -150
  127. toil/test/provisioners/clusterScalerTest.py +440 -250
  128. toil/test/provisioners/clusterTest.py +166 -44
  129. toil/test/provisioners/gceProvisionerTest.py +174 -100
  130. toil/test/provisioners/provisionerTest.py +25 -13
  131. toil/test/provisioners/restartScript.py +5 -4
  132. toil/test/server/serverTest.py +188 -141
  133. toil/test/sort/restart_sort.py +137 -68
  134. toil/test/sort/sort.py +134 -66
  135. toil/test/sort/sortTest.py +91 -49
  136. toil/test/src/autoDeploymentTest.py +141 -101
  137. toil/test/src/busTest.py +20 -18
  138. toil/test/src/checkpointTest.py +8 -2
  139. toil/test/src/deferredFunctionTest.py +49 -35
  140. toil/test/src/dockerCheckTest.py +32 -24
  141. toil/test/src/environmentTest.py +135 -0
  142. toil/test/src/fileStoreTest.py +539 -272
  143. toil/test/src/helloWorldTest.py +7 -4
  144. toil/test/src/importExportFileTest.py +61 -31
  145. toil/test/src/jobDescriptionTest.py +46 -21
  146. toil/test/src/jobEncapsulationTest.py +2 -0
  147. toil/test/src/jobFileStoreTest.py +74 -50
  148. toil/test/src/jobServiceTest.py +187 -73
  149. toil/test/src/jobTest.py +121 -71
  150. toil/test/src/miscTests.py +19 -18
  151. toil/test/src/promisedRequirementTest.py +82 -36
  152. toil/test/src/promisesTest.py +7 -6
  153. toil/test/src/realtimeLoggerTest.py +10 -6
  154. toil/test/src/regularLogTest.py +71 -37
  155. toil/test/src/resourceTest.py +80 -49
  156. toil/test/src/restartDAGTest.py +36 -22
  157. toil/test/src/resumabilityTest.py +9 -2
  158. toil/test/src/retainTempDirTest.py +45 -14
  159. toil/test/src/systemTest.py +12 -8
  160. toil/test/src/threadingTest.py +44 -25
  161. toil/test/src/toilContextManagerTest.py +10 -7
  162. toil/test/src/userDefinedJobArgTypeTest.py +8 -5
  163. toil/test/src/workerTest.py +73 -23
  164. toil/test/utils/toilDebugTest.py +103 -33
  165. toil/test/utils/toilKillTest.py +4 -5
  166. toil/test/utils/utilsTest.py +245 -106
  167. toil/test/wdl/wdltoil_test.py +818 -149
  168. toil/test/wdl/wdltoil_test_kubernetes.py +91 -0
  169. toil/toilState.py +120 -35
  170. toil/utils/toilConfig.py +13 -4
  171. toil/utils/toilDebugFile.py +44 -27
  172. toil/utils/toilDebugJob.py +214 -27
  173. toil/utils/toilDestroyCluster.py +11 -6
  174. toil/utils/toilKill.py +8 -3
  175. toil/utils/toilLaunchCluster.py +256 -140
  176. toil/utils/toilMain.py +37 -16
  177. toil/utils/toilRsyncCluster.py +32 -14
  178. toil/utils/toilSshCluster.py +49 -22
  179. toil/utils/toilStats.py +356 -273
  180. toil/utils/toilStatus.py +292 -139
  181. toil/utils/toilUpdateEC2Instances.py +3 -1
  182. toil/version.py +12 -12
  183. toil/wdl/utils.py +5 -5
  184. toil/wdl/wdltoil.py +3913 -1033
  185. toil/worker.py +367 -184
  186. {toil-6.1.0a1.dist-info → toil-8.0.0.dist-info}/LICENSE +25 -0
  187. toil-8.0.0.dist-info/METADATA +173 -0
  188. toil-8.0.0.dist-info/RECORD +253 -0
  189. {toil-6.1.0a1.dist-info → toil-8.0.0.dist-info}/WHEEL +1 -1
  190. toil-6.1.0a1.dist-info/METADATA +0 -125
  191. toil-6.1.0a1.dist-info/RECORD +0 -237
  192. {toil-6.1.0a1.dist-info → toil-8.0.0.dist-info}/entry_points.txt +0 -0
  193. {toil-6.1.0a1.dist-info → toil-8.0.0.dist-info}/top_level.txt +0 -0
@@ -16,45 +16,39 @@ import os
 import pickle
 import re
 import shutil
-import sys
 from abc import ABC, ABCMeta, abstractmethod
+from collections.abc import Iterator, ValuesView
 from contextlib import closing, contextmanager
 from datetime import timedelta
 from http.client import BadStatusLine
-from typing import (IO,
-                    TYPE_CHECKING,
-                    Any,
-                    Callable,
-                    ContextManager,
-                    Dict,
-                    Iterable,
-                    Iterator,
-                    List,
-                    Optional,
-                    Set,
-                    Tuple,
-                    Union,
-                    ValuesView,
-                    cast,
-                    overload)
-
-if sys.version_info >= (3, 8):
-    from typing import Literal
-else:
-    from typing_extensions import Literal
-
+from typing import (
+    IO,
+    TYPE_CHECKING,
+    Any,
+    Callable,
+    ContextManager,
+    Literal,
+    Optional,
+    Union,
+    cast,
+    overload,
+)
 from urllib.error import HTTPError
 from urllib.parse import ParseResult, urlparse
-from urllib.request import urlopen
+from urllib.request import urlopen, Request
 from uuid import uuid4
 
 from toil.common import Config, getNodeID, safeUnpickleFromStream
 from toil.fileStores import FileID
-from toil.job import (CheckpointJobDescription,
-                      JobDescription,
-                      JobException,
-                      ServiceJobDescription)
+from toil.job import (
+    CheckpointJobDescription,
+    JobDescription,
+    JobException,
+    ServiceJobDescription,
+)
+from toil.lib.ftp_utils import FtpFsAccess
 from toil.lib.compatibility import deprecated
+from toil.lib.exceptions import UnimplementedURLException
 from toil.lib.io import WriteWatchingStream
 from toil.lib.memoize import memoize
 from toil.lib.retry import ErrorCondition, retry
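The removed `typing_extensions` fallback and the `List`/`Dict`/`Tuple`/`Set` aliases go away together: `Literal` has lived in `typing` since Python 3.8, and the builtin-generic annotations (`list[str]`, `dict[str, str]`, `tuple[int, bool]`) used throughout the rest of this diff are evaluated at import time, implying a Python 3.9+ floor (PEP 585). A minimal illustration of the equivalence (the names here are illustrative, not from toil):

```python
from typing import Literal, Optional

Operation = Literal["import", "export"]

# PEP 585: builtin containers are subscriptable, replacing typing.List etc.
def pick_stores(op: Operation, names: list[str]) -> Optional[dict[str, int]]:
    return {name: i for i, name in enumerate(names)} if op == "import" else None
```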
@@ -67,10 +61,22 @@ logger = logging.getLogger(__name__)
 try:
     from botocore.exceptions import ProxyConnectionError
 except ImportError:
+
     class ProxyConnectionError(BaseException):  # type: ignore
         """Dummy class."""
 
 
+class LocatorException(Exception):
+    """
+    Base exception class for all locator exceptions.
+    For example, job store/aws bucket exceptions where they already exist
+    """
+
+    def __init__(self, error_msg: str, locator: str, prefix: Optional[str] = None):
+        full_locator = locator if prefix is None else f"{prefix}:{locator}"
+        super().__init__(error_msg % full_locator)
+
+
 class InvalidImportExportUrlException(Exception):
     def __init__(self, url: ParseResult) -> None:
         """
@@ -78,24 +84,10 @@ class InvalidImportExportUrlException(Exception):
         """
         super().__init__("The URL '%s' is invalid." % url.geturl())
 
-class UnimplementedURLException(RuntimeError):
-    def __init__(self, url: ParseResult, operation: str) -> None:
-        """
-        Make a new exception to report that a URL scheme is not implemented, or
-        that the implementation can't be loaded because its dependencies are
-        not installed.
-
-        :param url: The given URL
-        :param operation: Whether we are trying to 'import' or 'export'
-        """
-        super().__init__(
-            f"No available job store implementation can {operation} the URL "
-            f"'{url.geturl()}'. Ensure Toil has been installed "
-            f"with the appropriate extras."
-        )
 
 class NoSuchJobException(Exception):
     """Indicates that the specified job does not exist."""
+
     def __init__(self, jobStoreID: FileID):
         """
         :param str jobStoreID: the jobStoreID that was mistakenly assumed to exist
@@ -105,17 +97,21 @@ class NoSuchJobException(Exception):
 
 class ConcurrentFileModificationException(Exception):
     """Indicates that the file was attempted to be modified by multiple processes at once."""
+
     def __init__(self, jobStoreFileID: FileID):
         """
         :param jobStoreFileID: the ID of the file that was modified by multiple workers
             or processes concurrently
         """
-        super().__init__('Concurrent update to file %s detected.' % jobStoreFileID)
+        super().__init__("Concurrent update to file %s detected." % jobStoreFileID)
 
 
 class NoSuchFileException(Exception):
     """Indicates that the specified file does not exist."""
-    def __init__(self, jobStoreFileID: FileID, customName: Optional[str] = None, *extra: Any):
+
+    def __init__(
+        self, jobStoreFileID: FileID, customName: Optional[str] = None, *extra: Any
+    ):
         """
         :param jobStoreFileID: the ID of the file that was mistakenly assumed to exist
         :param customName: optionally, an alternate name for the nonexistent file
@@ -136,24 +132,33 @@ class NoSuchFileException(Exception):
         super().__init__(message)
 
 
-class NoSuchJobStoreException(Exception):
+class NoSuchJobStoreException(LocatorException):
     """Indicates that the specified job store does not exist."""
-    def __init__(self, locator: str):
+
+    def __init__(self, locator: str, prefix: str):
         """
         :param str locator: The location of the job store
         """
-        super().__init__("The job store '%s' does not exist, so there is nothing to restart." % locator)
+        super().__init__(
+            "The job store '%s' does not exist, so there is nothing to restart.",
+            locator,
+            prefix,
+        )
 
 
-class JobStoreExistsException(Exception):
+class JobStoreExistsException(LocatorException):
     """Indicates that the specified job store already exists."""
-    def __init__(self, locator: str):
+
+    def __init__(self, locator: str, prefix: str):
         """
         :param str locator: The location of the job store
         """
         super().__init__(
             "The job store '%s' already exists. Use --restart to resume the workflow, or remove "
-            "the job store with 'toil clean' to start the workflow from scratch." % locator)
+            "the job store with 'toil clean' to start the workflow from scratch.",
+            locator,
+            prefix,
+        )
 
 
 class AbstractJobStore(ABC):
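The two job-store exceptions above now delegate message formatting to the new `LocatorException` base class, which splices an optional scheme prefix onto the locator before applying the `%s` template. A minimal standalone sketch of that composition (mirroring the added code rather than importing toil):

```python
from typing import Optional

class LocatorException(Exception):
    """Formats a '%s'-style template with a possibly prefixed locator."""

    def __init__(self, error_msg: str, locator: str, prefix: Optional[str] = None):
        full_locator = locator if prefix is None else f"{prefix}:{locator}"
        super().__init__(error_msg % full_locator)

class NoSuchJobStoreException(LocatorException):
    def __init__(self, locator: str, prefix: str):
        super().__init__(
            "The job store '%s' does not exist, so there is nothing to restart.",
            locator,
            prefix,
        )

print(NoSuchJobStoreException("/tmp/store", "file"))
# The job store 'file:/tmp/store' does not exist, so there is nothing to restart.
```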
@@ -205,7 +210,7 @@ class AbstractJobStore(ABC):
         self.__config = config
         self.write_config()
 
-    @deprecated(new_function_name='write_config')
+    @deprecated(new_function_name="write_config")
     def writeConfig(self) -> None:
         return self.write_config()
 
@@ -214,7 +219,9 @@
         Persists the value of the :attr:`AbstractJobStore.config` attribute to the
         job store, so that it can be retrieved later by other instances of this class.
         """
-        with self.write_shared_file_stream('config.pickle', encrypted=False) as fileHandle:
+        with self.write_shared_file_stream(
+            "config.pickle", encrypted=False
+        ) as fileHandle:
             pickle.dump(self.__config, fileHandle, pickle.HIGHEST_PROTOCOL)
 
     def resume(self) -> None:
@@ -224,7 +231,7 @@
 
         :raises NoSuchJobStoreException: if the physical storage for this job store doesn't exist
         """
-        with self.read_shared_file_stream('config.pickle') as fileHandle:
+        with self.read_shared_file_stream("config.pickle") as fileHandle:
             config = safeUnpickleFromStream(fileHandle)
             assert config.workflowID is not None
             self.__config = config
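Together, `write_config` and `resume` round-trip the workflow `Config` through the shared file `config.pickle`. A hedged sketch of that round trip, with `io.BytesIO` standing in for the job store's shared-file streams and a plain dict standing in for `toil.common.Config` (the real `resume()` reads back through `safeUnpickleFromStream`, not bare `pickle.load`):

```python
import io
import pickle

config = {"workflowID": "1f2e3d"}  # stand-in for a toil.common.Config object

# write_config(): pickle the config into the shared 'config.pickle' stream
stream = io.BytesIO()
pickle.dump(config, stream, pickle.HIGHEST_PROTOCOL)

# resume(): read the stream back and check the workflow was initialized
stream.seek(0)
restored = pickle.load(stream)
assert restored["workflowID"] is not None
```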
@@ -242,9 +249,9 @@
         """
         return self.__locator
 
-    rootJobStoreIDFileName = 'rootJobStoreID'
+    rootJobStoreIDFileName = "rootJobStoreID"
 
-    @deprecated(new_function_name='set_root_job')
+    @deprecated(new_function_name="set_root_job")
     def setRootJob(self, rootJobStoreID: FileID) -> None:
         """Set the root job of the workflow backed by this job store."""
         return self.set_root_job(rootJobStoreID)
@@ -256,9 +263,9 @@
         :param job_id: The ID of the job to set as root
         """
         with self.write_shared_file_stream(self.rootJobStoreIDFileName) as f:
-            f.write(job_id.encode('utf-8'))
+            f.write(job_id.encode("utf-8"))
 
-    @deprecated(new_function_name='load_root_job')
+    @deprecated(new_function_name="load_root_job")
     def loadRootJob(self) -> JobDescription:
         return self.load_root_job()
 
@@ -273,16 +280,18 @@
         """
         try:
             with self.read_shared_file_stream(self.rootJobStoreIDFileName) as f:
-                rootJobStoreID = f.read().decode('utf-8')
+                rootJobStoreID = f.read().decode("utf-8")
         except NoSuchFileException:
-            raise JobException('No job has been set as the root in this job store')
+            raise JobException("No job has been set as the root in this job store")
         if not self.job_exists(rootJobStoreID):
-            raise JobException("The root job '%s' doesn't exist. Either the Toil workflow "
-                               "is finished or has never been started" % rootJobStoreID)
+            raise JobException(
+                "The root job '%s' doesn't exist. Either the Toil workflow "
+                "is finished or has never been started" % rootJobStoreID
+            )
         return self.load_job(rootJobStoreID)
 
     # FIXME: This is only used in tests, why do we have it?
-    @deprecated(new_function_name='create_root_job')
+    @deprecated(new_function_name="create_root_job")
     def createRootJob(self, desc: JobDescription) -> JobDescription:
         return self.create_root_job(desc)
 
@@ -299,7 +308,7 @@
         self.set_root_job(job_description.jobStoreID)
         return job_description
 
-    @deprecated(new_function_name='get_root_job_return_value')
+    @deprecated(new_function_name="get_root_job_return_value")
     def getRootJobReturnValue(self) -> Any:
         return self.get_root_job_return_value()
 
@@ -310,12 +319,12 @@
         Raises an exception if the root job hasn't fulfilled its promise yet.
         """
         # Parse out the return value from the root job
-        with self.read_shared_file_stream('rootJobReturnValue') as fH:
+        with self.read_shared_file_stream("rootJobReturnValue") as fH:
             return safeUnpickleFromStream(fH)
 
     @staticmethod
     @memoize
-    def _get_job_store_classes() -> List['AbstractJobStore']:
+    def _get_job_store_classes() -> list["AbstractJobStore"]:
         """
         A list of concrete AbstractJobStore implementations whose dependencies are installed.
 
@@ -325,23 +334,30 @@
             "toil.jobStores.fileJobStore.FileJobStore",
             "toil.jobStores.googleJobStore.GoogleJobStore",
             "toil.jobStores.aws.jobStore.AWSJobStore",
-            "toil.jobStores.abstractJobStore.JobStoreSupport")
+            "toil.jobStores.abstractJobStore.JobStoreSupport",
+        )
         jobStoreClasses = []
         for className in jobStoreClassNames:
-            moduleName, className = className.rsplit('.', 1)
+            moduleName, className = className.rsplit(".", 1)
             from importlib import import_module
+
             try:
                 module = import_module(moduleName)
             except (ImportError, ProxyConnectionError):
-                logger.debug("Unable to import '%s' as is expected if the corresponding extra was "
-                             "omitted at installation time.", moduleName)
+                logger.debug(
+                    "Unable to import '%s' as is expected if the corresponding extra was "
+                    "omitted at installation time.",
+                    moduleName,
+                )
             else:
                 jobStoreClass = getattr(module, className)
                 jobStoreClasses.append(jobStoreClass)
         return jobStoreClasses
 
     @classmethod
-    def _findJobStoreForUrl(cls, url: ParseResult, export: bool = False) -> 'AbstractJobStore':
+    def _findJobStoreForUrl(
+        cls, url: ParseResult, export: bool = False
+    ) -> "AbstractJobStore":
         """
         Returns the AbstractJobStore subclass that supports the given URL.
 
@@ -360,46 +376,58 @@
     # returns a file ID. Explain this to MyPy.
 
     @overload
-    def importFile(self,
-                   srcUrl: str,
-                   sharedFileName: str,
-                   hardlink: bool = False,
-                   symlink: bool = True) -> None: ...
+    def importFile(
+        self,
+        srcUrl: str,
+        sharedFileName: str,
+        hardlink: bool = False,
+        symlink: bool = True,
+    ) -> None: ...
 
     @overload
-    def importFile(self,
-                   srcUrl: str,
-                   sharedFileName: None = None,
-                   hardlink: bool = False,
-                   symlink: bool = True) -> FileID: ...
-
-    @deprecated(new_function_name='import_file')
-    def importFile(self,
-                   srcUrl: str,
-                   sharedFileName: Optional[str] = None,
-                   hardlink: bool = False,
-                   symlink: bool = True) -> Optional[FileID]:
+    def importFile(
+        self,
+        srcUrl: str,
+        sharedFileName: None = None,
+        hardlink: bool = False,
+        symlink: bool = True,
+    ) -> FileID: ...
+
+    @deprecated(new_function_name="import_file")
+    def importFile(
+        self,
+        srcUrl: str,
+        sharedFileName: Optional[str] = None,
+        hardlink: bool = False,
+        symlink: bool = True,
+    ) -> Optional[FileID]:
         return self.import_file(srcUrl, sharedFileName, hardlink, symlink)
 
     @overload
-    def import_file(self,
-                    src_uri: str,
-                    shared_file_name: str,
-                    hardlink: bool = False,
-                    symlink: bool = True) -> None: ...
+    def import_file(
+        self,
+        src_uri: str,
+        shared_file_name: str,
+        hardlink: bool = False,
+        symlink: bool = True,
+    ) -> None: ...
 
     @overload
-    def import_file(self,
-                    src_uri: str,
-                    shared_file_name: None = None,
-                    hardlink: bool = False,
-                    symlink: bool = True) -> FileID: ...
-
-    def import_file(self,
-                    src_uri: str,
-                    shared_file_name: Optional[str] = None,
-                    hardlink: bool = False,
-                    symlink: bool = True) -> Optional[FileID]:
+    def import_file(
+        self,
+        src_uri: str,
+        shared_file_name: None = None,
+        hardlink: bool = False,
+        symlink: bool = True,
+    ) -> FileID: ...
+
+    def import_file(
+        self,
+        src_uri: str,
+        shared_file_name: Optional[str] = None,
+        hardlink: bool = False,
+        symlink: bool = True,
+    ) -> Optional[FileID]:
         """
         Imports the file at the given URL into job store. The ID of the newly imported file is
         returned. If the name of a shared file name is provided, the file will be imported as
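The `@overload` pairs above encode the calling convention: passing a shared file name stores the import under that name and returns `None`, while omitting it returns the generated `FileID`. A standalone sketch of the same pattern (a toy function, not the toil implementation):

```python
from typing import Optional, overload

@overload
def import_file(src_uri: str, shared_file_name: str) -> None: ...
@overload
def import_file(src_uri: str, shared_file_name: None = None) -> str: ...

def import_file(src_uri: str, shared_file_name: Optional[str] = None) -> Optional[str]:
    if shared_file_name is not None:
        return None  # stored under the caller-chosen shared name
    return "files/no-job/file-abc123"  # placeholder for a generated file ID

assert import_file("s3://bucket/input.txt") is not None
assert import_file("s3://bucket/ref.txt", "reference.txt") is None
```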
@@ -437,18 +465,23 @@
         # subclasses of AbstractJobStore.
         parseResult = urlparse(src_uri)
         otherCls = self._findJobStoreForUrl(parseResult)
-        return self._import_file(otherCls,
-                                 parseResult,
-                                 shared_file_name=shared_file_name,
-                                 hardlink=hardlink,
-                                 symlink=symlink)
-
-    def _import_file(self,
-                     otherCls: 'AbstractJobStore',
-                     uri: ParseResult,
-                     shared_file_name: Optional[str] = None,
-                     hardlink: bool = False,
-                     symlink: bool = True) -> Optional[FileID]:
+        logger.info("Importing input %s...", src_uri)
+        return self._import_file(
+            otherCls,
+            parseResult,
+            shared_file_name=shared_file_name,
+            hardlink=hardlink,
+            symlink=symlink,
+        )
+
+    def _import_file(
+        self,
+        otherCls: "AbstractJobStore",
+        uri: ParseResult,
+        shared_file_name: Optional[str] = None,
+        hardlink: bool = False,
+        symlink: bool = True,
+    ) -> Optional[FileID]:
         """
         Import the file at the given URL using the given job store class to retrieve that file.
         See also :meth:`.importFile`. This method applies a generic approach to importing: it
@@ -478,7 +511,7 @@
             otherCls._read_from_url(uri, writable)
             return None
 
-    @deprecated(new_function_name='export_file')
+    @deprecated(new_function_name="export_file")
     def exportFile(self, jobStoreFileID: FileID, dstUrl: str) -> None:
         return self.export_file(jobStoreFileID, dstUrl)
 
@@ -497,13 +530,17 @@
         :param str file_id: The id of the file in the job store that should be exported.
 
         :param str dst_uri: URL that points to a file or object in the storage mechanism of a
-               supported URL scheme e.g. a blob in an AWS s3 bucket.
+               supported URL scheme e.g. a blob in an AWS s3 bucket. May also be a local path.
         """
+        from toil.common import Toil
+        dst_uri = Toil.normalize_uri(dst_uri)
         parseResult = urlparse(dst_uri)
         otherCls = self._findJobStoreForUrl(parseResult, export=True)
         self._export_file(otherCls, file_id, parseResult)
 
-    def _export_file(self, otherCls: 'AbstractJobStore', jobStoreFileID: FileID, url: ParseResult) -> None:
+    def _export_file(
+        self, otherCls: "AbstractJobStore", jobStoreFileID: FileID, url: ParseResult
+    ) -> None:
         """
         Refer to exportFile docstring for information about this method.
 
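The new `Toil.normalize_uri` call above is what lets `dst_uri` be a bare local path: anything without a scheme is turned into a `file:` URL before the scheme lookup runs. A hedged sketch of the local-path case on POSIX (this mimics the effect; `Toil.normalize_uri` is the real helper and handles more cases):

```python
import os
from urllib.parse import urlparse

def normalize_uri(uri: str) -> str:
    # Anything without a scheme is treated as a local path.
    if urlparse(uri).scheme == "":
        return "file://" + os.path.abspath(uri)
    return uri

assert normalize_uri("results/out.txt").startswith("file:///")
assert normalize_uri("s3://bucket/out.txt") == "s3://bucket/out.txt"
```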
@@ -518,7 +555,9 @@
         """
         self._default_export_file(otherCls, jobStoreFileID, url)
 
-    def _default_export_file(self, otherCls: 'AbstractJobStore', jobStoreFileID: FileID, url: ParseResult) -> None:
+    def _default_export_file(
+        self, otherCls: "AbstractJobStore", jobStoreFileID: FileID, url: ParseResult
+    ) -> None:
         """
         Refer to exportFile docstring for information about this method.
 
@@ -533,7 +572,7 @@
         """
         executable = False
         with self.read_file_stream(jobStoreFileID) as readable:
-            if getattr(jobStoreFileID, 'executable', False):
+            if getattr(jobStoreFileID, "executable", False):
                 executable = jobStoreFileID.executable
             otherCls._write_to_url(readable, url, executable)
 
@@ -542,6 +581,8 @@
         """
         Return True if the file at the given URI exists, and False otherwise.
 
+        May raise an error if file existence cannot be determined.
+
         :param src_uri: URL that points to a file or object in the storage
             mechanism of a supported URL scheme e.g. a blob in an AWS s3 bucket.
         """
@@ -572,7 +613,7 @@
         return otherCls._get_is_directory(parseResult)
 
     @classmethod
-    def list_url(cls, src_uri: str) -> List[str]:
+    def list_url(cls, src_uri: str) -> list[str]:
         """
         List the directory at the given URL. Returned path components can be
         joined with '/' onto the passed URL to form new URLs. Those that end in
@@ -597,7 +638,7 @@
         return otherCls._list_url(parseResult)
 
     @classmethod
-    def read_from_url(cls, src_uri: str, writable: IO[bytes]) -> Tuple[int, bool]:
+    def read_from_url(cls, src_uri: str, writable: IO[bytes]) -> tuple[int, bool]:
         """
         Read the given URL and write its content into the given writable stream.
 
@@ -628,6 +669,8 @@
     def _url_exists(cls, url: ParseResult) -> bool:
         """
         Return True if the item at the given URL exists, and Flase otherwise.
+
+        May raise an error if file existence cannot be determined.
         """
         raise NotImplementedError(f"No implementation for {url}")
 
@@ -655,7 +698,7 @@
 
     @classmethod
     @abstractmethod
-    def _read_from_url(cls, url: ParseResult, writable: IO[bytes]) -> Tuple[int, bool]:
+    def _read_from_url(cls, url: ParseResult, writable: IO[bytes]) -> tuple[int, bool]:
         """
         Reads the contents of the object at the specified location and writes it to the given
         writable stream.
@@ -675,7 +718,7 @@
 
     @classmethod
     @abstractmethod
-    def _list_url(cls, url: ParseResult) -> List[str]:
+    def _list_url(cls, url: ParseResult) -> list[str]:
         """
         List the contents of the given URL, which may or may not end in '/'
 
@@ -707,7 +750,12 @@
 
     @classmethod
     @abstractmethod
-    def _write_to_url(cls, readable: Union[IO[bytes], IO[str]], url: ParseResult, executable: bool = False) -> None:
+    def _write_to_url(
+        cls,
+        readable: Union[IO[bytes], IO[str]],
+        url: ParseResult,
+        executable: bool = False,
+    ) -> None:
         """
         Reads the contents of the given readable stream and writes it to the object at the
         specified location. Raises FileNotFoundError if the URL doesn't exist..
@@ -754,11 +802,11 @@
         """
         raise NotImplementedError()
 
-    @deprecated(new_function_name='get_env')
-    def getEnv(self) -> Dict[str, str]:
+    @deprecated(new_function_name="get_env")
+    def getEnv(self) -> dict[str, str]:
         return self.get_env()
 
-    def get_env(self) -> Dict[str, str]:
+    def get_env(self) -> dict[str, str]:
         """
         Returns a dictionary of environment variables that this job store requires to be set in
         order to function properly on a worker.
@@ -769,7 +817,7 @@
 
     # Cleanup functions
     def clean(
-        self, jobCache: Optional[Dict[Union[str, "TemporaryID"], JobDescription]] = None
+        self, jobCache: Optional[dict[Union[str, "TemporaryID"], JobDescription]] = None
     ) -> JobDescription:
         """
         Function to cleanup the state of a job store after a restart.
@@ -797,7 +845,9 @@
             return self.load_job(jobId)
 
         def haveJob(jobId: str) -> bool:
-            assert len(jobId) > 1, f"Job ID {jobId} too short; is a string being used as a list?"
+            assert (
+                len(jobId) > 1
+            ), f"Job ID {jobId} too short; is a string being used as a list?"
             if jobCache is not None:
                 if jobId in jobCache:
                     return True
@@ -817,13 +867,15 @@
                 jobCache[str(jobDescription.jobStoreID)] = jobDescription
             self.update_job(jobDescription)
 
-        def getJobDescriptions() -> Union[ValuesView[JobDescription], Iterator[JobDescription]]:
+        def getJobDescriptions() -> (
+            Union[ValuesView[JobDescription], Iterator[JobDescription]]
+        ):
             if jobCache is not None:
                 return jobCache.values()
             else:
                 return self.jobs()
 
-        def get_jobs_reachable_from_root() -> Set[str]:
+        def get_jobs_reachable_from_root() -> set[str]:
             """
             Traverse the job graph from the root job and return a flattened set of all active jobstore IDs.
 
@@ -833,18 +885,17 @@
             # Iterate from the root JobDescription and collate all jobs
             # that are reachable from it.
             root_job_description = self.load_root_job()
-            reachable_from_root: Set[str] = set()
+            reachable_from_root: set[str] = set()
 
-            # Add first root job outside of the loop below.
-            reachable_from_root.add(str(root_job_description.jobStoreID))
-            # add all of root's linked service jobs as well
-            for service_jobstore_id in root_job_description.services:
-                if haveJob(service_jobstore_id):
-                    reachable_from_root.add(service_jobstore_id)
-            for merged_jobstore_id in root_job_description.merged_jobs:
+            for merged_in in root_job_description.get_chain():
+                # Add the job itself and any other jobs that chained with it.
                 # Keep merged-in jobs around themselves, but don't bother
                 # exploring them, since we took their successors.
-                reachable_from_root.add(merged_jobstore_id)
+                reachable_from_root.add(merged_in.job_store_id)
+            # add all of root's linked service jobs as well
+            for service_job_store_id in root_job_description.services:
+                if haveJob(service_job_store_id):
+                    reachable_from_root.add(service_job_store_id)
 
             # Unprocessed means it might have successor jobs we need to add.
             unprocessed_job_descriptions = [root_job_description]
@@ -852,24 +903,30 @@
             while unprocessed_job_descriptions:
                 new_job_descriptions_to_process = []  # Reset.
                 for job_description in unprocessed_job_descriptions:
-                    for successor_jobstore_id in job_description.allSuccessors():
-                        if successor_jobstore_id not in reachable_from_root and haveJob(successor_jobstore_id):
-                            successor_job_description = getJobDescription(successor_jobstore_id)
-
-                            # Add each successor job.
-                            reachable_from_root.add(
-                                str(successor_job_description.jobStoreID)
-                            )
-                            # Add all of the successor's linked service jobs as well.
-                            for service_jobstore_id in successor_job_description.services:
-                                if haveJob(service_jobstore_id):
-                                    reachable_from_root.add(service_jobstore_id)
-
-                            new_job_descriptions_to_process.append(successor_job_description)
-                    for merged_jobstore_id in job_description.merged_jobs:
+                    for merged_in in job_description.get_chain():
+                        # Add the job and anything chained with it.
                         # Keep merged-in jobs around themselves, but don't bother
                        # exploring them, since we took their successors.
-                        reachable_from_root.add(merged_jobstore_id)
+                        reachable_from_root.add(merged_in.job_store_id)
+                    for successor_job_store_id in job_description.allSuccessors():
+                        if (
+                            successor_job_store_id not in reachable_from_root
+                            and haveJob(successor_job_store_id)
+                        ):
+                            successor_job_description = getJobDescription(
+                                successor_job_store_id
+                            )
+
+                            # Add all of the successor's linked service jobs as well.
+                            for (
+                                service_job_store_id
+                            ) in successor_job_description.services:
+                                if haveJob(service_job_store_id):
+                                    reachable_from_root.add(service_job_store_id)
+
+                            new_job_descriptions_to_process.append(
+                                successor_job_description
+                            )
                 unprocessed_job_descriptions = new_job_descriptions_to_process
 
             logger.debug(f"{len(reachable_from_root)} jobs reachable from root.")
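The traversal above replaces the old `merged_jobs` attribute with `JobDescription.get_chain()`: every visited description contributes itself plus all jobs chained into it, its live service jobs, and its unseen successors to the next frontier. A minimal standalone sketch of the same breadth-first walk, with toy stand-ins for `JobDescription` (in real toil, `get_chain()` yields records whose `job_store_id` names each chained job):

```python
from dataclasses import dataclass, field

@dataclass
class ChainLink:
    job_store_id: str

@dataclass
class Desc:
    job_store_id: str
    chained: list[ChainLink] = field(default_factory=list)
    services: list[str] = field(default_factory=list)
    successors: list[str] = field(default_factory=list)

    def get_chain(self) -> list[ChainLink]:
        # The job itself plus everything merged into it by chaining.
        return [ChainLink(self.job_store_id)] + self.chained

def reachable_from(root: Desc, have_job, load_job) -> set[str]:
    reachable: set[str] = set()
    for sid in root.services:                # root's live service jobs
        if have_job(sid):
            reachable.add(sid)
    frontier = [root]
    while frontier:
        next_frontier = []
        for desc in frontier:
            for link in desc.get_chain():    # the job plus chained-in jobs
                reachable.add(link.job_store_id)
            for succ_id in desc.successors:  # queue unseen live successors
                if succ_id not in reachable and have_job(succ_id):
                    succ = load_job(succ_id)
                    for sid in succ.services:
                        if have_job(sid):
                            reachable.add(sid)
                    next_frontier.append(succ)
        frontier = next_frontier
    return reachable

b = Desc("b")
a = Desc("a", successors=["b"])
jobs = {"a": a, "b": b}
assert reachable_from(a, jobs.__contains__, jobs.__getitem__) == {"a", "b"}
```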
@@ -879,22 +936,32 @@
 
         # Cleanup jobs that are not reachable from the root, and therefore orphaned
         # TODO: Avoid reiterating reachable_from_root (which may be very large)
-        unreachable = [x for x in getJobDescriptions() if x.jobStoreID not in reachable_from_root]
+        unreachable = [
+            x for x in getJobDescriptions() if x.jobStoreID not in reachable_from_root
+        ]
         for jobDescription in unreachable:
             # clean up any associated files before deletion
             for fileID in jobDescription.filesToDelete:
                 # Delete any files that should already be deleted
-                logger.warning(f"Deleting file '{fileID}'. It is marked for deletion but has not yet been removed.")
+                logger.warning(
+                    f"Deleting file '{fileID}'. It is marked for deletion but has not yet been removed."
+                )
                 self.delete_file(fileID)
             # Delete the job from us and the cache
             deleteJob(str(jobDescription.jobStoreID))
 
-        jobDescriptionsReachableFromRoot = {id: getJobDescription(id) for id in reachable_from_root}
+        jobDescriptionsReachableFromRoot = {
+            id: getJobDescription(id) for id in reachable_from_root
+        }
 
         # Clean up any checkpoint jobs -- delete any successors it
         # may have launched, and restore the job to a pristine state
         jobsDeletedByCheckpoints = set()
-        for jobDescription in [desc for desc in jobDescriptionsReachableFromRoot.values() if isinstance(desc, CheckpointJobDescription)]:
+        for jobDescription in [
+            desc
+            for desc in jobDescriptionsReachableFromRoot.values()
+            if isinstance(desc, CheckpointJobDescription)
+        ]:
             if jobDescription.jobStoreID in jobsDeletedByCheckpoints:
                 # This is a checkpoint that was nested within an
                 # earlier checkpoint, so it and all its successors are
@@ -920,20 +987,23 @@
             if len(jobDescription.filesToDelete) != 0:
                 # Delete any files that should already be deleted
                 for fileID in jobDescription.filesToDelete:
-                    logger.critical("Removing file in job store: %s that was "
-                                    "marked for deletion but not previously removed" % fileID)
+                    logger.critical(
+                        "Removing file in job store: %s that was "
+                        "marked for deletion but not previously removed" % fileID
+                    )
                     self.delete_file(fileID)
                 jobDescription.filesToDelete = []
                 changed[0] = True
 
-            # For a job whose command is already executed, remove jobs from the
+            # For a job whose body has already executed, remove jobs from the
             # stack that are already deleted. This cleans up the case that the
             # jobDescription had successors to run, but had not been updated to
             # reflect this.
-            if jobDescription.command is None:
+            if not jobDescription.has_body():
 
                 def stackSizeFn() -> int:
                     return len(list(jobDescription.allSuccessors()))
+
                 startStackSize = stackSizeFn()
                 # Remove deleted jobs
                 jobDescription.filterSuccessors(haveJob)
@@ -959,16 +1029,25 @@
                 assert isinstance(serviceJobDescription, ServiceJobDescription)
 
                 if flag == 1:
-                    logger.debug("Recreating a start service flag for job: %s, flag: %s",
-                                 jobStoreID, newFlag)
+                    logger.debug(
+                        "Recreating a start service flag for job: %s, flag: %s",
+                        jobStoreID,
+                        newFlag,
+                    )
                     serviceJobDescription.startJobStoreID = newFlag
                 elif flag == 2:
-                    logger.debug("Recreating a terminate service flag for job: %s, flag: %s",
-                                 jobStoreID, newFlag)
+                    logger.debug(
+                        "Recreating a terminate service flag for job: %s, flag: %s",
+                        jobStoreID,
+                        newFlag,
+                    )
                     serviceJobDescription.terminateJobStoreID = newFlag
                 else:
-                    logger.debug("Recreating a error service flag for job: %s, flag: %s",
-                                 jobStoreID, newFlag)
+                    logger.debug(
+                        "Recreating a error service flag for job: %s, flag: %s",
+                        jobStoreID,
+                        newFlag,
+                    )
                     assert flag == 3
                     serviceJobDescription.errorJobStoreID = newFlag
 
@@ -981,6 +1060,7 @@
 
             def servicesSizeFn() -> int:
                 return len(jobDescription.services)
+
            startServicesSize = servicesSizeFn()
 
            def replaceFlagsIfNeeded(serviceJobDescription: JobDescription) -> None:
@@ -1041,12 +1121,14 @@
 
         # Remove any crufty stats/logging files from the previous run
         logger.debug("Discarding old statistics and logs...")
+
         # We have to manually discard the stream to avoid getting
         # stuck on a blocking write from the job store.
         def discardStream(stream: Union[IO[bytes], IO[str]]) -> None:
             """Read the stream 4K at a time until EOF, discarding all input."""
             while len(stream.read(4096)) != 0:
                 pass
+
         self.read_logs(discardStream)
 
         logger.debug("Job store is clean")
@@ -1058,7 +1140,7 @@
     # existence of jobs
     ##########################################
 
-    @deprecated(new_function_name='assign_job_id')
+    @deprecated(new_function_name="assign_job_id")
     def assignID(self, jobDescription: JobDescription) -> None:
         return self.assign_job_id(jobDescription)
 
@@ -1082,7 +1164,7 @@
         """
         yield
 
-    @deprecated(new_function_name='create_job')
+    @deprecated(new_function_name="create_job")
     def create(self, jobDescription: JobDescription) -> JobDescription:
         return self.create_job(jobDescription)
 
@@ -1098,7 +1180,7 @@
         """
         raise NotImplementedError()
 
-    @deprecated(new_function_name='job_exists')
+    @deprecated(new_function_name="job_exists")
     def exists(self, jobStoreID: str) -> bool:
         return self.job_exists(jobStoreID)
 
@@ -1114,7 +1196,7 @@
     # One year should be sufficient to finish any pipeline ;-)
     publicUrlExpiration = timedelta(days=365)
 
-    @deprecated(new_function_name='get_public_url')
+    @deprecated(new_function_name="get_public_url")
     def getPublicUrl(self, fileName: str) -> str:
         return self.get_public_url(fileName)
 
@@ -1133,7 +1215,7 @@
         """
         raise NotImplementedError()
 
-    @deprecated(new_function_name='get_shared_public_url')
+    @deprecated(new_function_name="get_shared_public_url")
     def getSharedPublicUrl(self, sharedFileName: str) -> str:
         return self.get_shared_public_url(sharedFileName)
 
@@ -1155,7 +1237,7 @@
         """
         raise NotImplementedError()
 
-    @deprecated(new_function_name='load_job')
+    @deprecated(new_function_name="load_job")
     def load(self, jobStoreID: str) -> JobDescription:
         return self.load_job(jobStoreID)
 
@@ -1175,7 +1257,7 @@
         """
         raise NotImplementedError()
 
-    @deprecated(new_function_name='update_job')
+    @deprecated(new_function_name="update_job")
     def update(self, jobDescription: JobDescription) -> None:
         return self.update_job(jobDescription)
 
@@ -1190,7 +1272,7 @@
         """
         raise NotImplementedError()
 
-    @deprecated(new_function_name='delete_job')
+    @deprecated(new_function_name="delete_job")
     def delete(self, jobStoreID: str) -> None:
         return self.delete_job(jobStoreID)
 
@@ -1227,12 +1309,19 @@
     # associated with a given job.
     ##########################################
 
-    @deprecated(new_function_name='write_file')
-    def writeFile(self, localFilePath: str, jobStoreID: Optional[str] = None, cleanup: bool = False) -> str:
+    @deprecated(new_function_name="write_file")
+    def writeFile(
+        self,
+        localFilePath: str,
+        jobStoreID: Optional[str] = None,
+        cleanup: bool = False,
+    ) -> str:
         return self.write_file(localFilePath, jobStoreID, cleanup)
 
     @abstractmethod
-    def write_file(self, local_path: str, job_id: Optional[str] = None, cleanup: bool = False) -> str:
+    def write_file(
+        self, local_path: str, job_id: Optional[str] = None, cleanup: bool = False
+    ) -> str:
         """
         Takes a file (as a path) and places it in this job store. Returns an ID that can be used
         to retrieve the file at a later time. The file is written in a atomic manner. It will
@@ -1263,19 +1352,27 @@
         """
         raise NotImplementedError()
 
-    @deprecated(new_function_name='write_file_stream')
-    def writeFileStream(self, jobStoreID: Optional[str] = None, cleanup: bool = False, basename: Optional[str] = None,
-                        encoding: Optional[str] = None, errors: Optional[str] = None) -> ContextManager[Tuple[IO[bytes], str]]:
+    @deprecated(new_function_name="write_file_stream")
+    def writeFileStream(
+        self,
+        jobStoreID: Optional[str] = None,
+        cleanup: bool = False,
+        basename: Optional[str] = None,
+        encoding: Optional[str] = None,
+        errors: Optional[str] = None,
+    ) -> ContextManager[tuple[IO[bytes], str]]:
         return self.write_file_stream(jobStoreID, cleanup, basename, encoding, errors)
 
     @abstractmethod
     @contextmanager
-    def write_file_stream(self,
-                          job_id: Optional[str] = None,
-                          cleanup: bool = False,
-                          basename: Optional[str] = None,
-                          encoding: Optional[str] = None,
-                          errors: Optional[str] = None) -> Iterator[Tuple[IO[bytes], str]]:
+    def write_file_stream(
+        self,
+        job_id: Optional[str] = None,
+        cleanup: bool = False,
+        basename: Optional[str] = None,
+        encoding: Optional[str] = None,
+        errors: Optional[str] = None,
+    ) -> Iterator[tuple[IO[bytes], str]]:
         """
         Similar to writeFile, but returns a context manager yielding a tuple of
         1) a file handle which can be written to and 2) the ID of the resulting
@@ -1314,18 +1411,22 @@
         """
         raise NotImplementedError()
 
-    @deprecated(new_function_name='get_empty_file_store_id')
-    def getEmptyFileStoreID(self,
-                            jobStoreID: Optional[str] = None,
-                            cleanup: bool = False,
-                            basename: Optional[str] = None) -> str:
+    @deprecated(new_function_name="get_empty_file_store_id")
+    def getEmptyFileStoreID(
+        self,
+        jobStoreID: Optional[str] = None,
+        cleanup: bool = False,
+        basename: Optional[str] = None,
+    ) -> str:
         return self.get_empty_file_store_id(jobStoreID, cleanup, basename)
 
     @abstractmethod
-    def get_empty_file_store_id(self,
-                                job_id: Optional[str] = None,
-                                cleanup: bool = False,
-                                basename: Optional[str] = None) -> str:
+    def get_empty_file_store_id(
+        self,
+        job_id: Optional[str] = None,
+        cleanup: bool = False,
+        basename: Optional[str] = None,
+    ) -> str:
         """
         Creates an empty file in the job store and returns its ID.
         Call to fileExists(getEmptyFileStoreID(jobStoreID)) will return True.
@@ -1347,8 +1448,10 @@
         """
         raise NotImplementedError()
 
-    @deprecated(new_function_name='read_file')
-    def readFile(self, jobStoreFileID: str, localFilePath: str, symlink: bool = False) -> None:
+    @deprecated(new_function_name="read_file")
+    def readFile(
+        self, jobStoreFileID: str, localFilePath: str, symlink: bool = False
+    ) -> None:
         return self.read_file(jobStoreFileID, localFilePath, symlink)
 
     @abstractmethod
@@ -1376,7 +1479,7 @@
         """
         raise NotImplementedError()
 
-    @deprecated(new_function_name='read_file_stream')
+    @deprecated(new_function_name="read_file_stream")
     def readFileStream(
         self,
         jobStoreFileID: str,
@@ -1391,14 +1494,12 @@
         file_id: Union[FileID, str],
         encoding: Literal[None] = None,
         errors: Optional[str] = None,
-    ) -> ContextManager[IO[bytes]]:
-        ...
+    ) -> ContextManager[IO[bytes]]: ...
 
     @overload
     def read_file_stream(
         self, file_id: Union[FileID, str], encoding: str, errors: Optional[str] = None
-    ) -> ContextManager[IO[str]]:
-        ...
+    ) -> ContextManager[IO[str]]: ...
 
     @abstractmethod
     def read_file_stream(
@@ -1424,7 +1525,7 @@
         """
         raise NotImplementedError()
 
-    @deprecated(new_function_name='delete_file')
+    @deprecated(new_function_name="delete_file")
     def deleteFile(self, jobStoreFileID: str) -> None:
         return self.delete_file(jobStoreFileID)
 
@@ -1438,7 +1539,7 @@
         """
         raise NotImplementedError()
 
-    @deprecated(new_function_name='file_exists')
+    @deprecated(new_function_name="file_exists")
     def fileExists(self, jobStoreFileID: str) -> bool:
         """Determine whether a file exists in this job store."""
         return self.file_exists(jobStoreFileID)
@@ -1452,7 +1553,7 @@
         """
         raise NotImplementedError()
 
-    @deprecated(new_function_name='get_file_size')
+    @deprecated(new_function_name="get_file_size")
     def getFileSize(self, jobStoreFileID: str) -> int:
         """Get the size of the given file in bytes."""
         return self.get_file_size(jobStoreFileID)
@@ -1472,7 +1573,7 @@
         """
         raise NotImplementedError()
 
-    @deprecated(new_function_name='update_file')
+    @deprecated(new_function_name="update_file")
     def updateFile(self, jobStoreFileID: str, localFilePath: str) -> None:
         """Replaces the existing version of a file in the job store."""
         return self.update_file(jobStoreFileID, localFilePath)
@@ -1493,19 +1594,20 @@
         """
         raise NotImplementedError()
 
-    @deprecated(new_function_name='update_file_stream')
-    def updateFileStream(self,
-                         jobStoreFileID: str,
-                         encoding: Optional[str] = None,
-                         errors: Optional[str] = None) -> ContextManager[IO[Any]]:
+    @deprecated(new_function_name="update_file_stream")
+    def updateFileStream(
+        self,
+        jobStoreFileID: str,
+        encoding: Optional[str] = None,
+        errors: Optional[str] = None,
+    ) -> ContextManager[IO[Any]]:
         return self.update_file_stream(jobStoreFileID, encoding, errors)
 
     @abstractmethod
     @contextmanager
-    def update_file_stream(self,
-                           file_id: str,
-                           encoding: Optional[str] = None,
-                           errors: Optional[str] = None) -> Iterator[IO[Any]]:
+    def update_file_stream(
+        self, file_id: str, encoding: Optional[str] = None, errors: Optional[str] = None
+    ) -> Iterator[IO[Any]]:
         """
         Replaces the existing version of a file in the job store. Similar to writeFile, but
         returns a context manager yielding a file handle which can be written to. The
@@ -1531,20 +1633,29 @@
     # with specific jobs.
     ##########################################
 
-    sharedFileNameRegex = re.compile(r'^[a-zA-Z0-9._-]+$')
+    sharedFileNameRegex = re.compile(r"^[a-zA-Z0-9._-]+$")
 
-    @deprecated(new_function_name='write_shared_file_stream')
-    def writeSharedFileStream(self, sharedFileName: str, isProtected: Optional[bool] = None, encoding: Optional[str] = None,
-                              errors: Optional[str] = None) -> ContextManager[IO[bytes]]:
-        return self.write_shared_file_stream(sharedFileName, isProtected, encoding, errors)
+    @deprecated(new_function_name="write_shared_file_stream")
+    def writeSharedFileStream(
+        self,
+        sharedFileName: str,
+        isProtected: Optional[bool] = None,
+        encoding: Optional[str] = None,
+        errors: Optional[str] = None,
+    ) -> ContextManager[IO[bytes]]:
+        return self.write_shared_file_stream(
+            sharedFileName, isProtected, encoding, errors
+        )
 
     @abstractmethod
     @contextmanager
-    def write_shared_file_stream(self,
-                                 shared_file_name: str,
-                                 encrypted: Optional[bool] = None,
-                                 encoding: Optional[str] = None,
-                                 errors: Optional[str] = None) -> Iterator[IO[bytes]]:
+    def write_shared_file_stream(
+        self,
+        shared_file_name: str,
+        encrypted: Optional[bool] = None,
+        encoding: Optional[str] = None,
+        errors: Optional[str] = None,
+    ) -> Iterator[IO[bytes]]:
         """
         Returns a context manager yielding a writable file handle to the global file referenced
         by the given name. File will be created in an atomic manner.
@@ -1569,19 +1680,23 @@
         """
         raise NotImplementedError()
 
-    @deprecated(new_function_name='read_shared_file_stream')
-    def readSharedFileStream(self,
-                             sharedFileName: str,
-                             encoding: Optional[str] = None,
-                             errors: Optional[str] = None) -> ContextManager[IO[bytes]]:
+    @deprecated(new_function_name="read_shared_file_stream")
+    def readSharedFileStream(
+        self,
+        sharedFileName: str,
+        encoding: Optional[str] = None,
+        errors: Optional[str] = None,
+    ) -> ContextManager[IO[bytes]]:
         return self.read_shared_file_stream(sharedFileName, encoding, errors)
 
     @abstractmethod
     @contextmanager
-    def read_shared_file_stream(self,
-                                shared_file_name: str,
-                                encoding: Optional[str] = None,
-                                errors: Optional[str] = None) -> Iterator[IO[bytes]]:
+    def read_shared_file_stream(
+        self,
+        shared_file_name: str,
+        encoding: Optional[str] = None,
+        errors: Optional[str] = None,
+    ) -> Iterator[IO[bytes]]:
         """
         Returns a context manager yielding a readable file handle to the global file referenced
         by the given name.
@@ -1600,7 +1715,7 @@
         """
         raise NotImplementedError()
 
-    @deprecated(new_function_name='write_logs')
+    @deprecated(new_function_name="write_logs")
     def writeStatsAndLogging(self, statsAndLoggingString: str) -> None:
         return self.write_logs(statsAndLoggingString)
 
@@ -1616,8 +1731,10 @@
         """
         raise NotImplementedError()
 
-    @deprecated(new_function_name='read_logs')
-    def readStatsAndLogging(self, callback: Callable[..., Any], readAll: bool = False) -> int:
+    @deprecated(new_function_name="read_logs")
+    def readStatsAndLogging(
+        self, callback: Callable[..., Any], readAll: bool = False
+    ) -> int:
         return self.read_logs(callback, readAll)
 
     @abstractmethod
@@ -1652,8 +1769,8 @@
         this method. Other methods will rely on always having the most current
         pid available. So far there is no reason to store any old pids.
         """
-        with self.write_shared_file_stream('pid.log') as f:
-            f.write(str(os.getpid()).encode('utf-8'))
+        with self.write_shared_file_stream("pid.log") as f:
+            f.write(str(os.getpid()).encode("utf-8"))
 
     def read_leader_pid(self) -> int:
         """
@@ -1661,7 +1778,7 @@
 
         :raise NoSuchFileException: If the PID file doesn't exist.
         """
-        with self.read_shared_file_stream('pid.log') as f:
+        with self.read_shared_file_stream("pid.log") as f:
            return int(f.read().strip())
 
     def write_leader_node_id(self) -> None:
@@ -1670,7 +1787,7 @@
        by the leader.
        """
        with self.write_shared_file_stream("leader_node_id.log") as f:
-            f.write(getNodeID().encode('utf-8'))
+            f.write(getNodeID().encode("utf-8"))
 
    def read_leader_node_id(self) -> str:
        """
@@ -1679,7 +1796,7 @@
        :raise NoSuchFileException: If the node ID file doesn't exist.
        """
        with self.read_shared_file_stream("leader_node_id.log") as f:
-            return f.read().decode('utf-8').strip()
+            return f.read().decode("utf-8").strip()
 
    def write_kill_flag(self, kill: bool = False) -> None:
        """
@@ -1692,7 +1809,7 @@
        workers are expected to be cleaned up by the leader.
        """
        with self.write_shared_file_stream("_toil_kill_flag") as f:
-            f.write(("YES" if kill else "NO").encode('utf-8'))
+            f.write(("YES" if kill else "NO").encode("utf-8"))
 
    def read_kill_flag(self) -> bool:
        """
@@ -1733,25 +1850,40 @@
     if not cls._validateSharedFileName(sharedFileName):
         raise ValueError("Not a valid shared file name: '%s'." % sharedFileName)
 
+
 class JobStoreSupport(AbstractJobStore, metaclass=ABCMeta):
     """
     A mostly fake JobStore to access URLs not really associated with real job
     stores.
     """
 
+    @classmethod
+    def _setup_ftp(cls) -> FtpFsAccess:
+        # FTP connections are not reused. Ideally, a thread should watch any reused FTP connections
+        # and close them when necessary
+        return FtpFsAccess()
+
     @classmethod
     def _supports_url(cls, url: ParseResult, export: bool = False) -> bool:
-        return url.scheme.lower() in ('http', 'https', 'ftp') and not export
+        return url.scheme.lower() in ("http", "https", "ftp") and not export
 
     @classmethod
     def _url_exists(cls, url: ParseResult) -> bool:
+        # Deal with FTP first to support user/password auth
+        if url.scheme.lower() == "ftp":
+            ftp = cls._setup_ftp()
+            return ftp.exists(url.geturl())
+
         try:
-            # TODO: Figure out how to HEAD instead of this.
-            with cls._open_url(url):
+            with closing(urlopen(Request(url.geturl(), method="HEAD"))):
                 return True
-        except:
-            pass
-        return False
+        except HTTPError as e:
+            if e.code in (404, 410):
+                return False
+            else:
+                raise
+        # Any other errors we should pass through because something really went
+        # wrong (e.g. server is broken today but file may usually exist)
 
     @classmethod
     @retry(
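`_url_exists` now resolves the old TODO: instead of opening the URL (a full GET) it issues a HEAD request, treats 404 and 410 as a definite "no", and lets every other HTTP error propagate so a flaky server is not mistaken for a missing file. A standalone sketch of the same probe using only the stdlib (this is not the toil method itself, and the demo URLs are placeholders):

```python
from contextlib import closing
from urllib.error import HTTPError
from urllib.request import Request, urlopen

def http_url_exists(url: str) -> bool:
    """HEAD-probe a URL: 404/410 mean 'no'; other errors propagate."""
    try:
        with closing(urlopen(Request(url, method="HEAD"))):
            return True
    except HTTPError as e:
        if e.code in (404, 410):
            return False
        raise  # e.g. a 503 means "unknown", not "missing"

print(http_url_exists("https://example.com/"))  # expected: True
```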
@@ -1761,17 +1893,19 @@ class JobStoreSupport(AbstractJobStore, metaclass=ABCMeta):
         ]
     )
     def _get_size(cls, url: ParseResult) -> Optional[int]:
-        if url.scheme.lower() == 'ftp':
-            return None
-        with closing(urlopen(url.geturl())) as readable:
-            # just read the header for content length
-            size = readable.info().get('content-length')
-            return int(size) if size is not None else None
+        if url.scheme.lower() == "ftp":
+            ftp = cls._setup_ftp()
+            return ftp.size(url.geturl())
+
+        # just read the header for content length
+        resp = urlopen(Request(url.geturl(), method="HEAD"))
+        size = resp.info().get("content-length")
+        return int(size) if size is not None else None
 
     @classmethod
     def _read_from_url(
         cls, url: ParseResult, writable: Union[IO[bytes], IO[str]]
-    ) -> Tuple[int, bool]:
+    ) -> tuple[int, bool]:
         # We can't actually retry after we start writing.
         # TODO: Implement retry with byte range requests
         with cls._open_url(url) as readable:
@@ -1780,8 +1914,10 @@
             # nested function can modify it without creating its own
             # local with the same name.
             size = [0]
+
             def count(l: int) -> None:
                 size[0] += l
+
             counter = WriteWatchingStream(writable)
             counter.onWrite(count)
 
@@ -1793,18 +1929,32 @@
     @retry(
         errors=[
             BadStatusLine,
-            ErrorCondition(error=HTTPError, error_codes=[408, 500, 503]),
+            ErrorCondition(error=HTTPError, error_codes=[408, 429, 500, 502, 503]),
         ]
     )
     def _open_url(cls, url: ParseResult) -> IO[bytes]:
+        # Deal with FTP first so we support user/password auth
+        if url.scheme.lower() == "ftp":
+            ftp = cls._setup_ftp()
+            # we open in read mode as write mode is not supported
+            return ftp.open(url.geturl(), mode="r")
+
         try:
             return cast(IO[bytes], closing(urlopen(url.geturl())))
         except HTTPError as e:
-            if e.code == 404:
+            if e.code in (404, 410):
                 # Translate into a FileNotFoundError for detecting
-                # un-importable files
+                # known nonexistent files
                 raise FileNotFoundError(str(url)) from e
             else:
+                # Other codes indicate a real problem with the server; we don't
+                # want to e.g. run a workflow without an optional input that
+                # the user specified a path to just because the server was
+                # busy.
+
+                # Sometimes we expect to see this when polling existence for
+                # inputs at guessed paths, so don't complain *too* loudly here.
+                logger.debug("Unusual status %d for URL %s", e.code, str(url))
                 raise
 
     @classmethod
@@ -1813,6 +1963,6 @@ class JobStoreSupport(AbstractJobStore, metaclass=ABCMeta):
         return False
 
     @classmethod
-    def _list_url(cls, url: ParseResult) -> List[str]:
+    def _list_url(cls, url: ParseResult) -> list[str]:
         # TODO: Implement HTTP index parsing and FTP directory listing
         raise NotImplementedError("HTTP and FTP URLs cannot yet be listed")