PyPI - toil - Versions diffs - 6.0.0__py3-none-any.whl → 6.1.0__py3-none-any.whl - Mend

toil 6.0.0__py3-none-any.whl → 6.1.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (51) hide show

toil/batchSystems/abstractBatchSystem.py +19 -4
toil/batchSystems/abstractGridEngineBatchSystem.py +22 -22
toil/batchSystems/cleanup_support.py +7 -3
toil/batchSystems/lsf.py +7 -7
toil/batchSystems/slurm.py +85 -14
toil/bus.py +38 -0
toil/common.py +20 -18
toil/cwl/cwltoil.py +81 -63
toil/exceptions.py +1 -1
toil/fileStores/abstractFileStore.py +53 -4
toil/fileStores/cachingFileStore.py +4 -20
toil/fileStores/nonCachingFileStore.py +5 -14
toil/job.py +46 -30
toil/jobStores/abstractJobStore.py +21 -23
toil/jobStores/aws/utils.py +5 -4
toil/jobStores/fileJobStore.py +1 -1
toil/leader.py +17 -14
toil/lib/conversions.py +19 -0
toil/lib/generatedEC2Lists.py +8 -8
toil/lib/io.py +28 -2
toil/lib/resources.py +8 -1
toil/lib/threading.py +27 -12
toil/options/common.py +5 -7
toil/options/wdl.py +5 -0
toil/provisioners/abstractProvisioner.py +8 -0
toil/statsAndLogging.py +36 -8
toil/test/batchSystems/test_slurm.py +21 -6
toil/test/cactus/__init__.py +0 -0
toil/test/cactus/test_cactus_integration.py +58 -0
toil/test/cwl/cwlTest.py +243 -151
toil/test/docs/scriptsTest.py +2 -2
toil/test/jobStores/jobStoreTest.py +7 -5
toil/test/lib/test_ec2.py +1 -1
toil/test/options/__init__.py +13 -0
toil/test/options/options.py +37 -0
toil/test/provisioners/clusterTest.py +9 -8
toil/test/utils/toilDebugTest.py +1 -1
toil/test/utils/utilsTest.py +3 -3
toil/test/wdl/wdltoil_test.py +91 -16
toil/utils/toilDebugFile.py +1 -1
toil/utils/toilStats.py +309 -266
toil/utils/toilStatus.py +1 -1
toil/version.py +9 -9
toil/wdl/wdltoil.py +341 -189
toil/worker.py +31 -16
{toil-6.0.0.dist-info → toil-6.1.0.dist-info}/METADATA +6 -7
{toil-6.0.0.dist-info → toil-6.1.0.dist-info}/RECORD +51 -47
{toil-6.0.0.dist-info → toil-6.1.0.dist-info}/LICENSE +0 -0
{toil-6.0.0.dist-info → toil-6.1.0.dist-info}/WHEEL +0 -0
{toil-6.0.0.dist-info → toil-6.1.0.dist-info}/entry_points.txt +0 -0
{toil-6.0.0.dist-info → toil-6.1.0.dist-info}/top_level.txt +0 -0

toil/jobStores/aws/utils.py CHANGED Viewed

@@ -17,13 +17,12 @@ import logging
 import os
 import types
 from ssl import SSLError
-from typing import Optional, cast
+from typing import Optional, cast, TYPE_CHECKING
 from boto3.s3.transfer import TransferConfig
 from boto.exception import SDBResponseError
 from botocore.client import Config
 from botocore.exceptions import ClientError
-from mypy_boto3_s3 import S3Client, S3ServiceResource
 from toil.lib.aws import session
 from toil.lib.aws.utils import connection_reset, get_bucket_region
@@ -36,6 +35,8 @@ from toil.lib.retry import (DEFAULT_DELAYS,
                             get_error_status,
                             old_retry,
                             retry)
+if TYPE_CHECKING:
+    from mypy_boto3_s3 import S3Client, S3ServiceResource
 logger = logging.getLogger(__name__)
@@ -290,7 +291,7 @@ class ServerSideCopyProhibitedError(RuntimeError):
     error=ClientError,
     error_codes=[404, 500, 502, 503, 504]
 )])
-def copyKeyMultipart(resource: S3ServiceResource,
+def copyKeyMultipart(resource: "S3ServiceResource",
                      srcBucketName: str,
                      srcKeyName: str,
                      srcKeyVersion: str,
@@ -346,7 +347,7 @@ def copyKeyMultipart(resource: S3ServiceResource,
     # not wherever the bucket virtual hostnames go.
     source_region = get_bucket_region(srcBucketName)
     source_client = cast(
-        S3Client,
+        "S3Client",
         session.client(
             's3',
             region_name=source_region,

toil/jobStores/fileJobStore.py CHANGED Viewed

@@ -920,7 +920,7 @@ class FileJobStore(AbstractJobStore):
         :raise NoSuchFileException: if the file with ID jobStoreFileID does
                                     not exist or is not a file
         """
-        if not self.file_exists(unquote(jobStoreFileID)):
+        if not self.file_exists(jobStoreFileID):
             raise NoSuchFileException(jobStoreFileID)
     def _get_arbitrary_jobs_dir_for_name(self, jobNameSlug):

toil/leader.py CHANGED Viewed

@@ -28,14 +28,16 @@ import enlighten
 from toil import resolveEntryPoint
 from toil.batchSystems import DeadlockException
 from toil.batchSystems.abstractBatchSystem import (AbstractBatchSystem,
-                                                   BatchJobExitReason)
+                                                   BatchJobExitReason,
+                                                   EXIT_STATUS_UNAVAILABLE_VALUE)
 from toil.bus import (JobCompletedMessage,
                       JobFailedMessage,
                       JobIssuedMessage,
                       JobMissingMessage,
                       JobUpdatedMessage,
                       QueueSizeMessage,
-                      gen_message_bus_path)
+                      gen_message_bus_path,
+                      get_job_kind)
 from toil.common import Config, ToilMetrics
 from toil.cwl.utils import CWL_UNSUPPORTED_REQUIREMENT_EXIT_CODE
 from toil.exceptions import FailedJobsException
@@ -705,8 +707,9 @@ class Leader:
             if exitStatus == 0:
                 logger.debug('Job ended: %s', updatedJob)
             else:
-                logger.warning(f'Job failed with exit value {exitStatus}: {updatedJob}\n'
-                               f'Exit reason: {exitReason}')
+                status_string = str(exitStatus) if exitStatus != EXIT_STATUS_UNAVAILABLE_VALUE else "<UNAVAILABLE>"
+                logger.warning(f'Job failed with exit value {status_string}: {updatedJob}\n'
+                               f'Exit reason: {BatchJobExitReason.to_string(exitReason)}')
                 if exitStatus == CWL_UNSUPPORTED_REQUIREMENT_EXIT_CODE:
                     # This is a CWL job informing us that the workflow is
                     # asking things of us that Toil can't do. When we raise an
@@ -715,7 +718,7 @@ class Leader:
                     logger.warning("This indicates an unsupported CWL requirement!")
                     self.recommended_fail_exit_code = CWL_UNSUPPORTED_REQUIREMENT_EXIT_CODE
             # Tell everyone it stopped running.
-            self._messages.publish(JobCompletedMessage(updatedJob.get_job_kind(), updatedJob.jobStoreID, exitStatus))
+            self._messages.publish(JobCompletedMessage(get_job_kind(updatedJob.get_names()), updatedJob.jobStoreID, exitStatus))
             self.process_finished_job(bsID, exitStatus, wall_time=wallTime, exit_reason=exitReason)
     def _processLostJobs(self):
@@ -921,7 +924,7 @@ class Leader:
                    "%s and %s",
                    jobNode, str(jobBatchSystemID), jobNode.requirements_string())
         # Tell everyone it is issued and the queue size changed
-        self._messages.publish(JobIssuedMessage(jobNode.get_job_kind(), jobNode.jobStoreID, jobBatchSystemID))
+        self._messages.publish(JobIssuedMessage(get_job_kind(jobNode.get_names()), jobNode.jobStoreID, jobBatchSystemID))
         self._messages.publish(QueueSizeMessage(self.getNumberOfJobsIssued()))
         # Tell the user there's another job to do
         self.progress_overall.total += 1
@@ -1157,7 +1160,7 @@ class Leader:
             self.progress_overall.update(incr=-1)
             self.progress_failed.update(incr=1)
-        # Delegate to the vers
+        # Delegate to the version that uses a JobDescription
         return self.process_finished_job_description(issued_job, result_status, wall_time, exit_reason, batch_system_id)
     def process_finished_job_description(self, finished_job: JobDescription, result_status: int,
@@ -1208,11 +1211,12 @@ class Leader:
                     # more memory efficient than read().striplines() while leaving off the
                     # trailing \n left when using readlines()
                     # http://stackoverflow.com/a/15233739
-                    StatsAndLogging.logWithFormatting(job_store_id, log_stream, method=logger.warning,
+                    StatsAndLogging.logWithFormatting(f'Log from job "{job_store_id}"', log_stream, method=logger.warning,
                                                       message='The job seems to have left a log file, indicating failure: %s' % replacement_job)
                 if self.config.writeLogs or self.config.writeLogsGzip:
                     with replacement_job.getLogFileHandle(self.jobStore) as log_stream:
-                        StatsAndLogging.writeLogFiles(replacement_job.chainedJobs, log_stream, self.config, failed=True)
+                        # Send log data from the job store to each per-job log file involved.
+                        StatsAndLogging.writeLogFiles([names.stats_name for names in replacement_job.get_chain()], log_stream, self.config, failed=True)
             if result_status != 0:
                 # If the batch system returned a non-zero exit code then the worker
                 # is assumed not to have captured the failure of the job, so we
@@ -1236,13 +1240,12 @@ class Leader:
                         else:
                             with log_stream:
                                 if os.path.getsize(log_file) > 0:
-                                    StatsAndLogging.logWithFormatting(job_store_id, log_stream, method=logger.warning,
+                                    StatsAndLogging.logWithFormatting(f'Log from job "{job_store_id}"', log_stream, method=logger.warning,
                                                                       message='The batch system left a non-empty file %s:' % log_file)
                                     if self.config.writeLogs or self.config.writeLogsGzip:
                                         file_root, _ = os.path.splitext(os.path.basename(log_file))
-                                        job_names = replacement_job.chainedJobs
-                                        if job_names is None:   # For jobs that fail this way, replacement_job.chainedJobs is not guaranteed to be set
-                                            job_names = [str(replacement_job)]
+                                        job_names = [names.stats_name for names in replacement_job.get_chain()]
+                                        # Tack the batch system log file name onto each job's name
                                         job_names = [j + '_' + file_root for j in job_names]
                                         log_stream.seek(0)
                                         StatsAndLogging.writeLogFiles(job_names, log_stream, self.config, failed=True)
@@ -1309,7 +1312,7 @@ class Leader:
         # Tell everyone it failed
-        self._messages.publish(JobFailedMessage(job_desc.get_job_kind(), job_id))
+        self._messages.publish(JobFailedMessage(get_job_kind(job_desc.get_names()), job_id))
         if job_id in self.toilState.service_to_client:
             # Is a service job

toil/lib/conversions.py CHANGED Viewed

@@ -128,3 +128,22 @@ def hms_duration_to_seconds(hms: str) -> float:
     seconds += float(vals_to_convert[2])
     return seconds
+def strtobool(val: str) -> bool:
+    """
+    Make a human-readable string into a bool.
+    Convert a string along the lines of "y", "1", "ON", "TrUe", or
+    "Yes" to True, and the corresponding false-ish values to False.
+    """
+    # We only track prefixes, so "y" covers "y", "yes",
+    # and "yeah no" and makes them all True.
+    TABLE = {True: ["1", "on", "y", "t"], False: ["0", "off", "n", "f"]}
+    lowered = val.lower()
+    for result, prefixes in TABLE.items():
+        for prefix in prefixes:
+            if lowered.startswith(prefix):
+                return result
+    raise ValueError(f"Cannot convert \"{val}\" to a bool")

toil 6.0.0__py3-none-any.whl → 6.1.0__py3-none-any.whl

toil 6.0.0__py3-none-any.whl → 6.1.0__py3-none-any.whl