PyPI - toil - Versions diffs - 6.1.0a1__py3-none-any.whl → 7.0.0__py3-none-any.whl - Mend

toil 6.1.0a1__py3-none-any.whl → 7.0.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (104) hide show

toil/__init__.py +1 -232
toil/batchSystems/abstractBatchSystem.py +41 -17
toil/batchSystems/abstractGridEngineBatchSystem.py +79 -65
toil/batchSystems/awsBatch.py +8 -8
toil/batchSystems/cleanup_support.py +7 -3
toil/batchSystems/contained_executor.py +4 -5
toil/batchSystems/gridengine.py +1 -1
toil/batchSystems/htcondor.py +5 -5
toil/batchSystems/kubernetes.py +25 -11
toil/batchSystems/local_support.py +3 -3
toil/batchSystems/lsf.py +9 -9
toil/batchSystems/mesos/batchSystem.py +4 -4
toil/batchSystems/mesos/executor.py +3 -2
toil/batchSystems/options.py +9 -0
toil/batchSystems/singleMachine.py +11 -10
toil/batchSystems/slurm.py +129 -16
toil/batchSystems/torque.py +1 -1
toil/bus.py +45 -3
toil/common.py +56 -31
toil/cwl/cwltoil.py +442 -371
toil/deferred.py +1 -1
toil/exceptions.py +1 -1
toil/fileStores/abstractFileStore.py +69 -20
toil/fileStores/cachingFileStore.py +6 -22
toil/fileStores/nonCachingFileStore.py +6 -15
toil/job.py +270 -86
toil/jobStores/abstractJobStore.py +37 -31
toil/jobStores/aws/jobStore.py +280 -218
toil/jobStores/aws/utils.py +60 -31
toil/jobStores/conftest.py +2 -2
toil/jobStores/fileJobStore.py +3 -3
toil/jobStores/googleJobStore.py +3 -4
toil/leader.py +89 -38
toil/lib/aws/__init__.py +26 -10
toil/lib/aws/iam.py +2 -2
toil/lib/aws/session.py +62 -22
toil/lib/aws/utils.py +73 -37
toil/lib/conversions.py +24 -1
toil/lib/ec2.py +118 -69
toil/lib/expando.py +1 -1
toil/lib/generatedEC2Lists.py +8 -8
toil/lib/io.py +42 -4
toil/lib/misc.py +1 -3
toil/lib/resources.py +57 -16
toil/lib/retry.py +12 -5
toil/lib/threading.py +29 -14
toil/lib/throttle.py +1 -1
toil/options/common.py +31 -30
toil/options/wdl.py +5 -0
toil/provisioners/__init__.py +9 -3
toil/provisioners/abstractProvisioner.py +12 -2
toil/provisioners/aws/__init__.py +20 -15
toil/provisioners/aws/awsProvisioner.py +406 -329
toil/provisioners/gceProvisioner.py +2 -2
toil/provisioners/node.py +13 -5
toil/server/app.py +1 -1
toil/statsAndLogging.py +93 -23
toil/test/__init__.py +27 -12
toil/test/batchSystems/batchSystemTest.py +40 -33
toil/test/batchSystems/batch_system_plugin_test.py +79 -0
toil/test/batchSystems/test_slurm.py +22 -7
toil/test/cactus/__init__.py +0 -0
toil/test/cactus/test_cactus_integration.py +58 -0
toil/test/cwl/cwlTest.py +245 -236
toil/test/cwl/seqtk_seq.cwl +1 -1
toil/test/docs/scriptsTest.py +11 -14
toil/test/jobStores/jobStoreTest.py +40 -54
toil/test/lib/aws/test_iam.py +2 -2
toil/test/lib/test_ec2.py +1 -1
toil/test/options/__init__.py +13 -0
toil/test/options/options.py +37 -0
toil/test/provisioners/aws/awsProvisionerTest.py +51 -34
toil/test/provisioners/clusterTest.py +99 -16
toil/test/server/serverTest.py +2 -2
toil/test/src/autoDeploymentTest.py +1 -1
toil/test/src/dockerCheckTest.py +2 -1
toil/test/src/environmentTest.py +125 -0
toil/test/src/fileStoreTest.py +1 -1
toil/test/src/jobDescriptionTest.py +18 -8
toil/test/src/jobTest.py +1 -1
toil/test/src/realtimeLoggerTest.py +4 -0
toil/test/src/workerTest.py +52 -19
toil/test/utils/toilDebugTest.py +62 -4
toil/test/utils/utilsTest.py +23 -21
toil/test/wdl/wdltoil_test.py +49 -21
toil/test/wdl/wdltoil_test_kubernetes.py +77 -0
toil/toilState.py +68 -9
toil/utils/toilDebugFile.py +1 -1
toil/utils/toilDebugJob.py +153 -26
toil/utils/toilLaunchCluster.py +12 -2
toil/utils/toilRsyncCluster.py +7 -2
toil/utils/toilSshCluster.py +7 -3
toil/utils/toilStats.py +310 -266
toil/utils/toilStatus.py +98 -52
toil/version.py +11 -11
toil/wdl/wdltoil.py +644 -225
toil/worker.py +125 -83
{toil-6.1.0a1.dist-info → toil-7.0.0.dist-info}/LICENSE +25 -0
toil-7.0.0.dist-info/METADATA +158 -0
{toil-6.1.0a1.dist-info → toil-7.0.0.dist-info}/RECORD +103 -96
{toil-6.1.0a1.dist-info → toil-7.0.0.dist-info}/WHEEL +1 -1
toil-6.1.0a1.dist-info/METADATA +0 -125
{toil-6.1.0a1.dist-info → toil-7.0.0.dist-info}/entry_points.txt +0 -0
{toil-6.1.0a1.dist-info → toil-7.0.0.dist-info}/top_level.txt +0 -0

toil/test/utils/utilsTest.py CHANGED Viewed

@@ -39,7 +39,7 @@ from toil.test import (ToilTest,
                        needs_rsync3,
                        slow)
 from toil.test.sort.sortTest import makeFileToSort
-from toil.utils.toilStats import getStats, processData
+from toil.utils.toilStats import get_stats, process_data
 from toil.utils.toilStatus import ToilStatus
 from toil.version import python
@@ -56,6 +56,7 @@ class UtilsTest(ToilTest):
         super().setUp()
         self.tempDir = self._createTempDir()
         self.tempFile = get_temp_file(rootDir=self.tempDir)
+        self.outputFile = get_temp_file(rootDir=self.tempDir)
         self.outputFile = 'someSortedStuff.txt'
         self.toilDir = os.path.join(self.tempDir, "jobstore")
         self.assertFalse(os.path.exists(self.toilDir))
@@ -73,9 +74,9 @@ class UtilsTest(ToilTest):
             '-m',
             'toil.test.sort.sort',
             f'file:{self.toilDir}',
+            f'--fileToSort={self.tempFile}',
+            f'--outputFile={self.outputFile}',
             '--clean=never',
-            '--numLines=1',
-            '--lineLength=1'
         ]
         self.restart_sort_workflow_cmd = [
@@ -91,7 +92,7 @@ class UtilsTest(ToilTest):
         if os.path.exists(self.toilDir):
             shutil.rmtree(self.toilDir)
-        for f in ['fileToSort.txt', 'sortedFile.txt', 'output.txt']:
+        for f in [self.tempFile, self.outputFile, os.path.join(self.tempDir, "output.txt")]:
             if os.path.exists(f):
                 os.remove(f)
@@ -298,8 +299,8 @@ class UtilsTest(ToilTest):
         config = Config()
         config.setOptions(options)
         jobStore = Toil.resumeJobStore(config.jobStore)
-        stats = getStats(jobStore)
-        collatedStats = processData(jobStore.config, stats)
+        stats = get_stats(jobStore)
+        collatedStats = process_data(jobStore.config, stats)
         self.assertTrue(len(collatedStats.job_types) == 2, "Some jobs are not represented in the stats.")
     def check_status(self, status, status_fn, seconds=20):
@@ -314,14 +315,14 @@ class UtilsTest(ToilTest):
     def testGetPIDStatus(self):
         """Test that ToilStatus.getPIDStatus() behaves as expected."""
         wf = subprocess.Popen(self.sort_workflow_cmd)
-        self.check_status('RUNNING', status_fn=ToilStatus.getPIDStatus, seconds=20)
+        self.check_status('RUNNING', status_fn=ToilStatus.getPIDStatus, seconds=60)
         wf.wait()
-        self.check_status('COMPLETED', status_fn=ToilStatus.getPIDStatus)
+        self.check_status('COMPLETED', status_fn=ToilStatus.getPIDStatus, seconds=60)
         # TODO: we need to reach into the FileJobStore's files and delete this
         #  shared file. We assume we know its internal layout.
         os.remove(os.path.join(self.toilDir, 'files/shared/pid.log'))
-        self.check_status('QUEUED', status_fn=ToilStatus.getPIDStatus)
+        self.check_status('QUEUED', status_fn=ToilStatus.getPIDStatus, seconds=60)
     def testGetStatusFailedToilWF(self):
         """
@@ -331,9 +332,9 @@ class UtilsTest(ToilTest):
         """
         # --badWorker is set to force failure.
         wf = subprocess.Popen(self.sort_workflow_cmd + ['--badWorker=1'])
-        self.check_status('RUNNING', status_fn=ToilStatus.getStatus)
+        self.check_status('RUNNING', status_fn=ToilStatus.getStatus, seconds=60)
         wf.wait()
-        self.check_status('ERROR', status_fn=ToilStatus.getStatus)
+        self.check_status('ERROR', status_fn=ToilStatus.getStatus, seconds=60)
     @needs_cwl
     @needs_docker
@@ -341,22 +342,22 @@ class UtilsTest(ToilTest):
         """Test that ToilStatus.getStatus() behaves as expected with a failing CWL workflow."""
         # --badWorker is set to force failure.
         cmd = ['toil-cwl-runner', '--jobStore', self.toilDir, '--clean=never', '--badWorker=1',
-               'src/toil/test/cwl/sorttool.cwl', '--reverse', '--input', 'src/toil/test/cwl/whale.txt']
+               'src/toil/test/cwl/sorttool.cwl', '--reverse', '--input', 'src/toil/test/cwl/whale.txt', f'--outdir={self.tempDir}']
         wf = subprocess.Popen(cmd)
-        self.check_status('RUNNING', status_fn=ToilStatus.getStatus)
+        self.check_status('RUNNING', status_fn=ToilStatus.getStatus, seconds=60)
         wf.wait()
-        self.check_status('ERROR', status_fn=ToilStatus.getStatus)
+        self.check_status('ERROR', status_fn=ToilStatus.getStatus, seconds=60)
     @needs_cwl
     @needs_docker
     def testGetStatusSuccessfulCWLWF(self):
         """Test that ToilStatus.getStatus() behaves as expected with a successful CWL workflow."""
         cmd = ['toil-cwl-runner', '--jobStore', self.toilDir, '--clean=never',
-               'src/toil/test/cwl/sorttool.cwl', '--reverse', '--input', 'src/toil/test/cwl/whale.txt']
+               'src/toil/test/cwl/sorttool.cwl', '--reverse', '--input', 'src/toil/test/cwl/whale.txt', f'--outdir={self.tempDir}']
         wf = subprocess.Popen(cmd)
-        self.check_status('RUNNING', status_fn=ToilStatus.getStatus, seconds=20)
+        self.check_status('RUNNING', status_fn=ToilStatus.getStatus, seconds=60)
         wf.wait()
-        self.check_status('COMPLETED', status_fn=ToilStatus.getStatus)
+        self.check_status('COMPLETED', status_fn=ToilStatus.getStatus, seconds=60)
     @needs_cwl
     @patch('builtins.print')
@@ -375,23 +376,24 @@ class UtilsTest(ToilTest):
         args, kwargs = mock_print.call_args
         self.assertIn('invalidcommand', args[0])
+    @pytest.mark.timeout(1200)
     def testRestartAttribute(self):
         """
-        Test that the job store is only destroyed when we observe a succcessful workflow run.
+        Test that the job store is only destroyed when we observe a successful workflow run.
         The following simulates a failing workflow that attempts to resume without restart().
         In this case, the job store should not be destroyed until restart() is called.
         """
         # Run a workflow that will always fail
-        cmd = self.restart_sort_workflow_cmd + ['--badWorker=1']
+        cmd = self.restart_sort_workflow_cmd + ['--badWorker=1', '--logDebug']
         subprocess.run(cmd)
-        restart_cmd = self.restart_sort_workflow_cmd + ['--badWorker=0', '--restart']
+        restart_cmd = self.restart_sort_workflow_cmd + ['--badWorker=0', '--logDebug', '--restart']
         subprocess.run(restart_cmd)
         # Check the job store exists after restart attempt
         self.assertTrue(os.path.exists(self.toilDir))
-        successful_cmd = [python, '-m', 'toil.test.sort.sort', 'file:' + self.toilDir,
+        successful_cmd = [python, '-m', 'toil.test.sort.sort', '--logDebug', 'file:' + self.toilDir,
                                   '--restart']
         subprocess.run(successful_cmd)

toil/test/wdl/wdltoil_test.py CHANGED Viewed

@@ -3,27 +3,31 @@ import os
 import shutil
 import subprocess
 import unittest
-import uuid
-from typing import Any, Dict, List, Optional, Set
-from unittest.mock import patch
+from uuid import uuid4
+from typing import Optional
 from unittest.mock import patch
 from typing import Any, Dict, List, Set
+import pytest
+from toil.provisioners import cluster_factory
 from toil.test import (ToilTest,
                        needs_docker_cuda,
                        needs_google_storage,
                        needs_singularity_or_docker,
-                       slow)
+                       needs_wdl,
+                       slow, integrative)
 from toil.version import exactPython
 from toil.wdl.wdltoil import WDLSectionJob, WDLWorkflowGraph
+@needs_wdl
 class BaseWDLTest(ToilTest):
     """Base test class for WDL tests."""
     def setUp(self) -> None:
         """Runs anew before each test to create farm fresh temp dirs."""
-        self.output_dir = os.path.join('/tmp/', 'toil-wdl-test-' + str(uuid.uuid4()))
+        self.output_dir = os.path.join('/tmp/', 'toil-wdl-test-' + str(uuid4()))
         os.makedirs(self.output_dir)
     def tearDown(self) -> None:
@@ -36,11 +40,12 @@ class WDLConformanceTests(BaseWDLTest):
     WDL conformance tests for Toil.
     """
     wdl_dir = "wdl-conformance-tests"
     @classmethod
     def setUpClass(cls) -> None:
         url = "https://github.com/DataBiosphere/wdl-conformance-tests.git"
-        commit = "032fb99a1458d456b6d5f17d27928469ec1a1c68"
+        commit = "c87b62b4f460e009fd42edec13669c4db14cf90c"
         p = subprocess.Popen(
             f"git clone {url} {cls.wdl_dir} && cd {cls.wdl_dir} && git checkout {commit}",
@@ -59,7 +64,7 @@ class WDLConformanceTests(BaseWDLTest):
     # estimated running time: 2 minutes
     @slow
     def test_conformance_tests_v10(self):
-        tests_to_run = "0,1,5-7,9-15,17,22-24,26,28-30,32-40,53,57-59,62,67-69"
+        tests_to_run = "0-15,17-20,22-71,73-77"
         p = subprocess.run(self.base_command + ["-v", "1.0", "-n", tests_to_run], capture_output=True)
         if p.returncode != 0:
@@ -70,7 +75,7 @@ class WDLConformanceTests(BaseWDLTest):
     # estimated running time: 2 minutes
     @slow
     def test_conformance_tests_v11(self):
-        tests_to_run = "2-11,13-15,17-20,22-24,26,29,30,32-40,53,57-59,62,67-69"
+        tests_to_run = "1-63,65-71,73-75,77"
         p = subprocess.run(self.base_command + ["-v", "1.1", "-n", tests_to_run], capture_output=True)
         if p.returncode != 0:
@@ -78,6 +83,16 @@ class WDLConformanceTests(BaseWDLTest):
         p.check_returncode()
+    @slow
+    def test_conformance_tests_integration(self):
+        ids_to_run = "encode,tut01,tut02,tut03,tut04"
+        p = subprocess.run(self.base_command + ["-v", "1.0", "--id", ids_to_run], capture_output=True)
+        if p.returncode != 0:
+            print(p.stdout.decode('utf-8', errors='replace'))
+        p.check_returncode()
     @classmethod
     def tearDownClass(cls) -> None:
         upper_dir = os.path.dirname(os.getcwd())
@@ -87,6 +102,7 @@ class WDLConformanceTests(BaseWDLTest):
 class WDLTests(BaseWDLTest):
     """Tests for Toil's MiniWDL-based implementation."""
     @classmethod
     def setUpClass(cls) -> None:
         """Runs once for all tests."""
@@ -101,7 +117,8 @@ class WDLTests(BaseWDLTest):
         wdl = os.path.abspath('src/toil/test/wdl/md5sum/md5sum.1.0.wdl')
         json_file = os.path.abspath('src/toil/test/wdl/md5sum/md5sum.json')
-        result_json = subprocess.check_output(self.base_command + [wdl, json_file, '-o', self.output_dir, '--logDebug', '--retryCount=0'])
+        result_json = subprocess.check_output(
+            self.base_command + [wdl, json_file, '-o', self.output_dir, '--logDebug', '--retryCount=0'])
         result = json.loads(result_json)
         assert 'ga4ghMd5.value' in result
@@ -109,13 +126,23 @@ class WDLTests(BaseWDLTest):
         assert os.path.exists(result['ga4ghMd5.value'])
         assert os.path.basename(result['ga4ghMd5.value']) == 'md5sum.txt'
+    def test_missing_output_directory(self):
+        """
+        Test if Toil can run a WDL workflow into a new directory.
+        """
+        wdl = os.path.abspath('src/toil/test/wdl/md5sum/md5sum.1.0.wdl')
+        json_file = os.path.abspath('src/toil/test/wdl/md5sum/md5sum.json')
+        subprocess.check_call(self.base_command + [wdl, json_file, '-o', os.path.join(self.output_dir, "does", "not", "exist"), '--logDebug', '--retryCount=0'])
     @needs_singularity_or_docker
     def test_miniwdl_self_test(self, extra_args: Optional[List[str]] = None) -> None:
         """Test if the MiniWDL self test runs and produces the expected output."""
         wdl_file = os.path.abspath('src/toil/test/wdl/miniwdl_self_test/self_test.wdl')
         json_file = os.path.abspath('src/toil/test/wdl/miniwdl_self_test/inputs.json')
-        result_json = subprocess.check_output(self.base_command + [wdl_file, json_file, '--logDebug', '-o', self.output_dir, '--outputDialect', 'miniwdl'] + (extra_args or []))
+        result_json = subprocess.check_output(
+            self.base_command + [wdl_file, json_file, '--logDebug', '-o', self.output_dir, '--outputDialect',
+                                 'miniwdl'] + (extra_args or []))
         result = json.loads(result_json)
         # Expect MiniWDL-style output with a designated "dir"
@@ -132,7 +159,7 @@ class WDLTests(BaseWDLTest):
         assert isinstance(outputs['hello_caller.message_files'], list)
         assert len(outputs['hello_caller.message_files']) == 2
         for item in outputs['hello_caller.message_files']:
-            # All the files should be strings in the "out" direcotry
+            # All the files should be strings in the "out" directory
             assert isinstance(item, str)
             assert item.startswith(out_dir)
@@ -172,7 +199,8 @@ class WDLTests(BaseWDLTest):
                 "GiraffeDeepVariant.runDeepVariantCallVariants.in_dv_gpu_container": "google/deepvariant:1.3.0-gpu"
             })
-        result_json = subprocess.check_output(self.base_command + [wdl_file, json_file, '-o', self.output_dir, '--outputDialect', 'miniwdl'])
+        result_json = subprocess.check_output(
+            self.base_command + [wdl_file, json_file, '-o', self.output_dir, '--outputDialect', 'miniwdl'])
         result = json.loads(result_json)
         # Expect MiniWDL-style output with a designated "dir"
@@ -200,7 +228,9 @@ class WDLTests(BaseWDLTest):
         wdl_file = f"{base_uri}/workflows/giraffe.wdl"
         json_file = f"{base_uri}/params/giraffe.json"
-        result_json = subprocess.check_output(self.base_command + [wdl_file, json_file, '-o', self.output_dir, '--outputDialect', 'miniwdl', '--scale', '0.1'])
+        result_json = subprocess.check_output(
+            self.base_command + [wdl_file, json_file, '-o', self.output_dir, '--outputDialect', 'miniwdl', '--scale',
+                                 '0.1'])
         result = json.loads(result_json)
         # Expect MiniWDL-style output with a designated "dir"
@@ -265,7 +295,6 @@ class WDLTests(BaseWDLTest):
         # worth extracting a base type for this interface.
         with patch.object(WDLWorkflowGraph, 'is_decl', mock_is_decl):
             with patch.object(WDLWorkflowGraph, 'get_transitive_dependencies', mock_get_transitive_dependencies):
                 with self.subTest(msg="Two unrelated decls can coalesce"):
                     # Set up two unrelated decls
                     all_decls = {"decl1", "decl2"}
@@ -275,7 +304,7 @@ class WDLTests(BaseWDLTest):
                     }
                     result = WDLSectionJob.coalesce_nodes(["decl1", "decl2"], WDLWorkflowGraph([]))
                     # Make sure they coalesced
                     assert len(result) == 1
                     assert "decl1" in result[0]
@@ -289,12 +318,11 @@ class WDLTests(BaseWDLTest):
                     }
                     result = WDLSectionJob.coalesce_nodes(["decl", "nondecl"], WDLWorkflowGraph([]))
                     assert len(result) == 2
                     assert len(result[0]) == 1
                     assert len(result[1]) == 1
                 with self.subTest(msg="Two adjacent decls with a common dependency can coalesce"):
                     all_decls = {"decl1", "decl2"}
                     all_deps = {
@@ -304,7 +332,7 @@ class WDLTests(BaseWDLTest):
                     }
                     result = WDLSectionJob.coalesce_nodes(["base", "decl1", "decl2"], WDLWorkflowGraph([]))
                     assert len(result) == 2
                     assert "base" in result[0]
                     assert "decl1" in result[1]
@@ -319,7 +347,7 @@ class WDLTests(BaseWDLTest):
                     }
                     result = WDLSectionJob.coalesce_nodes(["base", "decl1", "decl2"], WDLWorkflowGraph([]))
                     assert len(result) == 3
                     assert "base" in result[0]
@@ -332,7 +360,7 @@ class WDLTests(BaseWDLTest):
                     }
                     result = WDLSectionJob.coalesce_nodes(["decl1", "decl2", "successor"], WDLWorkflowGraph([]))
                     assert len(result) == 2
                     assert "decl1" in result[0]
                     assert "decl2" in result[0]

toil/test/wdl/wdltoil_test_kubernetes.py ADDED Viewed

@@ -0,0 +1,77 @@
+import unittest
+from toil.test.provisioners.clusterTest import AbstractClusterTest
+from uuid import uuid4
+import pytest
+from toil.provisioners import cluster_factory
+from toil.test import (slow, integrative)
+@integrative
+@slow
+@pytest.mark.timeout(600)
+class WDLKubernetesClusterTest(AbstractClusterTest):
+    """
+    Ensure WDL works on the Kubernetes batchsystem.
+    """
+    def __init__(self, name):
+        super().__init__(name)
+        self.clusterName = 'wdl-integration-test-' + str(uuid4())
+        # t2.medium is the minimum t2 instance that permits Kubernetes
+        self.leaderNodeType = "t2.medium"
+        self.instanceTypes = ["t2.medium"]
+        self.clusterType = "kubernetes"
+    def setUp(self) -> None:
+        super().setUp()
+        self.jobStore = f'aws:{self.awsRegion()}:wdl-test-{uuid4()}'
+    def launchCluster(self) -> None:
+        self.createClusterUtil(args=['--leaderStorage', str(self.requestedLeaderStorage),
+                                     '--nodeTypes', ",".join(self.instanceTypes),
+                                     '-w', ",".join(self.numWorkers),
+                                     '--nodeStorage', str(self.requestedLeaderStorage)])
+    def test_wdl_kubernetes_cluster(self):
+        """
+        Test that a wdl workflow works on a kubernetes cluster. Launches a cluster with 1 worker. This runs a wdl
+        workflow that performs an image pull on the worker.
+        :return:
+        """
+        self.numWorkers = "1"
+        self.requestedLeaderStorage = 30
+        # create the cluster
+        self.launchCluster()
+        # get leader
+        self.cluster = cluster_factory(
+            provisioner="aws", zone=self.zone, clusterName=self.clusterName
+        )
+        self.leader = self.cluster.getLeader()
+        url = "https://github.com/DataBiosphere/wdl-conformance-tests.git"
+        commit = "09b9659cd01473e836738a2e0dd205df0adb49c5"
+        wdl_dir = "wdl_conformance_tests"
+        # get the wdl-conformance-tests repo to get WDL tasks to run
+        self.sshUtil([
+            "bash",
+            "-c",
+            f"git clone {url} {wdl_dir} && cd {wdl_dir} && git checkout {commit}"
+        ])
+        # run on kubernetes batchsystem
+        toil_options = ['--batchSystem=kubernetes',
+                        f"--jobstore={self.jobStore}"]
+        # run WDL workflow that will run singularity
+        test_options = [f"tests/md5sum/md5sum.wdl", f"tests/md5sum/md5sum.json"]
+        self.sshUtil([
+            "bash",
+            "-c",
+            f"cd {wdl_dir} && toil-wdl-runner {' '.join(test_options)} {' '.join(toil_options)}"])
+if __name__ == "__main__":
+    unittest.main()  # run all tests

toil/toilState.py CHANGED Viewed

@@ -12,6 +12,7 @@
 # See the License for the specific language governing permissions and
 # limitations under the License.
 import logging
+import time
 from typing import Dict, Optional, Set
 from toil.bus import JobUpdatedMessage, MessageBus
@@ -183,12 +184,70 @@ class ToilState:
         if job_id in self.__job_database:
             # Update the one true copy in place
             old_truth = self.__job_database[job_id]
-            old_truth.check_new_version(new_truth)
+            old_truth.assert_is_not_newer_than(new_truth)
             old_truth.__dict__.update(new_truth.__dict__)
         else:
             # Just keep the new one
             self.__job_database[job_id] = new_truth
+    def reset_job_expecting_change(self, job_id: str, timeout: float) -> bool:
+        """
+        Discard any local modifications to a JobDescription.
+        Will make modifications from other hosts visible.
+        Will wait for up to timeout seconds for a modification (or deletion)
+        from another host to actually be visible.
+        Always replaces the JobDescription with what is stored in the job
+        store, even if no modification ends up being visible.
+        Returns True if an update was detected in time, and False otherwise.
+        """
+        start_time = time.time()
+        wait_time = 0.1
+        initially_known = job_id in self.__job_database
+        new_truth: Optional[JobDescription] = None
+        while True:
+            try:
+                new_truth = self.__job_store.load_job(job_id)
+            except NoSuchJobException:
+                # The job is gone now.
+                if job_id in self.__job_database:
+                    # So forget about it
+                    del self.__job_database[job_id]
+                    # TODO: Other collections may still reference it.
+                if initially_known:
+                    # Job was deleted, that's an update
+                    return True
+            else:
+                if job_id in self.__job_database:
+                    # We have an old version to compare against
+                    old_truth = self.__job_database[job_id]
+                    old_truth.assert_is_not_newer_than(new_truth)
+                    if old_truth.is_updated_by(new_truth):
+                        # Do the update
+                        old_truth.__dict__.update(new_truth.__dict__)
+                        return True
+                else:
+                    # Just keep the new one. That's an update.
+                    self.__job_database[job_id] = new_truth
+                    return True
+            # We looked but didn't get a good update
+            time_elapsed = time.time() - start_time
+            if time_elapsed >= timeout:
+                # We're out of time to check.
+                if new_truth is not None:
+                    # Commit whatever we managed to load to accomplish a real
+                    # reset.
+                    old_truth.__dict__.update(new_truth.__dict__)
+                return False
+            # Wait a little and poll again
+            time.sleep(min(timeout - time_elapsed, wait_time))
+            # Using exponential backoff
+            wait_time *= 2
     # The next 3 functions provide tracking of how many successor jobs a given job
     # is waiting on, exposing only legit operations.
     # TODO: turn these into messages?
@@ -247,10 +306,10 @@ class ToilState:
         :param jobDesc: The description for the root job of the workflow being run.
         """
-        # If the job description has a command, is a checkpoint, has services
+        # If the job description has a body, is a checkpoint, has services
         # or is ready to be deleted it is ready to be processed (i.e. it is updated)
         if (
-            jobDesc.command is not None
+            jobDesc.has_body()
             or (
                 isinstance(jobDesc, CheckpointJobDescription)
                 and jobDesc.checkpoint is not None
@@ -259,10 +318,10 @@ class ToilState:
             or jobDesc.nextSuccessors() is None
         ):
             logger.debug(
-                "Found job to run: %s, with command: %s, with checkpoint: %s, with "
+                "Found job to run: %s, with body: %s, with checkpoint: %s, with "
                 "services: %s, with no next successors: %s",
                 jobDesc.jobStoreID,
-                jobDesc.command is not None,
+                jobDesc.has_body(),
                 isinstance(jobDesc, CheckpointJobDescription)
                 and jobDesc.checkpoint is not None,
                 len(jobDesc.services) > 0,
@@ -272,18 +331,18 @@ class ToilState:
             self.bus.publish(JobUpdatedMessage(str(jobDesc.jobStoreID), 0))
             if isinstance(jobDesc, CheckpointJobDescription) and jobDesc.checkpoint is not None:
-                jobDesc.command = jobDesc.checkpoint
+                jobDesc.restore_checkpoint()
         else:  # There exist successors
             logger.debug(
                 "Adding job: %s to the state with %s successors",
                 jobDesc.jobStoreID,
-                len(jobDesc.nextSuccessors()),
+                len(jobDesc.nextSuccessors() or set()),
             )
             # Record the number of successors
             self.successorCounts[str(jobDesc.jobStoreID)] = len(
-                jobDesc.nextSuccessors()
+                jobDesc.nextSuccessors() or set()
             )
             def processSuccessorWithMultiplePredecessors(successor: JobDescription) -> None:
@@ -305,7 +364,7 @@ class ToilState:
                     self._buildToilState(successor)
             # For each successor
-            for successorJobStoreID in jobDesc.nextSuccessors():
+            for successorJobStoreID in jobDesc.nextSuccessors() or set():
                 # If the successor does not yet point back at a
                 # predecessor we have not yet considered it

toil/utils/toilDebugFile.py CHANGED Viewed

@@ -17,11 +17,11 @@ import logging
 import os.path
 import sys
 from typing import Optional
-from distutils.util import strtobool
 from toil.common import Config, Toil, parser_with_common_options
 from toil.jobStores.fileJobStore import FileJobStore
 from toil.lib.resources import glob
+from toil.lib.conversions import strtobool
 from toil.statsAndLogging import set_logging_from_options
 logger = logging.getLogger(__name__)

toil 6.1.0a1__py3-none-any.whl → 7.0.0__py3-none-any.whl

toil 6.1.0a1__py3-none-any.whl → 7.0.0__py3-none-any.whl