PyPI - toil - Versions diffs - 8.1.0b1__py3-none-any.whl → 9.0.0__py3-none-any.whl - Mend

toil 8.1.0b1-py3-none-any.whl → 9.0.0-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (275)

toil/__init__.py +0 -35
toil/batchSystems/abstractBatchSystem.py +1 -1
toil/batchSystems/abstractGridEngineBatchSystem.py +1 -1
toil/batchSystems/awsBatch.py +1 -1
toil/batchSystems/cleanup_support.py +1 -1
toil/batchSystems/kubernetes.py +53 -7
toil/batchSystems/local_support.py +1 -1
toil/batchSystems/mesos/batchSystem.py +13 -8
toil/batchSystems/mesos/test/__init__.py +3 -2
toil/batchSystems/registry.py +15 -118
toil/batchSystems/singleMachine.py +1 -1
toil/batchSystems/slurm.py +27 -26
toil/bus.py +5 -3
toil/common.py +59 -12
toil/cwl/cwltoil.py +81 -38
toil/cwl/utils.py +103 -3
toil/job.py +64 -49
toil/jobStores/abstractJobStore.py +35 -239
toil/jobStores/aws/jobStore.py +2 -1
toil/jobStores/fileJobStore.py +27 -2
toil/jobStores/googleJobStore.py +110 -33
toil/leader.py +9 -0
toil/lib/accelerators.py +4 -2
toil/lib/aws/utils.py.orig +504 -0
toil/lib/bioio.py +1 -1
toil/lib/docker.py +252 -91
toil/lib/dockstore.py +11 -3
toil/lib/exceptions.py +5 -3
toil/lib/generatedEC2Lists.py +81 -19
toil/lib/history.py +87 -13
toil/lib/history_submission.py +23 -9
toil/lib/io.py +34 -22
toil/lib/misc.py +8 -2
toil/lib/plugins.py +106 -0
toil/lib/resources.py +2 -1
toil/lib/threading.py +11 -10
toil/lib/url.py +320 -0
toil/options/common.py +8 -0
toil/options/cwl.py +13 -1
toil/options/runner.py +17 -10
toil/options/wdl.py +22 -0
toil/provisioners/aws/awsProvisioner.py +25 -2
toil/server/api_spec/LICENSE +201 -0
toil/server/api_spec/README.rst +5 -0
toil/server/app.py +12 -6
toil/server/cli/wes_cwl_runner.py +3 -2
toil/server/wes/abstract_backend.py +21 -43
toil/server/wes/toil_backend.py +2 -2
toil/test/__init__.py +275 -115
toil/test/batchSystems/batchSystemTest.py +228 -213
toil/test/batchSystems/batch_system_plugin_test.py +7 -0
toil/test/batchSystems/test_slurm.py +27 -0
toil/test/cactus/pestis.tar.gz +0 -0
toil/test/conftest.py +7 -0
toil/test/cwl/2.fasta +11 -0
toil/test/cwl/2.fastq +12 -0
toil/test/cwl/conftest.py +1 -1
toil/test/cwl/cwlTest.py +1175 -870
toil/test/cwl/directory/directory/file.txt +15 -0
toil/test/cwl/download_directory_file.json +4 -0
toil/test/cwl/download_directory_s3.json +4 -0
toil/test/cwl/download_file.json +6 -0
toil/test/cwl/download_http.json +6 -0
toil/test/cwl/download_https.json +6 -0
toil/test/cwl/download_s3.json +6 -0
toil/test/cwl/download_subdirectory_file.json +5 -0
toil/test/cwl/download_subdirectory_s3.json +5 -0
toil/test/cwl/empty.json +1 -0
toil/test/cwl/mock_mpi/fake_mpi.yml +8 -0
toil/test/cwl/mock_mpi/fake_mpi_run.py +42 -0
toil/test/cwl/optional-file-exists.json +6 -0
toil/test/cwl/optional-file-missing.json +6 -0
toil/test/cwl/preemptible_expression.json +1 -0
toil/test/cwl/revsort-job-missing.json +6 -0
toil/test/cwl/revsort-job.json +6 -0
toil/test/cwl/s3_secondary_file.json +16 -0
toil/test/cwl/seqtk_seq_job.json +6 -0
toil/test/cwl/stream.json +6 -0
toil/test/cwl/test_filename_conflict_resolution.ms/table.dat +0 -0
toil/test/cwl/test_filename_conflict_resolution.ms/table.f0 +0 -0
toil/test/cwl/test_filename_conflict_resolution.ms/table.f1 +0 -0
toil/test/cwl/test_filename_conflict_resolution.ms/table.f1i +0 -0
toil/test/cwl/test_filename_conflict_resolution.ms/table.f2 +0 -0
toil/test/cwl/test_filename_conflict_resolution.ms/table.f2_TSM0 +0 -0
toil/test/cwl/test_filename_conflict_resolution.ms/table.f3 +0 -0
toil/test/cwl/test_filename_conflict_resolution.ms/table.f3_TSM0 +0 -0
toil/test/cwl/test_filename_conflict_resolution.ms/table.f4 +0 -0
toil/test/cwl/test_filename_conflict_resolution.ms/table.f4_TSM0 +0 -0
toil/test/cwl/test_filename_conflict_resolution.ms/table.f5 +0 -0
toil/test/cwl/test_filename_conflict_resolution.ms/table.info +0 -0
toil/test/cwl/test_filename_conflict_resolution.ms/table.lock +0 -0
toil/test/cwl/whale.txt +16 -0
toil/test/docs/scripts/example_alwaysfail.py +38 -0
toil/test/docs/scripts/example_alwaysfail_with_files.wdl +33 -0
toil/test/docs/scripts/example_cachingbenchmark.py +117 -0
toil/test/docs/scripts/stagingExampleFiles/in.txt +1 -0
toil/test/docs/scripts/stagingExampleFiles/out.txt +2 -0
toil/test/docs/scripts/tutorial_arguments.py +23 -0
toil/test/docs/scripts/tutorial_debugging.patch +12 -0
toil/test/docs/scripts/tutorial_debugging_hangs.wdl +126 -0
toil/test/docs/scripts/tutorial_debugging_works.wdl +129 -0
toil/test/docs/scripts/tutorial_docker.py +20 -0
toil/test/docs/scripts/tutorial_dynamic.py +24 -0
toil/test/docs/scripts/tutorial_encapsulation.py +28 -0
toil/test/docs/scripts/tutorial_encapsulation2.py +29 -0
toil/test/docs/scripts/tutorial_helloworld.py +15 -0
toil/test/docs/scripts/tutorial_invokeworkflow.py +27 -0
toil/test/docs/scripts/tutorial_invokeworkflow2.py +30 -0
toil/test/docs/scripts/tutorial_jobfunctions.py +22 -0
toil/test/docs/scripts/tutorial_managing.py +29 -0
toil/test/docs/scripts/tutorial_managing2.py +56 -0
toil/test/docs/scripts/tutorial_multiplejobs.py +25 -0
toil/test/docs/scripts/tutorial_multiplejobs2.py +21 -0
toil/test/docs/scripts/tutorial_multiplejobs3.py +22 -0
toil/test/docs/scripts/tutorial_promises.py +25 -0
toil/test/docs/scripts/tutorial_promises2.py +30 -0
toil/test/docs/scripts/tutorial_quickstart.py +22 -0
toil/test/docs/scripts/tutorial_requirements.py +44 -0
toil/test/docs/scripts/tutorial_services.py +45 -0
toil/test/docs/scripts/tutorial_staging.py +45 -0
toil/test/docs/scripts/tutorial_stats.py +64 -0
toil/test/docs/scriptsTest.py +2 -1
toil/test/lib/aws/test_iam.py +3 -1
toil/test/lib/dockerTest.py +205 -122
toil/test/lib/test_history.py +101 -77
toil/test/lib/test_url.py +69 -0
toil/test/lib/url_plugin_test.py +105 -0
toil/test/provisioners/aws/awsProvisionerTest.py +13 -10
toil/test/provisioners/clusterTest.py +17 -4
toil/test/provisioners/gceProvisionerTest.py +17 -15
toil/test/server/serverTest.py +78 -36
toil/test/sort/sort.py +4 -1
toil/test/src/busTest.py +17 -17
toil/test/src/deferredFunctionTest.py +145 -132
toil/test/src/importExportFileTest.py +71 -63
toil/test/src/jobEncapsulationTest.py +27 -28
toil/test/src/jobServiceTest.py +149 -133
toil/test/src/jobTest.py +219 -211
toil/test/src/miscTests.py +66 -60
toil/test/src/promisedRequirementTest.py +163 -169
toil/test/src/regularLogTest.py +24 -24
toil/test/src/resourceTest.py +82 -76
toil/test/src/restartDAGTest.py +51 -47
toil/test/src/resumabilityTest.py +24 -19
toil/test/src/retainTempDirTest.py +60 -57
toil/test/src/systemTest.py +17 -13
toil/test/src/threadingTest.py +29 -32
toil/test/utils/ABCWorkflowDebug/B_file.txt +1 -0
toil/test/utils/ABCWorkflowDebug/debugWorkflow.py +204 -0
toil/test/utils/ABCWorkflowDebug/mkFile.py +16 -0
toil/test/utils/ABCWorkflowDebug/sleep.cwl +12 -0
toil/test/utils/ABCWorkflowDebug/sleep.yaml +1 -0
toil/test/utils/toilDebugTest.py +117 -102
toil/test/utils/toilKillTest.py +54 -53
toil/test/utils/utilsTest.py +303 -229
toil/test/wdl/lint_error.wdl +9 -0
toil/test/wdl/md5sum/empty_file.json +1 -0
toil/test/wdl/md5sum/md5sum-gs.json +1 -0
toil/test/wdl/md5sum/md5sum.1.0.wdl +32 -0
toil/test/wdl/md5sum/md5sum.input +1 -0
toil/test/wdl/md5sum/md5sum.json +1 -0
toil/test/wdl/md5sum/md5sum.wdl +25 -0
toil/test/wdl/miniwdl_self_test/inputs-namespaced.json +1 -0
toil/test/wdl/miniwdl_self_test/inputs.json +1 -0
toil/test/wdl/miniwdl_self_test/self_test.wdl +40 -0
toil/test/wdl/standard_library/as_map.json +16 -0
toil/test/wdl/standard_library/as_map_as_input.wdl +23 -0
toil/test/wdl/standard_library/as_pairs.json +7 -0
toil/test/wdl/standard_library/as_pairs_as_input.wdl +23 -0
toil/test/wdl/standard_library/ceil.json +3 -0
toil/test/wdl/standard_library/ceil_as_command.wdl +16 -0
toil/test/wdl/standard_library/ceil_as_input.wdl +16 -0
toil/test/wdl/standard_library/collect_by_key.json +1 -0
toil/test/wdl/standard_library/collect_by_key_as_input.wdl +23 -0
toil/test/wdl/standard_library/cross.json +11 -0
toil/test/wdl/standard_library/cross_as_input.wdl +19 -0
toil/test/wdl/standard_library/flatten.json +7 -0
toil/test/wdl/standard_library/flatten_as_input.wdl +18 -0
toil/test/wdl/standard_library/floor.json +3 -0
toil/test/wdl/standard_library/floor_as_command.wdl +16 -0
toil/test/wdl/standard_library/floor_as_input.wdl +16 -0
toil/test/wdl/standard_library/keys.json +8 -0
toil/test/wdl/standard_library/keys_as_input.wdl +24 -0
toil/test/wdl/standard_library/length.json +7 -0
toil/test/wdl/standard_library/length_as_input.wdl +16 -0
toil/test/wdl/standard_library/length_as_input_with_map.json +7 -0
toil/test/wdl/standard_library/length_as_input_with_map.wdl +17 -0
toil/test/wdl/standard_library/length_invalid.json +3 -0
toil/test/wdl/standard_library/range.json +3 -0
toil/test/wdl/standard_library/range_0.json +3 -0
toil/test/wdl/standard_library/range_as_input.wdl +17 -0
toil/test/wdl/standard_library/range_invalid.json +3 -0
toil/test/wdl/standard_library/read_boolean.json +3 -0
toil/test/wdl/standard_library/read_boolean_as_command.wdl +17 -0
toil/test/wdl/standard_library/read_float.json +3 -0
toil/test/wdl/standard_library/read_float_as_command.wdl +17 -0
toil/test/wdl/standard_library/read_int.json +3 -0
toil/test/wdl/standard_library/read_int_as_command.wdl +17 -0
toil/test/wdl/standard_library/read_json.json +3 -0
toil/test/wdl/standard_library/read_json_as_output.wdl +31 -0
toil/test/wdl/standard_library/read_lines.json +3 -0
toil/test/wdl/standard_library/read_lines_as_output.wdl +31 -0
toil/test/wdl/standard_library/read_map.json +3 -0
toil/test/wdl/standard_library/read_map_as_output.wdl +31 -0
toil/test/wdl/standard_library/read_string.json +3 -0
toil/test/wdl/standard_library/read_string_as_command.wdl +17 -0
toil/test/wdl/standard_library/read_tsv.json +3 -0
toil/test/wdl/standard_library/read_tsv_as_output.wdl +31 -0
toil/test/wdl/standard_library/round.json +3 -0
toil/test/wdl/standard_library/round_as_command.wdl +16 -0
toil/test/wdl/standard_library/round_as_input.wdl +16 -0
toil/test/wdl/standard_library/size.json +3 -0
toil/test/wdl/standard_library/size_as_command.wdl +17 -0
toil/test/wdl/standard_library/size_as_output.wdl +36 -0
toil/test/wdl/standard_library/stderr.json +3 -0
toil/test/wdl/standard_library/stderr_as_output.wdl +30 -0
toil/test/wdl/standard_library/stdout.json +3 -0
toil/test/wdl/standard_library/stdout_as_output.wdl +30 -0
toil/test/wdl/standard_library/sub.json +3 -0
toil/test/wdl/standard_library/sub_as_input.wdl +17 -0
toil/test/wdl/standard_library/sub_as_input_with_file.wdl +17 -0
toil/test/wdl/standard_library/transpose.json +6 -0
toil/test/wdl/standard_library/transpose_as_input.wdl +18 -0
toil/test/wdl/standard_library/write_json.json +6 -0
toil/test/wdl/standard_library/write_json_as_command.wdl +17 -0
toil/test/wdl/standard_library/write_lines.json +7 -0
toil/test/wdl/standard_library/write_lines_as_command.wdl +17 -0
toil/test/wdl/standard_library/write_map.json +6 -0
toil/test/wdl/standard_library/write_map_as_command.wdl +17 -0
toil/test/wdl/standard_library/write_tsv.json +6 -0
toil/test/wdl/standard_library/write_tsv_as_command.wdl +17 -0
toil/test/wdl/standard_library/zip.json +12 -0
toil/test/wdl/standard_library/zip_as_input.wdl +19 -0
toil/test/wdl/test.csv +3 -0
toil/test/wdl/test.tsv +3 -0
toil/test/wdl/testfiles/croo.wdl +38 -0
toil/test/wdl/testfiles/drop_files.wdl +62 -0
toil/test/wdl/testfiles/drop_files_subworkflow.wdl +13 -0
toil/test/wdl/testfiles/empty.txt +0 -0
toil/test/wdl/testfiles/not_enough_outputs.wdl +33 -0
toil/test/wdl/testfiles/random.wdl +66 -0
toil/test/wdl/testfiles/read_file.wdl +18 -0
toil/test/wdl/testfiles/string_file_coercion.json +1 -0
toil/test/wdl/testfiles/string_file_coercion.wdl +35 -0
toil/test/wdl/testfiles/test.json +4 -0
toil/test/wdl/testfiles/test_boolean.txt +1 -0
toil/test/wdl/testfiles/test_float.txt +1 -0
toil/test/wdl/testfiles/test_int.txt +1 -0
toil/test/wdl/testfiles/test_lines.txt +5 -0
toil/test/wdl/testfiles/test_map.txt +2 -0
toil/test/wdl/testfiles/test_string.txt +1 -0
toil/test/wdl/testfiles/url_to_file.wdl +13 -0
toil/test/wdl/testfiles/url_to_optional_file.wdl +14 -0
toil/test/wdl/testfiles/vocab.json +1 -0
toil/test/wdl/testfiles/vocab.wdl +66 -0
toil/test/wdl/testfiles/wait.wdl +34 -0
toil/test/wdl/wdl_specification/type_pair.json +23 -0
toil/test/wdl/wdl_specification/type_pair_basic.wdl +36 -0
toil/test/wdl/wdl_specification/type_pair_with_files.wdl +36 -0
toil/test/wdl/wdl_specification/v1_spec.json +1 -0
toil/test/wdl/wdl_specification/v1_spec_declaration.wdl +39 -0
toil/test/wdl/wdltoil_test.py +751 -529
toil/test/wdl/wdltoil_test_kubernetes.py +2 -2
toil/utils/toilSshCluster.py +23 -0
toil/utils/toilUpdateEC2Instances.py +1 -0
toil/version.py +5 -5
toil/wdl/wdltoil.py +518 -437
toil/worker.py +11 -6
{toil-8.1.0b1.dist-info → toil-9.0.0.dist-info}/METADATA +25 -24
toil-9.0.0.dist-info/RECORD +444 -0
{toil-8.1.0b1.dist-info → toil-9.0.0.dist-info}/WHEEL +1 -1
toil-8.1.0b1.dist-info/RECORD +0 -259
{toil-8.1.0b1.dist-info → toil-9.0.0.dist-info}/entry_points.txt +0 -0
{toil-8.1.0b1.dist-info → toil-9.0.0.dist-info/licenses}/LICENSE +0 -0
{toil-8.1.0b1.dist-info → toil-9.0.0.dist-info}/top_level.txt +0 -0

toil/test/cwl/cwlTest.py CHANGED Viewed

@@ -12,6 +12,7 @@
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
+from collections.abc import Generator
 import json
 import logging
 import os
@@ -20,7 +21,6 @@ import shutil
 import stat
 import subprocess
 import sys
-import unittest
 import uuid
 import zipfile
 from functools import partial
@@ -45,27 +45,30 @@ from toil.cwl.utils import (
     download_structure,
     visit_cwl_class_and_reduce,
     visit_top_cwl_class,
+    remove_redundant_mounts
 )
 from toil.fileStores import FileID
 from toil.fileStores.abstractFileStore import AbstractFileStore
+from toil.job import WorkerImportJob
 from toil.lib.threading import cpu_count
 from toil.test import (
-    ToilTest,
-    needs_aws_s3,
-    needs_cwl,
-    needs_docker,
-    needs_docker_cuda,
-    needs_gridengine,
-    needs_kubernetes,
-    needs_local_cuda,
-    needs_lsf,
-    needs_mesos,
-    needs_online,
-    needs_singularity_or_docker,
-    needs_slurm,
-    needs_torque,
-    needs_wes_server,
-    slow,
+    get_data,
+)
+from toil.test import (
+    pslow as slow,
+    pneeds_docker as needs_docker,
+    pneeds_cwl as needs_cwl,
+    pneeds_aws_s3 as needs_aws_s3,
+    pneeds_docker_cuda as needs_docker_cuda,
+    pneeds_gridengine as needs_gridengine,
+    pneeds_kubernetes as needs_kubernetes,
+    pneeds_local_cuda as needs_local_cuda,
+    pneeds_lsf as needs_lsf,
+    pneeds_mesos as needs_mesos,
+    pneeds_online as needs_online,
+    pneeds_slurm as needs_slurm,
+    pneeds_torque as needs_torque,
+    pneeds_wes_server as needs_wes_server,
 )
 log = logging.getLogger(__name__)
@@ -222,72 +225,58 @@ def run_conformance_tests(
         log.info("Unsuccessful return code is OK")
-TesterFuncType = Callable[[str, str, "CWLObjectType"], None]
+TesterFuncType = Callable[[Path, Path, "CWLObjectType", Path], None]
 @needs_cwl
-class CWLWorkflowTest(ToilTest):
+@pytest.mark.cwl
+class TestCWLWorkflow:
     """
     CWL tests included in Toil that don't involve the whole CWL conformance
     test suite. Tests Toil-specific functions like URL types supported for
     inputs.
     """
-    def setUp(self) -> None:
-        """Runs anew before each test to create farm fresh temp dirs."""
-        self.outDir = f"/tmp/toil-cwl-test-{str(uuid.uuid4())}"
-        os.makedirs(self.outDir)
-        self.rootDir = self._projectRootPath()
-        self.jobStoreDir = f"./jobstore-{str(uuid.uuid4())}"
-    def tearDown(self) -> None:
-        """Clean up outputs."""
-        if os.path.exists(self.outDir):
-            shutil.rmtree(self.outDir)
-        if os.path.exists(self.jobStoreDir):
-            shutil.rmtree(self.jobStoreDir)
-        unittest.TestCase.tearDown(self)
     def test_cwl_cmdline_input(self) -> None:
         """
         Test that running a CWL workflow with inputs specified on the command line passes.
         """
         from toil.cwl import cwltoil
-        cwlfile = "src/toil/test/cwl/conditional_wf.cwl"
-        args = [cwlfile, "--message", "str", "--sleep", "2"]
-        st = StringIO()
-        # If the workflow runs, it must have had options
-        cwltoil.main(args, stdout=st)
+        with get_data("test/cwl/conditional_wf.cwl") as cwlfile:
+            args = [str(cwlfile), "--message", "str", "--sleep", "2"]
+            st = StringIO()
+            # If the workflow runs, it must have had options
+            cwltoil.main(args, stdout=st)
     def _tester(
         self,
-        cwlfile: str,
-        jobfile: str,
+        cwlfile: Path,
+        jobfile: Path,
         expect: "CWLObjectType",
-        main_args: list[str] = [],
+        outdir: Path,
         out_name: str = "output",
-        output_here: bool = False,
+        main_args: Optional[list[str]] = None,
     ) -> None:
         from toil.cwl import cwltoil
         st = StringIO()
-        main_args = main_args[:]
-        if not output_here:
-            # Don't just dump output in the working directory.
-            main_args.extend(["--logDebug", "--outdir", self.outDir])
-        main_args.extend(
+        real_main_args = main_args or []
+        real_main_args.extend(
             [
-                os.path.join(self.rootDir, cwlfile),
-                os.path.join(self.rootDir, jobfile),
+                "--logDebug",
+                "--outdir",
+                str(outdir),
+                str(cwlfile),
+                str(jobfile),
             ]
         )
-        cwltoil.main(main_args, stdout=st)
+        cwltoil.main(real_main_args, stdout=st)
         out = json.loads(st.getvalue())
         out.get(out_name, {}).pop("http://commonwl.org/cwltool#generation", None)
         out.get(out_name, {}).pop("nameext", None)
         out.get(out_name, {}).pop("nameroot", None)
-        self.assertEqual(out, expect)
+        assert out == expect
         for k, v in expect.items():
             if (
@@ -298,11 +287,11 @@ class CWLWorkflowTest(ToilTest):
             ):
                 # This is a top-level output file.
                 # None of our output files should be executable.
-                self.assertTrue(os.path.exists(v["path"]))
-                self.assertFalse(os.stat(v["path"]).st_mode & stat.S_IXUSR)
+                assert os.path.exists(v["path"]) is True
+                assert (os.stat(v["path"]).st_mode & stat.S_IXUSR) == 0
     def _debug_worker_tester(
-        self, cwlfile: str, jobfile: str, expect: "CWLObjectType"
+        self, cwlfile: Path, jobfile: Path, expect: "CWLObjectType", outdir: Path
     ) -> None:
         from toil.cwl import cwltoil
@@ -311,9 +300,9 @@ class CWLWorkflowTest(ToilTest):
             [
                 "--debugWorker",
                 "--outdir",
-                self.outDir,
-                os.path.join(self.rootDir, cwlfile),
-                os.path.join(self.rootDir, jobfile),
+                str(outdir),
+                str(cwlfile),
+                str(jobfile),
             ],
             stdout=st,
         )
@@ -321,172 +310,216 @@ class CWLWorkflowTest(ToilTest):
         out["output"].pop("http://commonwl.org/cwltool#generation", None)
         out["output"].pop("nameext", None)
         out["output"].pop("nameroot", None)
-        self.assertEqual(out, expect)
-    def revsort(self, cwl_filename: str, tester_fn: TesterFuncType) -> None:
-        tester_fn(
-            "src/toil/test/cwl/" + cwl_filename,
-            "src/toil/test/cwl/revsort-job.json",
-            self._expected_revsort_output(self.outDir),
-        )
+        assert out == expect
-    def revsort_no_checksum(self, cwl_filename: str, tester_fn: TesterFuncType) -> None:
-        tester_fn(
-            "src/toil/test/cwl/" + cwl_filename,
-            "src/toil/test/cwl/revsort-job.json",
-            self._expected_revsort_nochecksum_output(self.outDir),
-        )
-    def download(self, inputs: str, tester_fn: TesterFuncType) -> None:
-        input_location = os.path.join("src/toil/test/cwl", inputs)
-        tester_fn(
-            "src/toil/test/cwl/download.cwl",
-            input_location,
-            self._expected_download_output(self.outDir),
-        )
-    def load_contents(self, inputs: str, tester_fn: TesterFuncType) -> None:
-        input_location = os.path.join("src/toil/test/cwl", inputs)
-        tester_fn(
-            "src/toil/test/cwl/load_contents.cwl",
-            input_location,
-            self._expected_load_contents_output(self.outDir),
-        )
-    def download_directory(self, inputs: str, tester_fn: TesterFuncType) -> None:
-        input_location = os.path.join("src/toil/test/cwl", inputs)
-        tester_fn(
-            "src/toil/test/cwl/download_directory.cwl",
-            input_location,
-            self._expected_download_output(self.outDir),
-        )
-    def download_subdirectory(self, inputs: str, tester_fn: TesterFuncType) -> None:
-        input_location = os.path.join("src/toil/test/cwl", inputs)
-        tester_fn(
-            "src/toil/test/cwl/download_subdirectory.cwl",
-            input_location,
-            self._expected_download_output(self.outDir),
-        )
-    def test_mpi(self) -> None:
+    def revsort(
+        self, cwl_filename: str, tester_fn: TesterFuncType, out_dir: Path
+    ) -> None:
+        with get_data(f"test/cwl/{cwl_filename}") as cwl_file:
+            with get_data("test/cwl/revsort-job.json") as job_file:
+                tester_fn(
+                    cwl_file, job_file, self._expected_revsort_output(out_dir), out_dir
+                )
+    def revsort_no_checksum(
+        self, cwl_filename: str, tester_fn: TesterFuncType, out_dir: Path
+    ) -> None:
+        with get_data(f"test/cwl/{cwl_filename}") as cwl_file:
+            with get_data("test/cwl/revsort-job.json") as job_file:
+                tester_fn(
+                    cwl_file,
+                    job_file,
+                    self._expected_revsort_nochecksum_output(out_dir),
+                    out_dir,
+                )
+    def download(self, inputs: str, tester_fn: TesterFuncType, out_dir: Path) -> None:
+        with get_data(f"test/cwl/{inputs}") as input_location:
+            with get_data("test/cwl/download.cwl") as cwl_file:
+                tester_fn(
+                    cwl_file,
+                    input_location,
+                    self._expected_download_output(out_dir),
+                    out_dir,
+                )
+    def load_contents(
+        self, inputs: str, tester_fn: TesterFuncType, out_dir: Path
+    ) -> None:
+        with get_data(f"test/cwl/{inputs}") as input_location:
+            with get_data("test/cwl/load_contents.cwl") as cwl_file:
+                tester_fn(
+                    cwl_file,
+                    input_location,
+                    self._expected_load_contents_output(out_dir),
+                    out_dir,
+                )
+    def download_directory(
+        self, inputs: str, tester_fn: TesterFuncType, out_dir: Path
+    ) -> None:
+        with get_data(f"test/cwl/{inputs}") as input_location:
+            with get_data("test/cwl/download_directory.cwl") as cwl_file:
+                tester_fn(
+                    cwl_file,
+                    input_location,
+                    self._expected_download_output(out_dir),
+                    out_dir,
+                )
+    def download_subdirectory(
+        self, inputs: str, tester_fn: TesterFuncType, out_dir: Path
+    ) -> None:
+        with get_data(f"test/cwl/{inputs}") as input_location:
+            with get_data("test/cwl/download_subdirectory.cwl") as cwl_file:
+                tester_fn(
+                    cwl_file,
+                    input_location,
+                    self._expected_download_output(out_dir),
+                    out_dir,
+                )
+    def test_mpi(self, tmp_path: Path) -> None:
         from toil.cwl import cwltoil
         stdout = StringIO()
-        main_args = [
-            "--outdir",
-            self.outDir,
-            "--enable-dev",
-            "--enable-ext",
-            "--mpi-config-file",
-            os.path.join(self.rootDir, "src/toil/test/cwl/mock_mpi/fake_mpi.yml"),
-            os.path.join(self.rootDir, "src/toil/test/cwl/mpi_simple.cwl"),
-        ]
-        path = os.environ["PATH"]
-        os.environ["PATH"] = f"{path}:{self.rootDir}/src/toil/test/cwl/mock_mpi/"
-        cwltoil.main(main_args, stdout=stdout)
-        os.environ["PATH"] = path
-        out = json.loads(stdout.getvalue())
-        with open(out.get("pids", {}).get("location")[len("file://") :]) as f:
-            two_pids = [int(i) for i in f.read().split()]
-        self.assertEqual(len(two_pids), 2)
-        self.assertTrue(isinstance(two_pids[0], int))
-        self.assertTrue(isinstance(two_pids[1], int))
+        with get_data("test/cwl/mock_mpi/fake_mpi.yml") as mpi_config_file:
+            with get_data("test/cwl/mpi_simple.cwl") as cwl_file:
+                with get_data("test/cwl/mock_mpi/fake_mpi_run.py") as fake_mpi_run:
+                    main_args = [
+                        "--logDebug",
+                        "--outdir",
+                        str(tmp_path),
+                        "--enable-dev",
+                        "--enable-ext",
+                        "--mpi-config-file",
+                        str(mpi_config_file),
+                        str(cwl_file),
+                    ]
+                    path = os.environ["PATH"]
+                    os.environ["PATH"] = f"{path}:{fake_mpi_run.parent}"
+                    cwltoil.main(main_args, stdout=stdout)
+                    os.environ["PATH"] = path
+                    stdout_text = stdout.getvalue()
+                    assert "pids" in stdout_text
+                    out = json.loads(stdout_text)
+                    with open(
+                        out.get("pids", {}).get("location")[len("file://") :]
+                    ) as f:
+                        two_pids = [int(i) for i in f.read().split()]
+                    assert len(two_pids) == 2
+                    assert isinstance(two_pids[0], int)
+                    assert isinstance(two_pids[1], int)
     @needs_aws_s3
-    def test_s3_as_secondary_file(self) -> None:
+    @pytest.mark.aws_s3
+    @pytest.mark.online
+    def test_s3_as_secondary_file(self, tmp_path: Path) -> None:
         from toil.cwl import cwltoil
         stdout = StringIO()
-        main_args = [
-            "--outdir",
-            self.outDir,
-            os.path.join(self.rootDir, "src/toil/test/cwl/s3_secondary_file.cwl"),
-            os.path.join(self.rootDir, "src/toil/test/cwl/s3_secondary_file.json"),
-        ]
-        cwltoil.main(main_args, stdout=stdout)
-        out = json.loads(stdout.getvalue())
-        self.assertEqual(
-            out["output"]["checksum"], "sha1$d14dd02e354918b4776b941d154c18ebc15b9b38"
-        )
-        self.assertEqual(out["output"]["size"], 24)
-        with open(out["output"]["location"][len("file://") :]) as f:
-            self.assertEqual(f.read().strip(), "When is s4 coming out?")
+        with get_data("test/cwl/s3_secondary_file.cwl") as cwl_file:
+            with get_data("test/cwl/s3_secondary_file.json") as inputs_file:
+                main_args = ["--outdir", str(tmp_path), str(cwl_file), str(inputs_file)]
+                cwltoil.main(main_args, stdout=stdout)
+                out = json.loads(stdout.getvalue())
+                assert (
+                    out["output"]["checksum"]
+                    == "sha1$d14dd02e354918b4776b941d154c18ebc15b9b38"
+                )
+                assert out["output"]["size"] == 24
+                with open(out["output"]["location"][len("file://") :]) as f:
+                    assert f.read().strip() == "When is s4 coming out?"
-    def test_run_revsort(self) -> None:
-        self.revsort("revsort.cwl", self._tester)
+    @needs_docker
+    @pytest.mark.docker
+    @pytest.mark.online
+    def test_run_revsort(self, tmp_path: Path) -> None:
+        self.revsort("revsort.cwl", self._tester, tmp_path)
-    def test_run_revsort_nochecksum(self) -> None:
+    @needs_docker
+    @pytest.mark.docker
+    @pytest.mark.online
+    def test_run_revsort_nochecksum(self, tmp_path: Path) -> None:
         self.revsort_no_checksum(
-            "revsort.cwl", partial(self._tester, main_args=["--no-compute-checksum"])
+            "revsort.cwl",
+            partial(self._tester, main_args=["--no-compute-checksum"]),
+            tmp_path,
         )
-    def test_run_revsort_no_container(self) -> None:
+    def test_run_revsort_no_container(self, tmp_path: Path) -> None:
         self.revsort(
-            "revsort.cwl", partial(self._tester, main_args=["--no-container"])
+            "revsort.cwl", partial(self._tester, main_args=["--no-container"]), tmp_path
         )
-    def test_run_revsort2(self) -> None:
-        self.revsort("revsort2.cwl", self._tester)
+    @needs_docker
+    @pytest.mark.docker
+    @pytest.mark.online
+    def test_run_revsort2(self, tmp_path: Path) -> None:
+        self.revsort("revsort2.cwl", self._tester, tmp_path)
-    def test_run_revsort_debug_worker(self) -> None:
-        self.revsort("revsort.cwl", self._debug_worker_tester)
+    @needs_docker
+    @pytest.mark.docker
+    @pytest.mark.online
+    def test_run_revsort_debug_worker(self, tmp_path: Path) -> None:
+        self.revsort("revsort.cwl", self._debug_worker_tester, tmp_path)
+    @needs_docker
+    @pytest.mark.docker
+    @pytest.mark.online
+    def test_run_colon_output(self, tmp_path: Path) -> None:
+        with get_data("test/cwl/colon_test_output.cwl") as cwl_file:
+            with get_data("test/cwl/colon_test_output_job.yaml") as inputs_file:
+                self._tester(
+                    cwl_file,
+                    inputs_file,
+                    self._expected_colon_output(tmp_path),
+                    tmp_path,
+                    out_name="result",
+                )
-    def test_run_colon_output(self) -> None:
-        self._tester(
-            "src/toil/test/cwl/colon_test_output.cwl",
-            "src/toil/test/cwl/colon_test_output_job.yaml",
-            self._expected_colon_output(self.outDir),
-            out_name="result",
-        )
     @pytest.mark.integrative
-    @needs_singularity_or_docker
-    def test_run_dockstore_trs(self) -> None:
+    @needs_docker
+    @pytest.mark.docker
+    @pytest.mark.online
+    def test_run_dockstore_trs(self, tmp_path: Path) -> None:
         from toil.cwl import cwltoil
         stdout = StringIO()
         main_args = [
             "--outdir",
-            self.outDir,
+            str(tmp_path),
             "#workflow/github.com/dockstore-testing/md5sum-checker:master",
-            "https://raw.githubusercontent.com/dockstore-testing/md5sum-checker/refs/heads/master/md5sum/md5sum-input-cwl.json"
+            "https://raw.githubusercontent.com/dockstore-testing/md5sum-checker/refs/heads/master/md5sum/md5sum-input-cwl.json",
         ]
         cwltoil.main(main_args, stdout=stdout)
         out = json.loads(stdout.getvalue())
         with open(out.get("output_file", {}).get("location")[len("file://") :]) as f:
             computed_hash = f.read().strip()
-        self.assertEqual(computed_hash, "00579a00e3e7fa0674428ac7049423e2")
+        assert computed_hash == "00579a00e3e7fa0674428ac7049423e2"
-    def test_glob_dir_bypass_file_store(self) -> None:
+    def test_glob_dir_bypass_file_store(self, tmp_path: Path) -> None:
         self.maxDiff = 1000
-        try:
-            # We need to output to the current directory to make sure that
-            # works.
-            self._tester(
-                "src/toil/test/cwl/glob_dir.cwl",
-                "src/toil/test/cwl/empty.json",
-                self._expected_glob_dir_output(os.getcwd()),
-                main_args=["--bypass-file-store"],
-                output_here=True,
-            )
-        finally:
-            # Clean up anything we made in the current directory.
-            try:
-                shutil.rmtree(os.path.join(os.getcwd(), "shouldmake"))
-            except FileNotFoundError:
-                pass
-    def test_required_input_condition_protection(self) -> None:
+        with get_data("test/cwl/glob_dir.cwl") as cwl_file:
+            with get_data("test/cwl/empty.json") as inputs_file:
+                self._tester(
+                    cwl_file,
+                    inputs_file,
+                    self._expected_glob_dir_output(tmp_path),
+                    tmp_path,
+                    main_args=["--bypass-file-store"],
+                )
+    def test_required_input_condition_protection(self, tmp_path: Path) -> None:
         # This doesn't run containerized
-        self._tester(
-            "src/toil/test/cwl/not_run_required_input.cwl",
-            "src/toil/test/cwl/empty.json",
-            {},
-        )
+        with get_data("test/cwl/not_run_required_input.cwl") as cwl_file:
+            with get_data("test/cwl/empty.json") as inputs_file:
+                self._tester(cwl_file, inputs_file, {}, tmp_path)
     @needs_slurm
-    def test_slurm_node_memory(self) -> None:
+    @pytest.mark.slurm
+    def test_slurm_node_memory(self, tmp_path: Path) -> None:
         pass
         # Run the workflow. This will either finish quickly and tell us the
@@ -497,28 +530,29 @@ class CWLWorkflowTest(ToilTest):
         # And if we run out of time we need to stop the workflow gracefully and
         # cancel the Slurm jobs.
-        main_args = [
-            f"--jobStore={self.jobStoreDir}",
-            # Avoid racing to toil kill before the jobstore is removed
-            "--clean=never",
-            "--batchSystem=slurm",
-            "--no-cwl-default-ram",
-            "--slurmDefaultAllMem=True",
-            "--outdir",
-            self.outDir,
-            os.path.join(self.rootDir, "src/toil/test/cwl/measure_default_memory.cwl"),
-        ]
         try:
-            log.debug("Start test workflow")
-            child = subprocess.Popen(
-                ["toil-cwl-runner"] + main_args, stdout=subprocess.PIPE
-            )
-            output, _ = child.communicate(timeout=60)
+            with get_data("test/cwl/measure_default_memory.cwl") as cwl_file:
+                main_args = [
+                    f"--jobStore={str(tmp_path / 'jobStoreDir')}",
+                    # Avoid racing to toil kill before the jobstore is removed
+                    "--clean=never",
+                    "--batchSystem=slurm",
+                    "--no-cwl-default-ram",
+                    "--slurmDefaultAllMem=True",
+                    "--outdir",
+                    str(tmp_path / "outdir"),
+                    str(cwl_file),
+                ]
+                log.debug("Start test workflow")
+                child = subprocess.Popen(
+                    ["toil-cwl-runner"] + main_args, stdout=subprocess.PIPE
+                )
+                output, _ = child.communicate(timeout=60)
         except subprocess.TimeoutExpired:
             # The job didn't finish quickly; presumably waiting for a full node.
             # Stop the workflow
             log.debug("Workflow might be waiting for a full node. Stop it.")
-            subprocess.check_call(["toil", "kill", self.jobStoreDir])
+            subprocess.check_call(["toil", "kill", str(tmp_path / "jobStoreDir")])
             # Wait another little bit for it to clean up, making sure to collect output in case it is blocked on writing
             child.communicate(timeout=20)
             # Kill it off in case it is still running
@@ -538,113 +572,151 @@ class CWLWorkflowTest(ToilTest):
             else:
                 result = int(memory_string)
             # We should see more than the CWL default or the Toil default, assuming Slurm nodes of reasonable size (3 GiB).
-            self.assertGreater(result, 3 * 1024 * 1024)
+            assert result > (3 * 1024 * 1024)
     @needs_aws_s3
-    def test_download_s3(self) -> None:
-        self.download("download_s3.json", self._tester)
+    @pytest.mark.aws_s3
+    @pytest.mark.online
+    def test_download_s3(self, tmp_path: Path) -> None:
+        self.download("download_s3.json", self._tester, tmp_path)
-    def test_download_http(self) -> None:
-        self.download("download_http.json", self._tester)
+    def test_download_http(self, tmp_path: Path) -> None:
+        self.download("download_http.json", self._tester, tmp_path)
-    def test_download_https(self) -> None:
-        self.download("download_https.json", self._tester)
+    def test_download_https(self, tmp_path: Path) -> None:
+        self.download("download_https.json", self._tester, tmp_path)
-    def test_download_https_reference(self) -> None:
+    def test_download_https_reference(self, tmp_path: Path) -> None:
         self.download(
             "download_https.json",
             partial(self._tester, main_args=["--reference-inputs"]),
+            tmp_path,
         )
-    def test_download_file(self) -> None:
-        self.download("download_file.json", self._tester)
+    def test_download_file(self, tmp_path: Path) -> None:
+        self.download("download_file.json", self._tester, tmp_path)
     @needs_aws_s3
-    def test_download_directory_s3(self) -> None:
-        self.download_directory("download_directory_s3.json", self._tester)
+    @pytest.mark.aws_s3
+    @pytest.mark.online
+    def test_download_directory_s3(self, tmp_path: Path) -> None:
+        self.download_directory("download_directory_s3.json", self._tester, tmp_path)
     @needs_aws_s3
-    def test_download_directory_s3_reference(self) -> None:
+    @pytest.mark.aws_s3
+    @pytest.mark.online
+    def test_download_directory_s3_reference(self, tmp_path: Path) -> None:
         self.download_directory(
             "download_directory_s3.json",
             partial(self._tester, main_args=["--reference-inputs"]),
+            tmp_path,
         )
-    def test_download_directory_file(self) -> None:
-        self.download_directory("download_directory_file.json", self._tester)
+    def test_download_directory_file(self, tmp_path: Path) -> None:
+        self.download_directory("download_directory_file.json", self._tester, tmp_path)
     @needs_aws_s3
-    def test_download_subdirectory_s3(self) -> None:
-        self.download_subdirectory("download_subdirectory_s3.json", self._tester)
+    @pytest.mark.aws_s3
+    @pytest.mark.online
+    def test_download_subdirectory_s3(self, tmp_path: Path) -> None:
+        self.download_subdirectory(
+            "download_subdirectory_s3.json", self._tester, tmp_path
+        )
-    def test_download_subdirectory_file(self) -> None:
-        self.download_subdirectory("download_subdirectory_file.json", self._tester)
+    def test_download_subdirectory_file(self, tmp_path: Path) -> None:
+        self.download_subdirectory(
+            "download_subdirectory_file.json", self._tester, tmp_path
+        )
     # We also want to make sure we can run a bare tool with loadContents on the inputs, which requires accessing the input data early in the leader.
     @needs_aws_s3
-    def test_load_contents_s3(self) -> None:
-        self.load_contents("download_s3.json", self._tester)
+    @pytest.mark.aws_s3
+    @pytest.mark.online
+    def test_load_contents_s3(self, tmp_path: Path) -> None:
+        self.load_contents("download_s3.json", self._tester, tmp_path)
-    def test_load_contents_http(self) -> None:
-        self.load_contents("download_http.json", self._tester)
+    def test_load_contents_http(self, tmp_path: Path) -> None:
+        self.load_contents("download_http.json", self._tester, tmp_path)
-    def test_load_contents_https(self) -> None:
-        self.load_contents("download_https.json", self._tester)
+    def test_load_contents_https(self, tmp_path: Path) -> None:
+        self.load_contents("download_https.json", self._tester, tmp_path)
-    def test_load_contents_file(self) -> None:
-        self.load_contents("download_file.json", self._tester)
+    def test_load_contents_file(self, tmp_path: Path) -> None:
+        self.load_contents("download_file.json", self._tester, tmp_path)
     @slow
     @pytest.mark.integrative
-    @unittest.skip("Fails too often due to remote service")
-    def test_bioconda(self) -> None:
-        self._tester(
-            "src/toil/test/cwl/seqtk_seq.cwl",
-            "src/toil/test/cwl/seqtk_seq_job.json",
-            self._expected_seqtk_output(self.outDir),
-            main_args=["--beta-conda-dependencies"],
-            out_name="output1",
-        )
+    @pytest.mark.slow
+    @pytest.mark.skip("Fails too often due to remote service")
+    def test_bioconda(self, tmp_path: Path) -> None:
+        with get_data("test/cwl/seqtk_seq.cwl") as cwl_file:
+            with get_data("test/cwl/seqtk_seq_job.json") as inputs_file:
+                self._tester(
+                    cwl_file,
+                    inputs_file,
+                    self._expected_seqtk_output(tmp_path),
+                    tmp_path,
+                    main_args=["--beta-conda-dependencies"],
+                    out_name="output1",
+                )
     @needs_docker
-    def test_default_args(self) -> None:
-        self._tester(
-            "src/toil/test/cwl/seqtk_seq.cwl",
-            "src/toil/test/cwl/seqtk_seq_job.json",
-            self._expected_seqtk_output(self.outDir),
-            main_args=[
-                "--default-container",
-                "quay.io/biocontainers/seqtk:1.4--he4a0461_1",
-            ],
-            out_name="output1",
-        )
+    @pytest.mark.docker
+    @pytest.mark.online
+    def test_default_args(self, tmp_path: Path) -> None:
+        with get_data("test/cwl/seqtk_seq.cwl") as cwl_file:
+            with get_data("test/cwl/seqtk_seq_job.json") as inputs_file:
+                self._tester(
+                    cwl_file,
+                    inputs_file,
+                    self._expected_seqtk_output(tmp_path),
+                    tmp_path,
+                    main_args=[
+                        "--default-container",
+                        "quay.io/biocontainers/seqtk:1.4--he4a0461_1",
+                    ],
+                    out_name="output1",
+                )
     @needs_docker
+    @pytest.mark.docker
     @pytest.mark.integrative
-    @unittest.skip("Fails too often due to remote service")
-    def test_biocontainers(self) -> None:
-        self._tester(
-            "src/toil/test/cwl/seqtk_seq.cwl",
-            "src/toil/test/cwl/seqtk_seq_job.json",
-            self._expected_seqtk_output(self.outDir),
-            main_args=["--beta-use-biocontainers"],
-            out_name="output1",
-        )
+    @pytest.mark.online
+    @pytest.mark.skip(reason="Fails too often due to remote service")
+    def test_biocontainers(self, tmp_path: Path) -> None:
+        with get_data("test/cwl/seqtk_seq.cwl") as cwl_file:
+            with get_data("test/cwl/seqtk_seq_job.json") as inputs_file:
+                self._tester(
+                    cwl_file,
+                    inputs_file,
+                    self._expected_seqtk_output(tmp_path),
+                    tmp_path,
+                    main_args=["--beta-use-biocontainers"],
+                    out_name="output1",
+                )
     @needs_docker
     @needs_docker_cuda
     @needs_local_cuda
-    def test_cuda(self) -> None:
-        self._tester(
-            "src/toil/test/cwl/nvidia_smi.cwl",
-            "src/toil/test/cwl/empty.json",
-            {},
-            out_name="result",
-        )
+    @pytest.mark.docker
+    @pytest.mark.online
+    @pytest.mark.docker_cuda
+    @pytest.mark.local_cuda
+    def test_cuda(self, tmp_path: Path) -> None:
+        with get_data("test/cwl/nvidia_smi.cwl") as cwl_file:
+            with get_data("test/cwl/empty.json") as inputs_file:
+                self._tester(
+                    cwl_file,
+                    inputs_file,
+                    {},
+                    tmp_path,
+                    out_name="result",
+                )
     @slow
-    def test_restart(self) -> None:
+    @pytest.mark.slow
+    def test_restart(self, tmp_path: Path) -> None:
         """
         Enable restarts with toil-cwl-runner -- run failing test, re-run correct test.
         Only implemented for single machine.
@@ -652,195 +724,203 @@ class CWLWorkflowTest(ToilTest):
         log.info("Running CWL Test Restart.  Expecting failure, then success.")
         from toil.cwl import cwltoil
-        outDir = self._createTempDir()
-        cwlDir = os.path.join(self._projectRootPath(), "src", "toil", "test", "cwl")
-        cmd = [
-            "--outdir",
-            outDir,
-            "--jobStore",
-            os.path.join(outDir, "jobStore"),
-            "--no-container",
-            os.path.join(cwlDir, "revsort.cwl"),
-            os.path.join(cwlDir, "revsort-job.json"),
-        ]
-        # create a fake rev bin that actually points to the "date" binary
-        cal_path = [
-            d
-            for d in os.environ["PATH"].split(":")
-            if os.path.exists(os.path.join(d, "date"))
-        ][-1]
-        os.symlink(os.path.join(cal_path, "date"), f'{os.path.join(outDir, "rev")}')
-        def path_with_bogus_rev() -> str:
-            # append to the front of the PATH so that we check there first
-            return f"{outDir}:" + os.environ["PATH"]
-        orig_path = os.environ["PATH"]
-        # Force a failure by trying to use an incorrect version of `rev` from the PATH
-        os.environ["PATH"] = path_with_bogus_rev()
-        try:
-            subprocess.check_output(
-                ["toil-cwl-runner"] + cmd,
-                env=os.environ.copy(),
-                stderr=subprocess.STDOUT,
-            )
-            self.fail("Expected problem job with incorrect PATH did not fail")
-        except subprocess.CalledProcessError:
-            pass
-        # Finish the job with a correct PATH
-        os.environ["PATH"] = orig_path
-        cmd.insert(0, "--restart")
-        cwltoil.main(cmd)
-        # Should fail because previous job completed successfully
-        try:
-            subprocess.check_output(
-                ["toil-cwl-runner"] + cmd,
-                env=os.environ.copy(),
-                stderr=subprocess.STDOUT,
-            )
-            self.fail("Restart with missing directory did not fail")
-        except subprocess.CalledProcessError:
-            pass
-    def test_caching(self) -> None:
+        outDir = tmp_path / "outDir"
+        outDir.mkdir()
+        jobStore = tmp_path / "jobStore"
+        with get_data("test/cwl/revsort.cwl") as cwl_file:
+            with get_data("test/cwl/revsort-job.json") as job_file:
+                cmd = [
+                    "--outdir",
+                    str(outDir),
+                    "--jobStore",
+                    str(jobStore),
+                    "--no-container",
+                    str(cwl_file),
+                    str(job_file),
+                ]
+                # create a fake rev bin that actually points to the "date" binary
+                cal_path = [
+                    d
+                    for d in os.environ["PATH"].split(":")
+                    if os.path.exists(os.path.join(d, "date"))
+                ][-1]
+                os.symlink(
+                    os.path.realpath(os.path.join(cal_path, "date")), outDir / "rev"
+                )
+                def path_with_bogus_rev() -> str:
+                    # prepend to the PATH so that we check there first
+                    return f"{str(outDir)}:" + os.environ["PATH"]
+                orig_path = os.environ["PATH"]
+                # Force a failure by trying to use an incorrect version of `rev` from the PATH
+                os.environ["PATH"] = path_with_bogus_rev()
+                try:
+                    subprocess.check_output(
+                        ["toil-cwl-runner"] + cmd,
+                        env=os.environ.copy(),
+                        stderr=subprocess.STDOUT,
+                    )
+                    pytest.fail("Expected problem job with incorrect PATH did not fail")
+                except subprocess.CalledProcessError:
+                    pass
+                # Finish the job with a correct PATH
+                os.environ["PATH"] = orig_path
+                cmd.insert(0, "--restart")
+                cwltoil.main(cmd)
+                # Should fail because previous job completed successfully
+                try:
+                    subprocess.check_output(
+                        ["toil-cwl-runner"] + cmd,
+                        env=os.environ.copy(),
+                        stderr=subprocess.STDOUT,
+                    )
+                    pytest.fail("Restart with missing directory did not fail")
+                except subprocess.CalledProcessError:
+                    pass
+    def test_caching(self, tmp_path: Path) -> None:
         log.info("Running CWL caching test.")
         from toil.cwl import cwltoil
-        outDir = self._createTempDir()
-        cacheDir = self._createTempDir()
-        cwlDir = os.path.join(self._projectRootPath(), "src", "toil", "test", "cwl")
-        log_path = os.path.join(outDir, "log")
-        cmd = [
-            "--outdir",
-            outDir,
-            "--jobStore",
-            os.path.join(outDir, "jobStore"),
-            "--clean=always",
-            "--no-container",
-            "--cachedir",
-            cacheDir,
-            os.path.join(cwlDir, "revsort.cwl"),
-            os.path.join(cwlDir, "revsort-job.json"),
-        ]
-        st = StringIO()
-        ret = cwltoil.main(cmd, stdout=st)
-        assert ret == 0
-        # cwltool hashes certain steps into directories, ensure it exists
-        # since cwltool caches per task and revsort has 2 cwl tasks, there should be 2 directories and 2 status files
-        assert (len(os.listdir(cacheDir)) == 4)
-        # Rerun the workflow to ensure there is a cache hit and that we don't rerun the tools
-        st = StringIO()
-        cmd = [
-                  "--writeLogsFromAllJobs=True",
-                  "--writeLogs",
-                  log_path
-              ] + cmd
-        ret = cwltoil.main(cmd, stdout=st)
-        assert ret == 0
-        # Ensure all of the worker logs are using their cached outputs
-        for file in os.listdir(log_path):
-            assert "Using cached output" in open(os.path.join(log_path, file), encoding="utf-8").read()
+        outDir = tmp_path / "outDir"
+        cacheDir = tmp_path / "cacheDir"
+        log_path = outDir / "log"
+        with get_data("test/cwl/revsort.cwl") as cwl_file:
+            with get_data("test/cwl/revsort-job.json") as job_file:
+                cmd = [
+                    "--outdir",
+                    str(outDir),
+                    "--jobStore",
+                    str(tmp_path / "jobStore"),
+                    "--clean=always",
+                    "--no-container",
+                    "--cachedir",
+                    str(cacheDir),
+                    str(cwl_file),
+                    str(job_file),
+                ]
+                st = StringIO()
+                ret = cwltoil.main(cmd, stdout=st)
+                assert ret == 0
+                # cwltool hashes certain steps into directories, ensure it exists
+                # since cwltool caches per task and revsort has 2 cwl tasks, there should be 2 directories and 2 status files
+                assert sum(1 for _ in cacheDir.iterdir()) == 4
+                # Rerun the workflow to ensure there is a cache hit and that we don't rerun the tools
+                st = StringIO()
+                cmd = [
+                    "--writeLogsFromAllJobs=True",
+                    "--writeLogs",
+                    str(log_path),
+                ] + cmd
+                ret = cwltoil.main(cmd, stdout=st)
+                assert ret == 0
+                # Ensure all of the worker logs are using their cached outputs
+                for file in log_path.iterdir():
+                    assert "Using cached output" in file.read_text(encoding="utf-8")
     @needs_aws_s3
-    def test_streamable(self, extra_args: Optional[list[str]] = None) -> None:
+    @pytest.mark.aws_s3
+    @pytest.mark.online
+    def test_streamable(
+        self, tmp_path: Path, extra_args: Optional[list[str]] = None
+    ) -> None:
         """
         Test that a file with 'streamable'=True is a named pipe.
         This is a CWL1.2 feature.
         """
-        cwlfile = "src/toil/test/cwl/stream.cwl"
-        jobfile = "src/toil/test/cwl/stream.json"
-        out_name = "output"
-        jobstore = f"--jobStore=aws:us-west-1:toil-stream-{uuid.uuid4()}"
-        from toil.cwl import cwltoil
         st = StringIO()
-        args = [
-            "--logDebug",
-            "--outdir",
-            self.outDir,
-            jobstore,
-            os.path.join(self.rootDir, cwlfile),
-            os.path.join(self.rootDir, jobfile),
-        ]
-        if extra_args:
-            args = extra_args + args
-        log.info("Run CWL run: %s", " ".join(args))
-        cwltoil.main(args, stdout=st)
+        outDir = tmp_path / "outDir"
+        with get_data("test/cwl/stream.cwl") as cwlfile:
+            with get_data("test/cwl/stream.json") as jobfile:
+                out_name = "output"
+                jobstore = f"--jobStore=aws:us-west-1:toil-stream-{uuid.uuid4()}"
+                from toil.cwl import cwltoil
+                args = [
+                    "--logDebug",
+                    "--outdir",
+                    str(outDir),
+                    jobstore,
+                    str(cwlfile),
+                    str(jobfile),
+                ]
+                if extra_args:
+                    args = extra_args + args
+                log.info("Run CWL run: %s", " ".join(args))
+                cwltoil.main(args, stdout=st)
         out = json.loads(st.getvalue())
         out[out_name].pop("http://commonwl.org/cwltool#generation", None)
         out[out_name].pop("nameext", None)
         out[out_name].pop("nameroot", None)
-        self.assertEqual(out, self._expected_streaming_output(self.outDir))
+        assert out == self._expected_streaming_output(outDir)
         with open(out[out_name]["location"][len("file://") :]) as f:
-            self.assertEqual(f.read().strip(), "When is s4 coming out?")
+            assert f.read().strip() == "When is s4 coming out?"
     @needs_aws_s3
-    def test_streamable_reference(self) -> None:
+    @pytest.mark.aws_s3
+    @pytest.mark.online
+    def test_streamable_reference(self, tmp_path: Path) -> None:
         """
         Test that a streamable file is a stream even when passed around by URI.
         """
-        self.test_streamable(extra_args=["--reference-inputs"])
+        self.test_streamable(tmp_path=tmp_path, extra_args=["--reference-inputs"])
-    def test_preemptible(self) -> None:
+    def test_preemptible(self, tmp_path: Path) -> None:
         """
         Tests that the http://arvados.org/cwl#UsePreemptible extension is supported.
         """
-        cwlfile = "src/toil/test/cwl/preemptible.cwl"
-        jobfile = "src/toil/test/cwl/empty.json"
-        out_name = "output"
         from toil.cwl import cwltoil
         st = StringIO()
-        args = [
-            "--outdir",
-            self.outDir,
-            os.path.join(self.rootDir, cwlfile),
-            os.path.join(self.rootDir, jobfile),
-        ]
-        cwltoil.main(args, stdout=st)
+        out_name = "output"
+        with get_data("test/cwl/preemptible.cwl") as cwlfile:
+            with get_data("test/cwl/empty.json") as jobfile:
+                args = [
+                    "--outdir",
+                    str(tmp_path / "outDir"),
+                    str(cwlfile),
+                    str(jobfile),
+                ]
+                cwltoil.main(args, stdout=st)
         out = json.loads(st.getvalue())
         out[out_name].pop("http://commonwl.org/cwltool#generation", None)
         out[out_name].pop("nameext", None)
         out[out_name].pop("nameroot", None)
         with open(out[out_name]["location"][len("file://") :]) as f:
-            self.assertEqual(f.read().strip(), "hello")
+            assert f.read().strip() == "hello"
-    def test_preemptible_expression(self) -> None:
+    def test_preemptible_expression(self, tmp_path: Path) -> None:
         """
         Tests that the http://arvados.org/cwl#UsePreemptible extension is validated.
         """
-        cwlfile = "src/toil/test/cwl/preemptible_expression.cwl"
-        jobfile = "src/toil/test/cwl/preemptible_expression.json"
         from toil.cwl import cwltoil
         st = StringIO()
-        args = [
-            "--outdir",
-            self.outDir,
-            os.path.join(self.rootDir, cwlfile),
-            os.path.join(self.rootDir, jobfile),
-        ]
-        try:
-            cwltoil.main(args, stdout=st)
-            raise RuntimeError("Did not raise correct exception")
-        except ValidationException as e:
-            # Make sure we chastise the user appropriately.
-            assert "expressions are not allowed" in str(e)
+        with get_data("test/cwl/preemptible_expression.cwl") as cwlfile:
+            with get_data("test/cwl/preemptible_expression.json") as jobfile:
+                args = [
+                    "--outdir",
+                    str(tmp_path),
+                    str(cwlfile),
+                    str(jobfile),
+                ]
+                with pytest.raises(
+                    ValidationException, match=re.escape("expressions are not allowed")
+                ):
+                    cwltoil.main(args, stdout=st)
     @staticmethod
-    def _expected_seqtk_output(outDir: str) -> "CWLObjectType":
-        path = os.path.join(outDir, "out")
-        loc = "file://" + path
+    def _expected_seqtk_output(outDir: Path) -> "CWLObjectType":
+        path = outDir / "out"
         return {
             "output1": {
-                "location": loc,
-                "path": path,
+                "location": path.as_uri(),
+                "path": str(path),
                 "checksum": "sha1$322e001e5a99f19abdce9f02ad0f02a17b5066c2",
                 "basename": "out",
                 "class": "File",
@@ -849,13 +929,12 @@ class CWLWorkflowTest(ToilTest):
         }
     @staticmethod
-    def _expected_revsort_output(outDir: str) -> "CWLObjectType":
-        path = os.path.join(outDir, "output.txt")
-        loc = "file://" + path
+    def _expected_revsort_output(outDir: Path) -> "CWLObjectType":
+        path = outDir / "output.txt"
         return {
             "output": {
-                "location": loc,
-                "path": path,
+                "location": path.as_uri(),
+                "path": str(path),
                 "basename": "output.txt",
                 "size": 1111,
                 "class": "File",
@@ -864,13 +943,12 @@ class CWLWorkflowTest(ToilTest):
         }
     @staticmethod
-    def _expected_revsort_nochecksum_output(outDir: str) -> "CWLObjectType":
-        path = os.path.join(outDir, "output.txt")
-        loc = "file://" + path
+    def _expected_revsort_nochecksum_output(outDir: Path) -> "CWLObjectType":
+        path = outDir / "output.txt"
         return {
             "output": {
-                "location": loc,
-                "path": path,
+                "location": path.as_uri(),
+                "path": str(path),
                 "basename": "output.txt",
                 "size": 1111,
                 "class": "File",
@@ -878,30 +956,29 @@ class CWLWorkflowTest(ToilTest):
         }
     @staticmethod
-    def _expected_download_output(outDir: str) -> "CWLObjectType":
-        path = os.path.join(outDir, "output.txt")
-        loc = "file://" + path
+    def _expected_download_output(outDir: Path) -> "CWLObjectType":
+        path = outDir / "output.txt"
         return {
             "output": {
-                "location": loc,
+                "location": path.as_uri(),
                 "basename": "output.txt",
                 "size": 0,
                 "class": "File",
                 "checksum": "sha1$da39a3ee5e6b4b0d3255bfef95601890afd80709",
-                "path": path,
+                "path": str(path),
             }
         }
     @staticmethod
-    def _expected_glob_dir_output(out_dir: str) -> "CWLObjectType":
-        dir_path = os.path.join(out_dir, "shouldmake")
-        dir_loc = "file://" + dir_path
-        file_path = os.path.join(dir_path, "test.txt")
-        file_loc = os.path.join(dir_loc, "test.txt")
+    def _expected_glob_dir_output(out_dir: Path) -> "CWLObjectType":
+        dir_path = out_dir / "shouldmake"
+        dir_loc = dir_path.as_uri()
+        file_path = dir_path / "test.txt"
+        file_loc = file_path.as_uri()
         return {
             "shouldmake": {
                 "location": dir_loc,
-                "path": dir_path,
+                "path": str(dir_path),
                 "basename": "shouldmake",
                 "nameroot": "shouldmake",
                 "nameext": "",
@@ -910,7 +987,7 @@ class CWLWorkflowTest(ToilTest):
                     {
                         "class": "File",
                         "location": file_loc,
-                        "path": file_path,
+                        "path": str(file_path),
                         "basename": "test.txt",
                         "checksum": "sha1$da39a3ee5e6b4b0d3255bfef95601890afd80709",
                         "size": 0,
@@ -922,7 +999,7 @@ class CWLWorkflowTest(ToilTest):
         }
     @classmethod
-    def _expected_load_contents_output(cls, out_dir: str) -> "CWLObjectType":
+    def _expected_load_contents_output(cls, out_dir: Path) -> "CWLObjectType":
         """
         Generate the output we expect from load_contents.cwl, when sending
         output files to the given directory.
@@ -932,13 +1009,15 @@ class CWLWorkflowTest(ToilTest):
         return expected
     @staticmethod
-    def _expected_colon_output(outDir: str) -> "CWLObjectType":
-        path = os.path.join(outDir, "A:Gln2Cys_result")
-        loc = "file://" + os.path.join(outDir, "A%3AGln2Cys_result")
+    def _expected_colon_output(outDir: Path) -> "CWLObjectType":
+        path = outDir / "A:Gln2Cys_result"
+        loc = "file://" + os.path.join(
+            outDir, "A%3AGln2Cys_result"
+        )  # not using .as_uri to ensure the expected escaping
         return {
             "result": {
                 "location": loc,
-                "path": path,
+                "path": str(path),
                 "basename": "A:Gln2Cys_result",
                 "class": "Directory",
                 "listing": [
@@ -956,13 +1035,12 @@ class CWLWorkflowTest(ToilTest):
             }
         }
-    def _expected_streaming_output(self, outDir: str) -> "CWLObjectType":
-        path = os.path.join(outDir, "output.txt")
-        loc = "file://" + path
+    def _expected_streaming_output(self, outDir: Path) -> "CWLObjectType":
+        path = outDir / "output.txt"
         return {
             "output": {
-                "location": loc,
-                "path": path,
+                "location": path.as_uri(),
+                "path": str(path),
                 "basename": "output.txt",
                 "size": 24,
                 "class": "File",
@@ -970,102 +1048,101 @@ class CWLWorkflowTest(ToilTest):
             }
         }
-    def test_missing_import(self) -> None:
-        tmp_path = self._createTempDir()
-        out_dir = os.path.join(tmp_path, "cwl-out-dir")
-        toil = "toil-cwl-runner"
-        options = [
-            f"--outdir={out_dir}",
-            "--clean=always",
-        ]
-        cmd = [toil] + options + ["src/toil/test/cwl/revsort.cwl", "src/toil/test/cwl/revsort-job-missing.json"]
-        p = subprocess.Popen(cmd, stdout=subprocess.PIPE, stderr=subprocess.PIPE)
-        stdout, stderr = p.communicate()
-        # Make sure that the missing file is mentioned in the log so the user knows
-        assert b"missing.txt" in stderr
-        assert p.returncode == 1
+    @needs_docker
+    @pytest.mark.docker
+    @pytest.mark.online
+    def test_missing_import(self, tmp_path: Path) -> None:
+        with get_data("test/cwl/revsort.cwl") as cwl_file:
+            with get_data("test/cwl/revsort-job-missing.json") as inputs_file:
+                cmd = [
+                    "toil-cwl-runner",
+                    f"--outdir={str(tmp_path)}",
+                    "--clean=always",
+                    str(cwl_file),
+                    str(inputs_file),
+                ]
+                p = subprocess.run(cmd, capture_output=True, text=True)
+                # Make sure that the missing file is mentioned in the log so the user knows
+                assert p.returncode == 1, p.stderr
+                assert "missing.txt" in p.stderr
     @needs_aws_s3
-    def test_optional_secondary_files_exists(self) -> None:
-        tmp_path = self._createTempDir()
-        out_dir = os.path.join(tmp_path, "cwl-out-dir")
-        cwlfile = "src/toil/test/cwl/optional-file.cwl"
-        jobfile = "src/toil/test/cwl/optional-file-exists.json"
-        args = [
-            os.path.join(self.rootDir, cwlfile),
-            os.path.join(self.rootDir, jobfile),
-            f"--outdir={out_dir}"
-        ]
+    @pytest.mark.aws_s3
+    @pytest.mark.online
+    def test_optional_secondary_files_exists(self, tmp_path: Path) -> None:
         from toil.cwl import cwltoil
-        ret = cwltoil.main(args)
-        assert ret == 0
-        assert os.path.exists(os.path.join(out_dir, "wdl_templates_old.zip"))
+        with get_data("test/cwl/optional-file.cwl") as cwlfile:
+            with get_data("test/cwl/optional-file-exists.json") as jobfile:
+                args = [str(cwlfile), str(jobfile), f"--outdir={str(tmp_path)}"]
+                ret = cwltoil.main(args)
+                assert ret == 0
+                assert (tmp_path / "wdl_templates_old.zip").exists()
     @needs_aws_s3
-    def test_optional_secondary_files_missing(self) -> None:
-        tmp_path = self._createTempDir()
-        out_dir = os.path.join(tmp_path, "cwl-out-dir")
+    @pytest.mark.aws_s3
+    @pytest.mark.online
+    def test_optional_secondary_files_missing(self, tmp_path: Path) -> None:
+        from toil.cwl import cwltoil
-        cwlfile = "src/toil/test/cwl/optional-file.cwl"
-        jobfile = "src/toil/test/cwl/optional-file-missing.json"
+        with get_data("test/cwl/optional-file.cwl") as cwlfile:
+            with get_data("test/cwl/optional-file-missing.json") as jobfile:
+                args = [str(cwlfile), str(jobfile), f"--outdir={str(tmp_path)}"]
+                ret = cwltoil.main(args)
+                assert ret == 0
+                assert not (tmp_path / "hello_old.zip").exists()
-        args = [
-            os.path.join(self.rootDir, cwlfile),
-            os.path.join(self.rootDir, jobfile),
-            f"--outdir={out_dir}"
-        ]
-        from toil.cwl import cwltoil
-        ret = cwltoil.main(args)
-        assert ret == 0
-        assert not os.path.exists(os.path.join(out_dir, "hello_old.zip"))
+@pytest.fixture(scope="function")
+def cwl_v1_0_spec(tmp_path: Path) -> Generator[Path]:
+    # The latest cwl git commit hash from https://github.com/common-workflow-language/common-workflow-language.
+    # Update it to get the latest tests.
+    testhash = (
+        "6a955874ade22080b8ef962b4e0d6e408112c1ef"  # Date:   Tue Dec 16 2020 8:43pm PST
+    )
+    url = (
+        "https://github.com/common-workflow-language/common-workflow-language/archive/%s.zip"
+        % testhash
+    )
+    urlretrieve(url, "spec.zip")
+    with zipfile.ZipFile("spec.zip", "r") as z:
+        z.extractall()
+    shutil.move("common-workflow-language-%s" % testhash, str(tmp_path))
+    os.remove("spec.zip")
+    try:
+        yield tmp_path / ("common-workflow-language-%s" % testhash)
+    finally:
+        pass  # no cleanup
+@pytest.mark.integrative
+@pytest.mark.conformance
 @needs_cwl
 @needs_online
-class CWLv10Test(ToilTest):
+@pytest.mark.cwl
+@pytest.mark.online
+class TestCWLv10Conformance:
     """
     Run the CWL 1.0 conformance tests in various environments.
     """
-    def setUp(self) -> None:
-        """Runs anew before each test to create farm fresh temp dirs."""
-        self.outDir = f"/tmp/toil-cwl-test-{str(uuid.uuid4())}"
-        os.makedirs(self.outDir)
-        self.rootDir = self._projectRootPath()
-        self.cwlSpec = os.path.join(self.rootDir, "src/toil/test/cwl/spec")
-        self.workDir = os.path.join(self.cwlSpec, "v1.0")
-        # The latest cwl git commit hash from https://github.com/common-workflow-language/common-workflow-language.
-        # Update it to get the latest tests.
-        testhash = "6a955874ade22080b8ef962b4e0d6e408112c1ef"  # Date:   Tue Dec 16 2020 8:43pm PST
-        url = (
-            "https://github.com/common-workflow-language/common-workflow-language/archive/%s.zip"
-            % testhash
-        )
-        if not os.path.exists(self.cwlSpec):
-            urlretrieve(url, "spec.zip")
-            with zipfile.ZipFile("spec.zip", "r") as z:
-                z.extractall()
-            shutil.move("common-workflow-language-%s" % testhash, self.cwlSpec)
-            os.remove("spec.zip")
-    def tearDown(self) -> None:
-        """Clean up outputs."""
-        if os.path.exists(self.outDir):
-            shutil.rmtree(self.outDir)
-        unittest.TestCase.tearDown(self)
     @slow
+    @needs_docker
+    @pytest.mark.slow
+    @pytest.mark.docker
+    @pytest.mark.online
     @pytest.mark.timeout(CONFORMANCE_TEST_TIMEOUT)
-    def test_run_conformance_with_caching(self) -> None:
-        self.test_run_conformance(caching=True)
+    def test_run_conformance_with_caching(self, cwl_v1_0_spec: Path) -> None:
+        self.test_run_conformance(cwl_v1_0_spec, caching=True)
     @slow
+    @needs_docker
+    @pytest.mark.slow
+    @pytest.mark.docker
+    @pytest.mark.online
     @pytest.mark.timeout(CONFORMANCE_TEST_TIMEOUT)
     def test_run_conformance(
         self,
+        cwl_v1_0_spec: Path,
         batchSystem: Optional[str] = None,
         caching: bool = False,
         selected_tests: Optional[str] = None,
@@ -1073,8 +1150,8 @@ class CWLv10Test(ToilTest):
         extra_args: Optional[list[str]] = None,
     ) -> None:
         run_conformance_tests(
-            workDir=self.workDir,
-            yml="conformance_test_v1.0.yaml",
+            workDir=str(cwl_v1_0_spec / "v1.0"),
+            yml=str(cwl_v1_0_spec / "v1.0" / "conformance_test_v1.0.yaml"),
             caching=caching,
             batchSystem=batchSystem,
             selected_tests=selected_tests,
@@ -1084,38 +1161,66 @@ class CWLv10Test(ToilTest):
     @slow
     @needs_lsf
-    @unittest.skip("Not run")
-    def test_lsf_cwl_conformance(self, caching: bool = False) -> None:
-        self.test_run_conformance(batchSystem="lsf", caching=caching)
+    @pytest.mark.slow
+    @pytest.mark.lsf
+    @pytest.mark.skip("Not run")
+    def test_lsf_cwl_conformance(
+        self, cwl_v1_0_spec: Path, caching: bool = False
+    ) -> None:
+        self.test_run_conformance(cwl_v1_0_spec, batchSystem="lsf", caching=caching)
     @slow
     @needs_slurm
-    @unittest.skip("Not run")
-    def test_slurm_cwl_conformance(self, caching: bool = False) -> None:
-        self.test_run_conformance(batchSystem="slurm", caching=caching)
+    @pytest.mark.slow
+    @pytest.mark.slurm
+    @pytest.mark.skip("Not run")
+    def test_slurm_cwl_conformance(
+        self, cwl_v1_0_spec: Path, caching: bool = False
+    ) -> None:
+        self.test_run_conformance(cwl_v1_0_spec, batchSystem="slurm", caching=caching)
     @slow
     @needs_torque
-    @unittest.skip("Not run")
-    def test_torque_cwl_conformance(self, caching: bool = False) -> None:
-        self.test_run_conformance(batchSystem="torque", caching=caching)
+    @pytest.mark.slow
+    @pytest.mark.torque
+    @pytest.mark.skip("Not run")
+    def test_torque_cwl_conformance(
+        self, cwl_v1_0_spec: Path, caching: bool = False
+    ) -> None:
+        self.test_run_conformance(cwl_v1_0_spec, batchSystem="torque", caching=caching)
     @slow
     @needs_gridengine
-    @unittest.skip("Not run")
-    def test_gridengine_cwl_conformance(self, caching: bool = False) -> None:
-        self.test_run_conformance(batchSystem="grid_engine", caching=caching)
+    @pytest.mark.slow
+    @pytest.mark.gridengine
+    @pytest.mark.skip("Not run")
+    def test_gridengine_cwl_conformance(
+        self, cwl_v1_0_spec: Path, caching: bool = False
+    ) -> None:
+        self.test_run_conformance(
+            cwl_v1_0_spec, batchSystem="grid_engine", caching=caching
+        )
     @slow
     @needs_mesos
-    @unittest.skip("Not run")
-    def test_mesos_cwl_conformance(self, caching: bool = False) -> None:
-        self.test_run_conformance(batchSystem="mesos", caching=caching)
+    @pytest.mark.slow
+    @pytest.mark.mesos
+    @pytest.mark.skip("Not run")
+    def test_mesos_cwl_conformance(
+        self, cwl_v1_0_spec: Path, caching: bool = False
+    ) -> None:
+        self.test_run_conformance(cwl_v1_0_spec, batchSystem="mesos", caching=caching)
     @slow
     @needs_kubernetes
-    def test_kubernetes_cwl_conformance(self, caching: bool = False) -> None:
+    @pytest.mark.slow
+    @pytest.mark.kubernetes
+    @pytest.mark.online
+    def test_kubernetes_cwl_conformance(
+        self, cwl_v1_0_spec: Path, caching: bool = False
+    ) -> None:
         self.test_run_conformance(
+            cwl_v1_0_spec,
             caching=caching,
             batchSystem="kubernetes",
             extra_args=["--retryCount=3"],
@@ -1127,82 +1232,100 @@ class CWLv10Test(ToilTest):
     @slow
     @needs_lsf
-    @unittest.skip("Not run")
-    def test_lsf_cwl_conformance_with_caching(self) -> None:
-        self.test_lsf_cwl_conformance(caching=True)
+    @pytest.mark.slow
+    @pytest.mark.lsf
+    @pytest.mark.skip(reason="Not run")
+    def test_lsf_cwl_conformance_with_caching(self, cwl_v1_0_spec: Path) -> None:
+        self.test_lsf_cwl_conformance(cwl_v1_0_spec, caching=True)
     @slow
     @needs_slurm
-    @unittest.skip("Not run")
-    def test_slurm_cwl_conformance_with_caching(self) -> None:
-        self.test_slurm_cwl_conformance(caching=True)
+    @pytest.mark.slow
+    @pytest.mark.slurm
+    @pytest.mark.skip(reason="Not run")
+    def test_slurm_cwl_conformance_with_caching(self, cwl_v1_0_spec: Path) -> None:
+        self.test_slurm_cwl_conformance(cwl_v1_0_spec, caching=True)
     @slow
     @needs_torque
-    @unittest.skip("Not run")
-    def test_torque_cwl_conformance_with_caching(self) -> None:
-        self.test_torque_cwl_conformance(caching=True)
+    @pytest.mark.slow
+    @pytest.mark.torque
+    @pytest.mark.skip(reason="Not run")
+    def test_torque_cwl_conformance_with_caching(self, cwl_v1_0_spec: Path) -> None:
+        self.test_torque_cwl_conformance(cwl_v1_0_spec, caching=True)
     @slow
     @needs_gridengine
-    @unittest.skip("Not run")
-    def test_gridengine_cwl_conformance_with_caching(self) -> None:
-        self.test_gridengine_cwl_conformance(caching=True)
+    @pytest.mark.slow
+    @pytest.mark.gridengine
+    @pytest.mark.skip(reason="Not run")
+    def test_gridengine_cwl_conformance_with_caching(self, cwl_v1_0_spec: Path) -> None:
+        self.test_gridengine_cwl_conformance(cwl_v1_0_spec, caching=True)
     @slow
     @needs_mesos
-    @unittest.skip("Not run")
-    def test_mesos_cwl_conformance_with_caching(self) -> None:
-        self.test_mesos_cwl_conformance(caching=True)
+    @pytest.mark.slow
+    @pytest.mark.mesos
+    @pytest.mark.skip(reason="Not run")
+    def test_mesos_cwl_conformance_with_caching(self, cwl_v1_0_spec: Path) -> None:
+        self.test_mesos_cwl_conformance(cwl_v1_0_spec, caching=True)
     @slow
     @needs_kubernetes
-    def test_kubernetes_cwl_conformance_with_caching(self) -> None:
-        self.test_kubernetes_cwl_conformance(caching=True)
+    @pytest.mark.slow
+    @pytest.mark.kubernetes
+    @pytest.mark.online
+    def test_kubernetes_cwl_conformance_with_caching(self, cwl_v1_0_spec: Path) -> None:
+        self.test_kubernetes_cwl_conformance(cwl_v1_0_spec, caching=True)
+@pytest.fixture(scope="function")
+def cwl_v1_1_spec(tmp_path: Path) -> Generator[Path]:
+    # The latest cwl git commit hash from https://github.com/common-workflow-language/cwl-v1.1
+    # Update it to get the latest tests.
+    testhash = "664835e83eb5e57eee18a04ce7b05fb9d70d77b7"
+    url = (
+        "https://github.com/common-workflow-language/cwl-v1.1/archive/%s.zip" % testhash
+    )
+    urlretrieve(url, "spec.zip")
+    with zipfile.ZipFile("spec.zip", "r") as z:
+        z.extractall()
+    shutil.move("cwl-v1.1-%s" % testhash, str(tmp_path))
+    os.remove("spec.zip")
+    try:
+        yield tmp_path / ("cwl-v1.1-%s" % testhash)
+    finally:
+        pass  # no cleanup
+@pytest.mark.integrative
+@pytest.mark.conformance
 @needs_cwl
 @needs_online
-class CWLv11Test(ToilTest):
+@pytest.mark.cwl
+@pytest.mark.online
+class TestCWLv11Conformance:
     """
     Run the CWL 1.1 conformance tests in various environments.
     """
-    rootDir: str
-    cwlSpec: str
-    test_yaml: str
-    @classmethod
-    def setUpClass(cls) -> None:
-        """Runs anew before each test."""
-        cls.rootDir = cls._projectRootPath()
-        cls.cwlSpec = os.path.join(cls.rootDir, "src/toil/test/cwl/spec_v11")
-        cls.test_yaml = os.path.join(cls.cwlSpec, "conformance_tests.yaml")
-        # TODO: Use a commit zip in case someone decides to rewrite master's history?
-        url = "https://github.com/common-workflow-language/cwl-v1.1.git"
-        commit = "664835e83eb5e57eee18a04ce7b05fb9d70d77b7"
-        p = subprocess.Popen(
-            f"git clone {url} {cls.cwlSpec} && cd {cls.cwlSpec} && git checkout {commit}",
-            shell=True,
-        )
-        p.communicate()
-    def tearDown(self) -> None:
-        """Clean up outputs."""
-        unittest.TestCase.tearDown(self)
     @slow
+    @needs_docker
+    @pytest.mark.slow
+    @pytest.mark.docker
+    @pytest.mark.online
     @pytest.mark.timeout(CONFORMANCE_TEST_TIMEOUT)
     def test_run_conformance(
         self,
+        cwl_v1_1_spec: Path,
         caching: bool = False,
         batchSystem: Optional[str] = None,
         skipped_tests: Optional[str] = None,
         extra_args: Optional[list[str]] = None,
     ) -> None:
         run_conformance_tests(
-            workDir=self.cwlSpec,
-            yml=self.test_yaml,
+            workDir=str(cwl_v1_1_spec),
+            yml=str(cwl_v1_1_spec / "conformance_tests.yaml"),
             caching=caching,
             batchSystem=batchSystem,
             skipped_tests=skipped_tests,
@@ -1210,14 +1333,24 @@ class CWLv11Test(ToilTest):
         )
     @slow
+    @needs_docker
+    @pytest.mark.slow
+    @pytest.mark.docker
+    @pytest.mark.online
     @pytest.mark.timeout(CONFORMANCE_TEST_TIMEOUT)
-    def test_run_conformance_with_caching(self) -> None:
-        self.test_run_conformance(caching=True)
+    def test_run_conformance_with_caching(self, cwl_v1_1_spec: Path) -> None:
+        self.test_run_conformance(cwl_v1_1_spec, caching=True)
     @slow
     @needs_kubernetes
-    def test_kubernetes_cwl_conformance(self, caching: bool = False) -> None:
+    @pytest.mark.slow
+    @pytest.mark.kubernetes
+    @pytest.mark.online
+    def test_kubernetes_cwl_conformance(
+        self, cwl_v1_1_spec: Path, caching: bool = False
+    ) -> None:
         self.test_run_conformance(
+            cwl_v1_1_spec,
             batchSystem="kubernetes",
             extra_args=["--retryCount=3"],
             # These tests don't work with
@@ -1229,44 +1362,52 @@ class CWLv11Test(ToilTest):
     @slow
     @needs_kubernetes
-    def test_kubernetes_cwl_conformance_with_caching(self) -> None:
-        self.test_kubernetes_cwl_conformance(caching=True)
+    @pytest.mark.slow
+    @pytest.mark.kubernetes
+    @pytest.mark.online
+    def test_kubernetes_cwl_conformance_with_caching(self, cwl_v1_1_spec: Path) -> None:
+        self.test_kubernetes_cwl_conformance(cwl_v1_1_spec, caching=True)
+@pytest.fixture(scope="function")
+def cwl_v1_2_spec(tmp_path: Path) -> Generator[Path]:
+    # The latest cwl git commit hash from https://github.com/common-workflow-language/cwl-v1.2
+    # Update it to get the latest tests.
+    testhash = "0d538a0dbc5518f3c6083ce4571926f65cb84f76"
+    url = (
+        "https://github.com/common-workflow-language/cwl-v1.2/archive/%s.zip" % testhash
+    )
+    urlretrieve(url, "spec.zip")
+    with zipfile.ZipFile("spec.zip", "r") as z:
+        z.extractall()
+    shutil.move("cwl-v1.2-%s" % testhash, str(tmp_path))
+    os.remove("spec.zip")
+    try:
+        yield tmp_path / ("cwl-v1.2-%s" % testhash)
+    finally:
+        pass  # no cleanup
+@pytest.mark.integrative
+@pytest.mark.conformance
 @needs_cwl
 @needs_online
-class CWLv12Test(ToilTest):
+@pytest.mark.cwl
+@pytest.mark.online
+class TestCWLv12Conformance:
     """
     Run the CWL 1.2 conformance tests in various environments.
     """
-    rootDir: str
-    cwlSpec: str
-    test_yaml: str
-    @classmethod
-    def setUpClass(cls) -> None:
-        """Runs anew before each test."""
-        cls.rootDir = cls._projectRootPath()
-        cls.cwlSpec = os.path.join(cls.rootDir, "src/toil/test/cwl/spec_v12")
-        cls.test_yaml = os.path.join(cls.cwlSpec, "conformance_tests.yaml")
-        # TODO: Use a commit zip in case someone decides to rewrite master's history?
-        url = "https://github.com/common-workflow-language/cwl-v1.2.git"
-        commit = "0d538a0dbc5518f3c6083ce4571926f65cb84f76"
-        p = subprocess.Popen(
-            f"git clone {url} {cls.cwlSpec} && cd {cls.cwlSpec} && git checkout {commit}",
-            shell=True,
-        )
-        p.communicate()
-    def tearDown(self) -> None:
-        """Clean up outputs."""
-        unittest.TestCase.tearDown(self)
     @slow
+    @needs_docker
+    @pytest.mark.slow
+    @pytest.mark.docker
+    @pytest.mark.online
     @pytest.mark.timeout(CONFORMANCE_TEST_TIMEOUT)
     def test_run_conformance(
         self,
+        cwl_v1_2_spec: Path,
         runner: Optional[str] = None,
         caching: bool = False,
         batchSystem: Optional[str] = None,
@@ -1277,10 +1418,10 @@ class CWLv12Test(ToilTest):
         junit_file: Optional[str] = None,
     ) -> None:
         if junit_file is None:
-            junit_file = os.path.join(self.rootDir, "conformance-1.2.junit.xml")
+            junit_file = os.path.abspath("conformance-1.2.junit.xml")
         run_conformance_tests(
-            workDir=self.cwlSpec,
-            yml=self.test_yaml,
+            workDir=str(cwl_v1_2_spec),
+            yml=str(cwl_v1_2_spec / "conformance_tests.yaml"),
             runner=runner,
             caching=caching,
             batchSystem=batchSystem,
@@ -1290,48 +1431,67 @@ class CWLv12Test(ToilTest):
             must_support_all_features=must_support_all_features,
             junit_file=junit_file,
         )
     @slow
+    @needs_docker
+    @pytest.mark.slow
+    @pytest.mark.docker
+    @pytest.mark.online
     @pytest.mark.timeout(CONFORMANCE_TEST_TIMEOUT)
-    def test_run_conformance_with_caching(self) -> None:
+    def test_run_conformance_with_caching(self, cwl_v1_2_spec: Path) -> None:
         self.test_run_conformance(
+            cwl_v1_2_spec,
             caching=True,
-            junit_file=os.path.join(self.rootDir, "caching-conformance-1.2.junit.xml"),
+            junit_file=os.path.abspath("caching-conformance-1.2.junit.xml"),
         )
     @slow
+    @needs_docker
+    @pytest.mark.slow
+    @pytest.mark.docker
     @pytest.mark.timeout(CONFORMANCE_TEST_TIMEOUT)
-    def test_run_conformance_with_task_caching(self) -> None:
+    def test_run_conformance_with_task_caching(
+        self, cwl_v1_2_spec: Path, tmp_path: Path
+    ) -> None:
         self.test_run_conformance(
-            junit_file=os.path.join(self.rootDir, "task-caching-conformance-1.2.junit.xml"),
-            extra_args=["--cachedir", self._createTempDir("task_cache")]
+            cwl_v1_2_spec,
+            junit_file=os.path.abspath("task-caching-conformance-1.2.junit.xml"),
+            extra_args=["--cachedir", str(tmp_path / "task_cache")],
         )
     @slow
+    @needs_docker
+    @pytest.mark.slow
+    @pytest.mark.docker
     @pytest.mark.timeout(CONFORMANCE_TEST_TIMEOUT)
-    def test_run_conformance_with_in_place_update(self) -> None:
+    def test_run_conformance_with_in_place_update(self, cwl_v1_2_spec: Path) -> None:
         """
         Make sure that with --bypass-file-store we properly support in place
         update on a single node, and that this doesn't break any other
         features.
         """
         self.test_run_conformance(
+            cwl_v1_2_spec,
             extra_args=["--bypass-file-store"],
             must_support_all_features=True,
-            junit_file=os.path.join(
-                self.rootDir, "in-place-update-conformance-1.2.junit.xml"
-            ),
+            junit_file=os.path.abspath("in-place-update-conformance-1.2.junit.xml"),
         )
     @slow
     @needs_kubernetes
+    @pytest.mark.slow
+    @pytest.mark.kubernetes
+    @pytest.mark.online
     def test_kubernetes_cwl_conformance(
-        self, caching: bool = False, junit_file: Optional[str] = None
+        self,
+        cwl_v1_2_spec: Path,
+        caching: bool = False,
+        junit_file: Optional[str] = None,
     ) -> None:
         if junit_file is None:
-            junit_file = os.path.join(
-                self.rootDir, "kubernetes-conformance-1.2.junit.xml"
-            )
+            junit_file = os.path.abspath("kubernetes-conformance-1.2.junit.xml")
         self.test_run_conformance(
+            cwl_v1_2_spec,
             caching=caching,
             batchSystem="kubernetes",
             extra_args=["--retryCount=3"],
@@ -1346,17 +1506,22 @@ class CWLv12Test(ToilTest):
     @slow
     @needs_kubernetes
-    def test_kubernetes_cwl_conformance_with_caching(self) -> None:
+    @pytest.mark.slow
+    @pytest.mark.kubernetes
+    @pytest.mark.online
+    def test_kubernetes_cwl_conformance_with_caching(self, cwl_v1_2_spec: Path) -> None:
         self.test_kubernetes_cwl_conformance(
+            cwl_v1_2_spec,
             caching=True,
-            junit_file=os.path.join(
-                self.rootDir, "kubernetes-caching-conformance-1.2.junit.xml"
-            ),
+            junit_file=os.path.abspath("kubernetes-caching-conformance-1.2.junit.xml"),
         )
     @slow
     @needs_wes_server
-    def test_wes_server_cwl_conformance(self) -> None:
+    @pytest.mark.slow
+    @pytest.mark.wes_server
+    @pytest.mark.online
+    def test_wes_server_cwl_conformance(self, cwl_v1_2_spec: Path) -> None:
         """
         Run the CWL conformance tests via WES. TOIL_WES_ENDPOINT must be
         specified. If the WES server requires authentication, set TOIL_WES_USER
@@ -1367,7 +1532,7 @@ class CWLv12Test(ToilTest):
         TOIL_WES_ENDPOINT=http://localhost:8080 \
         TOIL_WES_USER=test \
         TOIL_WES_PASSWORD=password \
-        python -m pytest src/toil/test/cwl/cwlTest.py::CWLv12Test::test_wes_server_cwl_conformance -vv --log-level INFO --log-cli-level INFO
+        python -m pytest src/toil/test/cwl/cwlTest.py::TestCWLv12Conformance::test_wes_server_cwl_conformance -vv --log-level INFO --log-cli-level INFO
         """
         endpoint = os.environ.get("TOIL_WES_ENDPOINT")
         extra_args = [f"--wes_endpoint={endpoint}"]
@@ -1382,6 +1547,7 @@ class CWLv12Test(ToilTest):
         #     e.g.: https://github.com/common-workflow-language/cwl-v1.2/blob/1.2.1_proposed/tests/mixed-versions/wf-v10.cwl#L4-L10
         self.test_run_conformance(
+            cwl_v1_2_spec,
             runner="toil-wes-cwl-runner",
             selected_tests="1-309,313-337",
             extra_args=extra_args,
@@ -1389,183 +1555,162 @@ class CWLv12Test(ToilTest):
 @needs_cwl
+@pytest.mark.cwl
 @pytest.mark.cwl_small_log_dir
 def test_workflow_echo_string_scatter_stderr_log_dir(tmp_path: Path) -> None:
     log_dir = tmp_path / "cwl-logs"
-    job_store = "test_workflow_echo_string_scatter_stderr_log_dir"
-    toil = "toil-cwl-runner"
-    jobstore = f"--jobStore={job_store}"
-    option_1 = "--strict-memory-limit"
-    option_2 = "--force-docker-pull"
-    option_3 = "--clean=always"
-    option_4 = f"--log-dir={log_dir}"
-    cwl = os.path.join(
-        os.path.dirname(__file__), "echo_string_scatter_capture_stdout.cwl"
-    )
-    cmd = [toil, jobstore, option_1, option_2, option_3, option_4, cwl]
-    p = subprocess.Popen(cmd, stdout=subprocess.PIPE, stderr=subprocess.PIPE)
-    stdout, stderr = p.communicate()
-    outputs = json.loads(stdout)
-    out_list = outputs["list_out"]
-    assert len(out_list) == 2, f"outList shoud have two file elements {out_list}"
-    out_base = outputs["list_out"][0]
-    # This is a test on the scatter functionality and stdout.
-    # Each value of scatter should generate a separate file in the output.
-    for index, file in enumerate(out_list):
-        if index > 0:
-            new_file_loc = out_base["location"] + f"_{index + 1}"
-        else:
-            new_file_loc = out_base["location"]
-        assert (
-            new_file_loc == file["location"]
-        ), f"Toil should have detected conflicts for these stdout files {new_file_loc} and {file}"
+    with get_data("test/cwl/echo_string_scatter_capture_stdout.cwl") as cwl_file:
+        cmd = [
+            "toil-cwl-runner",
+            f"--jobStore={tmp_path / 'jobstore'}",
+            "--strict-memory-limit",
+            f"--log-dir={log_dir}",
+            str(cwl_file),
+        ]
+        p = subprocess.run(cmd, capture_output=True, text=True)
+        outputs = json.loads(p.stdout)
+        out_list = outputs["list_out"]
+        assert len(out_list) == 2, f"outList shoud have two file elements {out_list}"
+        out_base = outputs["list_out"][0]
+        # This is a test on the scatter functionality and stdout.
+        # Each value of scatter should generate a separate file in the output.
+        for index, file in enumerate(out_list):
+            if index > 0:
+                new_file_loc = out_base["location"] + f"_{index + 1}"
+            else:
+                new_file_loc = out_base["location"]
+            assert (
+                new_file_loc == file["location"]
+            ), f"Toil should have detected conflicts for these stdout files {new_file_loc} and {file}"
-    assert b"Finished toil run successfully" in stderr
-    assert p.returncode == 0
+        assert "Finished toil run successfully" in p.stderr
+        assert p.returncode == 0
-    assert log_dir.exists()
-    scatter_0 = log_dir / "echo-test-scatter.0.scatter"
-    scatter_1 = log_dir / "echo-test-scatter.1.scatter"
-    list_0 = log_dir / "echo-test-scatter.0.list"
-    list_1 = log_dir / "echo-test-scatter.1.list"
-    assert scatter_0.exists()
-    assert scatter_1.exists()
-    assert list_0.exists()
-    assert list_1.exists()
+        assert log_dir.exists()
+        scatter_0 = log_dir / "echo-test-scatter.0.scatter"
+        scatter_1 = log_dir / "echo-test-scatter.1.scatter"
+        list_0 = log_dir / "echo-test-scatter.0.list"
+        list_1 = log_dir / "echo-test-scatter.1.list"
+        assert scatter_0.exists()
+        assert scatter_1.exists()
+        assert list_0.exists()
+        assert list_1.exists()
 @needs_cwl
+@pytest.mark.cwl
 @pytest.mark.cwl_small_log_dir
 def test_log_dir_echo_no_output(tmp_path: Path) -> None:
     log_dir = tmp_path / "cwl-logs"
-    job_store = "test_log_dir_echo_no_output"
-    toil = "toil-cwl-runner"
-    jobstore = f"--jobStore={job_store}"
-    option_1 = "--strict-memory-limit"
-    option_2 = "--force-docker-pull"
-    option_3 = "--clean=always"
-    option_4 = f"--log-dir={log_dir}"
-    cwl = os.path.join(os.path.dirname(__file__), "echo-stdout-log-dir.cwl")
-    cmd = [toil, jobstore, option_1, option_2, option_3, option_4, cwl]
-    p = subprocess.Popen(cmd, stdout=subprocess.PIPE, stderr=subprocess.PIPE)
-    stdout, stderr = p.communicate()
-    tmp_path = log_dir
-    assert log_dir.exists()
-    assert len(list(tmp_path.iterdir())) == 1
-    subdir = next(tmp_path.iterdir())
-    assert subdir.name == "echo"
-    assert subdir.is_dir()
-    assert len(list(subdir.iterdir())) == 1
-    result = next(subdir.iterdir())
-    assert result.name == "out.txt"
-    output = open(result).read()
-    assert "hello" in output
+    job_store = tmp_path / "test_log_dir_echo_no_output"
+    with get_data("test/cwl/echo-stdout-log-dir.cwl") as cwl_file:
+        cmd = [
+            "toil-cwl-runner",
+            f"--jobStore={job_store}",
+            "--strict-memory-limit",
+            f"--log-dir={str(log_dir)}",
+            str(cwl_file),
+        ]
+        subprocess.run(cmd)
+        assert log_dir.exists()
+        assert sum(1 for _ in log_dir.iterdir()) == 1
+        subdir = next(log_dir.iterdir())
+        assert subdir.name == "echo"
+        assert subdir.is_dir()
+        assert sum(1 for _ in subdir.iterdir()) == 1
+        result = next(subdir.iterdir())
+        assert result.name == "out.txt"
+        assert "hello" in result.read_text()
 @needs_cwl
+@pytest.mark.cwl
 @pytest.mark.cwl_small_log_dir
 def test_log_dir_echo_stderr(tmp_path: Path) -> None:
     log_dir = tmp_path / "cwl-logs"
+    log_dir.mkdir()
+    with get_data("test/cwl/echo-stderr.cwl") as cwl_file:
+        cmd = [
+            "toil-cwl-runner",
+            f"--jobStore={str(tmp_path / 'test_log_dir_echo_stderr')}",
+            "--strict-memory-limit",
+            "--force-docker-pull",
+            "--clean=always",
+            f"--log-dir={str(log_dir)}",
+            str(cwl_file),
+        ]
+        subprocess.run(cmd)
+        tmp_path = log_dir
-    job_store = "test_log_dir_echo_stderr"
-    toil = "toil-cwl-runner"
-    jobstore = f"--jobStore={job_store}"
-    option_1 = "--strict-memory-limit"
-    option_2 = "--force-docker-pull"
-    option_3 = "--clean=always"
-    option_4 = f"--log-dir={log_dir}"
-    cwl = os.path.join(os.path.dirname(__file__), "echo-stderr.cwl")
-    cmd = [toil, jobstore, option_1, option_2, option_3, option_4, cwl]
-    p = subprocess.Popen(cmd, stdout=subprocess.PIPE, stderr=subprocess.PIPE)
-    stdout, stderr = p.communicate()
-    tmp_path = log_dir
-    assert len(list(tmp_path.iterdir())) == 1
-    subdir = next(tmp_path.iterdir())
-    assert subdir.name == "echo-stderr.cwl"
-    assert subdir.is_dir()
-    assert len(list(subdir.iterdir())) == 1
-    result = next(subdir.iterdir())
-    assert result.name == "out.txt"
-    output = open(result).read()
-    assert output == "hello\n"
+        assert len(list(tmp_path.iterdir())) == 1
+        subdir = next(tmp_path.iterdir())
+        assert subdir.name == "echo-stderr.cwl"
+        assert subdir.is_dir()
+        assert len(list(subdir.iterdir())) == 1
+        result = next(subdir.iterdir())
+        assert result.name == "out.txt"
+        output = open(result).read()
+        assert output == "hello\n"
 # TODO: It's not clear how this test tests filename conflict resolution; it
 # seems like it runs a python script to copy some files and makes sure the
 # workflow doesn't fail.
 @needs_cwl
+@pytest.mark.cwl
 @pytest.mark.cwl_small_log_dir
 def test_filename_conflict_resolution(tmp_path: Path) -> None:
-    out_dir = tmp_path / "cwl-out-dir"
-    toil = "toil-cwl-runner"
-    options = [
-        f"--outdir={out_dir}",
-        "--clean=always",
-    ]
-    cwl = os.path.join(
-        os.path.dirname(__file__), "test_filename_conflict_resolution.cwl"
-    )
-    input = os.path.join(
-        os.path.dirname(__file__), "test_filename_conflict_resolution.ms"
-    )
-    cwl_inputs = ["--msin", input]
-    cmd = [toil] + options + [cwl] + cwl_inputs
-    p = subprocess.Popen(cmd, stdout=subprocess.PIPE, stderr=subprocess.PIPE)
-    stdout, stderr = p.communicate()
-    assert b"Finished toil run successfully" in stderr
-    assert p.returncode == 0
+    with get_data("test/cwl/test_filename_conflict_resolution.cwl") as cwl_file:
+        with get_data("test/cwl/test_filename_conflict_resolution.ms") as msin:
+            cmd = [
+                "toil-cwl-runner",
+                f"--outdir={tmp_path}",
+                str(cwl_file),
+                "--msin",
+                str(msin),
+            ]
+            p = subprocess.run(cmd, capture_output=True, text=True)
+            assert "Finished toil run successfully" in p.stderr
+            assert p.returncode == 0
 @needs_cwl
+@pytest.mark.cwl
 @pytest.mark.cwl_small_log_dir
 def test_filename_conflict_resolution_3_or_more(tmp_path: Path) -> None:
-    out_dir = tmp_path / "cwl-out-dir"
-    toil = "toil-cwl-runner"
-    options = [
-        f"--outdir={out_dir}",
-        "--clean=always",
-    ]
-    cwl = os.path.join(os.path.dirname(__file__), "scatter_duplicate_outputs.cwl")
-    cmd = [toil] + options + [cwl]
-    p = subprocess.Popen(cmd, stdout=subprocess.PIPE, stderr=subprocess.PIPE)
-    stdout, stderr = p.communicate()
-    assert b"Finished toil run successfully" in stderr
-    assert p.returncode == 0
-    assert (
-        len(os.listdir(out_dir)) == 9
-    ), "All 9 files made by the scatter should be in the directory"
+    with get_data("test/cwl/scatter_duplicate_outputs.cwl") as cwl_file:
+        cmd = ["toil-cwl-runner", f"--outdir={tmp_path}", str(cwl_file)]
+        p = subprocess.run(cmd, capture_output=True, text=True)
+        assert "Finished toil run successfully" in p.stderr
+        assert p.returncode == 0
+        assert (
+            sum(1 for _ in tmp_path.iterdir()) == 9
+        ), f"All 9 files made by the scatter should be in the directory: {tmp_path}"
 @needs_cwl
 @needs_docker
+@pytest.mark.cwl
+@pytest.mark.docker
 @pytest.mark.cwl_small_log_dir
 def test_filename_conflict_detection(tmp_path: Path) -> None:
     """
     Make sure we don't just stage files over each other when using a container.
     """
-    out_dir = tmp_path / "cwl-out-dir"
-    toil = "toil-cwl-runner"
-    options = [
-        f"--outdir={out_dir}",
-        "--clean=always",
-    ]
-    cwl = os.path.join(
-        os.path.dirname(__file__), "test_filename_conflict_detection.cwl"
-    )
-    cmd = [toil] + options + [cwl]
-    p = subprocess.Popen(cmd, stdout=subprocess.PIPE, stderr=subprocess.PIPE)
-    stdout, stderr = p.communicate()
-    assert b"File staging conflict" in stderr
-    assert p.returncode != 0
+    with get_data("test/cwl/test_filename_conflict_detection.cwl") as cwl_file:
+        cmd = ["toil-cwl-runner", f"--outdir={tmp_path}", str(cwl_file)]
+        p = subprocess.run(cmd, capture_output=True, text=True)
+        assert "File staging conflict" in p.stderr
+        assert p.returncode != 0
 @needs_cwl
 @needs_docker
+@pytest.mark.cwl
+@pytest.mark.docker
 @pytest.mark.cwl_small_log_dir
 def test_filename_conflict_detection_at_root(tmp_path: Path) -> None:
     """
@@ -1573,101 +1718,89 @@ def test_filename_conflict_detection_at_root(tmp_path: Path) -> None:
     Specifically, when using a container and the files are at the root of the work dir.
     """
-    out_dir = tmp_path / "cwl-out-dir"
-    toil = "toil-cwl-runner"
-    options = [
-        f"--outdir={out_dir}",
-        "--clean=always",
-    ]
-    cwl = os.path.join(
-        os.path.dirname(__file__), "test_filename_conflict_detection_at_root.cwl"
-    )
-    cmd = [toil] + options + [cwl]
-    p = subprocess.Popen(cmd, stdout=subprocess.PIPE, stderr=subprocess.PIPE)
-    stdout, stderr = p.communicate()
-    assert b"File staging conflict" in stderr
-    assert p.returncode != 0
+    with get_data("test/cwl/test_filename_conflict_detection_at_root.cwl") as cwl_file:
+        cmd = ["toil-cwl-runner", f"--outdir={tmp_path}", str(cwl_file)]
+        p = subprocess.run(cmd, capture_output=True, text=True)
+        assert "File staging conflict" in p.stderr
+        assert p.returncode != 0
 @needs_cwl
+@pytest.mark.cwl
 @pytest.mark.cwl_small
-def test_pick_value_with_one_null_value(caplog: pytest.LogCaptureFixture) -> None:
+def test_pick_value_with_one_null_value(
+    caplog: pytest.LogCaptureFixture, tmp_path: Path
+) -> None:
     """
     Make sure toil-cwl-runner does not false log a warning when pickValue is
     used but outputSource only contains one null value. See: #3991.
     """
     from toil.cwl import cwltoil
-    cwl_file = os.path.join(os.path.dirname(__file__), "conditional_wf.cwl")
-    job_file = os.path.join(os.path.dirname(__file__), "conditional_wf.yaml")
-    args = [cwl_file, job_file]
-    with caplog.at_level(logging.WARNING, logger="toil.cwl.cwltoil"):
-        cwltoil.main(args)
-        for line in caplog.messages:
-            assert (
-                "You had a conditional step that did not run, but you did not use pickValue to handle the skipped input."
-                not in line
-            )
+    with get_data("test/cwl/conditional_wf.cwl") as cwl_file:
+        with get_data("test/cwl/conditional_wf.yaml") as job_file:
+            with caplog.at_level(logging.WARNING, logger="toil.cwl.cwltoil"):
+                cwltoil.main([f"--outdir={tmp_path}", str(cwl_file), str(job_file)])
+                for line in caplog.messages:
+                    assert (
+                        "You had a conditional step that did not run, but you did not use pickValue to handle the skipped input."
+                        not in line
+                    )
 @needs_cwl
+@pytest.mark.cwl
 @pytest.mark.cwl_small
-def test_workflow_echo_string() -> None:
-    toil = "toil-cwl-runner"
-    jobstore = f"--jobStore=file:explicit-local-jobstore-{uuid.uuid4()}"
-    option_1 = "--strict-memory-limit"
-    option_2 = "--force-docker-pull"
-    option_3 = "--clean=always"
-    cwl = os.path.join(os.path.dirname(__file__), "echo_string.cwl")
-    cmd = [toil, jobstore, option_1, option_2, option_3, cwl]
-    p = subprocess.Popen(cmd, stdout=subprocess.PIPE, stderr=subprocess.PIPE)
-    stdout, stderr = p.communicate()
-    stdout2 = stdout.decode("utf-8")
-    stderr2 = stderr.decode("utf-8")
-    assert (
-        stdout2.strip() == "{}"
-    ), f"Got wrong output: {stdout2}\nWith error: {stderr2}"
-    assert "Finished toil run successfully" in stderr2
-    assert p.returncode == 0
+def test_workflow_echo_string(tmp_path: Path) -> None:
+    with get_data("test/cwl/echo_string.cwl") as cwl_file:
+        cmd = [
+            "toil-cwl-runner",
+            f"--jobStore=file:{tmp_path / 'jobstore'}",
+            "--strict-memory-limit",
+            str(cwl_file),
+        ]
+        p = subprocess.run(cmd, capture_output=True, text=True)
+        assert (
+            p.stdout.strip() == "{}"
+        ), f"Got wrong output: {p.stdout}\nWith error: {p.stderr}"
+        assert "Finished toil run successfully" in p.stderr
+        assert p.returncode == 0
 @needs_cwl
+@pytest.mark.cwl
 @pytest.mark.cwl_small
-def test_workflow_echo_string_scatter_capture_stdout() -> None:
-    toil = "toil-cwl-runner"
-    jobstore = f"--jobStore=file:explicit-local-jobstore-{uuid.uuid4()}"
-    option_1 = "--strict-memory-limit"
-    option_2 = "--force-docker-pull"
-    option_3 = "--clean=always"
-    cwl = os.path.join(
-        os.path.dirname(__file__), "echo_string_scatter_capture_stdout.cwl"
-    )
-    cmd = [toil, jobstore, option_1, option_2, option_3, cwl]
-    p = subprocess.Popen(cmd, stdout=subprocess.PIPE, stderr=subprocess.PIPE)
-    stdout, stderr = p.communicate()
-    log.debug("Workflow standard output: %s", stdout)
-    assert len(stdout) > 0
-    outputs = json.loads(stdout)
-    out_list = outputs["list_out"]
-    assert len(out_list) == 2, f"outList shoud have two file elements {out_list}"
-    out_base = outputs["list_out"][0]
-    # This is a test on the scatter functionality and stdout.
-    # Each value of scatter should generate a separate file in the output.
-    for index, file in enumerate(out_list):
-        if index > 0:
-            new_file_loc = out_base["location"] + f"_{index + 1}"
-        else:
-            new_file_loc = out_base["location"]
-        assert (
-            new_file_loc == file["location"]
-        ), f"Toil should have detected conflicts for these stdout files {new_file_loc} and {file}"
+def test_workflow_echo_string_scatter_capture_stdout(tmp_path: Path) -> None:
+    with get_data("test/cwl/echo_string_scatter_capture_stdout.cwl") as cwl_file:
+        cmd = [
+            "toil-cwl-runner",
+            f"--jobStore=file:{tmp_path / 'jobStore'}",
+            "--strict-memory-limit",
+            str(cwl_file),
+        ]
+        p = subprocess.run(cmd, capture_output=True, text=True)
+        assert len(p.stdout) > 0
+        outputs = json.loads(p.stdout)
+        out_list = outputs["list_out"]
+        assert len(out_list) == 2, f"outList shoud have two file elements {out_list}"
+        out_base = outputs["list_out"][0]
+        # This is a test on the scatter functionality and stdout.
+        # Each value of scatter should generate a separate file in the output.
+        for index, file in enumerate(out_list):
+            if index > 0:
+                new_file_loc = out_base["location"] + f"_{index + 1}"
+            else:
+                new_file_loc = out_base["location"]
+            assert (
+                new_file_loc == file["location"]
+            ), f"Toil should have detected conflicts for these stdout files {new_file_loc} and {file}"
-    assert b"Finished toil run successfully" in stderr
-    assert p.returncode == 0
+        assert "Finished toil run successfully" in p.stderr
+        assert p.returncode == 0
 @needs_cwl
+@pytest.mark.cwl
 @pytest.mark.cwl_small
 def test_visit_top_cwl_class() -> None:
     structure = {
@@ -1719,6 +1852,7 @@ def test_visit_top_cwl_class() -> None:
 @needs_cwl
+@pytest.mark.cwl
 @pytest.mark.cwl_small
 def test_visit_cwl_class_and_reduce() -> None:
     structure = {
@@ -1780,6 +1914,135 @@ def test_visit_cwl_class_and_reduce() -> None:
 @needs_cwl
+@pytest.mark.cwl
+@pytest.mark.cwl_small
+def test_trim_mounts_op_nonredundant() -> None:
+    """
+    Make sure we don't remove all non-duplicate listings
+    """
+    s: CWLObjectType = {"class": "Directory", "basename": "directory", "listing": [{"class": "File", "basename": "file", "contents": "hello world"}]}
+    remove_redundant_mounts(s)
+    # nothing should have been removed
+    assert isinstance(s['listing'], list)
+    assert len(s['listing']) == 1
+@needs_cwl
+@pytest.mark.cwl
+@pytest.mark.cwl_small
+def test_trim_mounts_op_redundant() -> None:
+    """
+    Make sure we remove all duplicate listings
+    """
+    s: CWLObjectType = {
+        "class": "Directory",
+        "location": "file:///home/heaucques/Documents/toil/test_dir",
+        "basename": "test_dir",
+        "listing": [
+            {
+                "class": "Directory",
+                "location": "file:///home/heaucques/Documents/toil/test_dir/nested_dir",
+                "basename": "nested_dir",
+                "listing": [],
+                "path": "/home/heaucques/Documents/toil/test_dir/nested_dir"
+            },
+            {
+                "class": "File",
+                "location": "file:///home/heaucques/Documents/toil/test_dir/test_file",
+                "basename": "test_file",
+                "size": 0,
+                "nameroot": "test_file",
+                "nameext": "",
+                "path": "/home/heaucques/Documents/toil/test_dir/test_file",
+                "checksum": "sha1$da39a3ee5e6b4b0d3255bfef95601890afd80709"
+            }
+        ],
+        "path": "/home/heaucques/Documents/toil/test_dir"
+    }
+    remove_redundant_mounts(s)
+    # everything should have been removed
+    assert isinstance(s['listing'], list)
+    assert len(s['listing']) == 0
+@needs_cwl
+@pytest.mark.cwl
+@pytest.mark.cwl_small
+def test_trim_mounts_op_partially_redundant() -> None:
+    """
+    Make sure we remove only the redundant listings in the CWL object and leave nonredundant listings intact
+    """
+    s: CWLObjectType = {
+        "class": "Directory",
+        "location": "file:///home/heaucques/Documents/toil/test_dir",
+        "basename": "test_dir",
+        "listing": [
+            {
+                "class": "Directory",
+                "location": "file:///home/heaucques/Documents/thing",
+                "basename": "thing2",
+                "listing": [],
+                "path": "/home/heaucques/Documents/toil/thing2"
+            },
+            {
+                "class": "File",
+                "location": "file:///home/heaucques/Documents/toil/test_dir/test_file",
+                "basename": "test_file",
+                "size": 0,
+                "nameroot": "test_file",
+                "nameext": "",
+                "path": "/home/heaucques/Documents/toil/test_dir/test_file",
+                "checksum": "sha1$da39a3ee5e6b4b0d3255bfef95601890afd80709"
+            }
+        ],
+        "path": "/home/heaucques/Documents/toil/test_dir"
+    }
+    remove_redundant_mounts(s)
+    # everything except the nested directory should be removed
+    assert isinstance(s['listing'], list)
+    assert len(s['listing']) == 1
+@needs_cwl
+@pytest.mark.cwl
+@pytest.mark.cwl_small
+def test_trim_mounts_op_mixed_urls_and_paths() -> None:
+    """
+    Ensure we remove redundant listings in certain edge cases
+    """
+    # Edge cases around encoding:
+    # Ensure URL decoded file URIs match the bare path equivalent. Both of these paths should have the same shared directory
+    s: CWLObjectType = {"class": "Directory", "basename": "123", "location": "file:///tmp/%25/123", "listing": [{"class": "File", "path": "/tmp/%/123/456", "basename": "456"}]}
+    remove_redundant_mounts(s)
+    assert isinstance(s['listing'], list)
+    assert len(s['listing']) == 0
+@needs_cwl
+@pytest.mark.cwl
+@pytest.mark.cwl_small
+def test_trim_mounts_op_decodable_paths() -> None:
+    """"""
+    # Ensure path names don't get unnecessarily decoded
+    s: CWLObjectType = {"class": "Directory", "basename": "dir", "path": "/tmp/cat%2Ftag/dir", "listing": [{"class": "File", "path": "/tmp/cat/tag/dir/file", "basename": "file"}]}
+    remove_redundant_mounts(s)
+    assert isinstance(s['listing'], list)
+    assert len(s['listing']) == 1
+@needs_cwl
+@pytest.mark.cwl
+@pytest.mark.cwl_small
+def test_trim_mounts_op_multiple_encodings() -> None:
+    # Ensure differently encoded URLs are properly decoded
+    s: CWLObjectType = {"class": "Directory", "basename": "dir", "location": "file:///tmp/cat%2Ftag/dir", "listing": [{"class": "File", "location": "file:///tmp/cat%2ftag/dir/file", "basename": "file"}]}
+    remove_redundant_mounts(s)
+    assert isinstance(s['listing'], list)
+    assert len(s['listing']) == 0
+@needs_cwl
+@pytest.mark.cwl
 @pytest.mark.cwl_small
 def test_download_structure(tmp_path: Path) -> None:
     """
@@ -1804,7 +2067,7 @@ def test_download_structure(tmp_path: Path) -> None:
     }
     # Say where to put it on the filesystem
-    to_dir = str(tmp_path)
+    to_dir = tmp_path
     # Make a fake file store
     file_store = Mock(AbstractFileStore)
@@ -1817,7 +2080,7 @@ def test_download_structure(tmp_path: Path) -> None:
     existing: dict[str, str] = {}
     # Do the download
-    download_structure(file_store, index, existing, structure, to_dir)
+    download_structure(file_store, index, existing, structure, str(to_dir))
     # Check the results
     # 3 files should be made
@@ -1826,61 +2089,53 @@ def test_download_structure(tmp_path: Path) -> None:
     assert len(existing) == 2
     # Make sure that the index contents (path to URI) are correct
-    assert os.path.join(to_dir, "dir1/dir2/f1") in index
-    assert os.path.join(to_dir, "dir1/dir2/f1again") in index
-    assert os.path.join(to_dir, "anotherfile") in index
+    assert str(to_dir / "dir1/dir2/f1") in index
+    assert str(to_dir / "dir1/dir2/f1again") in index
+    assert str(to_dir / "anotherfile") in index
     assert (
-        index[os.path.join(to_dir, "dir1/dir2/f1")]
+        index[str(to_dir / "dir1/dir2/f1")]
         == cast(
             DirectoryStructure, cast(DirectoryStructure, structure["dir1"])["dir2"]
         )["f1"]
     )
     assert (
-        index[os.path.join(to_dir, "dir1/dir2/f1again")]
+        index[str(to_dir / "dir1/dir2/f1again")]
         == cast(
             DirectoryStructure, cast(DirectoryStructure, structure["dir1"])["dir2"]
         )["f1again"]
     )
-    assert index[os.path.join(to_dir, "anotherfile")] == structure["anotherfile"]
+    assert index[str(to_dir / "anotherfile")] == structure["anotherfile"]
     # And the existing contents (URI to path)
     assert "toilfile:" + fid1.pack() in existing
     assert "toilfile:" + fid2.pack() in existing
     assert existing["toilfile:" + fid1.pack()] in [
-        os.path.join(to_dir, "dir1/dir2/f1"),
-        os.path.join(to_dir, "dir1/dir2/f1again"),
+        str(to_dir / "dir1/dir2/f1"),
+        str(to_dir / "dir1/dir2/f1again"),
     ]
-    assert existing["toilfile:" + fid2.pack()] == os.path.join(to_dir, "anotherfile")
+    assert existing["toilfile:" + fid2.pack()] == str(to_dir / "anotherfile")
     # The directory structure should be created for real
-    assert os.path.isdir(os.path.join(to_dir, "dir1")) is True
-    assert os.path.isdir(os.path.join(to_dir, "dir1/dir2")) is True
-    assert os.path.isdir(os.path.join(to_dir, "dir1/dir2/dir2sub")) is True
-    assert os.path.isdir(os.path.join(to_dir, "dir1/dir3")) is True
+    assert (to_dir / "dir1").is_dir()
+    assert (to_dir / "dir1/dir2").is_dir()
+    assert (to_dir / "dir1/dir2/dir2sub").is_dir()
+    assert (to_dir / "dir1/dir3").is_dir()
     # The file store should have been asked to do the download
     file_store.readGlobalFile.assert_has_calls(
         [
-            call(fid1, os.path.join(to_dir, "dir1/dir2/f1"), symlink=False),
-            call(fid1, os.path.join(to_dir, "dir1/dir2/f1again"), symlink=False),
-            call(fid2, os.path.join(to_dir, "anotherfile"), symlink=False),
+            call(fid1, str(to_dir / "dir1/dir2/f1"), symlink=False),
+            call(fid1, str(to_dir / "dir1/dir2/f1again"), symlink=False),
+            call(fid2, str(to_dir / "anotherfile"), symlink=False),
         ],
         any_order=True,
     )
 @needs_cwl
+@pytest.mark.cwl
 @pytest.mark.timeout(300)
 def test_import_on_workers() -> None:
-    args = [
-        "src/toil/test/cwl/download.cwl",
-        "src/toil/test/cwl/download_file.json",
-        "--runImportsOnWorkers",
-        "--importWorkersDisk=10MiB",
-        "--realTimeLogging=True",
-        "--logLevel=INFO",
-        "--logColors=False",
-    ]
     from toil.cwl import cwltoil
     detector = ImportWorkersMessageHandler()
@@ -1888,10 +2143,49 @@ def test_import_on_workers() -> None:
     # Set up a log message detector to the root logger
     logging.getLogger().addHandler(detector)
-    cwltoil.main(args)
+    with get_data("test/cwl/download.cwl") as cwl_file:
+        with get_data("test/cwl/directory/directory/file.txt") as file_path:
+            # To make sure we see every job issued with a leader log message
+            # that we can then detect for the test, we need to turn off
+            # chaining.
+            args = [
+                "--runImportsOnWorkers",
+                "--importWorkersDisk=10MiB",
+                "--realTimeLogging=True",
+                "--logLevel=INFO",
+                "--logColors=False",
+                "--disableChaining=True",
+                str(cwl_file),
+                "--input",
+                str(file_path),
+            ]
+            cwltoil.main(args)
+        assert detector.detected is True
-    assert detector.detected is True
+@needs_cwl
+@pytest.mark.cwl
+@pytest.mark.cwl_small
+def test_missing_tmpdir_and_tmp_outdir(tmp_path: Path) -> None:
+    """
+    tmpdir_prefix and tmp_outdir_prefix do not need to exist prior to running the workflow
+    """
+    tmpdir_prefix = os.path.join(tmp_path, "tmpdir/blah")
+    tmp_outdir_prefix = os.path.join(tmp_path, "tmp_outdir/blah")
+    assert not os.path.exists(os.path.dirname(tmpdir_prefix))
+    assert not os.path.exists(os.path.dirname(tmp_outdir_prefix))
+    with get_data("test/cwl/echo_string.cwl") as cwl_file:
+        cmd = [
+            "toil-cwl-runner",
+            f"--jobStore=file:{tmp_path / 'jobstore'}",
+            "--strict-memory-limit",
+            f'--tmpdir-prefix={tmpdir_prefix}',
+            f'--tmp-outdir-prefix={tmp_outdir_prefix}',
+            str(cwl_file),
+        ]
+        p = subprocess.run(cmd)
+        assert p.returncode == 0
 # StreamHandler is generic, _typeshed doesn't exist at runtime, do a bit of typing trickery, see https://github.com/python/typeshed/issues/5680
 if TYPE_CHECKING:
@@ -1904,7 +2198,7 @@ else:
 class ImportWorkersMessageHandler(_stream_handler):
     """
-    Detect the import workers log message and set a flag.
+    Detect whether any WorkerImportJob jobs ran during a workflow.
     """
     def __init__(self) -> None:
@@ -1913,7 +2207,18 @@ class ImportWorkersMessageHandler(_stream_handler):
         super().__init__(sys.stderr)
     def emit(self, record: logging.LogRecord) -> None:
-        if (record.msg % record.args).startswith(
-            "Issued job 'CWLImportJob' CWLImportJob"
+        # We get the job name from the class since we already started failing
+        # this test once due to it being renamed.
+        try:
+            formatted = record.getMessage()
+        except TypeError as e:
+            # The log message has the wrong number of items for its fields.
+            # Complain in a way we could figure out.
+            raise RuntimeError(
+                f"Log message {record.msg} has wrong number of "
+                f"fields in {record.args}"
+            ) from e
+        if formatted.startswith(
+            f"Issued job '{WorkerImportJob.__name__}'"
         ):
             self.detected = True

toil 8.1.0b1__py3-none-any.whl → 9.0.0__py3-none-any.whl

toil 8.1.0b1__py3-none-any.whl → 9.0.0__py3-none-any.whl