PyPI - toil - Versions diffs - 6.1.0a1__py3-none-any.whl → 8.0.0__py3-none-any.whl - Mend

toil 6.1.0a1__py3-none-any.whl → 8.0.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (193)

toil/__init__.py +122 -315
toil/batchSystems/__init__.py +1 -0
toil/batchSystems/abstractBatchSystem.py +173 -89
toil/batchSystems/abstractGridEngineBatchSystem.py +272 -148
toil/batchSystems/awsBatch.py +244 -135
toil/batchSystems/cleanup_support.py +26 -16
toil/batchSystems/contained_executor.py +31 -28
toil/batchSystems/gridengine.py +86 -50
toil/batchSystems/htcondor.py +166 -89
toil/batchSystems/kubernetes.py +632 -382
toil/batchSystems/local_support.py +20 -15
toil/batchSystems/lsf.py +134 -81
toil/batchSystems/lsfHelper.py +13 -11
toil/batchSystems/mesos/__init__.py +41 -29
toil/batchSystems/mesos/batchSystem.py +290 -151
toil/batchSystems/mesos/executor.py +79 -50
toil/batchSystems/mesos/test/__init__.py +31 -23
toil/batchSystems/options.py +46 -28
toil/batchSystems/registry.py +53 -19
toil/batchSystems/singleMachine.py +296 -125
toil/batchSystems/slurm.py +603 -138
toil/batchSystems/torque.py +47 -33
toil/bus.py +186 -76
toil/common.py +664 -368
toil/cwl/__init__.py +1 -1
toil/cwl/cwltoil.py +1136 -483
toil/cwl/utils.py +17 -22
toil/deferred.py +63 -42
toil/exceptions.py +5 -3
toil/fileStores/__init__.py +5 -5
toil/fileStores/abstractFileStore.py +140 -60
toil/fileStores/cachingFileStore.py +717 -269
toil/fileStores/nonCachingFileStore.py +116 -87
toil/job.py +1225 -368
toil/jobStores/abstractJobStore.py +416 -266
toil/jobStores/aws/jobStore.py +863 -477
toil/jobStores/aws/utils.py +201 -120
toil/jobStores/conftest.py +3 -2
toil/jobStores/fileJobStore.py +292 -154
toil/jobStores/googleJobStore.py +140 -74
toil/jobStores/utils.py +36 -15
toil/leader.py +668 -272
toil/lib/accelerators.py +115 -18
toil/lib/aws/__init__.py +74 -31
toil/lib/aws/ami.py +122 -87
toil/lib/aws/iam.py +284 -108
toil/lib/aws/s3.py +31 -0
toil/lib/aws/session.py +214 -39
toil/lib/aws/utils.py +287 -231
toil/lib/bioio.py +13 -5
toil/lib/compatibility.py +11 -6
toil/lib/conversions.py +104 -47
toil/lib/docker.py +131 -103
toil/lib/ec2.py +361 -199
toil/lib/ec2nodes.py +174 -106
toil/lib/encryption/_dummy.py +5 -3
toil/lib/encryption/_nacl.py +10 -6
toil/lib/encryption/conftest.py +1 -0
toil/lib/exceptions.py +26 -7
toil/lib/expando.py +5 -3
toil/lib/ftp_utils.py +217 -0
toil/lib/generatedEC2Lists.py +127 -19
toil/lib/humanize.py +6 -2
toil/lib/integration.py +341 -0
toil/lib/io.py +141 -15
toil/lib/iterables.py +4 -2
toil/lib/memoize.py +12 -8
toil/lib/misc.py +66 -21
toil/lib/objects.py +2 -2
toil/lib/resources.py +68 -15
toil/lib/retry.py +126 -81
toil/lib/threading.py +299 -82
toil/lib/throttle.py +16 -15
toil/options/common.py +843 -409
toil/options/cwl.py +175 -90
toil/options/runner.py +50 -0
toil/options/wdl.py +73 -17
toil/provisioners/__init__.py +117 -46
toil/provisioners/abstractProvisioner.py +332 -157
toil/provisioners/aws/__init__.py +70 -33
toil/provisioners/aws/awsProvisioner.py +1145 -715
toil/provisioners/clusterScaler.py +541 -279
toil/provisioners/gceProvisioner.py +282 -179
toil/provisioners/node.py +155 -79
toil/realtimeLogger.py +34 -22
toil/resource.py +137 -75
toil/server/app.py +128 -62
toil/server/celery_app.py +3 -1
toil/server/cli/wes_cwl_runner.py +82 -53
toil/server/utils.py +54 -28
toil/server/wes/abstract_backend.py +64 -26
toil/server/wes/amazon_wes_utils.py +21 -15
toil/server/wes/tasks.py +121 -63
toil/server/wes/toil_backend.py +142 -107
toil/server/wsgi_app.py +4 -3
toil/serviceManager.py +58 -22
toil/statsAndLogging.py +224 -70
toil/test/__init__.py +282 -183
toil/test/batchSystems/batchSystemTest.py +460 -210
toil/test/batchSystems/batch_system_plugin_test.py +90 -0
toil/test/batchSystems/test_gridengine.py +173 -0
toil/test/batchSystems/test_lsf_helper.py +67 -58
toil/test/batchSystems/test_slurm.py +110 -49
toil/test/cactus/__init__.py +0 -0
toil/test/cactus/test_cactus_integration.py +56 -0
toil/test/cwl/cwlTest.py +496 -287
toil/test/cwl/measure_default_memory.cwl +12 -0
toil/test/cwl/not_run_required_input.cwl +29 -0
toil/test/cwl/scatter_duplicate_outputs.cwl +40 -0
toil/test/cwl/seqtk_seq.cwl +1 -1
toil/test/docs/scriptsTest.py +69 -46
toil/test/jobStores/jobStoreTest.py +427 -264
toil/test/lib/aws/test_iam.py +118 -50
toil/test/lib/aws/test_s3.py +16 -9
toil/test/lib/aws/test_utils.py +5 -6
toil/test/lib/dockerTest.py +118 -141
toil/test/lib/test_conversions.py +113 -115
toil/test/lib/test_ec2.py +58 -50
toil/test/lib/test_integration.py +104 -0
toil/test/lib/test_misc.py +12 -5
toil/test/mesos/MesosDataStructuresTest.py +23 -10
toil/test/mesos/helloWorld.py +7 -6
toil/test/mesos/stress.py +25 -20
toil/test/options/__init__.py +13 -0
toil/test/options/options.py +42 -0
toil/test/provisioners/aws/awsProvisionerTest.py +320 -150
toil/test/provisioners/clusterScalerTest.py +440 -250
toil/test/provisioners/clusterTest.py +166 -44
toil/test/provisioners/gceProvisionerTest.py +174 -100
toil/test/provisioners/provisionerTest.py +25 -13
toil/test/provisioners/restartScript.py +5 -4
toil/test/server/serverTest.py +188 -141
toil/test/sort/restart_sort.py +137 -68
toil/test/sort/sort.py +134 -66
toil/test/sort/sortTest.py +91 -49
toil/test/src/autoDeploymentTest.py +141 -101
toil/test/src/busTest.py +20 -18
toil/test/src/checkpointTest.py +8 -2
toil/test/src/deferredFunctionTest.py +49 -35
toil/test/src/dockerCheckTest.py +32 -24
toil/test/src/environmentTest.py +135 -0
toil/test/src/fileStoreTest.py +539 -272
toil/test/src/helloWorldTest.py +7 -4
toil/test/src/importExportFileTest.py +61 -31
toil/test/src/jobDescriptionTest.py +46 -21
toil/test/src/jobEncapsulationTest.py +2 -0
toil/test/src/jobFileStoreTest.py +74 -50
toil/test/src/jobServiceTest.py +187 -73
toil/test/src/jobTest.py +121 -71
toil/test/src/miscTests.py +19 -18
toil/test/src/promisedRequirementTest.py +82 -36
toil/test/src/promisesTest.py +7 -6
toil/test/src/realtimeLoggerTest.py +10 -6
toil/test/src/regularLogTest.py +71 -37
toil/test/src/resourceTest.py +80 -49
toil/test/src/restartDAGTest.py +36 -22
toil/test/src/resumabilityTest.py +9 -2
toil/test/src/retainTempDirTest.py +45 -14
toil/test/src/systemTest.py +12 -8
toil/test/src/threadingTest.py +44 -25
toil/test/src/toilContextManagerTest.py +10 -7
toil/test/src/userDefinedJobArgTypeTest.py +8 -5
toil/test/src/workerTest.py +73 -23
toil/test/utils/toilDebugTest.py +103 -33
toil/test/utils/toilKillTest.py +4 -5
toil/test/utils/utilsTest.py +245 -106
toil/test/wdl/wdltoil_test.py +818 -149
toil/test/wdl/wdltoil_test_kubernetes.py +91 -0
toil/toilState.py +120 -35
toil/utils/toilConfig.py +13 -4
toil/utils/toilDebugFile.py +44 -27
toil/utils/toilDebugJob.py +214 -27
toil/utils/toilDestroyCluster.py +11 -6
toil/utils/toilKill.py +8 -3
toil/utils/toilLaunchCluster.py +256 -140
toil/utils/toilMain.py +37 -16
toil/utils/toilRsyncCluster.py +32 -14
toil/utils/toilSshCluster.py +49 -22
toil/utils/toilStats.py +356 -273
toil/utils/toilStatus.py +292 -139
toil/utils/toilUpdateEC2Instances.py +3 -1
toil/version.py +12 -12
toil/wdl/utils.py +5 -5
toil/wdl/wdltoil.py +3913 -1033
toil/worker.py +367 -184
{toil-6.1.0a1.dist-info → toil-8.0.0.dist-info}/LICENSE +25 -0
toil-8.0.0.dist-info/METADATA +173 -0
toil-8.0.0.dist-info/RECORD +253 -0
{toil-6.1.0a1.dist-info → toil-8.0.0.dist-info}/WHEEL +1 -1
toil-6.1.0a1.dist-info/METADATA +0 -125
toil-6.1.0a1.dist-info/RECORD +0 -237
{toil-6.1.0a1.dist-info → toil-8.0.0.dist-info}/entry_points.txt +0 -0
{toil-6.1.0a1.dist-info → toil-8.0.0.dist-info}/top_level.txt +0 -0

toil/lib/ec2.py CHANGED Viewed

@@ -1,22 +1,29 @@
 import logging
 import time
 from base64 import b64encode
-from operator import attrgetter
-from typing import Dict, Iterable, List, Optional, Union
-from boto3.resources.base import ServiceResource
-from boto.ec2.instance import Instance as Boto2Instance
-from boto.ec2.spotinstancerequest import SpotInstanceRequest
-from botocore.client import BaseClient
+from collections.abc import Generator, Iterable, Mapping
+from typing import TYPE_CHECKING, Any, Callable, Optional, Union
 from toil.lib.aws.session import establish_boto3_session
 from toil.lib.aws.utils import flatten_tags
 from toil.lib.exceptions import panic
-from toil.lib.retry import (ErrorCondition,
-                            get_error_code,
-                            get_error_message,
-                            old_retry,
-                            retry)
+from toil.lib.retry import (
+    ErrorCondition,
+    get_error_code,
+    get_error_message,
+    old_retry,
+    retry,
+)
+if TYPE_CHECKING:
+    from mypy_boto3_autoscaling.client import AutoScalingClient
+    from mypy_boto3_ec2.client import EC2Client
+    from mypy_boto3_ec2.service_resource import EC2ServiceResource, Instance
+    from mypy_boto3_ec2.type_defs import (
+        DescribeInstancesResultTypeDef,
+        InstanceTypeDef,
+        SpotInstanceRequestTypeDef,
+    )
 a_short_time = 5
 a_long_time = 60 * 60
@@ -27,44 +34,55 @@ class UserError(RuntimeError):
     def __init__(self, message=None, cause=None):
         if (message is None) == (cause is None):
             raise RuntimeError("Must pass either message or cause.")
-        super().__init__(
-            message if cause is None else cause.message)
+        super().__init__(message if cause is None else cause.message)
 def not_found(e):
     try:
-        return get_error_code(e).endswith('.NotFound')
+        return get_error_code(e).endswith(".NotFound")
     except ValueError:
         # Not the right kind of error
         return False
 def inconsistencies_detected(e):
-    if get_error_code(e) == 'InvalidGroup.NotFound':
+    if get_error_code(e) == "InvalidGroup.NotFound":
         return True
     m = get_error_message(e).lower()
-    matches = ('invalid iam instance profile' in m) or ('no associated iam roles' in m)
+    matches = ("invalid iam instance profile" in m) or ("no associated iam roles" in m)
     return matches
 # We also define these error categories for the new retry decorator
-INCONSISTENCY_ERRORS = [ErrorCondition(boto_error_codes=['InvalidGroup.NotFound']),
-                        ErrorCondition(error_message_must_include='Invalid IAM Instance Profile'),
-                        ErrorCondition(error_message_must_include='no associated IAM Roles')]
+INCONSISTENCY_ERRORS = [
+    ErrorCondition(boto_error_codes=["InvalidGroup.NotFound"]),
+    ErrorCondition(error_message_must_include="Invalid IAM Instance Profile"),
+    ErrorCondition(error_message_must_include="no associated IAM Roles"),
+]
 def retry_ec2(t=a_short_time, retry_for=10 * a_short_time, retry_while=not_found):
-    return old_retry(delays=(t, t, t * 2, t * 4),
-                     timeout=retry_for,
-                     predicate=retry_while)
+    return old_retry(
+        delays=(t, t, t * 2, t * 4), timeout=retry_for, predicate=retry_while
+    )
 class UnexpectedResourceState(Exception):
     def __init__(self, resource, to_state, state):
         super().__init__(
-            "Expected state of %s to be '%s' but got '%s'" %
-            (resource, to_state, state))
-def wait_transition(resource, from_states, to_state,
-                    state_getter=attrgetter('state')):
+            "Expected state of %s to be '%s' but got '%s'" % (resource, to_state, state)
+        )
+def wait_transition(
+    boto3_ec2: "EC2Client",
+    resource: "InstanceTypeDef",
+    from_states: Iterable[str],
+    to_state: str,
+    state_getter: Callable[["InstanceTypeDef"], str] = lambda x: x.get("State").get(
+        "Name"
+    ),
+):
     """
     Wait until the specified EC2 resource (instance, image, volume, ...) transitions from any
     of the given 'from' states to the specified 'to' state. If the instance is found in a state
@@ -76,59 +94,84 @@ def wait_transition(resource, from_states, to_state,
     :param to_state: the state of the resource when this method returns
     """
     state = state_getter(resource)
+    instance_id = resource["InstanceId"]
     while state in from_states:
         time.sleep(a_short_time)
         for attempt in retry_ec2():
             with attempt:
-                resource.update(validate=True)
+                described = boto3_ec2.describe_instances(InstanceIds=[instance_id])
+        resource = described["Reservations"][0]["Instances"][
+            0
+        ]  # there should only be one requested
         state = state_getter(resource)
     if state != to_state:
         raise UnexpectedResourceState(resource, to_state, state)
-def wait_instances_running(ec2, instances: Iterable[Boto2Instance]) -> Iterable[Boto2Instance]:
+def wait_instances_running(
+    boto3_ec2: "EC2Client", instances: Iterable["InstanceTypeDef"]
+) -> Generator["InstanceTypeDef", None, None]:
     """
     Wait until no instance in the given iterable is 'pending'. Yield every instance that
     entered the running state as soon as it does.
-    :param boto.ec2.connection.EC2Connection ec2: the EC2 connection to use for making requests
-    :param Iterable[Boto2Instance] instances: the instances to wait on
-    :rtype: Iterable[Boto2Instance]
+    :param boto3_ec2: the EC2 connection to use for making requests
+    :param instances: the instances to wait on
     """
     running_ids = set()
     other_ids = set()
     while True:
         pending_ids = set()
         for i in instances:
-            if i.state == 'pending':
-                pending_ids.add(i.id)
-            elif i.state == 'running':
-                if i.id in running_ids:
-                    raise RuntimeError("An instance was already added to the list of running instance IDs. Maybe there is a duplicate.")
-                running_ids.add(i.id)
+            i: "InstanceTypeDef"
+            if i["State"]["Name"] == "pending":
+                pending_ids.add(i["InstanceId"])
+            elif i["State"]["Name"] == "running":
+                if i["InstanceId"] in running_ids:
+                    raise RuntimeError(
+                        "An instance was already added to the list of running instance IDs. Maybe there is a duplicate."
+                    )
+                running_ids.add(i["InstanceId"])
                 yield i
             else:
-                if i.id in other_ids:
-                    raise RuntimeError("An instance was already added to the list of other instances. Maybe there is a duplicate.")
-                other_ids.add(i.id)
+                if i["InstanceId"] in other_ids:
+                    raise RuntimeError(
+                        "An instance was already added to the list of other instances. Maybe there is a duplicate."
+                    )
+                other_ids.add(i["InstanceId"])
                 yield i
-        logger.info('%i instance(s) pending, %i running, %i other.',
-                    *list(map(len, (pending_ids, running_ids, other_ids))))
+        logger.info(
+            "%i instance(s) pending, %i running, %i other.",
+            *list(map(len, (pending_ids, running_ids, other_ids))),
+        )
         if not pending_ids:
             break
         seconds = max(a_short_time, min(len(pending_ids), 10 * a_short_time))
-        logger.info('Sleeping for %is', seconds)
+        logger.info("Sleeping for %is", seconds)
         time.sleep(seconds)
         for attempt in retry_ec2():
             with attempt:
-                instances = ec2.get_only_instances(list(pending_ids))
-def wait_spot_requests_active(ec2, requests: Iterable[SpotInstanceRequest], timeout: float = None, tentative: bool = False) -> Iterable[List[SpotInstanceRequest]]:
+                described_instances = boto3_ec2.describe_instances(
+                    InstanceIds=list(pending_ids)
+                )
+                instances = [
+                    instance
+                    for reservation in described_instances["Reservations"]
+                    for instance in reservation["Instances"]
+                ]
+def wait_spot_requests_active(
+    boto3_ec2: "EC2Client",
+    requests: Iterable["SpotInstanceRequestTypeDef"],
+    timeout: float = None,
+    tentative: bool = False,
+) -> Iterable[list["SpotInstanceRequestTypeDef"]]:
     """
     Wait until no spot request in the given iterator is in the 'open' state or, optionally,
     a timeout occurs. Yield spot requests as soon as they leave the 'open' state.
+    :param boto3_ec2: ec2 client
     :param requests: The requests to wait on.
     :param timeout: Maximum time in seconds to spend waiting or None to wait forever. If a
@@ -145,55 +188,68 @@ def wait_spot_requests_active(ec2, requests: Iterable[SpotInstanceRequest], time
     other_ids = set()
     open_ids = None
-    def cancel():
-        logger.warning('Cancelling remaining %i spot requests.', len(open_ids))
-        ec2.cancel_spot_instance_requests(list(open_ids))
+    def cancel() -> None:
+        logger.warning("Cancelling remaining %i spot requests.", len(open_ids))
+        boto3_ec2.cancel_spot_instance_requests(SpotInstanceRequestIds=list(open_ids))
-    def spot_request_not_found(e):
-        return get_error_code(e) == 'InvalidSpotInstanceRequestID.NotFound'
+    def spot_request_not_found(e: Exception) -> bool:
+        return get_error_code(e) == "InvalidSpotInstanceRequestID.NotFound"
     try:
         while True:
             open_ids, eval_ids, fulfill_ids = set(), set(), set()
             batch = []
             for r in requests:
-                if r.state == 'open':
-                    open_ids.add(r.id)
-                    if r.status.code == 'pending-evaluation':
-                        eval_ids.add(r.id)
-                    elif r.status.code == 'pending-fulfillment':
-                        fulfill_ids.add(r.id)
+                r: "SpotInstanceRequestTypeDef"  # pycharm thinks it is a string
+                if r["State"] == "open":
+                    open_ids.add(r["InstanceId"])
+                    if r["Status"] == "pending-evaluation":
+                        eval_ids.add(r["InstanceId"])
+                    elif r["Status"] == "pending-fulfillment":
+                        fulfill_ids.add(r["InstanceId"])
                     else:
                         logger.info(
-                            'Request %s entered status %s indicating that it will not be '
-                            'fulfilled anytime soon.', r.id, r.status.code)
-                elif r.state == 'active':
-                    if r.id in active_ids:
-                        raise RuntimeError("A request was already added to the list of active requests. Maybe there are duplicate requests.")
-                    active_ids.add(r.id)
+                            "Request %s entered status %s indicating that it will not be "
+                            "fulfilled anytime soon.",
+                            r["InstanceId"],
+                            r["Status"],
+                        )
+                elif r["State"] == "active":
+                    if r["InstanceId"] in active_ids:
+                        raise RuntimeError(
+                            "A request was already added to the list of active requests. Maybe there are duplicate requests."
+                        )
+                    active_ids.add(r["InstanceId"])
                     batch.append(r)
                 else:
-                    if r.id in other_ids:
-                        raise RuntimeError("A request was already added to the list of other IDs. Maybe there are duplicate requests.")
-                    other_ids.add(r.id)
+                    if r["InstanceId"] in other_ids:
+                        raise RuntimeError(
+                            "A request was already added to the list of other IDs. Maybe there are duplicate requests."
+                        )
+                    other_ids.add(r["InstanceId"])
                     batch.append(r)
             if batch:
                 yield batch
-            logger.info('%i spot requests(s) are open (%i of which are pending evaluation and %i '
-                     'are pending fulfillment), %i are active and %i are in another state.',
-                        *list(map(len, (open_ids, eval_ids, fulfill_ids, active_ids, other_ids))))
+            logger.info(
+                "%i spot requests(s) are open (%i of which are pending evaluation and %i "
+                "are pending fulfillment), %i are active and %i are in another state.",
+                *list(
+                    map(len, (open_ids, eval_ids, fulfill_ids, active_ids, other_ids))
+                ),
+            )
             if not open_ids or tentative and not eval_ids and not fulfill_ids:
                 break
             sleep_time = 2 * a_short_time
             if timeout is not None and time.time() + sleep_time >= timeout:
-                logger.warning('Timed out waiting for spot requests.')
+                logger.warning("Timed out waiting for spot requests.")
                 break
-            logger.info('Sleeping for %is', sleep_time)
+            logger.info("Sleeping for %is", sleep_time)
             time.sleep(sleep_time)
             for attempt in retry_ec2(retry_while=spot_request_not_found):
                 with attempt:
-                    requests = ec2.get_all_spot_instance_requests(
-                        list(open_ids))
+                    requests = boto3_ec2.describe_spot_instance_requests(
+                        SpotInstanceRequestIds=list(open_ids)
+                    )
     except BaseException:
         if open_ids:
             with panic(logger):
@@ -204,73 +260,125 @@ def wait_spot_requests_active(ec2, requests: Iterable[SpotInstanceRequest], time
             cancel()
-def create_spot_instances(ec2, price, image_id, spec, num_instances=1, timeout=None, tentative=False, tags=None) -> Iterable[List[Boto2Instance]]:
+def create_spot_instances(
+    boto3_ec2: "EC2Client",
+    price,
+    image_id,
+    spec,
+    num_instances=1,
+    timeout=None,
+    tentative=False,
+    tags=None,
+) -> Generator["DescribeInstancesResultTypeDef", None, None]:
     """
     Create instances on the spot market.
     """
-    def spotRequestNotFound(e):
-        return getattr(e, 'error_code', None) == "InvalidSpotInstanceRequestID.NotFound"
-    for attempt in retry_ec2(retry_for=a_long_time,
-                             retry_while=inconsistencies_detected):
+    def spotRequestNotFound(e):
+        return getattr(e, "error_code", None) == "InvalidSpotInstanceRequestID.NotFound"
+    spec["LaunchSpecification"].update(
+        {"ImageId": image_id}
+    )  # boto3 image id is in the launch specification
+    for attempt in retry_ec2(
+        retry_for=a_long_time, retry_while=inconsistencies_detected
+    ):
         with attempt:
-            requests = ec2.request_spot_instances(
-                price, image_id, count=num_instances, **spec)
+            requests_dict = boto3_ec2.request_spot_instances(
+                SpotPrice=price, InstanceCount=num_instances, **spec
+            )
+            requests = requests_dict["SpotInstanceRequests"]
     if tags is not None:
-        for requestID in (request.id for request in requests):
+        for requestID in (request["SpotInstanceRequestId"] for request in requests):
             for attempt in retry_ec2(retry_while=spotRequestNotFound):
                 with attempt:
-                    ec2.create_tags([requestID], tags)
+                    boto3_ec2.create_tags(Resources=[requestID], Tags=tags)
     num_active, num_other = 0, 0
     # noinspection PyUnboundLocalVariable,PyTypeChecker
     # request_spot_instances's type annotation is wrong
-    for batch in wait_spot_requests_active(ec2,
-                                           requests,
-                                           timeout=timeout,
-                                           tentative=tentative):
+    for batch in wait_spot_requests_active(
+        boto3_ec2, requests, timeout=timeout, tentative=tentative
+    ):
         instance_ids = []
         for request in batch:
-            if request.state == 'active':
-                instance_ids.append(request.instance_id)
+            request: "SpotInstanceRequestTypeDef"
+            if request["State"] == "active":
+                instance_ids.append(request["InstanceId"])
                 num_active += 1
             else:
                 logger.info(
-                    'Request %s in unexpected state %s.',
-                    request.id,
-                    request.state)
+                    "Request %s in unexpected state %s.",
+                    request["InstanceId"],
+                    request["State"],
+                )
                 num_other += 1
         if instance_ids:
             # This next line is the reason we batch. It's so we can get multiple instances in
             # a single request.
-            yield ec2.get_only_instances(instance_ids)
+            for instance_id in instance_ids:
+                for attempt in retry_ec2():
+                    with attempt:
+                        # Increase hop limit from 1 to use Instance Metadata V2
+                        boto3_ec2.modify_instance_metadata_options(
+                            InstanceId=instance_id, HttpPutResponseHopLimit=3
+                        )
+            yield boto3_ec2.describe_instances(InstanceIds=instance_ids)
     if not num_active:
-        message = 'None of the spot requests entered the active state'
+        message = "None of the spot requests entered the active state"
         if tentative:
-            logger.warning(message + '.')
+            logger.warning(message + ".")
         else:
             raise RuntimeError(message)
     if num_other:
-        logger.warning('%i request(s) entered a state other than active.', num_other)
+        logger.warning("%i request(s) entered a state other than active.", num_other)
-def create_ondemand_instances(ec2, image_id, spec, num_instances=1) -> List[Boto2Instance]:
+def create_ondemand_instances(
+    boto3_ec2: "EC2Client",
+    image_id: str,
+    spec: Mapping[str, Any],
+    num_instances: int = 1,
+) -> list["InstanceTypeDef"]:
     """
     Requests the RunInstances EC2 API call but accounts for the race between recently created
     instance profiles, IAM roles and an instance creation that refers to them.
-    :rtype: List[Boto2Instance]
     """
-    instance_type = spec['instance_type']
-    logger.info('Creating %s instance(s) ... ', instance_type)
-    for attempt in retry_ec2(retry_for=a_long_time,
-                             retry_while=inconsistencies_detected):
+    instance_type = spec["InstanceType"]
+    logger.info("Creating %s instance(s) ... ", instance_type)
+    boto_instance_list = []
+    for attempt in retry_ec2(
+        retry_for=a_long_time, retry_while=inconsistencies_detected
+    ):
         with attempt:
-            return ec2.run_instances(image_id,
-                                     min_count=num_instances,
-                                     max_count=num_instances,
-                                     **spec).instances
+            boto_instance_list: list["InstanceTypeDef"] = boto3_ec2.run_instances(
+                ImageId=image_id, MinCount=num_instances, MaxCount=num_instances, **spec
+            )["Instances"]
+    return boto_instance_list
+def increase_instance_hop_limit(
+    boto3_ec2: "EC2Client", boto_instance_list: list["InstanceTypeDef"]
+) -> None:
+    """
+    Increase the default HTTP hop limit, as we are running Toil and Kubernetes inside a Docker container, so the default
+    hop limit of 1 will not be enough when grabbing metadata information with ec2_metadata
+    Must be called after the instances are guaranteed to be running.
+    :param boto_instance_list: List of boto instances to modify
+    :return:
+    """
+    for boto_instance in boto_instance_list:
+        instance_id = boto_instance["InstanceId"]
+        for attempt in retry_ec2():
+            with attempt:
+                # Increase hop limit from 1 to use Instance Metadata V2
+                boto3_ec2.modify_instance_metadata_options(
+                    InstanceId=instance_id, HttpPutResponseHopLimit=3
+                )
 def prune(bushy: dict) -> dict:
@@ -287,32 +395,37 @@ def prune(bushy: dict) -> dict:
 # We need a module-level client to get the dynamically-generated error types to
 # catch, and to wait on IAM items.
-iam_client = establish_boto3_session().client('iam')
+iam_client = establish_boto3_session().client("iam")
 # exception is generated by a factory so we weirdly need a client instance to reference it
-@retry(errors=[iam_client.exceptions.NoSuchEntityException],
-       intervals=[1, 1, 2, 4, 8, 16, 32, 64])
+@retry(
+    errors=[iam_client.exceptions.NoSuchEntityException],
+    intervals=[1, 1, 2, 4, 8, 16, 32, 64],
+)
 def wait_until_instance_profile_arn_exists(instance_profile_arn: str):
     # TODO: We have no guarantee that the ARN contains the name.
-    instance_profile_name = instance_profile_arn.split(':instance-profile/')[-1]
+    instance_profile_name = instance_profile_arn.split(":instance-profile/")[-1]
     logger.debug("Checking for instance profile %s...", instance_profile_name)
     iam_client.get_instance_profile(InstanceProfileName=instance_profile_name)
     logger.debug("Instance profile found")
 @retry(intervals=[5, 5, 10, 20, 20, 20, 20], errors=INCONSISTENCY_ERRORS)
-def create_instances(ec2_resource: ServiceResource,
-                     image_id: str,
-                     key_name: str,
-                     instance_type: str,
-                     num_instances: int = 1,
-                     security_group_ids: Optional[List] = None,
-                     user_data: Optional[Union[str, bytes]] = None,
-                     block_device_map: Optional[List[Dict]] = None,
-                     instance_profile_arn: Optional[str] = None,
-                     placement_az: Optional[str] = None,
-                     subnet_id: str = None,
-                     tags: Optional[Dict[str, str]] = None) -> List[dict]:
+def create_instances(
+    ec2_resource: "EC2ServiceResource",
+    image_id: str,
+    key_name: str,
+    instance_type: str,
+    num_instances: int = 1,
+    security_group_ids: Optional[list] = None,
+    user_data: Optional[Union[str, bytes]] = None,
+    block_device_map: Optional[list[dict]] = None,
+    instance_profile_arn: Optional[str] = None,
+    placement_az: Optional[str] = None,
+    subnet_id: str = None,
+    tags: Optional[dict[str, str]] = None,
+) -> list["Instance"]:
     """
     Replaces create_ondemand_instances.  Uses boto3 and returns a list of Boto3 instance dicts.
@@ -323,20 +436,25 @@ def create_instances(ec2_resource: ServiceResource,
     Tags, if given, are applied to the instances, and all volumes.
     """
-    logger.info('Creating %s instance(s) ... ', instance_type)
+    logger.info("Creating %s instance(s) ... ", instance_type)
     if isinstance(user_data, str):
-        user_data = user_data.encode('utf-8')
-    request = {'ImageId': image_id,
-               'MinCount': num_instances,
-               'MaxCount': num_instances,
-               'KeyName': key_name,
-               'SecurityGroupIds': security_group_ids,
-               'InstanceType': instance_type,
-               'UserData': user_data,
-               'BlockDeviceMappings': block_device_map,
-               'SubnetId': subnet_id}
+        user_data = user_data.encode("utf-8")
+    request = {
+        "ImageId": image_id,
+        "MinCount": num_instances,
+        "MaxCount": num_instances,
+        "KeyName": key_name,
+        "SecurityGroupIds": security_group_ids,
+        "InstanceType": instance_type,
+        "UserData": user_data,
+        "BlockDeviceMappings": block_device_map,
+        "SubnetId": subnet_id,
+        # Metadata V2 defaults hops to 1, which is an issue when running inside a docker container
+        # https://github.com/adamchainz/ec2-metadata?tab=readme-ov-file#instance-metadata-service-version-2
+        "MetadataOptions": {"HttpPutResponseHopLimit": 3},
+    }
     if instance_profile_arn:
         # We could just retry when we get an error because the ARN doesn't
@@ -344,32 +462,37 @@ def create_instances(ec2_resource: ServiceResource,
         wait_until_instance_profile_arn_exists(instance_profile_arn)
         # Add it to the request
-        request['IamInstanceProfile'] = {'Arn': instance_profile_arn}
+        request["IamInstanceProfile"] = {"Arn": instance_profile_arn}
     if placement_az:
-        request['Placement'] = {'AvailabilityZone': placement_az}
+        request["Placement"] = {"AvailabilityZone": placement_az}
     if tags:
         # Tag everything when we make it.
         flat_tags = flatten_tags(tags)
-        request['TagSpecifications'] = [{'ResourceType': 'instance', 'Tags': flat_tags},
-                                        {'ResourceType': 'volume', 'Tags': flat_tags}]
+        request["TagSpecifications"] = [
+            {"ResourceType": "instance", "Tags": flat_tags},
+            {"ResourceType": "volume", "Tags": flat_tags},
+        ]
     return ec2_resource.create_instances(**prune(request))
 @retry(intervals=[5, 5, 10, 20, 20, 20, 20], errors=INCONSISTENCY_ERRORS)
-def create_launch_template(ec2_client: BaseClient,
-                           template_name: str,
-                           image_id: str,
-                           key_name: str,
-                           instance_type: str,
-                           security_group_ids: Optional[List] = None,
-                           user_data: Optional[Union[str, bytes]] = None,
-                           block_device_map: Optional[List[Dict]] = None,
-                           instance_profile_arn: Optional[str] = None,
-                           placement_az: Optional[str] = None,
-                           subnet_id: Optional[str] = None,
-                           tags: Optional[Dict[str, str]] = None) -> str:
+def create_launch_template(
+    ec2_client: "EC2Client",
+    template_name: str,
+    image_id: str,
+    key_name: str,
+    instance_type: str,
+    security_group_ids: Optional[list] = None,
+    user_data: Optional[Union[str, bytes]] = None,
+    block_device_map: Optional[list[dict]] = None,
+    instance_profile_arn: Optional[str] = None,
+    placement_az: Optional[str] = None,
+    subnet_id: Optional[str] = None,
+    tags: Optional[dict[str, str]] = None,
+) -> str:
     """
     Creates a launch template with the given name for launching instances with the given parameters.
@@ -385,22 +508,26 @@ def create_launch_template(ec2_client: BaseClient,
     """
-    logger.info('Creating launch template for %s instances ... ', instance_type)
+    logger.info("Creating launch template for %s instances ... ", instance_type)
     if isinstance(user_data, str):
         # Make sure we have bytes
-        user_data = user_data.encode('utf-8')
+        user_data = user_data.encode("utf-8")
     # Then base64 and decode back to str.
-    user_data = b64encode(user_data).decode('utf-8')
-    template = {'ImageId': image_id,
-                'KeyName': key_name,
-                'SecurityGroupIds': security_group_ids,
-                'InstanceType': instance_type,
-                'UserData': user_data,
-                'BlockDeviceMappings': block_device_map,
-                'SubnetId': subnet_id}
+    user_data = b64encode(user_data).decode("utf-8")
+    template = {
+        "ImageId": image_id,
+        "KeyName": key_name,
+        "SecurityGroupIds": security_group_ids,
+        "InstanceType": instance_type,
+        "UserData": user_data,
+        "BlockDeviceMappings": block_device_map,
+        "SubnetId": subnet_id,
+        # Increase hop limit from 1 to use Instance Metadata V2
+        "MetadataOptions": {"HttpPutResponseHopLimit": 3},
+    }
     if instance_profile_arn:
         # We could just retry when we get an error because the ARN doesn't
@@ -408,38 +535,48 @@ def create_launch_template(ec2_client: BaseClient,
         wait_until_instance_profile_arn_exists(instance_profile_arn)
         # Add it to the request
-        template['IamInstanceProfile'] = {'Arn': instance_profile_arn}
+        template["IamInstanceProfile"] = {"Arn": instance_profile_arn}
     if placement_az:
-        template['Placement'] = {'AvailabilityZone': placement_az}
+        template["Placement"] = {"AvailabilityZone": placement_az}
+    flat_tags = []
     if tags:
         # Tag everything when we make it.
         flat_tags = flatten_tags(tags)
-        template['TagSpecifications'] = [{'ResourceType': 'instance', 'Tags': flat_tags},
-                                         {'ResourceType': 'volume', 'Tags': flat_tags}]
+        template["TagSpecifications"] = [
+            {"ResourceType": "instance", "Tags": flat_tags},
+            {"ResourceType": "volume", "Tags": flat_tags},
+        ]
-    request = {'LaunchTemplateData': prune(template),
-               'LaunchTemplateName': template_name}
+    request = {
+        "LaunchTemplateData": prune(template),
+        "LaunchTemplateName": template_name,
+    }
     if tags:
-        request['TagSpecifications'] = [{'ResourceType': 'launch-template', 'Tags': flat_tags}]
+        request["TagSpecifications"] = [
+            {"ResourceType": "launch-template", "Tags": flat_tags}
+        ]
-    return ec2_client.create_launch_template(**request)['LaunchTemplate']['LaunchTemplateId']
+    return ec2_client.create_launch_template(**request)["LaunchTemplate"][
+        "LaunchTemplateId"
+    ]
 @retry(intervals=[5, 5, 10, 20, 20, 20, 20], errors=INCONSISTENCY_ERRORS)
-def create_auto_scaling_group(autoscaling_client: BaseClient,
-                              asg_name: str,
-                              launch_template_ids: Dict[str, str],
-                              vpc_subnets: List[str],
-                              min_size: int,
-                              max_size: int,
-                              instance_types: Optional[List[str]] = None,
-                              spot_bid: Optional[float] = None,
-                              spot_cheapest: bool = False,
-                              tags: Optional[Dict[str, str]] = None) -> None:
+def create_auto_scaling_group(
+    autoscaling_client: "AutoScalingClient",
+    asg_name: str,
+    launch_template_ids: dict[str, str],
+    vpc_subnets: list[str],
+    min_size: int,
+    max_size: int,
+    instance_types: Optional[Iterable[str]] = None,
+    spot_bid: Optional[float] = None,
+    spot_cheapest: bool = False,
+    tags: Optional[dict[str, str]] = None,
+) -> None:
     """
     Create a new Auto Scaling Group with the given name (which is also its
     unique identifier).
@@ -472,19 +609,26 @@ def create_auto_scaling_group(autoscaling_client: BaseClient,
     """
     if instance_types is None:
-        instance_types = []
+        instance_types: list[str] = []
     if instance_types is not None and len(instance_types) > 20:
-        raise RuntimeError(f"Too many instance types ({len(instance_types)}) in group; AWS supports only 20.")
+        raise RuntimeError(
+            f"Too many instance types ({len(instance_types)}) in group; AWS supports only 20."
+        )
     if len(vpc_subnets) == 0:
-        raise RuntimeError("No VPC subnets specified to launch into; not clear where to put instances")
+        raise RuntimeError(
+            "No VPC subnets specified to launch into; not clear where to put instances"
+        )
     def get_launch_template_spec(instance_type):
         """
         Get a LaunchTemplateSpecification for the given instance type.
         """
-        return {'LaunchTemplateId': launch_template_ids[instance_type], 'Version': '$Default'}
+        return {
+            "LaunchTemplateId": launch_template_ids[instance_type],
+            "Version": "$Default",
+        }
     # We always write the ASG with a MixedInstancesPolicy even when we have only one type.
     # And we use a separate launch template for every instance type, and apply it as an override.
@@ -493,24 +637,42 @@ def create_auto_scaling_group(autoscaling_client: BaseClient,
     # We need to use a launch template per instance type so that different
     # instance types with specified EBS storage size overrides will get their
     # storage.
-    mip = {'LaunchTemplate': {'LaunchTemplateSpecification': get_launch_template_spec(next(iter(instance_types))),
-                              'Overrides': [{'InstanceType': t, 'LaunchTemplateSpecification': get_launch_template_spec(t)} for t in instance_types]}}
+    mip = {
+        "LaunchTemplate": {
+            "LaunchTemplateSpecification": get_launch_template_spec(
+                next(iter(instance_types))
+            ),  # noqa
+            "Overrides": [
+                {
+                    "InstanceType": t,
+                    "LaunchTemplateSpecification": get_launch_template_spec(t),
+                }
+                for t in instance_types
+            ],
+        }
+    }  # noqa
     if spot_bid is not None:
         # Ask for spot instances by saying everything above base capacity of 0 should be spot.
-        mip['InstancesDistribution'] = {'OnDemandPercentageAboveBaseCapacity': 0,
-                                        'SpotAllocationStrategy': 'capacity-optimized' if not spot_cheapest else 'lowest-price',
-                                        'SpotMaxPrice': str(spot_bid)}
-    asg = {'AutoScalingGroupName': asg_name,
-           'MixedInstancesPolicy': prune(mip),
-           'MinSize': min_size,
-           'MaxSize': max_size,
-           'VPCZoneIdentifier': ','.join(vpc_subnets)}
+        mip["InstancesDistribution"] = {
+            "OnDemandPercentageAboveBaseCapacity": 0,
+            "SpotAllocationStrategy": (
+                "capacity-optimized" if not spot_cheapest else "lowest-price"
+            ),
+            "SpotMaxPrice": str(spot_bid),
+        }
+    asg = {
+        "AutoScalingGroupName": asg_name,
+        "MixedInstancesPolicy": prune(mip),
+        "MinSize": min_size,
+        "MaxSize": max_size,
+        "VPCZoneIdentifier": ",".join(vpc_subnets),
+    }
     if tags:
         # Tag the ASG itself.
-        asg['Tags'] = flatten_tags(tags)
+        asg["Tags"] = flatten_tags(tags)
     logger.debug("Creating Autoscaling Group across subnets: %s", vpc_subnets)

toil 6.1.0a1__py3-none-any.whl → 8.0.0__py3-none-any.whl

toil 6.1.0a1py3-none-any.whl → 8.0.0py3-none-any.whl