sagemaker-core 1.0.47__py3-none-any.whl → 1.0.62__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -106,7 +106,8 @@ SAGEMAKER_PYTHON_SDK_CONFIG_SCHEMA = {
106
106
  "type": "array",
107
107
  "items": {"type": "string"},
108
108
  },
109
- }
109
+ },
110
+ "cluster_role": {"type": "string"},
110
111
  },
111
112
  },
112
113
  "CompilationJob": {
@@ -978,6 +978,7 @@ class App(Base):
978
978
  user_profile_name: The user profile name.
979
979
  space_name: The name of the space. If this value is not set, then UserProfileName must be set.
980
980
  status: The status.
981
+ effective_trusted_identity_propagation_status: The effective status of Trusted Identity Propagation (TIP) for this application. When enabled, user identities from IAM Identity Center are being propagated through the application to TIP enabled Amazon Web Services services. When disabled, standard IAM role-based access is used.
981
982
  recovery_mode: Indicates whether the application is launched in recovery mode.
982
983
  last_health_check_timestamp: The timestamp of the last health check.
983
984
  last_user_activity_timestamp: The timestamp of the last user's activity. LastUserActivityTimestamp is also updated when SageMaker AI performs health checks without user activity. As a result, this value is set to the same value as LastHealthCheckTimestamp.
@@ -995,6 +996,7 @@ class App(Base):
995
996
  user_profile_name: Optional[str] = Unassigned()
996
997
  space_name: Optional[str] = Unassigned()
997
998
  status: Optional[str] = Unassigned()
999
+ effective_trusted_identity_propagation_status: Optional[str] = Unassigned()
998
1000
  recovery_mode: Optional[bool] = Unassigned()
999
1001
  last_health_check_timestamp: Optional[datetime.datetime] = Unassigned()
1000
1002
  last_user_activity_timestamp: Optional[datetime.datetime] = Unassigned()
@@ -3222,7 +3224,11 @@ class Cluster(Base):
3222
3224
  restricted_instance_groups: The specialized instance groups for training models like Amazon Nova to be created in the SageMaker HyperPod cluster.
3223
3225
  vpc_config:
3224
3226
  orchestrator: The type of orchestrator used for the SageMaker HyperPod cluster.
3227
+ tiered_storage_config: The current configuration for managed tier checkpointing on the HyperPod cluster. For example, this shows whether the feature is enabled and the percentage of cluster memory allocated for checkpoint storage.
3225
3228
  node_recovery: The node recovery mode configured for the SageMaker HyperPod cluster.
3229
+ node_provisioning_mode: The mode used for provisioning nodes in the cluster.
3230
+ cluster_role: The Amazon Resource Name (ARN) of the IAM role that HyperPod uses for cluster autoscaling operations.
3231
+ auto_scaling: The current autoscaling configuration and status for the autoscaler.
3226
3232
 
3227
3233
  """
3228
3234
 
@@ -3237,7 +3243,11 @@ class Cluster(Base):
3237
3243
  )
3238
3244
  vpc_config: Optional[shapes.VpcConfig] = Unassigned()
3239
3245
  orchestrator: Optional[shapes.ClusterOrchestrator] = Unassigned()
3246
+ tiered_storage_config: Optional[shapes.ClusterTieredStorageConfig] = Unassigned()
3240
3247
  node_recovery: Optional[str] = Unassigned()
3248
+ node_provisioning_mode: Optional[str] = Unassigned()
3249
+ cluster_role: Optional[str] = Unassigned()
3250
+ auto_scaling: Optional[shapes.ClusterAutoScalingConfigOutput] = Unassigned()
3241
3251
 
3242
3252
  def get_name(self) -> str:
3243
3253
  attributes = vars(self)
@@ -3262,7 +3272,8 @@ class Cluster(Base):
3262
3272
  "vpc_config": {
3263
3273
  "security_group_ids": {"type": "array", "items": {"type": "string"}},
3264
3274
  "subnets": {"type": "array", "items": {"type": "string"}},
3265
- }
3275
+ },
3276
+ "cluster_role": {"type": "string"},
3266
3277
  }
3267
3278
  return create_func(
3268
3279
  *args,
@@ -3287,6 +3298,10 @@ class Cluster(Base):
3287
3298
  tags: Optional[List[shapes.Tag]] = Unassigned(),
3288
3299
  orchestrator: Optional[shapes.ClusterOrchestrator] = Unassigned(),
3289
3300
  node_recovery: Optional[str] = Unassigned(),
3301
+ tiered_storage_config: Optional[shapes.ClusterTieredStorageConfig] = Unassigned(),
3302
+ node_provisioning_mode: Optional[str] = Unassigned(),
3303
+ cluster_role: Optional[str] = Unassigned(),
3304
+ auto_scaling: Optional[shapes.ClusterAutoScalingConfig] = Unassigned(),
3290
3305
  session: Optional[Session] = None,
3291
3306
  region: Optional[str] = None,
3292
3307
  ) -> Optional["Cluster"]:
@@ -3299,8 +3314,12 @@ class Cluster(Base):
3299
3314
  restricted_instance_groups: The specialized instance groups for training models like Amazon Nova to be created in the SageMaker HyperPod cluster.
3300
3315
  vpc_config: Specifies the Amazon Virtual Private Cloud (VPC) that is associated with the Amazon SageMaker HyperPod cluster. You can control access to and from your resources by configuring your VPC. For more information, see Give SageMaker access to resources in your Amazon VPC. When your Amazon VPC and subnets support IPv6, network communications differ based on the cluster orchestration platform: Slurm-orchestrated clusters automatically configure nodes with dual IPv6 and IPv4 addresses, allowing immediate IPv6 network communications. In Amazon EKS-orchestrated clusters, nodes receive dual-stack addressing, but pods can only use IPv6 when the Amazon EKS cluster is explicitly IPv6-enabled. For information about deploying an IPv6 Amazon EKS cluster, see Amazon EKS IPv6 Cluster Deployment. Additional resources for IPv6 configuration: For information about adding IPv6 support to your VPC, see to IPv6 Support for VPC. For information about creating a new IPv6-compatible VPC, see Amazon VPC Creation Guide. To configure SageMaker HyperPod with a custom Amazon VPC, see Custom Amazon VPC Setup for SageMaker HyperPod.
3301
3316
  tags: Custom tags for managing the SageMaker HyperPod cluster as an Amazon Web Services resource. You can add tags to your cluster in the same way you add them in other Amazon Web Services services that support tagging. To learn more about tagging Amazon Web Services resources in general, see Tagging Amazon Web Services Resources User Guide.
3302
- orchestrator: The type of orchestrator to use for the SageMaker HyperPod cluster. Currently, the only supported value is "eks", which is to use an Amazon Elastic Kubernetes Service (EKS) cluster as the orchestrator.
3317
+ orchestrator: The type of orchestrator to use for the SageMaker HyperPod cluster. Currently, the only supported value is "eks", which is to use an Amazon Elastic Kubernetes Service cluster as the orchestrator.
3303
3318
  node_recovery: The node recovery mode for the SageMaker HyperPod cluster. When set to Automatic, SageMaker HyperPod will automatically reboot or replace faulty nodes when issues are detected. When set to None, cluster administrators will need to manually manage any faulty cluster instances.
3319
+ tiered_storage_config: The configuration for managed tier checkpointing on the HyperPod cluster. When enabled, this feature uses a multi-tier storage approach for storing model checkpoints, providing faster checkpoint operations and improved fault tolerance across cluster nodes.
3320
+ node_provisioning_mode: The mode for provisioning nodes in the cluster. You can specify the following modes: Continuous: Scaling behavior that enables 1) concurrent operation execution within instance groups, 2) continuous retry mechanisms for failed operations, 3) enhanced customer visibility into cluster events through detailed event streams, 4) partial provisioning capabilities. Your clusters and instance groups remain InService while scaling. This mode is only supported for EKS orchestrated clusters.
3321
+ cluster_role: The Amazon Resource Name (ARN) of the IAM role that HyperPod assumes to perform cluster autoscaling operations. This role must have permissions for sagemaker:BatchAddClusterNodes and sagemaker:BatchDeleteClusterNodes. This is only required when autoscaling is enabled and when HyperPod is performing autoscaling operations.
3322
+ auto_scaling: The autoscaling configuration for the cluster. Enables automatic scaling of cluster nodes based on workload demand using a Karpenter-based system.
3304
3323
  session: Boto3 session.
3305
3324
  region: Region name.
3306
3325
 
@@ -3337,6 +3356,10 @@ class Cluster(Base):
3337
3356
  "Tags": tags,
3338
3357
  "Orchestrator": orchestrator,
3339
3358
  "NodeRecovery": node_recovery,
3359
+ "TieredStorageConfig": tiered_storage_config,
3360
+ "NodeProvisioningMode": node_provisioning_mode,
3361
+ "ClusterRole": cluster_role,
3362
+ "AutoScaling": auto_scaling,
3340
3363
  }
3341
3364
 
3342
3365
  operation_input_args = Base.populate_chained_attributes(
@@ -3450,8 +3473,11 @@ class Cluster(Base):
3450
3473
  restricted_instance_groups: Optional[
3451
3474
  List[shapes.ClusterRestrictedInstanceGroupSpecification]
3452
3475
  ] = Unassigned(),
3476
+ tiered_storage_config: Optional[shapes.ClusterTieredStorageConfig] = Unassigned(),
3453
3477
  node_recovery: Optional[str] = Unassigned(),
3454
3478
  instance_groups_to_delete: Optional[List[str]] = Unassigned(),
3479
+ cluster_role: Optional[str] = Unassigned(),
3480
+ auto_scaling: Optional[shapes.ClusterAutoScalingConfig] = Unassigned(),
3455
3481
  ) -> Optional["Cluster"]:
3456
3482
  """
3457
3483
  Update a Cluster resource
@@ -3484,8 +3510,11 @@ class Cluster(Base):
3484
3510
  "ClusterName": self.cluster_name,
3485
3511
  "InstanceGroups": instance_groups,
3486
3512
  "RestrictedInstanceGroups": restricted_instance_groups,
3513
+ "TieredStorageConfig": tiered_storage_config,
3487
3514
  "NodeRecovery": node_recovery,
3488
3515
  "InstanceGroupsToDelete": instance_groups_to_delete,
3516
+ "ClusterRole": cluster_role,
3517
+ "AutoScaling": auto_scaling,
3489
3518
  }
3490
3519
  logger.debug(f"Input request: {operation_input_args}")
3491
3520
  # serialize the input request
@@ -3731,6 +3760,7 @@ class Cluster(Base):
3731
3760
  def get_node(
3732
3761
  self,
3733
3762
  node_id: Optional[str] = Unassigned(),
3763
+ node_logical_id: Optional[str] = Unassigned(),
3734
3764
  session: Optional[Session] = None,
3735
3765
  region: Optional[str] = None,
3736
3766
  ) -> Optional[shapes.ClusterNodeDetails]:
@@ -3739,6 +3769,7 @@ class Cluster(Base):
3739
3769
 
3740
3770
  Parameters:
3741
3771
  node_id: The ID of the SageMaker HyperPod cluster node.
3772
+ node_logical_id: The logical identifier of the node to describe. You can specify either NodeLogicalId or InstanceId, but not both. NodeLogicalId can be used to describe nodes that are still being provisioned and don't yet have an InstanceId assigned.
3742
3773
  session: Boto3 session.
3743
3774
  region: Region name.
3744
3775
 
@@ -3761,6 +3792,7 @@ class Cluster(Base):
3761
3792
  operation_input_args = {
3762
3793
  "ClusterName": self.cluster_name,
3763
3794
  "NodeId": node_id,
3795
+ "NodeLogicalId": node_logical_id,
3764
3796
  }
3765
3797
  # serialize the input request
3766
3798
  operation_input_args = serialize(operation_input_args)
@@ -3785,6 +3817,7 @@ class Cluster(Base):
3785
3817
  instance_group_name_contains: Optional[str] = Unassigned(),
3786
3818
  sort_by: Optional[str] = Unassigned(),
3787
3819
  sort_order: Optional[str] = Unassigned(),
3820
+ include_node_logical_ids: Optional[bool] = Unassigned(),
3788
3821
  session: Optional[Session] = None,
3789
3822
  region: Optional[str] = None,
3790
3823
  ) -> ResourceIterator[shapes.ClusterNodeDetails]:
@@ -3799,6 +3832,7 @@ class Cluster(Base):
3799
3832
  next_token: If the result of the previous ListClusterNodes request was truncated, the response includes a NextToken. To retrieve the next set of cluster nodes, use the token in the next request.
3800
3833
  sort_by: The field by which to sort results. The default value is CREATION_TIME.
3801
3834
  sort_order: The sort order for results. The default value is Ascending.
3835
+ include_node_logical_ids: Specifies whether to include nodes that are still being provisioned in the response. When set to True, the response includes all nodes regardless of their provisioning status. When set to False (default), only nodes with assigned InstanceIds are returned.
3802
3836
  session: Boto3 session.
3803
3837
  region: Region name.
3804
3838
 
@@ -3825,6 +3859,7 @@ class Cluster(Base):
3825
3859
  "InstanceGroupNameContains": instance_group_name_contains,
3826
3860
  "SortBy": sort_by,
3827
3861
  "SortOrder": sort_order,
3862
+ "IncludeNodeLogicalIds": include_node_logical_ids,
3828
3863
  }
3829
3864
  # serialize the input request
3830
3865
  operation_input_args = serialize(operation_input_args)
@@ -3847,6 +3882,7 @@ class Cluster(Base):
3847
3882
  def update_software(
3848
3883
  self,
3849
3884
  deployment_config: Optional[shapes.DeploymentConfiguration] = Unassigned(),
3885
+ image_id: Optional[str] = Unassigned(),
3850
3886
  session: Optional[Session] = None,
3851
3887
  region: Optional[str] = None,
3852
3888
  ) -> None:
@@ -3855,6 +3891,7 @@ class Cluster(Base):
3855
3891
 
3856
3892
  Parameters:
3857
3893
  deployment_config: The configuration to use when updating the AMI versions.
3894
+ image_id: When configuring your HyperPod cluster, you can specify an image ID using one of the following options: HyperPodPublicAmiId: Use a HyperPod public AMI CustomAmiId: Use your custom AMI default: Use the default latest system image If you choose to use a custom AMI (CustomAmiId), ensure it meets the following requirements: Encryption: The custom AMI must be unencrypted. Ownership: The custom AMI must be owned by the same Amazon Web Services account that is creating the HyperPod cluster. Volume support: Only the primary AMI snapshot volume is supported; additional AMI volumes are not supported. When updating the instance group's AMI through the UpdateClusterSoftware operation, if an instance group uses a custom AMI, you must provide an ImageId or use the default as input. Note that if you don't specify an instance group in your UpdateClusterSoftware request, then all of the instance groups are patched with the specified image.
3858
3895
  session: Boto3 session.
3859
3896
  region: Region name.
3860
3897
 
@@ -3876,6 +3913,7 @@ class Cluster(Base):
3876
3913
  "ClusterName": self.cluster_name,
3877
3914
  "InstanceGroups": self.instance_groups,
3878
3915
  "DeploymentConfig": deployment_config,
3916
+ "ImageId": image_id,
3879
3917
  }
3880
3918
  # serialize the input request
3881
3919
  operation_input_args = serialize(operation_input_args)
@@ -3893,6 +3931,7 @@ class Cluster(Base):
3893
3931
  def batch_delete_nodes(
3894
3932
  self,
3895
3933
  node_ids: Optional[List[str]] = Unassigned(),
3934
+ node_logical_ids: Optional[List[str]] = Unassigned(),
3896
3935
  session: Optional[Session] = None,
3897
3936
  region: Optional[str] = None,
3898
3937
  ) -> Optional[shapes.BatchDeleteClusterNodesResponse]:
@@ -3901,6 +3940,7 @@ class Cluster(Base):
3901
3940
 
3902
3941
  Parameters:
3903
3942
  node_ids: A list of node IDs to be deleted from the specified cluster. For SageMaker HyperPod clusters using the Slurm workload manager, you cannot remove instances that are configured as Slurm controller nodes. If you need to delete more than 99 instances, contact Support for assistance.
3943
+ node_logical_ids: A list of NodeLogicalIds identifying the nodes to be deleted. You can specify up to 50 NodeLogicalIds. You must specify either NodeLogicalIds, InstanceIds, or both, with a combined maximum of 50 identifiers.
3904
3944
  session: Boto3 session.
3905
3945
  region: Region name.
3906
3946
 
@@ -3923,6 +3963,7 @@ class Cluster(Base):
3923
3963
  operation_input_args = {
3924
3964
  "ClusterName": self.cluster_name,
3925
3965
  "NodeIds": node_ids,
3966
+ "NodeLogicalIds": node_logical_ids,
3926
3967
  }
3927
3968
  # serialize the input request
3928
3969
  operation_input_args = serialize(operation_input_args)
@@ -9407,20 +9448,20 @@ class Endpoint(Base):
9407
9448
  region: Optional[str] = None,
9408
9449
  ) -> Optional[shapes.InvokeEndpointOutput]:
9409
9450
  """
9410
- After you deploy a model into production using Amazon SageMaker hosting services, your client applications use this API to get inferences from the model hosted at the specified endpoint.
9451
+ After you deploy a model into production using Amazon SageMaker AI hosting services, your client applications use this API to get inferences from the model hosted at the specified endpoint.
9411
9452
 
9412
9453
  Parameters:
9413
- body: Provides input data, in the format specified in the ContentType request header. Amazon SageMaker passes all of the data in the body to the model. For information about the format of the request body, see Common Data Formats-Inference.
9454
+ body: Provides input data, in the format specified in the ContentType request header. Amazon SageMaker AI passes all of the data in the body to the model. For information about the format of the request body, see Common Data Formats-Inference.
9414
9455
  content_type: The MIME type of the input data in the request body.
9415
9456
  accept: The desired MIME type of the inference response from the model container.
9416
- custom_attributes: Provides additional information about a request for an inference submitted to a model hosted at an Amazon SageMaker endpoint. The information is an opaque value that is forwarded verbatim. You could use this value, for example, to provide an ID that you can use to track a request or to provide other metadata that a service endpoint was programmed to process. The value must consist of no more than 1024 visible US-ASCII characters as specified in Section 3.3.6. Field Value Components of the Hypertext Transfer Protocol (HTTP/1.1). The code in your model is responsible for setting or updating any custom attributes in the response. If your code does not set this value in the response, an empty value is returned. For example, if a custom attribute represents the trace ID, your model can prepend the custom attribute with Trace ID: in your post-processing function. This feature is currently supported in the Amazon Web Services SDKs but not in the Amazon SageMaker Python SDK.
9457
+ custom_attributes: Provides additional information about a request for an inference submitted to a model hosted at an Amazon SageMaker AI endpoint. The information is an opaque value that is forwarded verbatim. You could use this value, for example, to provide an ID that you can use to track a request or to provide other metadata that a service endpoint was programmed to process. The value must consist of no more than 1024 visible US-ASCII characters as specified in Section 3.3.6. Field Value Components of the Hypertext Transfer Protocol (HTTP/1.1). The code in your model is responsible for setting or updating any custom attributes in the response. If your code does not set this value in the response, an empty value is returned. For example, if a custom attribute represents the trace ID, your model can prepend the custom attribute with Trace ID: in your post-processing function. This feature is currently supported in the Amazon Web Services SDKs but not in the Amazon SageMaker AI Python SDK.
9417
9458
  target_model: The model to request for inference when invoking a multi-model endpoint.
9418
9459
  target_variant: Specify the production variant to send the inference request to when invoking an endpoint that is running two or more variants. Note that this parameter overrides the default behavior for the endpoint, which is to distribute the invocation traffic based on the variant weights. For information about how to use variant targeting to perform a/b testing, see Test models in production
9419
9460
  target_container_hostname: If the endpoint hosts multiple containers and is configured to use direct invocation, this parameter specifies the host name of the container to invoke.
9420
9461
  inference_id: If you provide a value, it is added to the captured data when you enable data capture on the endpoint. For information about data capture, see Capture Data.
9421
9462
  enable_explanations: An optional JMESPath expression used to override the EnableExplanations parameter of the ClarifyExplainerConfig API. See the EnableExplanations section in the developer guide for more information.
9422
9463
  inference_component_name: If the endpoint hosts one or more inference components, this parameter specifies the name of inference component to invoke.
9423
- session_id: Creates a stateful session or identifies an existing one. You can do one of the following: Create a stateful session by specifying the value NEW_SESSION. Send your request to an existing stateful session by specifying the ID of that session. With a stateful session, you can send multiple requests to a stateful model. When you create a session with a stateful model, the model must create the session ID and set the expiration time. The model must also provide that information in the response to your request. You can get the ID and timestamp from the NewSessionId response parameter. For any subsequent request where you specify that session ID, SageMaker routes the request to the same instance that supports the session.
9464
+ session_id: Creates a stateful session or identifies an existing one. You can do one of the following: Create a stateful session by specifying the value NEW_SESSION. Send your request to an existing stateful session by specifying the ID of that session. With a stateful session, you can send multiple requests to a stateful model. When you create a session with a stateful model, the model must create the session ID and set the expiration time. The model must also provide that information in the response to your request. You can get the ID and timestamp from the NewSessionId response parameter. For any subsequent request where you specify that session ID, SageMaker AI routes the request to the same instance that supports the session.
9424
9465
  session: Boto3 session.
9425
9466
  region: Region name.
9426
9467
 
@@ -9488,14 +9529,14 @@ class Endpoint(Base):
9488
9529
  region: Optional[str] = None,
9489
9530
  ) -> Optional[shapes.InvokeEndpointAsyncOutput]:
9490
9531
  """
9491
- After you deploy a model into production using Amazon SageMaker hosting services, your client applications use this API to get inferences from the model hosted at the specified endpoint in an asynchronous manner.
9532
+ After you deploy a model into production using Amazon SageMaker AI hosting services, your client applications use this API to get inferences from the model hosted at the specified endpoint in an asynchronous manner.
9492
9533
 
9493
9534
  Parameters:
9494
9535
  input_location: The Amazon S3 URI where the inference request payload is stored.
9495
9536
  content_type: The MIME type of the input data in the request body.
9496
9537
  accept: The desired MIME type of the inference response from the model container.
9497
- custom_attributes: Provides additional information about a request for an inference submitted to a model hosted at an Amazon SageMaker endpoint. The information is an opaque value that is forwarded verbatim. You could use this value, for example, to provide an ID that you can use to track a request or to provide other metadata that a service endpoint was programmed to process. The value must consist of no more than 1024 visible US-ASCII characters as specified in Section 3.3.6. Field Value Components of the Hypertext Transfer Protocol (HTTP/1.1). The code in your model is responsible for setting or updating any custom attributes in the response. If your code does not set this value in the response, an empty value is returned. For example, if a custom attribute represents the trace ID, your model can prepend the custom attribute with Trace ID: in your post-processing function. This feature is currently supported in the Amazon Web Services SDKs but not in the Amazon SageMaker Python SDK.
9498
- inference_id: The identifier for the inference request. Amazon SageMaker will generate an identifier for you if none is specified.
9538
+ custom_attributes: Provides additional information about a request for an inference submitted to a model hosted at an Amazon SageMaker AI endpoint. The information is an opaque value that is forwarded verbatim. You could use this value, for example, to provide an ID that you can use to track a request or to provide other metadata that a service endpoint was programmed to process. The value must consist of no more than 1024 visible US-ASCII characters as specified in Section 3.3.6. Field Value Components of the Hypertext Transfer Protocol (HTTP/1.1). The code in your model is responsible for setting or updating any custom attributes in the response. If your code does not set this value in the response, an empty value is returned. For example, if a custom attribute represents the trace ID, your model can prepend the custom attribute with Trace ID: in your post-processing function. This feature is currently supported in the Amazon Web Services SDKs but not in the Amazon SageMaker AI Python SDK.
9539
+ inference_id: The identifier for the inference request. Amazon SageMaker AI will generate an identifier for you if none is specified.
9499
9540
  request_ttl_seconds: Maximum age in seconds a request can be in the queue before it is marked as expired. The default is 6 hours, or 21,600 seconds.
9500
9541
  invocation_timeout_seconds: Maximum amount of time in seconds a request can be processed before it is marked as expired. The default is 15 minutes, or 900 seconds.
9501
9542
  session: Boto3 session.
@@ -9563,10 +9604,10 @@ class Endpoint(Base):
9563
9604
  Invokes a model at the specified endpoint to return the inference response as a stream.
9564
9605
 
9565
9606
  Parameters:
9566
- body: Provides input data, in the format specified in the ContentType request header. Amazon SageMaker passes all of the data in the body to the model. For information about the format of the request body, see Common Data Formats-Inference.
9607
+ body: Provides input data, in the format specified in the ContentType request header. Amazon SageMaker AI passes all of the data in the body to the model. For information about the format of the request body, see Common Data Formats-Inference.
9567
9608
  content_type: The MIME type of the input data in the request body.
9568
9609
  accept: The desired MIME type of the inference response from the model container.
9569
- custom_attributes: Provides additional information about a request for an inference submitted to a model hosted at an Amazon SageMaker endpoint. The information is an opaque value that is forwarded verbatim. You could use this value, for example, to provide an ID that you can use to track a request or to provide other metadata that a service endpoint was programmed to process. The value must consist of no more than 1024 visible US-ASCII characters as specified in Section 3.3.6. Field Value Components of the Hypertext Transfer Protocol (HTTP/1.1). The code in your model is responsible for setting or updating any custom attributes in the response. If your code does not set this value in the response, an empty value is returned. For example, if a custom attribute represents the trace ID, your model can prepend the custom attribute with Trace ID: in your post-processing function. This feature is currently supported in the Amazon Web Services SDKs but not in the Amazon SageMaker Python SDK.
9610
+ custom_attributes: Provides additional information about a request for an inference submitted to a model hosted at an Amazon SageMaker AI endpoint. The information is an opaque value that is forwarded verbatim. You could use this value, for example, to provide an ID that you can use to track a request or to provide other metadata that a service endpoint was programmed to process. The value must consist of no more than 1024 visible US-ASCII characters as specified in Section 3.3.6. Field Value Components of the Hypertext Transfer Protocol (HTTP/1.1). The code in your model is responsible for setting or updating any custom attributes in the response. If your code does not set this value in the response, an empty value is returned. For example, if a custom attribute represents the trace ID, your model can prepend the custom attribute with Trace ID: in your post-processing function. This feature is currently supported in the Amazon Web Services SDKs but not in the Amazon SageMaker AI Python SDK.
9570
9611
  target_variant: Specify the production variant to send the inference request to when invoking an endpoint that is running two or more variants. Note that this parameter overrides the default behavior for the endpoint, which is to distribute the invocation traffic based on the variant weights. For information about how to use variant targeting to perform a/b testing, see Test models in production
9571
9612
  target_container_hostname: If the endpoint hosts multiple containers and is configured to use direct invocation, this parameter specifies the host name of the container to invoke.
9572
9613
  inference_id: An identifier that you assign to your request.
@@ -9591,7 +9632,7 @@ class Endpoint(Base):
9591
9632
  InternalFailure: An internal failure occurred. Try your request again. If the problem persists, contact Amazon Web Services customer support.
9592
9633
  InternalStreamFailure: The stream processing failed because of an unknown error, exception or failure. Try your request again.
9593
9634
  ModelError: Model (owned by the customer in the container) returned 4xx or 5xx error code.
9594
- ModelStreamError: An error occurred while streaming the response body. This error can have the following error codes: ModelInvocationTimeExceeded The model failed to finish sending the response within the timeout period allowed by Amazon SageMaker. StreamBroken The Transmission Control Protocol (TCP) connection between the client and the model was reset or closed.
9635
+ ModelStreamError: An error occurred while streaming the response body. This error can have the following error codes: ModelInvocationTimeExceeded The model failed to finish sending the response within the timeout period allowed by Amazon SageMaker AI. StreamBroken The Transmission Control Protocol (TCP) connection between the client and the model was reset or closed.
9595
9636
  ServiceUnavailable: The service is currently unavailable.
9596
9637
  ValidationError: There was an error validating your request.
9597
9638
  """
@@ -16916,7 +16957,7 @@ class LabelingJob(Base):
16916
16957
 
16917
16958
  Parameters:
16918
16959
  labeling_job_name: The name of the labeling job. This name is used to identify the job in a list of labeling jobs. Labeling job names must be unique within an Amazon Web Services account and region. LabelingJobName is not case sensitive. For example, Example-job and example-job are considered the same labeling job name by Ground Truth.
16919
- label_attribute_name: The attribute name to use for the label in the output manifest file. This is the key for the key/value pair formed with the label that a worker assigns to the object. The LabelAttributeName must meet the following requirements. The name can't end with "-metadata". If you are using one of the following built-in task types, the attribute name must end with "-ref". If the task type you are using is not listed below, the attribute name must not end with "-ref". Image semantic segmentation (SemanticSegmentation), and adjustment (AdjustmentSemanticSegmentation) and verification (VerificationSemanticSegmentation) labeling jobs for this task type. Video frame object detection (VideoObjectDetection), and adjustment and verification (AdjustmentVideoObjectDetection) labeling jobs for this task type. Video frame object tracking (VideoObjectTracking), and adjustment and verification (AdjustmentVideoObjectTracking) labeling jobs for this task type. 3D point cloud semantic segmentation (3DPointCloudSemanticSegmentation), and adjustment and verification (Adjustment3DPointCloudSemanticSegmentation) labeling jobs for this task type. 3D point cloud object tracking (3DPointCloudObjectTracking), and adjustment and verification (Adjustment3DPointCloudObjectTracking) labeling jobs for this task type. If you are creating an adjustment or verification labeling job, you must use a different LabelAttributeName than the one used in the original labeling job. The original labeling job is the Ground Truth labeling job that produced the labels that you want verified or adjusted. To learn more about adjustment and verification labeling jobs, see Verify and Adjust Labels.
16960
+ label_attribute_name: The attribute name to use for the label in the output manifest file. This is the key for the key/value pair formed with the label that a worker assigns to the object. The LabelAttributeName must meet the following requirements. The name can't end with "-metadata". If you are using one of the built-in task types or one of the following, the attribute name must end with "-ref". Image semantic segmentation (SemanticSegmentation) and adjustment (AdjustmentSemanticSegmentation) labeling jobs for this task type. One exception is that verification (VerificationSemanticSegmentation) must not end with -"ref". Video frame object detection (VideoObjectDetection), and adjustment and verification (AdjustmentVideoObjectDetection) labeling jobs for this task type. Video frame object tracking (VideoObjectTracking), and adjustment and verification (AdjustmentVideoObjectTracking) labeling jobs for this task type. 3D point cloud semantic segmentation (3DPointCloudSemanticSegmentation), and adjustment and verification (Adjustment3DPointCloudSemanticSegmentation) labeling jobs for this task type. 3D point cloud object tracking (3DPointCloudObjectTracking), and adjustment and verification (Adjustment3DPointCloudObjectTracking) labeling jobs for this task type. If you are creating an adjustment or verification labeling job, you must use a different LabelAttributeName than the one used in the original labeling job. The original labeling job is the Ground Truth labeling job that produced the labels that you want verified or adjusted. To learn more about adjustment and verification labeling jobs, see Verify and Adjust Labels.
16920
16961
  input_config: Input data for the labeling job, such as the Amazon S3 location of the data objects and the location of the manifest file that describes the data objects. You must specify at least one of the following: S3DataSource or SnsDataSource. Use SnsDataSource to specify an SNS input topic for a streaming labeling job. If you do not specify and SNS input topic ARN, Ground Truth will create a one-time labeling job that stops after all data objects in the input manifest file have been labeled. Use S3DataSource to specify an input manifest file for both streaming and one-time labeling jobs. Adding an S3DataSource is optional if you use SnsDataSource to create a streaming labeling job. If you use the Amazon Mechanical Turk workforce, your input data should not include confidential information, personal information or protected health information. Use ContentClassifiers to specify that your data is free of personally identifiable information and adult content.
16921
16962
  output_config: The location of the output data and the Amazon Web Services Key Management Service key ID for the key used to encrypt the output data, if any.
16922
16963
  role_arn: The Amazon Resource Number (ARN) that Amazon SageMaker assumes to perform tasks on your behalf during data labeling. You must grant this role the necessary permissions so that Amazon SageMaker can successfully complete data labeling.
@@ -22510,6 +22551,7 @@ class NotebookInstance(Base):
22510
22551
  failure_reason: If status is Failed, the reason it failed.
22511
22552
  url: The URL that you use to connect to the Jupyter notebook that is running in your notebook instance.
22512
22553
  instance_type: The type of ML compute instance running on the notebook instance.
22554
+ ip_address_type: The IP address type configured for the notebook instance. Returns ipv4 for IPv4-only connectivity or dualstack for both IPv4 and IPv6 connectivity.
22513
22555
  subnet_id: The ID of the VPC subnet.
22514
22556
  security_groups: The IDs of the VPC security groups.
22515
22557
  role_arn: The Amazon Resource Name (ARN) of the IAM role associated with the instance.
@@ -22535,6 +22577,7 @@ class NotebookInstance(Base):
22535
22577
  failure_reason: Optional[str] = Unassigned()
22536
22578
  url: Optional[str] = Unassigned()
22537
22579
  instance_type: Optional[str] = Unassigned()
22580
+ ip_address_type: Optional[str] = Unassigned()
22538
22581
  subnet_id: Optional[str] = Unassigned()
22539
22582
  security_groups: Optional[List[str]] = Unassigned()
22540
22583
  role_arn: Optional[str] = Unassigned()
@@ -22598,6 +22641,7 @@ class NotebookInstance(Base):
22598
22641
  role_arn: str,
22599
22642
  subnet_id: Optional[str] = Unassigned(),
22600
22643
  security_group_ids: Optional[List[str]] = Unassigned(),
22644
+ ip_address_type: Optional[str] = Unassigned(),
22601
22645
  kms_key_id: Optional[str] = Unassigned(),
22602
22646
  tags: Optional[List[shapes.Tag]] = Unassigned(),
22603
22647
  lifecycle_config_name: Optional[str] = Unassigned(),
@@ -22623,6 +22667,7 @@ class NotebookInstance(Base):
22623
22667
  role_arn: When you send any requests to Amazon Web Services resources from the notebook instance, SageMaker AI assumes this role to perform tasks on your behalf. You must grant this role necessary permissions so SageMaker AI can perform these tasks. The policy must allow the SageMaker AI service principal (sagemaker.amazonaws.com) permissions to assume this role. For more information, see SageMaker AI Roles. To be able to pass this role to SageMaker AI, the caller of this API must have the iam:PassRole permission.
22624
22668
  subnet_id: The ID of the subnet in a VPC to which you would like to have a connectivity from your ML compute instance.
22625
22669
  security_group_ids: The VPC security group IDs, in the form sg-xxxxxxxx. The security groups must be for the same VPC as specified in the subnet.
22670
+ ip_address_type: The IP address type for the notebook instance. Specify ipv4 for IPv4-only connectivity or dualstack for both IPv4 and IPv6 connectivity. When you specify dualstack, the subnet must support IPv6 CIDR blocks. If not specified, defaults to ipv4.
22626
22671
  kms_key_id: The Amazon Resource Name (ARN) of a Amazon Web Services Key Management Service key that SageMaker AI uses to encrypt data on the storage volume attached to your notebook instance. The KMS key you provide must be enabled. For information, see Enabling and Disabling Keys in the Amazon Web Services Key Management Service Developer Guide.
22627
22672
  tags: An array of key-value pairs. You can use tags to categorize your Amazon Web Services resources in different ways, for example, by purpose, owner, or environment. For more information, see Tagging Amazon Web Services Resources.
22628
22673
  lifecycle_config_name: The name of a lifecycle configuration to associate with the notebook instance. For information about lifestyle configurations, see Step 2.1: (Optional) Customize a Notebook Instance.
@@ -22632,7 +22677,7 @@ class NotebookInstance(Base):
22632
22677
  default_code_repository: A Git repository to associate with the notebook instance as its default code repository. This can be either the name of a Git repository stored as a resource in your account, or the URL of a Git repository in Amazon Web Services CodeCommit or in any other Git repository. When you open a notebook instance, it opens in the directory that contains this repository. For more information, see Associating Git Repositories with SageMaker AI Notebook Instances.
22633
22678
  additional_code_repositories: An array of up to three Git repositories to associate with the notebook instance. These can be either the names of Git repositories stored as resources in your account, or the URL of Git repositories in Amazon Web Services CodeCommit or in any other Git repository. These repositories are cloned at the same level as the default repository of your notebook instance. For more information, see Associating Git Repositories with SageMaker AI Notebook Instances.
22634
22679
  root_access: Whether root access is enabled or disabled for users of the notebook instance. The default value is Enabled. Lifecycle configurations need root access to be able to set up a notebook instance. Because of this, lifecycle configurations associated with a notebook instance always run with root access even if you disable root access for users.
22635
- platform_identifier: The platform identifier of the notebook instance runtime environment.
22680
+ platform_identifier: The platform identifier of the notebook instance runtime environment. The default value is notebook-al2-v2.
22636
22681
  instance_metadata_service_configuration: Information on the IMDS configuration of the notebook instance
22637
22682
  session: Boto3 session.
22638
22683
  region: Region name.
@@ -22666,6 +22711,7 @@ class NotebookInstance(Base):
22666
22711
  "InstanceType": instance_type,
22667
22712
  "SubnetId": subnet_id,
22668
22713
  "SecurityGroupIds": security_group_ids,
22714
+ "IpAddressType": ip_address_type,
22669
22715
  "RoleArn": role_arn,
22670
22716
  "KmsKeyId": kms_key_id,
22671
22717
  "Tags": tags,
@@ -22788,6 +22834,8 @@ class NotebookInstance(Base):
22788
22834
  def update(
22789
22835
  self,
22790
22836
  instance_type: Optional[str] = Unassigned(),
22837
+ ip_address_type: Optional[str] = Unassigned(),
22838
+ platform_identifier: Optional[str] = Unassigned(),
22791
22839
  role_arn: Optional[str] = Unassigned(),
22792
22840
  lifecycle_config_name: Optional[str] = Unassigned(),
22793
22841
  disassociate_lifecycle_config: Optional[bool] = Unassigned(),
@@ -22835,6 +22883,8 @@ class NotebookInstance(Base):
22835
22883
  operation_input_args = {
22836
22884
  "NotebookInstanceName": self.notebook_instance_name,
22837
22885
  "InstanceType": instance_type,
22886
+ "IpAddressType": ip_address_type,
22887
+ "PlatformIdentifier": platform_identifier,
22838
22888
  "RoleArn": role_arn,
22839
22889
  "LifecycleConfigName": lifecycle_config_name,
22840
22890
  "DisassociateLifecycleConfig": disassociate_lifecycle_config,
@@ -23949,7 +23999,7 @@ class PartnerApp(Base):
23949
23999
  arn: The ARN of the SageMaker Partner AI App that was described.
23950
24000
  name: The name of the SageMaker Partner AI App.
23951
24001
  type: The type of SageMaker Partner AI App. Must be one of the following: lakera-guard, comet, deepchecks-llm-evaluation, or fiddler.
23952
- status: The status of the SageMaker Partner AI App.
24002
+ status: The status of the SageMaker Partner AI App. Creating: SageMaker AI is creating the partner AI app. The partner AI app is not available during creation. Updating: SageMaker AI is updating the partner AI app. The partner AI app is not available when updating. Deleting: SageMaker AI is deleting the partner AI app. The partner AI app is not available during deletion. Available: The partner AI app is provisioned and accessible. Failed: The partner AI app is in a failed state and isn't available. SageMaker AI is investigating the issue. For further guidance, contact Amazon Web Services Support. UpdateFailed: The partner AI app couldn't be updated but is available. Deleted: The partner AI app is permanently deleted and not available.
23953
24003
  creation_time: The time that the SageMaker Partner AI App was created.
23954
24004
  last_modified_time: The time that the SageMaker Partner AI App was last modified.
23955
24005
  execution_role_arn: The ARN of the IAM role associated with the SageMaker Partner AI App.
@@ -26260,6 +26310,40 @@ class ProcessingJob(Base):
26260
26310
  transform(response, "DescribeProcessingJobResponse", self)
26261
26311
  return self
26262
26312
 
26313
+ @Base.add_validate_call
26314
+ def delete(
26315
+ self,
26316
+ ) -> None:
26317
+ """
26318
+ Delete a ProcessingJob resource
26319
+
26320
+ Raises:
26321
+ botocore.exceptions.ClientError: This exception is raised for AWS service related errors.
26322
+ The error message and error code can be parsed from the exception as follows:
26323
+ ```
26324
+ try:
26325
+ # AWS service call here
26326
+ except botocore.exceptions.ClientError as e:
26327
+ error_message = e.response['Error']['Message']
26328
+ error_code = e.response['Error']['Code']
26329
+ ```
26330
+ ResourceInUse: Resource being accessed is in use.
26331
+ ResourceNotFound: Resource being access is not found.
26332
+ """
26333
+
26334
+ client = Base.get_sagemaker_client()
26335
+
26336
+ operation_input_args = {
26337
+ "ProcessingJobName": self.processing_job_name,
26338
+ }
26339
+ # serialize the input request
26340
+ operation_input_args = serialize(operation_input_args)
26341
+ logger.debug(f"Serialized input request: {operation_input_args}")
26342
+
26343
+ client.delete_processing_job(**operation_input_args)
26344
+
26345
+ logger.info(f"Deleting {self.__class__.__name__} - {self.get_name()}")
26346
+
26263
26347
  @Base.add_validate_call
26264
26348
  def stop(self) -> None:
26265
26349
  """
@@ -28660,6 +28744,40 @@ class TrainingJob(Base):
28660
28744
 
28661
28745
  return self
28662
28746
 
28747
+ @Base.add_validate_call
28748
+ def delete(
28749
+ self,
28750
+ ) -> None:
28751
+ """
28752
+ Delete a TrainingJob resource
28753
+
28754
+ Raises:
28755
+ botocore.exceptions.ClientError: This exception is raised for AWS service related errors.
28756
+ The error message and error code can be parsed from the exception as follows:
28757
+ ```
28758
+ try:
28759
+ # AWS service call here
28760
+ except botocore.exceptions.ClientError as e:
28761
+ error_message = e.response['Error']['Message']
28762
+ error_code = e.response['Error']['Code']
28763
+ ```
28764
+ ResourceInUse: Resource being accessed is in use.
28765
+ ResourceNotFound: Resource being access is not found.
28766
+ """
28767
+
28768
+ client = Base.get_sagemaker_client()
28769
+
28770
+ operation_input_args = {
28771
+ "TrainingJobName": self.training_job_name,
28772
+ }
28773
+ # serialize the input request
28774
+ operation_input_args = serialize(operation_input_args)
28775
+ logger.debug(f"Serialized input request: {operation_input_args}")
28776
+
28777
+ client.delete_training_job(**operation_input_args)
28778
+
28779
+ logger.info(f"Deleting {self.__class__.__name__} - {self.get_name()}")
28780
+
28663
28781
  @Base.add_validate_call
28664
28782
  def stop(self) -> None:
28665
28783
  """
@@ -28774,6 +28892,69 @@ class TrainingJob(Base):
28774
28892
  raise TimeoutExceededError(resouce_type="TrainingJob", status=current_status)
28775
28893
  time.sleep(poll)
28776
28894
 
28895
+ @Base.add_validate_call
28896
+ def wait_for_delete(
28897
+ self,
28898
+ poll: int = 5,
28899
+ timeout: Optional[int] = None,
28900
+ ) -> None:
28901
+ """
28902
+ Wait for a TrainingJob resource to be deleted.
28903
+
28904
+ Parameters:
28905
+ poll: The number of seconds to wait between each poll.
28906
+ timeout: The maximum number of seconds to wait before timing out.
28907
+
28908
+ Raises:
28909
+ botocore.exceptions.ClientError: This exception is raised for AWS service related errors.
28910
+ The error message and error code can be parsed from the exception as follows:
28911
+ ```
28912
+ try:
28913
+ # AWS service call here
28914
+ except botocore.exceptions.ClientError as e:
28915
+ error_message = e.response['Error']['Message']
28916
+ error_code = e.response['Error']['Code']
28917
+ ```
28918
+ TimeoutExceededError: If the resource does not reach a terminal state before the timeout.
28919
+ DeleteFailedStatusError: If the resource reaches a failed state.
28920
+ WaiterError: Raised when an error occurs while waiting.
28921
+ """
28922
+ start_time = time.time()
28923
+
28924
+ progress = Progress(
28925
+ SpinnerColumn("bouncingBar"),
28926
+ TextColumn("{task.description}"),
28927
+ TimeElapsedColumn(),
28928
+ )
28929
+ progress.add_task("Waiting for TrainingJob to be deleted...")
28930
+ status = Status("Current status:")
28931
+
28932
+ with Live(
28933
+ Panel(
28934
+ Group(progress, status),
28935
+ title="Wait Log Panel",
28936
+ border_style=Style(color=Color.BLUE.value),
28937
+ )
28938
+ ):
28939
+ while True:
28940
+ try:
28941
+ self.refresh()
28942
+ current_status = self.training_job_status
28943
+ status.update(f"Current status: [bold]{current_status}")
28944
+
28945
+ if timeout is not None and time.time() - start_time >= timeout:
28946
+ raise TimeoutExceededError(
28947
+ resouce_type="TrainingJob", status=current_status
28948
+ )
28949
+ except botocore.exceptions.ClientError as e:
28950
+ error_code = e.response["Error"]["Code"]
28951
+
28952
+ if "ResourceNotFound" in error_code or "ValidationException" in error_code:
28953
+ logger.info("Resource was not found. It may have been deleted.")
28954
+ return
28955
+ raise e
28956
+ time.sleep(poll)
28957
+
28777
28958
  @classmethod
28778
28959
  @Base.add_validate_call
28779
28960
  def get_all(
@@ -28874,6 +29055,9 @@ class TrainingPlan(Base):
28874
29055
  total_instance_count: The total number of instances reserved in this training plan.
28875
29056
  available_instance_count: The number of instances currently available for use in this training plan.
28876
29057
  in_use_instance_count: The number of instances currently in use from this training plan.
29058
+ unhealthy_instance_count: The number of instances in the training plan that are currently in an unhealthy state.
29059
+ available_spare_instance_count: The number of available spare instances in the training plan.
29060
+ total_ultra_server_count: The total number of UltraServers reserved to this training plan.
28877
29061
  target_resources: The target resources (e.g., SageMaker Training Jobs, SageMaker HyperPod) that can use this training plan. Training plans are specific to their target resource. A training plan designed for SageMaker training jobs can only be used to schedule and run training jobs. A training plan for HyperPod clusters can be used exclusively to provide compute resources to a cluster's instance group.
28878
29062
  reserved_capacity_summaries: The list of Reserved Capacity providing the underlying compute resources of the plan.
28879
29063
 
@@ -28892,6 +29076,9 @@ class TrainingPlan(Base):
28892
29076
  total_instance_count: Optional[int] = Unassigned()
28893
29077
  available_instance_count: Optional[int] = Unassigned()
28894
29078
  in_use_instance_count: Optional[int] = Unassigned()
29079
+ unhealthy_instance_count: Optional[int] = Unassigned()
29080
+ available_spare_instance_count: Optional[int] = Unassigned()
29081
+ total_ultra_server_count: Optional[int] = Unassigned()
28895
29082
  target_resources: Optional[List[str]] = Unassigned()
28896
29083
  reserved_capacity_summaries: Optional[List[shapes.ReservedCapacitySummary]] = Unassigned()
28897
29084
 
@@ -28917,6 +29104,7 @@ class TrainingPlan(Base):
28917
29104
  cls,
28918
29105
  training_plan_name: str,
28919
29106
  training_plan_offering_id: str,
29107
+ spare_instance_count_per_ultra_server: Optional[int] = Unassigned(),
28920
29108
  tags: Optional[List[shapes.Tag]] = Unassigned(),
28921
29109
  session: Optional[Session] = None,
28922
29110
  region: Optional[str] = None,
@@ -28927,6 +29115,7 @@ class TrainingPlan(Base):
28927
29115
  Parameters:
28928
29116
  training_plan_name: The name of the training plan to create.
28929
29117
  training_plan_offering_id: The unique identifier of the training plan offering to use for creating this plan.
29118
+ spare_instance_count_per_ultra_server: Number of spare instances to reserve per UltraServer for enhanced resiliency. Default is 1.
28930
29119
  tags: An array of key-value pairs to apply to this training plan.
28931
29120
  session: Boto3 session.
28932
29121
  region: Region name.
@@ -28960,6 +29149,7 @@ class TrainingPlan(Base):
28960
29149
  operation_input_args = {
28961
29150
  "TrainingPlanName": training_plan_name,
28962
29151
  "TrainingPlanOfferingId": training_plan_offering_id,
29152
+ "SpareInstanceCountPerUltraServer": spare_instance_count_per_ultra_server,
28963
29153
  "Tags": tags,
28964
29154
  }
28965
29155