aws-sdk-sagemaker 1.338.0 → 1.340.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA256:
3
- metadata.gz: e54fd7220260c7ae2bd313f1524b522c371c3341639300d787b67dee686a31ac
4
- data.tar.gz: 0b401dde82b5ced1143ab4e38a466accf2af71a72f0ccd6a64f69a767cd24923
3
+ metadata.gz: f760b6f6d6902ca08349489fe9e34c577365953a32aa2f031a4db9e67aa9cb08
4
+ data.tar.gz: 5d01231c9d2c1d978d56deee398fb98fe79da54085d362172671724d6bce3233
5
5
  SHA512:
6
- metadata.gz: 54f2c402a70cfa7b98a138094f92539f09a745fe62f5c1c8907ffa0f74fb7623549f323a415991274a5b1cbade2076f24dcc5b024c0c77f45870bce86b618032
7
- data.tar.gz: b09d6030aeda9847de87498ee7a7f5b15c251b7b740afcdd43caf2dcb139cd6cc049400a02280c0ed1e602c5345ad29b42ee2641caca3f0b7e524341c48da0f4
6
+ metadata.gz: a658467635f982e5e53c0cd5a428c96d8f17acb120d16c31184b8ac8ddd2f21c9062c41e6df84610f95227118ae6de6a47053642188e8ed29208e2d44cfa5863
7
+ data.tar.gz: ec789fc4a9c2d3014b4e19c7a5b628f158fdc8a3b262139e86e44147b83a65107844ac19445d924aa41f1e90791d961c6c1bf8abb2ef19a9de49e6a54e63cba0
data/CHANGELOG.md CHANGED
@@ -1,6 +1,16 @@
1
1
  Unreleased Changes
2
2
  ------------------
3
3
 
4
+ 1.340.0 (2025-11-20)
5
+ ------------------
6
+
7
+ * Feature - Added training plan support for inference endpoints. Added HyperPod task governance with accelerator partition-based quota allocation. Added BatchRebootClusterNodes and BatchReplaceClusterNodes APIs. Updated ListClusterNodes to include privateDnsHostName.
8
+
9
+ 1.339.0 (2025-11-19)
10
+ ------------------
11
+
12
+ * Feature - Added support for enhanced metrics for SageMaker AI Endpoints. This feature provides utilization metrics at instance and container granularity and also provides easy configuration of the metric publish frequency, from 10 seconds to 5 minutes.
13
+
4
14
  1.338.0 (2025-11-13)
5
15
  ------------------
6
16
 
data/VERSION CHANGED
@@ -1 +1 @@
1
- 1.338.0
1
+ 1.340.0
@@ -950,6 +950,209 @@ module Aws::SageMaker
950
950
  req.send_request(options)
951
951
  end
952
952
 
953
+ # Reboots specific nodes within a SageMaker HyperPod cluster using a
954
+ # soft recovery mechanism. `BatchRebootClusterNodes` performs a graceful
955
+ # reboot of the specified nodes by calling the Amazon Elastic Compute
956
+ # Cloud `RebootInstances` API, which attempts to cleanly shut down the
957
+ # operating system before restarting the instance.
958
+ #
959
+ # This operation is useful for recovering from transient issues or
960
+ # applying certain configuration changes that require a restart.
961
+ #
962
+ # <note markdown="1"> * Rebooting a node may cause temporary service interruption for
963
+ # workloads running on that node. Ensure your workloads can handle
964
+ # node restarts or use appropriate scheduling to minimize impact.
965
+ #
966
+ # * You can reboot up to 25 nodes in a single request.
967
+ #
968
+ # * For SageMaker HyperPod clusters using the Slurm workload manager,
969
+ # ensure rebooting nodes will not disrupt critical cluster operations.
970
+ #
971
+ # </note>
972
+ #
973
+ # @option params [required, String] :cluster_name
974
+ # The name or Amazon Resource Name (ARN) of the SageMaker HyperPod
975
+ # cluster containing the nodes to reboot.
976
+ #
977
+ # @option params [Array<String>] :node_ids
978
+ # A list of EC2 instance IDs to reboot using soft recovery. You can
979
+ # specify between 1 and 25 instance IDs.
980
+ #
981
+ # <note markdown="1"> * At least one of `NodeIds` or `NodeLogicalIds` must be provided; you
982
+ # can also provide both.
983
+ #
984
+ # * Each instance ID must follow the pattern `i-` followed by 17
985
+ # hexadecimal characters (for example, `i-0123456789abcdef0`).
986
+ #
987
+ # </note>
988
+ #
989
+ # @option params [Array<String>] :node_logical_ids
990
+ # A list of logical node IDs to reboot using soft recovery. You can
991
+ # specify between 1 and 25 logical node IDs.
992
+ #
993
+ # The `NodeLogicalId` is a unique identifier that persists throughout
994
+ # the node's lifecycle and can be used to track nodes that are still
995
+ # being provisioned and don't yet have an EC2 instance ID assigned.
996
+ #
997
+ # * This parameter is only supported for clusters using `Continuous` as
998
+ # the `NodeProvisioningMode`. For clusters using the default
999
+ # provisioning mode, use `NodeIds` instead.
1000
+ #
1001
+ # * At least one of `NodeIds` or `NodeLogicalIds` must be provided; you
1002
+ # can also provide both.
1003
+ #
1004
+ # @return [Types::BatchRebootClusterNodesResponse] Returns a {Seahorse::Client::Response response} object which responds to the following methods:
1005
+ #
1006
+ # * {Types::BatchRebootClusterNodesResponse#successful #successful} => Array&lt;String&gt;
1007
+ # * {Types::BatchRebootClusterNodesResponse#failed #failed} => Array&lt;Types::BatchRebootClusterNodesError&gt;
1008
+ # * {Types::BatchRebootClusterNodesResponse#failed_node_logical_ids #failed_node_logical_ids} => Array&lt;Types::BatchRebootClusterNodeLogicalIdsError&gt;
1009
+ # * {Types::BatchRebootClusterNodesResponse#successful_node_logical_ids #successful_node_logical_ids} => Array&lt;String&gt;
1010
+ #
1011
+ # @example Request syntax with placeholder values
1012
+ #
1013
+ # resp = client.batch_reboot_cluster_nodes({
1014
+ # cluster_name: "ClusterNameOrArn", # required
1015
+ # node_ids: ["ClusterNodeId"],
1016
+ # node_logical_ids: ["ClusterNodeLogicalId"],
1017
+ # })
1018
+ #
1019
+ # @example Response structure
1020
+ #
1021
+ # resp.successful #=> Array
1022
+ # resp.successful[0] #=> String
1023
+ # resp.failed #=> Array
1024
+ # resp.failed[0].node_id #=> String
1025
+ # resp.failed[0].error_code #=> String, one of "InstanceIdNotFound", "InvalidInstanceStatus", "InstanceIdInUse", "InternalServerError"
1026
+ # resp.failed[0].message #=> String
1027
+ # resp.failed_node_logical_ids #=> Array
1028
+ # resp.failed_node_logical_ids[0].node_logical_id #=> String
1029
+ # resp.failed_node_logical_ids[0].error_code #=> String, one of "InstanceIdNotFound", "InvalidInstanceStatus", "InstanceIdInUse", "InternalServerError"
1030
+ # resp.failed_node_logical_ids[0].message #=> String
1031
+ # resp.successful_node_logical_ids #=> Array
1032
+ # resp.successful_node_logical_ids[0] #=> String
1033
+ #
1034
+ # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/BatchRebootClusterNodes AWS API Documentation
1035
+ #
1036
+ # @overload batch_reboot_cluster_nodes(params = {})
1037
+ # @param [Hash] params ({})
1038
+ def batch_reboot_cluster_nodes(params = {}, options = {})
1039
+ req = build_request(:batch_reboot_cluster_nodes, params)
1040
+ req.send_request(options)
1041
+ end
1042
+
1043
+ # Replaces specific nodes within a SageMaker HyperPod cluster with new
1044
+ # hardware. `BatchReplaceClusterNodes` terminates the specified
1045
+ # instances and provisions new replacement instances with the same
1046
+ # configuration but fresh hardware. The Amazon Machine Image (AMI) and
1047
+ # instance configuration remain the same.
1048
+ #
1049
+ # This operation is useful for recovering from hardware failures or
1050
+ # persistent issues that cannot be resolved through a reboot.
1051
+ #
1052
+ # * **Data Loss Warning:** Replacing nodes destroys all instance
1053
+ # volumes, including both root and secondary volumes. All data stored
1054
+ # on these volumes will be permanently lost and cannot be recovered.
1055
+ #
1056
+ # * To safeguard your work, back up your data to Amazon S3 or an FSx for
1057
+ # Lustre file system before invoking the API on a worker node group.
1058
+ # This will help prevent any potential data loss from the instance
1059
+ # root volume. For more information about backup, see [Use the backup
1060
+ # script provided by SageMaker HyperPod][1].
1061
+ #
1062
+ # * If you want to invoke this API on an existing cluster, you'll first
1063
+ # need to patch the cluster by running the [UpdateClusterSoftware
1064
+ # API][2]. For more information about patching a cluster, see [Update
1065
+ # the SageMaker HyperPod platform software of a cluster][3].
1066
+ #
1067
+ # * You can replace up to 25 nodes in a single request.
1068
+ #
1069
+ #
1070
+ #
1071
+ # [1]: https://docs.aws.amazon.com/sagemaker/latest/dg/sagemaker-hyperpod-operate-cli-command.html#sagemaker-hyperpod-operate-cli-command-update-cluster-software-backup
1072
+ # [2]: https://docs.aws.amazon.com/sagemaker/latest/APIReference/API_UpdateClusterSoftware.html
1073
+ # [3]: https://docs.aws.amazon.com/sagemaker/latest/dg/sagemaker-hyperpod-operate-cli-command.html#sagemaker-hyperpod-operate-cli-command-update-cluster-software
1074
+ #
1075
+ # @option params [required, String] :cluster_name
1076
+ # The name or Amazon Resource Name (ARN) of the SageMaker HyperPod
1077
+ # cluster containing the nodes to replace.
1078
+ #
1079
+ # @option params [Array<String>] :node_ids
1080
+ # A list of EC2 instance IDs to replace with new hardware. You can
1081
+ # specify between 1 and 25 instance IDs.
1082
+ #
1083
+ # Replace operations destroy all instance volumes (root and secondary).
1084
+ # Ensure you have backed up any important data before proceeding.
1085
+ #
1086
+ # <note markdown="1"> * At least one of `NodeIds` or `NodeLogicalIds` must be provided; you
1087
+ # can also provide both.
1088
+ #
1089
+ # * Each instance ID must follow the pattern `i-` followed by 17
1090
+ # hexadecimal characters (for example, `i-0123456789abcdef0`).
1091
+ #
1092
+ # * For SageMaker HyperPod clusters using the Slurm workload manager,
1093
+ # you cannot replace instances that are configured as Slurm controller
1094
+ # nodes.
1095
+ #
1096
+ # </note>
1097
+ #
1098
+ # @option params [Array<String>] :node_logical_ids
1099
+ # A list of logical node IDs to replace with new hardware. You can
1100
+ # specify between 1 and 25 logical node IDs.
1101
+ #
1102
+ # The `NodeLogicalId` is a unique identifier that persists throughout
1103
+ # the node's lifecycle and can be used to track nodes that are still
1104
+ # being provisioned and don't yet have an EC2 instance ID assigned.
1105
+ #
1106
+ # * Replace operations destroy all instance volumes (root and
1107
+ # secondary). Ensure you have backed up any important data before
1108
+ # proceeding.
1109
+ #
1110
+ # * This parameter is only supported for clusters using `Continuous` as
1111
+ # the `NodeProvisioningMode`. For clusters using the default
1112
+ # provisioning mode, use `NodeIds` instead.
1113
+ #
1114
+ # * At least one of `NodeIds` or `NodeLogicalIds` must be provided; you
1115
+ # can also provide both.
1116
+ #
1117
+ # @return [Types::BatchReplaceClusterNodesResponse] Returns a {Seahorse::Client::Response response} object which responds to the following methods:
1118
+ #
1119
+ # * {Types::BatchReplaceClusterNodesResponse#successful #successful} => Array&lt;String&gt;
1120
+ # * {Types::BatchReplaceClusterNodesResponse#failed #failed} => Array&lt;Types::BatchReplaceClusterNodesError&gt;
1121
+ # * {Types::BatchReplaceClusterNodesResponse#failed_node_logical_ids #failed_node_logical_ids} => Array&lt;Types::BatchReplaceClusterNodeLogicalIdsError&gt;
1122
+ # * {Types::BatchReplaceClusterNodesResponse#successful_node_logical_ids #successful_node_logical_ids} => Array&lt;String&gt;
1123
+ #
1124
+ # @example Request syntax with placeholder values
1125
+ #
1126
+ # resp = client.batch_replace_cluster_nodes({
1127
+ # cluster_name: "ClusterNameOrArn", # required
1128
+ # node_ids: ["ClusterNodeId"],
1129
+ # node_logical_ids: ["ClusterNodeLogicalId"],
1130
+ # })
1131
+ #
1132
+ # @example Response structure
1133
+ #
1134
+ # resp.successful #=> Array
1135
+ # resp.successful[0] #=> String
1136
+ # resp.failed #=> Array
1137
+ # resp.failed[0].node_id #=> String
1138
+ # resp.failed[0].error_code #=> String, one of "InstanceIdNotFound", "InvalidInstanceStatus", "InstanceIdInUse", "InternalServerError"
1139
+ # resp.failed[0].message #=> String
1140
+ # resp.failed_node_logical_ids #=> Array
1141
+ # resp.failed_node_logical_ids[0].node_logical_id #=> String
1142
+ # resp.failed_node_logical_ids[0].error_code #=> String, one of "InstanceIdNotFound", "InvalidInstanceStatus", "InstanceIdInUse", "InternalServerError"
1143
+ # resp.failed_node_logical_ids[0].message #=> String
1144
+ # resp.successful_node_logical_ids #=> Array
1145
+ # resp.successful_node_logical_ids[0] #=> String
1146
+ #
1147
+ # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/BatchReplaceClusterNodes AWS API Documentation
1148
+ #
1149
+ # @overload batch_replace_cluster_nodes(params = {})
1150
+ # @param [Hash] params ({})
1151
+ def batch_replace_cluster_nodes(params = {}, options = {})
1152
+ req = build_request(:batch_replace_cluster_nodes, params)
1153
+ req.send_request(options)
1154
+ end
1155
+
953
1156
  # Creates an *action*. An action is a lineage tracking entity that
954
1157
  # represents an action or activity. For example, a model deployment or
955
1158
  # an HPO job. Generally, an action involves at least one input or output
@@ -1259,7 +1462,7 @@ module Aws::SageMaker
1259
1462
  # resource_config: { # required
1260
1463
  # instance_type: "ml.m4.xlarge", # accepts ml.m4.xlarge, ml.m4.2xlarge, ml.m4.4xlarge, ml.m4.10xlarge, ml.m4.16xlarge, ml.g4dn.xlarge, ml.g4dn.2xlarge, ml.g4dn.4xlarge, ml.g4dn.8xlarge, ml.g4dn.12xlarge, ml.g4dn.16xlarge, ml.m5.large, ml.m5.xlarge, ml.m5.2xlarge, ml.m5.4xlarge, ml.m5.12xlarge, ml.m5.24xlarge, ml.c4.xlarge, ml.c4.2xlarge, ml.c4.4xlarge, ml.c4.8xlarge, ml.p2.xlarge, ml.p2.8xlarge, ml.p2.16xlarge, ml.p3.2xlarge, ml.p3.8xlarge, ml.p3.16xlarge, ml.p3dn.24xlarge, ml.p4d.24xlarge, ml.p4de.24xlarge, ml.p5.48xlarge, ml.p5e.48xlarge, ml.p5en.48xlarge, ml.c5.xlarge, ml.c5.2xlarge, ml.c5.4xlarge, ml.c5.9xlarge, ml.c5.18xlarge, ml.c5n.xlarge, ml.c5n.2xlarge, ml.c5n.4xlarge, ml.c5n.9xlarge, ml.c5n.18xlarge, ml.g5.xlarge, ml.g5.2xlarge, ml.g5.4xlarge, ml.g5.8xlarge, ml.g5.16xlarge, ml.g5.12xlarge, ml.g5.24xlarge, ml.g5.48xlarge, ml.g6.xlarge, ml.g6.2xlarge, ml.g6.4xlarge, ml.g6.8xlarge, ml.g6.16xlarge, ml.g6.12xlarge, ml.g6.24xlarge, ml.g6.48xlarge, ml.g6e.xlarge, ml.g6e.2xlarge, ml.g6e.4xlarge, ml.g6e.8xlarge, ml.g6e.16xlarge, ml.g6e.12xlarge, ml.g6e.24xlarge, ml.g6e.48xlarge, ml.trn1.2xlarge, ml.trn1.32xlarge, ml.trn1n.32xlarge, ml.trn2.48xlarge, ml.m6i.large, ml.m6i.xlarge, ml.m6i.2xlarge, ml.m6i.4xlarge, ml.m6i.8xlarge, ml.m6i.12xlarge, ml.m6i.16xlarge, ml.m6i.24xlarge, ml.m6i.32xlarge, ml.c6i.xlarge, ml.c6i.2xlarge, ml.c6i.8xlarge, ml.c6i.4xlarge, ml.c6i.12xlarge, ml.c6i.16xlarge, ml.c6i.24xlarge, ml.c6i.32xlarge, ml.r5d.large, ml.r5d.xlarge, ml.r5d.2xlarge, ml.r5d.4xlarge, ml.r5d.8xlarge, ml.r5d.12xlarge, ml.r5d.16xlarge, ml.r5d.24xlarge, ml.t3.medium, ml.t3.large, ml.t3.xlarge, ml.t3.2xlarge, ml.r5.large, ml.r5.xlarge, ml.r5.2xlarge, ml.r5.4xlarge, ml.r5.8xlarge, ml.r5.12xlarge, ml.r5.16xlarge, ml.r5.24xlarge, ml.p6-b200.48xlarge, ml.m7i.large, ml.m7i.xlarge, ml.m7i.2xlarge, ml.m7i.4xlarge, ml.m7i.8xlarge, ml.m7i.12xlarge, ml.m7i.16xlarge, ml.m7i.24xlarge, ml.m7i.48xlarge, ml.c7i.large, ml.c7i.xlarge, ml.c7i.2xlarge, ml.c7i.4xlarge, ml.c7i.8xlarge, 
ml.c7i.12xlarge, ml.c7i.16xlarge, ml.c7i.24xlarge, ml.c7i.48xlarge, ml.r7i.large, ml.r7i.xlarge, ml.r7i.2xlarge, ml.r7i.4xlarge, ml.r7i.8xlarge, ml.r7i.12xlarge, ml.r7i.16xlarge, ml.r7i.24xlarge, ml.r7i.48xlarge, ml.p6e-gb200.36xlarge, ml.p5.4xlarge
1261
1464
  # instance_count: 1,
1262
- # volume_size_in_gb: 1, # required
1465
+ # volume_size_in_gb: 1,
1263
1466
  # volume_kms_key_id: "KmsKeyId",
1264
1467
  # keep_alive_period_in_seconds: 1,
1265
1468
  # instance_groups: [
@@ -2725,6 +2928,10 @@ module Aws::SageMaker
2725
2928
  # accelerators: 1,
2726
2929
  # v_cpu: 1.0,
2727
2930
  # memory_in_gi_b: 1.0,
2931
+ # accelerator_partition: {
2932
+ # type: "mig-1g.5gb", # required, accepts mig-1g.5gb, mig-1g.10gb, mig-1g.18gb, mig-1g.20gb, mig-1g.23gb, mig-1g.35gb, mig-1g.45gb, mig-1g.47gb, mig-2g.10gb, mig-2g.20gb, mig-2g.35gb, mig-2g.45gb, mig-2g.47gb, mig-3g.20gb, mig-3g.40gb, mig-3g.71gb, mig-3g.90gb, mig-3g.93gb, mig-4g.20gb, mig-4g.40gb, mig-4g.71gb, mig-4g.90gb, mig-4g.93gb, mig-7g.40gb, mig-7g.80gb, mig-7g.141gb, mig-7g.180gb, mig-7g.186gb
2933
+ # count: 1, # required
2934
+ # },
2728
2935
  # },
2729
2936
  # ],
2730
2937
  # resource_sharing_config: {
@@ -4090,6 +4297,9 @@ module Aws::SageMaker
4090
4297
  # isolated. If they are, no inbound or outbound network calls can be
4091
4298
  # made to or from the model containers.
4092
4299
  #
4300
+ # @option params [Types::MetricsConfig] :metrics_config
4301
+ # The configuration parameters for utilization metrics.
4302
+ #
4093
4303
  # @return [Types::CreateEndpointConfigOutput] Returns a {Seahorse::Client::Response response} object which responds to the following methods:
4094
4304
  #
4095
4305
  # * {Types::CreateEndpointConfigOutput#endpoint_config_arn #endpoint_config_arn} => String
@@ -4245,6 +4455,10 @@ module Aws::SageMaker
4245
4455
  # subnets: ["SubnetId"], # required
4246
4456
  # },
4247
4457
  # enable_network_isolation: false,
4458
+ # metrics_config: {
4459
+ # enable_enhanced_metrics: false,
4460
+ # metric_publish_frequency_in_seconds: 1,
4461
+ # },
4248
4462
  # })
4249
4463
  #
4250
4464
  # @example Response structure
@@ -5190,7 +5404,7 @@ module Aws::SageMaker
5190
5404
  # resource_config: {
5191
5405
  # instance_type: "ml.m4.xlarge", # accepts ml.m4.xlarge, ml.m4.2xlarge, ml.m4.4xlarge, ml.m4.10xlarge, ml.m4.16xlarge, ml.g4dn.xlarge, ml.g4dn.2xlarge, ml.g4dn.4xlarge, ml.g4dn.8xlarge, ml.g4dn.12xlarge, ml.g4dn.16xlarge, ml.m5.large, ml.m5.xlarge, ml.m5.2xlarge, ml.m5.4xlarge, ml.m5.12xlarge, ml.m5.24xlarge, ml.c4.xlarge, ml.c4.2xlarge, ml.c4.4xlarge, ml.c4.8xlarge, ml.p2.xlarge, ml.p2.8xlarge, ml.p2.16xlarge, ml.p3.2xlarge, ml.p3.8xlarge, ml.p3.16xlarge, ml.p3dn.24xlarge, ml.p4d.24xlarge, ml.p4de.24xlarge, ml.p5.48xlarge, ml.p5e.48xlarge, ml.p5en.48xlarge, ml.c5.xlarge, ml.c5.2xlarge, ml.c5.4xlarge, ml.c5.9xlarge, ml.c5.18xlarge, ml.c5n.xlarge, ml.c5n.2xlarge, ml.c5n.4xlarge, ml.c5n.9xlarge, ml.c5n.18xlarge, ml.g5.xlarge, ml.g5.2xlarge, ml.g5.4xlarge, ml.g5.8xlarge, ml.g5.16xlarge, ml.g5.12xlarge, ml.g5.24xlarge, ml.g5.48xlarge, ml.g6.xlarge, ml.g6.2xlarge, ml.g6.4xlarge, ml.g6.8xlarge, ml.g6.16xlarge, ml.g6.12xlarge, ml.g6.24xlarge, ml.g6.48xlarge, ml.g6e.xlarge, ml.g6e.2xlarge, ml.g6e.4xlarge, ml.g6e.8xlarge, ml.g6e.16xlarge, ml.g6e.12xlarge, ml.g6e.24xlarge, ml.g6e.48xlarge, ml.trn1.2xlarge, ml.trn1.32xlarge, ml.trn1n.32xlarge, ml.trn2.48xlarge, ml.m6i.large, ml.m6i.xlarge, ml.m6i.2xlarge, ml.m6i.4xlarge, ml.m6i.8xlarge, ml.m6i.12xlarge, ml.m6i.16xlarge, ml.m6i.24xlarge, ml.m6i.32xlarge, ml.c6i.xlarge, ml.c6i.2xlarge, ml.c6i.8xlarge, ml.c6i.4xlarge, ml.c6i.12xlarge, ml.c6i.16xlarge, ml.c6i.24xlarge, ml.c6i.32xlarge, ml.r5d.large, ml.r5d.xlarge, ml.r5d.2xlarge, ml.r5d.4xlarge, ml.r5d.8xlarge, ml.r5d.12xlarge, ml.r5d.16xlarge, ml.r5d.24xlarge, ml.t3.medium, ml.t3.large, ml.t3.xlarge, ml.t3.2xlarge, ml.r5.large, ml.r5.xlarge, ml.r5.2xlarge, ml.r5.4xlarge, ml.r5.8xlarge, ml.r5.12xlarge, ml.r5.16xlarge, ml.r5.24xlarge, ml.p6-b200.48xlarge, ml.m7i.large, ml.m7i.xlarge, ml.m7i.2xlarge, ml.m7i.4xlarge, ml.m7i.8xlarge, ml.m7i.12xlarge, ml.m7i.16xlarge, ml.m7i.24xlarge, ml.m7i.48xlarge, ml.c7i.large, ml.c7i.xlarge, ml.c7i.2xlarge, ml.c7i.4xlarge, ml.c7i.8xlarge, 
ml.c7i.12xlarge, ml.c7i.16xlarge, ml.c7i.24xlarge, ml.c7i.48xlarge, ml.r7i.large, ml.r7i.xlarge, ml.r7i.2xlarge, ml.r7i.4xlarge, ml.r7i.8xlarge, ml.r7i.12xlarge, ml.r7i.16xlarge, ml.r7i.24xlarge, ml.r7i.48xlarge, ml.p6e-gb200.36xlarge, ml.p5.4xlarge
5192
5406
  # instance_count: 1,
5193
- # volume_size_in_gb: 1, # required
5407
+ # volume_size_in_gb: 1,
5194
5408
  # volume_kms_key_id: "KmsKeyId",
5195
5409
  # keep_alive_period_in_seconds: 1,
5196
5410
  # instance_groups: [
@@ -5341,7 +5555,7 @@ module Aws::SageMaker
5341
5555
  # resource_config: {
5342
5556
  # instance_type: "ml.m4.xlarge", # accepts ml.m4.xlarge, ml.m4.2xlarge, ml.m4.4xlarge, ml.m4.10xlarge, ml.m4.16xlarge, ml.g4dn.xlarge, ml.g4dn.2xlarge, ml.g4dn.4xlarge, ml.g4dn.8xlarge, ml.g4dn.12xlarge, ml.g4dn.16xlarge, ml.m5.large, ml.m5.xlarge, ml.m5.2xlarge, ml.m5.4xlarge, ml.m5.12xlarge, ml.m5.24xlarge, ml.c4.xlarge, ml.c4.2xlarge, ml.c4.4xlarge, ml.c4.8xlarge, ml.p2.xlarge, ml.p2.8xlarge, ml.p2.16xlarge, ml.p3.2xlarge, ml.p3.8xlarge, ml.p3.16xlarge, ml.p3dn.24xlarge, ml.p4d.24xlarge, ml.p4de.24xlarge, ml.p5.48xlarge, ml.p5e.48xlarge, ml.p5en.48xlarge, ml.c5.xlarge, ml.c5.2xlarge, ml.c5.4xlarge, ml.c5.9xlarge, ml.c5.18xlarge, ml.c5n.xlarge, ml.c5n.2xlarge, ml.c5n.4xlarge, ml.c5n.9xlarge, ml.c5n.18xlarge, ml.g5.xlarge, ml.g5.2xlarge, ml.g5.4xlarge, ml.g5.8xlarge, ml.g5.16xlarge, ml.g5.12xlarge, ml.g5.24xlarge, ml.g5.48xlarge, ml.g6.xlarge, ml.g6.2xlarge, ml.g6.4xlarge, ml.g6.8xlarge, ml.g6.16xlarge, ml.g6.12xlarge, ml.g6.24xlarge, ml.g6.48xlarge, ml.g6e.xlarge, ml.g6e.2xlarge, ml.g6e.4xlarge, ml.g6e.8xlarge, ml.g6e.16xlarge, ml.g6e.12xlarge, ml.g6e.24xlarge, ml.g6e.48xlarge, ml.trn1.2xlarge, ml.trn1.32xlarge, ml.trn1n.32xlarge, ml.trn2.48xlarge, ml.m6i.large, ml.m6i.xlarge, ml.m6i.2xlarge, ml.m6i.4xlarge, ml.m6i.8xlarge, ml.m6i.12xlarge, ml.m6i.16xlarge, ml.m6i.24xlarge, ml.m6i.32xlarge, ml.c6i.xlarge, ml.c6i.2xlarge, ml.c6i.8xlarge, ml.c6i.4xlarge, ml.c6i.12xlarge, ml.c6i.16xlarge, ml.c6i.24xlarge, ml.c6i.32xlarge, ml.r5d.large, ml.r5d.xlarge, ml.r5d.2xlarge, ml.r5d.4xlarge, ml.r5d.8xlarge, ml.r5d.12xlarge, ml.r5d.16xlarge, ml.r5d.24xlarge, ml.t3.medium, ml.t3.large, ml.t3.xlarge, ml.t3.2xlarge, ml.r5.large, ml.r5.xlarge, ml.r5.2xlarge, ml.r5.4xlarge, ml.r5.8xlarge, ml.r5.12xlarge, ml.r5.16xlarge, ml.r5.24xlarge, ml.p6-b200.48xlarge, ml.m7i.large, ml.m7i.xlarge, ml.m7i.2xlarge, ml.m7i.4xlarge, ml.m7i.8xlarge, ml.m7i.12xlarge, ml.m7i.16xlarge, ml.m7i.24xlarge, ml.m7i.48xlarge, ml.c7i.large, ml.c7i.xlarge, ml.c7i.2xlarge, ml.c7i.4xlarge, ml.c7i.8xlarge, 
ml.c7i.12xlarge, ml.c7i.16xlarge, ml.c7i.24xlarge, ml.c7i.48xlarge, ml.r7i.large, ml.r7i.xlarge, ml.r7i.2xlarge, ml.r7i.4xlarge, ml.r7i.8xlarge, ml.r7i.12xlarge, ml.r7i.16xlarge, ml.r7i.24xlarge, ml.r7i.48xlarge, ml.p6e-gb200.36xlarge, ml.p5.4xlarge
5343
5557
  # instance_count: 1,
5344
- # volume_size_in_gb: 1, # required
5558
+ # volume_size_in_gb: 1,
5345
5559
  # volume_kms_key_id: "KmsKeyId",
5346
5560
  # keep_alive_period_in_seconds: 1,
5347
5561
  # instance_groups: [
@@ -9795,7 +10009,7 @@ module Aws::SageMaker
9795
10009
  # resource_config: {
9796
10010
  # instance_type: "ml.m4.xlarge", # accepts ml.m4.xlarge, ml.m4.2xlarge, ml.m4.4xlarge, ml.m4.10xlarge, ml.m4.16xlarge, ml.g4dn.xlarge, ml.g4dn.2xlarge, ml.g4dn.4xlarge, ml.g4dn.8xlarge, ml.g4dn.12xlarge, ml.g4dn.16xlarge, ml.m5.large, ml.m5.xlarge, ml.m5.2xlarge, ml.m5.4xlarge, ml.m5.12xlarge, ml.m5.24xlarge, ml.c4.xlarge, ml.c4.2xlarge, ml.c4.4xlarge, ml.c4.8xlarge, ml.p2.xlarge, ml.p2.8xlarge, ml.p2.16xlarge, ml.p3.2xlarge, ml.p3.8xlarge, ml.p3.16xlarge, ml.p3dn.24xlarge, ml.p4d.24xlarge, ml.p4de.24xlarge, ml.p5.48xlarge, ml.p5e.48xlarge, ml.p5en.48xlarge, ml.c5.xlarge, ml.c5.2xlarge, ml.c5.4xlarge, ml.c5.9xlarge, ml.c5.18xlarge, ml.c5n.xlarge, ml.c5n.2xlarge, ml.c5n.4xlarge, ml.c5n.9xlarge, ml.c5n.18xlarge, ml.g5.xlarge, ml.g5.2xlarge, ml.g5.4xlarge, ml.g5.8xlarge, ml.g5.16xlarge, ml.g5.12xlarge, ml.g5.24xlarge, ml.g5.48xlarge, ml.g6.xlarge, ml.g6.2xlarge, ml.g6.4xlarge, ml.g6.8xlarge, ml.g6.16xlarge, ml.g6.12xlarge, ml.g6.24xlarge, ml.g6.48xlarge, ml.g6e.xlarge, ml.g6e.2xlarge, ml.g6e.4xlarge, ml.g6e.8xlarge, ml.g6e.16xlarge, ml.g6e.12xlarge, ml.g6e.24xlarge, ml.g6e.48xlarge, ml.trn1.2xlarge, ml.trn1.32xlarge, ml.trn1n.32xlarge, ml.trn2.48xlarge, ml.m6i.large, ml.m6i.xlarge, ml.m6i.2xlarge, ml.m6i.4xlarge, ml.m6i.8xlarge, ml.m6i.12xlarge, ml.m6i.16xlarge, ml.m6i.24xlarge, ml.m6i.32xlarge, ml.c6i.xlarge, ml.c6i.2xlarge, ml.c6i.8xlarge, ml.c6i.4xlarge, ml.c6i.12xlarge, ml.c6i.16xlarge, ml.c6i.24xlarge, ml.c6i.32xlarge, ml.r5d.large, ml.r5d.xlarge, ml.r5d.2xlarge, ml.r5d.4xlarge, ml.r5d.8xlarge, ml.r5d.12xlarge, ml.r5d.16xlarge, ml.r5d.24xlarge, ml.t3.medium, ml.t3.large, ml.t3.xlarge, ml.t3.2xlarge, ml.r5.large, ml.r5.xlarge, ml.r5.2xlarge, ml.r5.4xlarge, ml.r5.8xlarge, ml.r5.12xlarge, ml.r5.16xlarge, ml.r5.24xlarge, ml.p6-b200.48xlarge, ml.m7i.large, ml.m7i.xlarge, ml.m7i.2xlarge, ml.m7i.4xlarge, ml.m7i.8xlarge, ml.m7i.12xlarge, ml.m7i.16xlarge, ml.m7i.24xlarge, ml.m7i.48xlarge, ml.c7i.large, ml.c7i.xlarge, ml.c7i.2xlarge, ml.c7i.4xlarge, ml.c7i.8xlarge, 
ml.c7i.12xlarge, ml.c7i.16xlarge, ml.c7i.24xlarge, ml.c7i.48xlarge, ml.r7i.large, ml.r7i.xlarge, ml.r7i.2xlarge, ml.r7i.4xlarge, ml.r7i.8xlarge, ml.r7i.12xlarge, ml.r7i.16xlarge, ml.r7i.24xlarge, ml.r7i.48xlarge, ml.p6e-gb200.36xlarge, ml.p5.4xlarge
9797
10011
  # instance_count: 1,
9798
- # volume_size_in_gb: 1, # required
10012
+ # volume_size_in_gb: 1,
9799
10013
  # volume_kms_key_id: "KmsKeyId",
9800
10014
  # keep_alive_period_in_seconds: 1,
9801
10015
  # instance_groups: [
@@ -13905,6 +14119,8 @@ module Aws::SageMaker
13905
14119
  # resp.compute_quota_config.compute_quota_resources[0].accelerators #=> Integer
13906
14120
  # resp.compute_quota_config.compute_quota_resources[0].v_cpu #=> Float
13907
14121
  # resp.compute_quota_config.compute_quota_resources[0].memory_in_gi_b #=> Float
14122
+ # resp.compute_quota_config.compute_quota_resources[0].accelerator_partition.type #=> String, one of "mig-1g.5gb", "mig-1g.10gb", "mig-1g.18gb", "mig-1g.20gb", "mig-1g.23gb", "mig-1g.35gb", "mig-1g.45gb", "mig-1g.47gb", "mig-2g.10gb", "mig-2g.20gb", "mig-2g.35gb", "mig-2g.45gb", "mig-2g.47gb", "mig-3g.20gb", "mig-3g.40gb", "mig-3g.71gb", "mig-3g.90gb", "mig-3g.93gb", "mig-4g.20gb", "mig-4g.40gb", "mig-4g.71gb", "mig-4g.90gb", "mig-4g.93gb", "mig-7g.40gb", "mig-7g.80gb", "mig-7g.141gb", "mig-7g.180gb", "mig-7g.186gb"
14123
+ # resp.compute_quota_config.compute_quota_resources[0].accelerator_partition.count #=> Integer
13908
14124
  # resp.compute_quota_config.resource_sharing_config.strategy #=> String, one of "Lend", "DontLend", "LendAndBorrow"
13909
14125
  # resp.compute_quota_config.resource_sharing_config.borrow_limit #=> Integer
13910
14126
  # resp.compute_quota_config.preempt_team_tasks #=> String, one of "Never", "LowerPriority"
@@ -14621,6 +14837,7 @@ module Aws::SageMaker
14621
14837
  # * {Types::DescribeEndpointOutput#pending_deployment_summary #pending_deployment_summary} => Types::PendingDeploymentSummary
14622
14838
  # * {Types::DescribeEndpointOutput#explainer_config #explainer_config} => Types::ExplainerConfig
14623
14839
  # * {Types::DescribeEndpointOutput#shadow_production_variants #shadow_production_variants} => Array&lt;Types::ProductionVariantSummary&gt;
14840
+ # * {Types::DescribeEndpointOutput#metrics_config #metrics_config} => Types::MetricsConfig
14624
14841
  #
14625
14842
  # @example Request syntax with placeholder values
14626
14843
  #
@@ -14811,6 +15028,8 @@ module Aws::SageMaker
14811
15028
  # resp.shadow_production_variants[0].capacity_reservation_config.ec2_capacity_reservations[0].total_instance_count #=> Integer
14812
15029
  # resp.shadow_production_variants[0].capacity_reservation_config.ec2_capacity_reservations[0].available_instance_count #=> Integer
14813
15030
  # resp.shadow_production_variants[0].capacity_reservation_config.ec2_capacity_reservations[0].used_by_current_endpoint #=> Integer
15031
+ # resp.metrics_config.enable_enhanced_metrics #=> Boolean
15032
+ # resp.metrics_config.metric_publish_frequency_in_seconds #=> Integer
14814
15033
  #
14815
15034
  #
14816
15035
  # The following waiters are defined for this operation (see {Client#wait_until} for detailed usage):
@@ -14847,6 +15066,7 @@ module Aws::SageMaker
14847
15066
  # * {Types::DescribeEndpointConfigOutput#execution_role_arn #execution_role_arn} => String
14848
15067
  # * {Types::DescribeEndpointConfigOutput#vpc_config #vpc_config} => Types::VpcConfig
14849
15068
  # * {Types::DescribeEndpointConfigOutput#enable_network_isolation #enable_network_isolation} => Boolean
15069
+ # * {Types::DescribeEndpointConfigOutput#metrics_config #metrics_config} => Types::MetricsConfig
14850
15070
  #
14851
15071
  # @example Request syntax with placeholder values
14852
15072
  #
@@ -14953,6 +15173,8 @@ module Aws::SageMaker
14953
15173
  # resp.vpc_config.subnets #=> Array
14954
15174
  # resp.vpc_config.subnets[0] #=> String
14955
15175
  # resp.enable_network_isolation #=> Boolean
15176
+ # resp.metrics_config.enable_enhanced_metrics #=> Boolean
15177
+ # resp.metrics_config.metric_publish_frequency_in_seconds #=> Integer
14956
15178
  #
14957
15179
  # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/DescribeEndpointConfig AWS API Documentation
14958
15180
  #
@@ -18398,7 +18620,7 @@ module Aws::SageMaker
18398
18620
  # resp.available_spare_instance_count #=> Integer
18399
18621
  # resp.total_ultra_server_count #=> Integer
18400
18622
  # resp.target_resources #=> Array
18401
- # resp.target_resources[0] #=> String, one of "training-job", "hyperpod-cluster"
18623
+ # resp.target_resources[0] #=> String, one of "training-job", "hyperpod-cluster", "endpoint"
18402
18624
  # resp.reserved_capacity_summaries #=> Array
18403
18625
  # resp.reserved_capacity_summaries[0].reserved_capacity_arn #=> String
18404
18626
  # resp.reserved_capacity_summaries[0].reserved_capacity_type #=> String, one of "UltraServer", "Instance"
@@ -20337,6 +20559,7 @@ module Aws::SageMaker
20337
20559
  # resp.cluster_node_summaries[0].instance_status.status #=> String, one of "Running", "Failure", "Pending", "ShuttingDown", "SystemUpdating", "DeepHealthCheckInProgress", "NotFound"
20338
20560
  # resp.cluster_node_summaries[0].instance_status.message #=> String
20339
20561
  # resp.cluster_node_summaries[0].ultra_server_info.id #=> String
20562
+ # resp.cluster_node_summaries[0].private_dns_hostname #=> String
20340
20563
  #
20341
20564
  # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/ListClusterNodes AWS API Documentation
20342
20565
  #
@@ -20800,6 +21023,8 @@ module Aws::SageMaker
20800
21023
  # resp.compute_quota_summaries[0].compute_quota_config.compute_quota_resources[0].accelerators #=> Integer
20801
21024
  # resp.compute_quota_summaries[0].compute_quota_config.compute_quota_resources[0].v_cpu #=> Float
20802
21025
  # resp.compute_quota_summaries[0].compute_quota_config.compute_quota_resources[0].memory_in_gi_b #=> Float
21026
+ # resp.compute_quota_summaries[0].compute_quota_config.compute_quota_resources[0].accelerator_partition.type #=> String, one of "mig-1g.5gb", "mig-1g.10gb", "mig-1g.18gb", "mig-1g.20gb", "mig-1g.23gb", "mig-1g.35gb", "mig-1g.45gb", "mig-1g.47gb", "mig-2g.10gb", "mig-2g.20gb", "mig-2g.35gb", "mig-2g.45gb", "mig-2g.47gb", "mig-3g.20gb", "mig-3g.40gb", "mig-3g.71gb", "mig-3g.90gb", "mig-3g.93gb", "mig-4g.20gb", "mig-4g.40gb", "mig-4g.71gb", "mig-4g.90gb", "mig-4g.93gb", "mig-7g.40gb", "mig-7g.80gb", "mig-7g.141gb", "mig-7g.180gb", "mig-7g.186gb"
21027
+ # resp.compute_quota_summaries[0].compute_quota_config.compute_quota_resources[0].accelerator_partition.count #=> Integer
20803
21028
  # resp.compute_quota_summaries[0].compute_quota_config.resource_sharing_config.strategy #=> String, one of "Lend", "DontLend", "LendAndBorrow"
20804
21029
  # resp.compute_quota_summaries[0].compute_quota_config.resource_sharing_config.borrow_limit #=> Integer
20805
21030
  # resp.compute_quota_summaries[0].compute_quota_config.preempt_team_tasks #=> String, one of "Never", "LowerPriority"
@@ -25447,7 +25672,7 @@ module Aws::SageMaker
25447
25672
  # resp.training_plan_summaries[0].in_use_instance_count #=> Integer
25448
25673
  # resp.training_plan_summaries[0].total_ultra_server_count #=> Integer
25449
25674
  # resp.training_plan_summaries[0].target_resources #=> Array
25450
- # resp.training_plan_summaries[0].target_resources[0] #=> String, one of "training-job", "hyperpod-cluster"
25675
+ # resp.training_plan_summaries[0].target_resources[0] #=> String, one of "training-job", "hyperpod-cluster", "endpoint"
25451
25676
  # resp.training_plan_summaries[0].reserved_capacity_summaries #=> Array
25452
25677
  # resp.training_plan_summaries[0].reserved_capacity_summaries[0].reserved_capacity_arn #=> String
25453
25678
  # resp.training_plan_summaries[0].reserved_capacity_summaries[0].reserved_capacity_type #=> String, one of "UltraServer", "Instance"
@@ -26468,7 +26693,7 @@ module Aws::SageMaker
26468
26693
  #
26469
26694
  # @option params [required, Array<String>] :target_resources
26470
26695
  # The target resources (e.g., SageMaker Training Jobs, SageMaker
26471
- # HyperPod) to search for in the offerings.
26696
+ # HyperPod, SageMaker Endpoints) to search for in the offerings.
26472
26697
  #
26473
26698
  # Training plans are specific to their target resource.
26474
26699
  #
@@ -26478,6 +26703,10 @@ module Aws::SageMaker
26478
26703
  # * A training plan for HyperPod clusters can be used exclusively to
26479
26704
  # provide compute resources to a cluster's instance group.
26480
26705
  #
26706
+ # * A training plan for SageMaker endpoints can be used exclusively to
26707
+ # provide compute resources to SageMaker endpoints for model
26708
+ # deployment.
26709
+ #
26481
26710
  # @return [Types::SearchTrainingPlanOfferingsResponse] Returns a {Seahorse::Client::Response response} object which responds to the following methods:
26482
26711
  #
26483
26712
  # * {Types::SearchTrainingPlanOfferingsResponse#training_plan_offerings #training_plan_offerings} => Array&lt;Types::TrainingPlanOffering&gt;
@@ -26492,7 +26721,7 @@ module Aws::SageMaker
26492
26721
  # start_time_after: Time.now,
26493
26722
  # end_time_before: Time.now,
26494
26723
  # duration_hours: 1, # required
26495
- # target_resources: ["training-job"], # required, accepts training-job, hyperpod-cluster
26724
+ # target_resources: ["training-job"], # required, accepts training-job, hyperpod-cluster, endpoint
26496
26725
  # })
26497
26726
  #
26498
26727
  # @example Response structure
@@ -26500,7 +26729,7 @@ module Aws::SageMaker
26500
26729
  # resp.training_plan_offerings #=> Array
26501
26730
  # resp.training_plan_offerings[0].training_plan_offering_id #=> String
26502
26731
  # resp.training_plan_offerings[0].target_resources #=> Array
26503
- # resp.training_plan_offerings[0].target_resources[0] #=> String, one of "training-job", "hyperpod-cluster"
26732
+ # resp.training_plan_offerings[0].target_resources[0] #=> String, one of "training-job", "hyperpod-cluster", "endpoint"
26504
26733
  # resp.training_plan_offerings[0].requested_start_time_after #=> Time
26505
26734
  # resp.training_plan_offerings[0].requested_end_time_before #=> Time
26506
26735
  # resp.training_plan_offerings[0].duration_hours #=> Integer
@@ -27938,6 +28167,10 @@ module Aws::SageMaker
27938
28167
  # accelerators: 1,
27939
28168
  # v_cpu: 1.0,
27940
28169
  # memory_in_gi_b: 1.0,
28170
+ # accelerator_partition: {
28171
+ # type: "mig-1g.5gb", # required, accepts mig-1g.5gb, mig-1g.10gb, mig-1g.18gb, mig-1g.20gb, mig-1g.23gb, mig-1g.35gb, mig-1g.45gb, mig-1g.47gb, mig-2g.10gb, mig-2g.20gb, mig-2g.35gb, mig-2g.45gb, mig-2g.47gb, mig-3g.20gb, mig-3g.40gb, mig-3g.71gb, mig-3g.90gb, mig-3g.93gb, mig-4g.20gb, mig-4g.40gb, mig-4g.71gb, mig-4g.90gb, mig-4g.93gb, mig-7g.40gb, mig-7g.80gb, mig-7g.141gb, mig-7g.180gb, mig-7g.186gb
28172
+ # count: 1, # required
28173
+ # },
27941
28174
  # },
27942
28175
  # ],
27943
28176
  # resource_sharing_config: {
@@ -31346,7 +31579,7 @@ module Aws::SageMaker
31346
31579
  tracer: tracer
31347
31580
  )
31348
31581
  context[:gem_name] = 'aws-sdk-sagemaker'
31349
- context[:gem_version] = '1.338.0'
31582
+ context[:gem_version] = '1.340.0'
31350
31583
  Seahorse::Client::Request.new(handlers, context)
31351
31584
  end
31352
31585