aws-sdk-sagemaker 1.339.0 → 1.341.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/CHANGELOG.md +10 -0
- data/VERSION +1 -1
- data/lib/aws-sdk-sagemaker/client.rb +321 -9
- data/lib/aws-sdk-sagemaker/client_api.rb +192 -0
- data/lib/aws-sdk-sagemaker/types.rb +717 -11
- data/lib/aws-sdk-sagemaker.rb +1 -1
- data/sig/client.rbs +96 -9
- data/sig/types.rbs +149 -7
- metadata +3 -3
checksums.yaml
CHANGED
|
@@ -1,7 +1,7 @@
|
|
|
1
1
|
---
|
|
2
2
|
SHA256:
|
|
3
|
-
metadata.gz:
|
|
4
|
-
data.tar.gz:
|
|
3
|
+
metadata.gz: 26865b73cdcf61e9575a07d832b43aa93e24edce14672d0fec79742958394014
|
|
4
|
+
data.tar.gz: 0d0613bf3801d91d0d176695ccf4422a7e531ec6054f80a735069034eb79a2a1
|
|
5
5
|
SHA512:
|
|
6
|
-
metadata.gz:
|
|
7
|
-
data.tar.gz:
|
|
6
|
+
metadata.gz: 06ee60e1d183dab830facd89ff879c1df147cc673f511e681cf0ecc2f45211585f034dbeb9893534cf8d1f4486554e59a8375d1acf5b8cd4398f8944245ad875
|
|
7
|
+
data.tar.gz: 913fb03b0fea5374c8eb21cfc8d4668e1705b493f94b9fb1ab30646ef2bc0bce18bc9deddbf5c0a20034dc466cb34b532de52eaeda6e822999d525659eda3585
|
data/CHANGELOG.md
CHANGED
|
@@ -1,6 +1,16 @@
|
|
|
1
1
|
Unreleased Changes
|
|
2
2
|
------------------
|
|
3
3
|
|
|
4
|
+
1.341.0 (2025-11-21)
|
|
5
|
+
------------------
|
|
6
|
+
|
|
7
|
+
* Feature - Enhanced SageMaker HyperPod instance groups with support for MinInstanceCount, CapacityRequirements (Spot/On-Demand), and KubernetesConfig (labels and taints). Also added speculative decoding and MaxInstanceCount for model optimization jobs.
|
|
8
|
+
|
|
9
|
+
1.340.0 (2025-11-20)
|
|
10
|
+
------------------
|
|
11
|
+
|
|
12
|
+
* Feature - Added training plan support for inference endpoints. Added HyperPod task governance with accelerator partition-based quota allocation. Added BatchRebootClusterNodes and BatchReplaceClusterNodes APIs. Updated ListClusterNodes to include privateDnsHostName.
|
|
13
|
+
|
|
4
14
|
1.339.0 (2025-11-19)
|
|
5
15
|
------------------
|
|
6
16
|
|
data/VERSION
CHANGED
|
@@ -1 +1 @@
|
|
|
1
|
-
1.339.0
|
|
1
|
+
1.341.0
|
data/lib/aws-sdk-sagemaker/client.rb
CHANGED
|
@@ -950,6 +950,209 @@ module Aws::SageMaker
|
|
|
950
950
|
req.send_request(options)
|
|
951
951
|
end
|
|
952
952
|
|
|
953
|
+
# Reboots specific nodes within a SageMaker HyperPod cluster using a
|
|
954
|
+
# soft recovery mechanism. `BatchRebootClusterNodes` performs a graceful
|
|
955
|
+
# reboot of the specified nodes by calling the Amazon Elastic Compute
|
|
956
|
+
# Cloud `RebootInstances` API, which attempts to cleanly shut down the
|
|
957
|
+
# operating system before restarting the instance.
|
|
958
|
+
#
|
|
959
|
+
# This operation is useful for recovering from transient issues or
|
|
960
|
+
# applying certain configuration changes that require a restart.
|
|
961
|
+
#
|
|
962
|
+
# <note markdown="1"> * Rebooting a node may cause temporary service interruption for
|
|
963
|
+
# workloads running on that node. Ensure your workloads can handle
|
|
964
|
+
# node restarts or use appropriate scheduling to minimize impact.
|
|
965
|
+
#
|
|
966
|
+
# * You can reboot up to 25 nodes in a single request.
|
|
967
|
+
#
|
|
968
|
+
# * For SageMaker HyperPod clusters using the Slurm workload manager,
|
|
969
|
+
# ensure rebooting nodes will not disrupt critical cluster operations.
|
|
970
|
+
#
|
|
971
|
+
# </note>
|
|
972
|
+
#
|
|
973
|
+
# @option params [required, String] :cluster_name
|
|
974
|
+
# The name or Amazon Resource Name (ARN) of the SageMaker HyperPod
|
|
975
|
+
# cluster containing the nodes to reboot.
|
|
976
|
+
#
|
|
977
|
+
# @option params [Array<String>] :node_ids
|
|
978
|
+
# A list of EC2 instance IDs to reboot using soft recovery. You can
|
|
979
|
+
# specify between 1 and 25 instance IDs.
|
|
980
|
+
#
|
|
981
|
+
# <note markdown="1"> * Either `NodeIds` or `NodeLogicalIds` must be provided (or both), but
|
|
982
|
+
# at least one is required.
|
|
983
|
+
#
|
|
984
|
+
# * Each instance ID must follow the pattern `i-` followed by 17
|
|
985
|
+
# hexadecimal characters (for example, `i-0123456789abcdef0`).
|
|
986
|
+
#
|
|
987
|
+
# </note>
|
|
988
|
+
#
|
|
989
|
+
# @option params [Array<String>] :node_logical_ids
|
|
990
|
+
# A list of logical node IDs to reboot using soft recovery. You can
|
|
991
|
+
# specify between 1 and 25 logical node IDs.
|
|
992
|
+
#
|
|
993
|
+
# The `NodeLogicalId` is a unique identifier that persists throughout
|
|
994
|
+
# the node's lifecycle and can be used to track nodes that are still
|
|
995
|
+
# being provisioned and don't yet have an EC2 instance ID assigned.
|
|
996
|
+
#
|
|
997
|
+
# * This parameter is only supported for clusters using `Continuous` as
|
|
998
|
+
# the `NodeProvisioningMode`. For clusters using the default
|
|
999
|
+
# provisioning mode, use `NodeIds` instead.
|
|
1000
|
+
#
|
|
1001
|
+
# * Either `NodeIds` or `NodeLogicalIds` must be provided (or both), but
|
|
1002
|
+
# at least one is required.
|
|
1003
|
+
#
|
|
1004
|
+
# @return [Types::BatchRebootClusterNodesResponse] Returns a {Seahorse::Client::Response response} object which responds to the following methods:
|
|
1005
|
+
#
|
|
1006
|
+
# * {Types::BatchRebootClusterNodesResponse#successful #successful} => Array<String>
|
|
1007
|
+
# * {Types::BatchRebootClusterNodesResponse#failed #failed} => Array<Types::BatchRebootClusterNodesError>
|
|
1008
|
+
# * {Types::BatchRebootClusterNodesResponse#failed_node_logical_ids #failed_node_logical_ids} => Array<Types::BatchRebootClusterNodeLogicalIdsError>
|
|
1009
|
+
# * {Types::BatchRebootClusterNodesResponse#successful_node_logical_ids #successful_node_logical_ids} => Array<String>
|
|
1010
|
+
#
|
|
1011
|
+
# @example Request syntax with placeholder values
|
|
1012
|
+
#
|
|
1013
|
+
# resp = client.batch_reboot_cluster_nodes({
|
|
1014
|
+
# cluster_name: "ClusterNameOrArn", # required
|
|
1015
|
+
# node_ids: ["ClusterNodeId"],
|
|
1016
|
+
# node_logical_ids: ["ClusterNodeLogicalId"],
|
|
1017
|
+
# })
|
|
1018
|
+
#
|
|
1019
|
+
# @example Response structure
|
|
1020
|
+
#
|
|
1021
|
+
# resp.successful #=> Array
|
|
1022
|
+
# resp.successful[0] #=> String
|
|
1023
|
+
# resp.failed #=> Array
|
|
1024
|
+
# resp.failed[0].node_id #=> String
|
|
1025
|
+
# resp.failed[0].error_code #=> String, one of "InstanceIdNotFound", "InvalidInstanceStatus", "InstanceIdInUse", "InternalServerError"
|
|
1026
|
+
# resp.failed[0].message #=> String
|
|
1027
|
+
# resp.failed_node_logical_ids #=> Array
|
|
1028
|
+
# resp.failed_node_logical_ids[0].node_logical_id #=> String
|
|
1029
|
+
# resp.failed_node_logical_ids[0].error_code #=> String, one of "InstanceIdNotFound", "InvalidInstanceStatus", "InstanceIdInUse", "InternalServerError"
|
|
1030
|
+
# resp.failed_node_logical_ids[0].message #=> String
|
|
1031
|
+
# resp.successful_node_logical_ids #=> Array
|
|
1032
|
+
# resp.successful_node_logical_ids[0] #=> String
|
|
1033
|
+
#
|
|
1034
|
+
# @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/BatchRebootClusterNodes AWS API Documentation
|
|
1035
|
+
#
|
|
1036
|
+
# @overload batch_reboot_cluster_nodes(params = {})
|
|
1037
|
+
# @param [Hash] params ({})
|
|
1038
|
+
def batch_reboot_cluster_nodes(params = {}, options = {})
|
|
1039
|
+
req = build_request(:batch_reboot_cluster_nodes, params)
|
|
1040
|
+
req.send_request(options)
|
|
1041
|
+
end
|
|
1042
|
+
|
|
1043
|
+
# Replaces specific nodes within a SageMaker HyperPod cluster with new
|
|
1044
|
+
# hardware. `BatchReplaceClusterNodes` terminates the specified
|
|
1045
|
+
# instances and provisions new replacement instances with the same
|
|
1046
|
+
# configuration but fresh hardware. The Amazon Machine Image (AMI) and
|
|
1047
|
+
# instance configuration remain the same.
|
|
1048
|
+
#
|
|
1049
|
+
# This operation is useful for recovering from hardware failures or
|
|
1050
|
+
# persistent issues that cannot be resolved through a reboot.
|
|
1051
|
+
#
|
|
1052
|
+
# * **Data Loss Warning:** Replacing nodes destroys all instance
|
|
1053
|
+
# volumes, including both root and secondary volumes. All data stored
|
|
1054
|
+
# on these volumes will be permanently lost and cannot be recovered.
|
|
1055
|
+
#
|
|
1056
|
+
# * To safeguard your work, back up your data to Amazon S3 or an FSx for
|
|
1057
|
+
# Lustre file system before invoking the API on a worker node group.
|
|
1058
|
+
# This will help prevent any potential data loss from the instance
|
|
1059
|
+
# root volume. For more information about backup, see [Use the backup
|
|
1060
|
+
# script provided by SageMaker HyperPod][1].
|
|
1061
|
+
#
|
|
1062
|
+
# * If you want to invoke this API on an existing cluster, you'll first
|
|
1063
|
+
# need to patch the cluster by running the [UpdateClusterSoftware
|
|
1064
|
+
# API][2]. For more information about patching a cluster, see [Update
|
|
1065
|
+
# the SageMaker HyperPod platform software of a cluster][3].
|
|
1066
|
+
#
|
|
1067
|
+
# * You can replace up to 25 nodes in a single request.
|
|
1068
|
+
#
|
|
1069
|
+
#
|
|
1070
|
+
#
|
|
1071
|
+
# [1]: https://docs.aws.amazon.com/sagemaker/latest/dg/sagemaker-hyperpod-operate-cli-command.html#sagemaker-hyperpod-operate-cli-command-update-cluster-software-backup
|
|
1072
|
+
# [2]: https://docs.aws.amazon.com/sagemaker/latest/APIReference/API_UpdateClusterSoftware.html
|
|
1073
|
+
# [3]: https://docs.aws.amazon.com/sagemaker/latest/dg/sagemaker-hyperpod-operate-cli-command.html#sagemaker-hyperpod-operate-cli-command-update-cluster-software
|
|
1074
|
+
#
|
|
1075
|
+
# @option params [required, String] :cluster_name
|
|
1076
|
+
# The name or Amazon Resource Name (ARN) of the SageMaker HyperPod
|
|
1077
|
+
# cluster containing the nodes to replace.
|
|
1078
|
+
#
|
|
1079
|
+
# @option params [Array<String>] :node_ids
|
|
1080
|
+
# A list of EC2 instance IDs to replace with new hardware. You can
|
|
1081
|
+
# specify between 1 and 25 instance IDs.
|
|
1082
|
+
#
|
|
1083
|
+
# Replace operations destroy all instance volumes (root and secondary).
|
|
1084
|
+
# Ensure you have backed up any important data before proceeding.
|
|
1085
|
+
#
|
|
1086
|
+
# <note markdown="1"> * Either `NodeIds` or `NodeLogicalIds` must be provided (or both), but
|
|
1087
|
+
# at least one is required.
|
|
1088
|
+
#
|
|
1089
|
+
# * Each instance ID must follow the pattern `i-` followed by 17
|
|
1090
|
+
# hexadecimal characters (for example, `i-0123456789abcdef0`).
|
|
1091
|
+
#
|
|
1092
|
+
# * For SageMaker HyperPod clusters using the Slurm workload manager,
|
|
1093
|
+
# you cannot replace instances that are configured as Slurm controller
|
|
1094
|
+
# nodes.
|
|
1095
|
+
#
|
|
1096
|
+
# </note>
|
|
1097
|
+
#
|
|
1098
|
+
# @option params [Array<String>] :node_logical_ids
|
|
1099
|
+
# A list of logical node IDs to replace with new hardware. You can
|
|
1100
|
+
# specify between 1 and 25 logical node IDs.
|
|
1101
|
+
#
|
|
1102
|
+
# The `NodeLogicalId` is a unique identifier that persists throughout
|
|
1103
|
+
# the node's lifecycle and can be used to track nodes that are still
|
|
1104
|
+
# being provisioned and don't yet have an EC2 instance ID assigned.
|
|
1105
|
+
#
|
|
1106
|
+
# * Replace operations destroy all instance volumes (root and
|
|
1107
|
+
# secondary). Ensure you have backed up any important data before
|
|
1108
|
+
# proceeding.
|
|
1109
|
+
#
|
|
1110
|
+
# * This parameter is only supported for clusters using `Continuous` as
|
|
1111
|
+
# the `NodeProvisioningMode`. For clusters using the default
|
|
1112
|
+
# provisioning mode, use `NodeIds` instead.
|
|
1113
|
+
#
|
|
1114
|
+
# * Either `NodeIds` or `NodeLogicalIds` must be provided (or both), but
|
|
1115
|
+
# at least one is required.
|
|
1116
|
+
#
|
|
1117
|
+
# @return [Types::BatchReplaceClusterNodesResponse] Returns a {Seahorse::Client::Response response} object which responds to the following methods:
|
|
1118
|
+
#
|
|
1119
|
+
# * {Types::BatchReplaceClusterNodesResponse#successful #successful} => Array<String>
|
|
1120
|
+
# * {Types::BatchReplaceClusterNodesResponse#failed #failed} => Array<Types::BatchReplaceClusterNodesError>
|
|
1121
|
+
# * {Types::BatchReplaceClusterNodesResponse#failed_node_logical_ids #failed_node_logical_ids} => Array<Types::BatchReplaceClusterNodeLogicalIdsError>
|
|
1122
|
+
# * {Types::BatchReplaceClusterNodesResponse#successful_node_logical_ids #successful_node_logical_ids} => Array<String>
|
|
1123
|
+
#
|
|
1124
|
+
# @example Request syntax with placeholder values
|
|
1125
|
+
#
|
|
1126
|
+
# resp = client.batch_replace_cluster_nodes({
|
|
1127
|
+
# cluster_name: "ClusterNameOrArn", # required
|
|
1128
|
+
# node_ids: ["ClusterNodeId"],
|
|
1129
|
+
# node_logical_ids: ["ClusterNodeLogicalId"],
|
|
1130
|
+
# })
|
|
1131
|
+
#
|
|
1132
|
+
# @example Response structure
|
|
1133
|
+
#
|
|
1134
|
+
# resp.successful #=> Array
|
|
1135
|
+
# resp.successful[0] #=> String
|
|
1136
|
+
# resp.failed #=> Array
|
|
1137
|
+
# resp.failed[0].node_id #=> String
|
|
1138
|
+
# resp.failed[0].error_code #=> String, one of "InstanceIdNotFound", "InvalidInstanceStatus", "InstanceIdInUse", "InternalServerError"
|
|
1139
|
+
# resp.failed[0].message #=> String
|
|
1140
|
+
# resp.failed_node_logical_ids #=> Array
|
|
1141
|
+
# resp.failed_node_logical_ids[0].node_logical_id #=> String
|
|
1142
|
+
# resp.failed_node_logical_ids[0].error_code #=> String, one of "InstanceIdNotFound", "InvalidInstanceStatus", "InstanceIdInUse", "InternalServerError"
|
|
1143
|
+
# resp.failed_node_logical_ids[0].message #=> String
|
|
1144
|
+
# resp.successful_node_logical_ids #=> Array
|
|
1145
|
+
# resp.successful_node_logical_ids[0] #=> String
|
|
1146
|
+
#
|
|
1147
|
+
# @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/BatchReplaceClusterNodes AWS API Documentation
|
|
1148
|
+
#
|
|
1149
|
+
# @overload batch_replace_cluster_nodes(params = {})
|
|
1150
|
+
# @param [Hash] params ({})
|
|
1151
|
+
def batch_replace_cluster_nodes(params = {}, options = {})
|
|
1152
|
+
req = build_request(:batch_replace_cluster_nodes, params)
|
|
1153
|
+
req.send_request(options)
|
|
1154
|
+
end
|
|
1155
|
+
|
|
953
1156
|
# Creates an *action*. An action is a lineage tracking entity that
|
|
954
1157
|
# represents an action or activity. For example, a model deployment or
|
|
955
1158
|
# an HPO job. Generally, an action involves at least one input or output
|
|
@@ -2243,6 +2446,7 @@ module Aws::SageMaker
|
|
|
2243
2446
|
# instance_groups: [
|
|
2244
2447
|
# {
|
|
2245
2448
|
# instance_count: 1, # required
|
|
2449
|
+
# min_instance_count: 1,
|
|
2246
2450
|
# instance_group_name: "ClusterInstanceGroupName", # required
|
|
2247
2451
|
# instance_type: "ml.p4d.24xlarge", # required, accepts ml.p4d.24xlarge, ml.p4de.24xlarge, ml.p5.48xlarge, ml.p6e-gb200.36xlarge, ml.trn1.32xlarge, ml.trn1n.32xlarge, ml.g5.xlarge, ml.g5.2xlarge, ml.g5.4xlarge, ml.g5.8xlarge, ml.g5.12xlarge, ml.g5.16xlarge, ml.g5.24xlarge, ml.g5.48xlarge, ml.c5.large, ml.c5.xlarge, ml.c5.2xlarge, ml.c5.4xlarge, ml.c5.9xlarge, ml.c5.12xlarge, ml.c5.18xlarge, ml.c5.24xlarge, ml.c5n.large, ml.c5n.2xlarge, ml.c5n.4xlarge, ml.c5n.9xlarge, ml.c5n.18xlarge, ml.m5.large, ml.m5.xlarge, ml.m5.2xlarge, ml.m5.4xlarge, ml.m5.8xlarge, ml.m5.12xlarge, ml.m5.16xlarge, ml.m5.24xlarge, ml.t3.medium, ml.t3.large, ml.t3.xlarge, ml.t3.2xlarge, ml.g6.xlarge, ml.g6.2xlarge, ml.g6.4xlarge, ml.g6.8xlarge, ml.g6.16xlarge, ml.g6.12xlarge, ml.g6.24xlarge, ml.g6.48xlarge, ml.gr6.4xlarge, ml.gr6.8xlarge, ml.g6e.xlarge, ml.g6e.2xlarge, ml.g6e.4xlarge, ml.g6e.8xlarge, ml.g6e.16xlarge, ml.g6e.12xlarge, ml.g6e.24xlarge, ml.g6e.48xlarge, ml.p5e.48xlarge, ml.p5en.48xlarge, ml.p6-b200.48xlarge, ml.trn2.3xlarge, ml.trn2.48xlarge, ml.c6i.large, ml.c6i.xlarge, ml.c6i.2xlarge, ml.c6i.4xlarge, ml.c6i.8xlarge, ml.c6i.12xlarge, ml.c6i.16xlarge, ml.c6i.24xlarge, ml.c6i.32xlarge, ml.m6i.large, ml.m6i.xlarge, ml.m6i.2xlarge, ml.m6i.4xlarge, ml.m6i.8xlarge, ml.m6i.12xlarge, ml.m6i.16xlarge, ml.m6i.24xlarge, ml.m6i.32xlarge, ml.r6i.large, ml.r6i.xlarge, ml.r6i.2xlarge, ml.r6i.4xlarge, ml.r6i.8xlarge, ml.r6i.12xlarge, ml.r6i.16xlarge, ml.r6i.24xlarge, ml.r6i.32xlarge, ml.i3en.large, ml.i3en.xlarge, ml.i3en.2xlarge, ml.i3en.3xlarge, ml.i3en.6xlarge, ml.i3en.12xlarge, ml.i3en.24xlarge, ml.m7i.large, ml.m7i.xlarge, ml.m7i.2xlarge, ml.m7i.4xlarge, ml.m7i.8xlarge, ml.m7i.12xlarge, ml.m7i.16xlarge, ml.m7i.24xlarge, ml.m7i.48xlarge, ml.r7i.large, ml.r7i.xlarge, ml.r7i.2xlarge, ml.r7i.4xlarge, ml.r7i.8xlarge, ml.r7i.12xlarge, ml.r7i.16xlarge, ml.r7i.24xlarge, ml.r7i.48xlarge
|
|
2248
2452
|
# life_cycle_config: { # required
|
|
@@ -2288,6 +2492,24 @@ module Aws::SageMaker
|
|
|
2288
2492
|
# },
|
|
2289
2493
|
# },
|
|
2290
2494
|
# image_id: "ImageId",
|
|
2495
|
+
# kubernetes_config: {
|
|
2496
|
+
# labels: {
|
|
2497
|
+
# "ClusterKubernetesLabelKey" => "ClusterKubernetesLabelValue",
|
|
2498
|
+
# },
|
|
2499
|
+
# taints: [
|
|
2500
|
+
# {
|
|
2501
|
+
# key: "ClusterKubernetesTaintKey", # required
|
|
2502
|
+
# value: "ClusterKubernetesTaintValue",
|
|
2503
|
+
# effect: "NoSchedule", # required, accepts NoSchedule, PreferNoSchedule, NoExecute
|
|
2504
|
+
# },
|
|
2505
|
+
# ],
|
|
2506
|
+
# },
|
|
2507
|
+
# capacity_requirements: {
|
|
2508
|
+
# spot: {
|
|
2509
|
+
# },
|
|
2510
|
+
# on_demand: {
|
|
2511
|
+
# },
|
|
2512
|
+
# },
|
|
2291
2513
|
# },
|
|
2292
2514
|
# ],
|
|
2293
2515
|
# restricted_instance_groups: [
|
|
@@ -2725,6 +2947,10 @@ module Aws::SageMaker
|
|
|
2725
2947
|
# accelerators: 1,
|
|
2726
2948
|
# v_cpu: 1.0,
|
|
2727
2949
|
# memory_in_gi_b: 1.0,
|
|
2950
|
+
# accelerator_partition: {
|
|
2951
|
+
# type: "mig-1g.5gb", # required, accepts mig-1g.5gb, mig-1g.10gb, mig-1g.18gb, mig-1g.20gb, mig-1g.23gb, mig-1g.35gb, mig-1g.45gb, mig-1g.47gb, mig-2g.10gb, mig-2g.20gb, mig-2g.35gb, mig-2g.45gb, mig-2g.47gb, mig-3g.20gb, mig-3g.40gb, mig-3g.71gb, mig-3g.90gb, mig-3g.93gb, mig-4g.20gb, mig-4g.40gb, mig-4g.71gb, mig-4g.90gb, mig-4g.93gb, mig-7g.40gb, mig-7g.80gb, mig-7g.141gb, mig-7g.180gb, mig-7g.186gb
|
|
2952
|
+
# count: 1, # required
|
|
2953
|
+
# },
|
|
2728
2954
|
# },
|
|
2729
2955
|
# ],
|
|
2730
2956
|
# resource_sharing_config: {
|
|
@@ -8363,6 +8589,9 @@ module Aws::SageMaker
|
|
|
8363
8589
|
# The type of instance that hosts the optimized model that you create
|
|
8364
8590
|
# with the optimization job.
|
|
8365
8591
|
#
|
|
8592
|
+
# @option params [Integer] :max_instance_count
|
|
8593
|
+
# The maximum number of instances to use for the optimization job.
|
|
8594
|
+
#
|
|
8366
8595
|
# @option params [Hash<String,String>] :optimization_environment
|
|
8367
8596
|
# The environment variables to set in the model container.
|
|
8368
8597
|
#
|
|
@@ -8424,8 +8653,12 @@ module Aws::SageMaker
|
|
|
8424
8653
|
# accept_eula: false, # required
|
|
8425
8654
|
# },
|
|
8426
8655
|
# },
|
|
8656
|
+
# sage_maker_model: {
|
|
8657
|
+
# model_name: "ModelName",
|
|
8658
|
+
# },
|
|
8427
8659
|
# },
|
|
8428
|
-
# deployment_instance_type: "ml.p4d.24xlarge", # required, accepts ml.p4d.24xlarge, ml.p4de.24xlarge, ml.p5.48xlarge, ml.g5.xlarge, ml.g5.2xlarge, ml.g5.4xlarge, ml.g5.8xlarge, ml.g5.12xlarge, ml.g5.16xlarge, ml.g5.24xlarge, ml.g5.48xlarge, ml.g6.xlarge, ml.g6.2xlarge, ml.g6.4xlarge, ml.g6.8xlarge, ml.g6.12xlarge, ml.g6.16xlarge, ml.g6.24xlarge, ml.g6.48xlarge, ml.g6e.xlarge, ml.g6e.2xlarge, ml.g6e.4xlarge, ml.g6e.8xlarge, ml.g6e.12xlarge, ml.g6e.16xlarge, ml.g6e.24xlarge, ml.g6e.48xlarge, ml.inf2.xlarge, ml.inf2.8xlarge, ml.inf2.24xlarge, ml.inf2.48xlarge, ml.trn1.2xlarge, ml.trn1.32xlarge, ml.trn1n.32xlarge
|
|
8660
|
+
# deployment_instance_type: "ml.p4d.24xlarge", # required, accepts ml.p4d.24xlarge, ml.p4de.24xlarge, ml.p5.48xlarge, ml.p5e.48xlarge, ml.p5en.48xlarge, ml.g5.xlarge, ml.g5.2xlarge, ml.g5.4xlarge, ml.g5.8xlarge, ml.g5.12xlarge, ml.g5.16xlarge, ml.g5.24xlarge, ml.g5.48xlarge, ml.g6.xlarge, ml.g6.2xlarge, ml.g6.4xlarge, ml.g6.8xlarge, ml.g6.12xlarge, ml.g6.16xlarge, ml.g6.24xlarge, ml.g6.48xlarge, ml.g6e.xlarge, ml.g6e.2xlarge, ml.g6e.4xlarge, ml.g6e.8xlarge, ml.g6e.12xlarge, ml.g6e.16xlarge, ml.g6e.24xlarge, ml.g6e.48xlarge, ml.inf2.xlarge, ml.inf2.8xlarge, ml.inf2.24xlarge, ml.inf2.48xlarge, ml.trn1.2xlarge, ml.trn1.32xlarge, ml.trn1n.32xlarge
|
|
8661
|
+
# max_instance_count: 1,
|
|
8429
8662
|
# optimization_environment: {
|
|
8430
8663
|
# "NonEmptyString256" => "String256",
|
|
8431
8664
|
# },
|
|
@@ -8449,11 +8682,21 @@ module Aws::SageMaker
|
|
|
8449
8682
|
# "NonEmptyString256" => "String256",
|
|
8450
8683
|
# },
|
|
8451
8684
|
# },
|
|
8685
|
+
# model_speculative_decoding_config: {
|
|
8686
|
+
# technique: "EAGLE", # required, accepts EAGLE
|
|
8687
|
+
# training_data_source: {
|
|
8688
|
+
# s3_uri: "S3Uri", # required
|
|
8689
|
+
# s3_data_type: "S3Prefix", # required, accepts S3Prefix, ManifestFile
|
|
8690
|
+
# },
|
|
8691
|
+
# },
|
|
8452
8692
|
# },
|
|
8453
8693
|
# ],
|
|
8454
8694
|
# output_config: { # required
|
|
8455
8695
|
# kms_key_id: "KmsKeyId",
|
|
8456
8696
|
# s3_output_location: "S3Uri", # required
|
|
8697
|
+
# sage_maker_model: {
|
|
8698
|
+
# model_name: "ModelName",
|
|
8699
|
+
# },
|
|
8457
8700
|
# },
|
|
8458
8701
|
# stopping_condition: { # required
|
|
8459
8702
|
# max_runtime_in_seconds: 1,
|
|
@@ -13443,6 +13686,7 @@ module Aws::SageMaker
|
|
|
13443
13686
|
# resp.instance_groups #=> Array
|
|
13444
13687
|
# resp.instance_groups[0].current_count #=> Integer
|
|
13445
13688
|
# resp.instance_groups[0].target_count #=> Integer
|
|
13689
|
+
# resp.instance_groups[0].min_count #=> Integer
|
|
13446
13690
|
# resp.instance_groups[0].instance_group_name #=> String
|
|
13447
13691
|
# resp.instance_groups[0].instance_type #=> String, one of "ml.p4d.24xlarge", "ml.p4de.24xlarge", "ml.p5.48xlarge", "ml.p6e-gb200.36xlarge", "ml.trn1.32xlarge", "ml.trn1n.32xlarge", "ml.g5.xlarge", "ml.g5.2xlarge", "ml.g5.4xlarge", "ml.g5.8xlarge", "ml.g5.12xlarge", "ml.g5.16xlarge", "ml.g5.24xlarge", "ml.g5.48xlarge", "ml.c5.large", "ml.c5.xlarge", "ml.c5.2xlarge", "ml.c5.4xlarge", "ml.c5.9xlarge", "ml.c5.12xlarge", "ml.c5.18xlarge", "ml.c5.24xlarge", "ml.c5n.large", "ml.c5n.2xlarge", "ml.c5n.4xlarge", "ml.c5n.9xlarge", "ml.c5n.18xlarge", "ml.m5.large", "ml.m5.xlarge", "ml.m5.2xlarge", "ml.m5.4xlarge", "ml.m5.8xlarge", "ml.m5.12xlarge", "ml.m5.16xlarge", "ml.m5.24xlarge", "ml.t3.medium", "ml.t3.large", "ml.t3.xlarge", "ml.t3.2xlarge", "ml.g6.xlarge", "ml.g6.2xlarge", "ml.g6.4xlarge", "ml.g6.8xlarge", "ml.g6.16xlarge", "ml.g6.12xlarge", "ml.g6.24xlarge", "ml.g6.48xlarge", "ml.gr6.4xlarge", "ml.gr6.8xlarge", "ml.g6e.xlarge", "ml.g6e.2xlarge", "ml.g6e.4xlarge", "ml.g6e.8xlarge", "ml.g6e.16xlarge", "ml.g6e.12xlarge", "ml.g6e.24xlarge", "ml.g6e.48xlarge", "ml.p5e.48xlarge", "ml.p5en.48xlarge", "ml.p6-b200.48xlarge", "ml.trn2.3xlarge", "ml.trn2.48xlarge", "ml.c6i.large", "ml.c6i.xlarge", "ml.c6i.2xlarge", "ml.c6i.4xlarge", "ml.c6i.8xlarge", "ml.c6i.12xlarge", "ml.c6i.16xlarge", "ml.c6i.24xlarge", "ml.c6i.32xlarge", "ml.m6i.large", "ml.m6i.xlarge", "ml.m6i.2xlarge", "ml.m6i.4xlarge", "ml.m6i.8xlarge", "ml.m6i.12xlarge", "ml.m6i.16xlarge", "ml.m6i.24xlarge", "ml.m6i.32xlarge", "ml.r6i.large", "ml.r6i.xlarge", "ml.r6i.2xlarge", "ml.r6i.4xlarge", "ml.r6i.8xlarge", "ml.r6i.12xlarge", "ml.r6i.16xlarge", "ml.r6i.24xlarge", "ml.r6i.32xlarge", "ml.i3en.large", "ml.i3en.xlarge", "ml.i3en.2xlarge", "ml.i3en.3xlarge", "ml.i3en.6xlarge", "ml.i3en.12xlarge", "ml.i3en.24xlarge", "ml.m7i.large", "ml.m7i.xlarge", "ml.m7i.2xlarge", "ml.m7i.4xlarge", "ml.m7i.8xlarge", "ml.m7i.12xlarge", "ml.m7i.16xlarge", "ml.m7i.24xlarge", "ml.m7i.48xlarge", "ml.r7i.large", "ml.r7i.xlarge", 
"ml.r7i.2xlarge", "ml.r7i.4xlarge", "ml.r7i.8xlarge", "ml.r7i.12xlarge", "ml.r7i.16xlarge", "ml.r7i.24xlarge", "ml.r7i.48xlarge"
|
|
13448
13692
|
# resp.instance_groups[0].life_cycle_config.source_s3_uri #=> String
|
|
@@ -13472,6 +13716,20 @@ module Aws::SageMaker
|
|
|
13472
13716
|
# resp.instance_groups[0].scheduled_update_config.deployment_config.auto_rollback_configuration[0].alarm_name #=> String
|
|
13473
13717
|
# resp.instance_groups[0].current_image_id #=> String
|
|
13474
13718
|
# resp.instance_groups[0].desired_image_id #=> String
|
|
13719
|
+
# resp.instance_groups[0].active_operations #=> Hash
|
|
13720
|
+
# resp.instance_groups[0].active_operations["ActiveClusterOperationName"] #=> Integer
|
|
13721
|
+
# resp.instance_groups[0].kubernetes_config.current_labels #=> Hash
|
|
13722
|
+
# resp.instance_groups[0].kubernetes_config.current_labels["ClusterKubernetesLabelKey"] #=> String
|
|
13723
|
+
# resp.instance_groups[0].kubernetes_config.desired_labels #=> Hash
|
|
13724
|
+
# resp.instance_groups[0].kubernetes_config.desired_labels["ClusterKubernetesLabelKey"] #=> String
|
|
13725
|
+
# resp.instance_groups[0].kubernetes_config.current_taints #=> Array
|
|
13726
|
+
# resp.instance_groups[0].kubernetes_config.current_taints[0].key #=> String
|
|
13727
|
+
# resp.instance_groups[0].kubernetes_config.current_taints[0].value #=> String
|
|
13728
|
+
# resp.instance_groups[0].kubernetes_config.current_taints[0].effect #=> String, one of "NoSchedule", "PreferNoSchedule", "NoExecute"
|
|
13729
|
+
# resp.instance_groups[0].kubernetes_config.desired_taints #=> Array
|
|
13730
|
+
# resp.instance_groups[0].kubernetes_config.desired_taints[0].key #=> String
|
|
13731
|
+
# resp.instance_groups[0].kubernetes_config.desired_taints[0].value #=> String
|
|
13732
|
+
# resp.instance_groups[0].kubernetes_config.desired_taints[0].effect #=> String, one of "NoSchedule", "PreferNoSchedule", "NoExecute"
|
|
13475
13733
|
# resp.instance_groups[0].target_state_count #=> Integer
|
|
13476
13734
|
# resp.instance_groups[0].software_update_status #=> String, one of "Pending", "InProgress", "Succeeded", "Failed", "RollbackInProgress", "RollbackComplete"
|
|
13477
13735
|
# resp.instance_groups[0].active_software_update_config.rolling_update_policy.maximum_batch_size.type #=> String, one of "INSTANCE_COUNT", "CAPACITY_PERCENTAGE"
|
|
@@ -13582,6 +13840,7 @@ module Aws::SageMaker
|
|
|
13582
13840
|
# resp.event_details.event_details.event_metadata.instance_group.ami_override #=> String
|
|
13583
13841
|
# resp.event_details.event_details.event_metadata.instance_group_scaling.instance_count #=> Integer
|
|
13584
13842
|
# resp.event_details.event_details.event_metadata.instance_group_scaling.target_count #=> Integer
|
|
13843
|
+
# resp.event_details.event_details.event_metadata.instance_group_scaling.min_count #=> Integer
|
|
13585
13844
|
# resp.event_details.event_details.event_metadata.instance_group_scaling.failure_message #=> String
|
|
13586
13845
|
# resp.event_details.event_details.event_metadata.instance.customer_eni #=> String
|
|
13587
13846
|
# resp.event_details.event_details.event_metadata.instance.additional_enis.efa_enis #=> Array
|
|
@@ -13659,6 +13918,19 @@ module Aws::SageMaker
|
|
|
13659
13918
|
# resp.node_details.current_image_id #=> String
|
|
13660
13919
|
# resp.node_details.desired_image_id #=> String
|
|
13661
13920
|
# resp.node_details.ultra_server_info.id #=> String
|
|
13921
|
+
# resp.node_details.kubernetes_config.current_labels #=> Hash
|
|
13922
|
+
# resp.node_details.kubernetes_config.current_labels["ClusterKubernetesLabelKey"] #=> String
|
|
13923
|
+
# resp.node_details.kubernetes_config.desired_labels #=> Hash
|
|
13924
|
+
# resp.node_details.kubernetes_config.desired_labels["ClusterKubernetesLabelKey"] #=> String
|
|
13925
|
+
# resp.node_details.kubernetes_config.current_taints #=> Array
|
|
13926
|
+
# resp.node_details.kubernetes_config.current_taints[0].key #=> String
|
|
13927
|
+
# resp.node_details.kubernetes_config.current_taints[0].value #=> String
|
|
13928
|
+
# resp.node_details.kubernetes_config.current_taints[0].effect #=> String, one of "NoSchedule", "PreferNoSchedule", "NoExecute"
|
|
13929
|
+
# resp.node_details.kubernetes_config.desired_taints #=> Array
|
|
13930
|
+
# resp.node_details.kubernetes_config.desired_taints[0].key #=> String
|
|
13931
|
+
# resp.node_details.kubernetes_config.desired_taints[0].value #=> String
|
|
13932
|
+
# resp.node_details.kubernetes_config.desired_taints[0].effect #=> String, one of "NoSchedule", "PreferNoSchedule", "NoExecute"
|
|
13933
|
+
# resp.node_details.capacity_type #=> String, one of "Spot", "OnDemand"
|
|
13662
13934
|
#
|
|
13663
13935
|
# @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/DescribeClusterNode AWS API Documentation
|
|
13664
13936
|
#
|
|
@@ -13912,6 +14184,8 @@ module Aws::SageMaker
|
|
|
13912
14184
|
# resp.compute_quota_config.compute_quota_resources[0].accelerators #=> Integer
|
|
13913
14185
|
# resp.compute_quota_config.compute_quota_resources[0].v_cpu #=> Float
|
|
13914
14186
|
# resp.compute_quota_config.compute_quota_resources[0].memory_in_gi_b #=> Float
|
|
14187
|
+
# resp.compute_quota_config.compute_quota_resources[0].accelerator_partition.type #=> String, one of "mig-1g.5gb", "mig-1g.10gb", "mig-1g.18gb", "mig-1g.20gb", "mig-1g.23gb", "mig-1g.35gb", "mig-1g.45gb", "mig-1g.47gb", "mig-2g.10gb", "mig-2g.20gb", "mig-2g.35gb", "mig-2g.45gb", "mig-2g.47gb", "mig-3g.20gb", "mig-3g.40gb", "mig-3g.71gb", "mig-3g.90gb", "mig-3g.93gb", "mig-4g.20gb", "mig-4g.40gb", "mig-4g.71gb", "mig-4g.90gb", "mig-4g.93gb", "mig-7g.40gb", "mig-7g.80gb", "mig-7g.141gb", "mig-7g.180gb", "mig-7g.186gb"
|
|
14188
|
+
# resp.compute_quota_config.compute_quota_resources[0].accelerator_partition.count #=> Integer
|
|
13915
14189
|
# resp.compute_quota_config.resource_sharing_config.strategy #=> String, one of "Lend", "DontLend", "LendAndBorrow"
|
|
13916
14190
|
# resp.compute_quota_config.resource_sharing_config.borrow_limit #=> Integer
|
|
13917
14191
|
# resp.compute_quota_config.preempt_team_tasks #=> String, one of "Never", "LowerPriority"
|
|
@@ -17399,6 +17673,7 @@ module Aws::SageMaker
|
|
|
17399
17673
|
# * {Types::DescribeOptimizationJobResponse#model_source #model_source} => Types::OptimizationJobModelSource
|
|
17400
17674
|
# * {Types::DescribeOptimizationJobResponse#optimization_environment #optimization_environment} => Hash<String,String>
|
|
17401
17675
|
# * {Types::DescribeOptimizationJobResponse#deployment_instance_type #deployment_instance_type} => String
|
|
17676
|
+
# * {Types::DescribeOptimizationJobResponse#max_instance_count #max_instance_count} => Integer
|
|
17402
17677
|
# * {Types::DescribeOptimizationJobResponse#optimization_configs #optimization_configs} => Array<Types::OptimizationConfig>
|
|
17403
17678
|
# * {Types::DescribeOptimizationJobResponse#output_config #output_config} => Types::OptimizationJobOutputConfig
|
|
17404
17679
|
# * {Types::DescribeOptimizationJobResponse#optimization_output #optimization_output} => Types::OptimizationOutput
|
|
@@ -17424,9 +17699,11 @@ module Aws::SageMaker
|
|
|
17424
17699
|
# resp.optimization_job_name #=> String
|
|
17425
17700
|
# resp.model_source.s3.s3_uri #=> String
|
|
17426
17701
|
# resp.model_source.s3.model_access_config.accept_eula #=> Boolean
|
|
17702
|
+
# resp.model_source.sage_maker_model.model_name #=> String
|
|
17427
17703
|
# resp.optimization_environment #=> Hash
|
|
17428
17704
|
# resp.optimization_environment["NonEmptyString256"] #=> String
|
|
17429
|
-
# resp.deployment_instance_type #=> String, one of "ml.p4d.24xlarge", "ml.p4de.24xlarge", "ml.p5.48xlarge", "ml.g5.xlarge", "ml.g5.2xlarge", "ml.g5.4xlarge", "ml.g5.8xlarge", "ml.g5.12xlarge", "ml.g5.16xlarge", "ml.g5.24xlarge", "ml.g5.48xlarge", "ml.g6.xlarge", "ml.g6.2xlarge", "ml.g6.4xlarge", "ml.g6.8xlarge", "ml.g6.12xlarge", "ml.g6.16xlarge", "ml.g6.24xlarge", "ml.g6.48xlarge", "ml.g6e.xlarge", "ml.g6e.2xlarge", "ml.g6e.4xlarge", "ml.g6e.8xlarge", "ml.g6e.12xlarge", "ml.g6e.16xlarge", "ml.g6e.24xlarge", "ml.g6e.48xlarge", "ml.inf2.xlarge", "ml.inf2.8xlarge", "ml.inf2.24xlarge", "ml.inf2.48xlarge", "ml.trn1.2xlarge", "ml.trn1.32xlarge", "ml.trn1n.32xlarge"
|
|
17705
|
+
# resp.deployment_instance_type #=> String, one of "ml.p4d.24xlarge", "ml.p4de.24xlarge", "ml.p5.48xlarge", "ml.p5e.48xlarge", "ml.p5en.48xlarge", "ml.g5.xlarge", "ml.g5.2xlarge", "ml.g5.4xlarge", "ml.g5.8xlarge", "ml.g5.12xlarge", "ml.g5.16xlarge", "ml.g5.24xlarge", "ml.g5.48xlarge", "ml.g6.xlarge", "ml.g6.2xlarge", "ml.g6.4xlarge", "ml.g6.8xlarge", "ml.g6.12xlarge", "ml.g6.16xlarge", "ml.g6.24xlarge", "ml.g6.48xlarge", "ml.g6e.xlarge", "ml.g6e.2xlarge", "ml.g6e.4xlarge", "ml.g6e.8xlarge", "ml.g6e.12xlarge", "ml.g6e.16xlarge", "ml.g6e.24xlarge", "ml.g6e.48xlarge", "ml.inf2.xlarge", "ml.inf2.8xlarge", "ml.inf2.24xlarge", "ml.inf2.48xlarge", "ml.trn1.2xlarge", "ml.trn1.32xlarge", "ml.trn1n.32xlarge"
|
|
17706
|
+
# resp.max_instance_count #=> Integer
|
|
17430
17707
|
# resp.optimization_configs #=> Array
|
|
17431
17708
|
# resp.optimization_configs[0].model_quantization_config.image #=> String
|
|
17432
17709
|
# resp.optimization_configs[0].model_quantization_config.override_environment #=> Hash
|
|
@@ -17437,8 +17714,12 @@ module Aws::SageMaker
|
|
|
17437
17714
|
# resp.optimization_configs[0].model_sharding_config.image #=> String
|
|
17438
17715
|
# resp.optimization_configs[0].model_sharding_config.override_environment #=> Hash
|
|
17439
17716
|
# resp.optimization_configs[0].model_sharding_config.override_environment["NonEmptyString256"] #=> String
|
|
17717
|
+
# resp.optimization_configs[0].model_speculative_decoding_config.technique #=> String, one of "EAGLE"
|
|
17718
|
+
# resp.optimization_configs[0].model_speculative_decoding_config.training_data_source.s3_uri #=> String
|
|
17719
|
+
# resp.optimization_configs[0].model_speculative_decoding_config.training_data_source.s3_data_type #=> String, one of "S3Prefix", "ManifestFile"
|
|
17440
17720
|
# resp.output_config.kms_key_id #=> String
|
|
17441
17721
|
# resp.output_config.s3_output_location #=> String
|
|
17722
|
+
# resp.output_config.sage_maker_model.model_name #=> String
|
|
17442
17723
|
# resp.optimization_output.recommended_inference_image #=> String
|
|
17443
17724
|
# resp.role_arn #=> String
|
|
17444
17725
|
# resp.stopping_condition.max_runtime_in_seconds #=> Integer
|
|
@@ -18411,7 +18692,7 @@ module Aws::SageMaker
|
|
|
18411
18692
|
# resp.available_spare_instance_count #=> Integer
|
|
18412
18693
|
# resp.total_ultra_server_count #=> Integer
|
|
18413
18694
|
# resp.target_resources #=> Array
|
|
18414
|
-
# resp.target_resources[0] #=> String, one of "training-job", "hyperpod-cluster"
|
|
18695
|
+
# resp.target_resources[0] #=> String, one of "training-job", "hyperpod-cluster", "endpoint"
|
|
18415
18696
|
# resp.reserved_capacity_summaries #=> Array
|
|
18416
18697
|
# resp.reserved_capacity_summaries[0].reserved_capacity_arn #=> String
|
|
18417
18698
|
# resp.reserved_capacity_summaries[0].reserved_capacity_type #=> String, one of "UltraServer", "Instance"
|
|
@@ -20350,6 +20631,7 @@ module Aws::SageMaker
|
|
|
20350
20631
|
# resp.cluster_node_summaries[0].instance_status.status #=> String, one of "Running", "Failure", "Pending", "ShuttingDown", "SystemUpdating", "DeepHealthCheckInProgress", "NotFound"
|
|
20351
20632
|
# resp.cluster_node_summaries[0].instance_status.message #=> String
|
|
20352
20633
|
# resp.cluster_node_summaries[0].ultra_server_info.id #=> String
|
|
20634
|
+
# resp.cluster_node_summaries[0].private_dns_hostname #=> String
|
|
20353
20635
|
#
|
|
20354
20636
|
# @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/ListClusterNodes AWS API Documentation
|
|
20355
20637
|
#
|
|
@@ -20813,6 +21095,8 @@ module Aws::SageMaker
|
|
|
20813
21095
|
# resp.compute_quota_summaries[0].compute_quota_config.compute_quota_resources[0].accelerators #=> Integer
|
|
20814
21096
|
# resp.compute_quota_summaries[0].compute_quota_config.compute_quota_resources[0].v_cpu #=> Float
|
|
20815
21097
|
# resp.compute_quota_summaries[0].compute_quota_config.compute_quota_resources[0].memory_in_gi_b #=> Float
|
|
21098
|
+
# resp.compute_quota_summaries[0].compute_quota_config.compute_quota_resources[0].accelerator_partition.type #=> String, one of "mig-1g.5gb", "mig-1g.10gb", "mig-1g.18gb", "mig-1g.20gb", "mig-1g.23gb", "mig-1g.35gb", "mig-1g.45gb", "mig-1g.47gb", "mig-2g.10gb", "mig-2g.20gb", "mig-2g.35gb", "mig-2g.45gb", "mig-2g.47gb", "mig-3g.20gb", "mig-3g.40gb", "mig-3g.71gb", "mig-3g.90gb", "mig-3g.93gb", "mig-4g.20gb", "mig-4g.40gb", "mig-4g.71gb", "mig-4g.90gb", "mig-4g.93gb", "mig-7g.40gb", "mig-7g.80gb", "mig-7g.141gb", "mig-7g.180gb", "mig-7g.186gb"
|
|
21099
|
+
# resp.compute_quota_summaries[0].compute_quota_config.compute_quota_resources[0].accelerator_partition.count #=> Integer
|
|
20816
21100
|
# resp.compute_quota_summaries[0].compute_quota_config.resource_sharing_config.strategy #=> String, one of "Lend", "DontLend", "LendAndBorrow"
|
|
20817
21101
|
# resp.compute_quota_summaries[0].compute_quota_config.resource_sharing_config.borrow_limit #=> Integer
|
|
20818
21102
|
# resp.compute_quota_summaries[0].compute_quota_config.preempt_team_tasks #=> String, one of "Never", "LowerPriority"
|
|
@@ -24261,7 +24545,8 @@ module Aws::SageMaker
|
|
|
24261
24545
|
# resp.optimization_job_summaries[0].optimization_start_time #=> Time
|
|
24262
24546
|
# resp.optimization_job_summaries[0].optimization_end_time #=> Time
|
|
24263
24547
|
# resp.optimization_job_summaries[0].last_modified_time #=> Time
|
|
24264
|
-
# resp.optimization_job_summaries[0].deployment_instance_type #=> String, one of "ml.p4d.24xlarge", "ml.p4de.24xlarge", "ml.p5.48xlarge", "ml.g5.xlarge", "ml.g5.2xlarge", "ml.g5.4xlarge", "ml.g5.8xlarge", "ml.g5.12xlarge", "ml.g5.16xlarge", "ml.g5.24xlarge", "ml.g5.48xlarge", "ml.g6.xlarge", "ml.g6.2xlarge", "ml.g6.4xlarge", "ml.g6.8xlarge", "ml.g6.12xlarge", "ml.g6.16xlarge", "ml.g6.24xlarge", "ml.g6.48xlarge", "ml.g6e.xlarge", "ml.g6e.2xlarge", "ml.g6e.4xlarge", "ml.g6e.8xlarge", "ml.g6e.12xlarge", "ml.g6e.16xlarge", "ml.g6e.24xlarge", "ml.g6e.48xlarge", "ml.inf2.xlarge", "ml.inf2.8xlarge", "ml.inf2.24xlarge", "ml.inf2.48xlarge", "ml.trn1.2xlarge", "ml.trn1.32xlarge", "ml.trn1n.32xlarge"
|
|
24548
|
+
# resp.optimization_job_summaries[0].deployment_instance_type #=> String, one of "ml.p4d.24xlarge", "ml.p4de.24xlarge", "ml.p5.48xlarge", "ml.p5e.48xlarge", "ml.p5en.48xlarge", "ml.g5.xlarge", "ml.g5.2xlarge", "ml.g5.4xlarge", "ml.g5.8xlarge", "ml.g5.12xlarge", "ml.g5.16xlarge", "ml.g5.24xlarge", "ml.g5.48xlarge", "ml.g6.xlarge", "ml.g6.2xlarge", "ml.g6.4xlarge", "ml.g6.8xlarge", "ml.g6.12xlarge", "ml.g6.16xlarge", "ml.g6.24xlarge", "ml.g6.48xlarge", "ml.g6e.xlarge", "ml.g6e.2xlarge", "ml.g6e.4xlarge", "ml.g6e.8xlarge", "ml.g6e.12xlarge", "ml.g6e.16xlarge", "ml.g6e.24xlarge", "ml.g6e.48xlarge", "ml.inf2.xlarge", "ml.inf2.8xlarge", "ml.inf2.24xlarge", "ml.inf2.48xlarge", "ml.trn1.2xlarge", "ml.trn1.32xlarge", "ml.trn1n.32xlarge"
|
|
24549
|
+
# resp.optimization_job_summaries[0].max_instance_count #=> Integer
|
|
24265
24550
|
# resp.optimization_job_summaries[0].optimization_types #=> Array
|
|
24266
24551
|
# resp.optimization_job_summaries[0].optimization_types[0] #=> String
|
|
24267
24552
|
# resp.next_token #=> String
|
|
@@ -25460,7 +25745,7 @@ module Aws::SageMaker
|
|
|
25460
25745
|
# resp.training_plan_summaries[0].in_use_instance_count #=> Integer
|
|
25461
25746
|
# resp.training_plan_summaries[0].total_ultra_server_count #=> Integer
|
|
25462
25747
|
# resp.training_plan_summaries[0].target_resources #=> Array
|
|
25463
|
-
# resp.training_plan_summaries[0].target_resources[0] #=> String, one of "training-job", "hyperpod-cluster"
|
|
25748
|
+
# resp.training_plan_summaries[0].target_resources[0] #=> String, one of "training-job", "hyperpod-cluster", "endpoint"
|
|
25464
25749
|
# resp.training_plan_summaries[0].reserved_capacity_summaries #=> Array
|
|
25465
25750
|
# resp.training_plan_summaries[0].reserved_capacity_summaries[0].reserved_capacity_arn #=> String
|
|
25466
25751
|
# resp.training_plan_summaries[0].reserved_capacity_summaries[0].reserved_capacity_type #=> String, one of "UltraServer", "Instance"
|
|
@@ -26481,7 +26766,7 @@ module Aws::SageMaker
|
|
|
26481
26766
|
#
|
|
26482
26767
|
# @option params [required, Array<String>] :target_resources
|
|
26483
26768
|
# The target resources (e.g., SageMaker Training Jobs, SageMaker
|
|
26484
|
-
# HyperPod) to search for in the offerings.
|
|
26769
|
+
# HyperPod, SageMaker Endpoints) to search for in the offerings.
|
|
26485
26770
|
#
|
|
26486
26771
|
# Training plans are specific to their target resource.
|
|
26487
26772
|
#
|
|
@@ -26491,6 +26776,10 @@ module Aws::SageMaker
|
|
|
26491
26776
|
# * A training plan for HyperPod clusters can be used exclusively to
|
|
26492
26777
|
# provide compute resources to a cluster's instance group.
|
|
26493
26778
|
#
|
|
26779
|
+
# * A training plan for SageMaker endpoints can be used exclusively to
|
|
26780
|
+
# provide compute resources to SageMaker endpoints for model
|
|
26781
|
+
# deployment.
|
|
26782
|
+
#
|
|
26494
26783
|
# @return [Types::SearchTrainingPlanOfferingsResponse] Returns a {Seahorse::Client::Response response} object which responds to the following methods:
|
|
26495
26784
|
#
|
|
26496
26785
|
# * {Types::SearchTrainingPlanOfferingsResponse#training_plan_offerings #training_plan_offerings} => Array<Types::TrainingPlanOffering>
|
|
@@ -26505,7 +26794,7 @@ module Aws::SageMaker
|
|
|
26505
26794
|
# start_time_after: Time.now,
|
|
26506
26795
|
# end_time_before: Time.now,
|
|
26507
26796
|
# duration_hours: 1, # required
|
|
26508
|
-
# target_resources: ["training-job"], # required, accepts training-job, hyperpod-cluster
|
|
26797
|
+
# target_resources: ["training-job"], # required, accepts training-job, hyperpod-cluster, endpoint
|
|
26509
26798
|
# })
|
|
26510
26799
|
#
|
|
26511
26800
|
# @example Response structure
|
|
@@ -26513,7 +26802,7 @@ module Aws::SageMaker
|
|
|
26513
26802
|
# resp.training_plan_offerings #=> Array
|
|
26514
26803
|
# resp.training_plan_offerings[0].training_plan_offering_id #=> String
|
|
26515
26804
|
# resp.training_plan_offerings[0].target_resources #=> Array
|
|
26516
|
-
# resp.training_plan_offerings[0].target_resources[0] #=> String, one of "training-job", "hyperpod-cluster"
|
|
26805
|
+
# resp.training_plan_offerings[0].target_resources[0] #=> String, one of "training-job", "hyperpod-cluster", "endpoint"
|
|
26517
26806
|
# resp.training_plan_offerings[0].requested_start_time_after #=> Time
|
|
26518
26807
|
# resp.training_plan_offerings[0].requested_end_time_before #=> Time
|
|
26519
26808
|
# resp.training_plan_offerings[0].duration_hours #=> Integer
|
|
@@ -27596,6 +27885,7 @@ module Aws::SageMaker
|
|
|
27596
27885
|
# instance_groups: [
|
|
27597
27886
|
# {
|
|
27598
27887
|
# instance_count: 1, # required
|
|
27888
|
+
# min_instance_count: 1,
|
|
27599
27889
|
# instance_group_name: "ClusterInstanceGroupName", # required
|
|
27600
27890
|
# instance_type: "ml.p4d.24xlarge", # required, accepts ml.p4d.24xlarge, ml.p4de.24xlarge, ml.p5.48xlarge, ml.p6e-gb200.36xlarge, ml.trn1.32xlarge, ml.trn1n.32xlarge, ml.g5.xlarge, ml.g5.2xlarge, ml.g5.4xlarge, ml.g5.8xlarge, ml.g5.12xlarge, ml.g5.16xlarge, ml.g5.24xlarge, ml.g5.48xlarge, ml.c5.large, ml.c5.xlarge, ml.c5.2xlarge, ml.c5.4xlarge, ml.c5.9xlarge, ml.c5.12xlarge, ml.c5.18xlarge, ml.c5.24xlarge, ml.c5n.large, ml.c5n.2xlarge, ml.c5n.4xlarge, ml.c5n.9xlarge, ml.c5n.18xlarge, ml.m5.large, ml.m5.xlarge, ml.m5.2xlarge, ml.m5.4xlarge, ml.m5.8xlarge, ml.m5.12xlarge, ml.m5.16xlarge, ml.m5.24xlarge, ml.t3.medium, ml.t3.large, ml.t3.xlarge, ml.t3.2xlarge, ml.g6.xlarge, ml.g6.2xlarge, ml.g6.4xlarge, ml.g6.8xlarge, ml.g6.16xlarge, ml.g6.12xlarge, ml.g6.24xlarge, ml.g6.48xlarge, ml.gr6.4xlarge, ml.gr6.8xlarge, ml.g6e.xlarge, ml.g6e.2xlarge, ml.g6e.4xlarge, ml.g6e.8xlarge, ml.g6e.16xlarge, ml.g6e.12xlarge, ml.g6e.24xlarge, ml.g6e.48xlarge, ml.p5e.48xlarge, ml.p5en.48xlarge, ml.p6-b200.48xlarge, ml.trn2.3xlarge, ml.trn2.48xlarge, ml.c6i.large, ml.c6i.xlarge, ml.c6i.2xlarge, ml.c6i.4xlarge, ml.c6i.8xlarge, ml.c6i.12xlarge, ml.c6i.16xlarge, ml.c6i.24xlarge, ml.c6i.32xlarge, ml.m6i.large, ml.m6i.xlarge, ml.m6i.2xlarge, ml.m6i.4xlarge, ml.m6i.8xlarge, ml.m6i.12xlarge, ml.m6i.16xlarge, ml.m6i.24xlarge, ml.m6i.32xlarge, ml.r6i.large, ml.r6i.xlarge, ml.r6i.2xlarge, ml.r6i.4xlarge, ml.r6i.8xlarge, ml.r6i.12xlarge, ml.r6i.16xlarge, ml.r6i.24xlarge, ml.r6i.32xlarge, ml.i3en.large, ml.i3en.xlarge, ml.i3en.2xlarge, ml.i3en.3xlarge, ml.i3en.6xlarge, ml.i3en.12xlarge, ml.i3en.24xlarge, ml.m7i.large, ml.m7i.xlarge, ml.m7i.2xlarge, ml.m7i.4xlarge, ml.m7i.8xlarge, ml.m7i.12xlarge, ml.m7i.16xlarge, ml.m7i.24xlarge, ml.m7i.48xlarge, ml.r7i.large, ml.r7i.xlarge, ml.r7i.2xlarge, ml.r7i.4xlarge, ml.r7i.8xlarge, ml.r7i.12xlarge, ml.r7i.16xlarge, ml.r7i.24xlarge, ml.r7i.48xlarge
|
|
27601
27891
|
# life_cycle_config: { # required
|
|
@@ -27641,6 +27931,24 @@ module Aws::SageMaker
|
|
|
27641
27931
|
# },
|
|
27642
27932
|
# },
|
|
27643
27933
|
# image_id: "ImageId",
|
|
27934
|
+
# kubernetes_config: {
|
|
27935
|
+
# labels: {
|
|
27936
|
+
# "ClusterKubernetesLabelKey" => "ClusterKubernetesLabelValue",
|
|
27937
|
+
# },
|
|
27938
|
+
# taints: [
|
|
27939
|
+
# {
|
|
27940
|
+
# key: "ClusterKubernetesTaintKey", # required
|
|
27941
|
+
# value: "ClusterKubernetesTaintValue",
|
|
27942
|
+
# effect: "NoSchedule", # required, accepts NoSchedule, PreferNoSchedule, NoExecute
|
|
27943
|
+
# },
|
|
27944
|
+
# ],
|
|
27945
|
+
# },
|
|
27946
|
+
# capacity_requirements: {
|
|
27947
|
+
# spot: {
|
|
27948
|
+
# },
|
|
27949
|
+
# on_demand: {
|
|
27950
|
+
# },
|
|
27951
|
+
# },
|
|
27644
27952
|
# },
|
|
27645
27953
|
# ],
|
|
27646
27954
|
# restricted_instance_groups: [
|
|
@@ -27951,6 +28259,10 @@ module Aws::SageMaker
|
|
|
27951
28259
|
# accelerators: 1,
|
|
27952
28260
|
# v_cpu: 1.0,
|
|
27953
28261
|
# memory_in_gi_b: 1.0,
|
|
28262
|
+
# accelerator_partition: {
|
|
28263
|
+
# type: "mig-1g.5gb", # required, accepts mig-1g.5gb, mig-1g.10gb, mig-1g.18gb, mig-1g.20gb, mig-1g.23gb, mig-1g.35gb, mig-1g.45gb, mig-1g.47gb, mig-2g.10gb, mig-2g.20gb, mig-2g.35gb, mig-2g.45gb, mig-2g.47gb, mig-3g.20gb, mig-3g.40gb, mig-3g.71gb, mig-3g.90gb, mig-3g.93gb, mig-4g.20gb, mig-4g.40gb, mig-4g.71gb, mig-4g.90gb, mig-4g.93gb, mig-7g.40gb, mig-7g.80gb, mig-7g.141gb, mig-7g.180gb, mig-7g.186gb
|
|
28264
|
+
# count: 1, # required
|
|
28265
|
+
# },
|
|
27954
28266
|
# },
|
|
27955
28267
|
# ],
|
|
27956
28268
|
# resource_sharing_config: {
|
|
@@ -31359,7 +31671,7 @@ module Aws::SageMaker
|
|
|
31359
31671
|
tracer: tracer
|
|
31360
31672
|
)
|
|
31361
31673
|
context[:gem_name] = 'aws-sdk-sagemaker'
|
|
31362
|
-
context[:gem_version] = '1.339.0'
|
|
31674
|
+
context[:gem_version] = '1.341.0'
|
|
31363
31675
|
Seahorse::Client::Request.new(handlers, context)
|
|
31364
31676
|
end
|
|
31365
31677
|
|