aws-sdk-sagemaker 1.339.0 → 1.340.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/CHANGELOG.md +5 -0
- data/VERSION +1 -1
- data/lib/aws-sdk-sagemaker/client.rb +226 -6
- data/lib/aws-sdk-sagemaker/client_api.rb +103 -0
- data/lib/aws-sdk-sagemaker/types.rb +403 -7
- data/lib/aws-sdk-sagemaker.rb +1 -1
- data/sig/client.rbs +42 -4
- data/sig/types.rbs +70 -4
- metadata +1 -1
checksums.yaml
CHANGED
|
@@ -1,7 +1,7 @@
|
|
|
1
1
|
---
|
|
2
2
|
SHA256:
|
|
3
|
-
metadata.gz:
|
|
4
|
-
data.tar.gz:
|
|
3
|
+
metadata.gz: f760b6f6d6902ca08349489fe9e34c577365953a32aa2f031a4db9e67aa9cb08
|
|
4
|
+
data.tar.gz: 5d01231c9d2c1d978d56deee398fb98fe79da54085d362172671724d6bce3233
|
|
5
5
|
SHA512:
|
|
6
|
-
metadata.gz:
|
|
7
|
-
data.tar.gz:
|
|
6
|
+
metadata.gz: a658467635f982e5e53c0cd5a428c96d8f17acb120d16c31184b8ac8ddd2f21c9062c41e6df84610f95227118ae6de6a47053642188e8ed29208e2d44cfa5863
|
|
7
|
+
data.tar.gz: ec789fc4a9c2d3014b4e19c7a5b628f158fdc8a3b262139e86e44147b83a65107844ac19445d924aa41f1e90791d961c6c1bf8abb2ef19a9de49e6a54e63cba0
|
data/CHANGELOG.md
CHANGED
|
@@ -1,6 +1,11 @@
|
|
|
1
1
|
Unreleased Changes
|
|
2
2
|
------------------
|
|
3
3
|
|
|
4
|
+
1.340.0 (2025-11-20)
|
|
5
|
+
------------------
|
|
6
|
+
|
|
7
|
+
* Feature - Added training plan support for inference endpoints. Added HyperPod task governance with accelerator partition-based quota allocation. Added BatchRebootClusterNodes and BatchReplaceClusterNodes APIs. Updated ListClusterNodes to include privateDnsHostName.
|
|
8
|
+
|
|
4
9
|
1.339.0 (2025-11-19)
|
|
5
10
|
------------------
|
|
6
11
|
|
data/VERSION
CHANGED
|
@@ -1 +1 @@
|
|
|
1
|
-
1.339.0
|
|
1
|
+
1.340.0
|
|
@@ -950,6 +950,209 @@ module Aws::SageMaker
|
|
|
950
950
|
req.send_request(options)
|
|
951
951
|
end
|
|
952
952
|
|
|
953
|
+
# Reboots specific nodes within a SageMaker HyperPod cluster using a
|
|
954
|
+
# soft recovery mechanism. `BatchRebootClusterNodes` performs a graceful
|
|
955
|
+
# reboot of the specified nodes by calling the Amazon Elastic Compute
|
|
956
|
+
# Cloud `RebootInstances` API, which attempts to cleanly shut down the
|
|
957
|
+
# operating system before restarting the instance.
|
|
958
|
+
#
|
|
959
|
+
# This operation is useful for recovering from transient issues or
|
|
960
|
+
# applying certain configuration changes that require a restart.
|
|
961
|
+
#
|
|
962
|
+
# <note markdown="1"> * Rebooting a node may cause temporary service interruption for
|
|
963
|
+
# workloads running on that node. Ensure your workloads can handle
|
|
964
|
+
# node restarts or use appropriate scheduling to minimize impact.
|
|
965
|
+
#
|
|
966
|
+
# * You can reboot up to 25 nodes in a single request.
|
|
967
|
+
#
|
|
968
|
+
# * For SageMaker HyperPod clusters using the Slurm workload manager,
|
|
969
|
+
# ensure rebooting nodes will not disrupt critical cluster operations.
|
|
970
|
+
#
|
|
971
|
+
# </note>
|
|
972
|
+
#
|
|
973
|
+
# @option params [required, String] :cluster_name
|
|
974
|
+
# The name or Amazon Resource Name (ARN) of the SageMaker HyperPod
|
|
975
|
+
# cluster containing the nodes to reboot.
|
|
976
|
+
#
|
|
977
|
+
# @option params [Array<String>] :node_ids
|
|
978
|
+
# A list of EC2 instance IDs to reboot using soft recovery. You can
|
|
979
|
+
# specify between 1 and 25 instance IDs.
|
|
980
|
+
#
|
|
981
|
+
# <note markdown="1"> * Either `NodeIds` or `NodeLogicalIds` must be provided (or both), but
|
|
982
|
+
# at least one is required.
|
|
983
|
+
#
|
|
984
|
+
# * Each instance ID must follow the pattern `i-` followed by 17
|
|
985
|
+
# hexadecimal characters (for example, `i-0123456789abcdef0`).
|
|
986
|
+
#
|
|
987
|
+
# </note>
|
|
988
|
+
#
|
|
989
|
+
# @option params [Array<String>] :node_logical_ids
|
|
990
|
+
# A list of logical node IDs to reboot using soft recovery. You can
|
|
991
|
+
# specify between 1 and 25 logical node IDs.
|
|
992
|
+
#
|
|
993
|
+
# The `NodeLogicalId` is a unique identifier that persists throughout
|
|
994
|
+
# the node's lifecycle and can be used to track nodes that are still
|
|
995
|
+
# being provisioned and don't yet have an EC2 instance ID assigned.
|
|
996
|
+
#
|
|
997
|
+
# * This parameter is only supported for clusters using `Continuous` as
|
|
998
|
+
# the `NodeProvisioningMode`. For clusters using the default
|
|
999
|
+
# provisioning mode, use `NodeIds` instead.
|
|
1000
|
+
#
|
|
1001
|
+
# * Either `NodeIds` or `NodeLogicalIds` must be provided (or both), but
|
|
1002
|
+
# at least one is required.
|
|
1003
|
+
#
|
|
1004
|
+
# @return [Types::BatchRebootClusterNodesResponse] Returns a {Seahorse::Client::Response response} object which responds to the following methods:
|
|
1005
|
+
#
|
|
1006
|
+
# * {Types::BatchRebootClusterNodesResponse#successful #successful} => Array<String>
|
|
1007
|
+
# * {Types::BatchRebootClusterNodesResponse#failed #failed} => Array<Types::BatchRebootClusterNodesError>
|
|
1008
|
+
# * {Types::BatchRebootClusterNodesResponse#failed_node_logical_ids #failed_node_logical_ids} => Array<Types::BatchRebootClusterNodeLogicalIdsError>
|
|
1009
|
+
# * {Types::BatchRebootClusterNodesResponse#successful_node_logical_ids #successful_node_logical_ids} => Array<String>
|
|
1010
|
+
#
|
|
1011
|
+
# @example Request syntax with placeholder values
|
|
1012
|
+
#
|
|
1013
|
+
# resp = client.batch_reboot_cluster_nodes({
|
|
1014
|
+
# cluster_name: "ClusterNameOrArn", # required
|
|
1015
|
+
# node_ids: ["ClusterNodeId"],
|
|
1016
|
+
# node_logical_ids: ["ClusterNodeLogicalId"],
|
|
1017
|
+
# })
|
|
1018
|
+
#
|
|
1019
|
+
# @example Response structure
|
|
1020
|
+
#
|
|
1021
|
+
# resp.successful #=> Array
|
|
1022
|
+
# resp.successful[0] #=> String
|
|
1023
|
+
# resp.failed #=> Array
|
|
1024
|
+
# resp.failed[0].node_id #=> String
|
|
1025
|
+
# resp.failed[0].error_code #=> String, one of "InstanceIdNotFound", "InvalidInstanceStatus", "InstanceIdInUse", "InternalServerError"
|
|
1026
|
+
# resp.failed[0].message #=> String
|
|
1027
|
+
# resp.failed_node_logical_ids #=> Array
|
|
1028
|
+
# resp.failed_node_logical_ids[0].node_logical_id #=> String
|
|
1029
|
+
# resp.failed_node_logical_ids[0].error_code #=> String, one of "InstanceIdNotFound", "InvalidInstanceStatus", "InstanceIdInUse", "InternalServerError"
|
|
1030
|
+
# resp.failed_node_logical_ids[0].message #=> String
|
|
1031
|
+
# resp.successful_node_logical_ids #=> Array
|
|
1032
|
+
# resp.successful_node_logical_ids[0] #=> String
|
|
1033
|
+
#
|
|
1034
|
+
# @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/BatchRebootClusterNodes AWS API Documentation
|
|
1035
|
+
#
|
|
1036
|
+
# @overload batch_reboot_cluster_nodes(params = {})
|
|
1037
|
+
# @param [Hash] params ({})
|
|
1038
|
+
def batch_reboot_cluster_nodes(params = {}, options = {})
|
|
1039
|
+
req = build_request(:batch_reboot_cluster_nodes, params)
|
|
1040
|
+
req.send_request(options)
|
|
1041
|
+
end
|
|
1042
|
+
|
|
1043
|
+
# Replaces specific nodes within a SageMaker HyperPod cluster with new
|
|
1044
|
+
# hardware. `BatchReplaceClusterNodes` terminates the specified
|
|
1045
|
+
# instances and provisions new replacement instances with the same
|
|
1046
|
+
# configuration but fresh hardware. The Amazon Machine Image (AMI) and
|
|
1047
|
+
# instance configuration remain the same.
|
|
1048
|
+
#
|
|
1049
|
+
# This operation is useful for recovering from hardware failures or
|
|
1050
|
+
# persistent issues that cannot be resolved through a reboot.
|
|
1051
|
+
#
|
|
1052
|
+
# * **Data Loss Warning:** Replacing nodes destroys all instance
|
|
1053
|
+
# volumes, including both root and secondary volumes. All data stored
|
|
1054
|
+
# on these volumes will be permanently lost and cannot be recovered.
|
|
1055
|
+
#
|
|
1056
|
+
# * To safeguard your work, back up your data to Amazon S3 or an FSx for
|
|
1057
|
+
# Lustre file system before invoking the API on a worker node group.
|
|
1058
|
+
# This will help prevent any potential data loss from the instance
|
|
1059
|
+
# root volume. For more information about backup, see [Use the backup
|
|
1060
|
+
# script provided by SageMaker HyperPod][1].
|
|
1061
|
+
#
|
|
1062
|
+
# * If you want to invoke this API on an existing cluster, you'll first
|
|
1063
|
+
# need to patch the cluster by running the [UpdateClusterSoftware
|
|
1064
|
+
# API][2]. For more information about patching a cluster, see [Update
|
|
1065
|
+
# the SageMaker HyperPod platform software of a cluster][3].
|
|
1066
|
+
#
|
|
1067
|
+
# * You can replace up to 25 nodes in a single request.
|
|
1068
|
+
#
|
|
1069
|
+
#
|
|
1070
|
+
#
|
|
1071
|
+
# [1]: https://docs.aws.amazon.com/sagemaker/latest/dg/sagemaker-hyperpod-operate-cli-command.html#sagemaker-hyperpod-operate-cli-command-update-cluster-software-backup
|
|
1072
|
+
# [2]: https://docs.aws.amazon.com/sagemaker/latest/APIReference/API_UpdateClusterSoftware.html
|
|
1073
|
+
# [3]: https://docs.aws.amazon.com/sagemaker/latest/dg/sagemaker-hyperpod-operate-cli-command.html#sagemaker-hyperpod-operate-cli-command-update-cluster-software
|
|
1074
|
+
#
|
|
1075
|
+
# @option params [required, String] :cluster_name
|
|
1076
|
+
# The name or Amazon Resource Name (ARN) of the SageMaker HyperPod
|
|
1077
|
+
# cluster containing the nodes to replace.
|
|
1078
|
+
#
|
|
1079
|
+
# @option params [Array<String>] :node_ids
|
|
1080
|
+
# A list of EC2 instance IDs to replace with new hardware. You can
|
|
1081
|
+
# specify between 1 and 25 instance IDs.
|
|
1082
|
+
#
|
|
1083
|
+
# Replace operations destroy all instance volumes (root and secondary).
|
|
1084
|
+
# Ensure you have backed up any important data before proceeding.
|
|
1085
|
+
#
|
|
1086
|
+
# <note markdown="1"> * Either `NodeIds` or `NodeLogicalIds` must be provided (or both), but
|
|
1087
|
+
# at least one is required.
|
|
1088
|
+
#
|
|
1089
|
+
# * Each instance ID must follow the pattern `i-` followed by 17
|
|
1090
|
+
# hexadecimal characters (for example, `i-0123456789abcdef0`).
|
|
1091
|
+
#
|
|
1092
|
+
# * For SageMaker HyperPod clusters using the Slurm workload manager,
|
|
1093
|
+
# you cannot replace instances that are configured as Slurm controller
|
|
1094
|
+
# nodes.
|
|
1095
|
+
#
|
|
1096
|
+
# </note>
|
|
1097
|
+
#
|
|
1098
|
+
# @option params [Array<String>] :node_logical_ids
|
|
1099
|
+
# A list of logical node IDs to replace with new hardware. You can
|
|
1100
|
+
# specify between 1 and 25 logical node IDs.
|
|
1101
|
+
#
|
|
1102
|
+
# The `NodeLogicalId` is a unique identifier that persists throughout
|
|
1103
|
+
# the node's lifecycle and can be used to track nodes that are still
|
|
1104
|
+
# being provisioned and don't yet have an EC2 instance ID assigned.
|
|
1105
|
+
#
|
|
1106
|
+
# * Replace operations destroy all instance volumes (root and
|
|
1107
|
+
# secondary). Ensure you have backed up any important data before
|
|
1108
|
+
# proceeding.
|
|
1109
|
+
#
|
|
1110
|
+
# * This parameter is only supported for clusters using `Continuous` as
|
|
1111
|
+
# the `NodeProvisioningMode`. For clusters using the default
|
|
1112
|
+
# provisioning mode, use `NodeIds` instead.
|
|
1113
|
+
#
|
|
1114
|
+
# * Either `NodeIds` or `NodeLogicalIds` must be provided (or both), but
|
|
1115
|
+
# at least one is required.
|
|
1116
|
+
#
|
|
1117
|
+
# @return [Types::BatchReplaceClusterNodesResponse] Returns a {Seahorse::Client::Response response} object which responds to the following methods:
|
|
1118
|
+
#
|
|
1119
|
+
# * {Types::BatchReplaceClusterNodesResponse#successful #successful} => Array<String>
|
|
1120
|
+
# * {Types::BatchReplaceClusterNodesResponse#failed #failed} => Array<Types::BatchReplaceClusterNodesError>
|
|
1121
|
+
# * {Types::BatchReplaceClusterNodesResponse#failed_node_logical_ids #failed_node_logical_ids} => Array<Types::BatchReplaceClusterNodeLogicalIdsError>
|
|
1122
|
+
# * {Types::BatchReplaceClusterNodesResponse#successful_node_logical_ids #successful_node_logical_ids} => Array<String>
|
|
1123
|
+
#
|
|
1124
|
+
# @example Request syntax with placeholder values
|
|
1125
|
+
#
|
|
1126
|
+
# resp = client.batch_replace_cluster_nodes({
|
|
1127
|
+
# cluster_name: "ClusterNameOrArn", # required
|
|
1128
|
+
# node_ids: ["ClusterNodeId"],
|
|
1129
|
+
# node_logical_ids: ["ClusterNodeLogicalId"],
|
|
1130
|
+
# })
|
|
1131
|
+
#
|
|
1132
|
+
# @example Response structure
|
|
1133
|
+
#
|
|
1134
|
+
# resp.successful #=> Array
|
|
1135
|
+
# resp.successful[0] #=> String
|
|
1136
|
+
# resp.failed #=> Array
|
|
1137
|
+
# resp.failed[0].node_id #=> String
|
|
1138
|
+
# resp.failed[0].error_code #=> String, one of "InstanceIdNotFound", "InvalidInstanceStatus", "InstanceIdInUse", "InternalServerError"
|
|
1139
|
+
# resp.failed[0].message #=> String
|
|
1140
|
+
# resp.failed_node_logical_ids #=> Array
|
|
1141
|
+
# resp.failed_node_logical_ids[0].node_logical_id #=> String
|
|
1142
|
+
# resp.failed_node_logical_ids[0].error_code #=> String, one of "InstanceIdNotFound", "InvalidInstanceStatus", "InstanceIdInUse", "InternalServerError"
|
|
1143
|
+
# resp.failed_node_logical_ids[0].message #=> String
|
|
1144
|
+
# resp.successful_node_logical_ids #=> Array
|
|
1145
|
+
# resp.successful_node_logical_ids[0] #=> String
|
|
1146
|
+
#
|
|
1147
|
+
# @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/BatchReplaceClusterNodes AWS API Documentation
|
|
1148
|
+
#
|
|
1149
|
+
# @overload batch_replace_cluster_nodes(params = {})
|
|
1150
|
+
# @param [Hash] params ({})
|
|
1151
|
+
def batch_replace_cluster_nodes(params = {}, options = {})
|
|
1152
|
+
req = build_request(:batch_replace_cluster_nodes, params)
|
|
1153
|
+
req.send_request(options)
|
|
1154
|
+
end
|
|
1155
|
+
|
|
953
1156
|
# Creates an *action*. An action is a lineage tracking entity that
|
|
954
1157
|
# represents an action or activity. For example, a model deployment or
|
|
955
1158
|
# an HPO job. Generally, an action involves at least one input or output
|
|
@@ -2725,6 +2928,10 @@ module Aws::SageMaker
|
|
|
2725
2928
|
# accelerators: 1,
|
|
2726
2929
|
# v_cpu: 1.0,
|
|
2727
2930
|
# memory_in_gi_b: 1.0,
|
|
2931
|
+
# accelerator_partition: {
|
|
2932
|
+
# type: "mig-1g.5gb", # required, accepts mig-1g.5gb, mig-1g.10gb, mig-1g.18gb, mig-1g.20gb, mig-1g.23gb, mig-1g.35gb, mig-1g.45gb, mig-1g.47gb, mig-2g.10gb, mig-2g.20gb, mig-2g.35gb, mig-2g.45gb, mig-2g.47gb, mig-3g.20gb, mig-3g.40gb, mig-3g.71gb, mig-3g.90gb, mig-3g.93gb, mig-4g.20gb, mig-4g.40gb, mig-4g.71gb, mig-4g.90gb, mig-4g.93gb, mig-7g.40gb, mig-7g.80gb, mig-7g.141gb, mig-7g.180gb, mig-7g.186gb
|
|
2933
|
+
# count: 1, # required
|
|
2934
|
+
# },
|
|
2728
2935
|
# },
|
|
2729
2936
|
# ],
|
|
2730
2937
|
# resource_sharing_config: {
|
|
@@ -13912,6 +14119,8 @@ module Aws::SageMaker
|
|
|
13912
14119
|
# resp.compute_quota_config.compute_quota_resources[0].accelerators #=> Integer
|
|
13913
14120
|
# resp.compute_quota_config.compute_quota_resources[0].v_cpu #=> Float
|
|
13914
14121
|
# resp.compute_quota_config.compute_quota_resources[0].memory_in_gi_b #=> Float
|
|
14122
|
+
# resp.compute_quota_config.compute_quota_resources[0].accelerator_partition.type #=> String, one of "mig-1g.5gb", "mig-1g.10gb", "mig-1g.18gb", "mig-1g.20gb", "mig-1g.23gb", "mig-1g.35gb", "mig-1g.45gb", "mig-1g.47gb", "mig-2g.10gb", "mig-2g.20gb", "mig-2g.35gb", "mig-2g.45gb", "mig-2g.47gb", "mig-3g.20gb", "mig-3g.40gb", "mig-3g.71gb", "mig-3g.90gb", "mig-3g.93gb", "mig-4g.20gb", "mig-4g.40gb", "mig-4g.71gb", "mig-4g.90gb", "mig-4g.93gb", "mig-7g.40gb", "mig-7g.80gb", "mig-7g.141gb", "mig-7g.180gb", "mig-7g.186gb"
|
|
14123
|
+
# resp.compute_quota_config.compute_quota_resources[0].accelerator_partition.count #=> Integer
|
|
13915
14124
|
# resp.compute_quota_config.resource_sharing_config.strategy #=> String, one of "Lend", "DontLend", "LendAndBorrow"
|
|
13916
14125
|
# resp.compute_quota_config.resource_sharing_config.borrow_limit #=> Integer
|
|
13917
14126
|
# resp.compute_quota_config.preempt_team_tasks #=> String, one of "Never", "LowerPriority"
|
|
@@ -18411,7 +18620,7 @@ module Aws::SageMaker
|
|
|
18411
18620
|
# resp.available_spare_instance_count #=> Integer
|
|
18412
18621
|
# resp.total_ultra_server_count #=> Integer
|
|
18413
18622
|
# resp.target_resources #=> Array
|
|
18414
|
-
# resp.target_resources[0] #=> String, one of "training-job", "hyperpod-cluster"
|
|
18623
|
+
# resp.target_resources[0] #=> String, one of "training-job", "hyperpod-cluster", "endpoint"
|
|
18415
18624
|
# resp.reserved_capacity_summaries #=> Array
|
|
18416
18625
|
# resp.reserved_capacity_summaries[0].reserved_capacity_arn #=> String
|
|
18417
18626
|
# resp.reserved_capacity_summaries[0].reserved_capacity_type #=> String, one of "UltraServer", "Instance"
|
|
@@ -20350,6 +20559,7 @@ module Aws::SageMaker
|
|
|
20350
20559
|
# resp.cluster_node_summaries[0].instance_status.status #=> String, one of "Running", "Failure", "Pending", "ShuttingDown", "SystemUpdating", "DeepHealthCheckInProgress", "NotFound"
|
|
20351
20560
|
# resp.cluster_node_summaries[0].instance_status.message #=> String
|
|
20352
20561
|
# resp.cluster_node_summaries[0].ultra_server_info.id #=> String
|
|
20562
|
+
# resp.cluster_node_summaries[0].private_dns_hostname #=> String
|
|
20353
20563
|
#
|
|
20354
20564
|
# @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/ListClusterNodes AWS API Documentation
|
|
20355
20565
|
#
|
|
@@ -20813,6 +21023,8 @@ module Aws::SageMaker
|
|
|
20813
21023
|
# resp.compute_quota_summaries[0].compute_quota_config.compute_quota_resources[0].accelerators #=> Integer
|
|
20814
21024
|
# resp.compute_quota_summaries[0].compute_quota_config.compute_quota_resources[0].v_cpu #=> Float
|
|
20815
21025
|
# resp.compute_quota_summaries[0].compute_quota_config.compute_quota_resources[0].memory_in_gi_b #=> Float
|
|
21026
|
+
# resp.compute_quota_summaries[0].compute_quota_config.compute_quota_resources[0].accelerator_partition.type #=> String, one of "mig-1g.5gb", "mig-1g.10gb", "mig-1g.18gb", "mig-1g.20gb", "mig-1g.23gb", "mig-1g.35gb", "mig-1g.45gb", "mig-1g.47gb", "mig-2g.10gb", "mig-2g.20gb", "mig-2g.35gb", "mig-2g.45gb", "mig-2g.47gb", "mig-3g.20gb", "mig-3g.40gb", "mig-3g.71gb", "mig-3g.90gb", "mig-3g.93gb", "mig-4g.20gb", "mig-4g.40gb", "mig-4g.71gb", "mig-4g.90gb", "mig-4g.93gb", "mig-7g.40gb", "mig-7g.80gb", "mig-7g.141gb", "mig-7g.180gb", "mig-7g.186gb"
|
|
21027
|
+
# resp.compute_quota_summaries[0].compute_quota_config.compute_quota_resources[0].accelerator_partition.count #=> Integer
|
|
20816
21028
|
# resp.compute_quota_summaries[0].compute_quota_config.resource_sharing_config.strategy #=> String, one of "Lend", "DontLend", "LendAndBorrow"
|
|
20817
21029
|
# resp.compute_quota_summaries[0].compute_quota_config.resource_sharing_config.borrow_limit #=> Integer
|
|
20818
21030
|
# resp.compute_quota_summaries[0].compute_quota_config.preempt_team_tasks #=> String, one of "Never", "LowerPriority"
|
|
@@ -25460,7 +25672,7 @@ module Aws::SageMaker
|
|
|
25460
25672
|
# resp.training_plan_summaries[0].in_use_instance_count #=> Integer
|
|
25461
25673
|
# resp.training_plan_summaries[0].total_ultra_server_count #=> Integer
|
|
25462
25674
|
# resp.training_plan_summaries[0].target_resources #=> Array
|
|
25463
|
-
# resp.training_plan_summaries[0].target_resources[0] #=> String, one of "training-job", "hyperpod-cluster"
|
|
25675
|
+
# resp.training_plan_summaries[0].target_resources[0] #=> String, one of "training-job", "hyperpod-cluster", "endpoint"
|
|
25464
25676
|
# resp.training_plan_summaries[0].reserved_capacity_summaries #=> Array
|
|
25465
25677
|
# resp.training_plan_summaries[0].reserved_capacity_summaries[0].reserved_capacity_arn #=> String
|
|
25466
25678
|
# resp.training_plan_summaries[0].reserved_capacity_summaries[0].reserved_capacity_type #=> String, one of "UltraServer", "Instance"
|
|
@@ -26481,7 +26693,7 @@ module Aws::SageMaker
|
|
|
26481
26693
|
#
|
|
26482
26694
|
# @option params [required, Array<String>] :target_resources
|
|
26483
26695
|
# The target resources (e.g., SageMaker Training Jobs, SageMaker
|
|
26484
|
-
# HyperPod) to search for in the offerings.
|
|
26696
|
+
# HyperPod, SageMaker Endpoints) to search for in the offerings.
|
|
26485
26697
|
#
|
|
26486
26698
|
# Training plans are specific to their target resource.
|
|
26487
26699
|
#
|
|
@@ -26491,6 +26703,10 @@ module Aws::SageMaker
|
|
|
26491
26703
|
# * A training plan for HyperPod clusters can be used exclusively to
|
|
26492
26704
|
# provide compute resources to a cluster's instance group.
|
|
26493
26705
|
#
|
|
26706
|
+
# * A training plan for SageMaker endpoints can be used exclusively to
|
|
26707
|
+
# provide compute resources to SageMaker endpoints for model
|
|
26708
|
+
# deployment.
|
|
26709
|
+
#
|
|
26494
26710
|
# @return [Types::SearchTrainingPlanOfferingsResponse] Returns a {Seahorse::Client::Response response} object which responds to the following methods:
|
|
26495
26711
|
#
|
|
26496
26712
|
# * {Types::SearchTrainingPlanOfferingsResponse#training_plan_offerings #training_plan_offerings} => Array<Types::TrainingPlanOffering>
|
|
@@ -26505,7 +26721,7 @@ module Aws::SageMaker
|
|
|
26505
26721
|
# start_time_after: Time.now,
|
|
26506
26722
|
# end_time_before: Time.now,
|
|
26507
26723
|
# duration_hours: 1, # required
|
|
26508
|
-
# target_resources: ["training-job"], # required, accepts training-job, hyperpod-cluster
|
|
26724
|
+
# target_resources: ["training-job"], # required, accepts training-job, hyperpod-cluster, endpoint
|
|
26509
26725
|
# })
|
|
26510
26726
|
#
|
|
26511
26727
|
# @example Response structure
|
|
@@ -26513,7 +26729,7 @@ module Aws::SageMaker
|
|
|
26513
26729
|
# resp.training_plan_offerings #=> Array
|
|
26514
26730
|
# resp.training_plan_offerings[0].training_plan_offering_id #=> String
|
|
26515
26731
|
# resp.training_plan_offerings[0].target_resources #=> Array
|
|
26516
|
-
# resp.training_plan_offerings[0].target_resources[0] #=> String, one of "training-job", "hyperpod-cluster"
|
|
26732
|
+
# resp.training_plan_offerings[0].target_resources[0] #=> String, one of "training-job", "hyperpod-cluster", "endpoint"
|
|
26517
26733
|
# resp.training_plan_offerings[0].requested_start_time_after #=> Time
|
|
26518
26734
|
# resp.training_plan_offerings[0].requested_end_time_before #=> Time
|
|
26519
26735
|
# resp.training_plan_offerings[0].duration_hours #=> Integer
|
|
@@ -27951,6 +28167,10 @@ module Aws::SageMaker
|
|
|
27951
28167
|
# accelerators: 1,
|
|
27952
28168
|
# v_cpu: 1.0,
|
|
27953
28169
|
# memory_in_gi_b: 1.0,
|
|
28170
|
+
# accelerator_partition: {
|
|
28171
|
+
# type: "mig-1g.5gb", # required, accepts mig-1g.5gb, mig-1g.10gb, mig-1g.18gb, mig-1g.20gb, mig-1g.23gb, mig-1g.35gb, mig-1g.45gb, mig-1g.47gb, mig-2g.10gb, mig-2g.20gb, mig-2g.35gb, mig-2g.45gb, mig-2g.47gb, mig-3g.20gb, mig-3g.40gb, mig-3g.71gb, mig-3g.90gb, mig-3g.93gb, mig-4g.20gb, mig-4g.40gb, mig-4g.71gb, mig-4g.90gb, mig-4g.93gb, mig-7g.40gb, mig-7g.80gb, mig-7g.141gb, mig-7g.180gb, mig-7g.186gb
|
|
28172
|
+
# count: 1, # required
|
|
28173
|
+
# },
|
|
27954
28174
|
# },
|
|
27955
28175
|
# ],
|
|
27956
28176
|
# resource_sharing_config: {
|
|
@@ -31359,7 +31579,7 @@ module Aws::SageMaker
|
|
|
31359
31579
|
tracer: tracer
|
|
31360
31580
|
)
|
|
31361
31581
|
context[:gem_name] = 'aws-sdk-sagemaker'
|
|
31362
|
-
context[:gem_version] = '1.339.0'
|
|
31582
|
+
context[:gem_version] = '1.340.0'
|
|
31363
31583
|
Seahorse::Client::Request.new(handlers, context)
|
|
31364
31584
|
end
|
|
31365
31585
|
|
|
@@ -14,6 +14,8 @@ module Aws::SageMaker
|
|
|
14
14
|
|
|
15
15
|
include Seahorse::Model
|
|
16
16
|
|
|
17
|
+
AcceleratorPartitionConfig = Shapes::StructureShape.new(name: 'AcceleratorPartitionConfig')
|
|
18
|
+
AcceleratorPartitionConfigCountInteger = Shapes::IntegerShape.new(name: 'AcceleratorPartitionConfigCountInteger')
|
|
17
19
|
AcceleratorsAmount = Shapes::IntegerShape.new(name: 'AcceleratorsAmount')
|
|
18
20
|
Accept = Shapes::StringShape.new(name: 'Accept')
|
|
19
21
|
AcceptEula = Shapes::BooleanShape.new(name: 'AcceptEula')
|
|
@@ -211,6 +213,24 @@ module Aws::SageMaker
|
|
|
211
213
|
BatchDescribeModelPackageInput = Shapes::StructureShape.new(name: 'BatchDescribeModelPackageInput')
|
|
212
214
|
BatchDescribeModelPackageOutput = Shapes::StructureShape.new(name: 'BatchDescribeModelPackageOutput')
|
|
213
215
|
BatchDescribeModelPackageSummary = Shapes::StructureShape.new(name: 'BatchDescribeModelPackageSummary')
|
|
216
|
+
BatchRebootClusterNodeLogicalIdsError = Shapes::StructureShape.new(name: 'BatchRebootClusterNodeLogicalIdsError')
|
|
217
|
+
BatchRebootClusterNodeLogicalIdsErrors = Shapes::ListShape.new(name: 'BatchRebootClusterNodeLogicalIdsErrors')
|
|
218
|
+
BatchRebootClusterNodesError = Shapes::StructureShape.new(name: 'BatchRebootClusterNodesError')
|
|
219
|
+
BatchRebootClusterNodesErrorCode = Shapes::StringShape.new(name: 'BatchRebootClusterNodesErrorCode')
|
|
220
|
+
BatchRebootClusterNodesErrors = Shapes::ListShape.new(name: 'BatchRebootClusterNodesErrors')
|
|
221
|
+
BatchRebootClusterNodesRequest = Shapes::StructureShape.new(name: 'BatchRebootClusterNodesRequest')
|
|
222
|
+
BatchRebootClusterNodesRequestNodeIdsList = Shapes::ListShape.new(name: 'BatchRebootClusterNodesRequestNodeIdsList')
|
|
223
|
+
BatchRebootClusterNodesRequestNodeLogicalIdsList = Shapes::ListShape.new(name: 'BatchRebootClusterNodesRequestNodeLogicalIdsList')
|
|
224
|
+
BatchRebootClusterNodesResponse = Shapes::StructureShape.new(name: 'BatchRebootClusterNodesResponse')
|
|
225
|
+
BatchReplaceClusterNodeLogicalIdsError = Shapes::StructureShape.new(name: 'BatchReplaceClusterNodeLogicalIdsError')
|
|
226
|
+
BatchReplaceClusterNodeLogicalIdsErrors = Shapes::ListShape.new(name: 'BatchReplaceClusterNodeLogicalIdsErrors')
|
|
227
|
+
BatchReplaceClusterNodesError = Shapes::StructureShape.new(name: 'BatchReplaceClusterNodesError')
|
|
228
|
+
BatchReplaceClusterNodesErrorCode = Shapes::StringShape.new(name: 'BatchReplaceClusterNodesErrorCode')
|
|
229
|
+
BatchReplaceClusterNodesErrors = Shapes::ListShape.new(name: 'BatchReplaceClusterNodesErrors')
|
|
230
|
+
BatchReplaceClusterNodesRequest = Shapes::StructureShape.new(name: 'BatchReplaceClusterNodesRequest')
|
|
231
|
+
BatchReplaceClusterNodesRequestNodeIdsList = Shapes::ListShape.new(name: 'BatchReplaceClusterNodesRequestNodeIdsList')
|
|
232
|
+
BatchReplaceClusterNodesRequestNodeLogicalIdsList = Shapes::ListShape.new(name: 'BatchReplaceClusterNodesRequestNodeLogicalIdsList')
|
|
233
|
+
BatchReplaceClusterNodesResponse = Shapes::StructureShape.new(name: 'BatchReplaceClusterNodesResponse')
|
|
214
234
|
BatchStrategy = Shapes::StringShape.new(name: 'BatchStrategy')
|
|
215
235
|
BatchTransformInput = Shapes::StructureShape.new(name: 'BatchTransformInput')
|
|
216
236
|
BestObjectiveNotImproving = Shapes::StructureShape.new(name: 'BestObjectiveNotImproving')
|
|
@@ -1569,6 +1589,7 @@ module Aws::SageMaker
|
|
|
1569
1589
|
LocalPath = Shapes::StringShape.new(name: 'LocalPath')
|
|
1570
1590
|
Long = Shapes::IntegerShape.new(name: 'Long')
|
|
1571
1591
|
LongS3Uri = Shapes::StringShape.new(name: 'LongS3Uri')
|
|
1592
|
+
MIGProfileType = Shapes::StringShape.new(name: 'MIGProfileType')
|
|
1572
1593
|
MLFramework = Shapes::StringShape.new(name: 'MLFramework')
|
|
1573
1594
|
MajorMinorVersion = Shapes::StringShape.new(name: 'MajorMinorVersion')
|
|
1574
1595
|
ManagedInstanceScalingMaxInstanceCount = Shapes::IntegerShape.new(name: 'ManagedInstanceScalingMaxInstanceCount')
|
|
@@ -2708,6 +2729,10 @@ module Aws::SageMaker
|
|
|
2708
2729
|
WorkteamName = Shapes::StringShape.new(name: 'WorkteamName')
|
|
2709
2730
|
Workteams = Shapes::ListShape.new(name: 'Workteams')
|
|
2710
2731
|
|
|
2732
|
+
AcceleratorPartitionConfig.add_member(:type, Shapes::ShapeRef.new(shape: MIGProfileType, required: true, location_name: "Type"))
|
|
2733
|
+
AcceleratorPartitionConfig.add_member(:count, Shapes::ShapeRef.new(shape: AcceleratorPartitionConfigCountInteger, required: true, location_name: "Count", metadata: {"box" => true}))
|
|
2734
|
+
AcceleratorPartitionConfig.struct_class = Types::AcceleratorPartitionConfig
|
|
2735
|
+
|
|
2711
2736
|
ActionSource.add_member(:source_uri, Shapes::ShapeRef.new(shape: SourceUri, required: true, location_name: "SourceUri"))
|
|
2712
2737
|
ActionSource.add_member(:source_type, Shapes::ShapeRef.new(shape: String256, location_name: "SourceType"))
|
|
2713
2738
|
ActionSource.add_member(:source_id, Shapes::ShapeRef.new(shape: String256, location_name: "SourceId"))
|
|
@@ -3210,6 +3235,64 @@ module Aws::SageMaker
|
|
|
3210
3235
|
BatchDescribeModelPackageSummary.add_member(:model_approval_status, Shapes::ShapeRef.new(shape: ModelApprovalStatus, location_name: "ModelApprovalStatus"))
|
|
3211
3236
|
BatchDescribeModelPackageSummary.struct_class = Types::BatchDescribeModelPackageSummary
|
|
3212
3237
|
|
|
3238
|
+
BatchRebootClusterNodeLogicalIdsError.add_member(:node_logical_id, Shapes::ShapeRef.new(shape: ClusterNodeLogicalId, required: true, location_name: "NodeLogicalId"))
|
|
3239
|
+
BatchRebootClusterNodeLogicalIdsError.add_member(:error_code, Shapes::ShapeRef.new(shape: BatchRebootClusterNodesErrorCode, required: true, location_name: "ErrorCode"))
|
|
3240
|
+
BatchRebootClusterNodeLogicalIdsError.add_member(:message, Shapes::ShapeRef.new(shape: String, required: true, location_name: "Message"))
|
|
3241
|
+
BatchRebootClusterNodeLogicalIdsError.struct_class = Types::BatchRebootClusterNodeLogicalIdsError
|
|
3242
|
+
|
|
3243
|
+
BatchRebootClusterNodeLogicalIdsErrors.member = Shapes::ShapeRef.new(shape: BatchRebootClusterNodeLogicalIdsError)
|
|
3244
|
+
|
|
3245
|
+
BatchRebootClusterNodesError.add_member(:node_id, Shapes::ShapeRef.new(shape: ClusterNodeId, required: true, location_name: "NodeId"))
|
|
3246
|
+
BatchRebootClusterNodesError.add_member(:error_code, Shapes::ShapeRef.new(shape: BatchRebootClusterNodesErrorCode, required: true, location_name: "ErrorCode"))
|
|
3247
|
+
BatchRebootClusterNodesError.add_member(:message, Shapes::ShapeRef.new(shape: String, required: true, location_name: "Message"))
|
|
3248
|
+
BatchRebootClusterNodesError.struct_class = Types::BatchRebootClusterNodesError
|
|
3249
|
+
|
|
3250
|
+
BatchRebootClusterNodesErrors.member = Shapes::ShapeRef.new(shape: BatchRebootClusterNodesError)
|
|
3251
|
+
|
|
3252
|
+
BatchRebootClusterNodesRequest.add_member(:cluster_name, Shapes::ShapeRef.new(shape: ClusterNameOrArn, required: true, location_name: "ClusterName"))
|
|
3253
|
+
BatchRebootClusterNodesRequest.add_member(:node_ids, Shapes::ShapeRef.new(shape: BatchRebootClusterNodesRequestNodeIdsList, location_name: "NodeIds"))
|
|
3254
|
+
BatchRebootClusterNodesRequest.add_member(:node_logical_ids, Shapes::ShapeRef.new(shape: BatchRebootClusterNodesRequestNodeLogicalIdsList, location_name: "NodeLogicalIds"))
|
|
3255
|
+
BatchRebootClusterNodesRequest.struct_class = Types::BatchRebootClusterNodesRequest
|
|
3256
|
+
|
|
3257
|
+
BatchRebootClusterNodesRequestNodeIdsList.member = Shapes::ShapeRef.new(shape: ClusterNodeId)
|
|
3258
|
+
|
|
3259
|
+
BatchRebootClusterNodesRequestNodeLogicalIdsList.member = Shapes::ShapeRef.new(shape: ClusterNodeLogicalId)
|
|
3260
|
+
|
|
3261
|
+
BatchRebootClusterNodesResponse.add_member(:successful, Shapes::ShapeRef.new(shape: ClusterNodeIds, location_name: "Successful"))
|
|
3262
|
+
BatchRebootClusterNodesResponse.add_member(:failed, Shapes::ShapeRef.new(shape: BatchRebootClusterNodesErrors, location_name: "Failed"))
|
|
3263
|
+
BatchRebootClusterNodesResponse.add_member(:failed_node_logical_ids, Shapes::ShapeRef.new(shape: BatchRebootClusterNodeLogicalIdsErrors, location_name: "FailedNodeLogicalIds"))
|
|
3264
|
+
BatchRebootClusterNodesResponse.add_member(:successful_node_logical_ids, Shapes::ShapeRef.new(shape: ClusterNodeLogicalIdList, location_name: "SuccessfulNodeLogicalIds"))
|
|
3265
|
+
BatchRebootClusterNodesResponse.struct_class = Types::BatchRebootClusterNodesResponse
|
|
3266
|
+
|
|
3267
|
+
BatchReplaceClusterNodeLogicalIdsError.add_member(:node_logical_id, Shapes::ShapeRef.new(shape: ClusterNodeLogicalId, required: true, location_name: "NodeLogicalId"))
|
|
3268
|
+
BatchReplaceClusterNodeLogicalIdsError.add_member(:error_code, Shapes::ShapeRef.new(shape: BatchReplaceClusterNodesErrorCode, required: true, location_name: "ErrorCode"))
|
|
3269
|
+
BatchReplaceClusterNodeLogicalIdsError.add_member(:message, Shapes::ShapeRef.new(shape: String, required: true, location_name: "Message"))
|
|
3270
|
+
BatchReplaceClusterNodeLogicalIdsError.struct_class = Types::BatchReplaceClusterNodeLogicalIdsError
|
|
3271
|
+
|
|
3272
|
+
BatchReplaceClusterNodeLogicalIdsErrors.member = Shapes::ShapeRef.new(shape: BatchReplaceClusterNodeLogicalIdsError)
|
|
3273
|
+
|
|
3274
|
+
BatchReplaceClusterNodesError.add_member(:node_id, Shapes::ShapeRef.new(shape: ClusterNodeId, required: true, location_name: "NodeId"))
|
|
3275
|
+
BatchReplaceClusterNodesError.add_member(:error_code, Shapes::ShapeRef.new(shape: BatchReplaceClusterNodesErrorCode, required: true, location_name: "ErrorCode"))
|
|
3276
|
+
BatchReplaceClusterNodesError.add_member(:message, Shapes::ShapeRef.new(shape: String, required: true, location_name: "Message"))
|
|
3277
|
+
BatchReplaceClusterNodesError.struct_class = Types::BatchReplaceClusterNodesError
|
|
3278
|
+
|
|
3279
|
+
BatchReplaceClusterNodesErrors.member = Shapes::ShapeRef.new(shape: BatchReplaceClusterNodesError)
|
|
3280
|
+
|
|
3281
|
+
BatchReplaceClusterNodesRequest.add_member(:cluster_name, Shapes::ShapeRef.new(shape: ClusterNameOrArn, required: true, location_name: "ClusterName"))
|
|
3282
|
+
BatchReplaceClusterNodesRequest.add_member(:node_ids, Shapes::ShapeRef.new(shape: BatchReplaceClusterNodesRequestNodeIdsList, location_name: "NodeIds"))
|
|
3283
|
+
BatchReplaceClusterNodesRequest.add_member(:node_logical_ids, Shapes::ShapeRef.new(shape: BatchReplaceClusterNodesRequestNodeLogicalIdsList, location_name: "NodeLogicalIds"))
|
|
3284
|
+
BatchReplaceClusterNodesRequest.struct_class = Types::BatchReplaceClusterNodesRequest
|
|
3285
|
+
|
|
3286
|
+
BatchReplaceClusterNodesRequestNodeIdsList.member = Shapes::ShapeRef.new(shape: ClusterNodeId)
|
|
3287
|
+
|
|
3288
|
+
BatchReplaceClusterNodesRequestNodeLogicalIdsList.member = Shapes::ShapeRef.new(shape: ClusterNodeLogicalId)
|
|
3289
|
+
|
|
3290
|
+
BatchReplaceClusterNodesResponse.add_member(:successful, Shapes::ShapeRef.new(shape: ClusterNodeIds, location_name: "Successful"))
|
|
3291
|
+
BatchReplaceClusterNodesResponse.add_member(:failed, Shapes::ShapeRef.new(shape: BatchReplaceClusterNodesErrors, location_name: "Failed"))
|
|
3292
|
+
BatchReplaceClusterNodesResponse.add_member(:failed_node_logical_ids, Shapes::ShapeRef.new(shape: BatchReplaceClusterNodeLogicalIdsErrors, location_name: "FailedNodeLogicalIds"))
|
|
3293
|
+
BatchReplaceClusterNodesResponse.add_member(:successful_node_logical_ids, Shapes::ShapeRef.new(shape: ClusterNodeLogicalIdList, location_name: "SuccessfulNodeLogicalIds"))
|
|
3294
|
+
BatchReplaceClusterNodesResponse.struct_class = Types::BatchReplaceClusterNodesResponse
|
|
3295
|
+
|
|
3213
3296
|
BatchTransformInput.add_member(:data_captured_destination_s3_uri, Shapes::ShapeRef.new(shape: DestinationS3Uri, required: true, location_name: "DataCapturedDestinationS3Uri"))
|
|
3214
3297
|
BatchTransformInput.add_member(:dataset_format, Shapes::ShapeRef.new(shape: MonitoringDatasetFormat, required: true, location_name: "DatasetFormat"))
|
|
3215
3298
|
BatchTransformInput.add_member(:local_path, Shapes::ShapeRef.new(shape: ProcessingLocalPath, required: true, location_name: "LocalPath"))
|
|
@@ -3561,6 +3644,7 @@ module Aws::SageMaker
|
|
|
3561
3644
|
ClusterNodeSummary.add_member(:last_software_update_time, Shapes::ShapeRef.new(shape: Timestamp, location_name: "LastSoftwareUpdateTime"))
|
|
3562
3645
|
ClusterNodeSummary.add_member(:instance_status, Shapes::ShapeRef.new(shape: ClusterInstanceStatusDetails, required: true, location_name: "InstanceStatus"))
|
|
3563
3646
|
ClusterNodeSummary.add_member(:ultra_server_info, Shapes::ShapeRef.new(shape: UltraServerInfo, location_name: "UltraServerInfo"))
|
|
3647
|
+
ClusterNodeSummary.add_member(:private_dns_hostname, Shapes::ShapeRef.new(shape: ClusterPrivateDnsHostname, location_name: "PrivateDnsHostname"))
|
|
3564
3648
|
ClusterNodeSummary.struct_class = Types::ClusterNodeSummary
|
|
3565
3649
|
|
|
3566
3650
|
ClusterOrchestrator.add_member(:eks, Shapes::ShapeRef.new(shape: ClusterOrchestratorEksConfig, required: true, location_name: "Eks"))
|
|
@@ -3703,6 +3787,7 @@ module Aws::SageMaker
|
|
|
3703
3787
|
ComputeQuotaResourceConfig.add_member(:accelerators, Shapes::ShapeRef.new(shape: AcceleratorsAmount, location_name: "Accelerators"))
|
|
3704
3788
|
ComputeQuotaResourceConfig.add_member(:v_cpu, Shapes::ShapeRef.new(shape: VCpuAmount, location_name: "VCpu"))
|
|
3705
3789
|
ComputeQuotaResourceConfig.add_member(:memory_in_gi_b, Shapes::ShapeRef.new(shape: MemoryInGiBAmount, location_name: "MemoryInGiB"))
|
|
3790
|
+
ComputeQuotaResourceConfig.add_member(:accelerator_partition, Shapes::ShapeRef.new(shape: AcceleratorPartitionConfig, location_name: "AcceleratorPartition"))
|
|
3706
3791
|
ComputeQuotaResourceConfig.struct_class = Types::ComputeQuotaResourceConfig
|
|
3707
3792
|
|
|
3708
3793
|
ComputeQuotaResourceConfigList.member = Shapes::ShapeRef.new(shape: ComputeQuotaResourceConfig)
|
|
@@ -12019,6 +12104,24 @@ module Aws::SageMaker
|
|
|
12019
12104
|
o.output = Shapes::ShapeRef.new(shape: BatchDescribeModelPackageOutput)
|
|
12020
12105
|
end)
|
|
12021
12106
|
|
|
12107
|
+
api.add_operation(:batch_reboot_cluster_nodes, Seahorse::Model::Operation.new.tap do |o|
|
|
12108
|
+
o.name = "BatchRebootClusterNodes"
|
|
12109
|
+
o.http_method = "POST"
|
|
12110
|
+
o.http_request_uri = "/"
|
|
12111
|
+
o.input = Shapes::ShapeRef.new(shape: BatchRebootClusterNodesRequest)
|
|
12112
|
+
o.output = Shapes::ShapeRef.new(shape: BatchRebootClusterNodesResponse)
|
|
12113
|
+
o.errors << Shapes::ShapeRef.new(shape: ResourceNotFound)
|
|
12114
|
+
end)
|
|
12115
|
+
|
|
12116
|
+
api.add_operation(:batch_replace_cluster_nodes, Seahorse::Model::Operation.new.tap do |o|
|
|
12117
|
+
o.name = "BatchReplaceClusterNodes"
|
|
12118
|
+
o.http_method = "POST"
|
|
12119
|
+
o.http_request_uri = "/"
|
|
12120
|
+
o.input = Shapes::ShapeRef.new(shape: BatchReplaceClusterNodesRequest)
|
|
12121
|
+
o.output = Shapes::ShapeRef.new(shape: BatchReplaceClusterNodesResponse)
|
|
12122
|
+
o.errors << Shapes::ShapeRef.new(shape: ResourceNotFound)
|
|
12123
|
+
end)
|
|
12124
|
+
|
|
12022
12125
|
api.add_operation(:create_action, Seahorse::Model::Operation.new.tap do |o|
|
|
12023
12126
|
o.name = "CreateAction"
|
|
12024
12127
|
o.http_method = "POST"
|
|
@@ -10,6 +10,33 @@
|
|
|
10
10
|
module Aws::SageMaker
|
|
11
11
|
module Types
|
|
12
12
|
|
|
13
|
+
# Configuration for allocating accelerator partitions.
|
|
14
|
+
#
|
|
15
|
+
# @!attribute [rw] type
|
|
16
|
+
# The Multi-Instance GPU (MIG) profile type that defines the partition
|
|
17
|
+
# configuration. The profile specifies the compute and memory
|
|
18
|
+
# allocation for each partition instance. The available profile types
|
|
19
|
+
# depend on the instance type specified in the compute quota
|
|
20
|
+
# configuration.
|
|
21
|
+
# @return [String]
|
|
22
|
+
#
|
|
23
|
+
# @!attribute [rw] count
|
|
24
|
+
# The number of accelerator partitions to allocate with the specified
|
|
25
|
+
# partition type. If you don't specify a value for vCPU and
|
|
26
|
+
# MemoryInGiB, SageMaker AI automatically allocates ratio-based values
|
|
27
|
+
# for those parameters based on the accelerator partition count you
|
|
28
|
+
# provide.
|
|
29
|
+
# @return [Integer]
|
|
30
|
+
#
|
|
31
|
+
# @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/AcceleratorPartitionConfig AWS API Documentation
|
|
32
|
+
#
|
|
33
|
+
class AcceleratorPartitionConfig < Struct.new(
|
|
34
|
+
:type,
|
|
35
|
+
:count)
|
|
36
|
+
SENSITIVE = []
|
|
37
|
+
include Aws::Structure
|
|
38
|
+
end
|
|
39
|
+
|
|
13
40
|
# A structure describing the source of an action.
|
|
14
41
|
#
|
|
15
42
|
# @!attribute [rw] source_uri
|
|
@@ -3452,6 +3479,348 @@ module Aws::SageMaker
|
|
|
3452
3479
|
include Aws::Structure
|
|
3453
3480
|
end
|
|
3454
3481
|
|
|
3482
|
+
# Represents an error encountered when rebooting a node (identified by
|
|
3483
|
+
# its logical node ID) from a SageMaker HyperPod cluster.
|
|
3484
|
+
#
|
|
3485
|
+
# @!attribute [rw] node_logical_id
|
|
3486
|
+
# The logical node ID of the node that encountered an error during the
|
|
3487
|
+
# reboot operation.
|
|
3488
|
+
# @return [String]
|
|
3489
|
+
#
|
|
3490
|
+
# @!attribute [rw] error_code
|
|
3491
|
+
# The error code associated with the error encountered when rebooting
|
|
3492
|
+
# a node by logical node ID.
|
|
3493
|
+
#
|
|
3494
|
+
# Possible values:
|
|
3495
|
+
#
|
|
3496
|
+
# * `InstanceIdNotFound`: The node does not exist in the specified
|
|
3497
|
+
# cluster.
|
|
3498
|
+
#
|
|
3499
|
+
# * `InvalidInstanceStatus`: The node is in a state that does not
|
|
3500
|
+
# allow rebooting. Wait for the node to finish any ongoing changes
|
|
3501
|
+
# before retrying.
|
|
3502
|
+
#
|
|
3503
|
+
# * `InstanceIdInUse`: Another operation is already in progress for
|
|
3504
|
+
# this node. Wait for the operation to complete before retrying.
|
|
3505
|
+
#
|
|
3506
|
+
# * `InternalServerError`: An internal error occurred while processing
|
|
3507
|
+
# this node.
|
|
3508
|
+
# @return [String]
|
|
3509
|
+
#
|
|
3510
|
+
# @!attribute [rw] message
|
|
3511
|
+
# A human-readable message describing the error encountered when
|
|
3512
|
+
# rebooting a node by logical node ID.
|
|
3513
|
+
# @return [String]
|
|
3514
|
+
#
|
|
3515
|
+
# @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/BatchRebootClusterNodeLogicalIdsError AWS API Documentation
|
|
3516
|
+
#
|
|
3517
|
+
class BatchRebootClusterNodeLogicalIdsError < Struct.new(
|
|
3518
|
+
:node_logical_id,
|
|
3519
|
+
:error_code,
|
|
3520
|
+
:message)
|
|
3521
|
+
SENSITIVE = []
|
|
3522
|
+
include Aws::Structure
|
|
3523
|
+
end
|
|
3524
|
+
|
|
3525
|
+
# Represents an error encountered when rebooting a node from a SageMaker
|
|
3526
|
+
# HyperPod cluster.
|
|
3527
|
+
#
|
|
3528
|
+
# @!attribute [rw] node_id
|
|
3529
|
+
# The EC2 instance ID of the node that encountered an error during the
|
|
3530
|
+
# reboot operation.
|
|
3531
|
+
# @return [String]
|
|
3532
|
+
#
|
|
3533
|
+
# @!attribute [rw] error_code
|
|
3534
|
+
# The error code associated with the error encountered when rebooting
|
|
3535
|
+
# a node.
|
|
3536
|
+
#
|
|
3537
|
+
# Possible values:
|
|
3538
|
+
#
|
|
3539
|
+
# * `InstanceIdNotFound`: The instance does not exist in the specified
|
|
3540
|
+
# cluster.
|
|
3541
|
+
#
|
|
3542
|
+
# * `InvalidInstanceStatus`: The instance is in a state that does not
|
|
3543
|
+
# allow rebooting. Wait for the instance to finish any ongoing
|
|
3544
|
+
# changes before retrying.
|
|
3545
|
+
#
|
|
3546
|
+
# * `InstanceIdInUse`: Another operation is already in progress for
|
|
3547
|
+
# this node. Wait for the operation to complete before retrying.
|
|
3548
|
+
#
|
|
3549
|
+
# * `InternalServerError`: An internal error occurred while processing
|
|
3550
|
+
# this node.
|
|
3551
|
+
# @return [String]
|
|
3552
|
+
#
|
|
3553
|
+
# @!attribute [rw] message
|
|
3554
|
+
# A human-readable message describing the error encountered when
|
|
3555
|
+
# rebooting a node.
|
|
3556
|
+
# @return [String]
|
|
3557
|
+
#
|
|
3558
|
+
# @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/BatchRebootClusterNodesError AWS API Documentation
|
|
3559
|
+
#
|
|
3560
|
+
class BatchRebootClusterNodesError < Struct.new(
|
|
3561
|
+
:node_id,
|
|
3562
|
+
:error_code,
|
|
3563
|
+
:message)
|
|
3564
|
+
SENSITIVE = []
|
|
3565
|
+
include Aws::Structure
|
|
3566
|
+
end
|
|
3567
|
+
|
|
3568
|
+
# @!attribute [rw] cluster_name
|
|
3569
|
+
# The name or Amazon Resource Name (ARN) of the SageMaker HyperPod
|
|
3570
|
+
# cluster containing the nodes to reboot.
|
|
3571
|
+
# @return [String]
|
|
3572
|
+
#
|
|
3573
|
+
# @!attribute [rw] node_ids
|
|
3574
|
+
# A list of EC2 instance IDs to reboot using soft recovery. You can
|
|
3575
|
+
# specify between 1 and 25 instance IDs.
|
|
3576
|
+
#
|
|
3577
|
+
# <note markdown="1"> * Either `NodeIds` or `NodeLogicalIds` must be provided (or both),
|
|
3578
|
+
# but at least one is required.
|
|
3579
|
+
#
|
|
3580
|
+
# * Each instance ID must follow the pattern `i-` followed by 17
|
|
3581
|
+
# hexadecimal characters (for example, `i-0123456789abcdef0`).
|
|
3582
|
+
#
|
|
3583
|
+
# </note>
|
|
3584
|
+
# @return [Array<String>]
|
|
3585
|
+
#
|
|
3586
|
+
# @!attribute [rw] node_logical_ids
|
|
3587
|
+
# A list of logical node IDs to reboot using soft recovery. You can
|
|
3588
|
+
# specify between 1 and 25 logical node IDs.
|
|
3589
|
+
#
|
|
3590
|
+
# The `NodeLogicalId` is a unique identifier that persists throughout
|
|
3591
|
+
# the node's lifecycle and can be used to track nodes that are still
|
|
3592
|
+
# being provisioned and don't yet have an EC2 instance ID assigned.
|
|
3593
|
+
#
|
|
3594
|
+
# * This parameter is only supported for clusters using `Continuous`
|
|
3595
|
+
# as the `NodeProvisioningMode`. For clusters using the default
|
|
3596
|
+
# provisioning mode, use `NodeIds` instead.
|
|
3597
|
+
#
|
|
3598
|
+
# * Either `NodeIds` or `NodeLogicalIds` must be provided (or both),
|
|
3599
|
+
# but at least one is required.
|
|
3600
|
+
# @return [Array<String>]
|
|
3601
|
+
#
|
|
3602
|
+
# @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/BatchRebootClusterNodesRequest AWS API Documentation
|
|
3603
|
+
#
|
|
3604
|
+
class BatchRebootClusterNodesRequest < Struct.new(
|
|
3605
|
+
:cluster_name,
|
|
3606
|
+
:node_ids,
|
|
3607
|
+
:node_logical_ids)
|
|
3608
|
+
SENSITIVE = []
|
|
3609
|
+
include Aws::Structure
|
|
3610
|
+
end
|
|
3611
|
+
|
|
3612
|
+
# @!attribute [rw] successful
|
|
3613
|
+
# A list of EC2 instance IDs for which the reboot operation was
|
|
3614
|
+
# successfully initiated.
|
|
3615
|
+
# @return [Array<String>]
|
|
3616
|
+
#
|
|
3617
|
+
# @!attribute [rw] failed
|
|
3618
|
+
# A list of errors encountered for EC2 instance IDs that could not be
|
|
3619
|
+
# rebooted. Each error includes the instance ID, an error code, and a
|
|
3620
|
+
# descriptive message.
|
|
3621
|
+
# @return [Array<Types::BatchRebootClusterNodesError>]
|
|
3622
|
+
#
|
|
3623
|
+
# @!attribute [rw] failed_node_logical_ids
|
|
3624
|
+
# A list of errors encountered for logical node IDs that could not be
|
|
3625
|
+
# rebooted. Each error includes the logical node ID, an error code,
|
|
3626
|
+
# and a descriptive message. This field is only present when
|
|
3627
|
+
# `NodeLogicalIds` were provided in the request.
|
|
3628
|
+
# @return [Array<Types::BatchRebootClusterNodeLogicalIdsError>]
|
|
3629
|
+
#
|
|
3630
|
+
# @!attribute [rw] successful_node_logical_ids
|
|
3631
|
+
# A list of logical node IDs for which the reboot operation was
|
|
3632
|
+
# successfully initiated. This field is only present when
|
|
3633
|
+
# `NodeLogicalIds` were provided in the request.
|
|
3634
|
+
# @return [Array<String>]
|
|
3635
|
+
#
|
|
3636
|
+
# @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/BatchRebootClusterNodesResponse AWS API Documentation
|
|
3637
|
+
#
|
|
3638
|
+
class BatchRebootClusterNodesResponse < Struct.new(
|
|
3639
|
+
:successful,
|
|
3640
|
+
:failed,
|
|
3641
|
+
:failed_node_logical_ids,
|
|
3642
|
+
:successful_node_logical_ids)
|
|
3643
|
+
SENSITIVE = []
|
|
3644
|
+
include Aws::Structure
|
|
3645
|
+
end
|
|
3646
|
+
|
|
3647
|
+
# Represents an error encountered when replacing a node (identified by
|
|
3648
|
+
# its logical node ID) in a SageMaker HyperPod cluster.
|
|
3649
|
+
#
|
|
3650
|
+
# @!attribute [rw] node_logical_id
|
|
3651
|
+
# The logical node ID of the node that encountered an error during the
|
|
3652
|
+
# replacement operation.
|
|
3653
|
+
# @return [String]
|
|
3654
|
+
#
|
|
3655
|
+
# @!attribute [rw] error_code
|
|
3656
|
+
# The error code associated with the error encountered when replacing
|
|
3657
|
+
# a node by logical node ID.
|
|
3658
|
+
#
|
|
3659
|
+
# Possible values:
|
|
3660
|
+
#
|
|
3661
|
+
# * `InstanceIdNotFound`: The node does not exist in the specified
|
|
3662
|
+
# cluster.
|
|
3663
|
+
#
|
|
3664
|
+
# * `InvalidInstanceStatus`: The node is in a state that does not
|
|
3665
|
+
# allow replacement. Wait for the node to finish any ongoing changes
|
|
3666
|
+
# before retrying.
|
|
3667
|
+
#
|
|
3668
|
+
# * `InstanceIdInUse`: Another operation is already in progress for
|
|
3669
|
+
# this node. Wait for the operation to complete before retrying.
|
|
3670
|
+
#
|
|
3671
|
+
# * `InternalServerError`: An internal error occurred while processing
|
|
3672
|
+
# this node.
|
|
3673
|
+
# @return [String]
|
|
3674
|
+
#
|
|
3675
|
+
# @!attribute [rw] message
|
|
3676
|
+
# A human-readable message describing the error encountered when
|
|
3677
|
+
# replacing a node by logical node ID.
|
|
3678
|
+
# @return [String]
|
|
3679
|
+
#
|
|
3680
|
+
# @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/BatchReplaceClusterNodeLogicalIdsError AWS API Documentation
|
|
3681
|
+
#
|
|
3682
|
+
class BatchReplaceClusterNodeLogicalIdsError < Struct.new(
|
|
3683
|
+
:node_logical_id,
|
|
3684
|
+
:error_code,
|
|
3685
|
+
:message)
|
|
3686
|
+
SENSITIVE = []
|
|
3687
|
+
include Aws::Structure
|
|
3688
|
+
end
|
|
3689
|
+
|
|
3690
|
+
# Represents an error encountered when replacing a node in a SageMaker
|
|
3691
|
+
# HyperPod cluster.
|
|
3692
|
+
#
|
|
3693
|
+
# @!attribute [rw] node_id
|
|
3694
|
+
# The EC2 instance ID of the node that encountered an error during the
|
|
3695
|
+
# replacement operation.
|
|
3696
|
+
# @return [String]
|
|
3697
|
+
#
|
|
3698
|
+
# @!attribute [rw] error_code
|
|
3699
|
+
# The error code associated with the error encountered when replacing
|
|
3700
|
+
# a node.
|
|
3701
|
+
#
|
|
3702
|
+
# Possible values:
|
|
3703
|
+
#
|
|
3704
|
+
# * `InstanceIdNotFound`: The instance does not exist in the specified
|
|
3705
|
+
# cluster.
|
|
3706
|
+
#
|
|
3707
|
+
# * `InvalidInstanceStatus`: The instance is in a state that does not
|
|
3708
|
+
# allow replacement. Wait for the instance to finish any ongoing
|
|
3709
|
+
# changes before retrying.
|
|
3710
|
+
#
|
|
3711
|
+
# * `InstanceIdInUse`: Another operation is already in progress for
|
|
3712
|
+
# this node. Wait for the operation to complete before retrying.
|
|
3713
|
+
#
|
|
3714
|
+
# * `InternalServerError`: An internal error occurred while processing
|
|
3715
|
+
# this node.
|
|
3716
|
+
# @return [String]
|
|
3717
|
+
#
|
|
3718
|
+
# @!attribute [rw] message
|
|
3719
|
+
# A human-readable message describing the error encountered when
|
|
3720
|
+
# replacing a node.
|
|
3721
|
+
# @return [String]
|
|
3722
|
+
#
|
|
3723
|
+
# @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/BatchReplaceClusterNodesError AWS API Documentation
|
|
3724
|
+
#
|
|
3725
|
+
class BatchReplaceClusterNodesError < Struct.new(
|
|
3726
|
+
:node_id,
|
|
3727
|
+
:error_code,
|
|
3728
|
+
:message)
|
|
3729
|
+
SENSITIVE = []
|
|
3730
|
+
include Aws::Structure
|
|
3731
|
+
end
|
|
3732
|
+
|
|
3733
|
+
# @!attribute [rw] cluster_name
|
|
3734
|
+
# The name or Amazon Resource Name (ARN) of the SageMaker HyperPod
|
|
3735
|
+
# cluster containing the nodes to replace.
|
|
3736
|
+
# @return [String]
|
|
3737
|
+
#
|
|
3738
|
+
# @!attribute [rw] node_ids
|
|
3739
|
+
# A list of EC2 instance IDs to replace with new hardware. You can
|
|
3740
|
+
# specify between 1 and 25 instance IDs.
|
|
3741
|
+
#
|
|
3742
|
+
# Replace operations destroy all instance volumes (root and
|
|
3743
|
+
# secondary). Ensure you have backed up any important data before
|
|
3744
|
+
# proceeding.
|
|
3745
|
+
#
|
|
3746
|
+
# <note markdown="1"> * Either `NodeIds` or `NodeLogicalIds` must be provided (or both),
|
|
3747
|
+
# but at least one is required.
|
|
3748
|
+
#
|
|
3749
|
+
# * Each instance ID must follow the pattern `i-` followed by 17
|
|
3750
|
+
# hexadecimal characters (for example, `i-0123456789abcdef0`).
|
|
3751
|
+
#
|
|
3752
|
+
# * For SageMaker HyperPod clusters using the Slurm workload manager,
|
|
3753
|
+
# you cannot replace instances that are configured as Slurm
|
|
3754
|
+
# controller nodes.
|
|
3755
|
+
#
|
|
3756
|
+
# </note>
|
|
3757
|
+
# @return [Array<String>]
|
|
3758
|
+
#
|
|
3759
|
+
# @!attribute [rw] node_logical_ids
|
|
3760
|
+
# A list of logical node IDs to replace with new hardware. You can
|
|
3761
|
+
# specify between 1 and 25 logical node IDs.
|
|
3762
|
+
#
|
|
3763
|
+
# The `NodeLogicalId` is a unique identifier that persists throughout
|
|
3764
|
+
# the node's lifecycle and can be used to track nodes that are still
|
|
3765
|
+
# being provisioned and don't yet have an EC2 instance ID assigned.
|
|
3766
|
+
#
|
|
3767
|
+
# * Replace operations destroy all instance volumes (root and
|
|
3768
|
+
# secondary). Ensure you have backed up any important data before
|
|
3769
|
+
# proceeding.
|
|
3770
|
+
#
|
|
3771
|
+
# * This parameter is only supported for clusters using `Continuous`
|
|
3772
|
+
# as the `NodeProvisioningMode`. For clusters using the default
|
|
3773
|
+
# provisioning mode, use `NodeIds` instead.
|
|
3774
|
+
#
|
|
3775
|
+
# * Either `NodeIds` or `NodeLogicalIds` must be provided (or both),
|
|
3776
|
+
# but at least one is required.
|
|
3777
|
+
# @return [Array<String>]
|
|
3778
|
+
#
|
|
3779
|
+
# @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/BatchReplaceClusterNodesRequest AWS API Documentation
|
|
3780
|
+
#
|
|
3781
|
+
class BatchReplaceClusterNodesRequest < Struct.new(
|
|
3782
|
+
:cluster_name,
|
|
3783
|
+
:node_ids,
|
|
3784
|
+
:node_logical_ids)
|
|
3785
|
+
SENSITIVE = []
|
|
3786
|
+
include Aws::Structure
|
|
3787
|
+
end
|
|
3788
|
+
|
|
3789
|
+
# @!attribute [rw] successful
|
|
3790
|
+
# A list of EC2 instance IDs for which the replacement operation was
|
|
3791
|
+
# successfully initiated.
|
|
3792
|
+
# @return [Array<String>]
|
|
3793
|
+
#
|
|
3794
|
+
# @!attribute [rw] failed
|
|
3795
|
+
# A list of errors encountered for EC2 instance IDs that could not be
|
|
3796
|
+
# replaced. Each error includes the instance ID, an error code, and a
|
|
3797
|
+
# descriptive message.
|
|
3798
|
+
# @return [Array<Types::BatchReplaceClusterNodesError>]
|
|
3799
|
+
#
|
|
3800
|
+
# @!attribute [rw] failed_node_logical_ids
|
|
3801
|
+
# A list of errors encountered for logical node IDs that could not be
|
|
3802
|
+
# replaced. Each error includes the logical node ID, an error code,
|
|
3803
|
+
# and a descriptive message. This field is only present when
|
|
3804
|
+
# `NodeLogicalIds` were provided in the request.
|
|
3805
|
+
# @return [Array<Types::BatchReplaceClusterNodeLogicalIdsError>]
|
|
3806
|
+
#
|
|
3807
|
+
# @!attribute [rw] successful_node_logical_ids
|
|
3808
|
+
# A list of logical node IDs for which the replacement operation was
|
|
3809
|
+
# successfully initiated. This field is only present when
|
|
3810
|
+
# `NodeLogicalIds` were provided in the request.
|
|
3811
|
+
# @return [Array<String>]
|
|
3812
|
+
#
|
|
3813
|
+
# @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/BatchReplaceClusterNodesResponse AWS API Documentation
|
|
3814
|
+
#
|
|
3815
|
+
class BatchReplaceClusterNodesResponse < Struct.new(
|
|
3816
|
+
:successful,
|
|
3817
|
+
:failed,
|
|
3818
|
+
:failed_node_logical_ids,
|
|
3819
|
+
:successful_node_logical_ids)
|
|
3820
|
+
SENSITIVE = []
|
|
3821
|
+
include Aws::Structure
|
|
3822
|
+
end
|
|
3823
|
+
|
|
3455
3824
|
# Input object for the batch transform job.
|
|
3456
3825
|
#
|
|
3457
3826
|
# @!attribute [rw] data_captured_destination_s3_uri
|
|
@@ -5536,6 +5905,10 @@ module Aws::SageMaker
|
|
|
5536
5905
|
# Contains information about the UltraServer.
|
|
5537
5906
|
# @return [Types::UltraServerInfo]
|
|
5538
5907
|
#
|
|
5908
|
+
# @!attribute [rw] private_dns_hostname
|
|
5909
|
+
# The private DNS hostname of the SageMaker HyperPod cluster node.
|
|
5910
|
+
# @return [String]
|
|
5911
|
+
#
|
|
5539
5912
|
# @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/ClusterNodeSummary AWS API Documentation
|
|
5540
5913
|
#
|
|
5541
5914
|
class ClusterNodeSummary < Struct.new(
|
|
@@ -5546,7 +5919,8 @@ module Aws::SageMaker
|
|
|
5546
5919
|
:launch_time,
|
|
5547
5920
|
:last_software_update_time,
|
|
5548
5921
|
:instance_status,
|
|
5549
|
-
:ultra_server_info
|
|
5922
|
+
:ultra_server_info,
|
|
5923
|
+
:private_dns_hostname)
|
|
5550
5924
|
SENSITIVE = []
|
|
5551
5925
|
include Aws::Structure
|
|
5552
5926
|
end
|
|
@@ -6294,6 +6668,11 @@ module Aws::SageMaker
|
|
|
6294
6668
|
# Accelerators are set to 0.
|
|
6295
6669
|
# @return [Float]
|
|
6296
6670
|
#
|
|
6671
|
+
# @!attribute [rw] accelerator_partition
|
|
6672
|
+
# The accelerator partition configuration for fractional GPU
|
|
6673
|
+
# allocation.
|
|
6674
|
+
# @return [Types::AcceleratorPartitionConfig]
|
|
6675
|
+
#
|
|
6297
6676
|
# @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/ComputeQuotaResourceConfig AWS API Documentation
|
|
6298
6677
|
#
|
|
6299
6678
|
class ComputeQuotaResourceConfig < Struct.new(
|
|
@@ -6301,7 +6680,8 @@ module Aws::SageMaker
|
|
|
6301
6680
|
:count,
|
|
6302
6681
|
:accelerators,
|
|
6303
6682
|
:v_cpu,
|
|
6304
|
-
:memory_in_gi_b
|
|
6683
|
+
:memory_in_gi_b,
|
|
6684
|
+
:accelerator_partition)
|
|
6305
6685
|
SENSITIVE = []
|
|
6306
6686
|
include Aws::Structure
|
|
6307
6687
|
end
|
|
@@ -20816,7 +21196,7 @@ module Aws::SageMaker
|
|
|
20816
21196
|
#
|
|
20817
21197
|
# @!attribute [rw] target_resources
|
|
20818
21198
|
# The target resources (e.g., SageMaker Training Jobs, SageMaker
|
|
20819
|
-
# HyperPod) that can use this training plan.
|
|
21199
|
+
# HyperPod, SageMaker Endpoints) that can use this training plan.
|
|
20820
21200
|
#
|
|
20821
21201
|
# Training plans are specific to their target resource.
|
|
20822
21202
|
#
|
|
@@ -20825,6 +21205,10 @@ module Aws::SageMaker
|
|
|
20825
21205
|
#
|
|
20826
21206
|
# * A training plan for HyperPod clusters can be used exclusively to
|
|
20827
21207
|
# provide compute resources to a cluster's instance group.
|
|
21208
|
+
#
|
|
21209
|
+
# * A training plan for SageMaker endpoints can be used exclusively to
|
|
21210
|
+
# provide compute resources to SageMaker endpoints for model
|
|
21211
|
+
# deployment.
|
|
20828
21212
|
# @return [Array<String>]
|
|
20829
21213
|
#
|
|
20830
21214
|
# @!attribute [rw] reserved_capacity_summaries
|
|
@@ -45661,7 +46045,7 @@ module Aws::SageMaker
|
|
|
45661
46045
|
#
|
|
45662
46046
|
# @!attribute [rw] target_resources
|
|
45663
46047
|
# The target resources (e.g., SageMaker Training Jobs, SageMaker
|
|
45664
|
-
# HyperPod) to search for in the offerings.
|
|
46048
|
+
# HyperPod, SageMaker Endpoints) to search for in the offerings.
|
|
45665
46049
|
#
|
|
45666
46050
|
# Training plans are specific to their target resource.
|
|
45667
46051
|
#
|
|
@@ -45670,6 +46054,10 @@ module Aws::SageMaker
|
|
|
45670
46054
|
#
|
|
45671
46055
|
# * A training plan for HyperPod clusters can be used exclusively to
|
|
45672
46056
|
# provide compute resources to a cluster's instance group.
|
|
46057
|
+
#
|
|
46058
|
+
# * A training plan for SageMaker endpoints can be used exclusively to
|
|
46059
|
+
# provide compute resources to SageMaker endpoints for model
|
|
46060
|
+
# deployment.
|
|
45673
46061
|
# @return [Array<String>]
|
|
45674
46062
|
#
|
|
45675
46063
|
# @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/SearchTrainingPlanOfferingsRequest AWS API Documentation
|
|
@@ -48905,7 +49293,7 @@ module Aws::SageMaker
|
|
|
48905
49293
|
#
|
|
48906
49294
|
# @!attribute [rw] target_resources
|
|
48907
49295
|
# The target resources (e.g., SageMaker Training Jobs, SageMaker
|
|
48908
|
-
# HyperPod) for this training plan offering.
|
|
49296
|
+
# HyperPod, SageMaker Endpoints) for this training plan offering.
|
|
48909
49297
|
#
|
|
48910
49298
|
# Training plans are specific to their target resource.
|
|
48911
49299
|
#
|
|
@@ -48914,6 +49302,10 @@ module Aws::SageMaker
|
|
|
48914
49302
|
#
|
|
48915
49303
|
# * A training plan for HyperPod clusters can be used exclusively to
|
|
48916
49304
|
# provide compute resources to a cluster's instance group.
|
|
49305
|
+
#
|
|
49306
|
+
# * A training plan for SageMaker endpoints can be used exclusively to
|
|
49307
|
+
# provide compute resources to SageMaker endpoints for model
|
|
49308
|
+
# deployment.
|
|
48917
49309
|
# @return [Array<String>]
|
|
48918
49310
|
#
|
|
48919
49311
|
# @!attribute [rw] requested_start_time_after
|
|
@@ -49035,8 +49427,8 @@ module Aws::SageMaker
|
|
|
49035
49427
|
# @return [Integer]
|
|
49036
49428
|
#
|
|
49037
49429
|
# @!attribute [rw] target_resources
|
|
49038
|
-
# The target resources (e.g., training jobs, HyperPod clusters
|
|
49039
|
-
# can use this training plan.
|
|
49430
|
+
# The target resources (e.g., training jobs, HyperPod clusters,
|
|
49431
|
+
# Endpoints) that can use this training plan.
|
|
49040
49432
|
#
|
|
49041
49433
|
# Training plans are specific to their target resource.
|
|
49042
49434
|
#
|
|
@@ -49045,6 +49437,10 @@ module Aws::SageMaker
|
|
|
49045
49437
|
#
|
|
49046
49438
|
# * A training plan for HyperPod clusters can be used exclusively to
|
|
49047
49439
|
# provide compute resources to a cluster's instance group.
|
|
49440
|
+
#
|
|
49441
|
+
# * A training plan for SageMaker endpoints can be used exclusively to
|
|
49442
|
+
# provide compute resources to SageMaker endpoints for model
|
|
49443
|
+
# deployment.
|
|
49048
49444
|
# @return [Array<String>]
|
|
49049
49445
|
#
|
|
49050
49446
|
# @!attribute [rw] reserved_capacity_summaries
|
data/lib/aws-sdk-sagemaker.rb
CHANGED
data/sig/client.rbs
CHANGED
|
@@ -181,6 +181,36 @@ module Aws
|
|
|
181
181
|
) -> _BatchDescribeModelPackageResponseSuccess
|
|
182
182
|
| (Hash[Symbol, untyped] params, ?Hash[Symbol, untyped] options) -> _BatchDescribeModelPackageResponseSuccess
|
|
183
183
|
|
|
184
|
+
interface _BatchRebootClusterNodesResponseSuccess
|
|
185
|
+
include ::Seahorse::Client::_ResponseSuccess[Types::BatchRebootClusterNodesResponse]
|
|
186
|
+
def successful: () -> ::Array[::String]
|
|
187
|
+
def failed: () -> ::Array[Types::BatchRebootClusterNodesError]
|
|
188
|
+
def failed_node_logical_ids: () -> ::Array[Types::BatchRebootClusterNodeLogicalIdsError]
|
|
189
|
+
def successful_node_logical_ids: () -> ::Array[::String]
|
|
190
|
+
end
|
|
191
|
+
# https://docs.aws.amazon.com/sdk-for-ruby/v3/api/Aws/SageMaker/Client.html#batch_reboot_cluster_nodes-instance_method
|
|
192
|
+
def batch_reboot_cluster_nodes: (
|
|
193
|
+
cluster_name: ::String,
|
|
194
|
+
?node_ids: Array[::String],
|
|
195
|
+
?node_logical_ids: Array[::String]
|
|
196
|
+
) -> _BatchRebootClusterNodesResponseSuccess
|
|
197
|
+
| (Hash[Symbol, untyped] params, ?Hash[Symbol, untyped] options) -> _BatchRebootClusterNodesResponseSuccess
|
|
198
|
+
|
|
199
|
+
interface _BatchReplaceClusterNodesResponseSuccess
|
|
200
|
+
include ::Seahorse::Client::_ResponseSuccess[Types::BatchReplaceClusterNodesResponse]
|
|
201
|
+
def successful: () -> ::Array[::String]
|
|
202
|
+
def failed: () -> ::Array[Types::BatchReplaceClusterNodesError]
|
|
203
|
+
def failed_node_logical_ids: () -> ::Array[Types::BatchReplaceClusterNodeLogicalIdsError]
|
|
204
|
+
def successful_node_logical_ids: () -> ::Array[::String]
|
|
205
|
+
end
|
|
206
|
+
# https://docs.aws.amazon.com/sdk-for-ruby/v3/api/Aws/SageMaker/Client.html#batch_replace_cluster_nodes-instance_method
|
|
207
|
+
def batch_replace_cluster_nodes: (
|
|
208
|
+
cluster_name: ::String,
|
|
209
|
+
?node_ids: Array[::String],
|
|
210
|
+
?node_logical_ids: Array[::String]
|
|
211
|
+
) -> _BatchReplaceClusterNodesResponseSuccess
|
|
212
|
+
| (Hash[Symbol, untyped] params, ?Hash[Symbol, untyped] options) -> _BatchReplaceClusterNodesResponseSuccess
|
|
213
|
+
|
|
184
214
|
interface _CreateActionResponseSuccess
|
|
185
215
|
include ::Seahorse::Client::_ResponseSuccess[Types::CreateActionResponse]
|
|
186
216
|
def action_arn: () -> ::String
|
|
@@ -1013,7 +1043,11 @@ module Aws
|
|
|
1013
1043
|
count: ::Integer?,
|
|
1014
1044
|
accelerators: ::Integer?,
|
|
1015
1045
|
v_cpu: ::Float?,
|
|
1016
|
-
memory_in_gi_b: ::Float
|
|
1046
|
+
memory_in_gi_b: ::Float?,
|
|
1047
|
+
accelerator_partition: {
|
|
1048
|
+
type: ("mig-1g.5gb" | "mig-1g.10gb" | "mig-1g.18gb" | "mig-1g.20gb" | "mig-1g.23gb" | "mig-1g.35gb" | "mig-1g.45gb" | "mig-1g.47gb" | "mig-2g.10gb" | "mig-2g.20gb" | "mig-2g.35gb" | "mig-2g.45gb" | "mig-2g.47gb" | "mig-3g.20gb" | "mig-3g.40gb" | "mig-3g.71gb" | "mig-3g.90gb" | "mig-3g.93gb" | "mig-4g.20gb" | "mig-4g.40gb" | "mig-4g.71gb" | "mig-4g.90gb" | "mig-4g.93gb" | "mig-7g.40gb" | "mig-7g.80gb" | "mig-7g.141gb" | "mig-7g.180gb" | "mig-7g.186gb"),
|
|
1049
|
+
count: ::Integer
|
|
1050
|
+
}?
|
|
1017
1051
|
},
|
|
1018
1052
|
]?,
|
|
1019
1053
|
resource_sharing_config: {
|
|
@@ -6680,7 +6714,7 @@ module Aws
|
|
|
6680
6714
|
def unhealthy_instance_count: () -> ::Integer
|
|
6681
6715
|
def available_spare_instance_count: () -> ::Integer
|
|
6682
6716
|
def total_ultra_server_count: () -> ::Integer
|
|
6683
|
-
def target_resources: () -> ::Array[("training-job" | "hyperpod-cluster")]
|
|
6717
|
+
def target_resources: () -> ::Array[("training-job" | "hyperpod-cluster" | "endpoint")]
|
|
6684
6718
|
def reserved_capacity_summaries: () -> ::Array[Types::ReservedCapacitySummary]
|
|
6685
6719
|
end
|
|
6686
6720
|
# https://docs.aws.amazon.com/sdk-for-ruby/v3/api/Aws/SageMaker/Client.html#describe_training_plan-instance_method
|
|
@@ -8627,7 +8661,7 @@ module Aws
|
|
|
8627
8661
|
?start_time_after: ::Time,
|
|
8628
8662
|
?end_time_before: ::Time,
|
|
8629
8663
|
duration_hours: ::Integer,
|
|
8630
|
-
target_resources: Array[("training-job" | "hyperpod-cluster")]
|
|
8664
|
+
target_resources: Array[("training-job" | "hyperpod-cluster" | "endpoint")]
|
|
8631
8665
|
) -> _SearchTrainingPlanOfferingsResponseSuccess
|
|
8632
8666
|
| (Hash[Symbol, untyped] params, ?Hash[Symbol, untyped] options) -> _SearchTrainingPlanOfferingsResponseSuccess
|
|
8633
8667
|
|
|
@@ -9150,7 +9184,11 @@ module Aws
|
|
|
9150
9184
|
count: ::Integer?,
|
|
9151
9185
|
accelerators: ::Integer?,
|
|
9152
9186
|
v_cpu: ::Float?,
|
|
9153
|
-
memory_in_gi_b: ::Float
|
|
9187
|
+
memory_in_gi_b: ::Float?,
|
|
9188
|
+
accelerator_partition: {
|
|
9189
|
+
type: ("mig-1g.5gb" | "mig-1g.10gb" | "mig-1g.18gb" | "mig-1g.20gb" | "mig-1g.23gb" | "mig-1g.35gb" | "mig-1g.45gb" | "mig-1g.47gb" | "mig-2g.10gb" | "mig-2g.20gb" | "mig-2g.35gb" | "mig-2g.45gb" | "mig-2g.47gb" | "mig-3g.20gb" | "mig-3g.40gb" | "mig-3g.71gb" | "mig-3g.90gb" | "mig-3g.93gb" | "mig-4g.20gb" | "mig-4g.40gb" | "mig-4g.71gb" | "mig-4g.90gb" | "mig-4g.93gb" | "mig-7g.40gb" | "mig-7g.80gb" | "mig-7g.141gb" | "mig-7g.180gb" | "mig-7g.186gb"),
|
|
9190
|
+
count: ::Integer
|
|
9191
|
+
}?
|
|
9154
9192
|
},
|
|
9155
9193
|
]?,
|
|
9156
9194
|
resource_sharing_config: {
|
data/sig/types.rbs
CHANGED
|
@@ -8,6 +8,12 @@
|
|
|
8
8
|
module Aws::SageMaker
|
|
9
9
|
module Types
|
|
10
10
|
|
|
11
|
+
class AcceleratorPartitionConfig
|
|
12
|
+
attr_accessor type: ("mig-1g.5gb" | "mig-1g.10gb" | "mig-1g.18gb" | "mig-1g.20gb" | "mig-1g.23gb" | "mig-1g.35gb" | "mig-1g.45gb" | "mig-1g.47gb" | "mig-2g.10gb" | "mig-2g.20gb" | "mig-2g.35gb" | "mig-2g.45gb" | "mig-2g.47gb" | "mig-3g.20gb" | "mig-3g.40gb" | "mig-3g.71gb" | "mig-3g.90gb" | "mig-3g.93gb" | "mig-4g.20gb" | "mig-4g.40gb" | "mig-4g.71gb" | "mig-4g.90gb" | "mig-4g.93gb" | "mig-7g.40gb" | "mig-7g.80gb" | "mig-7g.141gb" | "mig-7g.180gb" | "mig-7g.186gb")
|
|
13
|
+
attr_accessor count: ::Integer
|
|
14
|
+
SENSITIVE: []
|
|
15
|
+
end
|
|
16
|
+
|
|
11
17
|
class ActionSource
|
|
12
18
|
attr_accessor source_uri: ::String
|
|
13
19
|
attr_accessor source_type: ::String
|
|
@@ -598,6 +604,64 @@ module Aws::SageMaker
|
|
|
598
604
|
SENSITIVE: []
|
|
599
605
|
end
|
|
600
606
|
|
|
607
|
+
class BatchRebootClusterNodeLogicalIdsError
|
|
608
|
+
attr_accessor node_logical_id: ::String
|
|
609
|
+
attr_accessor error_code: ("InstanceIdNotFound" | "InvalidInstanceStatus" | "InstanceIdInUse" | "InternalServerError")
|
|
610
|
+
attr_accessor message: ::String
|
|
611
|
+
SENSITIVE: []
|
|
612
|
+
end
|
|
613
|
+
|
|
614
|
+
class BatchRebootClusterNodesError
|
|
615
|
+
attr_accessor node_id: ::String
|
|
616
|
+
attr_accessor error_code: ("InstanceIdNotFound" | "InvalidInstanceStatus" | "InstanceIdInUse" | "InternalServerError")
|
|
617
|
+
attr_accessor message: ::String
|
|
618
|
+
SENSITIVE: []
|
|
619
|
+
end
|
|
620
|
+
|
|
621
|
+
class BatchRebootClusterNodesRequest
|
|
622
|
+
attr_accessor cluster_name: ::String
|
|
623
|
+
attr_accessor node_ids: ::Array[::String]
|
|
624
|
+
attr_accessor node_logical_ids: ::Array[::String]
|
|
625
|
+
SENSITIVE: []
|
|
626
|
+
end
|
|
627
|
+
|
|
628
|
+
class BatchRebootClusterNodesResponse
|
|
629
|
+
attr_accessor successful: ::Array[::String]
|
|
630
|
+
attr_accessor failed: ::Array[Types::BatchRebootClusterNodesError]
|
|
631
|
+
attr_accessor failed_node_logical_ids: ::Array[Types::BatchRebootClusterNodeLogicalIdsError]
|
|
632
|
+
attr_accessor successful_node_logical_ids: ::Array[::String]
|
|
633
|
+
SENSITIVE: []
|
|
634
|
+
end
|
|
635
|
+
|
|
636
|
+
class BatchReplaceClusterNodeLogicalIdsError
|
|
637
|
+
attr_accessor node_logical_id: ::String
|
|
638
|
+
attr_accessor error_code: ("InstanceIdNotFound" | "InvalidInstanceStatus" | "InstanceIdInUse" | "InternalServerError")
|
|
639
|
+
attr_accessor message: ::String
|
|
640
|
+
SENSITIVE: []
|
|
641
|
+
end
|
|
642
|
+
|
|
643
|
+
class BatchReplaceClusterNodesError
|
|
644
|
+
attr_accessor node_id: ::String
|
|
645
|
+
attr_accessor error_code: ("InstanceIdNotFound" | "InvalidInstanceStatus" | "InstanceIdInUse" | "InternalServerError")
|
|
646
|
+
attr_accessor message: ::String
|
|
647
|
+
SENSITIVE: []
|
|
648
|
+
end
|
|
649
|
+
|
|
650
|
+
class BatchReplaceClusterNodesRequest
|
|
651
|
+
attr_accessor cluster_name: ::String
|
|
652
|
+
attr_accessor node_ids: ::Array[::String]
|
|
653
|
+
attr_accessor node_logical_ids: ::Array[::String]
|
|
654
|
+
SENSITIVE: []
|
|
655
|
+
end
|
|
656
|
+
|
|
657
|
+
class BatchReplaceClusterNodesResponse
|
|
658
|
+
attr_accessor successful: ::Array[::String]
|
|
659
|
+
attr_accessor failed: ::Array[Types::BatchReplaceClusterNodesError]
|
|
660
|
+
attr_accessor failed_node_logical_ids: ::Array[Types::BatchReplaceClusterNodeLogicalIdsError]
|
|
661
|
+
attr_accessor successful_node_logical_ids: ::Array[::String]
|
|
662
|
+
SENSITIVE: []
|
|
663
|
+
end
|
|
664
|
+
|
|
601
665
|
class BatchTransformInput
|
|
602
666
|
attr_accessor data_captured_destination_s3_uri: ::String
|
|
603
667
|
attr_accessor dataset_format: Types::MonitoringDatasetFormat
|
|
@@ -1005,6 +1069,7 @@ module Aws::SageMaker
|
|
|
1005
1069
|
attr_accessor last_software_update_time: ::Time
|
|
1006
1070
|
attr_accessor instance_status: Types::ClusterInstanceStatusDetails
|
|
1007
1071
|
attr_accessor ultra_server_info: Types::UltraServerInfo
|
|
1072
|
+
attr_accessor private_dns_hostname: ::String
|
|
1008
1073
|
SENSITIVE: []
|
|
1009
1074
|
end
|
|
1010
1075
|
|
|
@@ -1165,6 +1230,7 @@ module Aws::SageMaker
|
|
|
1165
1230
|
attr_accessor accelerators: ::Integer
|
|
1166
1231
|
attr_accessor v_cpu: ::Float
|
|
1167
1232
|
attr_accessor memory_in_gi_b: ::Float
|
|
1233
|
+
attr_accessor accelerator_partition: Types::AcceleratorPartitionConfig
|
|
1168
1234
|
SENSITIVE: []
|
|
1169
1235
|
end
|
|
1170
1236
|
|
|
@@ -4388,7 +4454,7 @@ module Aws::SageMaker
|
|
|
4388
4454
|
attr_accessor unhealthy_instance_count: ::Integer
|
|
4389
4455
|
attr_accessor available_spare_instance_count: ::Integer
|
|
4390
4456
|
attr_accessor total_ultra_server_count: ::Integer
|
|
4391
|
-
attr_accessor target_resources: ::Array[("training-job" | "hyperpod-cluster")]
|
|
4457
|
+
attr_accessor target_resources: ::Array[("training-job" | "hyperpod-cluster" | "endpoint")]
|
|
4392
4458
|
attr_accessor reserved_capacity_summaries: ::Array[Types::ReservedCapacitySummary]
|
|
4393
4459
|
SENSITIVE: []
|
|
4394
4460
|
end
|
|
@@ -9567,7 +9633,7 @@ module Aws::SageMaker
|
|
|
9567
9633
|
attr_accessor start_time_after: ::Time
|
|
9568
9634
|
attr_accessor end_time_before: ::Time
|
|
9569
9635
|
attr_accessor duration_hours: ::Integer
|
|
9570
|
-
attr_accessor target_resources: ::Array[("training-job" | "hyperpod-cluster")]
|
|
9636
|
+
attr_accessor target_resources: ::Array[("training-job" | "hyperpod-cluster" | "endpoint")]
|
|
9571
9637
|
SENSITIVE: []
|
|
9572
9638
|
end
|
|
9573
9639
|
|
|
@@ -10224,7 +10290,7 @@ module Aws::SageMaker
|
|
|
10224
10290
|
|
|
10225
10291
|
class TrainingPlanOffering
|
|
10226
10292
|
attr_accessor training_plan_offering_id: ::String
|
|
10227
|
-
attr_accessor target_resources: ::Array[("training-job" | "hyperpod-cluster")]
|
|
10293
|
+
attr_accessor target_resources: ::Array[("training-job" | "hyperpod-cluster" | "endpoint")]
|
|
10228
10294
|
attr_accessor requested_start_time_after: ::Time
|
|
10229
10295
|
attr_accessor requested_end_time_before: ::Time
|
|
10230
10296
|
attr_accessor duration_hours: ::Integer
|
|
@@ -10250,7 +10316,7 @@ module Aws::SageMaker
|
|
|
10250
10316
|
attr_accessor available_instance_count: ::Integer
|
|
10251
10317
|
attr_accessor in_use_instance_count: ::Integer
|
|
10252
10318
|
attr_accessor total_ultra_server_count: ::Integer
|
|
10253
|
-
attr_accessor target_resources: ::Array[("training-job" | "hyperpod-cluster")]
|
|
10319
|
+
attr_accessor target_resources: ::Array[("training-job" | "hyperpod-cluster" | "endpoint")]
|
|
10254
10320
|
attr_accessor reserved_capacity_summaries: ::Array[Types::ReservedCapacitySummary]
|
|
10255
10321
|
SENSITIVE: []
|
|
10256
10322
|
end
|