aws-sdk-sagemaker 1.339.0 → 1.340.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA256:
3
- metadata.gz: f99f676fe2b17eb076e8761bee93ce0bfaee796c41dc984e1eab0803c1947f2e
4
- data.tar.gz: 6b3644ed5504af87e03d6b11d457c9cfa1bcf428b917150a2bad9a661968f654
3
+ metadata.gz: f760b6f6d6902ca08349489fe9e34c577365953a32aa2f031a4db9e67aa9cb08
4
+ data.tar.gz: 5d01231c9d2c1d978d56deee398fb98fe79da54085d362172671724d6bce3233
5
5
  SHA512:
6
- metadata.gz: c26fc869f314ef2b25b1b2e0c58c9926c7b20b740a5f46064e31618cd4af601938f5df74199fce53c2c2d5494059acbec30b71727ae6534400013bbee5516433
7
- data.tar.gz: 2bbffdc253a295bf9b9aa9fb1ae956ba268bb2d6d27abce4574ad0a4e0d1861c6ce0d84f655bbb45ed6959be27b34820b399c908c96e87de3b5d4c7dff93ed6b
6
+ metadata.gz: a658467635f982e5e53c0cd5a428c96d8f17acb120d16c31184b8ac8ddd2f21c9062c41e6df84610f95227118ae6de6a47053642188e8ed29208e2d44cfa5863
7
+ data.tar.gz: ec789fc4a9c2d3014b4e19c7a5b628f158fdc8a3b262139e86e44147b83a65107844ac19445d924aa41f1e90791d961c6c1bf8abb2ef19a9de49e6a54e63cba0
data/CHANGELOG.md CHANGED
@@ -1,6 +1,11 @@
1
1
  Unreleased Changes
2
2
  ------------------
3
3
 
4
+ 1.340.0 (2025-11-20)
5
+ ------------------
6
+
7
+ * Feature - Added training plan support for inference endpoints. Added HyperPod task governance with accelerator partition-based quota allocation. Added BatchRebootClusterNodes and BatchReplaceClusterNodes APIs. Updated ListClusterNodes to include privateDnsHostName.
8
+
4
9
  1.339.0 (2025-11-19)
5
10
  ------------------
6
11
 
data/VERSION CHANGED
@@ -1 +1 @@
1
- 1.339.0
1
+ 1.340.0
@@ -950,6 +950,209 @@ module Aws::SageMaker
950
950
  req.send_request(options)
951
951
  end
952
952
 
953
+ # Reboots specific nodes within a SageMaker HyperPod cluster using a
954
+ # soft recovery mechanism. `BatchRebootClusterNodes` performs a graceful
955
+ # reboot of the specified nodes by calling the Amazon Elastic Compute
956
+ # Cloud `RebootInstances` API, which attempts to cleanly shut down the
957
+ # operating system before restarting the instance.
958
+ #
959
+ # This operation is useful for recovering from transient issues or
960
+ # applying certain configuration changes that require a restart.
961
+ #
962
+ # <note markdown="1"> * Rebooting a node may cause temporary service interruption for
963
+ # workloads running on that node. Ensure your workloads can handle
964
+ # node restarts or use appropriate scheduling to minimize impact.
965
+ #
966
+ # * You can reboot up to 25 nodes in a single request.
967
+ #
968
+ # * For SageMaker HyperPod clusters using the Slurm workload manager,
969
+ # ensure rebooting nodes will not disrupt critical cluster operations.
970
+ #
971
+ # </note>
972
+ #
973
+ # @option params [required, String] :cluster_name
974
+ # The name or Amazon Resource Name (ARN) of the SageMaker HyperPod
975
+ # cluster containing the nodes to reboot.
976
+ #
977
+ # @option params [Array<String>] :node_ids
978
+ # A list of EC2 instance IDs to reboot using soft recovery. You can
979
+ # specify between 1 and 25 instance IDs.
980
+ #
981
+ # <note markdown="1"> * Either `NodeIds` or `NodeLogicalIds` must be provided (or both), but
982
+ # at least one is required.
983
+ #
984
+ # * Each instance ID must follow the pattern `i-` followed by 17
985
+ # hexadecimal characters (for example, `i-0123456789abcdef0`).
986
+ #
987
+ # </note>
988
+ #
989
+ # @option params [Array<String>] :node_logical_ids
990
+ # A list of logical node IDs to reboot using soft recovery. You can
991
+ # specify between 1 and 25 logical node IDs.
992
+ #
993
+ # The `NodeLogicalId` is a unique identifier that persists throughout
994
+ # the node's lifecycle and can be used to track nodes that are still
995
+ # being provisioned and don't yet have an EC2 instance ID assigned.
996
+ #
997
+ # * This parameter is only supported for clusters using `Continuous` as
998
+ # the `NodeProvisioningMode`. For clusters using the default
999
+ # provisioning mode, use `NodeIds` instead.
1000
+ #
1001
+ # * Either `NodeIds` or `NodeLogicalIds` must be provided (or both), but
1002
+ # at least one is required.
1003
+ #
1004
+ # @return [Types::BatchRebootClusterNodesResponse] Returns a {Seahorse::Client::Response response} object which responds to the following methods:
1005
+ #
1006
+ # * {Types::BatchRebootClusterNodesResponse#successful #successful} => Array&lt;String&gt;
1007
+ # * {Types::BatchRebootClusterNodesResponse#failed #failed} => Array&lt;Types::BatchRebootClusterNodesError&gt;
1008
+ # * {Types::BatchRebootClusterNodesResponse#failed_node_logical_ids #failed_node_logical_ids} => Array&lt;Types::BatchRebootClusterNodeLogicalIdsError&gt;
1009
+ # * {Types::BatchRebootClusterNodesResponse#successful_node_logical_ids #successful_node_logical_ids} => Array&lt;String&gt;
1010
+ #
1011
+ # @example Request syntax with placeholder values
1012
+ #
1013
+ # resp = client.batch_reboot_cluster_nodes({
1014
+ # cluster_name: "ClusterNameOrArn", # required
1015
+ # node_ids: ["ClusterNodeId"],
1016
+ # node_logical_ids: ["ClusterNodeLogicalId"],
1017
+ # })
1018
+ #
1019
+ # @example Response structure
1020
+ #
1021
+ # resp.successful #=> Array
1022
+ # resp.successful[0] #=> String
1023
+ # resp.failed #=> Array
1024
+ # resp.failed[0].node_id #=> String
1025
+ # resp.failed[0].error_code #=> String, one of "InstanceIdNotFound", "InvalidInstanceStatus", "InstanceIdInUse", "InternalServerError"
1026
+ # resp.failed[0].message #=> String
1027
+ # resp.failed_node_logical_ids #=> Array
1028
+ # resp.failed_node_logical_ids[0].node_logical_id #=> String
1029
+ # resp.failed_node_logical_ids[0].error_code #=> String, one of "InstanceIdNotFound", "InvalidInstanceStatus", "InstanceIdInUse", "InternalServerError"
1030
+ # resp.failed_node_logical_ids[0].message #=> String
1031
+ # resp.successful_node_logical_ids #=> Array
1032
+ # resp.successful_node_logical_ids[0] #=> String
1033
+ #
1034
+ # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/BatchRebootClusterNodes AWS API Documentation
1035
+ #
1036
+ # @overload batch_reboot_cluster_nodes(params = {})
1037
+ # @param [Hash] params ({})
1038
+ def batch_reboot_cluster_nodes(params = {}, options = {})
1039
+ req = build_request(:batch_reboot_cluster_nodes, params)
1040
+ req.send_request(options)
1041
+ end
1042
+
1043
+ # Replaces specific nodes within a SageMaker HyperPod cluster with new
1044
+ # hardware. `BatchReplaceClusterNodes` terminates the specified
1045
+ # instances and provisions new replacement instances with the same
1046
+ # configuration but fresh hardware. The Amazon Machine Image (AMI) and
1047
+ # instance configuration remain the same.
1048
+ #
1049
+ # This operation is useful for recovering from hardware failures or
1050
+ # persistent issues that cannot be resolved through a reboot.
1051
+ #
1052
+ # * **Data Loss Warning:** Replacing nodes destroys all instance
1053
+ # volumes, including both root and secondary volumes. All data stored
1054
+ # on these volumes will be permanently lost and cannot be recovered.
1055
+ #
1056
+ # * To safeguard your work, back up your data to Amazon S3 or an FSx for
1057
+ # Lustre file system before invoking the API on a worker node group.
1058
+ # This will help prevent any potential data loss from the instance
1059
+ # root volume. For more information about backup, see [Use the backup
1060
+ # script provided by SageMaker HyperPod][1].
1061
+ #
1062
+ # * If you want to invoke this API on an existing cluster, you'll first
1063
+ # need to patch the cluster by running the [UpdateClusterSoftware
1064
+ # API][2]. For more information about patching a cluster, see [Update
1065
+ # the SageMaker HyperPod platform software of a cluster][3].
1066
+ #
1067
+ # * You can replace up to 25 nodes in a single request.
1068
+ #
1069
+ #
1070
+ #
1071
+ # [1]: https://docs.aws.amazon.com/sagemaker/latest/dg/sagemaker-hyperpod-operate-cli-command.html#sagemaker-hyperpod-operate-cli-command-update-cluster-software-backup
1072
+ # [2]: https://docs.aws.amazon.com/sagemaker/latest/APIReference/API_UpdateClusterSoftware.html
1073
+ # [3]: https://docs.aws.amazon.com/sagemaker/latest/dg/sagemaker-hyperpod-operate-cli-command.html#sagemaker-hyperpod-operate-cli-command-update-cluster-software
1074
+ #
1075
+ # @option params [required, String] :cluster_name
1076
+ # The name or Amazon Resource Name (ARN) of the SageMaker HyperPod
1077
+ # cluster containing the nodes to replace.
1078
+ #
1079
+ # @option params [Array<String>] :node_ids
1080
+ # A list of EC2 instance IDs to replace with new hardware. You can
1081
+ # specify between 1 and 25 instance IDs.
1082
+ #
1083
+ # Replace operations destroy all instance volumes (root and secondary).
1084
+ # Ensure you have backed up any important data before proceeding.
1085
+ #
1086
+ # <note markdown="1"> * Either `NodeIds` or `NodeLogicalIds` must be provided (or both), but
1087
+ # at least one is required.
1088
+ #
1089
+ # * Each instance ID must follow the pattern `i-` followed by 17
1090
+ # hexadecimal characters (for example, `i-0123456789abcdef0`).
1091
+ #
1092
+ # * For SageMaker HyperPod clusters using the Slurm workload manager,
1093
+ # you cannot replace instances that are configured as Slurm controller
1094
+ # nodes.
1095
+ #
1096
+ # </note>
1097
+ #
1098
+ # @option params [Array<String>] :node_logical_ids
1099
+ # A list of logical node IDs to replace with new hardware. You can
1100
+ # specify between 1 and 25 logical node IDs.
1101
+ #
1102
+ # The `NodeLogicalId` is a unique identifier that persists throughout
1103
+ # the node's lifecycle and can be used to track nodes that are still
1104
+ # being provisioned and don't yet have an EC2 instance ID assigned.
1105
+ #
1106
+ # * Replace operations destroy all instance volumes (root and
1107
+ # secondary). Ensure you have backed up any important data before
1108
+ # proceeding.
1109
+ #
1110
+ # * This parameter is only supported for clusters using `Continuous` as
1111
+ # the `NodeProvisioningMode`. For clusters using the default
1112
+ # provisioning mode, use `NodeIds` instead.
1113
+ #
1114
+ # * Either `NodeIds` or `NodeLogicalIds` must be provided (or both), but
1115
+ # at least one is required.
1116
+ #
1117
+ # @return [Types::BatchReplaceClusterNodesResponse] Returns a {Seahorse::Client::Response response} object which responds to the following methods:
1118
+ #
1119
+ # * {Types::BatchReplaceClusterNodesResponse#successful #successful} => Array&lt;String&gt;
1120
+ # * {Types::BatchReplaceClusterNodesResponse#failed #failed} => Array&lt;Types::BatchReplaceClusterNodesError&gt;
1121
+ # * {Types::BatchReplaceClusterNodesResponse#failed_node_logical_ids #failed_node_logical_ids} => Array&lt;Types::BatchReplaceClusterNodeLogicalIdsError&gt;
1122
+ # * {Types::BatchReplaceClusterNodesResponse#successful_node_logical_ids #successful_node_logical_ids} => Array&lt;String&gt;
1123
+ #
1124
+ # @example Request syntax with placeholder values
1125
+ #
1126
+ # resp = client.batch_replace_cluster_nodes({
1127
+ # cluster_name: "ClusterNameOrArn", # required
1128
+ # node_ids: ["ClusterNodeId"],
1129
+ # node_logical_ids: ["ClusterNodeLogicalId"],
1130
+ # })
1131
+ #
1132
+ # @example Response structure
1133
+ #
1134
+ # resp.successful #=> Array
1135
+ # resp.successful[0] #=> String
1136
+ # resp.failed #=> Array
1137
+ # resp.failed[0].node_id #=> String
1138
+ # resp.failed[0].error_code #=> String, one of "InstanceIdNotFound", "InvalidInstanceStatus", "InstanceIdInUse", "InternalServerError"
1139
+ # resp.failed[0].message #=> String
1140
+ # resp.failed_node_logical_ids #=> Array
1141
+ # resp.failed_node_logical_ids[0].node_logical_id #=> String
1142
+ # resp.failed_node_logical_ids[0].error_code #=> String, one of "InstanceIdNotFound", "InvalidInstanceStatus", "InstanceIdInUse", "InternalServerError"
1143
+ # resp.failed_node_logical_ids[0].message #=> String
1144
+ # resp.successful_node_logical_ids #=> Array
1145
+ # resp.successful_node_logical_ids[0] #=> String
1146
+ #
1147
+ # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/BatchReplaceClusterNodes AWS API Documentation
1148
+ #
1149
+ # @overload batch_replace_cluster_nodes(params = {})
1150
+ # @param [Hash] params ({})
1151
+ def batch_replace_cluster_nodes(params = {}, options = {})
1152
+ req = build_request(:batch_replace_cluster_nodes, params)
1153
+ req.send_request(options)
1154
+ end
1155
+
953
1156
  # Creates an *action*. An action is a lineage tracking entity that
954
1157
  # represents an action or activity. For example, a model deployment or
955
1158
  # an HPO job. Generally, an action involves at least one input or output
@@ -2725,6 +2928,10 @@ module Aws::SageMaker
2725
2928
  # accelerators: 1,
2726
2929
  # v_cpu: 1.0,
2727
2930
  # memory_in_gi_b: 1.0,
2931
+ # accelerator_partition: {
2932
+ # type: "mig-1g.5gb", # required, accepts mig-1g.5gb, mig-1g.10gb, mig-1g.18gb, mig-1g.20gb, mig-1g.23gb, mig-1g.35gb, mig-1g.45gb, mig-1g.47gb, mig-2g.10gb, mig-2g.20gb, mig-2g.35gb, mig-2g.45gb, mig-2g.47gb, mig-3g.20gb, mig-3g.40gb, mig-3g.71gb, mig-3g.90gb, mig-3g.93gb, mig-4g.20gb, mig-4g.40gb, mig-4g.71gb, mig-4g.90gb, mig-4g.93gb, mig-7g.40gb, mig-7g.80gb, mig-7g.141gb, mig-7g.180gb, mig-7g.186gb
2933
+ # count: 1, # required
2934
+ # },
2728
2935
  # },
2729
2936
  # ],
2730
2937
  # resource_sharing_config: {
@@ -13912,6 +14119,8 @@ module Aws::SageMaker
13912
14119
  # resp.compute_quota_config.compute_quota_resources[0].accelerators #=> Integer
13913
14120
  # resp.compute_quota_config.compute_quota_resources[0].v_cpu #=> Float
13914
14121
  # resp.compute_quota_config.compute_quota_resources[0].memory_in_gi_b #=> Float
14122
+ # resp.compute_quota_config.compute_quota_resources[0].accelerator_partition.type #=> String, one of "mig-1g.5gb", "mig-1g.10gb", "mig-1g.18gb", "mig-1g.20gb", "mig-1g.23gb", "mig-1g.35gb", "mig-1g.45gb", "mig-1g.47gb", "mig-2g.10gb", "mig-2g.20gb", "mig-2g.35gb", "mig-2g.45gb", "mig-2g.47gb", "mig-3g.20gb", "mig-3g.40gb", "mig-3g.71gb", "mig-3g.90gb", "mig-3g.93gb", "mig-4g.20gb", "mig-4g.40gb", "mig-4g.71gb", "mig-4g.90gb", "mig-4g.93gb", "mig-7g.40gb", "mig-7g.80gb", "mig-7g.141gb", "mig-7g.180gb", "mig-7g.186gb"
14123
+ # resp.compute_quota_config.compute_quota_resources[0].accelerator_partition.count #=> Integer
13915
14124
  # resp.compute_quota_config.resource_sharing_config.strategy #=> String, one of "Lend", "DontLend", "LendAndBorrow"
13916
14125
  # resp.compute_quota_config.resource_sharing_config.borrow_limit #=> Integer
13917
14126
  # resp.compute_quota_config.preempt_team_tasks #=> String, one of "Never", "LowerPriority"
@@ -18411,7 +18620,7 @@ module Aws::SageMaker
18411
18620
  # resp.available_spare_instance_count #=> Integer
18412
18621
  # resp.total_ultra_server_count #=> Integer
18413
18622
  # resp.target_resources #=> Array
18414
- # resp.target_resources[0] #=> String, one of "training-job", "hyperpod-cluster"
18623
+ # resp.target_resources[0] #=> String, one of "training-job", "hyperpod-cluster", "endpoint"
18415
18624
  # resp.reserved_capacity_summaries #=> Array
18416
18625
  # resp.reserved_capacity_summaries[0].reserved_capacity_arn #=> String
18417
18626
  # resp.reserved_capacity_summaries[0].reserved_capacity_type #=> String, one of "UltraServer", "Instance"
@@ -20350,6 +20559,7 @@ module Aws::SageMaker
20350
20559
  # resp.cluster_node_summaries[0].instance_status.status #=> String, one of "Running", "Failure", "Pending", "ShuttingDown", "SystemUpdating", "DeepHealthCheckInProgress", "NotFound"
20351
20560
  # resp.cluster_node_summaries[0].instance_status.message #=> String
20352
20561
  # resp.cluster_node_summaries[0].ultra_server_info.id #=> String
20562
+ # resp.cluster_node_summaries[0].private_dns_hostname #=> String
20353
20563
  #
20354
20564
  # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/ListClusterNodes AWS API Documentation
20355
20565
  #
@@ -20813,6 +21023,8 @@ module Aws::SageMaker
20813
21023
  # resp.compute_quota_summaries[0].compute_quota_config.compute_quota_resources[0].accelerators #=> Integer
20814
21024
  # resp.compute_quota_summaries[0].compute_quota_config.compute_quota_resources[0].v_cpu #=> Float
20815
21025
  # resp.compute_quota_summaries[0].compute_quota_config.compute_quota_resources[0].memory_in_gi_b #=> Float
21026
+ # resp.compute_quota_summaries[0].compute_quota_config.compute_quota_resources[0].accelerator_partition.type #=> String, one of "mig-1g.5gb", "mig-1g.10gb", "mig-1g.18gb", "mig-1g.20gb", "mig-1g.23gb", "mig-1g.35gb", "mig-1g.45gb", "mig-1g.47gb", "mig-2g.10gb", "mig-2g.20gb", "mig-2g.35gb", "mig-2g.45gb", "mig-2g.47gb", "mig-3g.20gb", "mig-3g.40gb", "mig-3g.71gb", "mig-3g.90gb", "mig-3g.93gb", "mig-4g.20gb", "mig-4g.40gb", "mig-4g.71gb", "mig-4g.90gb", "mig-4g.93gb", "mig-7g.40gb", "mig-7g.80gb", "mig-7g.141gb", "mig-7g.180gb", "mig-7g.186gb"
21027
+ # resp.compute_quota_summaries[0].compute_quota_config.compute_quota_resources[0].accelerator_partition.count #=> Integer
20816
21028
  # resp.compute_quota_summaries[0].compute_quota_config.resource_sharing_config.strategy #=> String, one of "Lend", "DontLend", "LendAndBorrow"
20817
21029
  # resp.compute_quota_summaries[0].compute_quota_config.resource_sharing_config.borrow_limit #=> Integer
20818
21030
  # resp.compute_quota_summaries[0].compute_quota_config.preempt_team_tasks #=> String, one of "Never", "LowerPriority"
@@ -25460,7 +25672,7 @@ module Aws::SageMaker
25460
25672
  # resp.training_plan_summaries[0].in_use_instance_count #=> Integer
25461
25673
  # resp.training_plan_summaries[0].total_ultra_server_count #=> Integer
25462
25674
  # resp.training_plan_summaries[0].target_resources #=> Array
25463
- # resp.training_plan_summaries[0].target_resources[0] #=> String, one of "training-job", "hyperpod-cluster"
25675
+ # resp.training_plan_summaries[0].target_resources[0] #=> String, one of "training-job", "hyperpod-cluster", "endpoint"
25464
25676
  # resp.training_plan_summaries[0].reserved_capacity_summaries #=> Array
25465
25677
  # resp.training_plan_summaries[0].reserved_capacity_summaries[0].reserved_capacity_arn #=> String
25466
25678
  # resp.training_plan_summaries[0].reserved_capacity_summaries[0].reserved_capacity_type #=> String, one of "UltraServer", "Instance"
@@ -26481,7 +26693,7 @@ module Aws::SageMaker
26481
26693
  #
26482
26694
  # @option params [required, Array<String>] :target_resources
26483
26695
  # The target resources (e.g., SageMaker Training Jobs, SageMaker
26484
- # HyperPod) to search for in the offerings.
26696
+ # HyperPod, SageMaker Endpoints) to search for in the offerings.
26485
26697
  #
26486
26698
  # Training plans are specific to their target resource.
26487
26699
  #
@@ -26491,6 +26703,10 @@ module Aws::SageMaker
26491
26703
  # * A training plan for HyperPod clusters can be used exclusively to
26492
26704
  # provide compute resources to a cluster's instance group.
26493
26705
  #
26706
+ # * A training plan for SageMaker endpoints can be used exclusively to
26707
+ # provide compute resources to SageMaker endpoints for model
26708
+ # deployment.
26709
+ #
26494
26710
  # @return [Types::SearchTrainingPlanOfferingsResponse] Returns a {Seahorse::Client::Response response} object which responds to the following methods:
26495
26711
  #
26496
26712
  # * {Types::SearchTrainingPlanOfferingsResponse#training_plan_offerings #training_plan_offerings} => Array&lt;Types::TrainingPlanOffering&gt;
@@ -26505,7 +26721,7 @@ module Aws::SageMaker
26505
26721
  # start_time_after: Time.now,
26506
26722
  # end_time_before: Time.now,
26507
26723
  # duration_hours: 1, # required
26508
- # target_resources: ["training-job"], # required, accepts training-job, hyperpod-cluster
26724
+ # target_resources: ["training-job"], # required, accepts training-job, hyperpod-cluster, endpoint
26509
26725
  # })
26510
26726
  #
26511
26727
  # @example Response structure
@@ -26513,7 +26729,7 @@ module Aws::SageMaker
26513
26729
  # resp.training_plan_offerings #=> Array
26514
26730
  # resp.training_plan_offerings[0].training_plan_offering_id #=> String
26515
26731
  # resp.training_plan_offerings[0].target_resources #=> Array
26516
- # resp.training_plan_offerings[0].target_resources[0] #=> String, one of "training-job", "hyperpod-cluster"
26732
+ # resp.training_plan_offerings[0].target_resources[0] #=> String, one of "training-job", "hyperpod-cluster", "endpoint"
26517
26733
  # resp.training_plan_offerings[0].requested_start_time_after #=> Time
26518
26734
  # resp.training_plan_offerings[0].requested_end_time_before #=> Time
26519
26735
  # resp.training_plan_offerings[0].duration_hours #=> Integer
@@ -27951,6 +28167,10 @@ module Aws::SageMaker
27951
28167
  # accelerators: 1,
27952
28168
  # v_cpu: 1.0,
27953
28169
  # memory_in_gi_b: 1.0,
28170
+ # accelerator_partition: {
28171
+ # type: "mig-1g.5gb", # required, accepts mig-1g.5gb, mig-1g.10gb, mig-1g.18gb, mig-1g.20gb, mig-1g.23gb, mig-1g.35gb, mig-1g.45gb, mig-1g.47gb, mig-2g.10gb, mig-2g.20gb, mig-2g.35gb, mig-2g.45gb, mig-2g.47gb, mig-3g.20gb, mig-3g.40gb, mig-3g.71gb, mig-3g.90gb, mig-3g.93gb, mig-4g.20gb, mig-4g.40gb, mig-4g.71gb, mig-4g.90gb, mig-4g.93gb, mig-7g.40gb, mig-7g.80gb, mig-7g.141gb, mig-7g.180gb, mig-7g.186gb
28172
+ # count: 1, # required
28173
+ # },
27954
28174
  # },
27955
28175
  # ],
27956
28176
  # resource_sharing_config: {
@@ -31359,7 +31579,7 @@ module Aws::SageMaker
31359
31579
  tracer: tracer
31360
31580
  )
31361
31581
  context[:gem_name] = 'aws-sdk-sagemaker'
31362
- context[:gem_version] = '1.339.0'
31582
+ context[:gem_version] = '1.340.0'
31363
31583
  Seahorse::Client::Request.new(handlers, context)
31364
31584
  end
31365
31585
 
@@ -14,6 +14,8 @@ module Aws::SageMaker
14
14
 
15
15
  include Seahorse::Model
16
16
 
17
+ AcceleratorPartitionConfig = Shapes::StructureShape.new(name: 'AcceleratorPartitionConfig')
18
+ AcceleratorPartitionConfigCountInteger = Shapes::IntegerShape.new(name: 'AcceleratorPartitionConfigCountInteger')
17
19
  AcceleratorsAmount = Shapes::IntegerShape.new(name: 'AcceleratorsAmount')
18
20
  Accept = Shapes::StringShape.new(name: 'Accept')
19
21
  AcceptEula = Shapes::BooleanShape.new(name: 'AcceptEula')
@@ -211,6 +213,24 @@ module Aws::SageMaker
211
213
  BatchDescribeModelPackageInput = Shapes::StructureShape.new(name: 'BatchDescribeModelPackageInput')
212
214
  BatchDescribeModelPackageOutput = Shapes::StructureShape.new(name: 'BatchDescribeModelPackageOutput')
213
215
  BatchDescribeModelPackageSummary = Shapes::StructureShape.new(name: 'BatchDescribeModelPackageSummary')
216
+ BatchRebootClusterNodeLogicalIdsError = Shapes::StructureShape.new(name: 'BatchRebootClusterNodeLogicalIdsError')
217
+ BatchRebootClusterNodeLogicalIdsErrors = Shapes::ListShape.new(name: 'BatchRebootClusterNodeLogicalIdsErrors')
218
+ BatchRebootClusterNodesError = Shapes::StructureShape.new(name: 'BatchRebootClusterNodesError')
219
+ BatchRebootClusterNodesErrorCode = Shapes::StringShape.new(name: 'BatchRebootClusterNodesErrorCode')
220
+ BatchRebootClusterNodesErrors = Shapes::ListShape.new(name: 'BatchRebootClusterNodesErrors')
221
+ BatchRebootClusterNodesRequest = Shapes::StructureShape.new(name: 'BatchRebootClusterNodesRequest')
222
+ BatchRebootClusterNodesRequestNodeIdsList = Shapes::ListShape.new(name: 'BatchRebootClusterNodesRequestNodeIdsList')
223
+ BatchRebootClusterNodesRequestNodeLogicalIdsList = Shapes::ListShape.new(name: 'BatchRebootClusterNodesRequestNodeLogicalIdsList')
224
+ BatchRebootClusterNodesResponse = Shapes::StructureShape.new(name: 'BatchRebootClusterNodesResponse')
225
+ BatchReplaceClusterNodeLogicalIdsError = Shapes::StructureShape.new(name: 'BatchReplaceClusterNodeLogicalIdsError')
226
+ BatchReplaceClusterNodeLogicalIdsErrors = Shapes::ListShape.new(name: 'BatchReplaceClusterNodeLogicalIdsErrors')
227
+ BatchReplaceClusterNodesError = Shapes::StructureShape.new(name: 'BatchReplaceClusterNodesError')
228
+ BatchReplaceClusterNodesErrorCode = Shapes::StringShape.new(name: 'BatchReplaceClusterNodesErrorCode')
229
+ BatchReplaceClusterNodesErrors = Shapes::ListShape.new(name: 'BatchReplaceClusterNodesErrors')
230
+ BatchReplaceClusterNodesRequest = Shapes::StructureShape.new(name: 'BatchReplaceClusterNodesRequest')
231
+ BatchReplaceClusterNodesRequestNodeIdsList = Shapes::ListShape.new(name: 'BatchReplaceClusterNodesRequestNodeIdsList')
232
+ BatchReplaceClusterNodesRequestNodeLogicalIdsList = Shapes::ListShape.new(name: 'BatchReplaceClusterNodesRequestNodeLogicalIdsList')
233
+ BatchReplaceClusterNodesResponse = Shapes::StructureShape.new(name: 'BatchReplaceClusterNodesResponse')
214
234
  BatchStrategy = Shapes::StringShape.new(name: 'BatchStrategy')
215
235
  BatchTransformInput = Shapes::StructureShape.new(name: 'BatchTransformInput')
216
236
  BestObjectiveNotImproving = Shapes::StructureShape.new(name: 'BestObjectiveNotImproving')
@@ -1569,6 +1589,7 @@ module Aws::SageMaker
1569
1589
  LocalPath = Shapes::StringShape.new(name: 'LocalPath')
1570
1590
  Long = Shapes::IntegerShape.new(name: 'Long')
1571
1591
  LongS3Uri = Shapes::StringShape.new(name: 'LongS3Uri')
1592
+ MIGProfileType = Shapes::StringShape.new(name: 'MIGProfileType')
1572
1593
  MLFramework = Shapes::StringShape.new(name: 'MLFramework')
1573
1594
  MajorMinorVersion = Shapes::StringShape.new(name: 'MajorMinorVersion')
1574
1595
  ManagedInstanceScalingMaxInstanceCount = Shapes::IntegerShape.new(name: 'ManagedInstanceScalingMaxInstanceCount')
@@ -2708,6 +2729,10 @@ module Aws::SageMaker
2708
2729
  WorkteamName = Shapes::StringShape.new(name: 'WorkteamName')
2709
2730
  Workteams = Shapes::ListShape.new(name: 'Workteams')
2710
2731
 
2732
+ AcceleratorPartitionConfig.add_member(:type, Shapes::ShapeRef.new(shape: MIGProfileType, required: true, location_name: "Type"))
2733
+ AcceleratorPartitionConfig.add_member(:count, Shapes::ShapeRef.new(shape: AcceleratorPartitionConfigCountInteger, required: true, location_name: "Count", metadata: {"box" => true}))
2734
+ AcceleratorPartitionConfig.struct_class = Types::AcceleratorPartitionConfig
2735
+
2711
2736
  ActionSource.add_member(:source_uri, Shapes::ShapeRef.new(shape: SourceUri, required: true, location_name: "SourceUri"))
2712
2737
  ActionSource.add_member(:source_type, Shapes::ShapeRef.new(shape: String256, location_name: "SourceType"))
2713
2738
  ActionSource.add_member(:source_id, Shapes::ShapeRef.new(shape: String256, location_name: "SourceId"))
@@ -3210,6 +3235,64 @@ module Aws::SageMaker
3210
3235
  BatchDescribeModelPackageSummary.add_member(:model_approval_status, Shapes::ShapeRef.new(shape: ModelApprovalStatus, location_name: "ModelApprovalStatus"))
3211
3236
  BatchDescribeModelPackageSummary.struct_class = Types::BatchDescribeModelPackageSummary
3212
3237
 
3238
+ BatchRebootClusterNodeLogicalIdsError.add_member(:node_logical_id, Shapes::ShapeRef.new(shape: ClusterNodeLogicalId, required: true, location_name: "NodeLogicalId"))
3239
+ BatchRebootClusterNodeLogicalIdsError.add_member(:error_code, Shapes::ShapeRef.new(shape: BatchRebootClusterNodesErrorCode, required: true, location_name: "ErrorCode"))
3240
+ BatchRebootClusterNodeLogicalIdsError.add_member(:message, Shapes::ShapeRef.new(shape: String, required: true, location_name: "Message"))
3241
+ BatchRebootClusterNodeLogicalIdsError.struct_class = Types::BatchRebootClusterNodeLogicalIdsError
3242
+
3243
+ BatchRebootClusterNodeLogicalIdsErrors.member = Shapes::ShapeRef.new(shape: BatchRebootClusterNodeLogicalIdsError)
3244
+
3245
+ BatchRebootClusterNodesError.add_member(:node_id, Shapes::ShapeRef.new(shape: ClusterNodeId, required: true, location_name: "NodeId"))
3246
+ BatchRebootClusterNodesError.add_member(:error_code, Shapes::ShapeRef.new(shape: BatchRebootClusterNodesErrorCode, required: true, location_name: "ErrorCode"))
3247
+ BatchRebootClusterNodesError.add_member(:message, Shapes::ShapeRef.new(shape: String, required: true, location_name: "Message"))
3248
+ BatchRebootClusterNodesError.struct_class = Types::BatchRebootClusterNodesError
3249
+
3250
+ BatchRebootClusterNodesErrors.member = Shapes::ShapeRef.new(shape: BatchRebootClusterNodesError)
3251
+
3252
+ BatchRebootClusterNodesRequest.add_member(:cluster_name, Shapes::ShapeRef.new(shape: ClusterNameOrArn, required: true, location_name: "ClusterName"))
3253
+ BatchRebootClusterNodesRequest.add_member(:node_ids, Shapes::ShapeRef.new(shape: BatchRebootClusterNodesRequestNodeIdsList, location_name: "NodeIds"))
3254
+ BatchRebootClusterNodesRequest.add_member(:node_logical_ids, Shapes::ShapeRef.new(shape: BatchRebootClusterNodesRequestNodeLogicalIdsList, location_name: "NodeLogicalIds"))
3255
+ BatchRebootClusterNodesRequest.struct_class = Types::BatchRebootClusterNodesRequest
3256
+
3257
+ BatchRebootClusterNodesRequestNodeIdsList.member = Shapes::ShapeRef.new(shape: ClusterNodeId)
3258
+
3259
+ BatchRebootClusterNodesRequestNodeLogicalIdsList.member = Shapes::ShapeRef.new(shape: ClusterNodeLogicalId)
3260
+
3261
+ BatchRebootClusterNodesResponse.add_member(:successful, Shapes::ShapeRef.new(shape: ClusterNodeIds, location_name: "Successful"))
3262
+ BatchRebootClusterNodesResponse.add_member(:failed, Shapes::ShapeRef.new(shape: BatchRebootClusterNodesErrors, location_name: "Failed"))
3263
+ BatchRebootClusterNodesResponse.add_member(:failed_node_logical_ids, Shapes::ShapeRef.new(shape: BatchRebootClusterNodeLogicalIdsErrors, location_name: "FailedNodeLogicalIds"))
3264
+ BatchRebootClusterNodesResponse.add_member(:successful_node_logical_ids, Shapes::ShapeRef.new(shape: ClusterNodeLogicalIdList, location_name: "SuccessfulNodeLogicalIds"))
3265
+ BatchRebootClusterNodesResponse.struct_class = Types::BatchRebootClusterNodesResponse
3266
+
3267
+ BatchReplaceClusterNodeLogicalIdsError.add_member(:node_logical_id, Shapes::ShapeRef.new(shape: ClusterNodeLogicalId, required: true, location_name: "NodeLogicalId"))
3268
+ BatchReplaceClusterNodeLogicalIdsError.add_member(:error_code, Shapes::ShapeRef.new(shape: BatchReplaceClusterNodesErrorCode, required: true, location_name: "ErrorCode"))
3269
+ BatchReplaceClusterNodeLogicalIdsError.add_member(:message, Shapes::ShapeRef.new(shape: String, required: true, location_name: "Message"))
3270
+ BatchReplaceClusterNodeLogicalIdsError.struct_class = Types::BatchReplaceClusterNodeLogicalIdsError
3271
+
3272
+ BatchReplaceClusterNodeLogicalIdsErrors.member = Shapes::ShapeRef.new(shape: BatchReplaceClusterNodeLogicalIdsError)
3273
+
3274
+ BatchReplaceClusterNodesError.add_member(:node_id, Shapes::ShapeRef.new(shape: ClusterNodeId, required: true, location_name: "NodeId"))
3275
+ BatchReplaceClusterNodesError.add_member(:error_code, Shapes::ShapeRef.new(shape: BatchReplaceClusterNodesErrorCode, required: true, location_name: "ErrorCode"))
3276
+ BatchReplaceClusterNodesError.add_member(:message, Shapes::ShapeRef.new(shape: String, required: true, location_name: "Message"))
3277
+ BatchReplaceClusterNodesError.struct_class = Types::BatchReplaceClusterNodesError
3278
+
3279
+ BatchReplaceClusterNodesErrors.member = Shapes::ShapeRef.new(shape: BatchReplaceClusterNodesError)
3280
+
3281
+ BatchReplaceClusterNodesRequest.add_member(:cluster_name, Shapes::ShapeRef.new(shape: ClusterNameOrArn, required: true, location_name: "ClusterName"))
3282
+ BatchReplaceClusterNodesRequest.add_member(:node_ids, Shapes::ShapeRef.new(shape: BatchReplaceClusterNodesRequestNodeIdsList, location_name: "NodeIds"))
3283
+ BatchReplaceClusterNodesRequest.add_member(:node_logical_ids, Shapes::ShapeRef.new(shape: BatchReplaceClusterNodesRequestNodeLogicalIdsList, location_name: "NodeLogicalIds"))
3284
+ BatchReplaceClusterNodesRequest.struct_class = Types::BatchReplaceClusterNodesRequest
3285
+
3286
+ BatchReplaceClusterNodesRequestNodeIdsList.member = Shapes::ShapeRef.new(shape: ClusterNodeId)
3287
+
3288
+ BatchReplaceClusterNodesRequestNodeLogicalIdsList.member = Shapes::ShapeRef.new(shape: ClusterNodeLogicalId)
3289
+
3290
+ BatchReplaceClusterNodesResponse.add_member(:successful, Shapes::ShapeRef.new(shape: ClusterNodeIds, location_name: "Successful"))
3291
+ BatchReplaceClusterNodesResponse.add_member(:failed, Shapes::ShapeRef.new(shape: BatchReplaceClusterNodesErrors, location_name: "Failed"))
3292
+ BatchReplaceClusterNodesResponse.add_member(:failed_node_logical_ids, Shapes::ShapeRef.new(shape: BatchReplaceClusterNodeLogicalIdsErrors, location_name: "FailedNodeLogicalIds"))
3293
+ BatchReplaceClusterNodesResponse.add_member(:successful_node_logical_ids, Shapes::ShapeRef.new(shape: ClusterNodeLogicalIdList, location_name: "SuccessfulNodeLogicalIds"))
3294
+ BatchReplaceClusterNodesResponse.struct_class = Types::BatchReplaceClusterNodesResponse
3295
+
3213
3296
  BatchTransformInput.add_member(:data_captured_destination_s3_uri, Shapes::ShapeRef.new(shape: DestinationS3Uri, required: true, location_name: "DataCapturedDestinationS3Uri"))
3214
3297
  BatchTransformInput.add_member(:dataset_format, Shapes::ShapeRef.new(shape: MonitoringDatasetFormat, required: true, location_name: "DatasetFormat"))
3215
3298
  BatchTransformInput.add_member(:local_path, Shapes::ShapeRef.new(shape: ProcessingLocalPath, required: true, location_name: "LocalPath"))
@@ -3561,6 +3644,7 @@ module Aws::SageMaker
3561
3644
  ClusterNodeSummary.add_member(:last_software_update_time, Shapes::ShapeRef.new(shape: Timestamp, location_name: "LastSoftwareUpdateTime"))
3562
3645
  ClusterNodeSummary.add_member(:instance_status, Shapes::ShapeRef.new(shape: ClusterInstanceStatusDetails, required: true, location_name: "InstanceStatus"))
3563
3646
  ClusterNodeSummary.add_member(:ultra_server_info, Shapes::ShapeRef.new(shape: UltraServerInfo, location_name: "UltraServerInfo"))
3647
+ ClusterNodeSummary.add_member(:private_dns_hostname, Shapes::ShapeRef.new(shape: ClusterPrivateDnsHostname, location_name: "PrivateDnsHostname"))
3564
3648
  ClusterNodeSummary.struct_class = Types::ClusterNodeSummary
3565
3649
 
3566
3650
  ClusterOrchestrator.add_member(:eks, Shapes::ShapeRef.new(shape: ClusterOrchestratorEksConfig, required: true, location_name: "Eks"))
@@ -3703,6 +3787,7 @@ module Aws::SageMaker
3703
3787
  ComputeQuotaResourceConfig.add_member(:accelerators, Shapes::ShapeRef.new(shape: AcceleratorsAmount, location_name: "Accelerators"))
3704
3788
  ComputeQuotaResourceConfig.add_member(:v_cpu, Shapes::ShapeRef.new(shape: VCpuAmount, location_name: "VCpu"))
3705
3789
  ComputeQuotaResourceConfig.add_member(:memory_in_gi_b, Shapes::ShapeRef.new(shape: MemoryInGiBAmount, location_name: "MemoryInGiB"))
3790
+ ComputeQuotaResourceConfig.add_member(:accelerator_partition, Shapes::ShapeRef.new(shape: AcceleratorPartitionConfig, location_name: "AcceleratorPartition"))
3706
3791
  ComputeQuotaResourceConfig.struct_class = Types::ComputeQuotaResourceConfig
3707
3792
 
3708
3793
  ComputeQuotaResourceConfigList.member = Shapes::ShapeRef.new(shape: ComputeQuotaResourceConfig)
@@ -12019,6 +12104,24 @@ module Aws::SageMaker
12019
12104
  o.output = Shapes::ShapeRef.new(shape: BatchDescribeModelPackageOutput)
12020
12105
  end)
12021
12106
 
12107
+ api.add_operation(:batch_reboot_cluster_nodes, Seahorse::Model::Operation.new.tap do |o|
12108
+ o.name = "BatchRebootClusterNodes"
12109
+ o.http_method = "POST"
12110
+ o.http_request_uri = "/"
12111
+ o.input = Shapes::ShapeRef.new(shape: BatchRebootClusterNodesRequest)
12112
+ o.output = Shapes::ShapeRef.new(shape: BatchRebootClusterNodesResponse)
12113
+ o.errors << Shapes::ShapeRef.new(shape: ResourceNotFound)
12114
+ end)
12115
+
12116
+ api.add_operation(:batch_replace_cluster_nodes, Seahorse::Model::Operation.new.tap do |o|
12117
+ o.name = "BatchReplaceClusterNodes"
12118
+ o.http_method = "POST"
12119
+ o.http_request_uri = "/"
12120
+ o.input = Shapes::ShapeRef.new(shape: BatchReplaceClusterNodesRequest)
12121
+ o.output = Shapes::ShapeRef.new(shape: BatchReplaceClusterNodesResponse)
12122
+ o.errors << Shapes::ShapeRef.new(shape: ResourceNotFound)
12123
+ end)
12124
+
12022
12125
  api.add_operation(:create_action, Seahorse::Model::Operation.new.tap do |o|
12023
12126
  o.name = "CreateAction"
12024
12127
  o.http_method = "POST"
@@ -10,6 +10,33 @@
10
10
  module Aws::SageMaker
11
11
  module Types
12
12
 
13
+ # Configuration for allocating accelerator partitions.
14
+ #
15
+ # @!attribute [rw] type
16
+ # The Multi-Instance GPU (MIG) profile type that defines the partition
17
+ # configuration. The profile specifies the compute and memory
18
+ # allocation for each partition instance. The available profile types
19
+ # depend on the instance type specified in the compute quota
20
+ # configuration.
21
+ # @return [String]
22
+ #
23
+ # @!attribute [rw] count
24
+ # The number of accelerator partitions to allocate with the specified
25
+ # partition type. If you don't specify a value for vCPU and
26
+ # MemoryInGiB, SageMaker AI automatically allocates ratio-based values
27
+ # for those parameters based on the accelerator partition count you
28
+ # provide.
29
+ # @return [Integer]
30
+ #
31
+ # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/AcceleratorPartitionConfig AWS API Documentation
32
+ #
33
+ class AcceleratorPartitionConfig < Struct.new(
34
+ :type,
35
+ :count)
36
+ SENSITIVE = []
37
+ include Aws::Structure
38
+ end
39
+
13
40
  # A structure describing the source of an action.
14
41
  #
15
42
  # @!attribute [rw] source_uri
@@ -3452,6 +3479,348 @@ module Aws::SageMaker
3452
3479
  include Aws::Structure
3453
3480
  end
3454
3481
 
3482
+ # Represents an error encountered when rebooting a node (identified by
3483
+ # its logical node ID) from a SageMaker HyperPod cluster.
3484
+ #
3485
+ # @!attribute [rw] node_logical_id
3486
+ # The logical node ID of the node that encountered an error during the
3487
+ # reboot operation.
3488
+ # @return [String]
3489
+ #
3490
+ # @!attribute [rw] error_code
3491
+ # The error code associated with the error encountered when rebooting
3492
+ # a node by logical node ID.
3493
+ #
3494
+ # Possible values:
3495
+ #
3496
+ # * `InstanceIdNotFound`: The node does not exist in the specified
3497
+ # cluster.
3498
+ #
3499
+ # * `InvalidInstanceStatus`: The node is in a state that does not
3500
+ # allow rebooting. Wait for the node to finish any ongoing changes
3501
+ # before retrying.
3502
+ #
3503
+ # * `InstanceIdInUse`: Another operation is already in progress for
3504
+ # this node. Wait for the operation to complete before retrying.
3505
+ #
3506
+ # * `InternalServerError`: An internal error occurred while processing
3507
+ # this node.
3508
+ # @return [String]
3509
+ #
3510
+ # @!attribute [rw] message
3511
+ # A human-readable message describing the error encountered when
3512
+ # rebooting a node by logical node ID.
3513
+ # @return [String]
3514
+ #
3515
+ # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/BatchRebootClusterNodeLogicalIdsError AWS API Documentation
3516
+ #
3517
+ class BatchRebootClusterNodeLogicalIdsError < Struct.new(
3518
+ :node_logical_id,
3519
+ :error_code,
3520
+ :message)
3521
+ SENSITIVE = []
3522
+ include Aws::Structure
3523
+ end
3524
+
3525
+ # Represents an error encountered when rebooting a node from a SageMaker
3526
+ # HyperPod cluster.
3527
+ #
3528
+ # @!attribute [rw] node_id
3529
+ # The EC2 instance ID of the node that encountered an error during the
3530
+ # reboot operation.
3531
+ # @return [String]
3532
+ #
3533
+ # @!attribute [rw] error_code
3534
+ # The error code associated with the error encountered when rebooting
3535
+ # a node.
3536
+ #
3537
+ # Possible values:
3538
+ #
3539
+ # * `InstanceIdNotFound`: The instance does not exist in the specified
3540
+ # cluster.
3541
+ #
3542
+ # * `InvalidInstanceStatus`: The instance is in a state that does not
3543
+ # allow rebooting. Wait for the instance to finish any ongoing
3544
+ # changes before retrying.
3545
+ #
3546
+ # * `InstanceIdInUse`: Another operation is already in progress for
3547
+ # this node. Wait for the operation to complete before retrying.
3548
+ #
3549
+ # * `InternalServerError`: An internal error occurred while processing
3550
+ # this node.
3551
+ # @return [String]
3552
+ #
3553
+ # @!attribute [rw] message
3554
+ # A human-readable message describing the error encountered when
3555
+ # rebooting a node.
3556
+ # @return [String]
3557
+ #
3558
+ # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/BatchRebootClusterNodesError AWS API Documentation
3559
+ #
3560
+ class BatchRebootClusterNodesError < Struct.new(
3561
+ :node_id,
3562
+ :error_code,
3563
+ :message)
3564
+ SENSITIVE = []
3565
+ include Aws::Structure
3566
+ end
3567
+
3568
+ # @!attribute [rw] cluster_name
3569
+ # The name or Amazon Resource Name (ARN) of the SageMaker HyperPod
3570
+ # cluster containing the nodes to reboot.
3571
+ # @return [String]
3572
+ #
3573
+ # @!attribute [rw] node_ids
3574
+ # A list of EC2 instance IDs to reboot using soft recovery. You can
3575
+ # specify between 1 and 25 instance IDs.
3576
+ #
3577
+ # <note markdown="1"> * Either `NodeIds` or `NodeLogicalIds` must be provided (or both),
3578
+ # but at least one is required.
3579
+ #
3580
+ # * Each instance ID must follow the pattern `i-` followed by 17
3581
+ # hexadecimal characters (for example, `i-0123456789abcdef0`).
3582
+ #
3583
+ # </note>
3584
+ # @return [Array<String>]
3585
+ #
3586
+ # @!attribute [rw] node_logical_ids
3587
+ # A list of logical node IDs to reboot using soft recovery. You can
3588
+ # specify between 1 and 25 logical node IDs.
3589
+ #
3590
+ # The `NodeLogicalId` is a unique identifier that persists throughout
3591
+ # the node's lifecycle and can be used to track nodes that are still
3592
+ # being provisioned and don't yet have an EC2 instance ID assigned.
3593
+ #
3594
+ # * This parameter is only supported for clusters using `Continuous`
3595
+ # as the `NodeProvisioningMode`. For clusters using the default
3596
+ # provisioning mode, use `NodeIds` instead.
3597
+ #
3598
+ # * Either `NodeIds` or `NodeLogicalIds` must be provided (or both),
3599
+ # but at least one is required.
3600
+ # @return [Array<String>]
3601
+ #
3602
+ # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/BatchRebootClusterNodesRequest AWS API Documentation
3603
+ #
3604
+ class BatchRebootClusterNodesRequest < Struct.new(
3605
+ :cluster_name,
3606
+ :node_ids,
3607
+ :node_logical_ids)
3608
+ SENSITIVE = []
3609
+ include Aws::Structure
3610
+ end
3611
+
3612
+ # @!attribute [rw] successful
3613
+ # A list of EC2 instance IDs for which the reboot operation was
3614
+ # successfully initiated.
3615
+ # @return [Array<String>]
3616
+ #
3617
+ # @!attribute [rw] failed
3618
+ # A list of errors encountered for EC2 instance IDs that could not be
3619
+ # rebooted. Each error includes the instance ID, an error code, and a
3620
+ # descriptive message.
3621
+ # @return [Array<Types::BatchRebootClusterNodesError>]
3622
+ #
3623
+ # @!attribute [rw] failed_node_logical_ids
3624
+ # A list of errors encountered for logical node IDs that could not be
3625
+ # rebooted. Each error includes the logical node ID, an error code,
3626
+ # and a descriptive message. This field is only present when
3627
+ # `NodeLogicalIds` were provided in the request.
3628
+ # @return [Array<Types::BatchRebootClusterNodeLogicalIdsError>]
3629
+ #
3630
+ # @!attribute [rw] successful_node_logical_ids
3631
+ # A list of logical node IDs for which the reboot operation was
3632
+ # successfully initiated. This field is only present when
3633
+ # `NodeLogicalIds` were provided in the request.
3634
+ # @return [Array<String>]
3635
+ #
3636
+ # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/BatchRebootClusterNodesResponse AWS API Documentation
3637
+ #
3638
+ class BatchRebootClusterNodesResponse < Struct.new(
3639
+ :successful,
3640
+ :failed,
3641
+ :failed_node_logical_ids,
3642
+ :successful_node_logical_ids)
3643
+ SENSITIVE = []
3644
+ include Aws::Structure
3645
+ end
3646
+
3647
+ # Represents an error encountered when replacing a node (identified by
3648
+ # its logical node ID) in a SageMaker HyperPod cluster.
3649
+ #
3650
+ # @!attribute [rw] node_logical_id
3651
+ # The logical node ID of the node that encountered an error during the
3652
+ # replacement operation.
3653
+ # @return [String]
3654
+ #
3655
+ # @!attribute [rw] error_code
3656
+ # The error code associated with the error encountered when replacing
3657
+ # a node by logical node ID.
3658
+ #
3659
+ # Possible values:
3660
+ #
3661
+ # * `InstanceIdNotFound`: The node does not exist in the specified
3662
+ # cluster.
3663
+ #
3664
+ # * `InvalidInstanceStatus`: The node is in a state that does not
3665
+ # allow replacement. Wait for the node to finish any ongoing changes
3666
+ # before retrying.
3667
+ #
3668
+ # * `InstanceIdInUse`: Another operation is already in progress for
3669
+ # this node. Wait for the operation to complete before retrying.
3670
+ #
3671
+ # * `InternalServerError`: An internal error occurred while processing
3672
+ # this node.
3673
+ # @return [String]
3674
+ #
3675
+ # @!attribute [rw] message
3676
+ # A human-readable message describing the error encountered when
3677
+ # replacing a node by logical node ID.
3678
+ # @return [String]
3679
+ #
3680
+ # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/BatchReplaceClusterNodeLogicalIdsError AWS API Documentation
3681
+ #
3682
+ class BatchReplaceClusterNodeLogicalIdsError < Struct.new(
3683
+ :node_logical_id,
3684
+ :error_code,
3685
+ :message)
3686
+ SENSITIVE = []
3687
+ include Aws::Structure
3688
+ end
3689
+
3690
+ # Represents an error encountered when replacing a node in a SageMaker
3691
+ # HyperPod cluster.
3692
+ #
3693
+ # @!attribute [rw] node_id
3694
+ # The EC2 instance ID of the node that encountered an error during the
3695
+ # replacement operation.
3696
+ # @return [String]
3697
+ #
3698
+ # @!attribute [rw] error_code
3699
+ # The error code associated with the error encountered when replacing
3700
+ # a node.
3701
+ #
3702
+ # Possible values:
3703
+ #
3704
+ # * `InstanceIdNotFound`: The instance does not exist in the specified
3705
+ # cluster.
3706
+ #
3707
+ # * `InvalidInstanceStatus`: The instance is in a state that does not
3708
+ # allow replacement. Wait for the instance to finish any ongoing
3709
+ # changes before retrying.
3710
+ #
3711
+ # * `InstanceIdInUse`: Another operation is already in progress for
3712
+ # this node. Wait for the operation to complete before retrying.
3713
+ #
3714
+ # * `InternalServerError`: An internal error occurred while processing
3715
+ # this node.
3716
+ # @return [String]
3717
+ #
3718
+ # @!attribute [rw] message
3719
+ # A human-readable message describing the error encountered when
3720
+ # replacing a node.
3721
+ # @return [String]
3722
+ #
3723
+ # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/BatchReplaceClusterNodesError AWS API Documentation
3724
+ #
3725
+ class BatchReplaceClusterNodesError < Struct.new(
3726
+ :node_id,
3727
+ :error_code,
3728
+ :message)
3729
+ SENSITIVE = []
3730
+ include Aws::Structure
3731
+ end
3732
+
3733
+ # @!attribute [rw] cluster_name
3734
+ # The name or Amazon Resource Name (ARN) of the SageMaker HyperPod
3735
+ # cluster containing the nodes to replace.
3736
+ # @return [String]
3737
+ #
3738
+ # @!attribute [rw] node_ids
3739
+ # A list of EC2 instance IDs to replace with new hardware. You can
3740
+ # specify between 1 and 25 instance IDs.
3741
+ #
3742
+ # Replace operations destroy all instance volumes (root and
3743
+ # secondary). Ensure you have backed up any important data before
3744
+ # proceeding.
3745
+ #
3746
+ # <note markdown="1"> * Either `NodeIds` or `NodeLogicalIds` must be provided (or both),
3747
+ # but at least one is required.
3748
+ #
3749
+ # * Each instance ID must follow the pattern `i-` followed by 17
3750
+ # hexadecimal characters (for example, `i-0123456789abcdef0`).
3751
+ #
3752
+ # * For SageMaker HyperPod clusters using the Slurm workload manager,
3753
+ # you cannot replace instances that are configured as Slurm
3754
+ # controller nodes.
3755
+ #
3756
+ # </note>
3757
+ # @return [Array<String>]
3758
+ #
3759
+ # @!attribute [rw] node_logical_ids
3760
+ # A list of logical node IDs to replace with new hardware. You can
3761
+ # specify between 1 and 25 logical node IDs.
3762
+ #
3763
+ # The `NodeLogicalId` is a unique identifier that persists throughout
3764
+ # the node's lifecycle and can be used to track nodes that are still
3765
+ # being provisioned and don't yet have an EC2 instance ID assigned.
3766
+ #
3767
+ # * Replace operations destroy all instance volumes (root and
3768
+ # secondary). Ensure you have backed up any important data before
3769
+ # proceeding.
3770
+ #
3771
+ # * This parameter is only supported for clusters using `Continuous`
3772
+ # as the `NodeProvisioningMode`. For clusters using the default
3773
+ # provisioning mode, use `NodeIds` instead.
3774
+ #
3775
+ # * Either `NodeIds` or `NodeLogicalIds` must be provided (or both),
3776
+ # but at least one is required.
3777
+ # @return [Array<String>]
3778
+ #
3779
+ # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/BatchReplaceClusterNodesRequest AWS API Documentation
3780
+ #
3781
+ class BatchReplaceClusterNodesRequest < Struct.new(
3782
+ :cluster_name,
3783
+ :node_ids,
3784
+ :node_logical_ids)
3785
+ SENSITIVE = []
3786
+ include Aws::Structure
3787
+ end
3788
+
3789
+ # @!attribute [rw] successful
3790
+ # A list of EC2 instance IDs for which the replacement operation was
3791
+ # successfully initiated.
3792
+ # @return [Array<String>]
3793
+ #
3794
+ # @!attribute [rw] failed
3795
+ # A list of errors encountered for EC2 instance IDs that could not be
3796
+ # replaced. Each error includes the instance ID, an error code, and a
3797
+ # descriptive message.
3798
+ # @return [Array<Types::BatchReplaceClusterNodesError>]
3799
+ #
3800
+ # @!attribute [rw] failed_node_logical_ids
3801
+ # A list of errors encountered for logical node IDs that could not be
3802
+ # replaced. Each error includes the logical node ID, an error code,
3803
+ # and a descriptive message. This field is only present when
3804
+ # `NodeLogicalIds` were provided in the request.
3805
+ # @return [Array<Types::BatchReplaceClusterNodeLogicalIdsError>]
3806
+ #
3807
+ # @!attribute [rw] successful_node_logical_ids
3808
+ # A list of logical node IDs for which the replacement operation was
3809
+ # successfully initiated. This field is only present when
3810
+ # `NodeLogicalIds` were provided in the request.
3811
+ # @return [Array<String>]
3812
+ #
3813
+ # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/BatchReplaceClusterNodesResponse AWS API Documentation
3814
+ #
3815
+ class BatchReplaceClusterNodesResponse < Struct.new(
3816
+ :successful,
3817
+ :failed,
3818
+ :failed_node_logical_ids,
3819
+ :successful_node_logical_ids)
3820
+ SENSITIVE = []
3821
+ include Aws::Structure
3822
+ end
3823
+
3455
3824
  # Input object for the batch transform job.
3456
3825
  #
3457
3826
  # @!attribute [rw] data_captured_destination_s3_uri
@@ -5536,6 +5905,10 @@ module Aws::SageMaker
5536
5905
  # Contains information about the UltraServer.
5537
5906
  # @return [Types::UltraServerInfo]
5538
5907
  #
5908
+ # @!attribute [rw] private_dns_hostname
5909
+ # The private DNS hostname of the SageMaker HyperPod cluster node.
5910
+ # @return [String]
5911
+ #
5539
5912
  # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/ClusterNodeSummary AWS API Documentation
5540
5913
  #
5541
5914
  class ClusterNodeSummary < Struct.new(
@@ -5546,7 +5919,8 @@ module Aws::SageMaker
5546
5919
  :launch_time,
5547
5920
  :last_software_update_time,
5548
5921
  :instance_status,
5549
- :ultra_server_info)
5922
+ :ultra_server_info,
5923
+ :private_dns_hostname)
5550
5924
  SENSITIVE = []
5551
5925
  include Aws::Structure
5552
5926
  end
@@ -6294,6 +6668,11 @@ module Aws::SageMaker
6294
6668
  # Accelerators are set to 0.
6295
6669
  # @return [Float]
6296
6670
  #
6671
+ # @!attribute [rw] accelerator_partition
6672
+ # The accelerator partition configuration for fractional GPU
6673
+ # allocation.
6674
+ # @return [Types::AcceleratorPartitionConfig]
6675
+ #
6297
6676
  # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/ComputeQuotaResourceConfig AWS API Documentation
6298
6677
  #
6299
6678
  class ComputeQuotaResourceConfig < Struct.new(
@@ -6301,7 +6680,8 @@ module Aws::SageMaker
6301
6680
  :count,
6302
6681
  :accelerators,
6303
6682
  :v_cpu,
6304
- :memory_in_gi_b)
6683
+ :memory_in_gi_b,
6684
+ :accelerator_partition)
6305
6685
  SENSITIVE = []
6306
6686
  include Aws::Structure
6307
6687
  end
@@ -20816,7 +21196,7 @@ module Aws::SageMaker
20816
21196
  #
20817
21197
  # @!attribute [rw] target_resources
20818
21198
  # The target resources (e.g., SageMaker Training Jobs, SageMaker
20819
- # HyperPod) that can use this training plan.
21199
+ # HyperPod, SageMaker Endpoints) that can use this training plan.
20820
21200
  #
20821
21201
  # Training plans are specific to their target resource.
20822
21202
  #
@@ -20825,6 +21205,10 @@ module Aws::SageMaker
20825
21205
  #
20826
21206
  # * A training plan for HyperPod clusters can be used exclusively to
20827
21207
  # provide compute resources to a cluster's instance group.
21208
+ #
21209
+ # * A training plan for SageMaker endpoints can be used exclusively to
21210
+ # provide compute resources to SageMaker endpoints for model
21211
+ # deployment.
20828
21212
  # @return [Array<String>]
20829
21213
  #
20830
21214
  # @!attribute [rw] reserved_capacity_summaries
@@ -45661,7 +46045,7 @@ module Aws::SageMaker
45661
46045
  #
45662
46046
  # @!attribute [rw] target_resources
45663
46047
  # The target resources (e.g., SageMaker Training Jobs, SageMaker
45664
- # HyperPod) to search for in the offerings.
46048
+ # HyperPod, SageMaker Endpoints) to search for in the offerings.
45665
46049
  #
45666
46050
  # Training plans are specific to their target resource.
45667
46051
  #
@@ -45670,6 +46054,10 @@ module Aws::SageMaker
45670
46054
  #
45671
46055
  # * A training plan for HyperPod clusters can be used exclusively to
45672
46056
  # provide compute resources to a cluster's instance group.
46057
+ #
46058
+ # * A training plan for SageMaker endpoints can be used exclusively to
46059
+ # provide compute resources to SageMaker endpoints for model
46060
+ # deployment.
45673
46061
  # @return [Array<String>]
45674
46062
  #
45675
46063
  # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/SearchTrainingPlanOfferingsRequest AWS API Documentation
@@ -48905,7 +49293,7 @@ module Aws::SageMaker
48905
49293
  #
48906
49294
  # @!attribute [rw] target_resources
48907
49295
  # The target resources (e.g., SageMaker Training Jobs, SageMaker
48908
- # HyperPod) for this training plan offering.
49296
+ # HyperPod, SageMaker Endpoints) for this training plan offering.
48909
49297
  #
48910
49298
  # Training plans are specific to their target resource.
48911
49299
  #
@@ -48914,6 +49302,10 @@ module Aws::SageMaker
48914
49302
  #
48915
49303
  # * A training plan for HyperPod clusters can be used exclusively to
48916
49304
  # provide compute resources to a cluster's instance group.
49305
+ #
49306
+ # * A training plan for SageMaker endpoints can be used exclusively to
49307
+ # provide compute resources to SageMaker endpoints for model
49308
+ # deployment.
48917
49309
  # @return [Array<String>]
48918
49310
  #
48919
49311
  # @!attribute [rw] requested_start_time_after
@@ -49035,8 +49427,8 @@ module Aws::SageMaker
49035
49427
  # @return [Integer]
49036
49428
  #
49037
49429
  # @!attribute [rw] target_resources
49038
- # The target resources (e.g., training jobs, HyperPod clusters) that
49039
- # can use this training plan.
49430
+ # The target resources (e.g., training jobs, HyperPod clusters,
49431
+ # Endpoints) that can use this training plan.
49040
49432
  #
49041
49433
  # Training plans are specific to their target resource.
49042
49434
  #
@@ -49045,6 +49437,10 @@ module Aws::SageMaker
49045
49437
  #
49046
49438
  # * A training plan for HyperPod clusters can be used exclusively to
49047
49439
  # provide compute resources to a cluster's instance group.
49440
+ #
49441
+ # * A training plan for SageMaker endpoints can be used exclusively to
49442
+ # provide compute resources to SageMaker endpoints for model
49443
+ # deployment.
49048
49444
  # @return [Array<String>]
49049
49445
  #
49050
49446
  # @!attribute [rw] reserved_capacity_summaries
@@ -55,7 +55,7 @@ module Aws::SageMaker
55
55
  autoload :EndpointProvider, 'aws-sdk-sagemaker/endpoint_provider'
56
56
  autoload :Endpoints, 'aws-sdk-sagemaker/endpoints'
57
57
 
58
- GEM_VERSION = '1.339.0'
58
+ GEM_VERSION = '1.340.0'
59
59
 
60
60
  end
61
61
 
data/sig/client.rbs CHANGED
@@ -181,6 +181,36 @@ module Aws
181
181
  ) -> _BatchDescribeModelPackageResponseSuccess
182
182
  | (Hash[Symbol, untyped] params, ?Hash[Symbol, untyped] options) -> _BatchDescribeModelPackageResponseSuccess
183
183
 
184
+ interface _BatchRebootClusterNodesResponseSuccess
185
+ include ::Seahorse::Client::_ResponseSuccess[Types::BatchRebootClusterNodesResponse]
186
+ def successful: () -> ::Array[::String]
187
+ def failed: () -> ::Array[Types::BatchRebootClusterNodesError]
188
+ def failed_node_logical_ids: () -> ::Array[Types::BatchRebootClusterNodeLogicalIdsError]
189
+ def successful_node_logical_ids: () -> ::Array[::String]
190
+ end
191
+ # https://docs.aws.amazon.com/sdk-for-ruby/v3/api/Aws/SageMaker/Client.html#batch_reboot_cluster_nodes-instance_method
192
+ def batch_reboot_cluster_nodes: (
193
+ cluster_name: ::String,
194
+ ?node_ids: Array[::String],
195
+ ?node_logical_ids: Array[::String]
196
+ ) -> _BatchRebootClusterNodesResponseSuccess
197
+ | (Hash[Symbol, untyped] params, ?Hash[Symbol, untyped] options) -> _BatchRebootClusterNodesResponseSuccess
198
+
199
+ interface _BatchReplaceClusterNodesResponseSuccess
200
+ include ::Seahorse::Client::_ResponseSuccess[Types::BatchReplaceClusterNodesResponse]
201
+ def successful: () -> ::Array[::String]
202
+ def failed: () -> ::Array[Types::BatchReplaceClusterNodesError]
203
+ def failed_node_logical_ids: () -> ::Array[Types::BatchReplaceClusterNodeLogicalIdsError]
204
+ def successful_node_logical_ids: () -> ::Array[::String]
205
+ end
206
+ # https://docs.aws.amazon.com/sdk-for-ruby/v3/api/Aws/SageMaker/Client.html#batch_replace_cluster_nodes-instance_method
207
+ def batch_replace_cluster_nodes: (
208
+ cluster_name: ::String,
209
+ ?node_ids: Array[::String],
210
+ ?node_logical_ids: Array[::String]
211
+ ) -> _BatchReplaceClusterNodesResponseSuccess
212
+ | (Hash[Symbol, untyped] params, ?Hash[Symbol, untyped] options) -> _BatchReplaceClusterNodesResponseSuccess
213
+
184
214
  interface _CreateActionResponseSuccess
185
215
  include ::Seahorse::Client::_ResponseSuccess[Types::CreateActionResponse]
186
216
  def action_arn: () -> ::String
@@ -1013,7 +1043,11 @@ module Aws
1013
1043
  count: ::Integer?,
1014
1044
  accelerators: ::Integer?,
1015
1045
  v_cpu: ::Float?,
1016
- memory_in_gi_b: ::Float?
1046
+ memory_in_gi_b: ::Float?,
1047
+ accelerator_partition: {
1048
+ type: ("mig-1g.5gb" | "mig-1g.10gb" | "mig-1g.18gb" | "mig-1g.20gb" | "mig-1g.23gb" | "mig-1g.35gb" | "mig-1g.45gb" | "mig-1g.47gb" | "mig-2g.10gb" | "mig-2g.20gb" | "mig-2g.35gb" | "mig-2g.45gb" | "mig-2g.47gb" | "mig-3g.20gb" | "mig-3g.40gb" | "mig-3g.71gb" | "mig-3g.90gb" | "mig-3g.93gb" | "mig-4g.20gb" | "mig-4g.40gb" | "mig-4g.71gb" | "mig-4g.90gb" | "mig-4g.93gb" | "mig-7g.40gb" | "mig-7g.80gb" | "mig-7g.141gb" | "mig-7g.180gb" | "mig-7g.186gb"),
1049
+ count: ::Integer
1050
+ }?
1017
1051
  },
1018
1052
  ]?,
1019
1053
  resource_sharing_config: {
@@ -6680,7 +6714,7 @@ module Aws
6680
6714
  def unhealthy_instance_count: () -> ::Integer
6681
6715
  def available_spare_instance_count: () -> ::Integer
6682
6716
  def total_ultra_server_count: () -> ::Integer
6683
- def target_resources: () -> ::Array[("training-job" | "hyperpod-cluster")]
6717
+ def target_resources: () -> ::Array[("training-job" | "hyperpod-cluster" | "endpoint")]
6684
6718
  def reserved_capacity_summaries: () -> ::Array[Types::ReservedCapacitySummary]
6685
6719
  end
6686
6720
  # https://docs.aws.amazon.com/sdk-for-ruby/v3/api/Aws/SageMaker/Client.html#describe_training_plan-instance_method
@@ -8627,7 +8661,7 @@ module Aws
8627
8661
  ?start_time_after: ::Time,
8628
8662
  ?end_time_before: ::Time,
8629
8663
  duration_hours: ::Integer,
8630
- target_resources: Array[("training-job" | "hyperpod-cluster")]
8664
+ target_resources: Array[("training-job" | "hyperpod-cluster" | "endpoint")]
8631
8665
  ) -> _SearchTrainingPlanOfferingsResponseSuccess
8632
8666
  | (Hash[Symbol, untyped] params, ?Hash[Symbol, untyped] options) -> _SearchTrainingPlanOfferingsResponseSuccess
8633
8667
 
@@ -9150,7 +9184,11 @@ module Aws
9150
9184
  count: ::Integer?,
9151
9185
  accelerators: ::Integer?,
9152
9186
  v_cpu: ::Float?,
9153
- memory_in_gi_b: ::Float?
9187
+ memory_in_gi_b: ::Float?,
9188
+ accelerator_partition: {
9189
+ type: ("mig-1g.5gb" | "mig-1g.10gb" | "mig-1g.18gb" | "mig-1g.20gb" | "mig-1g.23gb" | "mig-1g.35gb" | "mig-1g.45gb" | "mig-1g.47gb" | "mig-2g.10gb" | "mig-2g.20gb" | "mig-2g.35gb" | "mig-2g.45gb" | "mig-2g.47gb" | "mig-3g.20gb" | "mig-3g.40gb" | "mig-3g.71gb" | "mig-3g.90gb" | "mig-3g.93gb" | "mig-4g.20gb" | "mig-4g.40gb" | "mig-4g.71gb" | "mig-4g.90gb" | "mig-4g.93gb" | "mig-7g.40gb" | "mig-7g.80gb" | "mig-7g.141gb" | "mig-7g.180gb" | "mig-7g.186gb"),
9190
+ count: ::Integer
9191
+ }?
9154
9192
  },
9155
9193
  ]?,
9156
9194
  resource_sharing_config: {
data/sig/types.rbs CHANGED
@@ -8,6 +8,12 @@
8
8
  module Aws::SageMaker
9
9
  module Types
10
10
 
11
+ class AcceleratorPartitionConfig
12
+ attr_accessor type: ("mig-1g.5gb" | "mig-1g.10gb" | "mig-1g.18gb" | "mig-1g.20gb" | "mig-1g.23gb" | "mig-1g.35gb" | "mig-1g.45gb" | "mig-1g.47gb" | "mig-2g.10gb" | "mig-2g.20gb" | "mig-2g.35gb" | "mig-2g.45gb" | "mig-2g.47gb" | "mig-3g.20gb" | "mig-3g.40gb" | "mig-3g.71gb" | "mig-3g.90gb" | "mig-3g.93gb" | "mig-4g.20gb" | "mig-4g.40gb" | "mig-4g.71gb" | "mig-4g.90gb" | "mig-4g.93gb" | "mig-7g.40gb" | "mig-7g.80gb" | "mig-7g.141gb" | "mig-7g.180gb" | "mig-7g.186gb")
13
+ attr_accessor count: ::Integer
14
+ SENSITIVE: []
15
+ end
16
+
11
17
  class ActionSource
12
18
  attr_accessor source_uri: ::String
13
19
  attr_accessor source_type: ::String
@@ -598,6 +604,64 @@ module Aws::SageMaker
598
604
  SENSITIVE: []
599
605
  end
600
606
 
607
+ class BatchRebootClusterNodeLogicalIdsError
608
+ attr_accessor node_logical_id: ::String
609
+ attr_accessor error_code: ("InstanceIdNotFound" | "InvalidInstanceStatus" | "InstanceIdInUse" | "InternalServerError")
610
+ attr_accessor message: ::String
611
+ SENSITIVE: []
612
+ end
613
+
614
+ class BatchRebootClusterNodesError
615
+ attr_accessor node_id: ::String
616
+ attr_accessor error_code: ("InstanceIdNotFound" | "InvalidInstanceStatus" | "InstanceIdInUse" | "InternalServerError")
617
+ attr_accessor message: ::String
618
+ SENSITIVE: []
619
+ end
620
+
621
+ class BatchRebootClusterNodesRequest
622
+ attr_accessor cluster_name: ::String
623
+ attr_accessor node_ids: ::Array[::String]
624
+ attr_accessor node_logical_ids: ::Array[::String]
625
+ SENSITIVE: []
626
+ end
627
+
628
+ class BatchRebootClusterNodesResponse
629
+ attr_accessor successful: ::Array[::String]
630
+ attr_accessor failed: ::Array[Types::BatchRebootClusterNodesError]
631
+ attr_accessor failed_node_logical_ids: ::Array[Types::BatchRebootClusterNodeLogicalIdsError]
632
+ attr_accessor successful_node_logical_ids: ::Array[::String]
633
+ SENSITIVE: []
634
+ end
635
+
636
+ class BatchReplaceClusterNodeLogicalIdsError
637
+ attr_accessor node_logical_id: ::String
638
+ attr_accessor error_code: ("InstanceIdNotFound" | "InvalidInstanceStatus" | "InstanceIdInUse" | "InternalServerError")
639
+ attr_accessor message: ::String
640
+ SENSITIVE: []
641
+ end
642
+
643
+ class BatchReplaceClusterNodesError
644
+ attr_accessor node_id: ::String
645
+ attr_accessor error_code: ("InstanceIdNotFound" | "InvalidInstanceStatus" | "InstanceIdInUse" | "InternalServerError")
646
+ attr_accessor message: ::String
647
+ SENSITIVE: []
648
+ end
649
+
650
+ class BatchReplaceClusterNodesRequest
651
+ attr_accessor cluster_name: ::String
652
+ attr_accessor node_ids: ::Array[::String]
653
+ attr_accessor node_logical_ids: ::Array[::String]
654
+ SENSITIVE: []
655
+ end
656
+
657
+ class BatchReplaceClusterNodesResponse
658
+ attr_accessor successful: ::Array[::String]
659
+ attr_accessor failed: ::Array[Types::BatchReplaceClusterNodesError]
660
+ attr_accessor failed_node_logical_ids: ::Array[Types::BatchReplaceClusterNodeLogicalIdsError]
661
+ attr_accessor successful_node_logical_ids: ::Array[::String]
662
+ SENSITIVE: []
663
+ end
664
+
601
665
  class BatchTransformInput
602
666
  attr_accessor data_captured_destination_s3_uri: ::String
603
667
  attr_accessor dataset_format: Types::MonitoringDatasetFormat
@@ -1005,6 +1069,7 @@ module Aws::SageMaker
1005
1069
  attr_accessor last_software_update_time: ::Time
1006
1070
  attr_accessor instance_status: Types::ClusterInstanceStatusDetails
1007
1071
  attr_accessor ultra_server_info: Types::UltraServerInfo
1072
+ attr_accessor private_dns_hostname: ::String
1008
1073
  SENSITIVE: []
1009
1074
  end
1010
1075
 
@@ -1165,6 +1230,7 @@ module Aws::SageMaker
1165
1230
  attr_accessor accelerators: ::Integer
1166
1231
  attr_accessor v_cpu: ::Float
1167
1232
  attr_accessor memory_in_gi_b: ::Float
1233
+ attr_accessor accelerator_partition: Types::AcceleratorPartitionConfig
1168
1234
  SENSITIVE: []
1169
1235
  end
1170
1236
 
@@ -4388,7 +4454,7 @@ module Aws::SageMaker
4388
4454
  attr_accessor unhealthy_instance_count: ::Integer
4389
4455
  attr_accessor available_spare_instance_count: ::Integer
4390
4456
  attr_accessor total_ultra_server_count: ::Integer
4391
- attr_accessor target_resources: ::Array[("training-job" | "hyperpod-cluster")]
4457
+ attr_accessor target_resources: ::Array[("training-job" | "hyperpod-cluster" | "endpoint")]
4392
4458
  attr_accessor reserved_capacity_summaries: ::Array[Types::ReservedCapacitySummary]
4393
4459
  SENSITIVE: []
4394
4460
  end
@@ -9567,7 +9633,7 @@ module Aws::SageMaker
9567
9633
  attr_accessor start_time_after: ::Time
9568
9634
  attr_accessor end_time_before: ::Time
9569
9635
  attr_accessor duration_hours: ::Integer
9570
- attr_accessor target_resources: ::Array[("training-job" | "hyperpod-cluster")]
9636
+ attr_accessor target_resources: ::Array[("training-job" | "hyperpod-cluster" | "endpoint")]
9571
9637
  SENSITIVE: []
9572
9638
  end
9573
9639
 
@@ -10224,7 +10290,7 @@ module Aws::SageMaker
10224
10290
 
10225
10291
  class TrainingPlanOffering
10226
10292
  attr_accessor training_plan_offering_id: ::String
10227
- attr_accessor target_resources: ::Array[("training-job" | "hyperpod-cluster")]
10293
+ attr_accessor target_resources: ::Array[("training-job" | "hyperpod-cluster" | "endpoint")]
10228
10294
  attr_accessor requested_start_time_after: ::Time
10229
10295
  attr_accessor requested_end_time_before: ::Time
10230
10296
  attr_accessor duration_hours: ::Integer
@@ -10250,7 +10316,7 @@ module Aws::SageMaker
10250
10316
  attr_accessor available_instance_count: ::Integer
10251
10317
  attr_accessor in_use_instance_count: ::Integer
10252
10318
  attr_accessor total_ultra_server_count: ::Integer
10253
- attr_accessor target_resources: ::Array[("training-job" | "hyperpod-cluster")]
10319
+ attr_accessor target_resources: ::Array[("training-job" | "hyperpod-cluster" | "endpoint")]
10254
10320
  attr_accessor reserved_capacity_summaries: ::Array[Types::ReservedCapacitySummary]
10255
10321
  SENSITIVE: []
10256
10322
  end
metadata CHANGED
@@ -1,7 +1,7 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: aws-sdk-sagemaker
3
3
  version: !ruby/object:Gem::Version
4
- version: 1.339.0
4
+ version: 1.340.0
5
5
  platform: ruby
6
6
  authors:
7
7
  - Amazon Web Services