aws-sdk-sagemaker 1.339.0 → 1.341.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA256:
3
- metadata.gz: f99f676fe2b17eb076e8761bee93ce0bfaee796c41dc984e1eab0803c1947f2e
4
- data.tar.gz: 6b3644ed5504af87e03d6b11d457c9cfa1bcf428b917150a2bad9a661968f654
3
+ metadata.gz: 26865b73cdcf61e9575a07d832b43aa93e24edce14672d0fec79742958394014
4
+ data.tar.gz: 0d0613bf3801d91d0d176695ccf4422a7e531ec6054f80a735069034eb79a2a1
5
5
  SHA512:
6
- metadata.gz: c26fc869f314ef2b25b1b2e0c58c9926c7b20b740a5f46064e31618cd4af601938f5df74199fce53c2c2d5494059acbec30b71727ae6534400013bbee5516433
7
- data.tar.gz: 2bbffdc253a295bf9b9aa9fb1ae956ba268bb2d6d27abce4574ad0a4e0d1861c6ce0d84f655bbb45ed6959be27b34820b399c908c96e87de3b5d4c7dff93ed6b
6
+ metadata.gz: 06ee60e1d183dab830facd89ff879c1df147cc673f511e681cf0ecc2f45211585f034dbeb9893534cf8d1f4486554e59a8375d1acf5b8cd4398f8944245ad875
7
+ data.tar.gz: 913fb03b0fea5374c8eb21cfc8d4668e1705b493f94b9fb1ab30646ef2bc0bce18bc9deddbf5c0a20034dc466cb34b532de52eaeda6e822999d525659eda3585
data/CHANGELOG.md CHANGED
@@ -1,6 +1,16 @@
1
1
  Unreleased Changes
2
2
  ------------------
3
3
 
4
+ 1.341.0 (2025-11-21)
5
+ ------------------
6
+
7
+ * Feature - Enhanced SageMaker HyperPod instance groups with support for MinInstanceCount, CapacityRequirements (Spot/On-Demand), and KubernetesConfig (labels and taints). Also added speculative decoding and MaxInstanceCount for model optimization jobs.
8
+
9
+ 1.340.0 (2025-11-20)
10
+ ------------------
11
+
12
+ * Feature - Added training plan support for inference endpoints. Added HyperPod task governance with accelerator partition-based quota allocation. Added BatchRebootClusterNodes and BatchReplaceClusterNodes APIs. Updated ListClusterNodes to include privateDnsHostName.
13
+
4
14
  1.339.0 (2025-11-19)
5
15
  ------------------
6
16
 
data/VERSION CHANGED
@@ -1 +1 @@
1
- 1.339.0
1
+ 1.341.0
@@ -950,6 +950,209 @@ module Aws::SageMaker
950
950
  req.send_request(options)
951
951
  end
952
952
 
953
+ # Reboots specific nodes within a SageMaker HyperPod cluster using a
954
+ # soft recovery mechanism. `BatchRebootClusterNodes` performs a graceful
955
+ # reboot of the specified nodes by calling the Amazon Elastic Compute
956
+ # Cloud `RebootInstances` API, which attempts to cleanly shut down the
957
+ # operating system before restarting the instance.
958
+ #
959
+ # This operation is useful for recovering from transient issues or
960
+ # applying certain configuration changes that require a restart.
961
+ #
962
+ # <note markdown="1"> * Rebooting a node may cause temporary service interruption for
963
+ # workloads running on that node. Ensure your workloads can handle
964
+ # node restarts or use appropriate scheduling to minimize impact.
965
+ #
966
+ # * You can reboot up to 25 nodes in a single request.
967
+ #
968
+ # * For SageMaker HyperPod clusters using the Slurm workload manager,
969
+ # ensure rebooting nodes will not disrupt critical cluster operations.
970
+ #
971
+ # </note>
972
+ #
973
+ # @option params [required, String] :cluster_name
974
+ # The name or Amazon Resource Name (ARN) of the SageMaker HyperPod
975
+ # cluster containing the nodes to reboot.
976
+ #
977
+ # @option params [Array<String>] :node_ids
978
+ # A list of EC2 instance IDs to reboot using soft recovery. You can
979
+ # specify between 1 and 25 instance IDs.
980
+ #
981
+ # <note markdown="1"> * At least one of `NodeIds` or `NodeLogicalIds` must be provided; you
982
+ # can also provide both.
983
+ #
984
+ # * Each instance ID must follow the pattern `i-` followed by 17
985
+ # hexadecimal characters (for example, `i-0123456789abcdef0`).
986
+ #
987
+ # </note>
988
+ #
989
+ # @option params [Array<String>] :node_logical_ids
990
+ # A list of logical node IDs to reboot using soft recovery. You can
991
+ # specify between 1 and 25 logical node IDs.
992
+ #
993
+ # The `NodeLogicalId` is a unique identifier that persists throughout
994
+ # the node's lifecycle and can be used to track nodes that are still
995
+ # being provisioned and don't yet have an EC2 instance ID assigned.
996
+ #
997
+ # * This parameter is only supported for clusters using `Continuous` as
998
+ # the `NodeProvisioningMode`. For clusters using the default
999
+ # provisioning mode, use `NodeIds` instead.
1000
+ #
1001
+ # * At least one of `NodeIds` or `NodeLogicalIds` must be provided; you can
1002
+ # also provide both.
1003
+ #
1004
+ # @return [Types::BatchRebootClusterNodesResponse] Returns a {Seahorse::Client::Response response} object which responds to the following methods:
1005
+ #
1006
+ # * {Types::BatchRebootClusterNodesResponse#successful #successful} => Array&lt;String&gt;
1007
+ # * {Types::BatchRebootClusterNodesResponse#failed #failed} => Array&lt;Types::BatchRebootClusterNodesError&gt;
1008
+ # * {Types::BatchRebootClusterNodesResponse#failed_node_logical_ids #failed_node_logical_ids} => Array&lt;Types::BatchRebootClusterNodeLogicalIdsError&gt;
1009
+ # * {Types::BatchRebootClusterNodesResponse#successful_node_logical_ids #successful_node_logical_ids} => Array&lt;String&gt;
1010
+ #
1011
+ # @example Request syntax with placeholder values
1012
+ #
1013
+ # resp = client.batch_reboot_cluster_nodes({
1014
+ # cluster_name: "ClusterNameOrArn", # required
1015
+ # node_ids: ["ClusterNodeId"],
1016
+ # node_logical_ids: ["ClusterNodeLogicalId"],
1017
+ # })
1018
+ #
1019
+ # @example Response structure
1020
+ #
1021
+ # resp.successful #=> Array
1022
+ # resp.successful[0] #=> String
1023
+ # resp.failed #=> Array
1024
+ # resp.failed[0].node_id #=> String
1025
+ # resp.failed[0].error_code #=> String, one of "InstanceIdNotFound", "InvalidInstanceStatus", "InstanceIdInUse", "InternalServerError"
1026
+ # resp.failed[0].message #=> String
1027
+ # resp.failed_node_logical_ids #=> Array
1028
+ # resp.failed_node_logical_ids[0].node_logical_id #=> String
1029
+ # resp.failed_node_logical_ids[0].error_code #=> String, one of "InstanceIdNotFound", "InvalidInstanceStatus", "InstanceIdInUse", "InternalServerError"
1030
+ # resp.failed_node_logical_ids[0].message #=> String
1031
+ # resp.successful_node_logical_ids #=> Array
1032
+ # resp.successful_node_logical_ids[0] #=> String
1033
+ #
1034
+ # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/BatchRebootClusterNodes AWS API Documentation
1035
+ #
1036
+ # @overload batch_reboot_cluster_nodes(params = {})
1037
+ # @param [Hash] params ({})
1038
+ def batch_reboot_cluster_nodes(params = {}, options = {})
1039
+ req = build_request(:batch_reboot_cluster_nodes, params)
1040
+ req.send_request(options)
1041
+ end
1042
+
1043
+ # Replaces specific nodes within a SageMaker HyperPod cluster with new
1044
+ # hardware. `BatchReplaceClusterNodes` terminates the specified
1045
+ # instances and provisions new replacement instances with the same
1046
+ # configuration but fresh hardware. The Amazon Machine Image (AMI) and
1047
+ # instance configuration remain the same.
1048
+ #
1049
+ # This operation is useful for recovering from hardware failures or
1050
+ # persistent issues that cannot be resolved through a reboot.
1051
+ #
1052
+ # * **Data Loss Warning:** Replacing nodes destroys all instance
1053
+ # volumes, including both root and secondary volumes. All data stored
1054
+ # on these volumes will be permanently lost and cannot be recovered.
1055
+ #
1056
+ # * To safeguard your work, back up your data to Amazon S3 or an FSx for
1057
+ # Lustre file system before invoking the API on a worker node group.
1058
+ # This will help prevent any potential data loss from the instance
1059
+ # root volume. For more information about backup, see [Use the backup
1060
+ # script provided by SageMaker HyperPod][1].
1061
+ #
1062
+ # * If you want to invoke this API on an existing cluster, you'll first
1063
+ # need to patch the cluster by running the [UpdateClusterSoftware
1064
+ # API][2]. For more information about patching a cluster, see [Update
1065
+ # the SageMaker HyperPod platform software of a cluster][3].
1066
+ #
1067
+ # * You can replace up to 25 nodes in a single request.
1068
+ #
1069
+ #
1070
+ #
1071
+ # [1]: https://docs.aws.amazon.com/sagemaker/latest/dg/sagemaker-hyperpod-operate-cli-command.html#sagemaker-hyperpod-operate-cli-command-update-cluster-software-backup
1072
+ # [2]: https://docs.aws.amazon.com/sagemaker/latest/APIReference/API_UpdateClusterSoftware.html
1073
+ # [3]: https://docs.aws.amazon.com/sagemaker/latest/dg/sagemaker-hyperpod-operate-cli-command.html#sagemaker-hyperpod-operate-cli-command-update-cluster-software
1074
+ #
1075
+ # @option params [required, String] :cluster_name
1076
+ # The name or Amazon Resource Name (ARN) of the SageMaker HyperPod
1077
+ # cluster containing the nodes to replace.
1078
+ #
1079
+ # @option params [Array<String>] :node_ids
1080
+ # A list of EC2 instance IDs to replace with new hardware. You can
1081
+ # specify between 1 and 25 instance IDs.
1082
+ #
1083
+ # Replace operations destroy all instance volumes (root and secondary).
1084
+ # Ensure you have backed up any important data before proceeding.
1085
+ #
1086
+ # <note markdown="1"> * At least one of `NodeIds` or `NodeLogicalIds` must be provided; you
1087
+ # can also provide both.
1088
+ #
1089
+ # * Each instance ID must follow the pattern `i-` followed by 17
1090
+ # hexadecimal characters (for example, `i-0123456789abcdef0`).
1091
+ #
1092
+ # * For SageMaker HyperPod clusters using the Slurm workload manager,
1093
+ # you cannot replace instances that are configured as Slurm controller
1094
+ # nodes.
1095
+ #
1096
+ # </note>
1097
+ #
1098
+ # @option params [Array<String>] :node_logical_ids
1099
+ # A list of logical node IDs to replace with new hardware. You can
1100
+ # specify between 1 and 25 logical node IDs.
1101
+ #
1102
+ # The `NodeLogicalId` is a unique identifier that persists throughout
1103
+ # the node's lifecycle and can be used to track nodes that are still
1104
+ # being provisioned and don't yet have an EC2 instance ID assigned.
1105
+ #
1106
+ # * Replace operations destroy all instance volumes (root and
1107
+ # secondary). Ensure you have backed up any important data before
1108
+ # proceeding.
1109
+ #
1110
+ # * This parameter is only supported for clusters using `Continuous` as
1111
+ # the `NodeProvisioningMode`. For clusters using the default
1112
+ # provisioning mode, use `NodeIds` instead.
1113
+ #
1114
+ # * At least one of `NodeIds` or `NodeLogicalIds` must be provided; you can
1115
+ # also provide both.
1116
+ #
1117
+ # @return [Types::BatchReplaceClusterNodesResponse] Returns a {Seahorse::Client::Response response} object which responds to the following methods:
1118
+ #
1119
+ # * {Types::BatchReplaceClusterNodesResponse#successful #successful} => Array&lt;String&gt;
1120
+ # * {Types::BatchReplaceClusterNodesResponse#failed #failed} => Array&lt;Types::BatchReplaceClusterNodesError&gt;
1121
+ # * {Types::BatchReplaceClusterNodesResponse#failed_node_logical_ids #failed_node_logical_ids} => Array&lt;Types::BatchReplaceClusterNodeLogicalIdsError&gt;
1122
+ # * {Types::BatchReplaceClusterNodesResponse#successful_node_logical_ids #successful_node_logical_ids} => Array&lt;String&gt;
1123
+ #
1124
+ # @example Request syntax with placeholder values
1125
+ #
1126
+ # resp = client.batch_replace_cluster_nodes({
1127
+ # cluster_name: "ClusterNameOrArn", # required
1128
+ # node_ids: ["ClusterNodeId"],
1129
+ # node_logical_ids: ["ClusterNodeLogicalId"],
1130
+ # })
1131
+ #
1132
+ # @example Response structure
1133
+ #
1134
+ # resp.successful #=> Array
1135
+ # resp.successful[0] #=> String
1136
+ # resp.failed #=> Array
1137
+ # resp.failed[0].node_id #=> String
1138
+ # resp.failed[0].error_code #=> String, one of "InstanceIdNotFound", "InvalidInstanceStatus", "InstanceIdInUse", "InternalServerError"
1139
+ # resp.failed[0].message #=> String
1140
+ # resp.failed_node_logical_ids #=> Array
1141
+ # resp.failed_node_logical_ids[0].node_logical_id #=> String
1142
+ # resp.failed_node_logical_ids[0].error_code #=> String, one of "InstanceIdNotFound", "InvalidInstanceStatus", "InstanceIdInUse", "InternalServerError"
1143
+ # resp.failed_node_logical_ids[0].message #=> String
1144
+ # resp.successful_node_logical_ids #=> Array
1145
+ # resp.successful_node_logical_ids[0] #=> String
1146
+ #
1147
+ # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/BatchReplaceClusterNodes AWS API Documentation
1148
+ #
1149
+ # @overload batch_replace_cluster_nodes(params = {})
1150
+ # @param [Hash] params ({})
1151
+ def batch_replace_cluster_nodes(params = {}, options = {})
1152
+ req = build_request(:batch_replace_cluster_nodes, params)
1153
+ req.send_request(options)
1154
+ end
1155
+
953
1156
  # Creates an *action*. An action is a lineage tracking entity that
954
1157
  # represents an action or activity. For example, a model deployment or
955
1158
  # an HPO job. Generally, an action involves at least one input or output
@@ -2243,6 +2446,7 @@ module Aws::SageMaker
2243
2446
  # instance_groups: [
2244
2447
  # {
2245
2448
  # instance_count: 1, # required
2449
+ # min_instance_count: 1,
2246
2450
  # instance_group_name: "ClusterInstanceGroupName", # required
2247
2451
  # instance_type: "ml.p4d.24xlarge", # required, accepts ml.p4d.24xlarge, ml.p4de.24xlarge, ml.p5.48xlarge, ml.p6e-gb200.36xlarge, ml.trn1.32xlarge, ml.trn1n.32xlarge, ml.g5.xlarge, ml.g5.2xlarge, ml.g5.4xlarge, ml.g5.8xlarge, ml.g5.12xlarge, ml.g5.16xlarge, ml.g5.24xlarge, ml.g5.48xlarge, ml.c5.large, ml.c5.xlarge, ml.c5.2xlarge, ml.c5.4xlarge, ml.c5.9xlarge, ml.c5.12xlarge, ml.c5.18xlarge, ml.c5.24xlarge, ml.c5n.large, ml.c5n.2xlarge, ml.c5n.4xlarge, ml.c5n.9xlarge, ml.c5n.18xlarge, ml.m5.large, ml.m5.xlarge, ml.m5.2xlarge, ml.m5.4xlarge, ml.m5.8xlarge, ml.m5.12xlarge, ml.m5.16xlarge, ml.m5.24xlarge, ml.t3.medium, ml.t3.large, ml.t3.xlarge, ml.t3.2xlarge, ml.g6.xlarge, ml.g6.2xlarge, ml.g6.4xlarge, ml.g6.8xlarge, ml.g6.16xlarge, ml.g6.12xlarge, ml.g6.24xlarge, ml.g6.48xlarge, ml.gr6.4xlarge, ml.gr6.8xlarge, ml.g6e.xlarge, ml.g6e.2xlarge, ml.g6e.4xlarge, ml.g6e.8xlarge, ml.g6e.16xlarge, ml.g6e.12xlarge, ml.g6e.24xlarge, ml.g6e.48xlarge, ml.p5e.48xlarge, ml.p5en.48xlarge, ml.p6-b200.48xlarge, ml.trn2.3xlarge, ml.trn2.48xlarge, ml.c6i.large, ml.c6i.xlarge, ml.c6i.2xlarge, ml.c6i.4xlarge, ml.c6i.8xlarge, ml.c6i.12xlarge, ml.c6i.16xlarge, ml.c6i.24xlarge, ml.c6i.32xlarge, ml.m6i.large, ml.m6i.xlarge, ml.m6i.2xlarge, ml.m6i.4xlarge, ml.m6i.8xlarge, ml.m6i.12xlarge, ml.m6i.16xlarge, ml.m6i.24xlarge, ml.m6i.32xlarge, ml.r6i.large, ml.r6i.xlarge, ml.r6i.2xlarge, ml.r6i.4xlarge, ml.r6i.8xlarge, ml.r6i.12xlarge, ml.r6i.16xlarge, ml.r6i.24xlarge, ml.r6i.32xlarge, ml.i3en.large, ml.i3en.xlarge, ml.i3en.2xlarge, ml.i3en.3xlarge, ml.i3en.6xlarge, ml.i3en.12xlarge, ml.i3en.24xlarge, ml.m7i.large, ml.m7i.xlarge, ml.m7i.2xlarge, ml.m7i.4xlarge, ml.m7i.8xlarge, ml.m7i.12xlarge, ml.m7i.16xlarge, ml.m7i.24xlarge, ml.m7i.48xlarge, ml.r7i.large, ml.r7i.xlarge, ml.r7i.2xlarge, ml.r7i.4xlarge, ml.r7i.8xlarge, ml.r7i.12xlarge, ml.r7i.16xlarge, ml.r7i.24xlarge, ml.r7i.48xlarge
2248
2452
  # life_cycle_config: { # required
@@ -2288,6 +2492,24 @@ module Aws::SageMaker
2288
2492
  # },
2289
2493
  # },
2290
2494
  # image_id: "ImageId",
2495
+ # kubernetes_config: {
2496
+ # labels: {
2497
+ # "ClusterKubernetesLabelKey" => "ClusterKubernetesLabelValue",
2498
+ # },
2499
+ # taints: [
2500
+ # {
2501
+ # key: "ClusterKubernetesTaintKey", # required
2502
+ # value: "ClusterKubernetesTaintValue",
2503
+ # effect: "NoSchedule", # required, accepts NoSchedule, PreferNoSchedule, NoExecute
2504
+ # },
2505
+ # ],
2506
+ # },
2507
+ # capacity_requirements: {
2508
+ # spot: {
2509
+ # },
2510
+ # on_demand: {
2511
+ # },
2512
+ # },
2291
2513
  # },
2292
2514
  # ],
2293
2515
  # restricted_instance_groups: [
@@ -2725,6 +2947,10 @@ module Aws::SageMaker
2725
2947
  # accelerators: 1,
2726
2948
  # v_cpu: 1.0,
2727
2949
  # memory_in_gi_b: 1.0,
2950
+ # accelerator_partition: {
2951
+ # type: "mig-1g.5gb", # required, accepts mig-1g.5gb, mig-1g.10gb, mig-1g.18gb, mig-1g.20gb, mig-1g.23gb, mig-1g.35gb, mig-1g.45gb, mig-1g.47gb, mig-2g.10gb, mig-2g.20gb, mig-2g.35gb, mig-2g.45gb, mig-2g.47gb, mig-3g.20gb, mig-3g.40gb, mig-3g.71gb, mig-3g.90gb, mig-3g.93gb, mig-4g.20gb, mig-4g.40gb, mig-4g.71gb, mig-4g.90gb, mig-4g.93gb, mig-7g.40gb, mig-7g.80gb, mig-7g.141gb, mig-7g.180gb, mig-7g.186gb
2952
+ # count: 1, # required
2953
+ # },
2728
2954
  # },
2729
2955
  # ],
2730
2956
  # resource_sharing_config: {
@@ -8363,6 +8589,9 @@ module Aws::SageMaker
8363
8589
  # The type of instance that hosts the optimized model that you create
8364
8590
  # with the optimization job.
8365
8591
  #
8592
+ # @option params [Integer] :max_instance_count
8593
+ # The maximum number of instances to use for the optimization job.
8594
+ #
8366
8595
  # @option params [Hash<String,String>] :optimization_environment
8367
8596
  # The environment variables to set in the model container.
8368
8597
  #
@@ -8424,8 +8653,12 @@ module Aws::SageMaker
8424
8653
  # accept_eula: false, # required
8425
8654
  # },
8426
8655
  # },
8656
+ # sage_maker_model: {
8657
+ # model_name: "ModelName",
8658
+ # },
8427
8659
  # },
8428
- # deployment_instance_type: "ml.p4d.24xlarge", # required, accepts ml.p4d.24xlarge, ml.p4de.24xlarge, ml.p5.48xlarge, ml.g5.xlarge, ml.g5.2xlarge, ml.g5.4xlarge, ml.g5.8xlarge, ml.g5.12xlarge, ml.g5.16xlarge, ml.g5.24xlarge, ml.g5.48xlarge, ml.g6.xlarge, ml.g6.2xlarge, ml.g6.4xlarge, ml.g6.8xlarge, ml.g6.12xlarge, ml.g6.16xlarge, ml.g6.24xlarge, ml.g6.48xlarge, ml.g6e.xlarge, ml.g6e.2xlarge, ml.g6e.4xlarge, ml.g6e.8xlarge, ml.g6e.12xlarge, ml.g6e.16xlarge, ml.g6e.24xlarge, ml.g6e.48xlarge, ml.inf2.xlarge, ml.inf2.8xlarge, ml.inf2.24xlarge, ml.inf2.48xlarge, ml.trn1.2xlarge, ml.trn1.32xlarge, ml.trn1n.32xlarge
8660
+ # deployment_instance_type: "ml.p4d.24xlarge", # required, accepts ml.p4d.24xlarge, ml.p4de.24xlarge, ml.p5.48xlarge, ml.p5e.48xlarge, ml.p5en.48xlarge, ml.g5.xlarge, ml.g5.2xlarge, ml.g5.4xlarge, ml.g5.8xlarge, ml.g5.12xlarge, ml.g5.16xlarge, ml.g5.24xlarge, ml.g5.48xlarge, ml.g6.xlarge, ml.g6.2xlarge, ml.g6.4xlarge, ml.g6.8xlarge, ml.g6.12xlarge, ml.g6.16xlarge, ml.g6.24xlarge, ml.g6.48xlarge, ml.g6e.xlarge, ml.g6e.2xlarge, ml.g6e.4xlarge, ml.g6e.8xlarge, ml.g6e.12xlarge, ml.g6e.16xlarge, ml.g6e.24xlarge, ml.g6e.48xlarge, ml.inf2.xlarge, ml.inf2.8xlarge, ml.inf2.24xlarge, ml.inf2.48xlarge, ml.trn1.2xlarge, ml.trn1.32xlarge, ml.trn1n.32xlarge
8661
+ # max_instance_count: 1,
8429
8662
  # optimization_environment: {
8430
8663
  # "NonEmptyString256" => "String256",
8431
8664
  # },
@@ -8449,11 +8682,21 @@ module Aws::SageMaker
8449
8682
  # "NonEmptyString256" => "String256",
8450
8683
  # },
8451
8684
  # },
8685
+ # model_speculative_decoding_config: {
8686
+ # technique: "EAGLE", # required, accepts EAGLE
8687
+ # training_data_source: {
8688
+ # s3_uri: "S3Uri", # required
8689
+ # s3_data_type: "S3Prefix", # required, accepts S3Prefix, ManifestFile
8690
+ # },
8691
+ # },
8452
8692
  # },
8453
8693
  # ],
8454
8694
  # output_config: { # required
8455
8695
  # kms_key_id: "KmsKeyId",
8456
8696
  # s3_output_location: "S3Uri", # required
8697
+ # sage_maker_model: {
8698
+ # model_name: "ModelName",
8699
+ # },
8457
8700
  # },
8458
8701
  # stopping_condition: { # required
8459
8702
  # max_runtime_in_seconds: 1,
@@ -13443,6 +13686,7 @@ module Aws::SageMaker
13443
13686
  # resp.instance_groups #=> Array
13444
13687
  # resp.instance_groups[0].current_count #=> Integer
13445
13688
  # resp.instance_groups[0].target_count #=> Integer
13689
+ # resp.instance_groups[0].min_count #=> Integer
13446
13690
  # resp.instance_groups[0].instance_group_name #=> String
13447
13691
  # resp.instance_groups[0].instance_type #=> String, one of "ml.p4d.24xlarge", "ml.p4de.24xlarge", "ml.p5.48xlarge", "ml.p6e-gb200.36xlarge", "ml.trn1.32xlarge", "ml.trn1n.32xlarge", "ml.g5.xlarge", "ml.g5.2xlarge", "ml.g5.4xlarge", "ml.g5.8xlarge", "ml.g5.12xlarge", "ml.g5.16xlarge", "ml.g5.24xlarge", "ml.g5.48xlarge", "ml.c5.large", "ml.c5.xlarge", "ml.c5.2xlarge", "ml.c5.4xlarge", "ml.c5.9xlarge", "ml.c5.12xlarge", "ml.c5.18xlarge", "ml.c5.24xlarge", "ml.c5n.large", "ml.c5n.2xlarge", "ml.c5n.4xlarge", "ml.c5n.9xlarge", "ml.c5n.18xlarge", "ml.m5.large", "ml.m5.xlarge", "ml.m5.2xlarge", "ml.m5.4xlarge", "ml.m5.8xlarge", "ml.m5.12xlarge", "ml.m5.16xlarge", "ml.m5.24xlarge", "ml.t3.medium", "ml.t3.large", "ml.t3.xlarge", "ml.t3.2xlarge", "ml.g6.xlarge", "ml.g6.2xlarge", "ml.g6.4xlarge", "ml.g6.8xlarge", "ml.g6.16xlarge", "ml.g6.12xlarge", "ml.g6.24xlarge", "ml.g6.48xlarge", "ml.gr6.4xlarge", "ml.gr6.8xlarge", "ml.g6e.xlarge", "ml.g6e.2xlarge", "ml.g6e.4xlarge", "ml.g6e.8xlarge", "ml.g6e.16xlarge", "ml.g6e.12xlarge", "ml.g6e.24xlarge", "ml.g6e.48xlarge", "ml.p5e.48xlarge", "ml.p5en.48xlarge", "ml.p6-b200.48xlarge", "ml.trn2.3xlarge", "ml.trn2.48xlarge", "ml.c6i.large", "ml.c6i.xlarge", "ml.c6i.2xlarge", "ml.c6i.4xlarge", "ml.c6i.8xlarge", "ml.c6i.12xlarge", "ml.c6i.16xlarge", "ml.c6i.24xlarge", "ml.c6i.32xlarge", "ml.m6i.large", "ml.m6i.xlarge", "ml.m6i.2xlarge", "ml.m6i.4xlarge", "ml.m6i.8xlarge", "ml.m6i.12xlarge", "ml.m6i.16xlarge", "ml.m6i.24xlarge", "ml.m6i.32xlarge", "ml.r6i.large", "ml.r6i.xlarge", "ml.r6i.2xlarge", "ml.r6i.4xlarge", "ml.r6i.8xlarge", "ml.r6i.12xlarge", "ml.r6i.16xlarge", "ml.r6i.24xlarge", "ml.r6i.32xlarge", "ml.i3en.large", "ml.i3en.xlarge", "ml.i3en.2xlarge", "ml.i3en.3xlarge", "ml.i3en.6xlarge", "ml.i3en.12xlarge", "ml.i3en.24xlarge", "ml.m7i.large", "ml.m7i.xlarge", "ml.m7i.2xlarge", "ml.m7i.4xlarge", "ml.m7i.8xlarge", "ml.m7i.12xlarge", "ml.m7i.16xlarge", "ml.m7i.24xlarge", "ml.m7i.48xlarge", "ml.r7i.large", "ml.r7i.xlarge", "ml.r7i.2xlarge", "ml.r7i.4xlarge", "ml.r7i.8xlarge", "ml.r7i.12xlarge", "ml.r7i.16xlarge", "ml.r7i.24xlarge", "ml.r7i.48xlarge"
13448
13692
  # resp.instance_groups[0].life_cycle_config.source_s3_uri #=> String
@@ -13472,6 +13716,20 @@ module Aws::SageMaker
13472
13716
  # resp.instance_groups[0].scheduled_update_config.deployment_config.auto_rollback_configuration[0].alarm_name #=> String
13473
13717
  # resp.instance_groups[0].current_image_id #=> String
13474
13718
  # resp.instance_groups[0].desired_image_id #=> String
13719
+ # resp.instance_groups[0].active_operations #=> Hash
13720
+ # resp.instance_groups[0].active_operations["ActiveClusterOperationName"] #=> Integer
13721
+ # resp.instance_groups[0].kubernetes_config.current_labels #=> Hash
13722
+ # resp.instance_groups[0].kubernetes_config.current_labels["ClusterKubernetesLabelKey"] #=> String
13723
+ # resp.instance_groups[0].kubernetes_config.desired_labels #=> Hash
13724
+ # resp.instance_groups[0].kubernetes_config.desired_labels["ClusterKubernetesLabelKey"] #=> String
13725
+ # resp.instance_groups[0].kubernetes_config.current_taints #=> Array
13726
+ # resp.instance_groups[0].kubernetes_config.current_taints[0].key #=> String
13727
+ # resp.instance_groups[0].kubernetes_config.current_taints[0].value #=> String
13728
+ # resp.instance_groups[0].kubernetes_config.current_taints[0].effect #=> String, one of "NoSchedule", "PreferNoSchedule", "NoExecute"
13729
+ # resp.instance_groups[0].kubernetes_config.desired_taints #=> Array
13730
+ # resp.instance_groups[0].kubernetes_config.desired_taints[0].key #=> String
13731
+ # resp.instance_groups[0].kubernetes_config.desired_taints[0].value #=> String
13732
+ # resp.instance_groups[0].kubernetes_config.desired_taints[0].effect #=> String, one of "NoSchedule", "PreferNoSchedule", "NoExecute"
13475
13733
  # resp.instance_groups[0].target_state_count #=> Integer
13476
13734
  # resp.instance_groups[0].software_update_status #=> String, one of "Pending", "InProgress", "Succeeded", "Failed", "RollbackInProgress", "RollbackComplete"
13477
13735
  # resp.instance_groups[0].active_software_update_config.rolling_update_policy.maximum_batch_size.type #=> String, one of "INSTANCE_COUNT", "CAPACITY_PERCENTAGE"
@@ -13582,6 +13840,7 @@ module Aws::SageMaker
13582
13840
  # resp.event_details.event_details.event_metadata.instance_group.ami_override #=> String
13583
13841
  # resp.event_details.event_details.event_metadata.instance_group_scaling.instance_count #=> Integer
13584
13842
  # resp.event_details.event_details.event_metadata.instance_group_scaling.target_count #=> Integer
13843
+ # resp.event_details.event_details.event_metadata.instance_group_scaling.min_count #=> Integer
13585
13844
  # resp.event_details.event_details.event_metadata.instance_group_scaling.failure_message #=> String
13586
13845
  # resp.event_details.event_details.event_metadata.instance.customer_eni #=> String
13587
13846
  # resp.event_details.event_details.event_metadata.instance.additional_enis.efa_enis #=> Array
@@ -13659,6 +13918,19 @@ module Aws::SageMaker
13659
13918
  # resp.node_details.current_image_id #=> String
13660
13919
  # resp.node_details.desired_image_id #=> String
13661
13920
  # resp.node_details.ultra_server_info.id #=> String
13921
+ # resp.node_details.kubernetes_config.current_labels #=> Hash
13922
+ # resp.node_details.kubernetes_config.current_labels["ClusterKubernetesLabelKey"] #=> String
13923
+ # resp.node_details.kubernetes_config.desired_labels #=> Hash
13924
+ # resp.node_details.kubernetes_config.desired_labels["ClusterKubernetesLabelKey"] #=> String
13925
+ # resp.node_details.kubernetes_config.current_taints #=> Array
13926
+ # resp.node_details.kubernetes_config.current_taints[0].key #=> String
13927
+ # resp.node_details.kubernetes_config.current_taints[0].value #=> String
13928
+ # resp.node_details.kubernetes_config.current_taints[0].effect #=> String, one of "NoSchedule", "PreferNoSchedule", "NoExecute"
13929
+ # resp.node_details.kubernetes_config.desired_taints #=> Array
13930
+ # resp.node_details.kubernetes_config.desired_taints[0].key #=> String
13931
+ # resp.node_details.kubernetes_config.desired_taints[0].value #=> String
13932
+ # resp.node_details.kubernetes_config.desired_taints[0].effect #=> String, one of "NoSchedule", "PreferNoSchedule", "NoExecute"
13933
+ # resp.node_details.capacity_type #=> String, one of "Spot", "OnDemand"
13662
13934
  #
13663
13935
  # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/DescribeClusterNode AWS API Documentation
13664
13936
  #
@@ -13912,6 +14184,8 @@ module Aws::SageMaker
13912
14184
  # resp.compute_quota_config.compute_quota_resources[0].accelerators #=> Integer
13913
14185
  # resp.compute_quota_config.compute_quota_resources[0].v_cpu #=> Float
13914
14186
  # resp.compute_quota_config.compute_quota_resources[0].memory_in_gi_b #=> Float
14187
+ # resp.compute_quota_config.compute_quota_resources[0].accelerator_partition.type #=> String, one of "mig-1g.5gb", "mig-1g.10gb", "mig-1g.18gb", "mig-1g.20gb", "mig-1g.23gb", "mig-1g.35gb", "mig-1g.45gb", "mig-1g.47gb", "mig-2g.10gb", "mig-2g.20gb", "mig-2g.35gb", "mig-2g.45gb", "mig-2g.47gb", "mig-3g.20gb", "mig-3g.40gb", "mig-3g.71gb", "mig-3g.90gb", "mig-3g.93gb", "mig-4g.20gb", "mig-4g.40gb", "mig-4g.71gb", "mig-4g.90gb", "mig-4g.93gb", "mig-7g.40gb", "mig-7g.80gb", "mig-7g.141gb", "mig-7g.180gb", "mig-7g.186gb"
14188
+ # resp.compute_quota_config.compute_quota_resources[0].accelerator_partition.count #=> Integer
13915
14189
  # resp.compute_quota_config.resource_sharing_config.strategy #=> String, one of "Lend", "DontLend", "LendAndBorrow"
13916
14190
  # resp.compute_quota_config.resource_sharing_config.borrow_limit #=> Integer
13917
14191
  # resp.compute_quota_config.preempt_team_tasks #=> String, one of "Never", "LowerPriority"
@@ -17399,6 +17673,7 @@ module Aws::SageMaker
17399
17673
  # * {Types::DescribeOptimizationJobResponse#model_source #model_source} => Types::OptimizationJobModelSource
17400
17674
  # * {Types::DescribeOptimizationJobResponse#optimization_environment #optimization_environment} => Hash&lt;String,String&gt;
17401
17675
  # * {Types::DescribeOptimizationJobResponse#deployment_instance_type #deployment_instance_type} => String
17676
+ # * {Types::DescribeOptimizationJobResponse#max_instance_count #max_instance_count} => Integer
17402
17677
  # * {Types::DescribeOptimizationJobResponse#optimization_configs #optimization_configs} => Array&lt;Types::OptimizationConfig&gt;
17403
17678
  # * {Types::DescribeOptimizationJobResponse#output_config #output_config} => Types::OptimizationJobOutputConfig
17404
17679
  # * {Types::DescribeOptimizationJobResponse#optimization_output #optimization_output} => Types::OptimizationOutput
@@ -17424,9 +17699,11 @@ module Aws::SageMaker
17424
17699
  # resp.optimization_job_name #=> String
17425
17700
  # resp.model_source.s3.s3_uri #=> String
17426
17701
  # resp.model_source.s3.model_access_config.accept_eula #=> Boolean
17702
+ # resp.model_source.sage_maker_model.model_name #=> String
17427
17703
  # resp.optimization_environment #=> Hash
17428
17704
  # resp.optimization_environment["NonEmptyString256"] #=> String
17429
- # resp.deployment_instance_type #=> String, one of "ml.p4d.24xlarge", "ml.p4de.24xlarge", "ml.p5.48xlarge", "ml.g5.xlarge", "ml.g5.2xlarge", "ml.g5.4xlarge", "ml.g5.8xlarge", "ml.g5.12xlarge", "ml.g5.16xlarge", "ml.g5.24xlarge", "ml.g5.48xlarge", "ml.g6.xlarge", "ml.g6.2xlarge", "ml.g6.4xlarge", "ml.g6.8xlarge", "ml.g6.12xlarge", "ml.g6.16xlarge", "ml.g6.24xlarge", "ml.g6.48xlarge", "ml.g6e.xlarge", "ml.g6e.2xlarge", "ml.g6e.4xlarge", "ml.g6e.8xlarge", "ml.g6e.12xlarge", "ml.g6e.16xlarge", "ml.g6e.24xlarge", "ml.g6e.48xlarge", "ml.inf2.xlarge", "ml.inf2.8xlarge", "ml.inf2.24xlarge", "ml.inf2.48xlarge", "ml.trn1.2xlarge", "ml.trn1.32xlarge", "ml.trn1n.32xlarge"
17705
+ # resp.deployment_instance_type #=> String, one of "ml.p4d.24xlarge", "ml.p4de.24xlarge", "ml.p5.48xlarge", "ml.p5e.48xlarge", "ml.p5en.48xlarge", "ml.g5.xlarge", "ml.g5.2xlarge", "ml.g5.4xlarge", "ml.g5.8xlarge", "ml.g5.12xlarge", "ml.g5.16xlarge", "ml.g5.24xlarge", "ml.g5.48xlarge", "ml.g6.xlarge", "ml.g6.2xlarge", "ml.g6.4xlarge", "ml.g6.8xlarge", "ml.g6.12xlarge", "ml.g6.16xlarge", "ml.g6.24xlarge", "ml.g6.48xlarge", "ml.g6e.xlarge", "ml.g6e.2xlarge", "ml.g6e.4xlarge", "ml.g6e.8xlarge", "ml.g6e.12xlarge", "ml.g6e.16xlarge", "ml.g6e.24xlarge", "ml.g6e.48xlarge", "ml.inf2.xlarge", "ml.inf2.8xlarge", "ml.inf2.24xlarge", "ml.inf2.48xlarge", "ml.trn1.2xlarge", "ml.trn1.32xlarge", "ml.trn1n.32xlarge"
17706
+ # resp.max_instance_count #=> Integer
17430
17707
  # resp.optimization_configs #=> Array
17431
17708
  # resp.optimization_configs[0].model_quantization_config.image #=> String
17432
17709
  # resp.optimization_configs[0].model_quantization_config.override_environment #=> Hash
@@ -17437,8 +17714,12 @@ module Aws::SageMaker
17437
17714
  # resp.optimization_configs[0].model_sharding_config.image #=> String
17438
17715
  # resp.optimization_configs[0].model_sharding_config.override_environment #=> Hash
17439
17716
  # resp.optimization_configs[0].model_sharding_config.override_environment["NonEmptyString256"] #=> String
17717
+ # resp.optimization_configs[0].model_speculative_decoding_config.technique #=> String, one of "EAGLE"
17718
+ # resp.optimization_configs[0].model_speculative_decoding_config.training_data_source.s3_uri #=> String
17719
+ # resp.optimization_configs[0].model_speculative_decoding_config.training_data_source.s3_data_type #=> String, one of "S3Prefix", "ManifestFile"
17440
17720
  # resp.output_config.kms_key_id #=> String
17441
17721
  # resp.output_config.s3_output_location #=> String
17722
+ # resp.output_config.sage_maker_model.model_name #=> String
17442
17723
  # resp.optimization_output.recommended_inference_image #=> String
17443
17724
  # resp.role_arn #=> String
17444
17725
  # resp.stopping_condition.max_runtime_in_seconds #=> Integer
@@ -18411,7 +18692,7 @@ module Aws::SageMaker
18411
18692
  # resp.available_spare_instance_count #=> Integer
18412
18693
  # resp.total_ultra_server_count #=> Integer
18413
18694
  # resp.target_resources #=> Array
18414
- # resp.target_resources[0] #=> String, one of "training-job", "hyperpod-cluster"
18695
+ # resp.target_resources[0] #=> String, one of "training-job", "hyperpod-cluster", "endpoint"
18415
18696
  # resp.reserved_capacity_summaries #=> Array
18416
18697
  # resp.reserved_capacity_summaries[0].reserved_capacity_arn #=> String
18417
18698
  # resp.reserved_capacity_summaries[0].reserved_capacity_type #=> String, one of "UltraServer", "Instance"
@@ -20350,6 +20631,7 @@ module Aws::SageMaker
20350
20631
  # resp.cluster_node_summaries[0].instance_status.status #=> String, one of "Running", "Failure", "Pending", "ShuttingDown", "SystemUpdating", "DeepHealthCheckInProgress", "NotFound"
20351
20632
  # resp.cluster_node_summaries[0].instance_status.message #=> String
20352
20633
  # resp.cluster_node_summaries[0].ultra_server_info.id #=> String
20634
+ # resp.cluster_node_summaries[0].private_dns_hostname #=> String
20353
20635
  #
20354
20636
  # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/ListClusterNodes AWS API Documentation
20355
20637
  #
@@ -20813,6 +21095,8 @@ module Aws::SageMaker
20813
21095
  # resp.compute_quota_summaries[0].compute_quota_config.compute_quota_resources[0].accelerators #=> Integer
20814
21096
  # resp.compute_quota_summaries[0].compute_quota_config.compute_quota_resources[0].v_cpu #=> Float
20815
21097
  # resp.compute_quota_summaries[0].compute_quota_config.compute_quota_resources[0].memory_in_gi_b #=> Float
21098
+ # resp.compute_quota_summaries[0].compute_quota_config.compute_quota_resources[0].accelerator_partition.type #=> String, one of "mig-1g.5gb", "mig-1g.10gb", "mig-1g.18gb", "mig-1g.20gb", "mig-1g.23gb", "mig-1g.35gb", "mig-1g.45gb", "mig-1g.47gb", "mig-2g.10gb", "mig-2g.20gb", "mig-2g.35gb", "mig-2g.45gb", "mig-2g.47gb", "mig-3g.20gb", "mig-3g.40gb", "mig-3g.71gb", "mig-3g.90gb", "mig-3g.93gb", "mig-4g.20gb", "mig-4g.40gb", "mig-4g.71gb", "mig-4g.90gb", "mig-4g.93gb", "mig-7g.40gb", "mig-7g.80gb", "mig-7g.141gb", "mig-7g.180gb", "mig-7g.186gb"
21099
+ # resp.compute_quota_summaries[0].compute_quota_config.compute_quota_resources[0].accelerator_partition.count #=> Integer
20816
21100
  # resp.compute_quota_summaries[0].compute_quota_config.resource_sharing_config.strategy #=> String, one of "Lend", "DontLend", "LendAndBorrow"
20817
21101
  # resp.compute_quota_summaries[0].compute_quota_config.resource_sharing_config.borrow_limit #=> Integer
20818
21102
  # resp.compute_quota_summaries[0].compute_quota_config.preempt_team_tasks #=> String, one of "Never", "LowerPriority"
@@ -24261,7 +24545,8 @@ module Aws::SageMaker
24261
24545
  # resp.optimization_job_summaries[0].optimization_start_time #=> Time
24262
24546
  # resp.optimization_job_summaries[0].optimization_end_time #=> Time
24263
24547
  # resp.optimization_job_summaries[0].last_modified_time #=> Time
24264
- # resp.optimization_job_summaries[0].deployment_instance_type #=> String, one of "ml.p4d.24xlarge", "ml.p4de.24xlarge", "ml.p5.48xlarge", "ml.g5.xlarge", "ml.g5.2xlarge", "ml.g5.4xlarge", "ml.g5.8xlarge", "ml.g5.12xlarge", "ml.g5.16xlarge", "ml.g5.24xlarge", "ml.g5.48xlarge", "ml.g6.xlarge", "ml.g6.2xlarge", "ml.g6.4xlarge", "ml.g6.8xlarge", "ml.g6.12xlarge", "ml.g6.16xlarge", "ml.g6.24xlarge", "ml.g6.48xlarge", "ml.g6e.xlarge", "ml.g6e.2xlarge", "ml.g6e.4xlarge", "ml.g6e.8xlarge", "ml.g6e.12xlarge", "ml.g6e.16xlarge", "ml.g6e.24xlarge", "ml.g6e.48xlarge", "ml.inf2.xlarge", "ml.inf2.8xlarge", "ml.inf2.24xlarge", "ml.inf2.48xlarge", "ml.trn1.2xlarge", "ml.trn1.32xlarge", "ml.trn1n.32xlarge"
24548
+ # resp.optimization_job_summaries[0].deployment_instance_type #=> String, one of "ml.p4d.24xlarge", "ml.p4de.24xlarge", "ml.p5.48xlarge", "ml.p5e.48xlarge", "ml.p5en.48xlarge", "ml.g5.xlarge", "ml.g5.2xlarge", "ml.g5.4xlarge", "ml.g5.8xlarge", "ml.g5.12xlarge", "ml.g5.16xlarge", "ml.g5.24xlarge", "ml.g5.48xlarge", "ml.g6.xlarge", "ml.g6.2xlarge", "ml.g6.4xlarge", "ml.g6.8xlarge", "ml.g6.12xlarge", "ml.g6.16xlarge", "ml.g6.24xlarge", "ml.g6.48xlarge", "ml.g6e.xlarge", "ml.g6e.2xlarge", "ml.g6e.4xlarge", "ml.g6e.8xlarge", "ml.g6e.12xlarge", "ml.g6e.16xlarge", "ml.g6e.24xlarge", "ml.g6e.48xlarge", "ml.inf2.xlarge", "ml.inf2.8xlarge", "ml.inf2.24xlarge", "ml.inf2.48xlarge", "ml.trn1.2xlarge", "ml.trn1.32xlarge", "ml.trn1n.32xlarge"
24549
+ # resp.optimization_job_summaries[0].max_instance_count #=> Integer
24265
24550
  # resp.optimization_job_summaries[0].optimization_types #=> Array
24266
24551
  # resp.optimization_job_summaries[0].optimization_types[0] #=> String
24267
24552
  # resp.next_token #=> String
@@ -25460,7 +25745,7 @@ module Aws::SageMaker
25460
25745
  # resp.training_plan_summaries[0].in_use_instance_count #=> Integer
25461
25746
  # resp.training_plan_summaries[0].total_ultra_server_count #=> Integer
25462
25747
  # resp.training_plan_summaries[0].target_resources #=> Array
25463
- # resp.training_plan_summaries[0].target_resources[0] #=> String, one of "training-job", "hyperpod-cluster"
25748
+ # resp.training_plan_summaries[0].target_resources[0] #=> String, one of "training-job", "hyperpod-cluster", "endpoint"
25464
25749
  # resp.training_plan_summaries[0].reserved_capacity_summaries #=> Array
25465
25750
  # resp.training_plan_summaries[0].reserved_capacity_summaries[0].reserved_capacity_arn #=> String
25466
25751
  # resp.training_plan_summaries[0].reserved_capacity_summaries[0].reserved_capacity_type #=> String, one of "UltraServer", "Instance"
@@ -26481,7 +26766,7 @@ module Aws::SageMaker
26481
26766
  #
26482
26767
  # @option params [required, Array<String>] :target_resources
26483
26768
  # The target resources (e.g., SageMaker Training Jobs, SageMaker
26484
- # HyperPod) to search for in the offerings.
26769
+ # HyperPod, SageMaker Endpoints) to search for in the offerings.
26485
26770
  #
26486
26771
  # Training plans are specific to their target resource.
26487
26772
  #
@@ -26491,6 +26776,10 @@ module Aws::SageMaker
26491
26776
  # * A training plan for HyperPod clusters can be used exclusively to
26492
26777
  # provide compute resources to a cluster's instance group.
26493
26778
  #
26779
+ # * A training plan for SageMaker endpoints can be used exclusively to
26780
+ # provide compute resources to SageMaker endpoints for model
26781
+ # deployment.
26782
+ #
26494
26783
  # @return [Types::SearchTrainingPlanOfferingsResponse] Returns a {Seahorse::Client::Response response} object which responds to the following methods:
26495
26784
  #
26496
26785
  # * {Types::SearchTrainingPlanOfferingsResponse#training_plan_offerings #training_plan_offerings} => Array&lt;Types::TrainingPlanOffering&gt;
@@ -26505,7 +26794,7 @@ module Aws::SageMaker
26505
26794
  # start_time_after: Time.now,
26506
26795
  # end_time_before: Time.now,
26507
26796
  # duration_hours: 1, # required
26508
- # target_resources: ["training-job"], # required, accepts training-job, hyperpod-cluster
26797
+ # target_resources: ["training-job"], # required, accepts training-job, hyperpod-cluster, endpoint
26509
26798
  # })
26510
26799
  #
26511
26800
  # @example Response structure
@@ -26513,7 +26802,7 @@ module Aws::SageMaker
26513
26802
  # resp.training_plan_offerings #=> Array
26514
26803
  # resp.training_plan_offerings[0].training_plan_offering_id #=> String
26515
26804
  # resp.training_plan_offerings[0].target_resources #=> Array
26516
- # resp.training_plan_offerings[0].target_resources[0] #=> String, one of "training-job", "hyperpod-cluster"
26805
+ # resp.training_plan_offerings[0].target_resources[0] #=> String, one of "training-job", "hyperpod-cluster", "endpoint"
26517
26806
  # resp.training_plan_offerings[0].requested_start_time_after #=> Time
26518
26807
  # resp.training_plan_offerings[0].requested_end_time_before #=> Time
26519
26808
  # resp.training_plan_offerings[0].duration_hours #=> Integer
@@ -27596,6 +27885,7 @@ module Aws::SageMaker
27596
27885
  # instance_groups: [
27597
27886
  # {
27598
27887
  # instance_count: 1, # required
27888
+ # min_instance_count: 1,
27599
27889
  # instance_group_name: "ClusterInstanceGroupName", # required
27600
27890
  # instance_type: "ml.p4d.24xlarge", # required, accepts ml.p4d.24xlarge, ml.p4de.24xlarge, ml.p5.48xlarge, ml.p6e-gb200.36xlarge, ml.trn1.32xlarge, ml.trn1n.32xlarge, ml.g5.xlarge, ml.g5.2xlarge, ml.g5.4xlarge, ml.g5.8xlarge, ml.g5.12xlarge, ml.g5.16xlarge, ml.g5.24xlarge, ml.g5.48xlarge, ml.c5.large, ml.c5.xlarge, ml.c5.2xlarge, ml.c5.4xlarge, ml.c5.9xlarge, ml.c5.12xlarge, ml.c5.18xlarge, ml.c5.24xlarge, ml.c5n.large, ml.c5n.2xlarge, ml.c5n.4xlarge, ml.c5n.9xlarge, ml.c5n.18xlarge, ml.m5.large, ml.m5.xlarge, ml.m5.2xlarge, ml.m5.4xlarge, ml.m5.8xlarge, ml.m5.12xlarge, ml.m5.16xlarge, ml.m5.24xlarge, ml.t3.medium, ml.t3.large, ml.t3.xlarge, ml.t3.2xlarge, ml.g6.xlarge, ml.g6.2xlarge, ml.g6.4xlarge, ml.g6.8xlarge, ml.g6.16xlarge, ml.g6.12xlarge, ml.g6.24xlarge, ml.g6.48xlarge, ml.gr6.4xlarge, ml.gr6.8xlarge, ml.g6e.xlarge, ml.g6e.2xlarge, ml.g6e.4xlarge, ml.g6e.8xlarge, ml.g6e.16xlarge, ml.g6e.12xlarge, ml.g6e.24xlarge, ml.g6e.48xlarge, ml.p5e.48xlarge, ml.p5en.48xlarge, ml.p6-b200.48xlarge, ml.trn2.3xlarge, ml.trn2.48xlarge, ml.c6i.large, ml.c6i.xlarge, ml.c6i.2xlarge, ml.c6i.4xlarge, ml.c6i.8xlarge, ml.c6i.12xlarge, ml.c6i.16xlarge, ml.c6i.24xlarge, ml.c6i.32xlarge, ml.m6i.large, ml.m6i.xlarge, ml.m6i.2xlarge, ml.m6i.4xlarge, ml.m6i.8xlarge, ml.m6i.12xlarge, ml.m6i.16xlarge, ml.m6i.24xlarge, ml.m6i.32xlarge, ml.r6i.large, ml.r6i.xlarge, ml.r6i.2xlarge, ml.r6i.4xlarge, ml.r6i.8xlarge, ml.r6i.12xlarge, ml.r6i.16xlarge, ml.r6i.24xlarge, ml.r6i.32xlarge, ml.i3en.large, ml.i3en.xlarge, ml.i3en.2xlarge, ml.i3en.3xlarge, ml.i3en.6xlarge, ml.i3en.12xlarge, ml.i3en.24xlarge, ml.m7i.large, ml.m7i.xlarge, ml.m7i.2xlarge, ml.m7i.4xlarge, ml.m7i.8xlarge, ml.m7i.12xlarge, ml.m7i.16xlarge, ml.m7i.24xlarge, ml.m7i.48xlarge, ml.r7i.large, ml.r7i.xlarge, ml.r7i.2xlarge, ml.r7i.4xlarge, ml.r7i.8xlarge, ml.r7i.12xlarge, ml.r7i.16xlarge, ml.r7i.24xlarge, ml.r7i.48xlarge
27601
27891
  # life_cycle_config: { # required
@@ -27641,6 +27931,24 @@ module Aws::SageMaker
27641
27931
  # },
27642
27932
  # },
27643
27933
  # image_id: "ImageId",
27934
+ # kubernetes_config: {
27935
+ # labels: {
27936
+ # "ClusterKubernetesLabelKey" => "ClusterKubernetesLabelValue",
27937
+ # },
27938
+ # taints: [
27939
+ # {
27940
+ # key: "ClusterKubernetesTaintKey", # required
27941
+ # value: "ClusterKubernetesTaintValue",
27942
+ # effect: "NoSchedule", # required, accepts NoSchedule, PreferNoSchedule, NoExecute
27943
+ # },
27944
+ # ],
27945
+ # },
27946
+ # capacity_requirements: {
27947
+ # spot: {
27948
+ # },
27949
+ # on_demand: {
27950
+ # },
27951
+ # },
27644
27952
  # },
27645
27953
  # ],
27646
27954
  # restricted_instance_groups: [
@@ -27951,6 +28259,10 @@ module Aws::SageMaker
27951
28259
  # accelerators: 1,
27952
28260
  # v_cpu: 1.0,
27953
28261
  # memory_in_gi_b: 1.0,
28262
+ # accelerator_partition: {
28263
+ # type: "mig-1g.5gb", # required, accepts mig-1g.5gb, mig-1g.10gb, mig-1g.18gb, mig-1g.20gb, mig-1g.23gb, mig-1g.35gb, mig-1g.45gb, mig-1g.47gb, mig-2g.10gb, mig-2g.20gb, mig-2g.35gb, mig-2g.45gb, mig-2g.47gb, mig-3g.20gb, mig-3g.40gb, mig-3g.71gb, mig-3g.90gb, mig-3g.93gb, mig-4g.20gb, mig-4g.40gb, mig-4g.71gb, mig-4g.90gb, mig-4g.93gb, mig-7g.40gb, mig-7g.80gb, mig-7g.141gb, mig-7g.180gb, mig-7g.186gb
28264
+ # count: 1, # required
28265
+ # },
27954
28266
  # },
27955
28267
  # ],
27956
28268
  # resource_sharing_config: {
@@ -31359,7 +31671,7 @@ module Aws::SageMaker
31359
31671
  tracer: tracer
31360
31672
  )
31361
31673
  context[:gem_name] = 'aws-sdk-sagemaker'
31362
- context[:gem_version] = '1.339.0'
31674
+ context[:gem_version] = '1.341.0'
31363
31675
  Seahorse::Client::Request.new(handlers, context)
31364
31676
  end
31365
31677