aws-sdk-sagemaker 1.340.0 → 1.341.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA256:
3
- metadata.gz: f760b6f6d6902ca08349489fe9e34c577365953a32aa2f031a4db9e67aa9cb08
4
- data.tar.gz: 5d01231c9d2c1d978d56deee398fb98fe79da54085d362172671724d6bce3233
3
+ metadata.gz: 26865b73cdcf61e9575a07d832b43aa93e24edce14672d0fec79742958394014
4
+ data.tar.gz: 0d0613bf3801d91d0d176695ccf4422a7e531ec6054f80a735069034eb79a2a1
5
5
  SHA512:
6
- metadata.gz: a658467635f982e5e53c0cd5a428c96d8f17acb120d16c31184b8ac8ddd2f21c9062c41e6df84610f95227118ae6de6a47053642188e8ed29208e2d44cfa5863
7
- data.tar.gz: ec789fc4a9c2d3014b4e19c7a5b628f158fdc8a3b262139e86e44147b83a65107844ac19445d924aa41f1e90791d961c6c1bf8abb2ef19a9de49e6a54e63cba0
6
+ metadata.gz: 06ee60e1d183dab830facd89ff879c1df147cc673f511e681cf0ecc2f45211585f034dbeb9893534cf8d1f4486554e59a8375d1acf5b8cd4398f8944245ad875
7
+ data.tar.gz: 913fb03b0fea5374c8eb21cfc8d4668e1705b493f94b9fb1ab30646ef2bc0bce18bc9deddbf5c0a20034dc466cb34b532de52eaeda6e822999d525659eda3585
data/CHANGELOG.md CHANGED
@@ -1,6 +1,11 @@
1
1
  Unreleased Changes
2
2
  ------------------
3
3
 
4
+ 1.341.0 (2025-11-21)
5
+ ------------------
6
+
7
+ * Feature - Enhanced SageMaker HyperPod instance groups with support for MinInstanceCount, CapacityRequirements (Spot/On-Demand), and KubernetesConfig (labels and taints). Also added speculative decoding and MaxInstanceCount for model optimization jobs.
8
+
4
9
  1.340.0 (2025-11-20)
5
10
  ------------------
6
11
 
data/VERSION CHANGED
@@ -1 +1 @@
1
- 1.340.0
1
+ 1.341.0
@@ -2446,6 +2446,7 @@ module Aws::SageMaker
2446
2446
  # instance_groups: [
2447
2447
  # {
2448
2448
  # instance_count: 1, # required
2449
+ # min_instance_count: 1,
2449
2450
  # instance_group_name: "ClusterInstanceGroupName", # required
2450
2451
  # instance_type: "ml.p4d.24xlarge", # required, accepts ml.p4d.24xlarge, ml.p4de.24xlarge, ml.p5.48xlarge, ml.p6e-gb200.36xlarge, ml.trn1.32xlarge, ml.trn1n.32xlarge, ml.g5.xlarge, ml.g5.2xlarge, ml.g5.4xlarge, ml.g5.8xlarge, ml.g5.12xlarge, ml.g5.16xlarge, ml.g5.24xlarge, ml.g5.48xlarge, ml.c5.large, ml.c5.xlarge, ml.c5.2xlarge, ml.c5.4xlarge, ml.c5.9xlarge, ml.c5.12xlarge, ml.c5.18xlarge, ml.c5.24xlarge, ml.c5n.large, ml.c5n.2xlarge, ml.c5n.4xlarge, ml.c5n.9xlarge, ml.c5n.18xlarge, ml.m5.large, ml.m5.xlarge, ml.m5.2xlarge, ml.m5.4xlarge, ml.m5.8xlarge, ml.m5.12xlarge, ml.m5.16xlarge, ml.m5.24xlarge, ml.t3.medium, ml.t3.large, ml.t3.xlarge, ml.t3.2xlarge, ml.g6.xlarge, ml.g6.2xlarge, ml.g6.4xlarge, ml.g6.8xlarge, ml.g6.16xlarge, ml.g6.12xlarge, ml.g6.24xlarge, ml.g6.48xlarge, ml.gr6.4xlarge, ml.gr6.8xlarge, ml.g6e.xlarge, ml.g6e.2xlarge, ml.g6e.4xlarge, ml.g6e.8xlarge, ml.g6e.16xlarge, ml.g6e.12xlarge, ml.g6e.24xlarge, ml.g6e.48xlarge, ml.p5e.48xlarge, ml.p5en.48xlarge, ml.p6-b200.48xlarge, ml.trn2.3xlarge, ml.trn2.48xlarge, ml.c6i.large, ml.c6i.xlarge, ml.c6i.2xlarge, ml.c6i.4xlarge, ml.c6i.8xlarge, ml.c6i.12xlarge, ml.c6i.16xlarge, ml.c6i.24xlarge, ml.c6i.32xlarge, ml.m6i.large, ml.m6i.xlarge, ml.m6i.2xlarge, ml.m6i.4xlarge, ml.m6i.8xlarge, ml.m6i.12xlarge, ml.m6i.16xlarge, ml.m6i.24xlarge, ml.m6i.32xlarge, ml.r6i.large, ml.r6i.xlarge, ml.r6i.2xlarge, ml.r6i.4xlarge, ml.r6i.8xlarge, ml.r6i.12xlarge, ml.r6i.16xlarge, ml.r6i.24xlarge, ml.r6i.32xlarge, ml.i3en.large, ml.i3en.xlarge, ml.i3en.2xlarge, ml.i3en.3xlarge, ml.i3en.6xlarge, ml.i3en.12xlarge, ml.i3en.24xlarge, ml.m7i.large, ml.m7i.xlarge, ml.m7i.2xlarge, ml.m7i.4xlarge, ml.m7i.8xlarge, ml.m7i.12xlarge, ml.m7i.16xlarge, ml.m7i.24xlarge, ml.m7i.48xlarge, ml.r7i.large, ml.r7i.xlarge, ml.r7i.2xlarge, ml.r7i.4xlarge, ml.r7i.8xlarge, ml.r7i.12xlarge, ml.r7i.16xlarge, ml.r7i.24xlarge, ml.r7i.48xlarge
2451
2452
  # life_cycle_config: { # required
@@ -2491,6 +2492,24 @@ module Aws::SageMaker
2491
2492
  # },
2492
2493
  # },
2493
2494
  # image_id: "ImageId",
2495
+ # kubernetes_config: {
2496
+ # labels: {
2497
+ # "ClusterKubernetesLabelKey" => "ClusterKubernetesLabelValue",
2498
+ # },
2499
+ # taints: [
2500
+ # {
2501
+ # key: "ClusterKubernetesTaintKey", # required
2502
+ # value: "ClusterKubernetesTaintValue",
2503
+ # effect: "NoSchedule", # required, accepts NoSchedule, PreferNoSchedule, NoExecute
2504
+ # },
2505
+ # ],
2506
+ # },
2507
+ # capacity_requirements: {
2508
+ # spot: {
2509
+ # },
2510
+ # on_demand: {
2511
+ # },
2512
+ # },
2494
2513
  # },
2495
2514
  # ],
2496
2515
  # restricted_instance_groups: [
@@ -8570,6 +8589,9 @@ module Aws::SageMaker
8570
8589
  # The type of instance that hosts the optimized model that you create
8571
8590
  # with the optimization job.
8572
8591
  #
8592
+ # @option params [Integer] :max_instance_count
8593
+ # The maximum number of instances to use for the optimization job.
8594
+ #
8573
8595
  # @option params [Hash<String,String>] :optimization_environment
8574
8596
  # The environment variables to set in the model container.
8575
8597
  #
@@ -8631,8 +8653,12 @@ module Aws::SageMaker
8631
8653
  # accept_eula: false, # required
8632
8654
  # },
8633
8655
  # },
8656
+ # sage_maker_model: {
8657
+ # model_name: "ModelName",
8658
+ # },
8634
8659
  # },
8635
- # deployment_instance_type: "ml.p4d.24xlarge", # required, accepts ml.p4d.24xlarge, ml.p4de.24xlarge, ml.p5.48xlarge, ml.g5.xlarge, ml.g5.2xlarge, ml.g5.4xlarge, ml.g5.8xlarge, ml.g5.12xlarge, ml.g5.16xlarge, ml.g5.24xlarge, ml.g5.48xlarge, ml.g6.xlarge, ml.g6.2xlarge, ml.g6.4xlarge, ml.g6.8xlarge, ml.g6.12xlarge, ml.g6.16xlarge, ml.g6.24xlarge, ml.g6.48xlarge, ml.g6e.xlarge, ml.g6e.2xlarge, ml.g6e.4xlarge, ml.g6e.8xlarge, ml.g6e.12xlarge, ml.g6e.16xlarge, ml.g6e.24xlarge, ml.g6e.48xlarge, ml.inf2.xlarge, ml.inf2.8xlarge, ml.inf2.24xlarge, ml.inf2.48xlarge, ml.trn1.2xlarge, ml.trn1.32xlarge, ml.trn1n.32xlarge
8660
+ # deployment_instance_type: "ml.p4d.24xlarge", # required, accepts ml.p4d.24xlarge, ml.p4de.24xlarge, ml.p5.48xlarge, ml.p5e.48xlarge, ml.p5en.48xlarge, ml.g5.xlarge, ml.g5.2xlarge, ml.g5.4xlarge, ml.g5.8xlarge, ml.g5.12xlarge, ml.g5.16xlarge, ml.g5.24xlarge, ml.g5.48xlarge, ml.g6.xlarge, ml.g6.2xlarge, ml.g6.4xlarge, ml.g6.8xlarge, ml.g6.12xlarge, ml.g6.16xlarge, ml.g6.24xlarge, ml.g6.48xlarge, ml.g6e.xlarge, ml.g6e.2xlarge, ml.g6e.4xlarge, ml.g6e.8xlarge, ml.g6e.12xlarge, ml.g6e.16xlarge, ml.g6e.24xlarge, ml.g6e.48xlarge, ml.inf2.xlarge, ml.inf2.8xlarge, ml.inf2.24xlarge, ml.inf2.48xlarge, ml.trn1.2xlarge, ml.trn1.32xlarge, ml.trn1n.32xlarge
8661
+ # max_instance_count: 1,
8636
8662
  # optimization_environment: {
8637
8663
  # "NonEmptyString256" => "String256",
8638
8664
  # },
@@ -8656,11 +8682,21 @@ module Aws::SageMaker
8656
8682
  # "NonEmptyString256" => "String256",
8657
8683
  # },
8658
8684
  # },
8685
+ # model_speculative_decoding_config: {
8686
+ # technique: "EAGLE", # required, accepts EAGLE
8687
+ # training_data_source: {
8688
+ # s3_uri: "S3Uri", # required
8689
+ # s3_data_type: "S3Prefix", # required, accepts S3Prefix, ManifestFile
8690
+ # },
8691
+ # },
8659
8692
  # },
8660
8693
  # ],
8661
8694
  # output_config: { # required
8662
8695
  # kms_key_id: "KmsKeyId",
8663
8696
  # s3_output_location: "S3Uri", # required
8697
+ # sage_maker_model: {
8698
+ # model_name: "ModelName",
8699
+ # },
8664
8700
  # },
8665
8701
  # stopping_condition: { # required
8666
8702
  # max_runtime_in_seconds: 1,
@@ -13650,6 +13686,7 @@ module Aws::SageMaker
13650
13686
  # resp.instance_groups #=> Array
13651
13687
  # resp.instance_groups[0].current_count #=> Integer
13652
13688
  # resp.instance_groups[0].target_count #=> Integer
13689
+ # resp.instance_groups[0].min_count #=> Integer
13653
13690
  # resp.instance_groups[0].instance_group_name #=> String
13654
13691
  # resp.instance_groups[0].instance_type #=> String, one of "ml.p4d.24xlarge", "ml.p4de.24xlarge", "ml.p5.48xlarge", "ml.p6e-gb200.36xlarge", "ml.trn1.32xlarge", "ml.trn1n.32xlarge", "ml.g5.xlarge", "ml.g5.2xlarge", "ml.g5.4xlarge", "ml.g5.8xlarge", "ml.g5.12xlarge", "ml.g5.16xlarge", "ml.g5.24xlarge", "ml.g5.48xlarge", "ml.c5.large", "ml.c5.xlarge", "ml.c5.2xlarge", "ml.c5.4xlarge", "ml.c5.9xlarge", "ml.c5.12xlarge", "ml.c5.18xlarge", "ml.c5.24xlarge", "ml.c5n.large", "ml.c5n.2xlarge", "ml.c5n.4xlarge", "ml.c5n.9xlarge", "ml.c5n.18xlarge", "ml.m5.large", "ml.m5.xlarge", "ml.m5.2xlarge", "ml.m5.4xlarge", "ml.m5.8xlarge", "ml.m5.12xlarge", "ml.m5.16xlarge", "ml.m5.24xlarge", "ml.t3.medium", "ml.t3.large", "ml.t3.xlarge", "ml.t3.2xlarge", "ml.g6.xlarge", "ml.g6.2xlarge", "ml.g6.4xlarge", "ml.g6.8xlarge", "ml.g6.16xlarge", "ml.g6.12xlarge", "ml.g6.24xlarge", "ml.g6.48xlarge", "ml.gr6.4xlarge", "ml.gr6.8xlarge", "ml.g6e.xlarge", "ml.g6e.2xlarge", "ml.g6e.4xlarge", "ml.g6e.8xlarge", "ml.g6e.16xlarge", "ml.g6e.12xlarge", "ml.g6e.24xlarge", "ml.g6e.48xlarge", "ml.p5e.48xlarge", "ml.p5en.48xlarge", "ml.p6-b200.48xlarge", "ml.trn2.3xlarge", "ml.trn2.48xlarge", "ml.c6i.large", "ml.c6i.xlarge", "ml.c6i.2xlarge", "ml.c6i.4xlarge", "ml.c6i.8xlarge", "ml.c6i.12xlarge", "ml.c6i.16xlarge", "ml.c6i.24xlarge", "ml.c6i.32xlarge", "ml.m6i.large", "ml.m6i.xlarge", "ml.m6i.2xlarge", "ml.m6i.4xlarge", "ml.m6i.8xlarge", "ml.m6i.12xlarge", "ml.m6i.16xlarge", "ml.m6i.24xlarge", "ml.m6i.32xlarge", "ml.r6i.large", "ml.r6i.xlarge", "ml.r6i.2xlarge", "ml.r6i.4xlarge", "ml.r6i.8xlarge", "ml.r6i.12xlarge", "ml.r6i.16xlarge", "ml.r6i.24xlarge", "ml.r6i.32xlarge", "ml.i3en.large", "ml.i3en.xlarge", "ml.i3en.2xlarge", "ml.i3en.3xlarge", "ml.i3en.6xlarge", "ml.i3en.12xlarge", "ml.i3en.24xlarge", "ml.m7i.large", "ml.m7i.xlarge", "ml.m7i.2xlarge", "ml.m7i.4xlarge", "ml.m7i.8xlarge", "ml.m7i.12xlarge", "ml.m7i.16xlarge", "ml.m7i.24xlarge", "ml.m7i.48xlarge", "ml.r7i.large", "ml.r7i.xlarge", 
"ml.r7i.2xlarge", "ml.r7i.4xlarge", "ml.r7i.8xlarge", "ml.r7i.12xlarge", "ml.r7i.16xlarge", "ml.r7i.24xlarge", "ml.r7i.48xlarge"
13655
13692
  # resp.instance_groups[0].life_cycle_config.source_s3_uri #=> String
@@ -13679,6 +13716,20 @@ module Aws::SageMaker
13679
13716
  # resp.instance_groups[0].scheduled_update_config.deployment_config.auto_rollback_configuration[0].alarm_name #=> String
13680
13717
  # resp.instance_groups[0].current_image_id #=> String
13681
13718
  # resp.instance_groups[0].desired_image_id #=> String
13719
+ # resp.instance_groups[0].active_operations #=> Hash
13720
+ # resp.instance_groups[0].active_operations["ActiveClusterOperationName"] #=> Integer
13721
+ # resp.instance_groups[0].kubernetes_config.current_labels #=> Hash
13722
+ # resp.instance_groups[0].kubernetes_config.current_labels["ClusterKubernetesLabelKey"] #=> String
13723
+ # resp.instance_groups[0].kubernetes_config.desired_labels #=> Hash
13724
+ # resp.instance_groups[0].kubernetes_config.desired_labels["ClusterKubernetesLabelKey"] #=> String
13725
+ # resp.instance_groups[0].kubernetes_config.current_taints #=> Array
13726
+ # resp.instance_groups[0].kubernetes_config.current_taints[0].key #=> String
13727
+ # resp.instance_groups[0].kubernetes_config.current_taints[0].value #=> String
13728
+ # resp.instance_groups[0].kubernetes_config.current_taints[0].effect #=> String, one of "NoSchedule", "PreferNoSchedule", "NoExecute"
13729
+ # resp.instance_groups[0].kubernetes_config.desired_taints #=> Array
13730
+ # resp.instance_groups[0].kubernetes_config.desired_taints[0].key #=> String
13731
+ # resp.instance_groups[0].kubernetes_config.desired_taints[0].value #=> String
13732
+ # resp.instance_groups[0].kubernetes_config.desired_taints[0].effect #=> String, one of "NoSchedule", "PreferNoSchedule", "NoExecute"
13682
13733
  # resp.instance_groups[0].target_state_count #=> Integer
13683
13734
  # resp.instance_groups[0].software_update_status #=> String, one of "Pending", "InProgress", "Succeeded", "Failed", "RollbackInProgress", "RollbackComplete"
13684
13735
  # resp.instance_groups[0].active_software_update_config.rolling_update_policy.maximum_batch_size.type #=> String, one of "INSTANCE_COUNT", "CAPACITY_PERCENTAGE"
@@ -13789,6 +13840,7 @@ module Aws::SageMaker
13789
13840
  # resp.event_details.event_details.event_metadata.instance_group.ami_override #=> String
13790
13841
  # resp.event_details.event_details.event_metadata.instance_group_scaling.instance_count #=> Integer
13791
13842
  # resp.event_details.event_details.event_metadata.instance_group_scaling.target_count #=> Integer
13843
+ # resp.event_details.event_details.event_metadata.instance_group_scaling.min_count #=> Integer
13792
13844
  # resp.event_details.event_details.event_metadata.instance_group_scaling.failure_message #=> String
13793
13845
  # resp.event_details.event_details.event_metadata.instance.customer_eni #=> String
13794
13846
  # resp.event_details.event_details.event_metadata.instance.additional_enis.efa_enis #=> Array
@@ -13866,6 +13918,19 @@ module Aws::SageMaker
13866
13918
  # resp.node_details.current_image_id #=> String
13867
13919
  # resp.node_details.desired_image_id #=> String
13868
13920
  # resp.node_details.ultra_server_info.id #=> String
13921
+ # resp.node_details.kubernetes_config.current_labels #=> Hash
13922
+ # resp.node_details.kubernetes_config.current_labels["ClusterKubernetesLabelKey"] #=> String
13923
+ # resp.node_details.kubernetes_config.desired_labels #=> Hash
13924
+ # resp.node_details.kubernetes_config.desired_labels["ClusterKubernetesLabelKey"] #=> String
13925
+ # resp.node_details.kubernetes_config.current_taints #=> Array
13926
+ # resp.node_details.kubernetes_config.current_taints[0].key #=> String
13927
+ # resp.node_details.kubernetes_config.current_taints[0].value #=> String
13928
+ # resp.node_details.kubernetes_config.current_taints[0].effect #=> String, one of "NoSchedule", "PreferNoSchedule", "NoExecute"
13929
+ # resp.node_details.kubernetes_config.desired_taints #=> Array
13930
+ # resp.node_details.kubernetes_config.desired_taints[0].key #=> String
13931
+ # resp.node_details.kubernetes_config.desired_taints[0].value #=> String
13932
+ # resp.node_details.kubernetes_config.desired_taints[0].effect #=> String, one of "NoSchedule", "PreferNoSchedule", "NoExecute"
13933
+ # resp.node_details.capacity_type #=> String, one of "Spot", "OnDemand"
13869
13934
  #
13870
13935
  # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/DescribeClusterNode AWS API Documentation
13871
13936
  #
@@ -17608,6 +17673,7 @@ module Aws::SageMaker
17608
17673
  # * {Types::DescribeOptimizationJobResponse#model_source #model_source} => Types::OptimizationJobModelSource
17609
17674
  # * {Types::DescribeOptimizationJobResponse#optimization_environment #optimization_environment} => Hash&lt;String,String&gt;
17610
17675
  # * {Types::DescribeOptimizationJobResponse#deployment_instance_type #deployment_instance_type} => String
17676
+ # * {Types::DescribeOptimizationJobResponse#max_instance_count #max_instance_count} => Integer
17611
17677
  # * {Types::DescribeOptimizationJobResponse#optimization_configs #optimization_configs} => Array&lt;Types::OptimizationConfig&gt;
17612
17678
  # * {Types::DescribeOptimizationJobResponse#output_config #output_config} => Types::OptimizationJobOutputConfig
17613
17679
  # * {Types::DescribeOptimizationJobResponse#optimization_output #optimization_output} => Types::OptimizationOutput
@@ -17633,9 +17699,11 @@ module Aws::SageMaker
17633
17699
  # resp.optimization_job_name #=> String
17634
17700
  # resp.model_source.s3.s3_uri #=> String
17635
17701
  # resp.model_source.s3.model_access_config.accept_eula #=> Boolean
17702
+ # resp.model_source.sage_maker_model.model_name #=> String
17636
17703
  # resp.optimization_environment #=> Hash
17637
17704
  # resp.optimization_environment["NonEmptyString256"] #=> String
17638
- # resp.deployment_instance_type #=> String, one of "ml.p4d.24xlarge", "ml.p4de.24xlarge", "ml.p5.48xlarge", "ml.g5.xlarge", "ml.g5.2xlarge", "ml.g5.4xlarge", "ml.g5.8xlarge", "ml.g5.12xlarge", "ml.g5.16xlarge", "ml.g5.24xlarge", "ml.g5.48xlarge", "ml.g6.xlarge", "ml.g6.2xlarge", "ml.g6.4xlarge", "ml.g6.8xlarge", "ml.g6.12xlarge", "ml.g6.16xlarge", "ml.g6.24xlarge", "ml.g6.48xlarge", "ml.g6e.xlarge", "ml.g6e.2xlarge", "ml.g6e.4xlarge", "ml.g6e.8xlarge", "ml.g6e.12xlarge", "ml.g6e.16xlarge", "ml.g6e.24xlarge", "ml.g6e.48xlarge", "ml.inf2.xlarge", "ml.inf2.8xlarge", "ml.inf2.24xlarge", "ml.inf2.48xlarge", "ml.trn1.2xlarge", "ml.trn1.32xlarge", "ml.trn1n.32xlarge"
17705
+ # resp.deployment_instance_type #=> String, one of "ml.p4d.24xlarge", "ml.p4de.24xlarge", "ml.p5.48xlarge", "ml.p5e.48xlarge", "ml.p5en.48xlarge", "ml.g5.xlarge", "ml.g5.2xlarge", "ml.g5.4xlarge", "ml.g5.8xlarge", "ml.g5.12xlarge", "ml.g5.16xlarge", "ml.g5.24xlarge", "ml.g5.48xlarge", "ml.g6.xlarge", "ml.g6.2xlarge", "ml.g6.4xlarge", "ml.g6.8xlarge", "ml.g6.12xlarge", "ml.g6.16xlarge", "ml.g6.24xlarge", "ml.g6.48xlarge", "ml.g6e.xlarge", "ml.g6e.2xlarge", "ml.g6e.4xlarge", "ml.g6e.8xlarge", "ml.g6e.12xlarge", "ml.g6e.16xlarge", "ml.g6e.24xlarge", "ml.g6e.48xlarge", "ml.inf2.xlarge", "ml.inf2.8xlarge", "ml.inf2.24xlarge", "ml.inf2.48xlarge", "ml.trn1.2xlarge", "ml.trn1.32xlarge", "ml.trn1n.32xlarge"
17706
+ # resp.max_instance_count #=> Integer
17639
17707
  # resp.optimization_configs #=> Array
17640
17708
  # resp.optimization_configs[0].model_quantization_config.image #=> String
17641
17709
  # resp.optimization_configs[0].model_quantization_config.override_environment #=> Hash
@@ -17646,8 +17714,12 @@ module Aws::SageMaker
17646
17714
  # resp.optimization_configs[0].model_sharding_config.image #=> String
17647
17715
  # resp.optimization_configs[0].model_sharding_config.override_environment #=> Hash
17648
17716
  # resp.optimization_configs[0].model_sharding_config.override_environment["NonEmptyString256"] #=> String
17717
+ # resp.optimization_configs[0].model_speculative_decoding_config.technique #=> String, one of "EAGLE"
17718
+ # resp.optimization_configs[0].model_speculative_decoding_config.training_data_source.s3_uri #=> String
17719
+ # resp.optimization_configs[0].model_speculative_decoding_config.training_data_source.s3_data_type #=> String, one of "S3Prefix", "ManifestFile"
17649
17720
  # resp.output_config.kms_key_id #=> String
17650
17721
  # resp.output_config.s3_output_location #=> String
17722
+ # resp.output_config.sage_maker_model.model_name #=> String
17651
17723
  # resp.optimization_output.recommended_inference_image #=> String
17652
17724
  # resp.role_arn #=> String
17653
17725
  # resp.stopping_condition.max_runtime_in_seconds #=> Integer
@@ -24473,7 +24545,8 @@ module Aws::SageMaker
24473
24545
  # resp.optimization_job_summaries[0].optimization_start_time #=> Time
24474
24546
  # resp.optimization_job_summaries[0].optimization_end_time #=> Time
24475
24547
  # resp.optimization_job_summaries[0].last_modified_time #=> Time
24476
- # resp.optimization_job_summaries[0].deployment_instance_type #=> String, one of "ml.p4d.24xlarge", "ml.p4de.24xlarge", "ml.p5.48xlarge", "ml.g5.xlarge", "ml.g5.2xlarge", "ml.g5.4xlarge", "ml.g5.8xlarge", "ml.g5.12xlarge", "ml.g5.16xlarge", "ml.g5.24xlarge", "ml.g5.48xlarge", "ml.g6.xlarge", "ml.g6.2xlarge", "ml.g6.4xlarge", "ml.g6.8xlarge", "ml.g6.12xlarge", "ml.g6.16xlarge", "ml.g6.24xlarge", "ml.g6.48xlarge", "ml.g6e.xlarge", "ml.g6e.2xlarge", "ml.g6e.4xlarge", "ml.g6e.8xlarge", "ml.g6e.12xlarge", "ml.g6e.16xlarge", "ml.g6e.24xlarge", "ml.g6e.48xlarge", "ml.inf2.xlarge", "ml.inf2.8xlarge", "ml.inf2.24xlarge", "ml.inf2.48xlarge", "ml.trn1.2xlarge", "ml.trn1.32xlarge", "ml.trn1n.32xlarge"
24548
+ # resp.optimization_job_summaries[0].deployment_instance_type #=> String, one of "ml.p4d.24xlarge", "ml.p4de.24xlarge", "ml.p5.48xlarge", "ml.p5e.48xlarge", "ml.p5en.48xlarge", "ml.g5.xlarge", "ml.g5.2xlarge", "ml.g5.4xlarge", "ml.g5.8xlarge", "ml.g5.12xlarge", "ml.g5.16xlarge", "ml.g5.24xlarge", "ml.g5.48xlarge", "ml.g6.xlarge", "ml.g6.2xlarge", "ml.g6.4xlarge", "ml.g6.8xlarge", "ml.g6.12xlarge", "ml.g6.16xlarge", "ml.g6.24xlarge", "ml.g6.48xlarge", "ml.g6e.xlarge", "ml.g6e.2xlarge", "ml.g6e.4xlarge", "ml.g6e.8xlarge", "ml.g6e.12xlarge", "ml.g6e.16xlarge", "ml.g6e.24xlarge", "ml.g6e.48xlarge", "ml.inf2.xlarge", "ml.inf2.8xlarge", "ml.inf2.24xlarge", "ml.inf2.48xlarge", "ml.trn1.2xlarge", "ml.trn1.32xlarge", "ml.trn1n.32xlarge"
24549
+ # resp.optimization_job_summaries[0].max_instance_count #=> Integer
24477
24550
  # resp.optimization_job_summaries[0].optimization_types #=> Array
24478
24551
  # resp.optimization_job_summaries[0].optimization_types[0] #=> String
24479
24552
  # resp.next_token #=> String
@@ -27812,6 +27885,7 @@ module Aws::SageMaker
27812
27885
  # instance_groups: [
27813
27886
  # {
27814
27887
  # instance_count: 1, # required
27888
+ # min_instance_count: 1,
27815
27889
  # instance_group_name: "ClusterInstanceGroupName", # required
27816
27890
  # instance_type: "ml.p4d.24xlarge", # required, accepts ml.p4d.24xlarge, ml.p4de.24xlarge, ml.p5.48xlarge, ml.p6e-gb200.36xlarge, ml.trn1.32xlarge, ml.trn1n.32xlarge, ml.g5.xlarge, ml.g5.2xlarge, ml.g5.4xlarge, ml.g5.8xlarge, ml.g5.12xlarge, ml.g5.16xlarge, ml.g5.24xlarge, ml.g5.48xlarge, ml.c5.large, ml.c5.xlarge, ml.c5.2xlarge, ml.c5.4xlarge, ml.c5.9xlarge, ml.c5.12xlarge, ml.c5.18xlarge, ml.c5.24xlarge, ml.c5n.large, ml.c5n.2xlarge, ml.c5n.4xlarge, ml.c5n.9xlarge, ml.c5n.18xlarge, ml.m5.large, ml.m5.xlarge, ml.m5.2xlarge, ml.m5.4xlarge, ml.m5.8xlarge, ml.m5.12xlarge, ml.m5.16xlarge, ml.m5.24xlarge, ml.t3.medium, ml.t3.large, ml.t3.xlarge, ml.t3.2xlarge, ml.g6.xlarge, ml.g6.2xlarge, ml.g6.4xlarge, ml.g6.8xlarge, ml.g6.16xlarge, ml.g6.12xlarge, ml.g6.24xlarge, ml.g6.48xlarge, ml.gr6.4xlarge, ml.gr6.8xlarge, ml.g6e.xlarge, ml.g6e.2xlarge, ml.g6e.4xlarge, ml.g6e.8xlarge, ml.g6e.16xlarge, ml.g6e.12xlarge, ml.g6e.24xlarge, ml.g6e.48xlarge, ml.p5e.48xlarge, ml.p5en.48xlarge, ml.p6-b200.48xlarge, ml.trn2.3xlarge, ml.trn2.48xlarge, ml.c6i.large, ml.c6i.xlarge, ml.c6i.2xlarge, ml.c6i.4xlarge, ml.c6i.8xlarge, ml.c6i.12xlarge, ml.c6i.16xlarge, ml.c6i.24xlarge, ml.c6i.32xlarge, ml.m6i.large, ml.m6i.xlarge, ml.m6i.2xlarge, ml.m6i.4xlarge, ml.m6i.8xlarge, ml.m6i.12xlarge, ml.m6i.16xlarge, ml.m6i.24xlarge, ml.m6i.32xlarge, ml.r6i.large, ml.r6i.xlarge, ml.r6i.2xlarge, ml.r6i.4xlarge, ml.r6i.8xlarge, ml.r6i.12xlarge, ml.r6i.16xlarge, ml.r6i.24xlarge, ml.r6i.32xlarge, ml.i3en.large, ml.i3en.xlarge, ml.i3en.2xlarge, ml.i3en.3xlarge, ml.i3en.6xlarge, ml.i3en.12xlarge, ml.i3en.24xlarge, ml.m7i.large, ml.m7i.xlarge, ml.m7i.2xlarge, ml.m7i.4xlarge, ml.m7i.8xlarge, ml.m7i.12xlarge, ml.m7i.16xlarge, ml.m7i.24xlarge, ml.m7i.48xlarge, ml.r7i.large, ml.r7i.xlarge, ml.r7i.2xlarge, ml.r7i.4xlarge, ml.r7i.8xlarge, ml.r7i.12xlarge, ml.r7i.16xlarge, ml.r7i.24xlarge, ml.r7i.48xlarge
27817
27891
  # life_cycle_config: { # required
@@ -27857,6 +27931,24 @@ module Aws::SageMaker
27857
27931
  # },
27858
27932
  # },
27859
27933
  # image_id: "ImageId",
27934
+ # kubernetes_config: {
27935
+ # labels: {
27936
+ # "ClusterKubernetesLabelKey" => "ClusterKubernetesLabelValue",
27937
+ # },
27938
+ # taints: [
27939
+ # {
27940
+ # key: "ClusterKubernetesTaintKey", # required
27941
+ # value: "ClusterKubernetesTaintValue",
27942
+ # effect: "NoSchedule", # required, accepts NoSchedule, PreferNoSchedule, NoExecute
27943
+ # },
27944
+ # ],
27945
+ # },
27946
+ # capacity_requirements: {
27947
+ # spot: {
27948
+ # },
27949
+ # on_demand: {
27950
+ # },
27951
+ # },
27860
27952
  # },
27861
27953
  # ],
27862
27954
  # restricted_instance_groups: [
@@ -31579,7 +31671,7 @@ module Aws::SageMaker
31579
31671
  tracer: tracer
31580
31672
  )
31581
31673
  context[:gem_name] = 'aws-sdk-sagemaker'
31582
- context[:gem_version] = '1.340.0'
31674
+ context[:gem_version] = '1.341.0'
31583
31675
  Seahorse::Client::Request.new(handlers, context)
31584
31676
  end
31585
31677
 
@@ -26,6 +26,9 @@ module Aws::SageMaker
26
26
  ActionSummaries = Shapes::ListShape.new(name: 'ActionSummaries')
27
27
  ActionSummary = Shapes::StructureShape.new(name: 'ActionSummary')
28
28
  ActivationState = Shapes::StringShape.new(name: 'ActivationState')
29
+ ActiveClusterOperationCount = Shapes::IntegerShape.new(name: 'ActiveClusterOperationCount')
30
+ ActiveClusterOperationName = Shapes::StringShape.new(name: 'ActiveClusterOperationName')
31
+ ActiveOperations = Shapes::MapShape.new(name: 'ActiveOperations')
29
32
  AddAssociationRequest = Shapes::StructureShape.new(name: 'AddAssociationRequest')
30
33
  AddAssociationResponse = Shapes::StructureShape.new(name: 'AddAssociationResponse')
31
34
  AddClusterNodeSpecification = Shapes::StructureShape.new(name: 'AddClusterNodeSpecification')
@@ -342,6 +345,8 @@ module Aws::SageMaker
342
345
  ClusterAutoScalingStatus = Shapes::StringShape.new(name: 'ClusterAutoScalingStatus')
343
346
  ClusterAvailabilityZone = Shapes::StringShape.new(name: 'ClusterAvailabilityZone')
344
347
  ClusterAvailabilityZoneId = Shapes::StringShape.new(name: 'ClusterAvailabilityZoneId')
348
+ ClusterCapacityRequirements = Shapes::StructureShape.new(name: 'ClusterCapacityRequirements')
349
+ ClusterCapacityType = Shapes::StringShape.new(name: 'ClusterCapacityType')
345
350
  ClusterConfigMode = Shapes::StringShape.new(name: 'ClusterConfigMode')
346
351
  ClusterEbsVolumeConfig = Shapes::StructureShape.new(name: 'ClusterEbsVolumeConfig')
347
352
  ClusterEbsVolumeSizeInGB = Shapes::IntegerShape.new(name: 'ClusterEbsVolumeSizeInGB')
@@ -364,6 +369,17 @@ module Aws::SageMaker
364
369
  ClusterInstanceStorageConfig = Shapes::UnionShape.new(name: 'ClusterInstanceStorageConfig')
365
370
  ClusterInstanceStorageConfigs = Shapes::ListShape.new(name: 'ClusterInstanceStorageConfigs')
366
371
  ClusterInstanceType = Shapes::StringShape.new(name: 'ClusterInstanceType')
372
+ ClusterKubernetesConfig = Shapes::StructureShape.new(name: 'ClusterKubernetesConfig')
373
+ ClusterKubernetesConfigDetails = Shapes::StructureShape.new(name: 'ClusterKubernetesConfigDetails')
374
+ ClusterKubernetesConfigNodeDetails = Shapes::StructureShape.new(name: 'ClusterKubernetesConfigNodeDetails')
375
+ ClusterKubernetesLabelKey = Shapes::StringShape.new(name: 'ClusterKubernetesLabelKey')
376
+ ClusterKubernetesLabelValue = Shapes::StringShape.new(name: 'ClusterKubernetesLabelValue')
377
+ ClusterKubernetesLabels = Shapes::MapShape.new(name: 'ClusterKubernetesLabels')
378
+ ClusterKubernetesTaint = Shapes::StructureShape.new(name: 'ClusterKubernetesTaint')
379
+ ClusterKubernetesTaintEffect = Shapes::StringShape.new(name: 'ClusterKubernetesTaintEffect')
380
+ ClusterKubernetesTaintKey = Shapes::StringShape.new(name: 'ClusterKubernetesTaintKey')
381
+ ClusterKubernetesTaintValue = Shapes::StringShape.new(name: 'ClusterKubernetesTaintValue')
382
+ ClusterKubernetesTaints = Shapes::ListShape.new(name: 'ClusterKubernetesTaints')
367
383
  ClusterLifeCycleConfig = Shapes::StructureShape.new(name: 'ClusterLifeCycleConfig')
368
384
  ClusterLifeCycleConfigFileName = Shapes::StringShape.new(name: 'ClusterLifeCycleConfigFileName')
369
385
  ClusterMetadata = Shapes::StructureShape.new(name: 'ClusterMetadata')
@@ -379,6 +395,7 @@ module Aws::SageMaker
379
395
  ClusterNodeSummaries = Shapes::ListShape.new(name: 'ClusterNodeSummaries')
380
396
  ClusterNodeSummary = Shapes::StructureShape.new(name: 'ClusterNodeSummary')
381
397
  ClusterNonNegativeInstanceCount = Shapes::IntegerShape.new(name: 'ClusterNonNegativeInstanceCount')
398
+ ClusterOnDemandOptions = Shapes::StructureShape.new(name: 'ClusterOnDemandOptions')
382
399
  ClusterOrchestrator = Shapes::StructureShape.new(name: 'ClusterOrchestrator')
383
400
  ClusterOrchestratorEksConfig = Shapes::StructureShape.new(name: 'ClusterOrchestratorEksConfig')
384
401
  ClusterPrivateDnsHostname = Shapes::StringShape.new(name: 'ClusterPrivateDnsHostname')
@@ -394,6 +411,7 @@ module Aws::SageMaker
394
411
  ClusterSchedulerConfigSummaryList = Shapes::ListShape.new(name: 'ClusterSchedulerConfigSummaryList')
395
412
  ClusterSchedulerPriorityClassName = Shapes::StringShape.new(name: 'ClusterSchedulerPriorityClassName')
396
413
  ClusterSortBy = Shapes::StringShape.new(name: 'ClusterSortBy')
414
+ ClusterSpotOptions = Shapes::StructureShape.new(name: 'ClusterSpotOptions')
397
415
  ClusterStatus = Shapes::StringShape.new(name: 'ClusterStatus')
398
416
  ClusterSummaries = Shapes::ListShape.new(name: 'ClusterSummaries')
399
417
  ClusterSummary = Shapes::StructureShape.new(name: 'ClusterSummary')
@@ -1743,6 +1761,10 @@ module Aws::SageMaker
1743
1761
  ModelSetupTime = Shapes::IntegerShape.new(name: 'ModelSetupTime')
1744
1762
  ModelShardingConfig = Shapes::StructureShape.new(name: 'ModelShardingConfig')
1745
1763
  ModelSortKey = Shapes::StringShape.new(name: 'ModelSortKey')
1764
+ ModelSpeculativeDecodingConfig = Shapes::StructureShape.new(name: 'ModelSpeculativeDecodingConfig')
1765
+ ModelSpeculativeDecodingS3DataType = Shapes::StringShape.new(name: 'ModelSpeculativeDecodingS3DataType')
1766
+ ModelSpeculativeDecodingTechnique = Shapes::StringShape.new(name: 'ModelSpeculativeDecodingTechnique')
1767
+ ModelSpeculativeDecodingTrainingDataSource = Shapes::StructureShape.new(name: 'ModelSpeculativeDecodingTrainingDataSource')
1746
1768
  ModelStepMetadata = Shapes::StructureShape.new(name: 'ModelStepMetadata')
1747
1769
  ModelSummary = Shapes::StructureShape.new(name: 'ModelSummary')
1748
1770
  ModelSummaryList = Shapes::ListShape.new(name: 'ModelSummaryList')
@@ -1877,6 +1899,7 @@ module Aws::SageMaker
1877
1899
  OptimizationJobArn = Shapes::StringShape.new(name: 'OptimizationJobArn')
1878
1900
  OptimizationJobDeploymentInstanceType = Shapes::StringShape.new(name: 'OptimizationJobDeploymentInstanceType')
1879
1901
  OptimizationJobEnvironmentVariables = Shapes::MapShape.new(name: 'OptimizationJobEnvironmentVariables')
1902
+ OptimizationJobMaxInstanceCount = Shapes::IntegerShape.new(name: 'OptimizationJobMaxInstanceCount')
1880
1903
  OptimizationJobModelSource = Shapes::StructureShape.new(name: 'OptimizationJobModelSource')
1881
1904
  OptimizationJobModelSourceS3 = Shapes::StructureShape.new(name: 'OptimizationJobModelSourceS3')
1882
1905
  OptimizationJobOutputConfig = Shapes::StructureShape.new(name: 'OptimizationJobOutputConfig')
@@ -1886,6 +1909,7 @@ module Aws::SageMaker
1886
1909
  OptimizationModelAcceptEula = Shapes::BooleanShape.new(name: 'OptimizationModelAcceptEula')
1887
1910
  OptimizationModelAccessConfig = Shapes::StructureShape.new(name: 'OptimizationModelAccessConfig')
1888
1911
  OptimizationOutput = Shapes::StructureShape.new(name: 'OptimizationOutput')
1912
+ OptimizationSageMakerModel = Shapes::StructureShape.new(name: 'OptimizationSageMakerModel')
1889
1913
  OptimizationType = Shapes::StringShape.new(name: 'OptimizationType')
1890
1914
  OptimizationTypes = Shapes::ListShape.new(name: 'OptimizationTypes')
1891
1915
  OptimizationVpcConfig = Shapes::StructureShape.new(name: 'OptimizationVpcConfig')
@@ -2749,6 +2773,9 @@ module Aws::SageMaker
2749
2773
  ActionSummary.add_member(:last_modified_time, Shapes::ShapeRef.new(shape: Timestamp, location_name: "LastModifiedTime"))
2750
2774
  ActionSummary.struct_class = Types::ActionSummary
2751
2775
 
2776
+ ActiveOperations.key = Shapes::ShapeRef.new(shape: ActiveClusterOperationName)
2777
+ ActiveOperations.value = Shapes::ShapeRef.new(shape: ActiveClusterOperationCount)
2778
+
2752
2779
  AddAssociationRequest.add_member(:source_arn, Shapes::ShapeRef.new(shape: AssociationEntityArn, required: true, location_name: "SourceArn"))
2753
2780
  AddAssociationRequest.add_member(:destination_arn, Shapes::ShapeRef.new(shape: AssociationEntityArn, required: true, location_name: "DestinationArn"))
2754
2781
  AddAssociationRequest.add_member(:association_type, Shapes::ShapeRef.new(shape: AssociationEdgeType, location_name: "AssociationType"))
@@ -3516,6 +3543,10 @@ module Aws::SageMaker
3516
3543
  ClusterAutoScalingConfigOutput.add_member(:failure_message, Shapes::ShapeRef.new(shape: String, location_name: "FailureMessage"))
3517
3544
  ClusterAutoScalingConfigOutput.struct_class = Types::ClusterAutoScalingConfigOutput
3518
3545
 
3546
+ ClusterCapacityRequirements.add_member(:spot, Shapes::ShapeRef.new(shape: ClusterSpotOptions, location_name: "Spot"))
3547
+ ClusterCapacityRequirements.add_member(:on_demand, Shapes::ShapeRef.new(shape: ClusterOnDemandOptions, location_name: "OnDemand"))
3548
+ ClusterCapacityRequirements.struct_class = Types::ClusterCapacityRequirements
3549
+
3519
3550
  ClusterEbsVolumeConfig.add_member(:volume_size_in_gb, Shapes::ShapeRef.new(shape: ClusterEbsVolumeSizeInGB, location_name: "VolumeSizeInGB"))
3520
3551
  ClusterEbsVolumeConfig.add_member(:volume_kms_key_id, Shapes::ShapeRef.new(shape: KmsKeyId, location_name: "VolumeKmsKeyId"))
3521
3552
  ClusterEbsVolumeConfig.add_member(:root_volume, Shapes::ShapeRef.new(shape: Boolean, location_name: "RootVolume", metadata: {"box" => true}))
@@ -3546,6 +3577,7 @@ module Aws::SageMaker
3546
3577
 
3547
3578
  ClusterInstanceGroupDetails.add_member(:current_count, Shapes::ShapeRef.new(shape: ClusterNonNegativeInstanceCount, location_name: "CurrentCount"))
3548
3579
  ClusterInstanceGroupDetails.add_member(:target_count, Shapes::ShapeRef.new(shape: ClusterInstanceCount, location_name: "TargetCount"))
3580
+ ClusterInstanceGroupDetails.add_member(:min_count, Shapes::ShapeRef.new(shape: ClusterInstanceCount, location_name: "MinCount"))
3549
3581
  ClusterInstanceGroupDetails.add_member(:instance_group_name, Shapes::ShapeRef.new(shape: ClusterInstanceGroupName, location_name: "InstanceGroupName"))
3550
3582
  ClusterInstanceGroupDetails.add_member(:instance_type, Shapes::ShapeRef.new(shape: ClusterInstanceType, location_name: "InstanceType"))
3551
3583
  ClusterInstanceGroupDetails.add_member(:life_cycle_config, Shapes::ShapeRef.new(shape: ClusterLifeCycleConfig, location_name: "LifeCycleConfig"))
@@ -3560,6 +3592,9 @@ module Aws::SageMaker
3560
3592
  ClusterInstanceGroupDetails.add_member(:scheduled_update_config, Shapes::ShapeRef.new(shape: ScheduledUpdateConfig, location_name: "ScheduledUpdateConfig"))
3561
3593
  ClusterInstanceGroupDetails.add_member(:current_image_id, Shapes::ShapeRef.new(shape: ImageId, location_name: "CurrentImageId"))
3562
3594
  ClusterInstanceGroupDetails.add_member(:desired_image_id, Shapes::ShapeRef.new(shape: ImageId, location_name: "DesiredImageId"))
3595
+ ClusterInstanceGroupDetails.add_member(:active_operations, Shapes::ShapeRef.new(shape: ActiveOperations, location_name: "ActiveOperations"))
3596
+ ClusterInstanceGroupDetails.add_member(:kubernetes_config, Shapes::ShapeRef.new(shape: ClusterKubernetesConfigDetails, location_name: "KubernetesConfig"))
3597
+ ClusterInstanceGroupDetails.add_member(:capacity_requirements, Shapes::ShapeRef.new(shape: ClusterCapacityRequirements, location_name: "CapacityRequirements"))
3563
3598
  ClusterInstanceGroupDetails.add_member(:target_state_count, Shapes::ShapeRef.new(shape: ClusterInstanceCount, location_name: "TargetStateCount"))
3564
3599
  ClusterInstanceGroupDetails.add_member(:software_update_status, Shapes::ShapeRef.new(shape: SoftwareUpdateStatus, location_name: "SoftwareUpdateStatus"))
3565
3600
  ClusterInstanceGroupDetails.add_member(:active_software_update_config, Shapes::ShapeRef.new(shape: DeploymentConfiguration, location_name: "ActiveSoftwareUpdateConfig"))
@@ -3568,6 +3603,7 @@ module Aws::SageMaker
3568
3603
  ClusterInstanceGroupDetailsList.member = Shapes::ShapeRef.new(shape: ClusterInstanceGroupDetails)
3569
3604
 
3570
3605
  ClusterInstanceGroupSpecification.add_member(:instance_count, Shapes::ShapeRef.new(shape: ClusterInstanceCount, required: true, location_name: "InstanceCount"))
3606
+ ClusterInstanceGroupSpecification.add_member(:min_instance_count, Shapes::ShapeRef.new(shape: ClusterInstanceCount, location_name: "MinInstanceCount"))
3571
3607
  ClusterInstanceGroupSpecification.add_member(:instance_group_name, Shapes::ShapeRef.new(shape: ClusterInstanceGroupName, required: true, location_name: "InstanceGroupName"))
3572
3608
  ClusterInstanceGroupSpecification.add_member(:instance_type, Shapes::ShapeRef.new(shape: ClusterInstanceType, required: true, location_name: "InstanceType"))
3573
3609
  ClusterInstanceGroupSpecification.add_member(:life_cycle_config, Shapes::ShapeRef.new(shape: ClusterLifeCycleConfig, required: true, location_name: "LifeCycleConfig"))
@@ -3579,6 +3615,8 @@ module Aws::SageMaker
3579
3615
  ClusterInstanceGroupSpecification.add_member(:override_vpc_config, Shapes::ShapeRef.new(shape: VpcConfig, location_name: "OverrideVpcConfig"))
3580
3616
  ClusterInstanceGroupSpecification.add_member(:scheduled_update_config, Shapes::ShapeRef.new(shape: ScheduledUpdateConfig, location_name: "ScheduledUpdateConfig"))
3581
3617
  ClusterInstanceGroupSpecification.add_member(:image_id, Shapes::ShapeRef.new(shape: ImageId, location_name: "ImageId"))
3618
+ ClusterInstanceGroupSpecification.add_member(:kubernetes_config, Shapes::ShapeRef.new(shape: ClusterKubernetesConfig, location_name: "KubernetesConfig"))
3619
+ ClusterInstanceGroupSpecification.add_member(:capacity_requirements, Shapes::ShapeRef.new(shape: ClusterCapacityRequirements, location_name: "CapacityRequirements"))
3582
3620
  ClusterInstanceGroupSpecification.struct_class = Types::ClusterInstanceGroupSpecification
3583
3621
 
3584
3622
  ClusterInstanceGroupSpecifications.member = Shapes::ShapeRef.new(shape: ClusterInstanceGroupSpecification)
@@ -3601,6 +3639,32 @@ module Aws::SageMaker
3601
3639
 
3602
3640
  ClusterInstanceStorageConfigs.member = Shapes::ShapeRef.new(shape: ClusterInstanceStorageConfig)
3603
3641
 
3642
+ ClusterKubernetesConfig.add_member(:labels, Shapes::ShapeRef.new(shape: ClusterKubernetesLabels, location_name: "Labels"))
3643
+ ClusterKubernetesConfig.add_member(:taints, Shapes::ShapeRef.new(shape: ClusterKubernetesTaints, location_name: "Taints"))
3644
+ ClusterKubernetesConfig.struct_class = Types::ClusterKubernetesConfig
3645
+
3646
+ ClusterKubernetesConfigDetails.add_member(:current_labels, Shapes::ShapeRef.new(shape: ClusterKubernetesLabels, location_name: "CurrentLabels"))
3647
+ ClusterKubernetesConfigDetails.add_member(:desired_labels, Shapes::ShapeRef.new(shape: ClusterKubernetesLabels, location_name: "DesiredLabels"))
3648
+ ClusterKubernetesConfigDetails.add_member(:current_taints, Shapes::ShapeRef.new(shape: ClusterKubernetesTaints, location_name: "CurrentTaints"))
3649
+ ClusterKubernetesConfigDetails.add_member(:desired_taints, Shapes::ShapeRef.new(shape: ClusterKubernetesTaints, location_name: "DesiredTaints"))
3650
+ ClusterKubernetesConfigDetails.struct_class = Types::ClusterKubernetesConfigDetails
3651
+
3652
+ ClusterKubernetesConfigNodeDetails.add_member(:current_labels, Shapes::ShapeRef.new(shape: ClusterKubernetesLabels, location_name: "CurrentLabels"))
3653
+ ClusterKubernetesConfigNodeDetails.add_member(:desired_labels, Shapes::ShapeRef.new(shape: ClusterKubernetesLabels, location_name: "DesiredLabels"))
3654
+ ClusterKubernetesConfigNodeDetails.add_member(:current_taints, Shapes::ShapeRef.new(shape: ClusterKubernetesTaints, location_name: "CurrentTaints"))
3655
+ ClusterKubernetesConfigNodeDetails.add_member(:desired_taints, Shapes::ShapeRef.new(shape: ClusterKubernetesTaints, location_name: "DesiredTaints"))
3656
+ ClusterKubernetesConfigNodeDetails.struct_class = Types::ClusterKubernetesConfigNodeDetails
3657
+
3658
+ ClusterKubernetesLabels.key = Shapes::ShapeRef.new(shape: ClusterKubernetesLabelKey)
3659
+ ClusterKubernetesLabels.value = Shapes::ShapeRef.new(shape: ClusterKubernetesLabelValue)
3660
+
3661
+ ClusterKubernetesTaint.add_member(:key, Shapes::ShapeRef.new(shape: ClusterKubernetesTaintKey, required: true, location_name: "Key"))
3662
+ ClusterKubernetesTaint.add_member(:value, Shapes::ShapeRef.new(shape: ClusterKubernetesTaintValue, location_name: "Value"))
3663
+ ClusterKubernetesTaint.add_member(:effect, Shapes::ShapeRef.new(shape: ClusterKubernetesTaintEffect, required: true, location_name: "Effect"))
3664
+ ClusterKubernetesTaint.struct_class = Types::ClusterKubernetesTaint
3665
+
3666
+ ClusterKubernetesTaints.member = Shapes::ShapeRef.new(shape: ClusterKubernetesTaint)
3667
+
3604
3668
  ClusterLifeCycleConfig.add_member(:source_s3_uri, Shapes::ShapeRef.new(shape: S3Uri, required: true, location_name: "SourceS3Uri"))
3605
3669
  ClusterLifeCycleConfig.add_member(:on_create, Shapes::ShapeRef.new(shape: ClusterLifeCycleConfigFileName, required: true, location_name: "OnCreate"))
3606
3670
  ClusterLifeCycleConfig.struct_class = Types::ClusterLifeCycleConfig
@@ -3628,6 +3692,8 @@ module Aws::SageMaker
3628
3692
  ClusterNodeDetails.add_member(:current_image_id, Shapes::ShapeRef.new(shape: ImageId, location_name: "CurrentImageId"))
3629
3693
  ClusterNodeDetails.add_member(:desired_image_id, Shapes::ShapeRef.new(shape: ImageId, location_name: "DesiredImageId"))
3630
3694
  ClusterNodeDetails.add_member(:ultra_server_info, Shapes::ShapeRef.new(shape: UltraServerInfo, location_name: "UltraServerInfo"))
3695
+ ClusterNodeDetails.add_member(:kubernetes_config, Shapes::ShapeRef.new(shape: ClusterKubernetesConfigNodeDetails, location_name: "KubernetesConfig"))
3696
+ ClusterNodeDetails.add_member(:capacity_type, Shapes::ShapeRef.new(shape: ClusterCapacityType, location_name: "CapacityType"))
3631
3697
  ClusterNodeDetails.struct_class = Types::ClusterNodeDetails
3632
3698
 
3633
3699
  ClusterNodeIds.member = Shapes::ShapeRef.new(shape: ClusterNodeId)
@@ -3647,6 +3713,8 @@ module Aws::SageMaker
3647
3713
  ClusterNodeSummary.add_member(:private_dns_hostname, Shapes::ShapeRef.new(shape: ClusterPrivateDnsHostname, location_name: "PrivateDnsHostname"))
3648
3714
  ClusterNodeSummary.struct_class = Types::ClusterNodeSummary
3649
3715
 
3716
+ ClusterOnDemandOptions.struct_class = Types::ClusterOnDemandOptions
3717
+
3650
3718
  ClusterOrchestrator.add_member(:eks, Shapes::ShapeRef.new(shape: ClusterOrchestratorEksConfig, required: true, location_name: "Eks"))
3651
3719
  ClusterOrchestrator.struct_class = Types::ClusterOrchestrator
3652
3720
 
@@ -3698,6 +3766,8 @@ module Aws::SageMaker
3698
3766
 
3699
3767
  ClusterSchedulerConfigSummaryList.member = Shapes::ShapeRef.new(shape: ClusterSchedulerConfigSummary)
3700
3768
 
3769
+ ClusterSpotOptions.struct_class = Types::ClusterSpotOptions
3770
+
3701
3771
  ClusterSummaries.member = Shapes::ShapeRef.new(shape: ClusterSummary)
3702
3772
 
3703
3773
  ClusterSummary.add_member(:cluster_arn, Shapes::ShapeRef.new(shape: ClusterArn, required: true, location_name: "ClusterArn"))
@@ -4471,6 +4541,7 @@ module Aws::SageMaker
4471
4541
  CreateOptimizationJobRequest.add_member(:role_arn, Shapes::ShapeRef.new(shape: RoleArn, required: true, location_name: "RoleArn"))
4472
4542
  CreateOptimizationJobRequest.add_member(:model_source, Shapes::ShapeRef.new(shape: OptimizationJobModelSource, required: true, location_name: "ModelSource"))
4473
4543
  CreateOptimizationJobRequest.add_member(:deployment_instance_type, Shapes::ShapeRef.new(shape: OptimizationJobDeploymentInstanceType, required: true, location_name: "DeploymentInstanceType"))
4544
+ CreateOptimizationJobRequest.add_member(:max_instance_count, Shapes::ShapeRef.new(shape: OptimizationJobMaxInstanceCount, location_name: "MaxInstanceCount"))
4474
4545
  CreateOptimizationJobRequest.add_member(:optimization_environment, Shapes::ShapeRef.new(shape: OptimizationJobEnvironmentVariables, location_name: "OptimizationEnvironment"))
4475
4546
  CreateOptimizationJobRequest.add_member(:optimization_configs, Shapes::ShapeRef.new(shape: OptimizationConfigs, required: true, location_name: "OptimizationConfigs"))
4476
4547
  CreateOptimizationJobRequest.add_member(:output_config, Shapes::ShapeRef.new(shape: OptimizationJobOutputConfig, required: true, location_name: "OutputConfig"))
@@ -6071,6 +6142,7 @@ module Aws::SageMaker
6071
6142
  DescribeOptimizationJobResponse.add_member(:model_source, Shapes::ShapeRef.new(shape: OptimizationJobModelSource, required: true, location_name: "ModelSource"))
6072
6143
  DescribeOptimizationJobResponse.add_member(:optimization_environment, Shapes::ShapeRef.new(shape: OptimizationJobEnvironmentVariables, location_name: "OptimizationEnvironment"))
6073
6144
  DescribeOptimizationJobResponse.add_member(:deployment_instance_type, Shapes::ShapeRef.new(shape: OptimizationJobDeploymentInstanceType, required: true, location_name: "DeploymentInstanceType"))
6145
+ DescribeOptimizationJobResponse.add_member(:max_instance_count, Shapes::ShapeRef.new(shape: OptimizationJobMaxInstanceCount, location_name: "MaxInstanceCount"))
6074
6146
  DescribeOptimizationJobResponse.add_member(:optimization_configs, Shapes::ShapeRef.new(shape: OptimizationConfigs, required: true, location_name: "OptimizationConfigs"))
6075
6147
  DescribeOptimizationJobResponse.add_member(:output_config, Shapes::ShapeRef.new(shape: OptimizationJobOutputConfig, required: true, location_name: "OutputConfig"))
6076
6148
  DescribeOptimizationJobResponse.add_member(:optimization_output, Shapes::ShapeRef.new(shape: OptimizationOutput, location_name: "OptimizationOutput"))
@@ -7561,6 +7633,7 @@ module Aws::SageMaker
7561
7633
 
7562
7634
  InstanceGroupScalingMetadata.add_member(:instance_count, Shapes::ShapeRef.new(shape: InstanceCount, location_name: "InstanceCount"))
7563
7635
  InstanceGroupScalingMetadata.add_member(:target_count, Shapes::ShapeRef.new(shape: TargetCount, location_name: "TargetCount"))
7636
+ InstanceGroupScalingMetadata.add_member(:min_count, Shapes::ShapeRef.new(shape: InstanceCount, location_name: "MinCount"))
7564
7637
  InstanceGroupScalingMetadata.add_member(:failure_message, Shapes::ShapeRef.new(shape: String, location_name: "FailureMessage"))
7565
7638
  InstanceGroupScalingMetadata.struct_class = Types::InstanceGroupScalingMetadata
7566
7639
 
@@ -9319,6 +9392,14 @@ module Aws::SageMaker
9319
9392
  ModelShardingConfig.add_member(:override_environment, Shapes::ShapeRef.new(shape: OptimizationJobEnvironmentVariables, location_name: "OverrideEnvironment"))
9320
9393
  ModelShardingConfig.struct_class = Types::ModelShardingConfig
9321
9394
 
9395
+ ModelSpeculativeDecodingConfig.add_member(:technique, Shapes::ShapeRef.new(shape: ModelSpeculativeDecodingTechnique, required: true, location_name: "Technique"))
9396
+ ModelSpeculativeDecodingConfig.add_member(:training_data_source, Shapes::ShapeRef.new(shape: ModelSpeculativeDecodingTrainingDataSource, location_name: "TrainingDataSource"))
9397
+ ModelSpeculativeDecodingConfig.struct_class = Types::ModelSpeculativeDecodingConfig
9398
+
9399
+ ModelSpeculativeDecodingTrainingDataSource.add_member(:s3_uri, Shapes::ShapeRef.new(shape: S3Uri, required: true, location_name: "S3Uri"))
9400
+ ModelSpeculativeDecodingTrainingDataSource.add_member(:s3_data_type, Shapes::ShapeRef.new(shape: ModelSpeculativeDecodingS3DataType, required: true, location_name: "S3DataType"))
9401
+ ModelSpeculativeDecodingTrainingDataSource.struct_class = Types::ModelSpeculativeDecodingTrainingDataSource
9402
+
9322
9403
  ModelStepMetadata.add_member(:arn, Shapes::ShapeRef.new(shape: String256, location_name: "Arn"))
9323
9404
  ModelStepMetadata.struct_class = Types::ModelStepMetadata
9324
9405
 
@@ -9630,10 +9711,12 @@ module Aws::SageMaker
9630
9711
  OptimizationConfig.add_member(:model_quantization_config, Shapes::ShapeRef.new(shape: ModelQuantizationConfig, location_name: "ModelQuantizationConfig"))
9631
9712
  OptimizationConfig.add_member(:model_compilation_config, Shapes::ShapeRef.new(shape: ModelCompilationConfig, location_name: "ModelCompilationConfig"))
9632
9713
  OptimizationConfig.add_member(:model_sharding_config, Shapes::ShapeRef.new(shape: ModelShardingConfig, location_name: "ModelShardingConfig"))
9714
+ OptimizationConfig.add_member(:model_speculative_decoding_config, Shapes::ShapeRef.new(shape: ModelSpeculativeDecodingConfig, location_name: "ModelSpeculativeDecodingConfig"))
9633
9715
  OptimizationConfig.add_member(:unknown, Shapes::ShapeRef.new(shape: nil, location_name: 'unknown'))
9634
9716
  OptimizationConfig.add_member_subclass(:model_quantization_config, Types::OptimizationConfig::ModelQuantizationConfig)
9635
9717
  OptimizationConfig.add_member_subclass(:model_compilation_config, Types::OptimizationConfig::ModelCompilationConfig)
9636
9718
  OptimizationConfig.add_member_subclass(:model_sharding_config, Types::OptimizationConfig::ModelShardingConfig)
9719
+ OptimizationConfig.add_member_subclass(:model_speculative_decoding_config, Types::OptimizationConfig::ModelSpeculativeDecodingConfig)
9637
9720
  OptimizationConfig.add_member_subclass(:unknown, Types::OptimizationConfig::Unknown)
9638
9721
  OptimizationConfig.struct_class = Types::OptimizationConfig
9639
9722
 
@@ -9643,6 +9726,7 @@ module Aws::SageMaker
9643
9726
  OptimizationJobEnvironmentVariables.value = Shapes::ShapeRef.new(shape: String256)
9644
9727
 
9645
9728
  OptimizationJobModelSource.add_member(:s3, Shapes::ShapeRef.new(shape: OptimizationJobModelSourceS3, location_name: "S3"))
9729
+ OptimizationJobModelSource.add_member(:sage_maker_model, Shapes::ShapeRef.new(shape: OptimizationSageMakerModel, location_name: "SageMakerModel"))
9646
9730
  OptimizationJobModelSource.struct_class = Types::OptimizationJobModelSource
9647
9731
 
9648
9732
  OptimizationJobModelSourceS3.add_member(:s3_uri, Shapes::ShapeRef.new(shape: S3Uri, location_name: "S3Uri"))
@@ -9651,6 +9735,7 @@ module Aws::SageMaker
9651
9735
 
9652
9736
  OptimizationJobOutputConfig.add_member(:kms_key_id, Shapes::ShapeRef.new(shape: KmsKeyId, location_name: "KmsKeyId"))
9653
9737
  OptimizationJobOutputConfig.add_member(:s3_output_location, Shapes::ShapeRef.new(shape: S3Uri, required: true, location_name: "S3OutputLocation"))
9738
+ OptimizationJobOutputConfig.add_member(:sage_maker_model, Shapes::ShapeRef.new(shape: OptimizationSageMakerModel, location_name: "SageMakerModel"))
9654
9739
  OptimizationJobOutputConfig.struct_class = Types::OptimizationJobOutputConfig
9655
9740
 
9656
9741
  OptimizationJobSummaries.member = Shapes::ShapeRef.new(shape: OptimizationJobSummary)
@@ -9663,6 +9748,7 @@ module Aws::SageMaker
9663
9748
  OptimizationJobSummary.add_member(:optimization_end_time, Shapes::ShapeRef.new(shape: Timestamp, location_name: "OptimizationEndTime"))
9664
9749
  OptimizationJobSummary.add_member(:last_modified_time, Shapes::ShapeRef.new(shape: LastModifiedTime, location_name: "LastModifiedTime"))
9665
9750
  OptimizationJobSummary.add_member(:deployment_instance_type, Shapes::ShapeRef.new(shape: OptimizationJobDeploymentInstanceType, required: true, location_name: "DeploymentInstanceType"))
9751
+ OptimizationJobSummary.add_member(:max_instance_count, Shapes::ShapeRef.new(shape: OptimizationJobMaxInstanceCount, location_name: "MaxInstanceCount"))
9666
9752
  OptimizationJobSummary.add_member(:optimization_types, Shapes::ShapeRef.new(shape: OptimizationTypes, required: true, location_name: "OptimizationTypes"))
9667
9753
  OptimizationJobSummary.struct_class = Types::OptimizationJobSummary
9668
9754
 
@@ -9672,6 +9758,9 @@ module Aws::SageMaker
9672
9758
  OptimizationOutput.add_member(:recommended_inference_image, Shapes::ShapeRef.new(shape: OptimizationContainerImage, location_name: "RecommendedInferenceImage"))
9673
9759
  OptimizationOutput.struct_class = Types::OptimizationOutput
9674
9760
 
9761
+ OptimizationSageMakerModel.add_member(:model_name, Shapes::ShapeRef.new(shape: ModelName, location_name: "ModelName"))
9762
+ OptimizationSageMakerModel.struct_class = Types::OptimizationSageMakerModel
9763
+
9675
9764
  OptimizationTypes.member = Shapes::ShapeRef.new(shape: OptimizationType)
9676
9765
 
9677
9766
  OptimizationVpcConfig.add_member(:security_group_ids, Shapes::ShapeRef.new(shape: OptimizationVpcSecurityGroupIds, required: true, location_name: "SecurityGroupIds"))