aws-sdk-sagemaker 1.289.0 → 1.291.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA256:
3
- metadata.gz: 48bc7bf9cd437043fe6fd85e1e963bd4ec06a843845f3fd4120d6b753b6e1bd4
4
- data.tar.gz: 4d7b5e4cd2328b97a6432df94d0df560bac9ff1b170c565fc271eecc9d09e46d
3
+ metadata.gz: 89ca78842e4cb8cee6d80d8a8daf2c8b4dc0e47455067caecf7afd1ef6ffbd2e
4
+ data.tar.gz: dbbcf82690c0aba025bd9c60d7ca1dbe5855d544bb6b9b630f44daaad00a5ad0
5
5
  SHA512:
6
- metadata.gz: f278f70e08b0c47a077149c57586ee8288dca48fbf836a008b3960e304854bf6712e704db088fd4b594f0c60b449df1d483102bf94c676e5e221b8823874c2ff
7
- data.tar.gz: 9abe9a91d967cca566a9ea0fbc026ada3d9c393a2bc28c9c2f5f5c8fe8d074b97022fc41c2fad90f585b2409ef12ccde44a4ab82be2c61b84446e60489415885
6
+ metadata.gz: de74eb8d70134e088fc61dfdf423b080ca19e84ecec8e21f73788c7abb2c5663b61e43be64ef04f4747bdc5b5377852e97a4b4bf451912291d6de3441c1fb682
7
+ data.tar.gz: 989fb4e7701a4455905eab5850c7e18b44b0df00b57e1a771c4f21386e41d00e7198b00cedaf5ed50e470130e3918b9f58d286331b99a1ff1c822c80c0b67d4b
data/CHANGELOG.md CHANGED
@@ -1,6 +1,16 @@
1
1
  Unreleased Changes
2
2
  ------------------
3
3
 
4
+ 1.291.0 (2025-02-26)
5
+ ------------------
6
+
7
+ * Feature - AWS SageMaker InferenceComponents now support rolling update deployments.
8
+
9
+ 1.290.0 (2025-02-20)
10
+ ------------------
11
+
12
+ * Feature - Added new capability in the UpdateCluster operation to remove instance groups from your SageMaker HyperPod cluster.
13
+
4
14
  1.289.0 (2025-02-19)
5
15
  ------------------
6
16
 
data/VERSION CHANGED
@@ -1 +1 @@
1
- 1.289.0
1
+ 1.291.0
@@ -689,11 +689,19 @@ module Aws::SageMaker
689
689
  # @option params [required, Array<String>] :node_ids
690
690
  # A list of node IDs to be deleted from the specified cluster.
691
691
  #
692
- # <note markdown="1"> For SageMaker HyperPod clusters using the Slurm workload manager, you
693
- # cannot remove instances that are configured as Slurm controller nodes.
692
+ # <note markdown="1"> * For SageMaker HyperPod clusters using the Slurm workload manager,
693
+ # you cannot remove instances that are configured as Slurm controller
694
+ # nodes.
695
+ #
696
+ # * If you need to delete more than 99 instances, contact [Support][1]
697
+ # for assistance.
694
698
  #
695
699
  # </note>
696
700
  #
701
+ #
702
+ #
703
+ # [1]: http://aws.amazon.com/contact-us/
704
+ #
697
705
  # @return [Types::BatchDeleteClusterNodesResponse] Returns a {Seahorse::Client::Response response} object which responds to the following methods:
698
706
  #
699
707
  # * {Types::BatchDeleteClusterNodesResponse#failed #failed} => Array&lt;Types::BatchDeleteClusterNodesError&gt;
@@ -14977,6 +14985,7 @@ module Aws::SageMaker
14977
14985
  # * {Types::DescribeInferenceComponentOutput#creation_time #creation_time} => Time
14978
14986
  # * {Types::DescribeInferenceComponentOutput#last_modified_time #last_modified_time} => Time
14979
14987
  # * {Types::DescribeInferenceComponentOutput#inference_component_status #inference_component_status} => String
14988
+ # * {Types::DescribeInferenceComponentOutput#last_deployment_config #last_deployment_config} => Types::InferenceComponentDeploymentConfig
14980
14989
  #
14981
14990
  # @example Request syntax with placeholder values
14982
14991
  #
@@ -15011,6 +15020,14 @@ module Aws::SageMaker
15011
15020
  # resp.creation_time #=> Time
15012
15021
  # resp.last_modified_time #=> Time
15013
15022
  # resp.inference_component_status #=> String, one of "InService", "Creating", "Updating", "Failed", "Deleting"
15023
+ # resp.last_deployment_config.rolling_update_policy.maximum_batch_size.type #=> String, one of "COPY_COUNT", "CAPACITY_PERCENT"
15024
+ # resp.last_deployment_config.rolling_update_policy.maximum_batch_size.value #=> Integer
15025
+ # resp.last_deployment_config.rolling_update_policy.wait_interval_in_seconds #=> Integer
15026
+ # resp.last_deployment_config.rolling_update_policy.maximum_execution_timeout_in_seconds #=> Integer
15027
+ # resp.last_deployment_config.rolling_update_policy.rollback_maximum_batch_size.type #=> String, one of "COPY_COUNT", "CAPACITY_PERCENT"
15028
+ # resp.last_deployment_config.rolling_update_policy.rollback_maximum_batch_size.value #=> Integer
15029
+ # resp.last_deployment_config.auto_rollback_configuration.alarms #=> Array
15030
+ # resp.last_deployment_config.auto_rollback_configuration.alarms[0].alarm_name #=> String
15014
15031
  #
15015
15032
  # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/DescribeInferenceComponent AWS API Documentation
15016
15033
  #
@@ -26207,6 +26224,10 @@ module Aws::SageMaker
26207
26224
  # The node recovery mode to be applied to the SageMaker HyperPod
26208
26225
  # cluster.
26209
26226
  #
26227
+ # @option params [Array<String>] :instance_groups_to_delete
26228
+ # Specify the names of the instance groups to delete. Use a single `,`
26229
+ # as the separator between multiple names.
26230
+ #
26210
26231
  # @return [Types::UpdateClusterResponse] Returns a {Seahorse::Client::Response response} object which responds to the following methods:
26211
26232
  #
26212
26233
  # * {Types::UpdateClusterResponse#cluster_arn #cluster_arn} => String
@@ -26242,6 +26263,7 @@ module Aws::SageMaker
26242
26263
  # },
26243
26264
  # ],
26244
26265
  # node_recovery: "Automatic", # accepts Automatic, None
26266
+ # instance_groups_to_delete: ["ClusterInstanceGroupName"],
26245
26267
  # })
26246
26268
  #
26247
26269
  # @example Response structure
@@ -27532,6 +27554,11 @@ module Aws::SageMaker
27532
27554
  # Runtime settings for a model that is deployed with an inference
27533
27555
  # component.
27534
27556
  #
27557
+ # @option params [Types::InferenceComponentDeploymentConfig] :deployment_config
27558
+ # The deployment configuration for the inference component. The
27559
+ # configuration contains the desired deployment strategy and rollback
27560
+ # settings.
27561
+ #
27535
27562
  # @return [Types::UpdateInferenceComponentOutput] Returns a {Seahorse::Client::Response response} object which responds to the following methods:
27536
27563
  #
27537
27564
  # * {Types::UpdateInferenceComponentOutput#inference_component_arn #inference_component_arn} => String
@@ -27564,6 +27591,27 @@ module Aws::SageMaker
27564
27591
  # runtime_config: {
27565
27592
  # copy_count: 1, # required
27566
27593
  # },
27594
+ # deployment_config: {
27595
+ # rolling_update_policy: { # required
27596
+ # maximum_batch_size: { # required
27597
+ # type: "COPY_COUNT", # required, accepts COPY_COUNT, CAPACITY_PERCENT
27598
+ # value: 1, # required
27599
+ # },
27600
+ # wait_interval_in_seconds: 1, # required
27601
+ # maximum_execution_timeout_in_seconds: 1,
27602
+ # rollback_maximum_batch_size: {
27603
+ # type: "COPY_COUNT", # required, accepts COPY_COUNT, CAPACITY_PERCENT
27604
+ # value: 1, # required
27605
+ # },
27606
+ # },
27607
+ # auto_rollback_configuration: {
27608
+ # alarms: [
27609
+ # {
27610
+ # alarm_name: "AlarmName",
27611
+ # },
27612
+ # ],
27613
+ # },
27614
+ # },
27567
27615
  # })
27568
27616
  #
27569
27617
  # @example Response structure
@@ -29497,7 +29545,7 @@ module Aws::SageMaker
29497
29545
  tracer: tracer
29498
29546
  )
29499
29547
  context[:gem_name] = 'aws-sdk-sagemaker'
29500
- context[:gem_version] = '1.289.0'
29548
+ context[:gem_version] = '1.291.0'
29501
29549
  Seahorse::Client::Request.new(handlers, context)
29502
29550
  end
29503
29551
 
@@ -281,6 +281,7 @@ module Aws::SageMaker
281
281
  ClusterInstanceGroupName = Shapes::StringShape.new(name: 'ClusterInstanceGroupName')
282
282
  ClusterInstanceGroupSpecification = Shapes::StructureShape.new(name: 'ClusterInstanceGroupSpecification')
283
283
  ClusterInstanceGroupSpecifications = Shapes::ListShape.new(name: 'ClusterInstanceGroupSpecifications')
284
+ ClusterInstanceGroupsToDelete = Shapes::ListShape.new(name: 'ClusterInstanceGroupsToDelete')
284
285
  ClusterInstancePlacement = Shapes::StructureShape.new(name: 'ClusterInstancePlacement')
285
286
  ClusterInstanceStatus = Shapes::StringShape.new(name: 'ClusterInstanceStatus')
286
287
  ClusterInstanceStatusDetails = Shapes::StructureShape.new(name: 'ClusterInstanceStatusDetails')
@@ -1148,12 +1149,16 @@ module Aws::SageMaker
1148
1149
  ImportHubContentResponse = Shapes::StructureShape.new(name: 'ImportHubContentResponse')
1149
1150
  InUseInstanceCount = Shapes::IntegerShape.new(name: 'InUseInstanceCount')
1150
1151
  InferenceComponentArn = Shapes::StringShape.new(name: 'InferenceComponentArn')
1152
+ InferenceComponentCapacitySize = Shapes::StructureShape.new(name: 'InferenceComponentCapacitySize')
1153
+ InferenceComponentCapacitySizeType = Shapes::StringShape.new(name: 'InferenceComponentCapacitySizeType')
1151
1154
  InferenceComponentComputeResourceRequirements = Shapes::StructureShape.new(name: 'InferenceComponentComputeResourceRequirements')
1152
1155
  InferenceComponentContainerSpecification = Shapes::StructureShape.new(name: 'InferenceComponentContainerSpecification')
1153
1156
  InferenceComponentContainerSpecificationSummary = Shapes::StructureShape.new(name: 'InferenceComponentContainerSpecificationSummary')
1154
1157
  InferenceComponentCopyCount = Shapes::IntegerShape.new(name: 'InferenceComponentCopyCount')
1158
+ InferenceComponentDeploymentConfig = Shapes::StructureShape.new(name: 'InferenceComponentDeploymentConfig')
1155
1159
  InferenceComponentName = Shapes::StringShape.new(name: 'InferenceComponentName')
1156
1160
  InferenceComponentNameContains = Shapes::StringShape.new(name: 'InferenceComponentNameContains')
1161
+ InferenceComponentRollingUpdatePolicy = Shapes::StructureShape.new(name: 'InferenceComponentRollingUpdatePolicy')
1157
1162
  InferenceComponentRuntimeConfig = Shapes::StructureShape.new(name: 'InferenceComponentRuntimeConfig')
1158
1163
  InferenceComponentRuntimeConfigSummary = Shapes::StructureShape.new(name: 'InferenceComponentRuntimeConfigSummary')
1159
1164
  InferenceComponentSortKey = Shapes::StringShape.new(name: 'InferenceComponentSortKey')
@@ -3147,6 +3152,8 @@ module Aws::SageMaker
3147
3152
 
3148
3153
  ClusterInstanceGroupSpecifications.member = Shapes::ShapeRef.new(shape: ClusterInstanceGroupSpecification)
3149
3154
 
3155
+ ClusterInstanceGroupsToDelete.member = Shapes::ShapeRef.new(shape: ClusterInstanceGroupName)
3156
+
3150
3157
  ClusterInstancePlacement.add_member(:availability_zone, Shapes::ShapeRef.new(shape: ClusterAvailabilityZone, location_name: "AvailabilityZone"))
3151
3158
  ClusterInstancePlacement.add_member(:availability_zone_id, Shapes::ShapeRef.new(shape: ClusterAvailabilityZoneId, location_name: "AvailabilityZoneId"))
3152
3159
  ClusterInstancePlacement.struct_class = Types::ClusterInstancePlacement
@@ -5201,6 +5208,7 @@ module Aws::SageMaker
5201
5208
  DescribeInferenceComponentOutput.add_member(:creation_time, Shapes::ShapeRef.new(shape: Timestamp, required: true, location_name: "CreationTime"))
5202
5209
  DescribeInferenceComponentOutput.add_member(:last_modified_time, Shapes::ShapeRef.new(shape: Timestamp, required: true, location_name: "LastModifiedTime"))
5203
5210
  DescribeInferenceComponentOutput.add_member(:inference_component_status, Shapes::ShapeRef.new(shape: InferenceComponentStatus, location_name: "InferenceComponentStatus"))
5211
+ DescribeInferenceComponentOutput.add_member(:last_deployment_config, Shapes::ShapeRef.new(shape: InferenceComponentDeploymentConfig, location_name: "LastDeploymentConfig"))
5204
5212
  DescribeInferenceComponentOutput.struct_class = Types::DescribeInferenceComponentOutput
5205
5213
 
5206
5214
  DescribeInferenceExperimentRequest.add_member(:name, Shapes::ShapeRef.new(shape: InferenceExperimentName, required: true, location_name: "Name"))
@@ -6721,6 +6729,10 @@ module Aws::SageMaker
6721
6729
  ImportHubContentResponse.add_member(:hub_content_arn, Shapes::ShapeRef.new(shape: HubContentArn, required: true, location_name: "HubContentArn"))
6722
6730
  ImportHubContentResponse.struct_class = Types::ImportHubContentResponse
6723
6731
 
6732
+ InferenceComponentCapacitySize.add_member(:type, Shapes::ShapeRef.new(shape: InferenceComponentCapacitySizeType, required: true, location_name: "Type"))
6733
+ InferenceComponentCapacitySize.add_member(:value, Shapes::ShapeRef.new(shape: CapacitySizeValue, required: true, location_name: "Value"))
6734
+ InferenceComponentCapacitySize.struct_class = Types::InferenceComponentCapacitySize
6735
+
6724
6736
  InferenceComponentComputeResourceRequirements.add_member(:number_of_cpu_cores_required, Shapes::ShapeRef.new(shape: NumberOfCpuCores, location_name: "NumberOfCpuCoresRequired"))
6725
6737
  InferenceComponentComputeResourceRequirements.add_member(:number_of_accelerator_devices_required, Shapes::ShapeRef.new(shape: NumberOfAcceleratorDevices, location_name: "NumberOfAcceleratorDevicesRequired"))
6726
6738
  InferenceComponentComputeResourceRequirements.add_member(:min_memory_required_in_mb, Shapes::ShapeRef.new(shape: MemoryInMb, required: true, location_name: "MinMemoryRequiredInMb"))
@@ -6737,6 +6749,16 @@ module Aws::SageMaker
6737
6749
  InferenceComponentContainerSpecificationSummary.add_member(:environment, Shapes::ShapeRef.new(shape: EnvironmentMap, location_name: "Environment"))
6738
6750
  InferenceComponentContainerSpecificationSummary.struct_class = Types::InferenceComponentContainerSpecificationSummary
6739
6751
 
6752
+ InferenceComponentDeploymentConfig.add_member(:rolling_update_policy, Shapes::ShapeRef.new(shape: InferenceComponentRollingUpdatePolicy, required: true, location_name: "RollingUpdatePolicy"))
6753
+ InferenceComponentDeploymentConfig.add_member(:auto_rollback_configuration, Shapes::ShapeRef.new(shape: AutoRollbackConfig, location_name: "AutoRollbackConfiguration"))
6754
+ InferenceComponentDeploymentConfig.struct_class = Types::InferenceComponentDeploymentConfig
6755
+
6756
+ InferenceComponentRollingUpdatePolicy.add_member(:maximum_batch_size, Shapes::ShapeRef.new(shape: InferenceComponentCapacitySize, required: true, location_name: "MaximumBatchSize"))
6757
+ InferenceComponentRollingUpdatePolicy.add_member(:wait_interval_in_seconds, Shapes::ShapeRef.new(shape: WaitIntervalInSeconds, required: true, location_name: "WaitIntervalInSeconds"))
6758
+ InferenceComponentRollingUpdatePolicy.add_member(:maximum_execution_timeout_in_seconds, Shapes::ShapeRef.new(shape: MaximumExecutionTimeoutInSeconds, location_name: "MaximumExecutionTimeoutInSeconds"))
6759
+ InferenceComponentRollingUpdatePolicy.add_member(:rollback_maximum_batch_size, Shapes::ShapeRef.new(shape: InferenceComponentCapacitySize, location_name: "RollbackMaximumBatchSize"))
6760
+ InferenceComponentRollingUpdatePolicy.struct_class = Types::InferenceComponentRollingUpdatePolicy
6761
+
6740
6762
  InferenceComponentRuntimeConfig.add_member(:copy_count, Shapes::ShapeRef.new(shape: InferenceComponentCopyCount, required: true, location_name: "CopyCount"))
6741
6763
  InferenceComponentRuntimeConfig.struct_class = Types::InferenceComponentRuntimeConfig
6742
6764
 
@@ -10561,6 +10583,7 @@ module Aws::SageMaker
10561
10583
  UpdateClusterRequest.add_member(:cluster_name, Shapes::ShapeRef.new(shape: ClusterNameOrArn, required: true, location_name: "ClusterName"))
10562
10584
  UpdateClusterRequest.add_member(:instance_groups, Shapes::ShapeRef.new(shape: ClusterInstanceGroupSpecifications, required: true, location_name: "InstanceGroups"))
10563
10585
  UpdateClusterRequest.add_member(:node_recovery, Shapes::ShapeRef.new(shape: ClusterNodeRecovery, location_name: "NodeRecovery"))
10586
+ UpdateClusterRequest.add_member(:instance_groups_to_delete, Shapes::ShapeRef.new(shape: ClusterInstanceGroupsToDelete, location_name: "InstanceGroupsToDelete"))
10564
10587
  UpdateClusterRequest.struct_class = Types::UpdateClusterRequest
10565
10588
 
10566
10589
  UpdateClusterResponse.add_member(:cluster_arn, Shapes::ShapeRef.new(shape: ClusterArn, required: true, location_name: "ClusterArn"))
@@ -10715,6 +10738,7 @@ module Aws::SageMaker
10715
10738
  UpdateInferenceComponentInput.add_member(:inference_component_name, Shapes::ShapeRef.new(shape: InferenceComponentName, required: true, location_name: "InferenceComponentName"))
10716
10739
  UpdateInferenceComponentInput.add_member(:specification, Shapes::ShapeRef.new(shape: InferenceComponentSpecification, location_name: "Specification"))
10717
10740
  UpdateInferenceComponentInput.add_member(:runtime_config, Shapes::ShapeRef.new(shape: InferenceComponentRuntimeConfig, location_name: "RuntimeConfig"))
10741
+ UpdateInferenceComponentInput.add_member(:deployment_config, Shapes::ShapeRef.new(shape: InferenceComponentDeploymentConfig, location_name: "DeploymentConfig"))
10718
10742
  UpdateInferenceComponentInput.struct_class = Types::UpdateInferenceComponentInput
10719
10743
 
10720
10744
  UpdateInferenceComponentOutput.add_member(:inference_component_arn, Shapes::ShapeRef.new(shape: InferenceComponentArn, required: true, location_name: "InferenceComponentArn"))
@@ -2989,11 +2989,18 @@ module Aws::SageMaker
2989
2989
  # @!attribute [rw] node_ids
2990
2990
  # A list of node IDs to be deleted from the specified cluster.
2991
2991
  #
2992
- # <note markdown="1"> For SageMaker HyperPod clusters using the Slurm workload manager,
2993
- # you cannot remove instances that are configured as Slurm controller
2994
- # nodes.
2992
+ # <note markdown="1"> * For SageMaker HyperPod clusters using the Slurm workload manager,
2993
+ # you cannot remove instances that are configured as Slurm
2994
+ # controller nodes.
2995
+ #
2996
+ # * If you need to delete more than 99 instances, contact [Support][1]
2997
+ # for assistance.
2995
2998
  #
2996
2999
  # </note>
3000
+ #
3001
+ #
3002
+ #
3003
+ # [1]: http://aws.amazon.com/contact-us/
2997
3004
  # @return [Array<String>]
2998
3005
  #
2999
3006
  # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/BatchDeleteClusterNodesRequest AWS API Documentation
@@ -16028,6 +16035,11 @@ module Aws::SageMaker
16028
16035
  # The status of the inference component.
16029
16036
  # @return [String]
16030
16037
  #
16038
+ # @!attribute [rw] last_deployment_config
16039
+ # The deployment and rollback settings that you assigned to the
16040
+ # inference component.
16041
+ # @return [Types::InferenceComponentDeploymentConfig]
16042
+ #
16031
16043
  # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/DescribeInferenceComponentOutput AWS API Documentation
16032
16044
  #
16033
16045
  class DescribeInferenceComponentOutput < Struct.new(
@@ -16041,7 +16053,8 @@ module Aws::SageMaker
16041
16053
  :runtime_config,
16042
16054
  :creation_time,
16043
16055
  :last_modified_time,
16044
- :inference_component_status)
16056
+ :inference_component_status,
16057
+ :last_deployment_config)
16045
16058
  SENSITIVE = []
16046
16059
  include Aws::Structure
16047
16060
  end
@@ -21280,10 +21293,12 @@ module Aws::SageMaker
21280
21293
  end
21281
21294
 
21282
21295
  # The properties of an experiment as returned by the [Search][1] API.
21296
+ # For information about experiments, see the [CreateExperiment][2] API.
21283
21297
  #
21284
21298
  #
21285
21299
  #
21286
21300
  # [1]: https://docs.aws.amazon.com/sagemaker/latest/APIReference/API_Search.html
21301
+ # [2]: https://docs.aws.amazon.com/sagemaker/latest/APIReference/API_CreateExperiment.html
21287
21302
  #
21288
21303
  # @!attribute [rw] experiment_name
21289
21304
  # The name of the experiment.
@@ -25376,6 +25391,47 @@ module Aws::SageMaker
25376
25391
  include Aws::Structure
25377
25392
  end
25378
25393
 
25394
+ # Specifies the type and size of the endpoint capacity to activate for a
25395
+ # rolling deployment or a rollback strategy. You can specify your
25396
+ # batches as either of the following:
25397
+ #
25398
+ # * A count of inference component copies
25399
+ #
25400
+ # * The overall percentage of your fleet
25401
+ #
25402
+ # For a rollback strategy, if you don't specify the fields in this
25403
+ # object, or if you set the `Value` parameter to 100%, then SageMaker AI
25404
+ # uses a blue/green rollback strategy and rolls all traffic back to the
25405
+ # blue fleet.
25406
+ #
25407
+ # @!attribute [rw] type
25408
+ # Specifies the endpoint capacity type.
25409
+ #
25410
+ # COPY\_COUNT
25411
+ #
25412
+ # : The endpoint activates based on the number of inference component
25413
+ # copies.
25414
+ #
25415
+ # CAPACITY\_PERCENT
25416
+ #
25417
+ # : The endpoint activates based on the specified percentage of
25418
+ # capacity.
25419
+ # @return [String]
25420
+ #
25421
+ # @!attribute [rw] value
25422
+ # Defines the capacity size, either as a number of inference component
25423
+ # copies or a capacity percentage.
25424
+ # @return [Integer]
25425
+ #
25426
+ # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/InferenceComponentCapacitySize AWS API Documentation
25427
+ #
25428
+ class InferenceComponentCapacitySize < Struct.new(
25429
+ :type,
25430
+ :value)
25431
+ SENSITIVE = []
25432
+ include Aws::Structure
25433
+ end
25434
+
25379
25435
  # Defines the compute resources to allocate to run a model, plus any
25380
25436
  # adapter models, that you assign to an inference component. These
25381
25437
  # resources include CPU cores, accelerators, and memory.
@@ -25481,6 +25537,69 @@ module Aws::SageMaker
25481
25537
  include Aws::Structure
25482
25538
  end
25483
25539
 
25540
+ # The deployment configuration for an endpoint that hosts inference
25541
+ # components. The configuration includes the desired deployment strategy
25542
+ # and rollback settings.
25543
+ #
25544
+ # @!attribute [rw] rolling_update_policy
25545
+ # Specifies a rolling deployment strategy for updating a SageMaker AI
25546
+ # endpoint.
25547
+ # @return [Types::InferenceComponentRollingUpdatePolicy]
25548
+ #
25549
+ # @!attribute [rw] auto_rollback_configuration
25550
+ # Automatic rollback configuration for handling endpoint deployment
25551
+ # failures and recovery.
25552
+ # @return [Types::AutoRollbackConfig]
25553
+ #
25554
+ # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/InferenceComponentDeploymentConfig AWS API Documentation
25555
+ #
25556
+ class InferenceComponentDeploymentConfig < Struct.new(
25557
+ :rolling_update_policy,
25558
+ :auto_rollback_configuration)
25559
+ SENSITIVE = []
25560
+ include Aws::Structure
25561
+ end
25562
+
25563
+ # Specifies a rolling deployment strategy for updating a SageMaker AI
25564
+ # inference component.
25565
+ #
25566
+ # @!attribute [rw] maximum_batch_size
25567
+ # The batch size for each rolling step in the deployment process. For
25568
+ # each step, SageMaker AI provisions capacity on the new endpoint
25569
+ # fleet, routes traffic to that fleet, and terminates capacity on the
25570
+ # old endpoint fleet. The value must be between 5% and 50% of the copy
25571
+ # count of the inference component.
25572
+ # @return [Types::InferenceComponentCapacitySize]
25573
+ #
25574
+ # @!attribute [rw] wait_interval_in_seconds
25575
+ # The length of the baking period, during which SageMaker AI monitors
25576
+ # alarms for each batch on the new fleet.
25577
+ # @return [Integer]
25578
+ #
25579
+ # @!attribute [rw] maximum_execution_timeout_in_seconds
25580
+ # The time limit for the total deployment. Exceeding this limit causes
25581
+ # a timeout.
25582
+ # @return [Integer]
25583
+ #
25584
+ # @!attribute [rw] rollback_maximum_batch_size
25585
+ # The batch size for a rollback to the old endpoint fleet. If this
25586
+ # field is absent, the value is set to the default, which is 100% of
25587
+ # the total capacity. When the default is used, SageMaker AI
25588
+ # provisions the entire capacity of the old fleet at once during
25589
+ # rollback.
25590
+ # @return [Types::InferenceComponentCapacitySize]
25591
+ #
25592
+ # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/InferenceComponentRollingUpdatePolicy AWS API Documentation
25593
+ #
25594
+ class InferenceComponentRollingUpdatePolicy < Struct.new(
25595
+ :maximum_batch_size,
25596
+ :wait_interval_in_seconds,
25597
+ :maximum_execution_timeout_in_seconds,
25598
+ :rollback_maximum_batch_size)
25599
+ SENSITIVE = []
25600
+ include Aws::Structure
25601
+ end
25602
+
25484
25603
  # Runtime settings for a model that is deployed with an inference
25485
25604
  # component.
25486
25605
  #
@@ -34551,10 +34670,29 @@ module Aws::SageMaker
34551
34670
  include Aws::Structure
34552
34671
  end
34553
34672
 
34554
- # A versioned model that can be deployed for SageMaker inference.
34673
+ # A container for your trained model that can be deployed for SageMaker
34674
+ # inference. This can include inference code, artifacts, and metadata.
34675
+ # The model package type can be one of the following.
34676
+ #
34677
+ # * Versioned model: A part of a model package group in Model Registry.
34678
+ #
34679
+ # * Unversioned model: Not part of a model package group and used in
34680
+ # Amazon Web Services Marketplace.
34681
+ #
34682
+ # For more information, see [ `CreateModelPackage` ][1].
34683
+ #
34684
+ #
34685
+ #
34686
+ # [1]: https://docs.aws.amazon.com/sagemaker/latest/APIReference/API_CreateModelPackage.html
34555
34687
  #
34556
34688
  # @!attribute [rw] model_package_name
34557
- # The name of the model.
34689
+ # The name of the model package. The name can be as follows:
34690
+ #
34691
+ # * For a versioned model, the name is automatically generated by
34692
+ # SageMaker Model Registry and follows the format
34693
+ # '`ModelPackageGroupName/ModelPackageVersion`'.
34694
+ #
34695
+ # * For an unversioned model, you must provide the name.
34558
34696
  # @return [String]
34559
34697
  #
34560
34698
  # @!attribute [rw] model_package_group_name
@@ -34879,7 +35017,7 @@ module Aws::SageMaker
34879
35017
  include Aws::Structure
34880
35018
  end
34881
35019
 
34882
- # A group of versioned models in the model registry.
35020
+ # A group of versioned models in the Model Registry.
34883
35021
  #
34884
35022
  # @!attribute [rw] model_package_group_name
34885
35023
  # The name of the model group.
@@ -42316,11 +42454,25 @@ module Aws::SageMaker
42316
42454
  # @return [Types::Endpoint]
42317
42455
  #
42318
42456
  # @!attribute [rw] model_package
42319
- # A versioned model that can be deployed for SageMaker inference.
42457
+ # A container for your trained model that can be deployed for
42458
+ # SageMaker inference. This can include inference code, artifacts, and
42459
+ # metadata. The model package type can be one of the following.
42460
+ #
42461
+ # * Versioned model: A part of a model package group in Model
42462
+ # Registry.
42463
+ #
42464
+ # * Unversioned model: Not part of a model package group and used in
42465
+ # Amazon Web Services Marketplace.
42466
+ #
42467
+ # For more information, see [ `CreateModelPackage` ][1].
42468
+ #
42469
+ #
42470
+ #
42471
+ # [1]: https://docs.aws.amazon.com/sagemaker/latest/APIReference/API_CreateModelPackage.html
42320
42472
  # @return [Types::ModelPackage]
42321
42473
  #
42322
42474
  # @!attribute [rw] model_package_group
42323
- # A group of versioned models in the model registry.
42475
+ # A group of versioned models in the Model Registry.
42324
42476
  # @return [Types::ModelPackageGroup]
42325
42477
  #
42326
42478
  # @!attribute [rw] pipeline
@@ -47402,12 +47554,18 @@ module Aws::SageMaker
47402
47554
  # cluster.
47403
47555
  # @return [String]
47404
47556
  #
47557
+ # @!attribute [rw] instance_groups_to_delete
47558
+ # Specify the names of the instance groups to delete. Use a single `,`
47559
+ # as the separator between multiple names.
47560
+ # @return [Array<String>]
47561
+ #
47405
47562
  # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/UpdateClusterRequest AWS API Documentation
47406
47563
  #
47407
47564
  class UpdateClusterRequest < Struct.new(
47408
47565
  :cluster_name,
47409
47566
  :instance_groups,
47410
- :node_recovery)
47567
+ :node_recovery,
47568
+ :instance_groups_to_delete)
47411
47569
  SENSITIVE = []
47412
47570
  include Aws::Structure
47413
47571
  end
@@ -48187,12 +48345,19 @@ module Aws::SageMaker
48187
48345
  # component.
48188
48346
  # @return [Types::InferenceComponentRuntimeConfig]
48189
48347
  #
48348
+ # @!attribute [rw] deployment_config
48349
+ # The deployment configuration for the inference component. The
48350
+ # configuration contains the desired deployment strategy and rollback
48351
+ # settings.
48352
+ # @return [Types::InferenceComponentDeploymentConfig]
48353
+ #
48190
48354
  # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/UpdateInferenceComponentInput AWS API Documentation
48191
48355
  #
48192
48356
  class UpdateInferenceComponentInput < Struct.new(
48193
48357
  :inference_component_name,
48194
48358
  :specification,
48195
- :runtime_config)
48359
+ :runtime_config,
48360
+ :deployment_config)
48196
48361
  SENSITIVE = []
48197
48362
  include Aws::Structure
48198
48363
  end
@@ -55,7 +55,7 @@ module Aws::SageMaker
55
55
  autoload :EndpointProvider, 'aws-sdk-sagemaker/endpoint_provider'
56
56
  autoload :Endpoints, 'aws-sdk-sagemaker/endpoints'
57
57
 
58
- GEM_VERSION = '1.289.0'
58
+ GEM_VERSION = '1.291.0'
59
59
 
60
60
  end
61
61
 
data/sig/client.rbs CHANGED
@@ -5686,6 +5686,7 @@ module Aws
5686
5686
  def creation_time: () -> ::Time
5687
5687
  def last_modified_time: () -> ::Time
5688
5688
  def inference_component_status: () -> ("InService" | "Creating" | "Updating" | "Failed" | "Deleting")
5689
+ def last_deployment_config: () -> Types::InferenceComponentDeploymentConfig
5689
5690
  end
5690
5691
  # https://docs.aws.amazon.com/sdk-for-ruby/v3/api/Aws/SageMaker/Client.html#describe_inference_component-instance_method
5691
5692
  def describe_inference_component: (
@@ -8526,7 +8527,8 @@ module Aws
8526
8527
  }?
8527
8528
  },
8528
8529
  ],
8529
- ?node_recovery: ("Automatic" | "None")
8530
+ ?node_recovery: ("Automatic" | "None"),
8531
+ ?instance_groups_to_delete: Array[::String]
8530
8532
  ) -> _UpdateClusterResponseSuccess
8531
8533
  | (Hash[Symbol, untyped] params, ?Hash[Symbol, untyped] options) -> _UpdateClusterResponseSuccess
8532
8534
 
@@ -9191,6 +9193,27 @@ module Aws
9191
9193
  },
9192
9194
  ?runtime_config: {
9193
9195
  copy_count: ::Integer
9196
+ },
9197
+ ?deployment_config: {
9198
+ rolling_update_policy: {
9199
+ maximum_batch_size: {
9200
+ type: ("COPY_COUNT" | "CAPACITY_PERCENT"),
9201
+ value: ::Integer
9202
+ },
9203
+ wait_interval_in_seconds: ::Integer,
9204
+ maximum_execution_timeout_in_seconds: ::Integer?,
9205
+ rollback_maximum_batch_size: {
9206
+ type: ("COPY_COUNT" | "CAPACITY_PERCENT"),
9207
+ value: ::Integer
9208
+ }?
9209
+ },
9210
+ auto_rollback_configuration: {
9211
+ alarms: Array[
9212
+ {
9213
+ alarm_name: ::String?
9214
+ },
9215
+ ]?
9216
+ }?
9194
9217
  }
9195
9218
  ) -> _UpdateInferenceComponentResponseSuccess
9196
9219
  | (Hash[Symbol, untyped] params, ?Hash[Symbol, untyped] options) -> _UpdateInferenceComponentResponseSuccess
data/sig/types.rbs CHANGED
@@ -3394,6 +3394,7 @@ module Aws::SageMaker
3394
3394
  attr_accessor creation_time: ::Time
3395
3395
  attr_accessor last_modified_time: ::Time
3396
3396
  attr_accessor inference_component_status: ("InService" | "Creating" | "Updating" | "Failed" | "Deleting")
3397
+ attr_accessor last_deployment_config: Types::InferenceComponentDeploymentConfig
3397
3398
  SENSITIVE: []
3398
3399
  end
3399
3400
 
@@ -5174,6 +5175,12 @@ module Aws::SageMaker
5174
5175
  SENSITIVE: []
5175
5176
  end
5176
5177
 
5178
+ class InferenceComponentCapacitySize
5179
+ attr_accessor type: ("COPY_COUNT" | "CAPACITY_PERCENT")
5180
+ attr_accessor value: ::Integer
5181
+ SENSITIVE: []
5182
+ end
5183
+
5177
5184
  class InferenceComponentComputeResourceRequirements
5178
5185
  attr_accessor number_of_cpu_cores_required: ::Float
5179
5186
  attr_accessor number_of_accelerator_devices_required: ::Float
@@ -5196,6 +5203,20 @@ module Aws::SageMaker
5196
5203
  SENSITIVE: []
5197
5204
  end
5198
5205
 
5206
+ class InferenceComponentDeploymentConfig
5207
+ attr_accessor rolling_update_policy: Types::InferenceComponentRollingUpdatePolicy
5208
+ attr_accessor auto_rollback_configuration: Types::AutoRollbackConfig
5209
+ SENSITIVE: []
5210
+ end
5211
+
5212
+ class InferenceComponentRollingUpdatePolicy
5213
+ attr_accessor maximum_batch_size: Types::InferenceComponentCapacitySize
5214
+ attr_accessor wait_interval_in_seconds: ::Integer
5215
+ attr_accessor maximum_execution_timeout_in_seconds: ::Integer
5216
+ attr_accessor rollback_maximum_batch_size: Types::InferenceComponentCapacitySize
5217
+ SENSITIVE: []
5218
+ end
5219
+
5199
5220
  class InferenceComponentRuntimeConfig
5200
5221
  attr_accessor copy_count: ::Integer
5201
5222
  SENSITIVE: []
@@ -9869,6 +9890,7 @@ module Aws::SageMaker
9869
9890
  attr_accessor cluster_name: ::String
9870
9891
  attr_accessor instance_groups: ::Array[Types::ClusterInstanceGroupSpecification]
9871
9892
  attr_accessor node_recovery: ("Automatic" | "None")
9893
+ attr_accessor instance_groups_to_delete: ::Array[::String]
9872
9894
  SENSITIVE: []
9873
9895
  end
9874
9896
 
@@ -10085,6 +10107,7 @@ module Aws::SageMaker
10085
10107
  attr_accessor inference_component_name: ::String
10086
10108
  attr_accessor specification: Types::InferenceComponentSpecification
10087
10109
  attr_accessor runtime_config: Types::InferenceComponentRuntimeConfig
10110
+ attr_accessor deployment_config: Types::InferenceComponentDeploymentConfig
10088
10111
  SENSITIVE: []
10089
10112
  end
10090
10113
 
metadata CHANGED
@@ -1,14 +1,14 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: aws-sdk-sagemaker
3
3
  version: !ruby/object:Gem::Version
4
- version: 1.289.0
4
+ version: 1.291.0
5
5
  platform: ruby
6
6
  authors:
7
7
  - Amazon Web Services
8
8
  autorequire:
9
9
  bindir: bin
10
10
  cert_chain: []
11
- date: 2025-02-19 00:00:00.000000000 Z
11
+ date: 2025-02-26 00:00:00.000000000 Z
12
12
  dependencies:
13
13
  - !ruby/object:Gem::Dependency
14
14
  name: aws-sdk-core