aws-sdk-sagemaker 1.289.0 → 1.291.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/CHANGELOG.md +10 -0
- data/VERSION +1 -1
- data/lib/aws-sdk-sagemaker/client.rb +51 -3
- data/lib/aws-sdk-sagemaker/client_api.rb +24 -0
- data/lib/aws-sdk-sagemaker/types.rb +176 -11
- data/lib/aws-sdk-sagemaker.rb +1 -1
- data/sig/client.rbs +24 -1
- data/sig/types.rbs +23 -0
- metadata +2 -2
checksums.yaml
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
---
|
2
2
|
SHA256:
|
3
|
-
metadata.gz:
|
4
|
-
data.tar.gz:
|
3
|
+
metadata.gz: 89ca78842e4cb8cee6d80d8a8daf2c8b4dc0e47455067caecf7afd1ef6ffbd2e
|
4
|
+
data.tar.gz: dbbcf82690c0aba025bd9c60d7ca1dbe5855d544bb6b9b630f44daaad00a5ad0
|
5
5
|
SHA512:
|
6
|
-
metadata.gz:
|
7
|
-
data.tar.gz:
|
6
|
+
metadata.gz: de74eb8d70134e088fc61dfdf423b080ca19e84ecec8e21f73788c7abb2c5663b61e43be64ef04f4747bdc5b5377852e97a4b4bf451912291d6de3441c1fb682
|
7
|
+
data.tar.gz: 989fb4e7701a4455905eab5850c7e18b44b0df00b57e1a771c4f21386e41d00e7198b00cedaf5ed50e470130e3918b9f58d286331b99a1ff1c822c80c0b67d4b
|
data/CHANGELOG.md
CHANGED
@@ -1,6 +1,16 @@
|
|
1
1
|
Unreleased Changes
|
2
2
|
------------------
|
3
3
|
|
4
|
+
1.291.0 (2025-02-26)
|
5
|
+
------------------
|
6
|
+
|
7
|
+
* Feature - AWS SageMaker InferenceComponents now support rolling update deployments for Inference Components.
|
8
|
+
|
9
|
+
1.290.0 (2025-02-20)
|
10
|
+
------------------
|
11
|
+
|
12
|
+
* Feature - Added new capability in the UpdateCluster operation to remove instance groups from your SageMaker HyperPod cluster.
|
13
|
+
|
4
14
|
1.289.0 (2025-02-19)
|
5
15
|
------------------
|
6
16
|
|
data/VERSION
CHANGED
@@ -1 +1 @@
|
|
1
|
-
1.289.0
|
1
|
+
1.291.0
|
data/lib/aws-sdk-sagemaker/client.rb
CHANGED
@@ -689,11 +689,19 @@ module Aws::SageMaker
|
|
689
689
|
# @option params [required, Array<String>] :node_ids
|
690
690
|
# A list of node IDs to be deleted from the specified cluster.
|
691
691
|
#
|
692
|
-
# <note markdown="1"> For SageMaker HyperPod clusters using the Slurm workload manager,
|
693
|
-
#
|
692
|
+
# <note markdown="1"> * For SageMaker HyperPod clusters using the Slurm workload manager,
|
693
|
+
# you cannot remove instances that are configured as Slurm controller
|
694
|
+
# nodes.
|
695
|
+
#
|
696
|
+
# * If you need to delete more than 99 instances, contact [Support][1]
|
697
|
+
# for assistance.
|
694
698
|
#
|
695
699
|
# </note>
|
696
700
|
#
|
701
|
+
#
|
702
|
+
#
|
703
|
+
# [1]: http://aws.amazon.com/contact-us/
|
704
|
+
#
|
697
705
|
# @return [Types::BatchDeleteClusterNodesResponse] Returns a {Seahorse::Client::Response response} object which responds to the following methods:
|
698
706
|
#
|
699
707
|
# * {Types::BatchDeleteClusterNodesResponse#failed #failed} => Array<Types::BatchDeleteClusterNodesError>
|
@@ -14977,6 +14985,7 @@ module Aws::SageMaker
|
|
14977
14985
|
# * {Types::DescribeInferenceComponentOutput#creation_time #creation_time} => Time
|
14978
14986
|
# * {Types::DescribeInferenceComponentOutput#last_modified_time #last_modified_time} => Time
|
14979
14987
|
# * {Types::DescribeInferenceComponentOutput#inference_component_status #inference_component_status} => String
|
14988
|
+
# * {Types::DescribeInferenceComponentOutput#last_deployment_config #last_deployment_config} => Types::InferenceComponentDeploymentConfig
|
14980
14989
|
#
|
14981
14990
|
# @example Request syntax with placeholder values
|
14982
14991
|
#
|
@@ -15011,6 +15020,14 @@ module Aws::SageMaker
|
|
15011
15020
|
# resp.creation_time #=> Time
|
15012
15021
|
# resp.last_modified_time #=> Time
|
15013
15022
|
# resp.inference_component_status #=> String, one of "InService", "Creating", "Updating", "Failed", "Deleting"
|
15023
|
+
# resp.last_deployment_config.rolling_update_policy.maximum_batch_size.type #=> String, one of "COPY_COUNT", "CAPACITY_PERCENT"
|
15024
|
+
# resp.last_deployment_config.rolling_update_policy.maximum_batch_size.value #=> Integer
|
15025
|
+
# resp.last_deployment_config.rolling_update_policy.wait_interval_in_seconds #=> Integer
|
15026
|
+
# resp.last_deployment_config.rolling_update_policy.maximum_execution_timeout_in_seconds #=> Integer
|
15027
|
+
# resp.last_deployment_config.rolling_update_policy.rollback_maximum_batch_size.type #=> String, one of "COPY_COUNT", "CAPACITY_PERCENT"
|
15028
|
+
# resp.last_deployment_config.rolling_update_policy.rollback_maximum_batch_size.value #=> Integer
|
15029
|
+
# resp.last_deployment_config.auto_rollback_configuration.alarms #=> Array
|
15030
|
+
# resp.last_deployment_config.auto_rollback_configuration.alarms[0].alarm_name #=> String
|
15014
15031
|
#
|
15015
15032
|
# @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/DescribeInferenceComponent AWS API Documentation
|
15016
15033
|
#
|
@@ -26207,6 +26224,10 @@ module Aws::SageMaker
|
|
26207
26224
|
# The node recovery mode to be applied to the SageMaker HyperPod
|
26208
26225
|
# cluster.
|
26209
26226
|
#
|
26227
|
+
# @option params [Array<String>] :instance_groups_to_delete
|
26228
|
+
# Specify the names of the instance groups to delete. Use a single `,`
|
26229
|
+
# as the separator between multiple names.
|
26230
|
+
#
|
26210
26231
|
# @return [Types::UpdateClusterResponse] Returns a {Seahorse::Client::Response response} object which responds to the following methods:
|
26211
26232
|
#
|
26212
26233
|
# * {Types::UpdateClusterResponse#cluster_arn #cluster_arn} => String
|
@@ -26242,6 +26263,7 @@ module Aws::SageMaker
|
|
26242
26263
|
# },
|
26243
26264
|
# ],
|
26244
26265
|
# node_recovery: "Automatic", # accepts Automatic, None
|
26266
|
+
# instance_groups_to_delete: ["ClusterInstanceGroupName"],
|
26245
26267
|
# })
|
26246
26268
|
#
|
26247
26269
|
# @example Response structure
|
@@ -27532,6 +27554,11 @@ module Aws::SageMaker
|
|
27532
27554
|
# Runtime settings for a model that is deployed with an inference
|
27533
27555
|
# component.
|
27534
27556
|
#
|
27557
|
+
# @option params [Types::InferenceComponentDeploymentConfig] :deployment_config
|
27558
|
+
# The deployment configuration for the inference component. The
|
27559
|
+
# configuration contains the desired deployment strategy and rollback
|
27560
|
+
# settings.
|
27561
|
+
#
|
27535
27562
|
# @return [Types::UpdateInferenceComponentOutput] Returns a {Seahorse::Client::Response response} object which responds to the following methods:
|
27536
27563
|
#
|
27537
27564
|
# * {Types::UpdateInferenceComponentOutput#inference_component_arn #inference_component_arn} => String
|
@@ -27564,6 +27591,27 @@ module Aws::SageMaker
|
|
27564
27591
|
# runtime_config: {
|
27565
27592
|
# copy_count: 1, # required
|
27566
27593
|
# },
|
27594
|
+
# deployment_config: {
|
27595
|
+
# rolling_update_policy: { # required
|
27596
|
+
# maximum_batch_size: { # required
|
27597
|
+
# type: "COPY_COUNT", # required, accepts COPY_COUNT, CAPACITY_PERCENT
|
27598
|
+
# value: 1, # required
|
27599
|
+
# },
|
27600
|
+
# wait_interval_in_seconds: 1, # required
|
27601
|
+
# maximum_execution_timeout_in_seconds: 1,
|
27602
|
+
# rollback_maximum_batch_size: {
|
27603
|
+
# type: "COPY_COUNT", # required, accepts COPY_COUNT, CAPACITY_PERCENT
|
27604
|
+
# value: 1, # required
|
27605
|
+
# },
|
27606
|
+
# },
|
27607
|
+
# auto_rollback_configuration: {
|
27608
|
+
# alarms: [
|
27609
|
+
# {
|
27610
|
+
# alarm_name: "AlarmName",
|
27611
|
+
# },
|
27612
|
+
# ],
|
27613
|
+
# },
|
27614
|
+
# },
|
27567
27615
|
# })
|
27568
27616
|
#
|
27569
27617
|
# @example Response structure
|
@@ -29497,7 +29545,7 @@ module Aws::SageMaker
|
|
29497
29545
|
tracer: tracer
|
29498
29546
|
)
|
29499
29547
|
context[:gem_name] = 'aws-sdk-sagemaker'
|
29500
|
-
context[:gem_version] = '1.289.0'
|
29548
|
+
context[:gem_version] = '1.291.0'
|
29501
29549
|
Seahorse::Client::Request.new(handlers, context)
|
29502
29550
|
end
|
29503
29551
|
|
data/lib/aws-sdk-sagemaker/client_api.rb
CHANGED
@@ -281,6 +281,7 @@ module Aws::SageMaker
|
|
281
281
|
ClusterInstanceGroupName = Shapes::StringShape.new(name: 'ClusterInstanceGroupName')
|
282
282
|
ClusterInstanceGroupSpecification = Shapes::StructureShape.new(name: 'ClusterInstanceGroupSpecification')
|
283
283
|
ClusterInstanceGroupSpecifications = Shapes::ListShape.new(name: 'ClusterInstanceGroupSpecifications')
|
284
|
+
ClusterInstanceGroupsToDelete = Shapes::ListShape.new(name: 'ClusterInstanceGroupsToDelete')
|
284
285
|
ClusterInstancePlacement = Shapes::StructureShape.new(name: 'ClusterInstancePlacement')
|
285
286
|
ClusterInstanceStatus = Shapes::StringShape.new(name: 'ClusterInstanceStatus')
|
286
287
|
ClusterInstanceStatusDetails = Shapes::StructureShape.new(name: 'ClusterInstanceStatusDetails')
|
@@ -1148,12 +1149,16 @@ module Aws::SageMaker
|
|
1148
1149
|
ImportHubContentResponse = Shapes::StructureShape.new(name: 'ImportHubContentResponse')
|
1149
1150
|
InUseInstanceCount = Shapes::IntegerShape.new(name: 'InUseInstanceCount')
|
1150
1151
|
InferenceComponentArn = Shapes::StringShape.new(name: 'InferenceComponentArn')
|
1152
|
+
InferenceComponentCapacitySize = Shapes::StructureShape.new(name: 'InferenceComponentCapacitySize')
|
1153
|
+
InferenceComponentCapacitySizeType = Shapes::StringShape.new(name: 'InferenceComponentCapacitySizeType')
|
1151
1154
|
InferenceComponentComputeResourceRequirements = Shapes::StructureShape.new(name: 'InferenceComponentComputeResourceRequirements')
|
1152
1155
|
InferenceComponentContainerSpecification = Shapes::StructureShape.new(name: 'InferenceComponentContainerSpecification')
|
1153
1156
|
InferenceComponentContainerSpecificationSummary = Shapes::StructureShape.new(name: 'InferenceComponentContainerSpecificationSummary')
|
1154
1157
|
InferenceComponentCopyCount = Shapes::IntegerShape.new(name: 'InferenceComponentCopyCount')
|
1158
|
+
InferenceComponentDeploymentConfig = Shapes::StructureShape.new(name: 'InferenceComponentDeploymentConfig')
|
1155
1159
|
InferenceComponentName = Shapes::StringShape.new(name: 'InferenceComponentName')
|
1156
1160
|
InferenceComponentNameContains = Shapes::StringShape.new(name: 'InferenceComponentNameContains')
|
1161
|
+
InferenceComponentRollingUpdatePolicy = Shapes::StructureShape.new(name: 'InferenceComponentRollingUpdatePolicy')
|
1157
1162
|
InferenceComponentRuntimeConfig = Shapes::StructureShape.new(name: 'InferenceComponentRuntimeConfig')
|
1158
1163
|
InferenceComponentRuntimeConfigSummary = Shapes::StructureShape.new(name: 'InferenceComponentRuntimeConfigSummary')
|
1159
1164
|
InferenceComponentSortKey = Shapes::StringShape.new(name: 'InferenceComponentSortKey')
|
@@ -3147,6 +3152,8 @@ module Aws::SageMaker
|
|
3147
3152
|
|
3148
3153
|
ClusterInstanceGroupSpecifications.member = Shapes::ShapeRef.new(shape: ClusterInstanceGroupSpecification)
|
3149
3154
|
|
3155
|
+
ClusterInstanceGroupsToDelete.member = Shapes::ShapeRef.new(shape: ClusterInstanceGroupName)
|
3156
|
+
|
3150
3157
|
ClusterInstancePlacement.add_member(:availability_zone, Shapes::ShapeRef.new(shape: ClusterAvailabilityZone, location_name: "AvailabilityZone"))
|
3151
3158
|
ClusterInstancePlacement.add_member(:availability_zone_id, Shapes::ShapeRef.new(shape: ClusterAvailabilityZoneId, location_name: "AvailabilityZoneId"))
|
3152
3159
|
ClusterInstancePlacement.struct_class = Types::ClusterInstancePlacement
|
@@ -5201,6 +5208,7 @@ module Aws::SageMaker
|
|
5201
5208
|
DescribeInferenceComponentOutput.add_member(:creation_time, Shapes::ShapeRef.new(shape: Timestamp, required: true, location_name: "CreationTime"))
|
5202
5209
|
DescribeInferenceComponentOutput.add_member(:last_modified_time, Shapes::ShapeRef.new(shape: Timestamp, required: true, location_name: "LastModifiedTime"))
|
5203
5210
|
DescribeInferenceComponentOutput.add_member(:inference_component_status, Shapes::ShapeRef.new(shape: InferenceComponentStatus, location_name: "InferenceComponentStatus"))
|
5211
|
+
DescribeInferenceComponentOutput.add_member(:last_deployment_config, Shapes::ShapeRef.new(shape: InferenceComponentDeploymentConfig, location_name: "LastDeploymentConfig"))
|
5204
5212
|
DescribeInferenceComponentOutput.struct_class = Types::DescribeInferenceComponentOutput
|
5205
5213
|
|
5206
5214
|
DescribeInferenceExperimentRequest.add_member(:name, Shapes::ShapeRef.new(shape: InferenceExperimentName, required: true, location_name: "Name"))
|
@@ -6721,6 +6729,10 @@ module Aws::SageMaker
|
|
6721
6729
|
ImportHubContentResponse.add_member(:hub_content_arn, Shapes::ShapeRef.new(shape: HubContentArn, required: true, location_name: "HubContentArn"))
|
6722
6730
|
ImportHubContentResponse.struct_class = Types::ImportHubContentResponse
|
6723
6731
|
|
6732
|
+
InferenceComponentCapacitySize.add_member(:type, Shapes::ShapeRef.new(shape: InferenceComponentCapacitySizeType, required: true, location_name: "Type"))
|
6733
|
+
InferenceComponentCapacitySize.add_member(:value, Shapes::ShapeRef.new(shape: CapacitySizeValue, required: true, location_name: "Value"))
|
6734
|
+
InferenceComponentCapacitySize.struct_class = Types::InferenceComponentCapacitySize
|
6735
|
+
|
6724
6736
|
InferenceComponentComputeResourceRequirements.add_member(:number_of_cpu_cores_required, Shapes::ShapeRef.new(shape: NumberOfCpuCores, location_name: "NumberOfCpuCoresRequired"))
|
6725
6737
|
InferenceComponentComputeResourceRequirements.add_member(:number_of_accelerator_devices_required, Shapes::ShapeRef.new(shape: NumberOfAcceleratorDevices, location_name: "NumberOfAcceleratorDevicesRequired"))
|
6726
6738
|
InferenceComponentComputeResourceRequirements.add_member(:min_memory_required_in_mb, Shapes::ShapeRef.new(shape: MemoryInMb, required: true, location_name: "MinMemoryRequiredInMb"))
|
@@ -6737,6 +6749,16 @@ module Aws::SageMaker
|
|
6737
6749
|
InferenceComponentContainerSpecificationSummary.add_member(:environment, Shapes::ShapeRef.new(shape: EnvironmentMap, location_name: "Environment"))
|
6738
6750
|
InferenceComponentContainerSpecificationSummary.struct_class = Types::InferenceComponentContainerSpecificationSummary
|
6739
6751
|
|
6752
|
+
InferenceComponentDeploymentConfig.add_member(:rolling_update_policy, Shapes::ShapeRef.new(shape: InferenceComponentRollingUpdatePolicy, required: true, location_name: "RollingUpdatePolicy"))
|
6753
|
+
InferenceComponentDeploymentConfig.add_member(:auto_rollback_configuration, Shapes::ShapeRef.new(shape: AutoRollbackConfig, location_name: "AutoRollbackConfiguration"))
|
6754
|
+
InferenceComponentDeploymentConfig.struct_class = Types::InferenceComponentDeploymentConfig
|
6755
|
+
|
6756
|
+
InferenceComponentRollingUpdatePolicy.add_member(:maximum_batch_size, Shapes::ShapeRef.new(shape: InferenceComponentCapacitySize, required: true, location_name: "MaximumBatchSize"))
|
6757
|
+
InferenceComponentRollingUpdatePolicy.add_member(:wait_interval_in_seconds, Shapes::ShapeRef.new(shape: WaitIntervalInSeconds, required: true, location_name: "WaitIntervalInSeconds"))
|
6758
|
+
InferenceComponentRollingUpdatePolicy.add_member(:maximum_execution_timeout_in_seconds, Shapes::ShapeRef.new(shape: MaximumExecutionTimeoutInSeconds, location_name: "MaximumExecutionTimeoutInSeconds"))
|
6759
|
+
InferenceComponentRollingUpdatePolicy.add_member(:rollback_maximum_batch_size, Shapes::ShapeRef.new(shape: InferenceComponentCapacitySize, location_name: "RollbackMaximumBatchSize"))
|
6760
|
+
InferenceComponentRollingUpdatePolicy.struct_class = Types::InferenceComponentRollingUpdatePolicy
|
6761
|
+
|
6740
6762
|
InferenceComponentRuntimeConfig.add_member(:copy_count, Shapes::ShapeRef.new(shape: InferenceComponentCopyCount, required: true, location_name: "CopyCount"))
|
6741
6763
|
InferenceComponentRuntimeConfig.struct_class = Types::InferenceComponentRuntimeConfig
|
6742
6764
|
|
@@ -10561,6 +10583,7 @@ module Aws::SageMaker
|
|
10561
10583
|
UpdateClusterRequest.add_member(:cluster_name, Shapes::ShapeRef.new(shape: ClusterNameOrArn, required: true, location_name: "ClusterName"))
|
10562
10584
|
UpdateClusterRequest.add_member(:instance_groups, Shapes::ShapeRef.new(shape: ClusterInstanceGroupSpecifications, required: true, location_name: "InstanceGroups"))
|
10563
10585
|
UpdateClusterRequest.add_member(:node_recovery, Shapes::ShapeRef.new(shape: ClusterNodeRecovery, location_name: "NodeRecovery"))
|
10586
|
+
UpdateClusterRequest.add_member(:instance_groups_to_delete, Shapes::ShapeRef.new(shape: ClusterInstanceGroupsToDelete, location_name: "InstanceGroupsToDelete"))
|
10564
10587
|
UpdateClusterRequest.struct_class = Types::UpdateClusterRequest
|
10565
10588
|
|
10566
10589
|
UpdateClusterResponse.add_member(:cluster_arn, Shapes::ShapeRef.new(shape: ClusterArn, required: true, location_name: "ClusterArn"))
|
@@ -10715,6 +10738,7 @@ module Aws::SageMaker
|
|
10715
10738
|
UpdateInferenceComponentInput.add_member(:inference_component_name, Shapes::ShapeRef.new(shape: InferenceComponentName, required: true, location_name: "InferenceComponentName"))
|
10716
10739
|
UpdateInferenceComponentInput.add_member(:specification, Shapes::ShapeRef.new(shape: InferenceComponentSpecification, location_name: "Specification"))
|
10717
10740
|
UpdateInferenceComponentInput.add_member(:runtime_config, Shapes::ShapeRef.new(shape: InferenceComponentRuntimeConfig, location_name: "RuntimeConfig"))
|
10741
|
+
UpdateInferenceComponentInput.add_member(:deployment_config, Shapes::ShapeRef.new(shape: InferenceComponentDeploymentConfig, location_name: "DeploymentConfig"))
|
10718
10742
|
UpdateInferenceComponentInput.struct_class = Types::UpdateInferenceComponentInput
|
10719
10743
|
|
10720
10744
|
UpdateInferenceComponentOutput.add_member(:inference_component_arn, Shapes::ShapeRef.new(shape: InferenceComponentArn, required: true, location_name: "InferenceComponentArn"))
|
data/lib/aws-sdk-sagemaker/types.rb
CHANGED
@@ -2989,11 +2989,18 @@ module Aws::SageMaker
|
|
2989
2989
|
# @!attribute [rw] node_ids
|
2990
2990
|
# A list of node IDs to be deleted from the specified cluster.
|
2991
2991
|
#
|
2992
|
-
# <note markdown="1"> For SageMaker HyperPod clusters using the Slurm workload manager,
|
2993
|
-
#
|
2994
|
-
#
|
2992
|
+
# <note markdown="1"> * For SageMaker HyperPod clusters using the Slurm workload manager,
|
2993
|
+
# you cannot remove instances that are configured as Slurm
|
2994
|
+
# controller nodes.
|
2995
|
+
#
|
2996
|
+
# * If you need to delete more than 99 instances, contact [Support][1]
|
2997
|
+
# for assistance.
|
2995
2998
|
#
|
2996
2999
|
# </note>
|
3000
|
+
#
|
3001
|
+
#
|
3002
|
+
#
|
3003
|
+
# [1]: http://aws.amazon.com/contact-us/
|
2997
3004
|
# @return [Array<String>]
|
2998
3005
|
#
|
2999
3006
|
# @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/BatchDeleteClusterNodesRequest AWS API Documentation
|
@@ -16028,6 +16035,11 @@ module Aws::SageMaker
|
|
16028
16035
|
# The status of the inference component.
|
16029
16036
|
# @return [String]
|
16030
16037
|
#
|
16038
|
+
# @!attribute [rw] last_deployment_config
|
16039
|
+
# The deployment and rollback settings that you assigned to the
|
16040
|
+
# inference component.
|
16041
|
+
# @return [Types::InferenceComponentDeploymentConfig]
|
16042
|
+
#
|
16031
16043
|
# @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/DescribeInferenceComponentOutput AWS API Documentation
|
16032
16044
|
#
|
16033
16045
|
class DescribeInferenceComponentOutput < Struct.new(
|
@@ -16041,7 +16053,8 @@ module Aws::SageMaker
|
|
16041
16053
|
:runtime_config,
|
16042
16054
|
:creation_time,
|
16043
16055
|
:last_modified_time,
|
16044
|
-
:inference_component_status
|
16056
|
+
:inference_component_status,
|
16057
|
+
:last_deployment_config)
|
16045
16058
|
SENSITIVE = []
|
16046
16059
|
include Aws::Structure
|
16047
16060
|
end
|
@@ -21280,10 +21293,12 @@ module Aws::SageMaker
|
|
21280
21293
|
end
|
21281
21294
|
|
21282
21295
|
# The properties of an experiment as returned by the [Search][1] API.
|
21296
|
+
# For information about experiments, see the [CreateExperiment][2] API.
|
21283
21297
|
#
|
21284
21298
|
#
|
21285
21299
|
#
|
21286
21300
|
# [1]: https://docs.aws.amazon.com/sagemaker/latest/APIReference/API_Search.html
|
21301
|
+
# [2]: https://docs.aws.amazon.com/sagemaker/latest/APIReference/API_CreateExperiment.html
|
21287
21302
|
#
|
21288
21303
|
# @!attribute [rw] experiment_name
|
21289
21304
|
# The name of the experiment.
|
@@ -25376,6 +25391,47 @@ module Aws::SageMaker
|
|
25376
25391
|
include Aws::Structure
|
25377
25392
|
end
|
25378
25393
|
|
25394
|
+
# Specifies the type and size of the endpoint capacity to activate for a
|
25395
|
+
# rolling deployment or a rollback strategy. You can specify your
|
25396
|
+
# batches as either of the following:
|
25397
|
+
#
|
25398
|
+
# * A count of inference component copies
|
25399
|
+
#
|
25400
|
+
# * The overall percentage of your fleet
|
25401
|
+
#
|
25402
|
+
# For a rollback strategy, if you don't specify the fields in this
|
25403
|
+
# object, or if you set the `Value` parameter to 100%, then SageMaker AI
|
25404
|
+
# uses a blue/green rollback strategy and rolls all traffic back to the
|
25405
|
+
# blue fleet.
|
25406
|
+
#
|
25407
|
+
# @!attribute [rw] type
|
25408
|
+
# Specifies the endpoint capacity type.
|
25409
|
+
#
|
25410
|
+
# COPY\_COUNT
|
25411
|
+
#
|
25412
|
+
# : The endpoint activates based on the number of inference component
|
25413
|
+
# copies.
|
25414
|
+
#
|
25415
|
+
# CAPACITY\_PERCENT
|
25416
|
+
#
|
25417
|
+
# : The endpoint activates based on the specified percentage of
|
25418
|
+
# capacity.
|
25419
|
+
# @return [String]
|
25420
|
+
#
|
25421
|
+
# @!attribute [rw] value
|
25422
|
+
# Defines the capacity size, either as a number of inference component
|
25423
|
+
# copies or a capacity percentage.
|
25424
|
+
# @return [Integer]
|
25425
|
+
#
|
25426
|
+
# @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/InferenceComponentCapacitySize AWS API Documentation
|
25427
|
+
#
|
25428
|
+
class InferenceComponentCapacitySize < Struct.new(
|
25429
|
+
:type,
|
25430
|
+
:value)
|
25431
|
+
SENSITIVE = []
|
25432
|
+
include Aws::Structure
|
25433
|
+
end
|
25434
|
+
|
25379
25435
|
# Defines the compute resources to allocate to run a model, plus any
|
25380
25436
|
# adapter models, that you assign to an inference component. These
|
25381
25437
|
# resources include CPU cores, accelerators, and memory.
|
@@ -25481,6 +25537,69 @@ module Aws::SageMaker
|
|
25481
25537
|
include Aws::Structure
|
25482
25538
|
end
|
25483
25539
|
|
25540
|
+
# The deployment configuration for an endpoint that hosts inference
|
25541
|
+
# components. The configuration includes the desired deployment strategy
|
25542
|
+
# and rollback settings.
|
25543
|
+
#
|
25544
|
+
# @!attribute [rw] rolling_update_policy
|
25545
|
+
# Specifies a rolling deployment strategy for updating a SageMaker AI
|
25546
|
+
# endpoint.
|
25547
|
+
# @return [Types::InferenceComponentRollingUpdatePolicy]
|
25548
|
+
#
|
25549
|
+
# @!attribute [rw] auto_rollback_configuration
|
25550
|
+
# Automatic rollback configuration for handling endpoint deployment
|
25551
|
+
# failures and recovery.
|
25552
|
+
# @return [Types::AutoRollbackConfig]
|
25553
|
+
#
|
25554
|
+
# @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/InferenceComponentDeploymentConfig AWS API Documentation
|
25555
|
+
#
|
25556
|
+
class InferenceComponentDeploymentConfig < Struct.new(
|
25557
|
+
:rolling_update_policy,
|
25558
|
+
:auto_rollback_configuration)
|
25559
|
+
SENSITIVE = []
|
25560
|
+
include Aws::Structure
|
25561
|
+
end
|
25562
|
+
|
25563
|
+
# Specifies a rolling deployment strategy for updating a SageMaker AI
|
25564
|
+
# inference component.
|
25565
|
+
#
|
25566
|
+
# @!attribute [rw] maximum_batch_size
|
25567
|
+
# The batch size for each rolling step in the deployment process. For
|
25568
|
+
# each step, SageMaker AI provisions capacity on the new endpoint
|
25569
|
+
# fleet, routes traffic to that fleet, and terminates capacity on the
|
25570
|
+
# old endpoint fleet. The value must be between 5% and 50% of the copy
|
25571
|
+
# count of the inference component.
|
25572
|
+
# @return [Types::InferenceComponentCapacitySize]
|
25573
|
+
#
|
25574
|
+
# @!attribute [rw] wait_interval_in_seconds
|
25575
|
+
# The length of the baking period, during which SageMaker AI monitors
|
25576
|
+
# alarms for each batch on the new fleet.
|
25577
|
+
# @return [Integer]
|
25578
|
+
#
|
25579
|
+
# @!attribute [rw] maximum_execution_timeout_in_seconds
|
25580
|
+
# The time limit for the total deployment. Exceeding this limit causes
|
25581
|
+
# a timeout.
|
25582
|
+
# @return [Integer]
|
25583
|
+
#
|
25584
|
+
# @!attribute [rw] rollback_maximum_batch_size
|
25585
|
+
# The batch size for a rollback to the old endpoint fleet. If this
|
25586
|
+
# field is absent, the value is set to the default, which is 100% of
|
25587
|
+
# the total capacity. When the default is used, SageMaker AI
|
25588
|
+
# provisions the entire capacity of the old fleet at once during
|
25589
|
+
# rollback.
|
25590
|
+
# @return [Types::InferenceComponentCapacitySize]
|
25591
|
+
#
|
25592
|
+
# @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/InferenceComponentRollingUpdatePolicy AWS API Documentation
|
25593
|
+
#
|
25594
|
+
class InferenceComponentRollingUpdatePolicy < Struct.new(
|
25595
|
+
:maximum_batch_size,
|
25596
|
+
:wait_interval_in_seconds,
|
25597
|
+
:maximum_execution_timeout_in_seconds,
|
25598
|
+
:rollback_maximum_batch_size)
|
25599
|
+
SENSITIVE = []
|
25600
|
+
include Aws::Structure
|
25601
|
+
end
|
25602
|
+
|
25484
25603
|
# Runtime settings for a model that is deployed with an inference
|
25485
25604
|
# component.
|
25486
25605
|
#
|
@@ -34551,10 +34670,29 @@ module Aws::SageMaker
|
|
34551
34670
|
include Aws::Structure
|
34552
34671
|
end
|
34553
34672
|
|
34554
|
-
# A
|
34673
|
+
# A container for your trained model that can be deployed for SageMaker
|
34674
|
+
# inference. This can include inference code, artifacts, and metadata.
|
34675
|
+
# The model package type can be one of the following.
|
34676
|
+
#
|
34677
|
+
# * Versioned model: A part of a model package group in Model Registry.
|
34678
|
+
#
|
34679
|
+
# * Unversioned model: Not part of a model package group and used in
|
34680
|
+
# Amazon Web Services Marketplace.
|
34681
|
+
#
|
34682
|
+
# For more information, see [ `CreateModelPackage` ][1].
|
34683
|
+
#
|
34684
|
+
#
|
34685
|
+
#
|
34686
|
+
# [1]: https://docs.aws.amazon.com/sagemaker/latest/APIReference/API_CreateModelPackage.html
|
34555
34687
|
#
|
34556
34688
|
# @!attribute [rw] model_package_name
|
34557
|
-
# The name of the model.
|
34689
|
+
# The name of the model package. The name can be as follows:
|
34690
|
+
#
|
34691
|
+
# * For a versioned model, the name is automatically generated by
|
34692
|
+
# SageMaker Model Registry and follows the format
|
34693
|
+
# '`ModelPackageGroupName/ModelPackageVersion`'.
|
34694
|
+
#
|
34695
|
+
# * For an unversioned model, you must provide the name.
|
34558
34696
|
# @return [String]
|
34559
34697
|
#
|
34560
34698
|
# @!attribute [rw] model_package_group_name
|
@@ -34879,7 +35017,7 @@ module Aws::SageMaker
|
|
34879
35017
|
include Aws::Structure
|
34880
35018
|
end
|
34881
35019
|
|
34882
|
-
# A group of versioned models in the
|
35020
|
+
# A group of versioned models in the Model Registry.
|
34883
35021
|
#
|
34884
35022
|
# @!attribute [rw] model_package_group_name
|
34885
35023
|
# The name of the model group.
|
@@ -42316,11 +42454,25 @@ module Aws::SageMaker
|
|
42316
42454
|
# @return [Types::Endpoint]
|
42317
42455
|
#
|
42318
42456
|
# @!attribute [rw] model_package
|
42319
|
-
# A
|
42457
|
+
# A container for your trained model that can be deployed for
|
42458
|
+
# SageMaker inference. This can include inference code, artifacts, and
|
42459
|
+
# metadata. The model package type can be one of the following.
|
42460
|
+
#
|
42461
|
+
# * Versioned model: A part of a model package group in Model
|
42462
|
+
# Registry.
|
42463
|
+
#
|
42464
|
+
# * Unversioned model: Not part of a model package group and used in
|
42465
|
+
# Amazon Web Services Marketplace.
|
42466
|
+
#
|
42467
|
+
# For more information, see [ `CreateModelPackage` ][1].
|
42468
|
+
#
|
42469
|
+
#
|
42470
|
+
#
|
42471
|
+
# [1]: https://docs.aws.amazon.com/sagemaker/latest/APIReference/API_CreateModelPackage.html
|
42320
42472
|
# @return [Types::ModelPackage]
|
42321
42473
|
#
|
42322
42474
|
# @!attribute [rw] model_package_group
|
42323
|
-
# A group of versioned models in the
|
42475
|
+
# A group of versioned models in the Model Registry.
|
42324
42476
|
# @return [Types::ModelPackageGroup]
|
42325
42477
|
#
|
42326
42478
|
# @!attribute [rw] pipeline
|
@@ -47402,12 +47554,18 @@ module Aws::SageMaker
|
|
47402
47554
|
# cluster.
|
47403
47555
|
# @return [String]
|
47404
47556
|
#
|
47557
|
+
# @!attribute [rw] instance_groups_to_delete
|
47558
|
+
# Specify the names of the instance groups to delete. Use a single `,`
|
47559
|
+
# as the separator between multiple names.
|
47560
|
+
# @return [Array<String>]
|
47561
|
+
#
|
47405
47562
|
# @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/UpdateClusterRequest AWS API Documentation
|
47406
47563
|
#
|
47407
47564
|
class UpdateClusterRequest < Struct.new(
|
47408
47565
|
:cluster_name,
|
47409
47566
|
:instance_groups,
|
47410
|
-
:node_recovery
|
47567
|
+
:node_recovery,
|
47568
|
+
:instance_groups_to_delete)
|
47411
47569
|
SENSITIVE = []
|
47412
47570
|
include Aws::Structure
|
47413
47571
|
end
|
@@ -48187,12 +48345,19 @@ module Aws::SageMaker
|
|
48187
48345
|
# component.
|
48188
48346
|
# @return [Types::InferenceComponentRuntimeConfig]
|
48189
48347
|
#
|
48348
|
+
# @!attribute [rw] deployment_config
|
48349
|
+
# The deployment configuration for the inference component. The
|
48350
|
+
# configuration contains the desired deployment strategy and rollback
|
48351
|
+
# settings.
|
48352
|
+
# @return [Types::InferenceComponentDeploymentConfig]
|
48353
|
+
#
|
48190
48354
|
# @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/UpdateInferenceComponentInput AWS API Documentation
|
48191
48355
|
#
|
48192
48356
|
class UpdateInferenceComponentInput < Struct.new(
|
48193
48357
|
:inference_component_name,
|
48194
48358
|
:specification,
|
48195
|
-
:runtime_config
|
48359
|
+
:runtime_config,
|
48360
|
+
:deployment_config)
|
48196
48361
|
SENSITIVE = []
|
48197
48362
|
include Aws::Structure
|
48198
48363
|
end
|
data/lib/aws-sdk-sagemaker.rb
CHANGED
data/sig/client.rbs
CHANGED
@@ -5686,6 +5686,7 @@ module Aws
|
|
5686
5686
|
def creation_time: () -> ::Time
|
5687
5687
|
def last_modified_time: () -> ::Time
|
5688
5688
|
def inference_component_status: () -> ("InService" | "Creating" | "Updating" | "Failed" | "Deleting")
|
5689
|
+
def last_deployment_config: () -> Types::InferenceComponentDeploymentConfig
|
5689
5690
|
end
|
5690
5691
|
# https://docs.aws.amazon.com/sdk-for-ruby/v3/api/Aws/SageMaker/Client.html#describe_inference_component-instance_method
|
5691
5692
|
def describe_inference_component: (
|
@@ -8526,7 +8527,8 @@ module Aws
|
|
8526
8527
|
}?
|
8527
8528
|
},
|
8528
8529
|
],
|
8529
|
-
?node_recovery: ("Automatic" | "None")
|
8530
|
+
?node_recovery: ("Automatic" | "None"),
|
8531
|
+
?instance_groups_to_delete: Array[::String]
|
8530
8532
|
) -> _UpdateClusterResponseSuccess
|
8531
8533
|
| (Hash[Symbol, untyped] params, ?Hash[Symbol, untyped] options) -> _UpdateClusterResponseSuccess
|
8532
8534
|
|
@@ -9191,6 +9193,27 @@ module Aws
|
|
9191
9193
|
},
|
9192
9194
|
?runtime_config: {
|
9193
9195
|
copy_count: ::Integer
|
9196
|
+
},
|
9197
|
+
?deployment_config: {
|
9198
|
+
rolling_update_policy: {
|
9199
|
+
maximum_batch_size: {
|
9200
|
+
type: ("COPY_COUNT" | "CAPACITY_PERCENT"),
|
9201
|
+
value: ::Integer
|
9202
|
+
},
|
9203
|
+
wait_interval_in_seconds: ::Integer,
|
9204
|
+
maximum_execution_timeout_in_seconds: ::Integer?,
|
9205
|
+
rollback_maximum_batch_size: {
|
9206
|
+
type: ("COPY_COUNT" | "CAPACITY_PERCENT"),
|
9207
|
+
value: ::Integer
|
9208
|
+
}?
|
9209
|
+
},
|
9210
|
+
auto_rollback_configuration: {
|
9211
|
+
alarms: Array[
|
9212
|
+
{
|
9213
|
+
alarm_name: ::String?
|
9214
|
+
},
|
9215
|
+
]?
|
9216
|
+
}?
|
9194
9217
|
}
|
9195
9218
|
) -> _UpdateInferenceComponentResponseSuccess
|
9196
9219
|
| (Hash[Symbol, untyped] params, ?Hash[Symbol, untyped] options) -> _UpdateInferenceComponentResponseSuccess
|
data/sig/types.rbs
CHANGED
@@ -3394,6 +3394,7 @@ module Aws::SageMaker
|
|
3394
3394
|
attr_accessor creation_time: ::Time
|
3395
3395
|
attr_accessor last_modified_time: ::Time
|
3396
3396
|
attr_accessor inference_component_status: ("InService" | "Creating" | "Updating" | "Failed" | "Deleting")
|
3397
|
+
attr_accessor last_deployment_config: Types::InferenceComponentDeploymentConfig
|
3397
3398
|
SENSITIVE: []
|
3398
3399
|
end
|
3399
3400
|
|
@@ -5174,6 +5175,12 @@ module Aws::SageMaker
|
|
5174
5175
|
SENSITIVE: []
|
5175
5176
|
end
|
5176
5177
|
|
5178
|
+
class InferenceComponentCapacitySize
|
5179
|
+
attr_accessor type: ("COPY_COUNT" | "CAPACITY_PERCENT")
|
5180
|
+
attr_accessor value: ::Integer
|
5181
|
+
SENSITIVE: []
|
5182
|
+
end
|
5183
|
+
|
5177
5184
|
class InferenceComponentComputeResourceRequirements
|
5178
5185
|
attr_accessor number_of_cpu_cores_required: ::Float
|
5179
5186
|
attr_accessor number_of_accelerator_devices_required: ::Float
|
@@ -5196,6 +5203,20 @@ module Aws::SageMaker
|
|
5196
5203
|
SENSITIVE: []
|
5197
5204
|
end
|
5198
5205
|
|
5206
|
+
class InferenceComponentDeploymentConfig
|
5207
|
+
attr_accessor rolling_update_policy: Types::InferenceComponentRollingUpdatePolicy
|
5208
|
+
attr_accessor auto_rollback_configuration: Types::AutoRollbackConfig
|
5209
|
+
SENSITIVE: []
|
5210
|
+
end
|
5211
|
+
|
5212
|
+
class InferenceComponentRollingUpdatePolicy
|
5213
|
+
attr_accessor maximum_batch_size: Types::InferenceComponentCapacitySize
|
5214
|
+
attr_accessor wait_interval_in_seconds: ::Integer
|
5215
|
+
attr_accessor maximum_execution_timeout_in_seconds: ::Integer
|
5216
|
+
attr_accessor rollback_maximum_batch_size: Types::InferenceComponentCapacitySize
|
5217
|
+
SENSITIVE: []
|
5218
|
+
end
|
5219
|
+
|
5199
5220
|
class InferenceComponentRuntimeConfig
|
5200
5221
|
attr_accessor copy_count: ::Integer
|
5201
5222
|
SENSITIVE: []
|
@@ -9869,6 +9890,7 @@ module Aws::SageMaker
|
|
9869
9890
|
attr_accessor cluster_name: ::String
|
9870
9891
|
attr_accessor instance_groups: ::Array[Types::ClusterInstanceGroupSpecification]
|
9871
9892
|
attr_accessor node_recovery: ("Automatic" | "None")
|
9893
|
+
attr_accessor instance_groups_to_delete: ::Array[::String]
|
9872
9894
|
SENSITIVE: []
|
9873
9895
|
end
|
9874
9896
|
|
@@ -10085,6 +10107,7 @@ module Aws::SageMaker
|
|
10085
10107
|
attr_accessor inference_component_name: ::String
|
10086
10108
|
attr_accessor specification: Types::InferenceComponentSpecification
|
10087
10109
|
attr_accessor runtime_config: Types::InferenceComponentRuntimeConfig
|
10110
|
+
attr_accessor deployment_config: Types::InferenceComponentDeploymentConfig
|
10088
10111
|
SENSITIVE: []
|
10089
10112
|
end
|
10090
10113
|
|
metadata
CHANGED
@@ -1,14 +1,14 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: aws-sdk-sagemaker
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 1.289.0
|
4
|
+
version: 1.291.0
|
5
5
|
platform: ruby
|
6
6
|
authors:
|
7
7
|
- Amazon Web Services
|
8
8
|
autorequire:
|
9
9
|
bindir: bin
|
10
10
|
cert_chain: []
|
11
|
-
date: 2025-02-19 00:00:00.000000000 Z
|
11
|
+
date: 2025-02-26 00:00:00.000000000 Z
|
12
12
|
dependencies:
|
13
13
|
- !ruby/object:Gem::Dependency
|
14
14
|
name: aws-sdk-core
|