aws-sdk-sagemaker 1.290.0 → 1.291.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/CHANGELOG.md +5 -0
- data/VERSION +1 -1
- data/lib/aws-sdk-sagemaker/client.rb +46 -3
- data/lib/aws-sdk-sagemaker/client_api.rb +20 -0
- data/lib/aws-sdk-sagemaker/types.rb +169 -10
- data/lib/aws-sdk-sagemaker.rb +1 -1
- data/sig/client.rbs +22 -0
- data/sig/types.rbs +22 -0
- metadata +2 -2
checksums.yaml
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
---
|
2
2
|
SHA256:
|
3
|
-
metadata.gz:
|
4
|
-
data.tar.gz:
|
3
|
+
metadata.gz: 89ca78842e4cb8cee6d80d8a8daf2c8b4dc0e47455067caecf7afd1ef6ffbd2e
|
4
|
+
data.tar.gz: dbbcf82690c0aba025bd9c60d7ca1dbe5855d544bb6b9b630f44daaad00a5ad0
|
5
5
|
SHA512:
|
6
|
-
metadata.gz:
|
7
|
-
data.tar.gz:
|
6
|
+
metadata.gz: de74eb8d70134e088fc61dfdf423b080ca19e84ecec8e21f73788c7abb2c5663b61e43be64ef04f4747bdc5b5377852e97a4b4bf451912291d6de3441c1fb682
|
7
|
+
data.tar.gz: 989fb4e7701a4455905eab5850c7e18b44b0df00b57e1a771c4f21386e41d00e7198b00cedaf5ed50e470130e3918b9f58d286331b99a1ff1c822c80c0b67d4b
|
data/CHANGELOG.md
CHANGED
data/VERSION
CHANGED
@@ -1 +1 @@
|
|
1
|
-
1.290.0
|
1
|
+
1.291.0
|
@@ -689,11 +689,19 @@ module Aws::SageMaker
|
|
689
689
|
# @option params [required, Array<String>] :node_ids
|
690
690
|
# A list of node IDs to be deleted from the specified cluster.
|
691
691
|
#
|
692
|
-
# <note markdown="1"> For SageMaker HyperPod clusters using the Slurm workload manager,
|
693
|
-
#
|
692
|
+
# <note markdown="1"> * For SageMaker HyperPod clusters using the Slurm workload manager,
|
693
|
+
# you cannot remove instances that are configured as Slurm controller
|
694
|
+
# nodes.
|
695
|
+
#
|
696
|
+
# * If you need to delete more than 99 instances, contact [Support][1]
|
697
|
+
# for assistance.
|
694
698
|
#
|
695
699
|
# </note>
|
696
700
|
#
|
701
|
+
#
|
702
|
+
#
|
703
|
+
# [1]: http://aws.amazon.com/contact-us/
|
704
|
+
#
|
697
705
|
# @return [Types::BatchDeleteClusterNodesResponse] Returns a {Seahorse::Client::Response response} object which responds to the following methods:
|
698
706
|
#
|
699
707
|
# * {Types::BatchDeleteClusterNodesResponse#failed #failed} => Array<Types::BatchDeleteClusterNodesError>
|
@@ -14977,6 +14985,7 @@ module Aws::SageMaker
|
|
14977
14985
|
# * {Types::DescribeInferenceComponentOutput#creation_time #creation_time} => Time
|
14978
14986
|
# * {Types::DescribeInferenceComponentOutput#last_modified_time #last_modified_time} => Time
|
14979
14987
|
# * {Types::DescribeInferenceComponentOutput#inference_component_status #inference_component_status} => String
|
14988
|
+
# * {Types::DescribeInferenceComponentOutput#last_deployment_config #last_deployment_config} => Types::InferenceComponentDeploymentConfig
|
14980
14989
|
#
|
14981
14990
|
# @example Request syntax with placeholder values
|
14982
14991
|
#
|
@@ -15011,6 +15020,14 @@ module Aws::SageMaker
|
|
15011
15020
|
# resp.creation_time #=> Time
|
15012
15021
|
# resp.last_modified_time #=> Time
|
15013
15022
|
# resp.inference_component_status #=> String, one of "InService", "Creating", "Updating", "Failed", "Deleting"
|
15023
|
+
# resp.last_deployment_config.rolling_update_policy.maximum_batch_size.type #=> String, one of "COPY_COUNT", "CAPACITY_PERCENT"
|
15024
|
+
# resp.last_deployment_config.rolling_update_policy.maximum_batch_size.value #=> Integer
|
15025
|
+
# resp.last_deployment_config.rolling_update_policy.wait_interval_in_seconds #=> Integer
|
15026
|
+
# resp.last_deployment_config.rolling_update_policy.maximum_execution_timeout_in_seconds #=> Integer
|
15027
|
+
# resp.last_deployment_config.rolling_update_policy.rollback_maximum_batch_size.type #=> String, one of "COPY_COUNT", "CAPACITY_PERCENT"
|
15028
|
+
# resp.last_deployment_config.rolling_update_policy.rollback_maximum_batch_size.value #=> Integer
|
15029
|
+
# resp.last_deployment_config.auto_rollback_configuration.alarms #=> Array
|
15030
|
+
# resp.last_deployment_config.auto_rollback_configuration.alarms[0].alarm_name #=> String
|
15014
15031
|
#
|
15015
15032
|
# @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/DescribeInferenceComponent AWS API Documentation
|
15016
15033
|
#
|
@@ -27537,6 +27554,11 @@ module Aws::SageMaker
|
|
27537
27554
|
# Runtime settings for a model that is deployed with an inference
|
27538
27555
|
# component.
|
27539
27556
|
#
|
27557
|
+
# @option params [Types::InferenceComponentDeploymentConfig] :deployment_config
|
27558
|
+
# The deployment configuration for the inference component. The
|
27559
|
+
# configuration contains the desired deployment strategy and rollback
|
27560
|
+
# settings.
|
27561
|
+
#
|
27540
27562
|
# @return [Types::UpdateInferenceComponentOutput] Returns a {Seahorse::Client::Response response} object which responds to the following methods:
|
27541
27563
|
#
|
27542
27564
|
# * {Types::UpdateInferenceComponentOutput#inference_component_arn #inference_component_arn} => String
|
@@ -27569,6 +27591,27 @@ module Aws::SageMaker
|
|
27569
27591
|
# runtime_config: {
|
27570
27592
|
# copy_count: 1, # required
|
27571
27593
|
# },
|
27594
|
+
# deployment_config: {
|
27595
|
+
# rolling_update_policy: { # required
|
27596
|
+
# maximum_batch_size: { # required
|
27597
|
+
# type: "COPY_COUNT", # required, accepts COPY_COUNT, CAPACITY_PERCENT
|
27598
|
+
# value: 1, # required
|
27599
|
+
# },
|
27600
|
+
# wait_interval_in_seconds: 1, # required
|
27601
|
+
# maximum_execution_timeout_in_seconds: 1,
|
27602
|
+
# rollback_maximum_batch_size: {
|
27603
|
+
# type: "COPY_COUNT", # required, accepts COPY_COUNT, CAPACITY_PERCENT
|
27604
|
+
# value: 1, # required
|
27605
|
+
# },
|
27606
|
+
# },
|
27607
|
+
# auto_rollback_configuration: {
|
27608
|
+
# alarms: [
|
27609
|
+
# {
|
27610
|
+
# alarm_name: "AlarmName",
|
27611
|
+
# },
|
27612
|
+
# ],
|
27613
|
+
# },
|
27614
|
+
# },
|
27572
27615
|
# })
|
27573
27616
|
#
|
27574
27617
|
# @example Response structure
|
@@ -29502,7 +29545,7 @@ module Aws::SageMaker
|
|
29502
29545
|
tracer: tracer
|
29503
29546
|
)
|
29504
29547
|
context[:gem_name] = 'aws-sdk-sagemaker'
|
29505
|
-
context[:gem_version] = '1.290.0'
|
29548
|
+
context[:gem_version] = '1.291.0'
|
29506
29549
|
Seahorse::Client::Request.new(handlers, context)
|
29507
29550
|
end
|
29508
29551
|
|
@@ -1149,12 +1149,16 @@ module Aws::SageMaker
|
|
1149
1149
|
ImportHubContentResponse = Shapes::StructureShape.new(name: 'ImportHubContentResponse')
|
1150
1150
|
InUseInstanceCount = Shapes::IntegerShape.new(name: 'InUseInstanceCount')
|
1151
1151
|
InferenceComponentArn = Shapes::StringShape.new(name: 'InferenceComponentArn')
|
1152
|
+
InferenceComponentCapacitySize = Shapes::StructureShape.new(name: 'InferenceComponentCapacitySize')
|
1153
|
+
InferenceComponentCapacitySizeType = Shapes::StringShape.new(name: 'InferenceComponentCapacitySizeType')
|
1152
1154
|
InferenceComponentComputeResourceRequirements = Shapes::StructureShape.new(name: 'InferenceComponentComputeResourceRequirements')
|
1153
1155
|
InferenceComponentContainerSpecification = Shapes::StructureShape.new(name: 'InferenceComponentContainerSpecification')
|
1154
1156
|
InferenceComponentContainerSpecificationSummary = Shapes::StructureShape.new(name: 'InferenceComponentContainerSpecificationSummary')
|
1155
1157
|
InferenceComponentCopyCount = Shapes::IntegerShape.new(name: 'InferenceComponentCopyCount')
|
1158
|
+
InferenceComponentDeploymentConfig = Shapes::StructureShape.new(name: 'InferenceComponentDeploymentConfig')
|
1156
1159
|
InferenceComponentName = Shapes::StringShape.new(name: 'InferenceComponentName')
|
1157
1160
|
InferenceComponentNameContains = Shapes::StringShape.new(name: 'InferenceComponentNameContains')
|
1161
|
+
InferenceComponentRollingUpdatePolicy = Shapes::StructureShape.new(name: 'InferenceComponentRollingUpdatePolicy')
|
1158
1162
|
InferenceComponentRuntimeConfig = Shapes::StructureShape.new(name: 'InferenceComponentRuntimeConfig')
|
1159
1163
|
InferenceComponentRuntimeConfigSummary = Shapes::StructureShape.new(name: 'InferenceComponentRuntimeConfigSummary')
|
1160
1164
|
InferenceComponentSortKey = Shapes::StringShape.new(name: 'InferenceComponentSortKey')
|
@@ -5204,6 +5208,7 @@ module Aws::SageMaker
|
|
5204
5208
|
DescribeInferenceComponentOutput.add_member(:creation_time, Shapes::ShapeRef.new(shape: Timestamp, required: true, location_name: "CreationTime"))
|
5205
5209
|
DescribeInferenceComponentOutput.add_member(:last_modified_time, Shapes::ShapeRef.new(shape: Timestamp, required: true, location_name: "LastModifiedTime"))
|
5206
5210
|
DescribeInferenceComponentOutput.add_member(:inference_component_status, Shapes::ShapeRef.new(shape: InferenceComponentStatus, location_name: "InferenceComponentStatus"))
|
5211
|
+
DescribeInferenceComponentOutput.add_member(:last_deployment_config, Shapes::ShapeRef.new(shape: InferenceComponentDeploymentConfig, location_name: "LastDeploymentConfig"))
|
5207
5212
|
DescribeInferenceComponentOutput.struct_class = Types::DescribeInferenceComponentOutput
|
5208
5213
|
|
5209
5214
|
DescribeInferenceExperimentRequest.add_member(:name, Shapes::ShapeRef.new(shape: InferenceExperimentName, required: true, location_name: "Name"))
|
@@ -6724,6 +6729,10 @@ module Aws::SageMaker
|
|
6724
6729
|
ImportHubContentResponse.add_member(:hub_content_arn, Shapes::ShapeRef.new(shape: HubContentArn, required: true, location_name: "HubContentArn"))
|
6725
6730
|
ImportHubContentResponse.struct_class = Types::ImportHubContentResponse
|
6726
6731
|
|
6732
|
+
InferenceComponentCapacitySize.add_member(:type, Shapes::ShapeRef.new(shape: InferenceComponentCapacitySizeType, required: true, location_name: "Type"))
|
6733
|
+
InferenceComponentCapacitySize.add_member(:value, Shapes::ShapeRef.new(shape: CapacitySizeValue, required: true, location_name: "Value"))
|
6734
|
+
InferenceComponentCapacitySize.struct_class = Types::InferenceComponentCapacitySize
|
6735
|
+
|
6727
6736
|
InferenceComponentComputeResourceRequirements.add_member(:number_of_cpu_cores_required, Shapes::ShapeRef.new(shape: NumberOfCpuCores, location_name: "NumberOfCpuCoresRequired"))
|
6728
6737
|
InferenceComponentComputeResourceRequirements.add_member(:number_of_accelerator_devices_required, Shapes::ShapeRef.new(shape: NumberOfAcceleratorDevices, location_name: "NumberOfAcceleratorDevicesRequired"))
|
6729
6738
|
InferenceComponentComputeResourceRequirements.add_member(:min_memory_required_in_mb, Shapes::ShapeRef.new(shape: MemoryInMb, required: true, location_name: "MinMemoryRequiredInMb"))
|
@@ -6740,6 +6749,16 @@ module Aws::SageMaker
|
|
6740
6749
|
InferenceComponentContainerSpecificationSummary.add_member(:environment, Shapes::ShapeRef.new(shape: EnvironmentMap, location_name: "Environment"))
|
6741
6750
|
InferenceComponentContainerSpecificationSummary.struct_class = Types::InferenceComponentContainerSpecificationSummary
|
6742
6751
|
|
6752
|
+
InferenceComponentDeploymentConfig.add_member(:rolling_update_policy, Shapes::ShapeRef.new(shape: InferenceComponentRollingUpdatePolicy, required: true, location_name: "RollingUpdatePolicy"))
|
6753
|
+
InferenceComponentDeploymentConfig.add_member(:auto_rollback_configuration, Shapes::ShapeRef.new(shape: AutoRollbackConfig, location_name: "AutoRollbackConfiguration"))
|
6754
|
+
InferenceComponentDeploymentConfig.struct_class = Types::InferenceComponentDeploymentConfig
|
6755
|
+
|
6756
|
+
InferenceComponentRollingUpdatePolicy.add_member(:maximum_batch_size, Shapes::ShapeRef.new(shape: InferenceComponentCapacitySize, required: true, location_name: "MaximumBatchSize"))
|
6757
|
+
InferenceComponentRollingUpdatePolicy.add_member(:wait_interval_in_seconds, Shapes::ShapeRef.new(shape: WaitIntervalInSeconds, required: true, location_name: "WaitIntervalInSeconds"))
|
6758
|
+
InferenceComponentRollingUpdatePolicy.add_member(:maximum_execution_timeout_in_seconds, Shapes::ShapeRef.new(shape: MaximumExecutionTimeoutInSeconds, location_name: "MaximumExecutionTimeoutInSeconds"))
|
6759
|
+
InferenceComponentRollingUpdatePolicy.add_member(:rollback_maximum_batch_size, Shapes::ShapeRef.new(shape: InferenceComponentCapacitySize, location_name: "RollbackMaximumBatchSize"))
|
6760
|
+
InferenceComponentRollingUpdatePolicy.struct_class = Types::InferenceComponentRollingUpdatePolicy
|
6761
|
+
|
6743
6762
|
InferenceComponentRuntimeConfig.add_member(:copy_count, Shapes::ShapeRef.new(shape: InferenceComponentCopyCount, required: true, location_name: "CopyCount"))
|
6744
6763
|
InferenceComponentRuntimeConfig.struct_class = Types::InferenceComponentRuntimeConfig
|
6745
6764
|
|
@@ -10719,6 +10738,7 @@ module Aws::SageMaker
|
|
10719
10738
|
UpdateInferenceComponentInput.add_member(:inference_component_name, Shapes::ShapeRef.new(shape: InferenceComponentName, required: true, location_name: "InferenceComponentName"))
|
10720
10739
|
UpdateInferenceComponentInput.add_member(:specification, Shapes::ShapeRef.new(shape: InferenceComponentSpecification, location_name: "Specification"))
|
10721
10740
|
UpdateInferenceComponentInput.add_member(:runtime_config, Shapes::ShapeRef.new(shape: InferenceComponentRuntimeConfig, location_name: "RuntimeConfig"))
|
10741
|
+
UpdateInferenceComponentInput.add_member(:deployment_config, Shapes::ShapeRef.new(shape: InferenceComponentDeploymentConfig, location_name: "DeploymentConfig"))
|
10722
10742
|
UpdateInferenceComponentInput.struct_class = Types::UpdateInferenceComponentInput
|
10723
10743
|
|
10724
10744
|
UpdateInferenceComponentOutput.add_member(:inference_component_arn, Shapes::ShapeRef.new(shape: InferenceComponentArn, required: true, location_name: "InferenceComponentArn"))
|
@@ -2989,11 +2989,18 @@ module Aws::SageMaker
|
|
2989
2989
|
# @!attribute [rw] node_ids
|
2990
2990
|
# A list of node IDs to be deleted from the specified cluster.
|
2991
2991
|
#
|
2992
|
-
# <note markdown="1"> For SageMaker HyperPod clusters using the Slurm workload manager,
|
2993
|
-
#
|
2994
|
-
#
|
2992
|
+
# <note markdown="1"> * For SageMaker HyperPod clusters using the Slurm workload manager,
|
2993
|
+
# you cannot remove instances that are configured as Slurm
|
2994
|
+
# controller nodes.
|
2995
|
+
#
|
2996
|
+
# * If you need to delete more than 99 instances, contact [Support][1]
|
2997
|
+
# for assistance.
|
2995
2998
|
#
|
2996
2999
|
# </note>
|
3000
|
+
#
|
3001
|
+
#
|
3002
|
+
#
|
3003
|
+
# [1]: http://aws.amazon.com/contact-us/
|
2997
3004
|
# @return [Array<String>]
|
2998
3005
|
#
|
2999
3006
|
# @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/BatchDeleteClusterNodesRequest AWS API Documentation
|
@@ -16028,6 +16035,11 @@ module Aws::SageMaker
|
|
16028
16035
|
# The status of the inference component.
|
16029
16036
|
# @return [String]
|
16030
16037
|
#
|
16038
|
+
# @!attribute [rw] last_deployment_config
|
16039
|
+
# The deployment and rollback settings that you assigned to the
|
16040
|
+
# inference component.
|
16041
|
+
# @return [Types::InferenceComponentDeploymentConfig]
|
16042
|
+
#
|
16031
16043
|
# @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/DescribeInferenceComponentOutput AWS API Documentation
|
16032
16044
|
#
|
16033
16045
|
class DescribeInferenceComponentOutput < Struct.new(
|
@@ -16041,7 +16053,8 @@ module Aws::SageMaker
|
|
16041
16053
|
:runtime_config,
|
16042
16054
|
:creation_time,
|
16043
16055
|
:last_modified_time,
|
16044
|
-
:inference_component_status
|
16056
|
+
:inference_component_status,
|
16057
|
+
:last_deployment_config)
|
16045
16058
|
SENSITIVE = []
|
16046
16059
|
include Aws::Structure
|
16047
16060
|
end
|
@@ -21280,10 +21293,12 @@ module Aws::SageMaker
|
|
21280
21293
|
end
|
21281
21294
|
|
21282
21295
|
# The properties of an experiment as returned by the [Search][1] API.
|
21296
|
+
# For information about experiments, see the [CreateExperiment][2] API.
|
21283
21297
|
#
|
21284
21298
|
#
|
21285
21299
|
#
|
21286
21300
|
# [1]: https://docs.aws.amazon.com/sagemaker/latest/APIReference/API_Search.html
|
21301
|
+
# [2]: https://docs.aws.amazon.com/sagemaker/latest/APIReference/API_CreateExperiment.html
|
21287
21302
|
#
|
21288
21303
|
# @!attribute [rw] experiment_name
|
21289
21304
|
# The name of the experiment.
|
@@ -25376,6 +25391,47 @@ module Aws::SageMaker
|
|
25376
25391
|
include Aws::Structure
|
25377
25392
|
end
|
25378
25393
|
|
25394
|
+
# Specifies the type and size of the endpoint capacity to activate for a
|
25395
|
+
# rolling deployment or a rollback strategy. You can specify your
|
25396
|
+
# batches as either of the following:
|
25397
|
+
#
|
25398
|
+
# * A count of inference component copies
|
25399
|
+
#
|
25400
|
+
# * The overall percentage of your fleet
|
25401
|
+
#
|
25402
|
+
# For a rollback strategy, if you don't specify the fields in this
|
25403
|
+
# object, or if you set the `Value` parameter to 100%, then SageMaker AI
|
25404
|
+
# uses a blue/green rollback strategy and rolls all traffic back to the
|
25405
|
+
# blue fleet.
|
25406
|
+
#
|
25407
|
+
# @!attribute [rw] type
|
25408
|
+
# Specifies the endpoint capacity type.
|
25409
|
+
#
|
25410
|
+
# COPY\_COUNT
|
25411
|
+
#
|
25412
|
+
# : The endpoint activates based on the number of inference component
|
25413
|
+
# copies.
|
25414
|
+
#
|
25415
|
+
# CAPACITY\_PERCENT
|
25416
|
+
#
|
25417
|
+
# : The endpoint activates based on the specified percentage of
|
25418
|
+
# capacity.
|
25419
|
+
# @return [String]
|
25420
|
+
#
|
25421
|
+
# @!attribute [rw] value
|
25422
|
+
# Defines the capacity size, either as a number of inference component
|
25423
|
+
# copies or a capacity percentage.
|
25424
|
+
# @return [Integer]
|
25425
|
+
#
|
25426
|
+
# @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/InferenceComponentCapacitySize AWS API Documentation
|
25427
|
+
#
|
25428
|
+
class InferenceComponentCapacitySize < Struct.new(
|
25429
|
+
:type,
|
25430
|
+
:value)
|
25431
|
+
SENSITIVE = []
|
25432
|
+
include Aws::Structure
|
25433
|
+
end
|
25434
|
+
|
25379
25435
|
# Defines the compute resources to allocate to run a model, plus any
|
25380
25436
|
# adapter models, that you assign to an inference component. These
|
25381
25437
|
# resources include CPU cores, accelerators, and memory.
|
@@ -25481,6 +25537,69 @@ module Aws::SageMaker
|
|
25481
25537
|
include Aws::Structure
|
25482
25538
|
end
|
25483
25539
|
|
25540
|
+
# The deployment configuration for an endpoint that hosts inference
|
25541
|
+
# components. The configuration includes the desired deployment strategy
|
25542
|
+
# and rollback settings.
|
25543
|
+
#
|
25544
|
+
# @!attribute [rw] rolling_update_policy
|
25545
|
+
# Specifies a rolling deployment strategy for updating a SageMaker AI
|
25546
|
+
# endpoint.
|
25547
|
+
# @return [Types::InferenceComponentRollingUpdatePolicy]
|
25548
|
+
#
|
25549
|
+
# @!attribute [rw] auto_rollback_configuration
|
25550
|
+
# Automatic rollback configuration for handling endpoint deployment
|
25551
|
+
# failures and recovery.
|
25552
|
+
# @return [Types::AutoRollbackConfig]
|
25553
|
+
#
|
25554
|
+
# @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/InferenceComponentDeploymentConfig AWS API Documentation
|
25555
|
+
#
|
25556
|
+
class InferenceComponentDeploymentConfig < Struct.new(
|
25557
|
+
:rolling_update_policy,
|
25558
|
+
:auto_rollback_configuration)
|
25559
|
+
SENSITIVE = []
|
25560
|
+
include Aws::Structure
|
25561
|
+
end
|
25562
|
+
|
25563
|
+
# Specifies a rolling deployment strategy for updating a SageMaker AI
|
25564
|
+
# inference component.
|
25565
|
+
#
|
25566
|
+
# @!attribute [rw] maximum_batch_size
|
25567
|
+
# The batch size for each rolling step in the deployment process. For
|
25568
|
+
# each step, SageMaker AI provisions capacity on the new endpoint
|
25569
|
+
# fleet, routes traffic to that fleet, and terminates capacity on the
|
25570
|
+
# old endpoint fleet. The value must be between 5% and 50% of the copy
|
25571
|
+
# count of the inference component.
|
25572
|
+
# @return [Types::InferenceComponentCapacitySize]
|
25573
|
+
#
|
25574
|
+
# @!attribute [rw] wait_interval_in_seconds
|
25575
|
+
# The length of the baking period, during which SageMaker AI monitors
|
25576
|
+
# alarms for each batch on the new fleet.
|
25577
|
+
# @return [Integer]
|
25578
|
+
#
|
25579
|
+
# @!attribute [rw] maximum_execution_timeout_in_seconds
|
25580
|
+
# The time limit for the total deployment. Exceeding this limit causes
|
25581
|
+
# a timeout.
|
25582
|
+
# @return [Integer]
|
25583
|
+
#
|
25584
|
+
# @!attribute [rw] rollback_maximum_batch_size
|
25585
|
+
# The batch size for a rollback to the old endpoint fleet. If this
|
25586
|
+
# field is absent, the value is set to the default, which is 100% of
|
25587
|
+
# the total capacity. When the default is used, SageMaker AI
|
25588
|
+
# provisions the entire capacity of the old fleet at once during
|
25589
|
+
# rollback.
|
25590
|
+
# @return [Types::InferenceComponentCapacitySize]
|
25591
|
+
#
|
25592
|
+
# @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/InferenceComponentRollingUpdatePolicy AWS API Documentation
|
25593
|
+
#
|
25594
|
+
class InferenceComponentRollingUpdatePolicy < Struct.new(
|
25595
|
+
:maximum_batch_size,
|
25596
|
+
:wait_interval_in_seconds,
|
25597
|
+
:maximum_execution_timeout_in_seconds,
|
25598
|
+
:rollback_maximum_batch_size)
|
25599
|
+
SENSITIVE = []
|
25600
|
+
include Aws::Structure
|
25601
|
+
end
|
25602
|
+
|
25484
25603
|
# Runtime settings for a model that is deployed with an inference
|
25485
25604
|
# component.
|
25486
25605
|
#
|
@@ -34551,10 +34670,29 @@ module Aws::SageMaker
|
|
34551
34670
|
include Aws::Structure
|
34552
34671
|
end
|
34553
34672
|
|
34554
|
-
# A
|
34673
|
+
# A container for your trained model that can be deployed for SageMaker
|
34674
|
+
# inference. This can include inference code, artifacts, and metadata.
|
34675
|
+
# The model package type can be one of the following.
|
34676
|
+
#
|
34677
|
+
# * Versioned model: A part of a model package group in Model Registry.
|
34678
|
+
#
|
34679
|
+
# * Unversioned model: Not part of a model package group and used in
|
34680
|
+
# Amazon Web Services Marketplace.
|
34681
|
+
#
|
34682
|
+
# For more information, see [ `CreateModelPackage` ][1].
|
34683
|
+
#
|
34684
|
+
#
|
34685
|
+
#
|
34686
|
+
# [1]: https://docs.aws.amazon.com/sagemaker/latest/APIReference/API_CreateModelPackage.html
|
34555
34687
|
#
|
34556
34688
|
# @!attribute [rw] model_package_name
|
34557
|
-
# The name of the model.
|
34689
|
+
# The name of the model package. The name can be as follows:
|
34690
|
+
#
|
34691
|
+
# * For a versioned model, the name is automatically generated by
|
34692
|
+
# SageMaker Model Registry and follows the format
|
34693
|
+
# '`ModelPackageGroupName/ModelPackageVersion`'.
|
34694
|
+
#
|
34695
|
+
# * For an unversioned model, you must provide the name.
|
34558
34696
|
# @return [String]
|
34559
34697
|
#
|
34560
34698
|
# @!attribute [rw] model_package_group_name
|
@@ -34879,7 +35017,7 @@ module Aws::SageMaker
|
|
34879
35017
|
include Aws::Structure
|
34880
35018
|
end
|
34881
35019
|
|
34882
|
-
# A group of versioned models in the
|
35020
|
+
# A group of versioned models in the Model Registry.
|
34883
35021
|
#
|
34884
35022
|
# @!attribute [rw] model_package_group_name
|
34885
35023
|
# The name of the model group.
|
@@ -42316,11 +42454,25 @@ module Aws::SageMaker
|
|
42316
42454
|
# @return [Types::Endpoint]
|
42317
42455
|
#
|
42318
42456
|
# @!attribute [rw] model_package
|
42319
|
-
# A
|
42457
|
+
# A container for your trained model that can be deployed for
|
42458
|
+
# SageMaker inference. This can include inference code, artifacts, and
|
42459
|
+
# metadata. The model package type can be one of the following.
|
42460
|
+
#
|
42461
|
+
# * Versioned model: A part of a model package group in Model
|
42462
|
+
# Registry.
|
42463
|
+
#
|
42464
|
+
# * Unversioned model: Not part of a model package group and used in
|
42465
|
+
# Amazon Web Services Marketplace.
|
42466
|
+
#
|
42467
|
+
# For more information, see [ `CreateModelPackage` ][1].
|
42468
|
+
#
|
42469
|
+
#
|
42470
|
+
#
|
42471
|
+
# [1]: https://docs.aws.amazon.com/sagemaker/latest/APIReference/API_CreateModelPackage.html
|
42320
42472
|
# @return [Types::ModelPackage]
|
42321
42473
|
#
|
42322
42474
|
# @!attribute [rw] model_package_group
|
42323
|
-
# A group of versioned models in the
|
42475
|
+
# A group of versioned models in the Model Registry.
|
42324
42476
|
# @return [Types::ModelPackageGroup]
|
42325
42477
|
#
|
42326
42478
|
# @!attribute [rw] pipeline
|
@@ -48193,12 +48345,19 @@ module Aws::SageMaker
|
|
48193
48345
|
# component.
|
48194
48346
|
# @return [Types::InferenceComponentRuntimeConfig]
|
48195
48347
|
#
|
48348
|
+
# @!attribute [rw] deployment_config
|
48349
|
+
# The deployment configuration for the inference component. The
|
48350
|
+
# configuration contains the desired deployment strategy and rollback
|
48351
|
+
# settings.
|
48352
|
+
# @return [Types::InferenceComponentDeploymentConfig]
|
48353
|
+
#
|
48196
48354
|
# @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/UpdateInferenceComponentInput AWS API Documentation
|
48197
48355
|
#
|
48198
48356
|
class UpdateInferenceComponentInput < Struct.new(
|
48199
48357
|
:inference_component_name,
|
48200
48358
|
:specification,
|
48201
|
-
:runtime_config
|
48359
|
+
:runtime_config,
|
48360
|
+
:deployment_config)
|
48202
48361
|
SENSITIVE = []
|
48203
48362
|
include Aws::Structure
|
48204
48363
|
end
|
data/lib/aws-sdk-sagemaker.rb
CHANGED
data/sig/client.rbs
CHANGED
@@ -5686,6 +5686,7 @@ module Aws
|
|
5686
5686
|
def creation_time: () -> ::Time
|
5687
5687
|
def last_modified_time: () -> ::Time
|
5688
5688
|
def inference_component_status: () -> ("InService" | "Creating" | "Updating" | "Failed" | "Deleting")
|
5689
|
+
def last_deployment_config: () -> Types::InferenceComponentDeploymentConfig
|
5689
5690
|
end
|
5690
5691
|
# https://docs.aws.amazon.com/sdk-for-ruby/v3/api/Aws/SageMaker/Client.html#describe_inference_component-instance_method
|
5691
5692
|
def describe_inference_component: (
|
@@ -9192,6 +9193,27 @@ module Aws
|
|
9192
9193
|
},
|
9193
9194
|
?runtime_config: {
|
9194
9195
|
copy_count: ::Integer
|
9196
|
+
},
|
9197
|
+
?deployment_config: {
|
9198
|
+
rolling_update_policy: {
|
9199
|
+
maximum_batch_size: {
|
9200
|
+
type: ("COPY_COUNT" | "CAPACITY_PERCENT"),
|
9201
|
+
value: ::Integer
|
9202
|
+
},
|
9203
|
+
wait_interval_in_seconds: ::Integer,
|
9204
|
+
maximum_execution_timeout_in_seconds: ::Integer?,
|
9205
|
+
rollback_maximum_batch_size: {
|
9206
|
+
type: ("COPY_COUNT" | "CAPACITY_PERCENT"),
|
9207
|
+
value: ::Integer
|
9208
|
+
}?
|
9209
|
+
},
|
9210
|
+
auto_rollback_configuration: {
|
9211
|
+
alarms: Array[
|
9212
|
+
{
|
9213
|
+
alarm_name: ::String?
|
9214
|
+
},
|
9215
|
+
]?
|
9216
|
+
}?
|
9195
9217
|
}
|
9196
9218
|
) -> _UpdateInferenceComponentResponseSuccess
|
9197
9219
|
| (Hash[Symbol, untyped] params, ?Hash[Symbol, untyped] options) -> _UpdateInferenceComponentResponseSuccess
|
data/sig/types.rbs
CHANGED
@@ -3394,6 +3394,7 @@ module Aws::SageMaker
|
|
3394
3394
|
attr_accessor creation_time: ::Time
|
3395
3395
|
attr_accessor last_modified_time: ::Time
|
3396
3396
|
attr_accessor inference_component_status: ("InService" | "Creating" | "Updating" | "Failed" | "Deleting")
|
3397
|
+
attr_accessor last_deployment_config: Types::InferenceComponentDeploymentConfig
|
3397
3398
|
SENSITIVE: []
|
3398
3399
|
end
|
3399
3400
|
|
@@ -5174,6 +5175,12 @@ module Aws::SageMaker
|
|
5174
5175
|
SENSITIVE: []
|
5175
5176
|
end
|
5176
5177
|
|
5178
|
+
class InferenceComponentCapacitySize
|
5179
|
+
attr_accessor type: ("COPY_COUNT" | "CAPACITY_PERCENT")
|
5180
|
+
attr_accessor value: ::Integer
|
5181
|
+
SENSITIVE: []
|
5182
|
+
end
|
5183
|
+
|
5177
5184
|
class InferenceComponentComputeResourceRequirements
|
5178
5185
|
attr_accessor number_of_cpu_cores_required: ::Float
|
5179
5186
|
attr_accessor number_of_accelerator_devices_required: ::Float
|
@@ -5196,6 +5203,20 @@ module Aws::SageMaker
|
|
5196
5203
|
SENSITIVE: []
|
5197
5204
|
end
|
5198
5205
|
|
5206
|
+
class InferenceComponentDeploymentConfig
|
5207
|
+
attr_accessor rolling_update_policy: Types::InferenceComponentRollingUpdatePolicy
|
5208
|
+
attr_accessor auto_rollback_configuration: Types::AutoRollbackConfig
|
5209
|
+
SENSITIVE: []
|
5210
|
+
end
|
5211
|
+
|
5212
|
+
class InferenceComponentRollingUpdatePolicy
|
5213
|
+
attr_accessor maximum_batch_size: Types::InferenceComponentCapacitySize
|
5214
|
+
attr_accessor wait_interval_in_seconds: ::Integer
|
5215
|
+
attr_accessor maximum_execution_timeout_in_seconds: ::Integer
|
5216
|
+
attr_accessor rollback_maximum_batch_size: Types::InferenceComponentCapacitySize
|
5217
|
+
SENSITIVE: []
|
5218
|
+
end
|
5219
|
+
|
5199
5220
|
class InferenceComponentRuntimeConfig
|
5200
5221
|
attr_accessor copy_count: ::Integer
|
5201
5222
|
SENSITIVE: []
|
@@ -10086,6 +10107,7 @@ module Aws::SageMaker
|
|
10086
10107
|
attr_accessor inference_component_name: ::String
|
10087
10108
|
attr_accessor specification: Types::InferenceComponentSpecification
|
10088
10109
|
attr_accessor runtime_config: Types::InferenceComponentRuntimeConfig
|
10110
|
+
attr_accessor deployment_config: Types::InferenceComponentDeploymentConfig
|
10089
10111
|
SENSITIVE: []
|
10090
10112
|
end
|
10091
10113
|
|
metadata
CHANGED
@@ -1,14 +1,14 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: aws-sdk-sagemaker
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 1.290.0
|
4
|
+
version: 1.291.0
|
5
5
|
platform: ruby
|
6
6
|
authors:
|
7
7
|
- Amazon Web Services
|
8
8
|
autorequire:
|
9
9
|
bindir: bin
|
10
10
|
cert_chain: []
|
11
|
-
date: 2025-02-
|
11
|
+
date: 2025-02-26 00:00:00.000000000 Z
|
12
12
|
dependencies:
|
13
13
|
- !ruby/object:Gem::Dependency
|
14
14
|
name: aws-sdk-core
|