aws-sdk-sagemaker 1.192.0 → 1.194.0
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +4 -4
- data/CHANGELOG.md +10 -0
- data/VERSION +1 -1
- data/lib/aws-sdk-sagemaker/client.rb +56 -8
- data/lib/aws-sdk-sagemaker/client_api.rb +19 -4
- data/lib/aws-sdk-sagemaker/types.rb +113 -6
- data/lib/aws-sdk-sagemaker.rb +1 -1
- metadata +2 -2
checksums.yaml
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
---
|
2
2
|
SHA256:
|
3
|
-
metadata.gz:
|
4
|
-
data.tar.gz:
|
3
|
+
metadata.gz: 60973ee75145a047cd16273b84e2c90c71e5f4f79410ca18abc405d322530142
|
4
|
+
data.tar.gz: c3b8a0d376ecde588856d2902f2260fda4df5ee686004457f25edccff047fab3
|
5
5
|
SHA512:
|
6
|
-
metadata.gz:
|
7
|
-
data.tar.gz:
|
6
|
+
metadata.gz: ab144375ebe73e9a8ba1db86cfc76be055d4a904277d6f8fc474dd1cbc846980c66ab87b90d6892a99798c55fe84197a03c5911bac12295b441c130e7ee12e1c
|
7
|
+
data.tar.gz: 76a347049d001562cda69eb23edab0abe7a60de6f84ecdb31b4aa237ef850122be6210bcf87927af77fcbb2e492d06dd95ebd795a1350113a007ca5cae7e60b4
|
data/CHANGELOG.md
CHANGED
@@ -1,6 +1,16 @@
|
|
1
1
|
Unreleased Changes
|
2
2
|
------------------
|
3
3
|
|
4
|
+
1.194.0 (2023-07-03)
|
5
|
+
------------------
|
6
|
+
|
7
|
+
* Feature - SageMaker Inference Recommender now accepts new fields SupportedEndpointType and ServerlessConfiguration to support serverless endpoints.
|
8
|
+
|
9
|
+
1.193.0 (2023-06-30)
|
10
|
+
------------------
|
11
|
+
|
12
|
+
* Feature - This release adds support for rolling deployment in SageMaker Inference.
|
13
|
+
|
4
14
|
1.192.0 (2023-06-29)
|
5
15
|
------------------
|
6
16
|
|
data/VERSION
CHANGED
@@ -1 +1 @@
|
|
1
|
-
1.192.0
|
1
|
+
1.194.0
|
@@ -2719,7 +2719,7 @@ module Aws::SageMaker
|
|
2719
2719
|
# endpoint_name: "EndpointName", # required
|
2720
2720
|
# endpoint_config_name: "EndpointConfigName", # required
|
2721
2721
|
# deployment_config: {
|
2722
|
-
# blue_green_update_policy: {
|
2722
|
+
# blue_green_update_policy: {
|
2723
2723
|
# traffic_routing_configuration: { # required
|
2724
2724
|
# type: "ALL_AT_ONCE", # required, accepts ALL_AT_ONCE, CANARY, LINEAR
|
2725
2725
|
# wait_interval_in_seconds: 1, # required
|
@@ -2742,6 +2742,18 @@ module Aws::SageMaker
|
|
2742
2742
|
# },
|
2743
2743
|
# ],
|
2744
2744
|
# },
|
2745
|
+
# rolling_update_policy: {
|
2746
|
+
# maximum_batch_size: { # required
|
2747
|
+
# type: "INSTANCE_COUNT", # required, accepts INSTANCE_COUNT, CAPACITY_PERCENT
|
2748
|
+
# value: 1, # required
|
2749
|
+
# },
|
2750
|
+
# wait_interval_in_seconds: 1, # required
|
2751
|
+
# maximum_execution_timeout_in_seconds: 1,
|
2752
|
+
# rollback_maximum_batch_size: {
|
2753
|
+
# type: "INSTANCE_COUNT", # required, accepts INSTANCE_COUNT, CAPACITY_PERCENT
|
2754
|
+
# value: 1, # required
|
2755
|
+
# },
|
2756
|
+
# },
|
2745
2757
|
# },
|
2746
2758
|
# tags: [
|
2747
2759
|
# {
|
@@ -4447,7 +4459,7 @@ module Aws::SageMaker
|
|
4447
4459
|
# },
|
4448
4460
|
# endpoint_configurations: [
|
4449
4461
|
# {
|
4450
|
-
# instance_type: "ml.t2.medium", #
|
4462
|
+
# instance_type: "ml.t2.medium", # accepts ml.t2.medium, ml.t2.large, ml.t2.xlarge, ml.t2.2xlarge, ml.m4.xlarge, ml.m4.2xlarge, ml.m4.4xlarge, ml.m4.10xlarge, ml.m4.16xlarge, ml.m5.large, ml.m5.xlarge, ml.m5.2xlarge, ml.m5.4xlarge, ml.m5.12xlarge, ml.m5.24xlarge, ml.m5d.large, ml.m5d.xlarge, ml.m5d.2xlarge, ml.m5d.4xlarge, ml.m5d.12xlarge, ml.m5d.24xlarge, ml.c4.large, ml.c4.xlarge, ml.c4.2xlarge, ml.c4.4xlarge, ml.c4.8xlarge, ml.p2.xlarge, ml.p2.8xlarge, ml.p2.16xlarge, ml.p3.2xlarge, ml.p3.8xlarge, ml.p3.16xlarge, ml.c5.large, ml.c5.xlarge, ml.c5.2xlarge, ml.c5.4xlarge, ml.c5.9xlarge, ml.c5.18xlarge, ml.c5d.large, ml.c5d.xlarge, ml.c5d.2xlarge, ml.c5d.4xlarge, ml.c5d.9xlarge, ml.c5d.18xlarge, ml.g4dn.xlarge, ml.g4dn.2xlarge, ml.g4dn.4xlarge, ml.g4dn.8xlarge, ml.g4dn.12xlarge, ml.g4dn.16xlarge, ml.r5.large, ml.r5.xlarge, ml.r5.2xlarge, ml.r5.4xlarge, ml.r5.12xlarge, ml.r5.24xlarge, ml.r5d.large, ml.r5d.xlarge, ml.r5d.2xlarge, ml.r5d.4xlarge, ml.r5d.12xlarge, ml.r5d.24xlarge, ml.inf1.xlarge, ml.inf1.2xlarge, ml.inf1.6xlarge, ml.inf1.24xlarge, ml.c6i.large, ml.c6i.xlarge, ml.c6i.2xlarge, ml.c6i.4xlarge, ml.c6i.8xlarge, ml.c6i.12xlarge, ml.c6i.16xlarge, ml.c6i.24xlarge, ml.c6i.32xlarge, ml.g5.xlarge, ml.g5.2xlarge, ml.g5.4xlarge, ml.g5.8xlarge, ml.g5.12xlarge, ml.g5.16xlarge, ml.g5.24xlarge, ml.g5.48xlarge, ml.p4d.24xlarge, ml.c7g.large, ml.c7g.xlarge, ml.c7g.2xlarge, ml.c7g.4xlarge, ml.c7g.8xlarge, ml.c7g.12xlarge, ml.c7g.16xlarge, ml.m6g.large, ml.m6g.xlarge, ml.m6g.2xlarge, ml.m6g.4xlarge, ml.m6g.8xlarge, ml.m6g.12xlarge, ml.m6g.16xlarge, ml.m6gd.large, ml.m6gd.xlarge, ml.m6gd.2xlarge, ml.m6gd.4xlarge, ml.m6gd.8xlarge, ml.m6gd.12xlarge, ml.m6gd.16xlarge, ml.c6g.large, ml.c6g.xlarge, ml.c6g.2xlarge, ml.c6g.4xlarge, ml.c6g.8xlarge, ml.c6g.12xlarge, ml.c6g.16xlarge, ml.c6gd.large, ml.c6gd.xlarge, ml.c6gd.2xlarge, ml.c6gd.4xlarge, ml.c6gd.8xlarge, ml.c6gd.12xlarge, ml.c6gd.16xlarge, ml.c6gn.large, ml.c6gn.xlarge, ml.c6gn.2xlarge, ml.c6gn.4xlarge, ml.c6gn.8xlarge, 
ml.c6gn.12xlarge, ml.c6gn.16xlarge, ml.r6g.large, ml.r6g.xlarge, ml.r6g.2xlarge, ml.r6g.4xlarge, ml.r6g.8xlarge, ml.r6g.12xlarge, ml.r6g.16xlarge, ml.r6gd.large, ml.r6gd.xlarge, ml.r6gd.2xlarge, ml.r6gd.4xlarge, ml.r6gd.8xlarge, ml.r6gd.12xlarge, ml.r6gd.16xlarge, ml.p4de.24xlarge, ml.trn1.2xlarge, ml.trn1.32xlarge, ml.inf2.xlarge, ml.inf2.8xlarge, ml.inf2.24xlarge, ml.inf2.48xlarge
|
4451
4463
|
# inference_specification_name: "InferenceSpecificationName",
|
4452
4464
|
# environment_parameter_ranges: {
|
4453
4465
|
# categorical_parameter_ranges: [
|
@@ -4457,6 +4469,11 @@ module Aws::SageMaker
|
|
4457
4469
|
# },
|
4458
4470
|
# ],
|
4459
4471
|
# },
|
4472
|
+
# serverless_config: {
|
4473
|
+
# memory_size_in_mb: 1, # required
|
4474
|
+
# max_concurrency: 1, # required
|
4475
|
+
# provisioned_concurrency: 1,
|
4476
|
+
# },
|
4460
4477
|
# },
|
4461
4478
|
# ],
|
4462
4479
|
# volume_kms_key_id: "KmsKeyId",
|
@@ -4472,6 +4489,7 @@ module Aws::SageMaker
|
|
4472
4489
|
# nearest_model_name: "String",
|
4473
4490
|
# supported_instance_types: ["String"],
|
4474
4491
|
# data_input_config: "RecommendationJobDataInputConfig",
|
4492
|
+
# supported_endpoint_type: "RealTime", # accepts RealTime, Serverless
|
4475
4493
|
# },
|
4476
4494
|
# endpoints: [
|
4477
4495
|
# {
|
@@ -11078,7 +11096,7 @@ module Aws::SageMaker
|
|
11078
11096
|
# resp.data_capture_config.current_sampling_percentage #=> Integer
|
11079
11097
|
# resp.data_capture_config.destination_s3_uri #=> String
|
11080
11098
|
# resp.data_capture_config.kms_key_id #=> String
|
11081
|
-
# resp.endpoint_status #=> String, one of "OutOfService", "Creating", "Updating", "SystemUpdating", "RollingBack", "InService", "Deleting", "Failed"
|
11099
|
+
# resp.endpoint_status #=> String, one of "OutOfService", "Creating", "Updating", "SystemUpdating", "RollingBack", "InService", "Deleting", "Failed", "UpdateRollbackFailed"
|
11082
11100
|
# resp.failure_reason #=> String
|
11083
11101
|
# resp.creation_time #=> Time
|
11084
11102
|
# resp.last_modified_time #=> Time
|
@@ -11092,6 +11110,12 @@ module Aws::SageMaker
|
|
11092
11110
|
# resp.last_deployment_config.blue_green_update_policy.maximum_execution_timeout_in_seconds #=> Integer
|
11093
11111
|
# resp.last_deployment_config.auto_rollback_configuration.alarms #=> Array
|
11094
11112
|
# resp.last_deployment_config.auto_rollback_configuration.alarms[0].alarm_name #=> String
|
11113
|
+
# resp.last_deployment_config.rolling_update_policy.maximum_batch_size.type #=> String, one of "INSTANCE_COUNT", "CAPACITY_PERCENT"
|
11114
|
+
# resp.last_deployment_config.rolling_update_policy.maximum_batch_size.value #=> Integer
|
11115
|
+
# resp.last_deployment_config.rolling_update_policy.wait_interval_in_seconds #=> Integer
|
11116
|
+
# resp.last_deployment_config.rolling_update_policy.maximum_execution_timeout_in_seconds #=> Integer
|
11117
|
+
# resp.last_deployment_config.rolling_update_policy.rollback_maximum_batch_size.type #=> String, one of "INSTANCE_COUNT", "CAPACITY_PERCENT"
|
11118
|
+
# resp.last_deployment_config.rolling_update_policy.rollback_maximum_batch_size.value #=> Integer
|
11095
11119
|
# resp.async_inference_config.client_config.max_concurrent_invocations_per_instance #=> Integer
|
11096
11120
|
# resp.async_inference_config.output_config.kms_key_id #=> String
|
11097
11121
|
# resp.async_inference_config.output_config.s3_output_path #=> String
|
@@ -12190,7 +12214,7 @@ module Aws::SageMaker
|
|
12190
12214
|
# resp.role_arn #=> String
|
12191
12215
|
# resp.endpoint_metadata.endpoint_name #=> String
|
12192
12216
|
# resp.endpoint_metadata.endpoint_config_name #=> String
|
12193
|
-
# resp.endpoint_metadata.endpoint_status #=> String, one of "OutOfService", "Creating", "Updating", "SystemUpdating", "RollingBack", "InService", "Deleting", "Failed"
|
12217
|
+
# resp.endpoint_metadata.endpoint_status #=> String, one of "OutOfService", "Creating", "Updating", "SystemUpdating", "RollingBack", "InService", "Deleting", "Failed", "UpdateRollbackFailed"
|
12194
12218
|
# resp.endpoint_metadata.failure_reason #=> String
|
12195
12219
|
# resp.model_variants #=> Array
|
12196
12220
|
# resp.model_variants[0].model_name #=> String
|
@@ -12278,6 +12302,9 @@ module Aws::SageMaker
|
|
12278
12302
|
# resp.input_config.endpoint_configurations[0].environment_parameter_ranges.categorical_parameter_ranges[0].name #=> String
|
12279
12303
|
# resp.input_config.endpoint_configurations[0].environment_parameter_ranges.categorical_parameter_ranges[0].value #=> Array
|
12280
12304
|
# resp.input_config.endpoint_configurations[0].environment_parameter_ranges.categorical_parameter_ranges[0].value[0] #=> String
|
12305
|
+
# resp.input_config.endpoint_configurations[0].serverless_config.memory_size_in_mb #=> Integer
|
12306
|
+
# resp.input_config.endpoint_configurations[0].serverless_config.max_concurrency #=> Integer
|
12307
|
+
# resp.input_config.endpoint_configurations[0].serverless_config.provisioned_concurrency #=> Integer
|
12281
12308
|
# resp.input_config.volume_kms_key_id #=> String
|
12282
12309
|
# resp.input_config.container_config.domain #=> String
|
12283
12310
|
# resp.input_config.container_config.task #=> String
|
@@ -12290,6 +12317,7 @@ module Aws::SageMaker
|
|
12290
12317
|
# resp.input_config.container_config.supported_instance_types #=> Array
|
12291
12318
|
# resp.input_config.container_config.supported_instance_types[0] #=> String
|
12292
12319
|
# resp.input_config.container_config.data_input_config #=> String
|
12320
|
+
# resp.input_config.container_config.supported_endpoint_type #=> String, one of "RealTime", "Serverless"
|
12293
12321
|
# resp.input_config.endpoints #=> Array
|
12294
12322
|
# resp.input_config.endpoints[0].endpoint_name #=> String
|
12295
12323
|
# resp.input_config.vpc_config.security_group_ids #=> Array
|
@@ -12308,10 +12336,14 @@ module Aws::SageMaker
|
|
12308
12336
|
# resp.inference_recommendations[0].metrics.model_latency #=> Integer
|
12309
12337
|
# resp.inference_recommendations[0].metrics.cpu_utilization #=> Float
|
12310
12338
|
# resp.inference_recommendations[0].metrics.memory_utilization #=> Float
|
12339
|
+
# resp.inference_recommendations[0].metrics.model_setup_time #=> Integer
|
12311
12340
|
# resp.inference_recommendations[0].endpoint_configuration.endpoint_name #=> String
|
12312
12341
|
# resp.inference_recommendations[0].endpoint_configuration.variant_name #=> String
|
12313
12342
|
# resp.inference_recommendations[0].endpoint_configuration.instance_type #=> String, one of "ml.t2.medium", "ml.t2.large", "ml.t2.xlarge", "ml.t2.2xlarge", "ml.m4.xlarge", "ml.m4.2xlarge", "ml.m4.4xlarge", "ml.m4.10xlarge", "ml.m4.16xlarge", "ml.m5.large", "ml.m5.xlarge", "ml.m5.2xlarge", "ml.m5.4xlarge", "ml.m5.12xlarge", "ml.m5.24xlarge", "ml.m5d.large", "ml.m5d.xlarge", "ml.m5d.2xlarge", "ml.m5d.4xlarge", "ml.m5d.12xlarge", "ml.m5d.24xlarge", "ml.c4.large", "ml.c4.xlarge", "ml.c4.2xlarge", "ml.c4.4xlarge", "ml.c4.8xlarge", "ml.p2.xlarge", "ml.p2.8xlarge", "ml.p2.16xlarge", "ml.p3.2xlarge", "ml.p3.8xlarge", "ml.p3.16xlarge", "ml.c5.large", "ml.c5.xlarge", "ml.c5.2xlarge", "ml.c5.4xlarge", "ml.c5.9xlarge", "ml.c5.18xlarge", "ml.c5d.large", "ml.c5d.xlarge", "ml.c5d.2xlarge", "ml.c5d.4xlarge", "ml.c5d.9xlarge", "ml.c5d.18xlarge", "ml.g4dn.xlarge", "ml.g4dn.2xlarge", "ml.g4dn.4xlarge", "ml.g4dn.8xlarge", "ml.g4dn.12xlarge", "ml.g4dn.16xlarge", "ml.r5.large", "ml.r5.xlarge", "ml.r5.2xlarge", "ml.r5.4xlarge", "ml.r5.12xlarge", "ml.r5.24xlarge", "ml.r5d.large", "ml.r5d.xlarge", "ml.r5d.2xlarge", "ml.r5d.4xlarge", "ml.r5d.12xlarge", "ml.r5d.24xlarge", "ml.inf1.xlarge", "ml.inf1.2xlarge", "ml.inf1.6xlarge", "ml.inf1.24xlarge", "ml.c6i.large", "ml.c6i.xlarge", "ml.c6i.2xlarge", "ml.c6i.4xlarge", "ml.c6i.8xlarge", "ml.c6i.12xlarge", "ml.c6i.16xlarge", "ml.c6i.24xlarge", "ml.c6i.32xlarge", "ml.g5.xlarge", "ml.g5.2xlarge", "ml.g5.4xlarge", "ml.g5.8xlarge", "ml.g5.12xlarge", "ml.g5.16xlarge", "ml.g5.24xlarge", "ml.g5.48xlarge", "ml.p4d.24xlarge", "ml.c7g.large", "ml.c7g.xlarge", "ml.c7g.2xlarge", "ml.c7g.4xlarge", "ml.c7g.8xlarge", "ml.c7g.12xlarge", "ml.c7g.16xlarge", "ml.m6g.large", "ml.m6g.xlarge", "ml.m6g.2xlarge", "ml.m6g.4xlarge", "ml.m6g.8xlarge", "ml.m6g.12xlarge", "ml.m6g.16xlarge", "ml.m6gd.large", "ml.m6gd.xlarge", "ml.m6gd.2xlarge", "ml.m6gd.4xlarge", "ml.m6gd.8xlarge", "ml.m6gd.12xlarge", "ml.m6gd.16xlarge", "ml.c6g.large", "ml.c6g.xlarge", "ml.c6g.2xlarge", 
"ml.c6g.4xlarge", "ml.c6g.8xlarge", "ml.c6g.12xlarge", "ml.c6g.16xlarge", "ml.c6gd.large", "ml.c6gd.xlarge", "ml.c6gd.2xlarge", "ml.c6gd.4xlarge", "ml.c6gd.8xlarge", "ml.c6gd.12xlarge", "ml.c6gd.16xlarge", "ml.c6gn.large", "ml.c6gn.xlarge", "ml.c6gn.2xlarge", "ml.c6gn.4xlarge", "ml.c6gn.8xlarge", "ml.c6gn.12xlarge", "ml.c6gn.16xlarge", "ml.r6g.large", "ml.r6g.xlarge", "ml.r6g.2xlarge", "ml.r6g.4xlarge", "ml.r6g.8xlarge", "ml.r6g.12xlarge", "ml.r6g.16xlarge", "ml.r6gd.large", "ml.r6gd.xlarge", "ml.r6gd.2xlarge", "ml.r6gd.4xlarge", "ml.r6gd.8xlarge", "ml.r6gd.12xlarge", "ml.r6gd.16xlarge", "ml.p4de.24xlarge", "ml.trn1.2xlarge", "ml.trn1.32xlarge", "ml.inf2.xlarge", "ml.inf2.8xlarge", "ml.inf2.24xlarge", "ml.inf2.48xlarge"
|
12314
12343
|
# resp.inference_recommendations[0].endpoint_configuration.initial_instance_count #=> Integer
|
12344
|
+
# resp.inference_recommendations[0].endpoint_configuration.serverless_config.memory_size_in_mb #=> Integer
|
12345
|
+
# resp.inference_recommendations[0].endpoint_configuration.serverless_config.max_concurrency #=> Integer
|
12346
|
+
# resp.inference_recommendations[0].endpoint_configuration.serverless_config.provisioned_concurrency #=> Integer
|
12315
12347
|
# resp.inference_recommendations[0].model_configuration.inference_specification_name #=> String
|
12316
12348
|
# resp.inference_recommendations[0].model_configuration.environment_parameters #=> Array
|
12317
12349
|
# resp.inference_recommendations[0].model_configuration.environment_parameters[0].key #=> String
|
@@ -16402,7 +16434,7 @@ module Aws::SageMaker
|
|
16402
16434
|
# creation_time_after: Time.now,
|
16403
16435
|
# last_modified_time_before: Time.now,
|
16404
16436
|
# last_modified_time_after: Time.now,
|
16405
|
-
# status_equals: "OutOfService", # accepts OutOfService, Creating, Updating, SystemUpdating, RollingBack, InService, Deleting, Failed
|
16437
|
+
# status_equals: "OutOfService", # accepts OutOfService, Creating, Updating, SystemUpdating, RollingBack, InService, Deleting, Failed, UpdateRollbackFailed
|
16406
16438
|
# })
|
16407
16439
|
#
|
16408
16440
|
# @example Response structure
|
@@ -16412,7 +16444,7 @@ module Aws::SageMaker
|
|
16412
16444
|
# resp.endpoints[0].endpoint_arn #=> String
|
16413
16445
|
# resp.endpoints[0].creation_time #=> Time
|
16414
16446
|
# resp.endpoints[0].last_modified_time #=> Time
|
16415
|
-
# resp.endpoints[0].endpoint_status #=> String, one of "OutOfService", "Creating", "Updating", "SystemUpdating", "RollingBack", "InService", "Deleting", "Failed"
|
16447
|
+
# resp.endpoints[0].endpoint_status #=> String, one of "OutOfService", "Creating", "Updating", "SystemUpdating", "RollingBack", "InService", "Deleting", "Failed", "UpdateRollbackFailed"
|
16416
16448
|
# resp.next_token #=> String
|
16417
16449
|
#
|
16418
16450
|
# @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/ListEndpoints AWS API Documentation
|
@@ -17342,10 +17374,14 @@ module Aws::SageMaker
|
|
17342
17374
|
# resp.steps[0].inference_benchmark.metrics.model_latency #=> Integer
|
17343
17375
|
# resp.steps[0].inference_benchmark.metrics.cpu_utilization #=> Float
|
17344
17376
|
# resp.steps[0].inference_benchmark.metrics.memory_utilization #=> Float
|
17377
|
+
# resp.steps[0].inference_benchmark.metrics.model_setup_time #=> Integer
|
17345
17378
|
# resp.steps[0].inference_benchmark.endpoint_configuration.endpoint_name #=> String
|
17346
17379
|
# resp.steps[0].inference_benchmark.endpoint_configuration.variant_name #=> String
|
17347
17380
|
# resp.steps[0].inference_benchmark.endpoint_configuration.instance_type #=> String, one of "ml.t2.medium", "ml.t2.large", "ml.t2.xlarge", "ml.t2.2xlarge", "ml.m4.xlarge", "ml.m4.2xlarge", "ml.m4.4xlarge", "ml.m4.10xlarge", "ml.m4.16xlarge", "ml.m5.large", "ml.m5.xlarge", "ml.m5.2xlarge", "ml.m5.4xlarge", "ml.m5.12xlarge", "ml.m5.24xlarge", "ml.m5d.large", "ml.m5d.xlarge", "ml.m5d.2xlarge", "ml.m5d.4xlarge", "ml.m5d.12xlarge", "ml.m5d.24xlarge", "ml.c4.large", "ml.c4.xlarge", "ml.c4.2xlarge", "ml.c4.4xlarge", "ml.c4.8xlarge", "ml.p2.xlarge", "ml.p2.8xlarge", "ml.p2.16xlarge", "ml.p3.2xlarge", "ml.p3.8xlarge", "ml.p3.16xlarge", "ml.c5.large", "ml.c5.xlarge", "ml.c5.2xlarge", "ml.c5.4xlarge", "ml.c5.9xlarge", "ml.c5.18xlarge", "ml.c5d.large", "ml.c5d.xlarge", "ml.c5d.2xlarge", "ml.c5d.4xlarge", "ml.c5d.9xlarge", "ml.c5d.18xlarge", "ml.g4dn.xlarge", "ml.g4dn.2xlarge", "ml.g4dn.4xlarge", "ml.g4dn.8xlarge", "ml.g4dn.12xlarge", "ml.g4dn.16xlarge", "ml.r5.large", "ml.r5.xlarge", "ml.r5.2xlarge", "ml.r5.4xlarge", "ml.r5.12xlarge", "ml.r5.24xlarge", "ml.r5d.large", "ml.r5d.xlarge", "ml.r5d.2xlarge", "ml.r5d.4xlarge", "ml.r5d.12xlarge", "ml.r5d.24xlarge", "ml.inf1.xlarge", "ml.inf1.2xlarge", "ml.inf1.6xlarge", "ml.inf1.24xlarge", "ml.c6i.large", "ml.c6i.xlarge", "ml.c6i.2xlarge", "ml.c6i.4xlarge", "ml.c6i.8xlarge", "ml.c6i.12xlarge", "ml.c6i.16xlarge", "ml.c6i.24xlarge", "ml.c6i.32xlarge", "ml.g5.xlarge", "ml.g5.2xlarge", "ml.g5.4xlarge", "ml.g5.8xlarge", "ml.g5.12xlarge", "ml.g5.16xlarge", "ml.g5.24xlarge", "ml.g5.48xlarge", "ml.p4d.24xlarge", "ml.c7g.large", "ml.c7g.xlarge", "ml.c7g.2xlarge", "ml.c7g.4xlarge", "ml.c7g.8xlarge", "ml.c7g.12xlarge", "ml.c7g.16xlarge", "ml.m6g.large", "ml.m6g.xlarge", "ml.m6g.2xlarge", "ml.m6g.4xlarge", "ml.m6g.8xlarge", "ml.m6g.12xlarge", "ml.m6g.16xlarge", "ml.m6gd.large", "ml.m6gd.xlarge", "ml.m6gd.2xlarge", "ml.m6gd.4xlarge", "ml.m6gd.8xlarge", "ml.m6gd.12xlarge", "ml.m6gd.16xlarge", "ml.c6g.large", "ml.c6g.xlarge", "ml.c6g.2xlarge", 
"ml.c6g.4xlarge", "ml.c6g.8xlarge", "ml.c6g.12xlarge", "ml.c6g.16xlarge", "ml.c6gd.large", "ml.c6gd.xlarge", "ml.c6gd.2xlarge", "ml.c6gd.4xlarge", "ml.c6gd.8xlarge", "ml.c6gd.12xlarge", "ml.c6gd.16xlarge", "ml.c6gn.large", "ml.c6gn.xlarge", "ml.c6gn.2xlarge", "ml.c6gn.4xlarge", "ml.c6gn.8xlarge", "ml.c6gn.12xlarge", "ml.c6gn.16xlarge", "ml.r6g.large", "ml.r6g.xlarge", "ml.r6g.2xlarge", "ml.r6g.4xlarge", "ml.r6g.8xlarge", "ml.r6g.12xlarge", "ml.r6g.16xlarge", "ml.r6gd.large", "ml.r6gd.xlarge", "ml.r6gd.2xlarge", "ml.r6gd.4xlarge", "ml.r6gd.8xlarge", "ml.r6gd.12xlarge", "ml.r6gd.16xlarge", "ml.p4de.24xlarge", "ml.trn1.2xlarge", "ml.trn1.32xlarge", "ml.inf2.xlarge", "ml.inf2.8xlarge", "ml.inf2.24xlarge", "ml.inf2.48xlarge"
|
17348
17381
|
# resp.steps[0].inference_benchmark.endpoint_configuration.initial_instance_count #=> Integer
|
17382
|
+
# resp.steps[0].inference_benchmark.endpoint_configuration.serverless_config.memory_size_in_mb #=> Integer
|
17383
|
+
# resp.steps[0].inference_benchmark.endpoint_configuration.serverless_config.max_concurrency #=> Integer
|
17384
|
+
# resp.steps[0].inference_benchmark.endpoint_configuration.serverless_config.provisioned_concurrency #=> Integer
|
17349
17385
|
# resp.steps[0].inference_benchmark.model_configuration.inference_specification_name #=> String
|
17350
17386
|
# resp.steps[0].inference_benchmark.model_configuration.environment_parameters #=> Array
|
17351
17387
|
# resp.steps[0].inference_benchmark.model_configuration.environment_parameters[0].key #=> String
|
@@ -21994,7 +22030,7 @@ module Aws::SageMaker
|
|
21994
22030
|
# },
|
21995
22031
|
# ],
|
21996
22032
|
# deployment_config: {
|
21997
|
-
# blue_green_update_policy: {
|
22033
|
+
# blue_green_update_policy: {
|
21998
22034
|
# traffic_routing_configuration: { # required
|
21999
22035
|
# type: "ALL_AT_ONCE", # required, accepts ALL_AT_ONCE, CANARY, LINEAR
|
22000
22036
|
# wait_interval_in_seconds: 1, # required
|
@@ -22017,6 +22053,18 @@ module Aws::SageMaker
|
|
22017
22053
|
# },
|
22018
22054
|
# ],
|
22019
22055
|
# },
|
22056
|
+
# rolling_update_policy: {
|
22057
|
+
# maximum_batch_size: { # required
|
22058
|
+
# type: "INSTANCE_COUNT", # required, accepts INSTANCE_COUNT, CAPACITY_PERCENT
|
22059
|
+
# value: 1, # required
|
22060
|
+
# },
|
22061
|
+
# wait_interval_in_seconds: 1, # required
|
22062
|
+
# maximum_execution_timeout_in_seconds: 1,
|
22063
|
+
# rollback_maximum_batch_size: {
|
22064
|
+
# type: "INSTANCE_COUNT", # required, accepts INSTANCE_COUNT, CAPACITY_PERCENT
|
22065
|
+
# value: 1, # required
|
22066
|
+
# },
|
22067
|
+
# },
|
22020
22068
|
# },
|
22021
22069
|
# retain_deployment_config: false,
|
22022
22070
|
# })
|
@@ -23818,7 +23866,7 @@ module Aws::SageMaker
|
|
23818
23866
|
params: params,
|
23819
23867
|
config: config)
|
23820
23868
|
context[:gem_name] = 'aws-sdk-sagemaker'
|
23821
|
-
context[:gem_version] = '1.192.0'
|
23869
|
+
context[:gem_version] = '1.194.0'
|
23822
23870
|
Seahorse::Client::Request.new(handlers, context)
|
23823
23871
|
end
|
23824
23872
|
|
@@ -963,6 +963,7 @@ module Aws::SageMaker
|
|
963
963
|
InferenceRecommendationsJobs = Shapes::ListShape.new(name: 'InferenceRecommendationsJobs')
|
964
964
|
InferenceSpecification = Shapes::StructureShape.new(name: 'InferenceSpecification')
|
965
965
|
InferenceSpecificationName = Shapes::StringShape.new(name: 'InferenceSpecificationName')
|
966
|
+
InitialInstanceCount = Shapes::IntegerShape.new(name: 'InitialInstanceCount')
|
966
967
|
InitialNumberOfUsers = Shapes::IntegerShape.new(name: 'InitialNumberOfUsers')
|
967
968
|
InitialTaskCount = Shapes::IntegerShape.new(name: 'InitialTaskCount')
|
968
969
|
InputConfig = Shapes::StructureShape.new(name: 'InputConfig')
|
@@ -1322,6 +1323,7 @@ module Aws::SageMaker
|
|
1322
1323
|
ModelQualityBaselineConfig = Shapes::StructureShape.new(name: 'ModelQualityBaselineConfig')
|
1323
1324
|
ModelQualityJobInput = Shapes::StructureShape.new(name: 'ModelQualityJobInput')
|
1324
1325
|
ModelRegisterSettings = Shapes::StructureShape.new(name: 'ModelRegisterSettings')
|
1326
|
+
ModelSetupTime = Shapes::IntegerShape.new(name: 'ModelSetupTime')
|
1325
1327
|
ModelSortKey = Shapes::StringShape.new(name: 'ModelSortKey')
|
1326
1328
|
ModelStepMetadata = Shapes::StructureShape.new(name: 'ModelStepMetadata')
|
1327
1329
|
ModelSummary = Shapes::StructureShape.new(name: 'ModelSummary')
|
@@ -1616,6 +1618,7 @@ module Aws::SageMaker
|
|
1616
1618
|
RecommendationJobStatus = Shapes::StringShape.new(name: 'RecommendationJobStatus')
|
1617
1619
|
RecommendationJobStoppingConditions = Shapes::StructureShape.new(name: 'RecommendationJobStoppingConditions')
|
1618
1620
|
RecommendationJobSupportedContentTypes = Shapes::ListShape.new(name: 'RecommendationJobSupportedContentTypes')
|
1621
|
+
RecommendationJobSupportedEndpointType = Shapes::StringShape.new(name: 'RecommendationJobSupportedEndpointType')
|
1619
1622
|
RecommendationJobSupportedInstanceTypes = Shapes::ListShape.new(name: 'RecommendationJobSupportedInstanceTypes')
|
1620
1623
|
RecommendationJobType = Shapes::StringShape.new(name: 'RecommendationJobType')
|
1621
1624
|
RecommendationJobVpcConfig = Shapes::StructureShape.new(name: 'RecommendationJobVpcConfig')
|
@@ -1668,6 +1671,7 @@ module Aws::SageMaker
|
|
1668
1671
|
RetryPipelineExecutionResponse = Shapes::StructureShape.new(name: 'RetryPipelineExecutionResponse')
|
1669
1672
|
RetryStrategy = Shapes::StructureShape.new(name: 'RetryStrategy')
|
1670
1673
|
RoleArn = Shapes::StringShape.new(name: 'RoleArn')
|
1674
|
+
RollingUpdatePolicy = Shapes::StructureShape.new(name: 'RollingUpdatePolicy')
|
1671
1675
|
RootAccess = Shapes::StringShape.new(name: 'RootAccess')
|
1672
1676
|
RuleConfigurationName = Shapes::StringShape.new(name: 'RuleConfigurationName')
|
1673
1677
|
RuleEvaluationStatus = Shapes::StringShape.new(name: 'RuleEvaluationStatus')
|
@@ -3666,8 +3670,9 @@ module Aws::SageMaker
|
|
3666
3670
|
|
3667
3671
|
DeployedImages.member = Shapes::ShapeRef.new(shape: DeployedImage)
|
3668
3672
|
|
3669
|
-
DeploymentConfig.add_member(:blue_green_update_policy, Shapes::ShapeRef.new(shape: BlueGreenUpdatePolicy,
|
3673
|
+
DeploymentConfig.add_member(:blue_green_update_policy, Shapes::ShapeRef.new(shape: BlueGreenUpdatePolicy, location_name: "BlueGreenUpdatePolicy"))
|
3670
3674
|
DeploymentConfig.add_member(:auto_rollback_configuration, Shapes::ShapeRef.new(shape: AutoRollbackConfig, location_name: "AutoRollbackConfiguration"))
|
3675
|
+
DeploymentConfig.add_member(:rolling_update_policy, Shapes::ShapeRef.new(shape: RollingUpdatePolicy, location_name: "RollingUpdatePolicy"))
|
3671
3676
|
DeploymentConfig.struct_class = Types::DeploymentConfig
|
3672
3677
|
|
3673
3678
|
DeploymentRecommendation.add_member(:recommendation_status, Shapes::ShapeRef.new(shape: RecommendationStatus, required: true, location_name: "RecommendationStatus"))
|
@@ -4966,9 +4971,10 @@ module Aws::SageMaker
|
|
4966
4971
|
EndpointInput.add_member(:end_time_offset, Shapes::ShapeRef.new(shape: MonitoringTimeOffsetString, location_name: "EndTimeOffset"))
|
4967
4972
|
EndpointInput.struct_class = Types::EndpointInput
|
4968
4973
|
|
4969
|
-
EndpointInputConfiguration.add_member(:instance_type, Shapes::ShapeRef.new(shape: ProductionVariantInstanceType,
|
4974
|
+
EndpointInputConfiguration.add_member(:instance_type, Shapes::ShapeRef.new(shape: ProductionVariantInstanceType, location_name: "InstanceType"))
|
4970
4975
|
EndpointInputConfiguration.add_member(:inference_specification_name, Shapes::ShapeRef.new(shape: InferenceSpecificationName, location_name: "InferenceSpecificationName"))
|
4971
4976
|
EndpointInputConfiguration.add_member(:environment_parameter_ranges, Shapes::ShapeRef.new(shape: EnvironmentParameterRanges, location_name: "EnvironmentParameterRanges"))
|
4977
|
+
EndpointInputConfiguration.add_member(:serverless_config, Shapes::ShapeRef.new(shape: ProductionVariantServerlessConfig, location_name: "ServerlessConfig"))
|
4972
4978
|
EndpointInputConfiguration.struct_class = Types::EndpointInputConfiguration
|
4973
4979
|
|
4974
4980
|
EndpointInputConfigurations.member = Shapes::ShapeRef.new(shape: EndpointInputConfiguration)
|
@@ -4981,8 +4987,9 @@ module Aws::SageMaker
|
|
4981
4987
|
|
4982
4988
|
EndpointOutputConfiguration.add_member(:endpoint_name, Shapes::ShapeRef.new(shape: String, required: true, location_name: "EndpointName"))
|
4983
4989
|
EndpointOutputConfiguration.add_member(:variant_name, Shapes::ShapeRef.new(shape: String, required: true, location_name: "VariantName"))
|
4984
|
-
EndpointOutputConfiguration.add_member(:instance_type, Shapes::ShapeRef.new(shape: ProductionVariantInstanceType,
|
4985
|
-
EndpointOutputConfiguration.add_member(:initial_instance_count, Shapes::ShapeRef.new(shape:
|
4990
|
+
EndpointOutputConfiguration.add_member(:instance_type, Shapes::ShapeRef.new(shape: ProductionVariantInstanceType, location_name: "InstanceType"))
|
4991
|
+
EndpointOutputConfiguration.add_member(:initial_instance_count, Shapes::ShapeRef.new(shape: InitialInstanceCount, location_name: "InitialInstanceCount"))
|
4992
|
+
EndpointOutputConfiguration.add_member(:serverless_config, Shapes::ShapeRef.new(shape: ProductionVariantServerlessConfig, location_name: "ServerlessConfig"))
|
4986
4993
|
EndpointOutputConfiguration.struct_class = Types::EndpointOutputConfiguration
|
4987
4994
|
|
4988
4995
|
EndpointPerformance.add_member(:metrics, Shapes::ShapeRef.new(shape: InferenceMetrics, required: true, location_name: "Metrics"))
|
@@ -7865,6 +7872,7 @@ module Aws::SageMaker
|
|
7865
7872
|
RecommendationJobContainerConfig.add_member(:nearest_model_name, Shapes::ShapeRef.new(shape: String, location_name: "NearestModelName"))
|
7866
7873
|
RecommendationJobContainerConfig.add_member(:supported_instance_types, Shapes::ShapeRef.new(shape: RecommendationJobSupportedInstanceTypes, location_name: "SupportedInstanceTypes"))
|
7867
7874
|
RecommendationJobContainerConfig.add_member(:data_input_config, Shapes::ShapeRef.new(shape: RecommendationJobDataInputConfig, location_name: "DataInputConfig"))
|
7875
|
+
RecommendationJobContainerConfig.add_member(:supported_endpoint_type, Shapes::ShapeRef.new(shape: RecommendationJobSupportedEndpointType, location_name: "SupportedEndpointType"))
|
7868
7876
|
RecommendationJobContainerConfig.struct_class = Types::RecommendationJobContainerConfig
|
7869
7877
|
|
7870
7878
|
RecommendationJobInferenceBenchmark.add_member(:metrics, Shapes::ShapeRef.new(shape: RecommendationMetrics, location_name: "Metrics"))
|
@@ -7922,6 +7930,7 @@ module Aws::SageMaker
|
|
7922
7930
|
RecommendationMetrics.add_member(:model_latency, Shapes::ShapeRef.new(shape: Integer, required: true, location_name: "ModelLatency"))
|
7923
7931
|
RecommendationMetrics.add_member(:cpu_utilization, Shapes::ShapeRef.new(shape: UtilizationMetric, location_name: "CpuUtilization"))
|
7924
7932
|
RecommendationMetrics.add_member(:memory_utilization, Shapes::ShapeRef.new(shape: UtilizationMetric, location_name: "MemoryUtilization"))
|
7933
|
+
RecommendationMetrics.add_member(:model_setup_time, Shapes::ShapeRef.new(shape: ModelSetupTime, location_name: "ModelSetupTime"))
|
7925
7934
|
RecommendationMetrics.struct_class = Types::RecommendationMetrics
|
7926
7935
|
|
7927
7936
|
RedshiftDatasetDefinition.add_member(:cluster_id, Shapes::ShapeRef.new(shape: RedshiftClusterId, required: true, location_name: "ClusterId"))
|
@@ -8017,6 +8026,12 @@ module Aws::SageMaker
|
|
8017
8026
|
RetryStrategy.add_member(:maximum_retry_attempts, Shapes::ShapeRef.new(shape: MaximumRetryAttempts, required: true, location_name: "MaximumRetryAttempts"))
|
8018
8027
|
RetryStrategy.struct_class = Types::RetryStrategy
|
8019
8028
|
|
8029
|
+
RollingUpdatePolicy.add_member(:maximum_batch_size, Shapes::ShapeRef.new(shape: CapacitySize, required: true, location_name: "MaximumBatchSize"))
|
8030
|
+
RollingUpdatePolicy.add_member(:wait_interval_in_seconds, Shapes::ShapeRef.new(shape: WaitIntervalInSeconds, required: true, location_name: "WaitIntervalInSeconds"))
|
8031
|
+
RollingUpdatePolicy.add_member(:maximum_execution_timeout_in_seconds, Shapes::ShapeRef.new(shape: MaximumExecutionTimeoutInSeconds, location_name: "MaximumExecutionTimeoutInSeconds"))
|
8032
|
+
RollingUpdatePolicy.add_member(:rollback_maximum_batch_size, Shapes::ShapeRef.new(shape: CapacitySize, location_name: "RollbackMaximumBatchSize"))
|
8033
|
+
RollingUpdatePolicy.struct_class = Types::RollingUpdatePolicy
|
8034
|
+
|
8020
8035
|
RuleParameters.key = Shapes::ShapeRef.new(shape: ConfigKey)
|
8021
8036
|
RuleParameters.value = Shapes::ShapeRef.new(shape: ConfigValue)
|
8022
8037
|
|
@@ -2415,6 +2415,12 @@ module Aws::SageMaker
|
|
2415
2415
|
# @!attribute [rw] time_series_forecasting_job_config
|
2416
2416
|
# Settings used to configure an AutoML job V2 for a time-series
|
2417
2417
|
# forecasting problem type.
|
2418
|
+
#
|
2419
|
+
# <note markdown="1"> The `TimeSeriesForecastingJobConfig` problem type is only available
|
2420
|
+
# in private beta. Contact Amazon Web Services Support or your account
|
2421
|
+
# manager to learn more about access privileges.
|
2422
|
+
#
|
2423
|
+
# </note>
|
2418
2424
|
# @return [Types::TimeSeriesForecastingJobConfig]
|
2419
2425
|
#
|
2420
2426
|
# @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/AutoMLProblemTypeConfig AWS API Documentation
|
@@ -3106,7 +3112,15 @@ module Aws::SageMaker
|
|
3106
3112
|
include Aws::Structure
|
3107
3113
|
end
|
3108
3114
|
|
3109
|
-
# Specifies the endpoint capacity to activate for
|
3115
|
+
# Specifies the type and size of the endpoint capacity to activate for a
|
3116
|
+
# blue/green deployment, a rolling deployment, or a rollback strategy.
|
3117
|
+
# You can specify your batches as either instance count or the overall
|
3118
|
+
# percentage of your fleet.
|
3119
|
+
#
|
3120
|
+
# For a rollback strategy, if you don't specify the fields in this
|
3121
|
+
# object, or if you set the `Value` to 100%, then SageMaker uses a
|
3122
|
+
# blue/green rollback strategy and rolls all traffic back to the blue
|
3123
|
+
# fleet.
|
3110
3124
|
#
|
3111
3125
|
# @!attribute [rw] type
|
3112
3126
|
# Specifies the endpoint capacity type.
|
@@ -10194,11 +10208,17 @@ module Aws::SageMaker
|
|
10194
10208
|
# failures and recovery.
|
10195
10209
|
# @return [Types::AutoRollbackConfig]
|
10196
10210
|
#
|
10211
|
+
# @!attribute [rw] rolling_update_policy
|
10212
|
+
# Specifies a rolling deployment strategy for updating a SageMaker
|
10213
|
+
# endpoint.
|
10214
|
+
# @return [Types::RollingUpdatePolicy]
|
10215
|
+
#
|
10197
10216
|
# @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/DeploymentConfig AWS API Documentation
|
10198
10217
|
#
|
10199
10218
|
class DeploymentConfig < Struct.new(
|
10200
10219
|
:blue_green_update_policy,
|
10201
|
-
:auto_rollback_configuration
|
10220
|
+
:auto_rollback_configuration,
|
10221
|
+
:rolling_update_policy)
|
10202
10222
|
SENSITIVE = []
|
10203
10223
|
include Aws::Structure
|
10204
10224
|
end
|
@@ -17115,12 +17135,17 @@ module Aws::SageMaker
|
|
17115
17135
|
# The parameter you want to benchmark against.
|
17116
17136
|
# @return [Types::EnvironmentParameterRanges]
|
17117
17137
|
#
|
17138
|
+
# @!attribute [rw] serverless_config
|
17139
|
+
# Specifies the serverless configuration for an endpoint variant.
|
17140
|
+
# @return [Types::ProductionVariantServerlessConfig]
|
17141
|
+
#
|
17118
17142
|
# @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/EndpointInputConfiguration AWS API Documentation
|
17119
17143
|
#
|
17120
17144
|
class EndpointInputConfiguration < Struct.new(
|
17121
17145
|
:instance_type,
|
17122
17146
|
:inference_specification_name,
|
17123
|
-
:environment_parameter_ranges
|
17147
|
+
:environment_parameter_ranges,
|
17148
|
+
:serverless_config)
|
17124
17149
|
SENSITIVE = []
|
17125
17150
|
include Aws::Structure
|
17126
17151
|
end
|
@@ -17182,13 +17207,18 @@ module Aws::SageMaker
|
|
17182
17207
|
# The number of instances recommended to launch initially.
|
17183
17208
|
# @return [Integer]
|
17184
17209
|
#
|
17210
|
+
# @!attribute [rw] serverless_config
|
17211
|
+
# Specifies the serverless configuration for an endpoint variant.
|
17212
|
+
# @return [Types::ProductionVariantServerlessConfig]
|
17213
|
+
#
|
17185
17214
|
# @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/EndpointOutputConfiguration AWS API Documentation
|
17186
17215
|
#
|
17187
17216
|
class EndpointOutputConfiguration < Struct.new(
|
17188
17217
|
:endpoint_name,
|
17189
17218
|
:variant_name,
|
17190
17219
|
:instance_type,
|
17191
|
-
:initial_instance_count
|
17220
|
+
:initial_instance_count,
|
17221
|
+
:serverless_config)
|
17192
17222
|
SENSITIVE = []
|
17193
17223
|
include Aws::Structure
|
17194
17224
|
end
|
@@ -32870,6 +32900,17 @@ module Aws::SageMaker
|
|
32870
32900
|
# @!attribute [rw] provisioned_concurrency
|
32871
32901
|
# The amount of provisioned concurrency to allocate for the serverless
|
32872
32902
|
# endpoint. Should be less than or equal to `MaxConcurrency`.
|
32903
|
+
#
|
32904
|
+
# <note markdown="1"> This field is not supported for serverless endpoint recommendations
|
32905
|
+
# for Inference Recommender jobs. For more information about creating
|
32906
|
+
# an Inference Recommender job, see
|
32907
|
+
# [CreateInferenceRecommendationsJobs][1].
|
32908
|
+
#
|
32909
|
+
# </note>
|
32910
|
+
#
|
32911
|
+
#
|
32912
|
+
#
|
32913
|
+
# [1]: https://docs.aws.amazon.com/sagemaker/latest/APIReference/API_CreateInferenceRecommendationsJob.html
|
32873
32914
|
# @return [Integer]
|
32874
32915
|
#
|
32875
32916
|
# @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/ProductionVariantServerlessConfig AWS API Documentation
|
@@ -34074,6 +34115,14 @@ module Aws::SageMaker
|
|
34074
34115
|
# [1]: https://docs.aws.amazon.com/sagemaker/latest/APIReference/API_InputConfig.html#sagemaker-Type-InputConfig-DataInputConfig
|
34075
34116
|
# @return [String]
|
34076
34117
|
#
|
34118
|
+
# @!attribute [rw] supported_endpoint_type
|
34119
|
+
# The endpoint type to receive recommendations for. By default this is
|
34120
|
+
# null, and the results of the inference recommendation job return a
|
34121
|
+
# combined list of both real-time and serverless benchmarks. By
|
34122
|
+
# specifying a value for this field, you can receive a longer list of
|
34123
|
+
# benchmarks for the desired endpoint type.
|
34124
|
+
# @return [String]
|
34125
|
+
#
|
34077
34126
|
# @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/RecommendationJobContainerConfig AWS API Documentation
|
34078
34127
|
#
|
34079
34128
|
class RecommendationJobContainerConfig < Struct.new(
|
@@ -34084,7 +34133,8 @@ module Aws::SageMaker
|
|
34084
34133
|
:payload_config,
|
34085
34134
|
:nearest_model_name,
|
34086
34135
|
:supported_instance_types,
|
34087
|
-
:data_input_config
|
34136
|
+
:data_input_config,
|
34137
|
+
:supported_endpoint_type)
|
34088
34138
|
SENSITIVE = []
|
34089
34139
|
include Aws::Structure
|
34090
34140
|
end
|
@@ -34408,6 +34458,14 @@ module Aws::SageMaker
|
|
34408
34458
|
# `NaN` indicates that the value is not available.
|
34409
34459
|
# @return [Float]
|
34410
34460
|
#
|
34461
|
+
# @!attribute [rw] model_setup_time
|
34462
|
+
# The time it takes to launch new compute resources for a serverless
|
34463
|
+
# endpoint. The time can vary depending on the model size, how long it
|
34464
|
+
# takes to download the model, and the start-up time of the container.
|
34465
|
+
#
|
34466
|
+
# `NaN` indicates that the value is not available.
|
34467
|
+
# @return [Integer]
|
34468
|
+
#
|
34411
34469
|
# @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/RecommendationMetrics AWS API Documentation
|
34412
34470
|
#
|
34413
34471
|
class RecommendationMetrics < Struct.new(
|
@@ -34416,7 +34474,8 @@ module Aws::SageMaker
|
|
34416
34474
|
:max_invocations,
|
34417
34475
|
:model_latency,
|
34418
34476
|
:cpu_utilization,
|
34419
|
-
:memory_utilization
|
34477
|
+
:memory_utilization,
|
34478
|
+
:model_setup_time)
|
34420
34479
|
SENSITIVE = []
|
34421
34480
|
include Aws::Structure
|
34422
34481
|
end
|
@@ -34994,6 +35053,54 @@ module Aws::SageMaker
|
|
34994
35053
|
include Aws::Structure
|
34995
35054
|
end
|
34996
35055
|
|
35056
|
+
# Specifies a rolling deployment strategy for updating a SageMaker
|
35057
|
+
# endpoint.
|
35058
|
+
#
|
35059
|
+
# @!attribute [rw] maximum_batch_size
|
35060
|
+
# Specifies the type and size of the endpoint capacity to activate for
|
35061
|
+
# a blue/green deployment, a rolling deployment, or a rollback
|
35062
|
+
# strategy. You can specify your batches as either instance count or
|
35063
|
+
# the overall percentage of your fleet.
|
35064
|
+
#
|
35065
|
+
# For a rollback strategy, if you don't specify the fields in this
|
35066
|
+
# object, or if you set the `Value` to 100%, then SageMaker uses a
|
35067
|
+
# blue/green rollback strategy and rolls all traffic back to the blue
|
35068
|
+
# fleet.
|
35069
|
+
# @return [Types::CapacitySize]
|
35070
|
+
#
|
35071
|
+
# @!attribute [rw] wait_interval_in_seconds
|
35072
|
+
# The length of the baking period, during which SageMaker monitors
|
35073
|
+
# alarms for each batch on the new fleet.
|
35074
|
+
# @return [Integer]
|
35075
|
+
#
|
35076
|
+
# @!attribute [rw] maximum_execution_timeout_in_seconds
|
35077
|
+
# The time limit for the total deployment. Exceeding this limit causes
|
35078
|
+
# a timeout.
|
35079
|
+
# @return [Integer]
|
35080
|
+
#
|
35081
|
+
# @!attribute [rw] rollback_maximum_batch_size
|
35082
|
+
# Specifies the type and size of the endpoint capacity to activate for
|
35083
|
+
# a blue/green deployment, a rolling deployment, or a rollback
|
35084
|
+
# strategy. You can specify your batches as either instance count or
|
35085
|
+
# the overall percentage of your fleet.
|
35086
|
+
#
|
35087
|
+
# For a rollback strategy, if you don't specify the fields in this
|
35088
|
+
# object, or if you set the `Value` to 100%, then SageMaker uses a
|
35089
|
+
# blue/green rollback strategy and rolls all traffic back to the blue
|
35090
|
+
# fleet.
|
35091
|
+
# @return [Types::CapacitySize]
|
35092
|
+
#
|
35093
|
+
# @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/RollingUpdatePolicy AWS API Documentation
|
35094
|
+
#
|
35095
|
+
class RollingUpdatePolicy < Struct.new(
|
35096
|
+
:maximum_batch_size,
|
35097
|
+
:wait_interval_in_seconds,
|
35098
|
+
:maximum_execution_timeout_in_seconds,
|
35099
|
+
:rollback_maximum_batch_size)
|
35100
|
+
SENSITIVE = []
|
35101
|
+
include Aws::Structure
|
35102
|
+
end
|
35103
|
+
|
34997
35104
|
# Describes the S3 data source.
|
34998
35105
|
#
|
34999
35106
|
# Your input bucket must be in the same Amazon Web Services region as
|
data/lib/aws-sdk-sagemaker.rb
CHANGED
metadata
CHANGED
@@ -1,14 +1,14 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: aws-sdk-sagemaker
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 1.
|
4
|
+
version: 1.194.0
|
5
5
|
platform: ruby
|
6
6
|
authors:
|
7
7
|
- Amazon Web Services
|
8
8
|
autorequire:
|
9
9
|
bindir: bin
|
10
10
|
cert_chain: []
|
11
|
-
date: 2023-
|
11
|
+
date: 2023-07-03 00:00:00.000000000 Z
|
12
12
|
dependencies:
|
13
13
|
- !ruby/object:Gem::Dependency
|
14
14
|
name: aws-sdk-core
|