aws-sdk-sagemaker 1.192.0 → 1.194.0

Sign up to get free protection for your applications and to get access to all the features.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA256:
3
- metadata.gz: ea2b0bfd3b4390fa357475a5d054208271cd3aaf4e450e89531bf0f205b22a66
4
- data.tar.gz: b84a2185dffd514d6f76fa68a05b2f546939b70177779278f88853e7e328be0a
3
+ metadata.gz: 60973ee75145a047cd16273b84e2c90c71e5f4f79410ca18abc405d322530142
4
+ data.tar.gz: c3b8a0d376ecde588856d2902f2260fda4df5ee686004457f25edccff047fab3
5
5
  SHA512:
6
- metadata.gz: d8835cdf47bbb5c4e1b3bbc42cb782b0da023e3cb3790deeb32d6f006c901999aa620e04aea27f688410d70c0fed4efe8d970f592c0b1d9a36b6514f765c5d0c
7
- data.tar.gz: abe87a3fa189453639cb875bdcd2750775c3f9716ea8fca2803879cfbc3252ed496954e2bd1f53452e4f0a0c9932331c05e80c36e1dfa138dc1a83d720c509e1
6
+ metadata.gz: ab144375ebe73e9a8ba1db86cfc76be055d4a904277d6f8fc474dd1cbc846980c66ab87b90d6892a99798c55fe84197a03c5911bac12295b441c130e7ee12e1c
7
+ data.tar.gz: 76a347049d001562cda69eb23edab0abe7a60de6f84ecdb31b4aa237ef850122be6210bcf87927af77fcbb2e492d06dd95ebd795a1350113a007ca5cae7e60b4
data/CHANGELOG.md CHANGED
@@ -1,6 +1,16 @@
1
1
  Unreleased Changes
2
2
  ------------------
3
3
 
4
+ 1.194.0 (2023-07-03)
5
+ ------------------
6
+
7
+ * Feature - SageMaker Inference Recommender now accepts new fields SupportedEndpointType and ServerlessConfiguration to support serverless endpoints.
8
+
9
+ 1.193.0 (2023-06-30)
10
+ ------------------
11
+
12
+ * Feature - This release adds support for rolling deployment in SageMaker Inference.
13
+
4
14
  1.192.0 (2023-06-29)
5
15
  ------------------
6
16
 
data/VERSION CHANGED
@@ -1 +1 @@
1
- 1.192.0
1
+ 1.194.0
@@ -2719,7 +2719,7 @@ module Aws::SageMaker
2719
2719
  # endpoint_name: "EndpointName", # required
2720
2720
  # endpoint_config_name: "EndpointConfigName", # required
2721
2721
  # deployment_config: {
2722
- # blue_green_update_policy: { # required
2722
+ # blue_green_update_policy: {
2723
2723
  # traffic_routing_configuration: { # required
2724
2724
  # type: "ALL_AT_ONCE", # required, accepts ALL_AT_ONCE, CANARY, LINEAR
2725
2725
  # wait_interval_in_seconds: 1, # required
@@ -2742,6 +2742,18 @@ module Aws::SageMaker
2742
2742
  # },
2743
2743
  # ],
2744
2744
  # },
2745
+ # rolling_update_policy: {
2746
+ # maximum_batch_size: { # required
2747
+ # type: "INSTANCE_COUNT", # required, accepts INSTANCE_COUNT, CAPACITY_PERCENT
2748
+ # value: 1, # required
2749
+ # },
2750
+ # wait_interval_in_seconds: 1, # required
2751
+ # maximum_execution_timeout_in_seconds: 1,
2752
+ # rollback_maximum_batch_size: {
2753
+ # type: "INSTANCE_COUNT", # required, accepts INSTANCE_COUNT, CAPACITY_PERCENT
2754
+ # value: 1, # required
2755
+ # },
2756
+ # },
2745
2757
  # },
2746
2758
  # tags: [
2747
2759
  # {
@@ -4447,7 +4459,7 @@ module Aws::SageMaker
4447
4459
  # },
4448
4460
  # endpoint_configurations: [
4449
4461
  # {
4450
- # instance_type: "ml.t2.medium", # required, accepts ml.t2.medium, ml.t2.large, ml.t2.xlarge, ml.t2.2xlarge, ml.m4.xlarge, ml.m4.2xlarge, ml.m4.4xlarge, ml.m4.10xlarge, ml.m4.16xlarge, ml.m5.large, ml.m5.xlarge, ml.m5.2xlarge, ml.m5.4xlarge, ml.m5.12xlarge, ml.m5.24xlarge, ml.m5d.large, ml.m5d.xlarge, ml.m5d.2xlarge, ml.m5d.4xlarge, ml.m5d.12xlarge, ml.m5d.24xlarge, ml.c4.large, ml.c4.xlarge, ml.c4.2xlarge, ml.c4.4xlarge, ml.c4.8xlarge, ml.p2.xlarge, ml.p2.8xlarge, ml.p2.16xlarge, ml.p3.2xlarge, ml.p3.8xlarge, ml.p3.16xlarge, ml.c5.large, ml.c5.xlarge, ml.c5.2xlarge, ml.c5.4xlarge, ml.c5.9xlarge, ml.c5.18xlarge, ml.c5d.large, ml.c5d.xlarge, ml.c5d.2xlarge, ml.c5d.4xlarge, ml.c5d.9xlarge, ml.c5d.18xlarge, ml.g4dn.xlarge, ml.g4dn.2xlarge, ml.g4dn.4xlarge, ml.g4dn.8xlarge, ml.g4dn.12xlarge, ml.g4dn.16xlarge, ml.r5.large, ml.r5.xlarge, ml.r5.2xlarge, ml.r5.4xlarge, ml.r5.12xlarge, ml.r5.24xlarge, ml.r5d.large, ml.r5d.xlarge, ml.r5d.2xlarge, ml.r5d.4xlarge, ml.r5d.12xlarge, ml.r5d.24xlarge, ml.inf1.xlarge, ml.inf1.2xlarge, ml.inf1.6xlarge, ml.inf1.24xlarge, ml.c6i.large, ml.c6i.xlarge, ml.c6i.2xlarge, ml.c6i.4xlarge, ml.c6i.8xlarge, ml.c6i.12xlarge, ml.c6i.16xlarge, ml.c6i.24xlarge, ml.c6i.32xlarge, ml.g5.xlarge, ml.g5.2xlarge, ml.g5.4xlarge, ml.g5.8xlarge, ml.g5.12xlarge, ml.g5.16xlarge, ml.g5.24xlarge, ml.g5.48xlarge, ml.p4d.24xlarge, ml.c7g.large, ml.c7g.xlarge, ml.c7g.2xlarge, ml.c7g.4xlarge, ml.c7g.8xlarge, ml.c7g.12xlarge, ml.c7g.16xlarge, ml.m6g.large, ml.m6g.xlarge, ml.m6g.2xlarge, ml.m6g.4xlarge, ml.m6g.8xlarge, ml.m6g.12xlarge, ml.m6g.16xlarge, ml.m6gd.large, ml.m6gd.xlarge, ml.m6gd.2xlarge, ml.m6gd.4xlarge, ml.m6gd.8xlarge, ml.m6gd.12xlarge, ml.m6gd.16xlarge, ml.c6g.large, ml.c6g.xlarge, ml.c6g.2xlarge, ml.c6g.4xlarge, ml.c6g.8xlarge, ml.c6g.12xlarge, ml.c6g.16xlarge, ml.c6gd.large, ml.c6gd.xlarge, ml.c6gd.2xlarge, ml.c6gd.4xlarge, ml.c6gd.8xlarge, ml.c6gd.12xlarge, ml.c6gd.16xlarge, ml.c6gn.large, ml.c6gn.xlarge, ml.c6gn.2xlarge, ml.c6gn.4xlarge, 
ml.c6gn.8xlarge, ml.c6gn.12xlarge, ml.c6gn.16xlarge, ml.r6g.large, ml.r6g.xlarge, ml.r6g.2xlarge, ml.r6g.4xlarge, ml.r6g.8xlarge, ml.r6g.12xlarge, ml.r6g.16xlarge, ml.r6gd.large, ml.r6gd.xlarge, ml.r6gd.2xlarge, ml.r6gd.4xlarge, ml.r6gd.8xlarge, ml.r6gd.12xlarge, ml.r6gd.16xlarge, ml.p4de.24xlarge, ml.trn1.2xlarge, ml.trn1.32xlarge, ml.inf2.xlarge, ml.inf2.8xlarge, ml.inf2.24xlarge, ml.inf2.48xlarge
4462
+ # instance_type: "ml.t2.medium", # accepts ml.t2.medium, ml.t2.large, ml.t2.xlarge, ml.t2.2xlarge, ml.m4.xlarge, ml.m4.2xlarge, ml.m4.4xlarge, ml.m4.10xlarge, ml.m4.16xlarge, ml.m5.large, ml.m5.xlarge, ml.m5.2xlarge, ml.m5.4xlarge, ml.m5.12xlarge, ml.m5.24xlarge, ml.m5d.large, ml.m5d.xlarge, ml.m5d.2xlarge, ml.m5d.4xlarge, ml.m5d.12xlarge, ml.m5d.24xlarge, ml.c4.large, ml.c4.xlarge, ml.c4.2xlarge, ml.c4.4xlarge, ml.c4.8xlarge, ml.p2.xlarge, ml.p2.8xlarge, ml.p2.16xlarge, ml.p3.2xlarge, ml.p3.8xlarge, ml.p3.16xlarge, ml.c5.large, ml.c5.xlarge, ml.c5.2xlarge, ml.c5.4xlarge, ml.c5.9xlarge, ml.c5.18xlarge, ml.c5d.large, ml.c5d.xlarge, ml.c5d.2xlarge, ml.c5d.4xlarge, ml.c5d.9xlarge, ml.c5d.18xlarge, ml.g4dn.xlarge, ml.g4dn.2xlarge, ml.g4dn.4xlarge, ml.g4dn.8xlarge, ml.g4dn.12xlarge, ml.g4dn.16xlarge, ml.r5.large, ml.r5.xlarge, ml.r5.2xlarge, ml.r5.4xlarge, ml.r5.12xlarge, ml.r5.24xlarge, ml.r5d.large, ml.r5d.xlarge, ml.r5d.2xlarge, ml.r5d.4xlarge, ml.r5d.12xlarge, ml.r5d.24xlarge, ml.inf1.xlarge, ml.inf1.2xlarge, ml.inf1.6xlarge, ml.inf1.24xlarge, ml.c6i.large, ml.c6i.xlarge, ml.c6i.2xlarge, ml.c6i.4xlarge, ml.c6i.8xlarge, ml.c6i.12xlarge, ml.c6i.16xlarge, ml.c6i.24xlarge, ml.c6i.32xlarge, ml.g5.xlarge, ml.g5.2xlarge, ml.g5.4xlarge, ml.g5.8xlarge, ml.g5.12xlarge, ml.g5.16xlarge, ml.g5.24xlarge, ml.g5.48xlarge, ml.p4d.24xlarge, ml.c7g.large, ml.c7g.xlarge, ml.c7g.2xlarge, ml.c7g.4xlarge, ml.c7g.8xlarge, ml.c7g.12xlarge, ml.c7g.16xlarge, ml.m6g.large, ml.m6g.xlarge, ml.m6g.2xlarge, ml.m6g.4xlarge, ml.m6g.8xlarge, ml.m6g.12xlarge, ml.m6g.16xlarge, ml.m6gd.large, ml.m6gd.xlarge, ml.m6gd.2xlarge, ml.m6gd.4xlarge, ml.m6gd.8xlarge, ml.m6gd.12xlarge, ml.m6gd.16xlarge, ml.c6g.large, ml.c6g.xlarge, ml.c6g.2xlarge, ml.c6g.4xlarge, ml.c6g.8xlarge, ml.c6g.12xlarge, ml.c6g.16xlarge, ml.c6gd.large, ml.c6gd.xlarge, ml.c6gd.2xlarge, ml.c6gd.4xlarge, ml.c6gd.8xlarge, ml.c6gd.12xlarge, ml.c6gd.16xlarge, ml.c6gn.large, ml.c6gn.xlarge, ml.c6gn.2xlarge, ml.c6gn.4xlarge, ml.c6gn.8xlarge, 
ml.c6gn.12xlarge, ml.c6gn.16xlarge, ml.r6g.large, ml.r6g.xlarge, ml.r6g.2xlarge, ml.r6g.4xlarge, ml.r6g.8xlarge, ml.r6g.12xlarge, ml.r6g.16xlarge, ml.r6gd.large, ml.r6gd.xlarge, ml.r6gd.2xlarge, ml.r6gd.4xlarge, ml.r6gd.8xlarge, ml.r6gd.12xlarge, ml.r6gd.16xlarge, ml.p4de.24xlarge, ml.trn1.2xlarge, ml.trn1.32xlarge, ml.inf2.xlarge, ml.inf2.8xlarge, ml.inf2.24xlarge, ml.inf2.48xlarge
4451
4463
  # inference_specification_name: "InferenceSpecificationName",
4452
4464
  # environment_parameter_ranges: {
4453
4465
  # categorical_parameter_ranges: [
@@ -4457,6 +4469,11 @@ module Aws::SageMaker
4457
4469
  # },
4458
4470
  # ],
4459
4471
  # },
4472
+ # serverless_config: {
4473
+ # memory_size_in_mb: 1, # required
4474
+ # max_concurrency: 1, # required
4475
+ # provisioned_concurrency: 1,
4476
+ # },
4460
4477
  # },
4461
4478
  # ],
4462
4479
  # volume_kms_key_id: "KmsKeyId",
@@ -4472,6 +4489,7 @@ module Aws::SageMaker
4472
4489
  # nearest_model_name: "String",
4473
4490
  # supported_instance_types: ["String"],
4474
4491
  # data_input_config: "RecommendationJobDataInputConfig",
4492
+ # supported_endpoint_type: "RealTime", # accepts RealTime, Serverless
4475
4493
  # },
4476
4494
  # endpoints: [
4477
4495
  # {
@@ -11078,7 +11096,7 @@ module Aws::SageMaker
11078
11096
  # resp.data_capture_config.current_sampling_percentage #=> Integer
11079
11097
  # resp.data_capture_config.destination_s3_uri #=> String
11080
11098
  # resp.data_capture_config.kms_key_id #=> String
11081
- # resp.endpoint_status #=> String, one of "OutOfService", "Creating", "Updating", "SystemUpdating", "RollingBack", "InService", "Deleting", "Failed"
11099
+ # resp.endpoint_status #=> String, one of "OutOfService", "Creating", "Updating", "SystemUpdating", "RollingBack", "InService", "Deleting", "Failed", "UpdateRollbackFailed"
11082
11100
  # resp.failure_reason #=> String
11083
11101
  # resp.creation_time #=> Time
11084
11102
  # resp.last_modified_time #=> Time
@@ -11092,6 +11110,12 @@ module Aws::SageMaker
11092
11110
  # resp.last_deployment_config.blue_green_update_policy.maximum_execution_timeout_in_seconds #=> Integer
11093
11111
  # resp.last_deployment_config.auto_rollback_configuration.alarms #=> Array
11094
11112
  # resp.last_deployment_config.auto_rollback_configuration.alarms[0].alarm_name #=> String
11113
+ # resp.last_deployment_config.rolling_update_policy.maximum_batch_size.type #=> String, one of "INSTANCE_COUNT", "CAPACITY_PERCENT"
11114
+ # resp.last_deployment_config.rolling_update_policy.maximum_batch_size.value #=> Integer
11115
+ # resp.last_deployment_config.rolling_update_policy.wait_interval_in_seconds #=> Integer
11116
+ # resp.last_deployment_config.rolling_update_policy.maximum_execution_timeout_in_seconds #=> Integer
11117
+ # resp.last_deployment_config.rolling_update_policy.rollback_maximum_batch_size.type #=> String, one of "INSTANCE_COUNT", "CAPACITY_PERCENT"
11118
+ # resp.last_deployment_config.rolling_update_policy.rollback_maximum_batch_size.value #=> Integer
11095
11119
  # resp.async_inference_config.client_config.max_concurrent_invocations_per_instance #=> Integer
11096
11120
  # resp.async_inference_config.output_config.kms_key_id #=> String
11097
11121
  # resp.async_inference_config.output_config.s3_output_path #=> String
@@ -12190,7 +12214,7 @@ module Aws::SageMaker
12190
12214
  # resp.role_arn #=> String
12191
12215
  # resp.endpoint_metadata.endpoint_name #=> String
12192
12216
  # resp.endpoint_metadata.endpoint_config_name #=> String
12193
- # resp.endpoint_metadata.endpoint_status #=> String, one of "OutOfService", "Creating", "Updating", "SystemUpdating", "RollingBack", "InService", "Deleting", "Failed"
12217
+ # resp.endpoint_metadata.endpoint_status #=> String, one of "OutOfService", "Creating", "Updating", "SystemUpdating", "RollingBack", "InService", "Deleting", "Failed", "UpdateRollbackFailed"
12194
12218
  # resp.endpoint_metadata.failure_reason #=> String
12195
12219
  # resp.model_variants #=> Array
12196
12220
  # resp.model_variants[0].model_name #=> String
@@ -12278,6 +12302,9 @@ module Aws::SageMaker
12278
12302
  # resp.input_config.endpoint_configurations[0].environment_parameter_ranges.categorical_parameter_ranges[0].name #=> String
12279
12303
  # resp.input_config.endpoint_configurations[0].environment_parameter_ranges.categorical_parameter_ranges[0].value #=> Array
12280
12304
  # resp.input_config.endpoint_configurations[0].environment_parameter_ranges.categorical_parameter_ranges[0].value[0] #=> String
12305
+ # resp.input_config.endpoint_configurations[0].serverless_config.memory_size_in_mb #=> Integer
12306
+ # resp.input_config.endpoint_configurations[0].serverless_config.max_concurrency #=> Integer
12307
+ # resp.input_config.endpoint_configurations[0].serverless_config.provisioned_concurrency #=> Integer
12281
12308
  # resp.input_config.volume_kms_key_id #=> String
12282
12309
  # resp.input_config.container_config.domain #=> String
12283
12310
  # resp.input_config.container_config.task #=> String
@@ -12290,6 +12317,7 @@ module Aws::SageMaker
12290
12317
  # resp.input_config.container_config.supported_instance_types #=> Array
12291
12318
  # resp.input_config.container_config.supported_instance_types[0] #=> String
12292
12319
  # resp.input_config.container_config.data_input_config #=> String
12320
+ # resp.input_config.container_config.supported_endpoint_type #=> String, one of "RealTime", "Serverless"
12293
12321
  # resp.input_config.endpoints #=> Array
12294
12322
  # resp.input_config.endpoints[0].endpoint_name #=> String
12295
12323
  # resp.input_config.vpc_config.security_group_ids #=> Array
@@ -12308,10 +12336,14 @@ module Aws::SageMaker
12308
12336
  # resp.inference_recommendations[0].metrics.model_latency #=> Integer
12309
12337
  # resp.inference_recommendations[0].metrics.cpu_utilization #=> Float
12310
12338
  # resp.inference_recommendations[0].metrics.memory_utilization #=> Float
12339
+ # resp.inference_recommendations[0].metrics.model_setup_time #=> Integer
12311
12340
  # resp.inference_recommendations[0].endpoint_configuration.endpoint_name #=> String
12312
12341
  # resp.inference_recommendations[0].endpoint_configuration.variant_name #=> String
12313
12342
  # resp.inference_recommendations[0].endpoint_configuration.instance_type #=> String, one of "ml.t2.medium", "ml.t2.large", "ml.t2.xlarge", "ml.t2.2xlarge", "ml.m4.xlarge", "ml.m4.2xlarge", "ml.m4.4xlarge", "ml.m4.10xlarge", "ml.m4.16xlarge", "ml.m5.large", "ml.m5.xlarge", "ml.m5.2xlarge", "ml.m5.4xlarge", "ml.m5.12xlarge", "ml.m5.24xlarge", "ml.m5d.large", "ml.m5d.xlarge", "ml.m5d.2xlarge", "ml.m5d.4xlarge", "ml.m5d.12xlarge", "ml.m5d.24xlarge", "ml.c4.large", "ml.c4.xlarge", "ml.c4.2xlarge", "ml.c4.4xlarge", "ml.c4.8xlarge", "ml.p2.xlarge", "ml.p2.8xlarge", "ml.p2.16xlarge", "ml.p3.2xlarge", "ml.p3.8xlarge", "ml.p3.16xlarge", "ml.c5.large", "ml.c5.xlarge", "ml.c5.2xlarge", "ml.c5.4xlarge", "ml.c5.9xlarge", "ml.c5.18xlarge", "ml.c5d.large", "ml.c5d.xlarge", "ml.c5d.2xlarge", "ml.c5d.4xlarge", "ml.c5d.9xlarge", "ml.c5d.18xlarge", "ml.g4dn.xlarge", "ml.g4dn.2xlarge", "ml.g4dn.4xlarge", "ml.g4dn.8xlarge", "ml.g4dn.12xlarge", "ml.g4dn.16xlarge", "ml.r5.large", "ml.r5.xlarge", "ml.r5.2xlarge", "ml.r5.4xlarge", "ml.r5.12xlarge", "ml.r5.24xlarge", "ml.r5d.large", "ml.r5d.xlarge", "ml.r5d.2xlarge", "ml.r5d.4xlarge", "ml.r5d.12xlarge", "ml.r5d.24xlarge", "ml.inf1.xlarge", "ml.inf1.2xlarge", "ml.inf1.6xlarge", "ml.inf1.24xlarge", "ml.c6i.large", "ml.c6i.xlarge", "ml.c6i.2xlarge", "ml.c6i.4xlarge", "ml.c6i.8xlarge", "ml.c6i.12xlarge", "ml.c6i.16xlarge", "ml.c6i.24xlarge", "ml.c6i.32xlarge", "ml.g5.xlarge", "ml.g5.2xlarge", "ml.g5.4xlarge", "ml.g5.8xlarge", "ml.g5.12xlarge", "ml.g5.16xlarge", "ml.g5.24xlarge", "ml.g5.48xlarge", "ml.p4d.24xlarge", "ml.c7g.large", "ml.c7g.xlarge", "ml.c7g.2xlarge", "ml.c7g.4xlarge", "ml.c7g.8xlarge", "ml.c7g.12xlarge", "ml.c7g.16xlarge", "ml.m6g.large", "ml.m6g.xlarge", "ml.m6g.2xlarge", "ml.m6g.4xlarge", "ml.m6g.8xlarge", "ml.m6g.12xlarge", "ml.m6g.16xlarge", "ml.m6gd.large", "ml.m6gd.xlarge", "ml.m6gd.2xlarge", "ml.m6gd.4xlarge", "ml.m6gd.8xlarge", "ml.m6gd.12xlarge", "ml.m6gd.16xlarge", "ml.c6g.large", "ml.c6g.xlarge", "ml.c6g.2xlarge", 
"ml.c6g.4xlarge", "ml.c6g.8xlarge", "ml.c6g.12xlarge", "ml.c6g.16xlarge", "ml.c6gd.large", "ml.c6gd.xlarge", "ml.c6gd.2xlarge", "ml.c6gd.4xlarge", "ml.c6gd.8xlarge", "ml.c6gd.12xlarge", "ml.c6gd.16xlarge", "ml.c6gn.large", "ml.c6gn.xlarge", "ml.c6gn.2xlarge", "ml.c6gn.4xlarge", "ml.c6gn.8xlarge", "ml.c6gn.12xlarge", "ml.c6gn.16xlarge", "ml.r6g.large", "ml.r6g.xlarge", "ml.r6g.2xlarge", "ml.r6g.4xlarge", "ml.r6g.8xlarge", "ml.r6g.12xlarge", "ml.r6g.16xlarge", "ml.r6gd.large", "ml.r6gd.xlarge", "ml.r6gd.2xlarge", "ml.r6gd.4xlarge", "ml.r6gd.8xlarge", "ml.r6gd.12xlarge", "ml.r6gd.16xlarge", "ml.p4de.24xlarge", "ml.trn1.2xlarge", "ml.trn1.32xlarge", "ml.inf2.xlarge", "ml.inf2.8xlarge", "ml.inf2.24xlarge", "ml.inf2.48xlarge"
12314
12343
  # resp.inference_recommendations[0].endpoint_configuration.initial_instance_count #=> Integer
12344
+ # resp.inference_recommendations[0].endpoint_configuration.serverless_config.memory_size_in_mb #=> Integer
12345
+ # resp.inference_recommendations[0].endpoint_configuration.serverless_config.max_concurrency #=> Integer
12346
+ # resp.inference_recommendations[0].endpoint_configuration.serverless_config.provisioned_concurrency #=> Integer
12315
12347
  # resp.inference_recommendations[0].model_configuration.inference_specification_name #=> String
12316
12348
  # resp.inference_recommendations[0].model_configuration.environment_parameters #=> Array
12317
12349
  # resp.inference_recommendations[0].model_configuration.environment_parameters[0].key #=> String
@@ -16402,7 +16434,7 @@ module Aws::SageMaker
16402
16434
  # creation_time_after: Time.now,
16403
16435
  # last_modified_time_before: Time.now,
16404
16436
  # last_modified_time_after: Time.now,
16405
- # status_equals: "OutOfService", # accepts OutOfService, Creating, Updating, SystemUpdating, RollingBack, InService, Deleting, Failed
16437
+ # status_equals: "OutOfService", # accepts OutOfService, Creating, Updating, SystemUpdating, RollingBack, InService, Deleting, Failed, UpdateRollbackFailed
16406
16438
  # })
16407
16439
  #
16408
16440
  # @example Response structure
@@ -16412,7 +16444,7 @@ module Aws::SageMaker
16412
16444
  # resp.endpoints[0].endpoint_arn #=> String
16413
16445
  # resp.endpoints[0].creation_time #=> Time
16414
16446
  # resp.endpoints[0].last_modified_time #=> Time
16415
- # resp.endpoints[0].endpoint_status #=> String, one of "OutOfService", "Creating", "Updating", "SystemUpdating", "RollingBack", "InService", "Deleting", "Failed"
16447
+ # resp.endpoints[0].endpoint_status #=> String, one of "OutOfService", "Creating", "Updating", "SystemUpdating", "RollingBack", "InService", "Deleting", "Failed", "UpdateRollbackFailed"
16416
16448
  # resp.next_token #=> String
16417
16449
  #
16418
16450
  # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/ListEndpoints AWS API Documentation
@@ -17342,10 +17374,14 @@ module Aws::SageMaker
17342
17374
  # resp.steps[0].inference_benchmark.metrics.model_latency #=> Integer
17343
17375
  # resp.steps[0].inference_benchmark.metrics.cpu_utilization #=> Float
17344
17376
  # resp.steps[0].inference_benchmark.metrics.memory_utilization #=> Float
17377
+ # resp.steps[0].inference_benchmark.metrics.model_setup_time #=> Integer
17345
17378
  # resp.steps[0].inference_benchmark.endpoint_configuration.endpoint_name #=> String
17346
17379
  # resp.steps[0].inference_benchmark.endpoint_configuration.variant_name #=> String
17347
17380
  # resp.steps[0].inference_benchmark.endpoint_configuration.instance_type #=> String, one of "ml.t2.medium", "ml.t2.large", "ml.t2.xlarge", "ml.t2.2xlarge", "ml.m4.xlarge", "ml.m4.2xlarge", "ml.m4.4xlarge", "ml.m4.10xlarge", "ml.m4.16xlarge", "ml.m5.large", "ml.m5.xlarge", "ml.m5.2xlarge", "ml.m5.4xlarge", "ml.m5.12xlarge", "ml.m5.24xlarge", "ml.m5d.large", "ml.m5d.xlarge", "ml.m5d.2xlarge", "ml.m5d.4xlarge", "ml.m5d.12xlarge", "ml.m5d.24xlarge", "ml.c4.large", "ml.c4.xlarge", "ml.c4.2xlarge", "ml.c4.4xlarge", "ml.c4.8xlarge", "ml.p2.xlarge", "ml.p2.8xlarge", "ml.p2.16xlarge", "ml.p3.2xlarge", "ml.p3.8xlarge", "ml.p3.16xlarge", "ml.c5.large", "ml.c5.xlarge", "ml.c5.2xlarge", "ml.c5.4xlarge", "ml.c5.9xlarge", "ml.c5.18xlarge", "ml.c5d.large", "ml.c5d.xlarge", "ml.c5d.2xlarge", "ml.c5d.4xlarge", "ml.c5d.9xlarge", "ml.c5d.18xlarge", "ml.g4dn.xlarge", "ml.g4dn.2xlarge", "ml.g4dn.4xlarge", "ml.g4dn.8xlarge", "ml.g4dn.12xlarge", "ml.g4dn.16xlarge", "ml.r5.large", "ml.r5.xlarge", "ml.r5.2xlarge", "ml.r5.4xlarge", "ml.r5.12xlarge", "ml.r5.24xlarge", "ml.r5d.large", "ml.r5d.xlarge", "ml.r5d.2xlarge", "ml.r5d.4xlarge", "ml.r5d.12xlarge", "ml.r5d.24xlarge", "ml.inf1.xlarge", "ml.inf1.2xlarge", "ml.inf1.6xlarge", "ml.inf1.24xlarge", "ml.c6i.large", "ml.c6i.xlarge", "ml.c6i.2xlarge", "ml.c6i.4xlarge", "ml.c6i.8xlarge", "ml.c6i.12xlarge", "ml.c6i.16xlarge", "ml.c6i.24xlarge", "ml.c6i.32xlarge", "ml.g5.xlarge", "ml.g5.2xlarge", "ml.g5.4xlarge", "ml.g5.8xlarge", "ml.g5.12xlarge", "ml.g5.16xlarge", "ml.g5.24xlarge", "ml.g5.48xlarge", "ml.p4d.24xlarge", "ml.c7g.large", "ml.c7g.xlarge", "ml.c7g.2xlarge", "ml.c7g.4xlarge", "ml.c7g.8xlarge", "ml.c7g.12xlarge", "ml.c7g.16xlarge", "ml.m6g.large", "ml.m6g.xlarge", "ml.m6g.2xlarge", "ml.m6g.4xlarge", "ml.m6g.8xlarge", "ml.m6g.12xlarge", "ml.m6g.16xlarge", "ml.m6gd.large", "ml.m6gd.xlarge", "ml.m6gd.2xlarge", "ml.m6gd.4xlarge", "ml.m6gd.8xlarge", "ml.m6gd.12xlarge", "ml.m6gd.16xlarge", "ml.c6g.large", "ml.c6g.xlarge", "ml.c6g.2xlarge", 
"ml.c6g.4xlarge", "ml.c6g.8xlarge", "ml.c6g.12xlarge", "ml.c6g.16xlarge", "ml.c6gd.large", "ml.c6gd.xlarge", "ml.c6gd.2xlarge", "ml.c6gd.4xlarge", "ml.c6gd.8xlarge", "ml.c6gd.12xlarge", "ml.c6gd.16xlarge", "ml.c6gn.large", "ml.c6gn.xlarge", "ml.c6gn.2xlarge", "ml.c6gn.4xlarge", "ml.c6gn.8xlarge", "ml.c6gn.12xlarge", "ml.c6gn.16xlarge", "ml.r6g.large", "ml.r6g.xlarge", "ml.r6g.2xlarge", "ml.r6g.4xlarge", "ml.r6g.8xlarge", "ml.r6g.12xlarge", "ml.r6g.16xlarge", "ml.r6gd.large", "ml.r6gd.xlarge", "ml.r6gd.2xlarge", "ml.r6gd.4xlarge", "ml.r6gd.8xlarge", "ml.r6gd.12xlarge", "ml.r6gd.16xlarge", "ml.p4de.24xlarge", "ml.trn1.2xlarge", "ml.trn1.32xlarge", "ml.inf2.xlarge", "ml.inf2.8xlarge", "ml.inf2.24xlarge", "ml.inf2.48xlarge"
17348
17381
  # resp.steps[0].inference_benchmark.endpoint_configuration.initial_instance_count #=> Integer
17382
+ # resp.steps[0].inference_benchmark.endpoint_configuration.serverless_config.memory_size_in_mb #=> Integer
17383
+ # resp.steps[0].inference_benchmark.endpoint_configuration.serverless_config.max_concurrency #=> Integer
17384
+ # resp.steps[0].inference_benchmark.endpoint_configuration.serverless_config.provisioned_concurrency #=> Integer
17349
17385
  # resp.steps[0].inference_benchmark.model_configuration.inference_specification_name #=> String
17350
17386
  # resp.steps[0].inference_benchmark.model_configuration.environment_parameters #=> Array
17351
17387
  # resp.steps[0].inference_benchmark.model_configuration.environment_parameters[0].key #=> String
@@ -21994,7 +22030,7 @@ module Aws::SageMaker
21994
22030
  # },
21995
22031
  # ],
21996
22032
  # deployment_config: {
21997
- # blue_green_update_policy: { # required
22033
+ # blue_green_update_policy: {
21998
22034
  # traffic_routing_configuration: { # required
21999
22035
  # type: "ALL_AT_ONCE", # required, accepts ALL_AT_ONCE, CANARY, LINEAR
22000
22036
  # wait_interval_in_seconds: 1, # required
@@ -22017,6 +22053,18 @@ module Aws::SageMaker
22017
22053
  # },
22018
22054
  # ],
22019
22055
  # },
22056
+ # rolling_update_policy: {
22057
+ # maximum_batch_size: { # required
22058
+ # type: "INSTANCE_COUNT", # required, accepts INSTANCE_COUNT, CAPACITY_PERCENT
22059
+ # value: 1, # required
22060
+ # },
22061
+ # wait_interval_in_seconds: 1, # required
22062
+ # maximum_execution_timeout_in_seconds: 1,
22063
+ # rollback_maximum_batch_size: {
22064
+ # type: "INSTANCE_COUNT", # required, accepts INSTANCE_COUNT, CAPACITY_PERCENT
22065
+ # value: 1, # required
22066
+ # },
22067
+ # },
22020
22068
  # },
22021
22069
  # retain_deployment_config: false,
22022
22070
  # })
@@ -23818,7 +23866,7 @@ module Aws::SageMaker
23818
23866
  params: params,
23819
23867
  config: config)
23820
23868
  context[:gem_name] = 'aws-sdk-sagemaker'
23821
- context[:gem_version] = '1.192.0'
23869
+ context[:gem_version] = '1.194.0'
23822
23870
  Seahorse::Client::Request.new(handlers, context)
23823
23871
  end
23824
23872
 
@@ -963,6 +963,7 @@ module Aws::SageMaker
963
963
  InferenceRecommendationsJobs = Shapes::ListShape.new(name: 'InferenceRecommendationsJobs')
964
964
  InferenceSpecification = Shapes::StructureShape.new(name: 'InferenceSpecification')
965
965
  InferenceSpecificationName = Shapes::StringShape.new(name: 'InferenceSpecificationName')
966
+ InitialInstanceCount = Shapes::IntegerShape.new(name: 'InitialInstanceCount')
966
967
  InitialNumberOfUsers = Shapes::IntegerShape.new(name: 'InitialNumberOfUsers')
967
968
  InitialTaskCount = Shapes::IntegerShape.new(name: 'InitialTaskCount')
968
969
  InputConfig = Shapes::StructureShape.new(name: 'InputConfig')
@@ -1322,6 +1323,7 @@ module Aws::SageMaker
1322
1323
  ModelQualityBaselineConfig = Shapes::StructureShape.new(name: 'ModelQualityBaselineConfig')
1323
1324
  ModelQualityJobInput = Shapes::StructureShape.new(name: 'ModelQualityJobInput')
1324
1325
  ModelRegisterSettings = Shapes::StructureShape.new(name: 'ModelRegisterSettings')
1326
+ ModelSetupTime = Shapes::IntegerShape.new(name: 'ModelSetupTime')
1325
1327
  ModelSortKey = Shapes::StringShape.new(name: 'ModelSortKey')
1326
1328
  ModelStepMetadata = Shapes::StructureShape.new(name: 'ModelStepMetadata')
1327
1329
  ModelSummary = Shapes::StructureShape.new(name: 'ModelSummary')
@@ -1616,6 +1618,7 @@ module Aws::SageMaker
1616
1618
  RecommendationJobStatus = Shapes::StringShape.new(name: 'RecommendationJobStatus')
1617
1619
  RecommendationJobStoppingConditions = Shapes::StructureShape.new(name: 'RecommendationJobStoppingConditions')
1618
1620
  RecommendationJobSupportedContentTypes = Shapes::ListShape.new(name: 'RecommendationJobSupportedContentTypes')
1621
+ RecommendationJobSupportedEndpointType = Shapes::StringShape.new(name: 'RecommendationJobSupportedEndpointType')
1619
1622
  RecommendationJobSupportedInstanceTypes = Shapes::ListShape.new(name: 'RecommendationJobSupportedInstanceTypes')
1620
1623
  RecommendationJobType = Shapes::StringShape.new(name: 'RecommendationJobType')
1621
1624
  RecommendationJobVpcConfig = Shapes::StructureShape.new(name: 'RecommendationJobVpcConfig')
@@ -1668,6 +1671,7 @@ module Aws::SageMaker
1668
1671
  RetryPipelineExecutionResponse = Shapes::StructureShape.new(name: 'RetryPipelineExecutionResponse')
1669
1672
  RetryStrategy = Shapes::StructureShape.new(name: 'RetryStrategy')
1670
1673
  RoleArn = Shapes::StringShape.new(name: 'RoleArn')
1674
+ RollingUpdatePolicy = Shapes::StructureShape.new(name: 'RollingUpdatePolicy')
1671
1675
  RootAccess = Shapes::StringShape.new(name: 'RootAccess')
1672
1676
  RuleConfigurationName = Shapes::StringShape.new(name: 'RuleConfigurationName')
1673
1677
  RuleEvaluationStatus = Shapes::StringShape.new(name: 'RuleEvaluationStatus')
@@ -3666,8 +3670,9 @@ module Aws::SageMaker
3666
3670
 
3667
3671
  DeployedImages.member = Shapes::ShapeRef.new(shape: DeployedImage)
3668
3672
 
3669
- DeploymentConfig.add_member(:blue_green_update_policy, Shapes::ShapeRef.new(shape: BlueGreenUpdatePolicy, required: true, location_name: "BlueGreenUpdatePolicy"))
3673
+ DeploymentConfig.add_member(:blue_green_update_policy, Shapes::ShapeRef.new(shape: BlueGreenUpdatePolicy, location_name: "BlueGreenUpdatePolicy"))
3670
3674
  DeploymentConfig.add_member(:auto_rollback_configuration, Shapes::ShapeRef.new(shape: AutoRollbackConfig, location_name: "AutoRollbackConfiguration"))
3675
+ DeploymentConfig.add_member(:rolling_update_policy, Shapes::ShapeRef.new(shape: RollingUpdatePolicy, location_name: "RollingUpdatePolicy"))
3671
3676
  DeploymentConfig.struct_class = Types::DeploymentConfig
3672
3677
 
3673
3678
  DeploymentRecommendation.add_member(:recommendation_status, Shapes::ShapeRef.new(shape: RecommendationStatus, required: true, location_name: "RecommendationStatus"))
@@ -4966,9 +4971,10 @@ module Aws::SageMaker
4966
4971
  EndpointInput.add_member(:end_time_offset, Shapes::ShapeRef.new(shape: MonitoringTimeOffsetString, location_name: "EndTimeOffset"))
4967
4972
  EndpointInput.struct_class = Types::EndpointInput
4968
4973
 
4969
- EndpointInputConfiguration.add_member(:instance_type, Shapes::ShapeRef.new(shape: ProductionVariantInstanceType, required: true, location_name: "InstanceType"))
4974
+ EndpointInputConfiguration.add_member(:instance_type, Shapes::ShapeRef.new(shape: ProductionVariantInstanceType, location_name: "InstanceType"))
4970
4975
  EndpointInputConfiguration.add_member(:inference_specification_name, Shapes::ShapeRef.new(shape: InferenceSpecificationName, location_name: "InferenceSpecificationName"))
4971
4976
  EndpointInputConfiguration.add_member(:environment_parameter_ranges, Shapes::ShapeRef.new(shape: EnvironmentParameterRanges, location_name: "EnvironmentParameterRanges"))
4977
+ EndpointInputConfiguration.add_member(:serverless_config, Shapes::ShapeRef.new(shape: ProductionVariantServerlessConfig, location_name: "ServerlessConfig"))
4972
4978
  EndpointInputConfiguration.struct_class = Types::EndpointInputConfiguration
4973
4979
 
4974
4980
  EndpointInputConfigurations.member = Shapes::ShapeRef.new(shape: EndpointInputConfiguration)
@@ -4981,8 +4987,9 @@ module Aws::SageMaker
4981
4987
 
4982
4988
  EndpointOutputConfiguration.add_member(:endpoint_name, Shapes::ShapeRef.new(shape: String, required: true, location_name: "EndpointName"))
4983
4989
  EndpointOutputConfiguration.add_member(:variant_name, Shapes::ShapeRef.new(shape: String, required: true, location_name: "VariantName"))
4984
- EndpointOutputConfiguration.add_member(:instance_type, Shapes::ShapeRef.new(shape: ProductionVariantInstanceType, required: true, location_name: "InstanceType"))
4985
- EndpointOutputConfiguration.add_member(:initial_instance_count, Shapes::ShapeRef.new(shape: Integer, required: true, location_name: "InitialInstanceCount"))
4990
+ EndpointOutputConfiguration.add_member(:instance_type, Shapes::ShapeRef.new(shape: ProductionVariantInstanceType, location_name: "InstanceType"))
4991
+ EndpointOutputConfiguration.add_member(:initial_instance_count, Shapes::ShapeRef.new(shape: InitialInstanceCount, location_name: "InitialInstanceCount"))
4992
+ EndpointOutputConfiguration.add_member(:serverless_config, Shapes::ShapeRef.new(shape: ProductionVariantServerlessConfig, location_name: "ServerlessConfig"))
4986
4993
  EndpointOutputConfiguration.struct_class = Types::EndpointOutputConfiguration
4987
4994
 
4988
4995
  EndpointPerformance.add_member(:metrics, Shapes::ShapeRef.new(shape: InferenceMetrics, required: true, location_name: "Metrics"))
@@ -7865,6 +7872,7 @@ module Aws::SageMaker
7865
7872
  RecommendationJobContainerConfig.add_member(:nearest_model_name, Shapes::ShapeRef.new(shape: String, location_name: "NearestModelName"))
7866
7873
  RecommendationJobContainerConfig.add_member(:supported_instance_types, Shapes::ShapeRef.new(shape: RecommendationJobSupportedInstanceTypes, location_name: "SupportedInstanceTypes"))
7867
7874
  RecommendationJobContainerConfig.add_member(:data_input_config, Shapes::ShapeRef.new(shape: RecommendationJobDataInputConfig, location_name: "DataInputConfig"))
7875
+ RecommendationJobContainerConfig.add_member(:supported_endpoint_type, Shapes::ShapeRef.new(shape: RecommendationJobSupportedEndpointType, location_name: "SupportedEndpointType"))
7868
7876
  RecommendationJobContainerConfig.struct_class = Types::RecommendationJobContainerConfig
7869
7877
 
7870
7878
  RecommendationJobInferenceBenchmark.add_member(:metrics, Shapes::ShapeRef.new(shape: RecommendationMetrics, location_name: "Metrics"))
@@ -7922,6 +7930,7 @@ module Aws::SageMaker
7922
7930
  RecommendationMetrics.add_member(:model_latency, Shapes::ShapeRef.new(shape: Integer, required: true, location_name: "ModelLatency"))
7923
7931
  RecommendationMetrics.add_member(:cpu_utilization, Shapes::ShapeRef.new(shape: UtilizationMetric, location_name: "CpuUtilization"))
7924
7932
  RecommendationMetrics.add_member(:memory_utilization, Shapes::ShapeRef.new(shape: UtilizationMetric, location_name: "MemoryUtilization"))
7933
+ RecommendationMetrics.add_member(:model_setup_time, Shapes::ShapeRef.new(shape: ModelSetupTime, location_name: "ModelSetupTime"))
7925
7934
  RecommendationMetrics.struct_class = Types::RecommendationMetrics
7926
7935
 
7927
7936
  RedshiftDatasetDefinition.add_member(:cluster_id, Shapes::ShapeRef.new(shape: RedshiftClusterId, required: true, location_name: "ClusterId"))
@@ -8017,6 +8026,12 @@ module Aws::SageMaker
8017
8026
  RetryStrategy.add_member(:maximum_retry_attempts, Shapes::ShapeRef.new(shape: MaximumRetryAttempts, required: true, location_name: "MaximumRetryAttempts"))
8018
8027
  RetryStrategy.struct_class = Types::RetryStrategy
8019
8028
 
8029
+ RollingUpdatePolicy.add_member(:maximum_batch_size, Shapes::ShapeRef.new(shape: CapacitySize, required: true, location_name: "MaximumBatchSize"))
8030
+ RollingUpdatePolicy.add_member(:wait_interval_in_seconds, Shapes::ShapeRef.new(shape: WaitIntervalInSeconds, required: true, location_name: "WaitIntervalInSeconds"))
8031
+ RollingUpdatePolicy.add_member(:maximum_execution_timeout_in_seconds, Shapes::ShapeRef.new(shape: MaximumExecutionTimeoutInSeconds, location_name: "MaximumExecutionTimeoutInSeconds"))
8032
+ RollingUpdatePolicy.add_member(:rollback_maximum_batch_size, Shapes::ShapeRef.new(shape: CapacitySize, location_name: "RollbackMaximumBatchSize"))
8033
+ RollingUpdatePolicy.struct_class = Types::RollingUpdatePolicy
8034
+
8020
8035
  RuleParameters.key = Shapes::ShapeRef.new(shape: ConfigKey)
8021
8036
  RuleParameters.value = Shapes::ShapeRef.new(shape: ConfigValue)
8022
8037
 
@@ -2415,6 +2415,12 @@ module Aws::SageMaker
2415
2415
  # @!attribute [rw] time_series_forecasting_job_config
2416
2416
  # Settings used to configure an AutoML job V2 for a time-series
2417
2417
  # forecasting problem type.
2418
+ #
2419
+ # <note markdown="1"> The `TimeSeriesForecastingJobConfig` problem type is only available
2420
+ # in private beta. Contact Amazon Web Services Support or your account
2421
+ # manager to learn more about access privileges.
2422
+ #
2423
+ # </note>
2418
2424
  # @return [Types::TimeSeriesForecastingJobConfig]
2419
2425
  #
2420
2426
  # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/AutoMLProblemTypeConfig AWS API Documentation
@@ -3106,7 +3112,15 @@ module Aws::SageMaker
3106
3112
  include Aws::Structure
3107
3113
  end
3108
3114
 
3109
- # Specifies the endpoint capacity to activate for production.
3115
+ # Specifies the type and size of the endpoint capacity to activate for a
3116
+ # blue/green deployment, a rolling deployment, or a rollback strategy.
3117
+ # You can specify your batches as either instance count or the overall
3118
+ # percentage or your fleet.
3119
+ #
3120
+ # For a rollback strategy, if you don't specify the fields in this
3121
+ # object, or if you set the `Value` to 100%, then SageMaker uses a
3122
+ # blue/green rollback strategy and rolls all traffic back to the blue
3123
+ # fleet.
3110
3124
  #
3111
3125
  # @!attribute [rw] type
3112
3126
  # Specifies the endpoint capacity type.
@@ -10194,11 +10208,17 @@ module Aws::SageMaker
10194
10208
  # failures and recovery.
10195
10209
  # @return [Types::AutoRollbackConfig]
10196
10210
  #
10211
+ # @!attribute [rw] rolling_update_policy
10212
+ # Specifies a rolling deployment strategy for updating a SageMaker
10213
+ # endpoint.
10214
+ # @return [Types::RollingUpdatePolicy]
10215
+ #
10197
10216
  # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/DeploymentConfig AWS API Documentation
10198
10217
  #
10199
10218
  class DeploymentConfig < Struct.new(
10200
10219
  :blue_green_update_policy,
10201
- :auto_rollback_configuration)
10220
+ :auto_rollback_configuration,
10221
+ :rolling_update_policy)
10202
10222
  SENSITIVE = []
10203
10223
  include Aws::Structure
10204
10224
  end
@@ -17115,12 +17135,17 @@ module Aws::SageMaker
17115
17135
  # The parameter you want to benchmark against.
17116
17136
  # @return [Types::EnvironmentParameterRanges]
17117
17137
  #
17138
+ # @!attribute [rw] serverless_config
17139
+ # Specifies the serverless configuration for an endpoint variant.
17140
+ # @return [Types::ProductionVariantServerlessConfig]
17141
+ #
17118
17142
  # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/EndpointInputConfiguration AWS API Documentation
17119
17143
  #
17120
17144
  class EndpointInputConfiguration < Struct.new(
17121
17145
  :instance_type,
17122
17146
  :inference_specification_name,
17123
- :environment_parameter_ranges)
17147
+ :environment_parameter_ranges,
17148
+ :serverless_config)
17124
17149
  SENSITIVE = []
17125
17150
  include Aws::Structure
17126
17151
  end
@@ -17182,13 +17207,18 @@ module Aws::SageMaker
17182
17207
  # The number of instances recommended to launch initially.
17183
17208
  # @return [Integer]
17184
17209
  #
17210
+ # @!attribute [rw] serverless_config
17211
+ # Specifies the serverless configuration for an endpoint variant.
17212
+ # @return [Types::ProductionVariantServerlessConfig]
17213
+ #
17185
17214
  # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/EndpointOutputConfiguration AWS API Documentation
17186
17215
  #
17187
17216
  class EndpointOutputConfiguration < Struct.new(
17188
17217
  :endpoint_name,
17189
17218
  :variant_name,
17190
17219
  :instance_type,
17191
- :initial_instance_count)
17220
+ :initial_instance_count,
17221
+ :serverless_config)
17192
17222
  SENSITIVE = []
17193
17223
  include Aws::Structure
17194
17224
  end
@@ -32870,6 +32900,17 @@ module Aws::SageMaker
32870
32900
  # @!attribute [rw] provisioned_concurrency
32871
32901
  # The amount of provisioned concurrency to allocate for the serverless
32872
32902
  # endpoint. Should be less than or equal to `MaxConcurrency`.
32903
+ #
32904
+ # <note markdown="1"> This field is not supported for serverless endpoint recommendations
32905
+ # for Inference Recommender jobs. For more information about creating
32906
+ # an Inference Recommender job, see
32907
+ # [CreateInferenceRecommendationsJob][1].
32908
+ #
32909
+ # </note>
32910
+ #
32911
+ #
32912
+ #
32913
+ # [1]: https://docs.aws.amazon.com/sagemaker/latest/APIReference/API_CreateInferenceRecommendationsJob.html
32873
32914
  # @return [Integer]
32874
32915
  #
32875
32916
  # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/ProductionVariantServerlessConfig AWS API Documentation
@@ -34074,6 +34115,14 @@ module Aws::SageMaker
34074
34115
  # [1]: https://docs.aws.amazon.com/sagemaker/latest/APIReference/API_InputConfig.html#sagemaker-Type-InputConfig-DataInputConfig
34075
34116
  # @return [String]
34076
34117
  #
34118
+ # @!attribute [rw] supported_endpoint_type
34119
+ # The endpoint type to receive recommendations for. By default this is
34120
+ # null, and the results of the inference recommendation job return a
34121
+ # combined list of both real-time and serverless benchmarks. By
34122
+ # specifying a value for this field, you can receive a longer list of
34123
+ # benchmarks for the desired endpoint type.
34124
+ # @return [String]
34125
+ #
34077
34126
  # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/RecommendationJobContainerConfig AWS API Documentation
34078
34127
  #
34079
34128
  class RecommendationJobContainerConfig < Struct.new(
@@ -34084,7 +34133,8 @@ module Aws::SageMaker
34084
34133
  :payload_config,
34085
34134
  :nearest_model_name,
34086
34135
  :supported_instance_types,
34087
- :data_input_config)
34136
+ :data_input_config,
34137
+ :supported_endpoint_type)
34088
34138
  SENSITIVE = []
34089
34139
  include Aws::Structure
34090
34140
  end
@@ -34408,6 +34458,14 @@ module Aws::SageMaker
34408
34458
  # `NaN` indicates that the value is not available.
34409
34459
  # @return [Float]
34410
34460
  #
34461
+ # @!attribute [rw] model_setup_time
34462
+ # The time it takes to launch new compute resources for a serverless
34463
+ # endpoint. The time can vary depending on the model size, how long it
34464
+ # takes to download the model, and the start-up time of the container.
34465
+ #
34466
+ # `NaN` indicates that the value is not available.
34467
+ # @return [Integer]
34468
+ #
34411
34469
  # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/RecommendationMetrics AWS API Documentation
34412
34470
  #
34413
34471
  class RecommendationMetrics < Struct.new(
@@ -34416,7 +34474,8 @@ module Aws::SageMaker
34416
34474
  :max_invocations,
34417
34475
  :model_latency,
34418
34476
  :cpu_utilization,
34419
- :memory_utilization)
34477
+ :memory_utilization,
34478
+ :model_setup_time)
34420
34479
  SENSITIVE = []
34421
34480
  include Aws::Structure
34422
34481
  end
@@ -34994,6 +35053,54 @@ module Aws::SageMaker
34994
35053
  include Aws::Structure
34995
35054
  end
34996
35055
 
35056
+ # Specifies a rolling deployment strategy for updating a SageMaker
35057
+ # endpoint.
35058
+ #
35059
+ # @!attribute [rw] maximum_batch_size
35060
+ # Specifies the type and size of the endpoint capacity to activate for
35061
+ # a blue/green deployment, a rolling deployment, or a rollback
35062
+ # strategy. You can specify your batches as either instance count or
35063
+ # the overall percentage or your fleet.
35064
+ #
35065
+ # For a rollback strategy, if you don't specify the fields in this
35066
+ # object, or if you set the `Value` to 100%, then SageMaker uses a
35067
+ # blue/green rollback strategy and rolls all traffic back to the blue
35068
+ # fleet.
35069
+ # @return [Types::CapacitySize]
35070
+ #
35071
+ # @!attribute [rw] wait_interval_in_seconds
35072
+ # The length of the baking period, during which SageMaker monitors
35073
+ # alarms for each batch on the new fleet.
35074
+ # @return [Integer]
35075
+ #
35076
+ # @!attribute [rw] maximum_execution_timeout_in_seconds
35077
+ # The time limit for the total deployment. Exceeding this limit causes
35078
+ # a timeout.
35079
+ # @return [Integer]
35080
+ #
35081
+ # @!attribute [rw] rollback_maximum_batch_size
35082
+ # Specifies the type and size of the endpoint capacity to activate for
35083
+ # a blue/green deployment, a rolling deployment, or a rollback
35084
+ # strategy. You can specify your batches as either instance count or
35085
+ # the overall percentage or your fleet.
35086
+ #
35087
+ # For a rollback strategy, if you don't specify the fields in this
35088
+ # object, or if you set the `Value` to 100%, then SageMaker uses a
35089
+ # blue/green rollback strategy and rolls all traffic back to the blue
35090
+ # fleet.
35091
+ # @return [Types::CapacitySize]
35092
+ #
35093
+ # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/RollingUpdatePolicy AWS API Documentation
35094
+ #
35095
+ class RollingUpdatePolicy < Struct.new(
35096
+ :maximum_batch_size,
35097
+ :wait_interval_in_seconds,
35098
+ :maximum_execution_timeout_in_seconds,
35099
+ :rollback_maximum_batch_size)
35100
+ SENSITIVE = []
35101
+ include Aws::Structure
35102
+ end
35103
+
34997
35104
  # Describes the S3 data source.
34998
35105
  #
34999
35106
  # Your input bucket must be in the same Amazon Web Services region as
@@ -53,6 +53,6 @@ require_relative 'aws-sdk-sagemaker/customizations'
53
53
  # @!group service
54
54
  module Aws::SageMaker
55
55
 
56
- GEM_VERSION = '1.192.0'
56
+ GEM_VERSION = '1.194.0'
57
57
 
58
58
  end
metadata CHANGED
@@ -1,14 +1,14 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: aws-sdk-sagemaker
3
3
  version: !ruby/object:Gem::Version
4
- version: 1.192.0
4
+ version: 1.194.0
5
5
  platform: ruby
6
6
  authors:
7
7
  - Amazon Web Services
8
8
  autorequire:
9
9
  bindir: bin
10
10
  cert_chain: []
11
- date: 2023-06-29 00:00:00.000000000 Z
11
+ date: 2023-07-03 00:00:00.000000000 Z
12
12
  dependencies:
13
13
  - !ruby/object:Gem::Dependency
14
14
  name: aws-sdk-core