aws-sdk-sagemaker 1.193.0 → 1.194.0

Sign up to get free protection for your applications and to get access to all the features.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA256:
3
- metadata.gz: e8563212194efe3f885db18ded340750c68719059405c10110a98fe0a254de83
4
- data.tar.gz: 8c32b946394f67fac58c560a9a048ec39d56ab2ea1f1416484de48dbeb99947c
3
+ metadata.gz: 60973ee75145a047cd16273b84e2c90c71e5f4f79410ca18abc405d322530142
4
+ data.tar.gz: c3b8a0d376ecde588856d2902f2260fda4df5ee686004457f25edccff047fab3
5
5
  SHA512:
6
- metadata.gz: 1632e061172d86fd8998029d2b91c397c527dc6329297cacff63dd191a7b81e349ad4ba938c85a178d7056a47b4bbe084f7adc327087dc8c652d87effcc75be5
7
- data.tar.gz: 6e7c6e026568146cea2404421c7ce6028e509a6d042af8c25ede1c4e5b141f0b89303e1c4d801d7405338204ea4f27d75c1f7670de963cb6593951988c110559
6
+ metadata.gz: ab144375ebe73e9a8ba1db86cfc76be055d4a904277d6f8fc474dd1cbc846980c66ab87b90d6892a99798c55fe84197a03c5911bac12295b441c130e7ee12e1c
7
+ data.tar.gz: 76a347049d001562cda69eb23edab0abe7a60de6f84ecdb31b4aa237ef850122be6210bcf87927af77fcbb2e492d06dd95ebd795a1350113a007ca5cae7e60b4
data/CHANGELOG.md CHANGED
@@ -1,6 +1,11 @@
1
1
  Unreleased Changes
2
2
  ------------------
3
3
 
4
+ 1.194.0 (2023-07-03)
5
+ ------------------
6
+
7
+ * Feature - SageMaker Inference Recommender now accepts new fields SupportedEndpointType and ServerlessConfig to support serverless endpoints.
8
+
4
9
  1.193.0 (2023-06-30)
5
10
  ------------------
6
11
 
data/VERSION CHANGED
@@ -1 +1 @@
1
- 1.193.0
1
+ 1.194.0
@@ -4459,7 +4459,7 @@ module Aws::SageMaker
4459
4459
  # },
4460
4460
  # endpoint_configurations: [
4461
4461
  # {
4462
- # instance_type: "ml.t2.medium", # required, accepts ml.t2.medium, ml.t2.large, ml.t2.xlarge, ml.t2.2xlarge, ml.m4.xlarge, ml.m4.2xlarge, ml.m4.4xlarge, ml.m4.10xlarge, ml.m4.16xlarge, ml.m5.large, ml.m5.xlarge, ml.m5.2xlarge, ml.m5.4xlarge, ml.m5.12xlarge, ml.m5.24xlarge, ml.m5d.large, ml.m5d.xlarge, ml.m5d.2xlarge, ml.m5d.4xlarge, ml.m5d.12xlarge, ml.m5d.24xlarge, ml.c4.large, ml.c4.xlarge, ml.c4.2xlarge, ml.c4.4xlarge, ml.c4.8xlarge, ml.p2.xlarge, ml.p2.8xlarge, ml.p2.16xlarge, ml.p3.2xlarge, ml.p3.8xlarge, ml.p3.16xlarge, ml.c5.large, ml.c5.xlarge, ml.c5.2xlarge, ml.c5.4xlarge, ml.c5.9xlarge, ml.c5.18xlarge, ml.c5d.large, ml.c5d.xlarge, ml.c5d.2xlarge, ml.c5d.4xlarge, ml.c5d.9xlarge, ml.c5d.18xlarge, ml.g4dn.xlarge, ml.g4dn.2xlarge, ml.g4dn.4xlarge, ml.g4dn.8xlarge, ml.g4dn.12xlarge, ml.g4dn.16xlarge, ml.r5.large, ml.r5.xlarge, ml.r5.2xlarge, ml.r5.4xlarge, ml.r5.12xlarge, ml.r5.24xlarge, ml.r5d.large, ml.r5d.xlarge, ml.r5d.2xlarge, ml.r5d.4xlarge, ml.r5d.12xlarge, ml.r5d.24xlarge, ml.inf1.xlarge, ml.inf1.2xlarge, ml.inf1.6xlarge, ml.inf1.24xlarge, ml.c6i.large, ml.c6i.xlarge, ml.c6i.2xlarge, ml.c6i.4xlarge, ml.c6i.8xlarge, ml.c6i.12xlarge, ml.c6i.16xlarge, ml.c6i.24xlarge, ml.c6i.32xlarge, ml.g5.xlarge, ml.g5.2xlarge, ml.g5.4xlarge, ml.g5.8xlarge, ml.g5.12xlarge, ml.g5.16xlarge, ml.g5.24xlarge, ml.g5.48xlarge, ml.p4d.24xlarge, ml.c7g.large, ml.c7g.xlarge, ml.c7g.2xlarge, ml.c7g.4xlarge, ml.c7g.8xlarge, ml.c7g.12xlarge, ml.c7g.16xlarge, ml.m6g.large, ml.m6g.xlarge, ml.m6g.2xlarge, ml.m6g.4xlarge, ml.m6g.8xlarge, ml.m6g.12xlarge, ml.m6g.16xlarge, ml.m6gd.large, ml.m6gd.xlarge, ml.m6gd.2xlarge, ml.m6gd.4xlarge, ml.m6gd.8xlarge, ml.m6gd.12xlarge, ml.m6gd.16xlarge, ml.c6g.large, ml.c6g.xlarge, ml.c6g.2xlarge, ml.c6g.4xlarge, ml.c6g.8xlarge, ml.c6g.12xlarge, ml.c6g.16xlarge, ml.c6gd.large, ml.c6gd.xlarge, ml.c6gd.2xlarge, ml.c6gd.4xlarge, ml.c6gd.8xlarge, ml.c6gd.12xlarge, ml.c6gd.16xlarge, ml.c6gn.large, ml.c6gn.xlarge, ml.c6gn.2xlarge, ml.c6gn.4xlarge, 
ml.c6gn.8xlarge, ml.c6gn.12xlarge, ml.c6gn.16xlarge, ml.r6g.large, ml.r6g.xlarge, ml.r6g.2xlarge, ml.r6g.4xlarge, ml.r6g.8xlarge, ml.r6g.12xlarge, ml.r6g.16xlarge, ml.r6gd.large, ml.r6gd.xlarge, ml.r6gd.2xlarge, ml.r6gd.4xlarge, ml.r6gd.8xlarge, ml.r6gd.12xlarge, ml.r6gd.16xlarge, ml.p4de.24xlarge, ml.trn1.2xlarge, ml.trn1.32xlarge, ml.inf2.xlarge, ml.inf2.8xlarge, ml.inf2.24xlarge, ml.inf2.48xlarge
4462
+ # instance_type: "ml.t2.medium", # accepts ml.t2.medium, ml.t2.large, ml.t2.xlarge, ml.t2.2xlarge, ml.m4.xlarge, ml.m4.2xlarge, ml.m4.4xlarge, ml.m4.10xlarge, ml.m4.16xlarge, ml.m5.large, ml.m5.xlarge, ml.m5.2xlarge, ml.m5.4xlarge, ml.m5.12xlarge, ml.m5.24xlarge, ml.m5d.large, ml.m5d.xlarge, ml.m5d.2xlarge, ml.m5d.4xlarge, ml.m5d.12xlarge, ml.m5d.24xlarge, ml.c4.large, ml.c4.xlarge, ml.c4.2xlarge, ml.c4.4xlarge, ml.c4.8xlarge, ml.p2.xlarge, ml.p2.8xlarge, ml.p2.16xlarge, ml.p3.2xlarge, ml.p3.8xlarge, ml.p3.16xlarge, ml.c5.large, ml.c5.xlarge, ml.c5.2xlarge, ml.c5.4xlarge, ml.c5.9xlarge, ml.c5.18xlarge, ml.c5d.large, ml.c5d.xlarge, ml.c5d.2xlarge, ml.c5d.4xlarge, ml.c5d.9xlarge, ml.c5d.18xlarge, ml.g4dn.xlarge, ml.g4dn.2xlarge, ml.g4dn.4xlarge, ml.g4dn.8xlarge, ml.g4dn.12xlarge, ml.g4dn.16xlarge, ml.r5.large, ml.r5.xlarge, ml.r5.2xlarge, ml.r5.4xlarge, ml.r5.12xlarge, ml.r5.24xlarge, ml.r5d.large, ml.r5d.xlarge, ml.r5d.2xlarge, ml.r5d.4xlarge, ml.r5d.12xlarge, ml.r5d.24xlarge, ml.inf1.xlarge, ml.inf1.2xlarge, ml.inf1.6xlarge, ml.inf1.24xlarge, ml.c6i.large, ml.c6i.xlarge, ml.c6i.2xlarge, ml.c6i.4xlarge, ml.c6i.8xlarge, ml.c6i.12xlarge, ml.c6i.16xlarge, ml.c6i.24xlarge, ml.c6i.32xlarge, ml.g5.xlarge, ml.g5.2xlarge, ml.g5.4xlarge, ml.g5.8xlarge, ml.g5.12xlarge, ml.g5.16xlarge, ml.g5.24xlarge, ml.g5.48xlarge, ml.p4d.24xlarge, ml.c7g.large, ml.c7g.xlarge, ml.c7g.2xlarge, ml.c7g.4xlarge, ml.c7g.8xlarge, ml.c7g.12xlarge, ml.c7g.16xlarge, ml.m6g.large, ml.m6g.xlarge, ml.m6g.2xlarge, ml.m6g.4xlarge, ml.m6g.8xlarge, ml.m6g.12xlarge, ml.m6g.16xlarge, ml.m6gd.large, ml.m6gd.xlarge, ml.m6gd.2xlarge, ml.m6gd.4xlarge, ml.m6gd.8xlarge, ml.m6gd.12xlarge, ml.m6gd.16xlarge, ml.c6g.large, ml.c6g.xlarge, ml.c6g.2xlarge, ml.c6g.4xlarge, ml.c6g.8xlarge, ml.c6g.12xlarge, ml.c6g.16xlarge, ml.c6gd.large, ml.c6gd.xlarge, ml.c6gd.2xlarge, ml.c6gd.4xlarge, ml.c6gd.8xlarge, ml.c6gd.12xlarge, ml.c6gd.16xlarge, ml.c6gn.large, ml.c6gn.xlarge, ml.c6gn.2xlarge, ml.c6gn.4xlarge, ml.c6gn.8xlarge, 
ml.c6gn.12xlarge, ml.c6gn.16xlarge, ml.r6g.large, ml.r6g.xlarge, ml.r6g.2xlarge, ml.r6g.4xlarge, ml.r6g.8xlarge, ml.r6g.12xlarge, ml.r6g.16xlarge, ml.r6gd.large, ml.r6gd.xlarge, ml.r6gd.2xlarge, ml.r6gd.4xlarge, ml.r6gd.8xlarge, ml.r6gd.12xlarge, ml.r6gd.16xlarge, ml.p4de.24xlarge, ml.trn1.2xlarge, ml.trn1.32xlarge, ml.inf2.xlarge, ml.inf2.8xlarge, ml.inf2.24xlarge, ml.inf2.48xlarge
4463
4463
  # inference_specification_name: "InferenceSpecificationName",
4464
4464
  # environment_parameter_ranges: {
4465
4465
  # categorical_parameter_ranges: [
@@ -4469,6 +4469,11 @@ module Aws::SageMaker
4469
4469
  # },
4470
4470
  # ],
4471
4471
  # },
4472
+ # serverless_config: {
4473
+ # memory_size_in_mb: 1, # required
4474
+ # max_concurrency: 1, # required
4475
+ # provisioned_concurrency: 1,
4476
+ # },
4472
4477
  # },
4473
4478
  # ],
4474
4479
  # volume_kms_key_id: "KmsKeyId",
@@ -4484,6 +4489,7 @@ module Aws::SageMaker
4484
4489
  # nearest_model_name: "String",
4485
4490
  # supported_instance_types: ["String"],
4486
4491
  # data_input_config: "RecommendationJobDataInputConfig",
4492
+ # supported_endpoint_type: "RealTime", # accepts RealTime, Serverless
4487
4493
  # },
4488
4494
  # endpoints: [
4489
4495
  # {
@@ -12296,6 +12302,9 @@ module Aws::SageMaker
12296
12302
  # resp.input_config.endpoint_configurations[0].environment_parameter_ranges.categorical_parameter_ranges[0].name #=> String
12297
12303
  # resp.input_config.endpoint_configurations[0].environment_parameter_ranges.categorical_parameter_ranges[0].value #=> Array
12298
12304
  # resp.input_config.endpoint_configurations[0].environment_parameter_ranges.categorical_parameter_ranges[0].value[0] #=> String
12305
+ # resp.input_config.endpoint_configurations[0].serverless_config.memory_size_in_mb #=> Integer
12306
+ # resp.input_config.endpoint_configurations[0].serverless_config.max_concurrency #=> Integer
12307
+ # resp.input_config.endpoint_configurations[0].serverless_config.provisioned_concurrency #=> Integer
12299
12308
  # resp.input_config.volume_kms_key_id #=> String
12300
12309
  # resp.input_config.container_config.domain #=> String
12301
12310
  # resp.input_config.container_config.task #=> String
@@ -12308,6 +12317,7 @@ module Aws::SageMaker
12308
12317
  # resp.input_config.container_config.supported_instance_types #=> Array
12309
12318
  # resp.input_config.container_config.supported_instance_types[0] #=> String
12310
12319
  # resp.input_config.container_config.data_input_config #=> String
12320
+ # resp.input_config.container_config.supported_endpoint_type #=> String, one of "RealTime", "Serverless"
12311
12321
  # resp.input_config.endpoints #=> Array
12312
12322
  # resp.input_config.endpoints[0].endpoint_name #=> String
12313
12323
  # resp.input_config.vpc_config.security_group_ids #=> Array
@@ -12326,10 +12336,14 @@ module Aws::SageMaker
12326
12336
  # resp.inference_recommendations[0].metrics.model_latency #=> Integer
12327
12337
  # resp.inference_recommendations[0].metrics.cpu_utilization #=> Float
12328
12338
  # resp.inference_recommendations[0].metrics.memory_utilization #=> Float
12339
+ # resp.inference_recommendations[0].metrics.model_setup_time #=> Integer
12329
12340
  # resp.inference_recommendations[0].endpoint_configuration.endpoint_name #=> String
12330
12341
  # resp.inference_recommendations[0].endpoint_configuration.variant_name #=> String
12331
12342
  # resp.inference_recommendations[0].endpoint_configuration.instance_type #=> String, one of "ml.t2.medium", "ml.t2.large", "ml.t2.xlarge", "ml.t2.2xlarge", "ml.m4.xlarge", "ml.m4.2xlarge", "ml.m4.4xlarge", "ml.m4.10xlarge", "ml.m4.16xlarge", "ml.m5.large", "ml.m5.xlarge", "ml.m5.2xlarge", "ml.m5.4xlarge", "ml.m5.12xlarge", "ml.m5.24xlarge", "ml.m5d.large", "ml.m5d.xlarge", "ml.m5d.2xlarge", "ml.m5d.4xlarge", "ml.m5d.12xlarge", "ml.m5d.24xlarge", "ml.c4.large", "ml.c4.xlarge", "ml.c4.2xlarge", "ml.c4.4xlarge", "ml.c4.8xlarge", "ml.p2.xlarge", "ml.p2.8xlarge", "ml.p2.16xlarge", "ml.p3.2xlarge", "ml.p3.8xlarge", "ml.p3.16xlarge", "ml.c5.large", "ml.c5.xlarge", "ml.c5.2xlarge", "ml.c5.4xlarge", "ml.c5.9xlarge", "ml.c5.18xlarge", "ml.c5d.large", "ml.c5d.xlarge", "ml.c5d.2xlarge", "ml.c5d.4xlarge", "ml.c5d.9xlarge", "ml.c5d.18xlarge", "ml.g4dn.xlarge", "ml.g4dn.2xlarge", "ml.g4dn.4xlarge", "ml.g4dn.8xlarge", "ml.g4dn.12xlarge", "ml.g4dn.16xlarge", "ml.r5.large", "ml.r5.xlarge", "ml.r5.2xlarge", "ml.r5.4xlarge", "ml.r5.12xlarge", "ml.r5.24xlarge", "ml.r5d.large", "ml.r5d.xlarge", "ml.r5d.2xlarge", "ml.r5d.4xlarge", "ml.r5d.12xlarge", "ml.r5d.24xlarge", "ml.inf1.xlarge", "ml.inf1.2xlarge", "ml.inf1.6xlarge", "ml.inf1.24xlarge", "ml.c6i.large", "ml.c6i.xlarge", "ml.c6i.2xlarge", "ml.c6i.4xlarge", "ml.c6i.8xlarge", "ml.c6i.12xlarge", "ml.c6i.16xlarge", "ml.c6i.24xlarge", "ml.c6i.32xlarge", "ml.g5.xlarge", "ml.g5.2xlarge", "ml.g5.4xlarge", "ml.g5.8xlarge", "ml.g5.12xlarge", "ml.g5.16xlarge", "ml.g5.24xlarge", "ml.g5.48xlarge", "ml.p4d.24xlarge", "ml.c7g.large", "ml.c7g.xlarge", "ml.c7g.2xlarge", "ml.c7g.4xlarge", "ml.c7g.8xlarge", "ml.c7g.12xlarge", "ml.c7g.16xlarge", "ml.m6g.large", "ml.m6g.xlarge", "ml.m6g.2xlarge", "ml.m6g.4xlarge", "ml.m6g.8xlarge", "ml.m6g.12xlarge", "ml.m6g.16xlarge", "ml.m6gd.large", "ml.m6gd.xlarge", "ml.m6gd.2xlarge", "ml.m6gd.4xlarge", "ml.m6gd.8xlarge", "ml.m6gd.12xlarge", "ml.m6gd.16xlarge", "ml.c6g.large", "ml.c6g.xlarge", "ml.c6g.2xlarge", 
"ml.c6g.4xlarge", "ml.c6g.8xlarge", "ml.c6g.12xlarge", "ml.c6g.16xlarge", "ml.c6gd.large", "ml.c6gd.xlarge", "ml.c6gd.2xlarge", "ml.c6gd.4xlarge", "ml.c6gd.8xlarge", "ml.c6gd.12xlarge", "ml.c6gd.16xlarge", "ml.c6gn.large", "ml.c6gn.xlarge", "ml.c6gn.2xlarge", "ml.c6gn.4xlarge", "ml.c6gn.8xlarge", "ml.c6gn.12xlarge", "ml.c6gn.16xlarge", "ml.r6g.large", "ml.r6g.xlarge", "ml.r6g.2xlarge", "ml.r6g.4xlarge", "ml.r6g.8xlarge", "ml.r6g.12xlarge", "ml.r6g.16xlarge", "ml.r6gd.large", "ml.r6gd.xlarge", "ml.r6gd.2xlarge", "ml.r6gd.4xlarge", "ml.r6gd.8xlarge", "ml.r6gd.12xlarge", "ml.r6gd.16xlarge", "ml.p4de.24xlarge", "ml.trn1.2xlarge", "ml.trn1.32xlarge", "ml.inf2.xlarge", "ml.inf2.8xlarge", "ml.inf2.24xlarge", "ml.inf2.48xlarge"
12332
12343
  # resp.inference_recommendations[0].endpoint_configuration.initial_instance_count #=> Integer
12344
+ # resp.inference_recommendations[0].endpoint_configuration.serverless_config.memory_size_in_mb #=> Integer
12345
+ # resp.inference_recommendations[0].endpoint_configuration.serverless_config.max_concurrency #=> Integer
12346
+ # resp.inference_recommendations[0].endpoint_configuration.serverless_config.provisioned_concurrency #=> Integer
12333
12347
  # resp.inference_recommendations[0].model_configuration.inference_specification_name #=> String
12334
12348
  # resp.inference_recommendations[0].model_configuration.environment_parameters #=> Array
12335
12349
  # resp.inference_recommendations[0].model_configuration.environment_parameters[0].key #=> String
@@ -17360,10 +17374,14 @@ module Aws::SageMaker
17360
17374
  # resp.steps[0].inference_benchmark.metrics.model_latency #=> Integer
17361
17375
  # resp.steps[0].inference_benchmark.metrics.cpu_utilization #=> Float
17362
17376
  # resp.steps[0].inference_benchmark.metrics.memory_utilization #=> Float
17377
+ # resp.steps[0].inference_benchmark.metrics.model_setup_time #=> Integer
17363
17378
  # resp.steps[0].inference_benchmark.endpoint_configuration.endpoint_name #=> String
17364
17379
  # resp.steps[0].inference_benchmark.endpoint_configuration.variant_name #=> String
17365
17380
  # resp.steps[0].inference_benchmark.endpoint_configuration.instance_type #=> String, one of "ml.t2.medium", "ml.t2.large", "ml.t2.xlarge", "ml.t2.2xlarge", "ml.m4.xlarge", "ml.m4.2xlarge", "ml.m4.4xlarge", "ml.m4.10xlarge", "ml.m4.16xlarge", "ml.m5.large", "ml.m5.xlarge", "ml.m5.2xlarge", "ml.m5.4xlarge", "ml.m5.12xlarge", "ml.m5.24xlarge", "ml.m5d.large", "ml.m5d.xlarge", "ml.m5d.2xlarge", "ml.m5d.4xlarge", "ml.m5d.12xlarge", "ml.m5d.24xlarge", "ml.c4.large", "ml.c4.xlarge", "ml.c4.2xlarge", "ml.c4.4xlarge", "ml.c4.8xlarge", "ml.p2.xlarge", "ml.p2.8xlarge", "ml.p2.16xlarge", "ml.p3.2xlarge", "ml.p3.8xlarge", "ml.p3.16xlarge", "ml.c5.large", "ml.c5.xlarge", "ml.c5.2xlarge", "ml.c5.4xlarge", "ml.c5.9xlarge", "ml.c5.18xlarge", "ml.c5d.large", "ml.c5d.xlarge", "ml.c5d.2xlarge", "ml.c5d.4xlarge", "ml.c5d.9xlarge", "ml.c5d.18xlarge", "ml.g4dn.xlarge", "ml.g4dn.2xlarge", "ml.g4dn.4xlarge", "ml.g4dn.8xlarge", "ml.g4dn.12xlarge", "ml.g4dn.16xlarge", "ml.r5.large", "ml.r5.xlarge", "ml.r5.2xlarge", "ml.r5.4xlarge", "ml.r5.12xlarge", "ml.r5.24xlarge", "ml.r5d.large", "ml.r5d.xlarge", "ml.r5d.2xlarge", "ml.r5d.4xlarge", "ml.r5d.12xlarge", "ml.r5d.24xlarge", "ml.inf1.xlarge", "ml.inf1.2xlarge", "ml.inf1.6xlarge", "ml.inf1.24xlarge", "ml.c6i.large", "ml.c6i.xlarge", "ml.c6i.2xlarge", "ml.c6i.4xlarge", "ml.c6i.8xlarge", "ml.c6i.12xlarge", "ml.c6i.16xlarge", "ml.c6i.24xlarge", "ml.c6i.32xlarge", "ml.g5.xlarge", "ml.g5.2xlarge", "ml.g5.4xlarge", "ml.g5.8xlarge", "ml.g5.12xlarge", "ml.g5.16xlarge", "ml.g5.24xlarge", "ml.g5.48xlarge", "ml.p4d.24xlarge", "ml.c7g.large", "ml.c7g.xlarge", "ml.c7g.2xlarge", "ml.c7g.4xlarge", "ml.c7g.8xlarge", "ml.c7g.12xlarge", "ml.c7g.16xlarge", "ml.m6g.large", "ml.m6g.xlarge", "ml.m6g.2xlarge", "ml.m6g.4xlarge", "ml.m6g.8xlarge", "ml.m6g.12xlarge", "ml.m6g.16xlarge", "ml.m6gd.large", "ml.m6gd.xlarge", "ml.m6gd.2xlarge", "ml.m6gd.4xlarge", "ml.m6gd.8xlarge", "ml.m6gd.12xlarge", "ml.m6gd.16xlarge", "ml.c6g.large", "ml.c6g.xlarge", "ml.c6g.2xlarge", 
"ml.c6g.4xlarge", "ml.c6g.8xlarge", "ml.c6g.12xlarge", "ml.c6g.16xlarge", "ml.c6gd.large", "ml.c6gd.xlarge", "ml.c6gd.2xlarge", "ml.c6gd.4xlarge", "ml.c6gd.8xlarge", "ml.c6gd.12xlarge", "ml.c6gd.16xlarge", "ml.c6gn.large", "ml.c6gn.xlarge", "ml.c6gn.2xlarge", "ml.c6gn.4xlarge", "ml.c6gn.8xlarge", "ml.c6gn.12xlarge", "ml.c6gn.16xlarge", "ml.r6g.large", "ml.r6g.xlarge", "ml.r6g.2xlarge", "ml.r6g.4xlarge", "ml.r6g.8xlarge", "ml.r6g.12xlarge", "ml.r6g.16xlarge", "ml.r6gd.large", "ml.r6gd.xlarge", "ml.r6gd.2xlarge", "ml.r6gd.4xlarge", "ml.r6gd.8xlarge", "ml.r6gd.12xlarge", "ml.r6gd.16xlarge", "ml.p4de.24xlarge", "ml.trn1.2xlarge", "ml.trn1.32xlarge", "ml.inf2.xlarge", "ml.inf2.8xlarge", "ml.inf2.24xlarge", "ml.inf2.48xlarge"
17366
17381
  # resp.steps[0].inference_benchmark.endpoint_configuration.initial_instance_count #=> Integer
17382
+ # resp.steps[0].inference_benchmark.endpoint_configuration.serverless_config.memory_size_in_mb #=> Integer
17383
+ # resp.steps[0].inference_benchmark.endpoint_configuration.serverless_config.max_concurrency #=> Integer
17384
+ # resp.steps[0].inference_benchmark.endpoint_configuration.serverless_config.provisioned_concurrency #=> Integer
17367
17385
  # resp.steps[0].inference_benchmark.model_configuration.inference_specification_name #=> String
17368
17386
  # resp.steps[0].inference_benchmark.model_configuration.environment_parameters #=> Array
17369
17387
  # resp.steps[0].inference_benchmark.model_configuration.environment_parameters[0].key #=> String
@@ -23848,7 +23866,7 @@ module Aws::SageMaker
23848
23866
  params: params,
23849
23867
  config: config)
23850
23868
  context[:gem_name] = 'aws-sdk-sagemaker'
23851
- context[:gem_version] = '1.193.0'
23869
+ context[:gem_version] = '1.194.0'
23852
23870
  Seahorse::Client::Request.new(handlers, context)
23853
23871
  end
23854
23872
 
@@ -963,6 +963,7 @@ module Aws::SageMaker
963
963
  InferenceRecommendationsJobs = Shapes::ListShape.new(name: 'InferenceRecommendationsJobs')
964
964
  InferenceSpecification = Shapes::StructureShape.new(name: 'InferenceSpecification')
965
965
  InferenceSpecificationName = Shapes::StringShape.new(name: 'InferenceSpecificationName')
966
+ InitialInstanceCount = Shapes::IntegerShape.new(name: 'InitialInstanceCount')
966
967
  InitialNumberOfUsers = Shapes::IntegerShape.new(name: 'InitialNumberOfUsers')
967
968
  InitialTaskCount = Shapes::IntegerShape.new(name: 'InitialTaskCount')
968
969
  InputConfig = Shapes::StructureShape.new(name: 'InputConfig')
@@ -1322,6 +1323,7 @@ module Aws::SageMaker
1322
1323
  ModelQualityBaselineConfig = Shapes::StructureShape.new(name: 'ModelQualityBaselineConfig')
1323
1324
  ModelQualityJobInput = Shapes::StructureShape.new(name: 'ModelQualityJobInput')
1324
1325
  ModelRegisterSettings = Shapes::StructureShape.new(name: 'ModelRegisterSettings')
1326
+ ModelSetupTime = Shapes::IntegerShape.new(name: 'ModelSetupTime')
1325
1327
  ModelSortKey = Shapes::StringShape.new(name: 'ModelSortKey')
1326
1328
  ModelStepMetadata = Shapes::StructureShape.new(name: 'ModelStepMetadata')
1327
1329
  ModelSummary = Shapes::StructureShape.new(name: 'ModelSummary')
@@ -1616,6 +1618,7 @@ module Aws::SageMaker
1616
1618
  RecommendationJobStatus = Shapes::StringShape.new(name: 'RecommendationJobStatus')
1617
1619
  RecommendationJobStoppingConditions = Shapes::StructureShape.new(name: 'RecommendationJobStoppingConditions')
1618
1620
  RecommendationJobSupportedContentTypes = Shapes::ListShape.new(name: 'RecommendationJobSupportedContentTypes')
1621
+ RecommendationJobSupportedEndpointType = Shapes::StringShape.new(name: 'RecommendationJobSupportedEndpointType')
1619
1622
  RecommendationJobSupportedInstanceTypes = Shapes::ListShape.new(name: 'RecommendationJobSupportedInstanceTypes')
1620
1623
  RecommendationJobType = Shapes::StringShape.new(name: 'RecommendationJobType')
1621
1624
  RecommendationJobVpcConfig = Shapes::StructureShape.new(name: 'RecommendationJobVpcConfig')
@@ -4968,9 +4971,10 @@ module Aws::SageMaker
4968
4971
  EndpointInput.add_member(:end_time_offset, Shapes::ShapeRef.new(shape: MonitoringTimeOffsetString, location_name: "EndTimeOffset"))
4969
4972
  EndpointInput.struct_class = Types::EndpointInput
4970
4973
 
4971
- EndpointInputConfiguration.add_member(:instance_type, Shapes::ShapeRef.new(shape: ProductionVariantInstanceType, required: true, location_name: "InstanceType"))
4974
+ EndpointInputConfiguration.add_member(:instance_type, Shapes::ShapeRef.new(shape: ProductionVariantInstanceType, location_name: "InstanceType"))
4972
4975
  EndpointInputConfiguration.add_member(:inference_specification_name, Shapes::ShapeRef.new(shape: InferenceSpecificationName, location_name: "InferenceSpecificationName"))
4973
4976
  EndpointInputConfiguration.add_member(:environment_parameter_ranges, Shapes::ShapeRef.new(shape: EnvironmentParameterRanges, location_name: "EnvironmentParameterRanges"))
4977
+ EndpointInputConfiguration.add_member(:serverless_config, Shapes::ShapeRef.new(shape: ProductionVariantServerlessConfig, location_name: "ServerlessConfig"))
4974
4978
  EndpointInputConfiguration.struct_class = Types::EndpointInputConfiguration
4975
4979
 
4976
4980
  EndpointInputConfigurations.member = Shapes::ShapeRef.new(shape: EndpointInputConfiguration)
@@ -4983,8 +4987,9 @@ module Aws::SageMaker
4983
4987
 
4984
4988
  EndpointOutputConfiguration.add_member(:endpoint_name, Shapes::ShapeRef.new(shape: String, required: true, location_name: "EndpointName"))
4985
4989
  EndpointOutputConfiguration.add_member(:variant_name, Shapes::ShapeRef.new(shape: String, required: true, location_name: "VariantName"))
4986
- EndpointOutputConfiguration.add_member(:instance_type, Shapes::ShapeRef.new(shape: ProductionVariantInstanceType, required: true, location_name: "InstanceType"))
4987
- EndpointOutputConfiguration.add_member(:initial_instance_count, Shapes::ShapeRef.new(shape: Integer, required: true, location_name: "InitialInstanceCount"))
4990
+ EndpointOutputConfiguration.add_member(:instance_type, Shapes::ShapeRef.new(shape: ProductionVariantInstanceType, location_name: "InstanceType"))
4991
+ EndpointOutputConfiguration.add_member(:initial_instance_count, Shapes::ShapeRef.new(shape: InitialInstanceCount, location_name: "InitialInstanceCount"))
4992
+ EndpointOutputConfiguration.add_member(:serverless_config, Shapes::ShapeRef.new(shape: ProductionVariantServerlessConfig, location_name: "ServerlessConfig"))
4988
4993
  EndpointOutputConfiguration.struct_class = Types::EndpointOutputConfiguration
4989
4994
 
4990
4995
  EndpointPerformance.add_member(:metrics, Shapes::ShapeRef.new(shape: InferenceMetrics, required: true, location_name: "Metrics"))
@@ -7867,6 +7872,7 @@ module Aws::SageMaker
7867
7872
  RecommendationJobContainerConfig.add_member(:nearest_model_name, Shapes::ShapeRef.new(shape: String, location_name: "NearestModelName"))
7868
7873
  RecommendationJobContainerConfig.add_member(:supported_instance_types, Shapes::ShapeRef.new(shape: RecommendationJobSupportedInstanceTypes, location_name: "SupportedInstanceTypes"))
7869
7874
  RecommendationJobContainerConfig.add_member(:data_input_config, Shapes::ShapeRef.new(shape: RecommendationJobDataInputConfig, location_name: "DataInputConfig"))
7875
+ RecommendationJobContainerConfig.add_member(:supported_endpoint_type, Shapes::ShapeRef.new(shape: RecommendationJobSupportedEndpointType, location_name: "SupportedEndpointType"))
7870
7876
  RecommendationJobContainerConfig.struct_class = Types::RecommendationJobContainerConfig
7871
7877
 
7872
7878
  RecommendationJobInferenceBenchmark.add_member(:metrics, Shapes::ShapeRef.new(shape: RecommendationMetrics, location_name: "Metrics"))
@@ -7924,6 +7930,7 @@ module Aws::SageMaker
7924
7930
  RecommendationMetrics.add_member(:model_latency, Shapes::ShapeRef.new(shape: Integer, required: true, location_name: "ModelLatency"))
7925
7931
  RecommendationMetrics.add_member(:cpu_utilization, Shapes::ShapeRef.new(shape: UtilizationMetric, location_name: "CpuUtilization"))
7926
7932
  RecommendationMetrics.add_member(:memory_utilization, Shapes::ShapeRef.new(shape: UtilizationMetric, location_name: "MemoryUtilization"))
7933
+ RecommendationMetrics.add_member(:model_setup_time, Shapes::ShapeRef.new(shape: ModelSetupTime, location_name: "ModelSetupTime"))
7927
7934
  RecommendationMetrics.struct_class = Types::RecommendationMetrics
7928
7935
 
7929
7936
  RedshiftDatasetDefinition.add_member(:cluster_id, Shapes::ShapeRef.new(shape: RedshiftClusterId, required: true, location_name: "ClusterId"))
@@ -2415,6 +2415,12 @@ module Aws::SageMaker
2415
2415
  # @!attribute [rw] time_series_forecasting_job_config
2416
2416
  # Settings used to configure an AutoML job V2 for a time-series
2417
2417
  # forecasting problem type.
2418
+ #
2419
+ # <note markdown="1"> The `TimeSeriesForecastingJobConfig` problem type is only available
2420
+ # in private beta. Contact Amazon Web Services Support or your account
2421
+ # manager to learn more about access privileges.
2422
+ #
2423
+ # </note>
2418
2424
  # @return [Types::TimeSeriesForecastingJobConfig]
2419
2425
  #
2420
2426
  # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/AutoMLProblemTypeConfig AWS API Documentation
@@ -17129,12 +17135,17 @@ module Aws::SageMaker
17129
17135
  # The parameter you want to benchmark against.
17130
17136
  # @return [Types::EnvironmentParameterRanges]
17131
17137
  #
17138
+ # @!attribute [rw] serverless_config
17139
+ # Specifies the serverless configuration for an endpoint variant.
17140
+ # @return [Types::ProductionVariantServerlessConfig]
17141
+ #
17132
17142
  # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/EndpointInputConfiguration AWS API Documentation
17133
17143
  #
17134
17144
  class EndpointInputConfiguration < Struct.new(
17135
17145
  :instance_type,
17136
17146
  :inference_specification_name,
17137
- :environment_parameter_ranges)
17147
+ :environment_parameter_ranges,
17148
+ :serverless_config)
17138
17149
  SENSITIVE = []
17139
17150
  include Aws::Structure
17140
17151
  end
@@ -17196,13 +17207,18 @@ module Aws::SageMaker
17196
17207
  # The number of instances recommended to launch initially.
17197
17208
  # @return [Integer]
17198
17209
  #
17210
+ # @!attribute [rw] serverless_config
17211
+ # Specifies the serverless configuration for an endpoint variant.
17212
+ # @return [Types::ProductionVariantServerlessConfig]
17213
+ #
17199
17214
  # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/EndpointOutputConfiguration AWS API Documentation
17200
17215
  #
17201
17216
  class EndpointOutputConfiguration < Struct.new(
17202
17217
  :endpoint_name,
17203
17218
  :variant_name,
17204
17219
  :instance_type,
17205
- :initial_instance_count)
17220
+ :initial_instance_count,
17221
+ :serverless_config)
17206
17222
  SENSITIVE = []
17207
17223
  include Aws::Structure
17208
17224
  end
@@ -32884,6 +32900,17 @@ module Aws::SageMaker
32884
32900
  # @!attribute [rw] provisioned_concurrency
32885
32901
  # The amount of provisioned concurrency to allocate for the serverless
32886
32902
  # endpoint. Should be less than or equal to `MaxConcurrency`.
32903
+ #
32904
+ # <note markdown="1"> This field is not supported for serverless endpoint recommendations
32905
+ # for Inference Recommender jobs. For more information about creating
32906
+ # an Inference Recommender job, see
32907
+ # [CreateInferenceRecommendationsJob][1].
32908
+ #
32909
+ # </note>
32910
+ #
32911
+ #
32912
+ #
32913
+ # [1]: https://docs.aws.amazon.com/sagemaker/latest/APIReference/API_CreateInferenceRecommendationsJob.html
32887
32914
  # @return [Integer]
32888
32915
  #
32889
32916
  # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/ProductionVariantServerlessConfig AWS API Documentation
@@ -34088,6 +34115,14 @@ module Aws::SageMaker
34088
34115
  # [1]: https://docs.aws.amazon.com/sagemaker/latest/APIReference/API_InputConfig.html#sagemaker-Type-InputConfig-DataInputConfig
34089
34116
  # @return [String]
34090
34117
  #
34118
+ # @!attribute [rw] supported_endpoint_type
34119
+ # The endpoint type to receive recommendations for. By default this is
34120
+ # null, and the results of the inference recommendation job return a
34121
+ # combined list of both real-time and serverless benchmarks. By
34122
+ # specifying a value for this field, you can receive a longer list of
34123
+ # benchmarks for the desired endpoint type.
34124
+ # @return [String]
34125
+ #
34091
34126
  # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/RecommendationJobContainerConfig AWS API Documentation
34092
34127
  #
34093
34128
  class RecommendationJobContainerConfig < Struct.new(
@@ -34098,7 +34133,8 @@ module Aws::SageMaker
34098
34133
  :payload_config,
34099
34134
  :nearest_model_name,
34100
34135
  :supported_instance_types,
34101
- :data_input_config)
34136
+ :data_input_config,
34137
+ :supported_endpoint_type)
34102
34138
  SENSITIVE = []
34103
34139
  include Aws::Structure
34104
34140
  end
@@ -34422,6 +34458,14 @@ module Aws::SageMaker
34422
34458
  # `NaN` indicates that the value is not available.
34423
34459
  # @return [Float]
34424
34460
  #
34461
+ # @!attribute [rw] model_setup_time
34462
+ # The time it takes to launch new compute resources for a serverless
34463
+ # endpoint. The time can vary depending on the model size, how long it
34464
+ # takes to download the model, and the start-up time of the container.
34465
+ #
34466
+ # `NaN` indicates that the value is not available.
34467
+ # @return [Integer]
34468
+ #
34425
34469
  # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/RecommendationMetrics AWS API Documentation
34426
34470
  #
34427
34471
  class RecommendationMetrics < Struct.new(
@@ -34430,7 +34474,8 @@ module Aws::SageMaker
34430
34474
  :max_invocations,
34431
34475
  :model_latency,
34432
34476
  :cpu_utilization,
34433
- :memory_utilization)
34477
+ :memory_utilization,
34478
+ :model_setup_time)
34434
34479
  SENSITIVE = []
34435
34480
  include Aws::Structure
34436
34481
  end
@@ -35012,10 +35057,15 @@ module Aws::SageMaker
35012
35057
  # endpoint.
35013
35058
  #
35014
35059
  # @!attribute [rw] maximum_batch_size
35015
- # Batch size for each rolling step to provision capacity and turn on
35016
- # traffic on the new endpoint fleet, and terminate capacity on the old
35017
- # endpoint fleet. Value must be between 5% to 50% of the variant's
35018
- # total instance count.
35060
+ # Specifies the type and size of the endpoint capacity to activate for
35061
+ # a blue/green deployment, a rolling deployment, or a rollback
35062
+ # strategy. You can specify your batches as either instance count or
35063
+ # the overall percentage of your fleet.
35064
+ #
35065
+ # For a rollback strategy, if you don't specify the fields in this
35066
+ # object, or if you set the `Value` to 100%, then SageMaker uses a
35067
+ # blue/green rollback strategy and rolls all traffic back to the blue
35068
+ # fleet.
35019
35069
  # @return [Types::CapacitySize]
35020
35070
  #
35021
35071
  # @!attribute [rw] wait_interval_in_seconds
@@ -35029,12 +35079,15 @@ module Aws::SageMaker
35029
35079
  # @return [Integer]
35030
35080
  #
35031
35081
  # @!attribute [rw] rollback_maximum_batch_size
35032
- # Batch size for rollback to the old endpoint fleet. Each rolling step
35033
- # to provision capacity and turn on traffic on the old endpoint fleet,
35034
- # and terminate capacity on the new endpoint fleet. If this field is
35035
- # absent, the default value will be set to 100% of total capacity
35036
- # which means to bring up the whole capacity of the old fleet at once
35037
- # during rollback.
35082
+ # Specifies the type and size of the endpoint capacity to activate for
35083
+ # a blue/green deployment, a rolling deployment, or a rollback
35084
+ # strategy. You can specify your batches as either instance count or
35085
+ # the overall percentage of your fleet.
35086
+ #
35087
+ # For a rollback strategy, if you don't specify the fields in this
35088
+ # object, or if you set the `Value` to 100%, then SageMaker uses a
35089
+ # blue/green rollback strategy and rolls all traffic back to the blue
35090
+ # fleet.
35038
35091
  # @return [Types::CapacitySize]
35039
35092
  #
35040
35093
  # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/RollingUpdatePolicy AWS API Documentation
@@ -53,6 +53,6 @@ require_relative 'aws-sdk-sagemaker/customizations'
53
53
  # @!group service
54
54
  module Aws::SageMaker
55
55
 
56
- GEM_VERSION = '1.193.0'
56
+ GEM_VERSION = '1.194.0'
57
57
 
58
58
  end
metadata CHANGED
@@ -1,14 +1,14 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: aws-sdk-sagemaker
3
3
  version: !ruby/object:Gem::Version
4
- version: 1.193.0
4
+ version: 1.194.0
5
5
  platform: ruby
6
6
  authors:
7
7
  - Amazon Web Services
8
8
  autorequire:
9
9
  bindir: bin
10
10
  cert_chain: []
11
- date: 2023-06-30 00:00:00.000000000 Z
11
+ date: 2023-07-03 00:00:00.000000000 Z
12
12
  dependencies:
13
13
  - !ruby/object:Gem::Dependency
14
14
  name: aws-sdk-core