aws-sdk-sagemaker 1.275.0 → 1.276.0

Sign up to get free protection for your applications and to get access to all the features.
@@ -1535,6 +1535,7 @@ module Aws::SageMaker
1535
1535
  ModelQuantizationConfig = Shapes::StructureShape.new(name: 'ModelQuantizationConfig')
1536
1536
  ModelRegisterSettings = Shapes::StructureShape.new(name: 'ModelRegisterSettings')
1537
1537
  ModelSetupTime = Shapes::IntegerShape.new(name: 'ModelSetupTime')
1538
+ ModelShardingConfig = Shapes::StructureShape.new(name: 'ModelShardingConfig')
1538
1539
  ModelSortKey = Shapes::StringShape.new(name: 'ModelSortKey')
1539
1540
  ModelStepMetadata = Shapes::StructureShape.new(name: 'ModelStepMetadata')
1540
1541
  ModelSummary = Shapes::StructureShape.new(name: 'ModelSummary')
@@ -3002,6 +3003,7 @@ module Aws::SageMaker
3002
3003
  ClusterInstanceGroupDetails.add_member(:threads_per_core, Shapes::ShapeRef.new(shape: ClusterThreadsPerCore, location_name: "ThreadsPerCore"))
3003
3004
  ClusterInstanceGroupDetails.add_member(:instance_storage_configs, Shapes::ShapeRef.new(shape: ClusterInstanceStorageConfigs, location_name: "InstanceStorageConfigs"))
3004
3005
  ClusterInstanceGroupDetails.add_member(:on_start_deep_health_checks, Shapes::ShapeRef.new(shape: OnStartDeepHealthChecks, location_name: "OnStartDeepHealthChecks"))
3006
+ ClusterInstanceGroupDetails.add_member(:override_vpc_config, Shapes::ShapeRef.new(shape: VpcConfig, location_name: "OverrideVpcConfig"))
3005
3007
  ClusterInstanceGroupDetails.struct_class = Types::ClusterInstanceGroupDetails
3006
3008
 
3007
3009
  ClusterInstanceGroupDetailsList.member = Shapes::ShapeRef.new(shape: ClusterInstanceGroupDetails)
@@ -3014,6 +3016,7 @@ module Aws::SageMaker
3014
3016
  ClusterInstanceGroupSpecification.add_member(:threads_per_core, Shapes::ShapeRef.new(shape: ClusterThreadsPerCore, location_name: "ThreadsPerCore"))
3015
3017
  ClusterInstanceGroupSpecification.add_member(:instance_storage_configs, Shapes::ShapeRef.new(shape: ClusterInstanceStorageConfigs, location_name: "InstanceStorageConfigs"))
3016
3018
  ClusterInstanceGroupSpecification.add_member(:on_start_deep_health_checks, Shapes::ShapeRef.new(shape: OnStartDeepHealthChecks, location_name: "OnStartDeepHealthChecks"))
3019
+ ClusterInstanceGroupSpecification.add_member(:override_vpc_config, Shapes::ShapeRef.new(shape: VpcConfig, location_name: "OverrideVpcConfig"))
3017
3020
  ClusterInstanceGroupSpecification.struct_class = Types::ClusterInstanceGroupSpecification
3018
3021
 
3019
3022
  ClusterInstanceGroupSpecifications.member = Shapes::ShapeRef.new(shape: ClusterInstanceGroupSpecification)
@@ -3044,6 +3047,7 @@ module Aws::SageMaker
3044
3047
  ClusterNodeDetails.add_member(:instance_type, Shapes::ShapeRef.new(shape: ClusterInstanceType, location_name: "InstanceType"))
3045
3048
  ClusterNodeDetails.add_member(:launch_time, Shapes::ShapeRef.new(shape: Timestamp, location_name: "LaunchTime"))
3046
3049
  ClusterNodeDetails.add_member(:life_cycle_config, Shapes::ShapeRef.new(shape: ClusterLifeCycleConfig, location_name: "LifeCycleConfig"))
3050
+ ClusterNodeDetails.add_member(:override_vpc_config, Shapes::ShapeRef.new(shape: VpcConfig, location_name: "OverrideVpcConfig"))
3047
3051
  ClusterNodeDetails.add_member(:threads_per_core, Shapes::ShapeRef.new(shape: ClusterThreadsPerCore, location_name: "ThreadsPerCore"))
3048
3052
  ClusterNodeDetails.add_member(:instance_storage_configs, Shapes::ShapeRef.new(shape: ClusterInstanceStorageConfigs, location_name: "InstanceStorageConfigs"))
3049
3053
  ClusterNodeDetails.add_member(:private_primary_ip, Shapes::ShapeRef.new(shape: ClusterPrivatePrimaryIp, location_name: "PrivatePrimaryIp"))
@@ -3535,9 +3539,9 @@ module Aws::SageMaker
3535
3539
 
3536
3540
  CreateInferenceComponentInput.add_member(:inference_component_name, Shapes::ShapeRef.new(shape: InferenceComponentName, required: true, location_name: "InferenceComponentName"))
3537
3541
  CreateInferenceComponentInput.add_member(:endpoint_name, Shapes::ShapeRef.new(shape: EndpointName, required: true, location_name: "EndpointName"))
3538
- CreateInferenceComponentInput.add_member(:variant_name, Shapes::ShapeRef.new(shape: VariantName, required: true, location_name: "VariantName"))
3542
+ CreateInferenceComponentInput.add_member(:variant_name, Shapes::ShapeRef.new(shape: VariantName, location_name: "VariantName"))
3539
3543
  CreateInferenceComponentInput.add_member(:specification, Shapes::ShapeRef.new(shape: InferenceComponentSpecification, required: true, location_name: "Specification"))
3540
- CreateInferenceComponentInput.add_member(:runtime_config, Shapes::ShapeRef.new(shape: InferenceComponentRuntimeConfig, required: true, location_name: "RuntimeConfig"))
3544
+ CreateInferenceComponentInput.add_member(:runtime_config, Shapes::ShapeRef.new(shape: InferenceComponentRuntimeConfig, location_name: "RuntimeConfig"))
3541
3545
  CreateInferenceComponentInput.add_member(:tags, Shapes::ShapeRef.new(shape: TagList, location_name: "Tags"))
3542
3546
  CreateInferenceComponentInput.struct_class = Types::CreateInferenceComponentInput
3543
3547
 
@@ -6411,13 +6415,15 @@ module Aws::SageMaker
6411
6415
  InferenceComponentSpecification.add_member(:model_name, Shapes::ShapeRef.new(shape: ModelName, location_name: "ModelName"))
6412
6416
  InferenceComponentSpecification.add_member(:container, Shapes::ShapeRef.new(shape: InferenceComponentContainerSpecification, location_name: "Container"))
6413
6417
  InferenceComponentSpecification.add_member(:startup_parameters, Shapes::ShapeRef.new(shape: InferenceComponentStartupParameters, location_name: "StartupParameters"))
6414
- InferenceComponentSpecification.add_member(:compute_resource_requirements, Shapes::ShapeRef.new(shape: InferenceComponentComputeResourceRequirements, required: true, location_name: "ComputeResourceRequirements"))
6418
+ InferenceComponentSpecification.add_member(:compute_resource_requirements, Shapes::ShapeRef.new(shape: InferenceComponentComputeResourceRequirements, location_name: "ComputeResourceRequirements"))
6419
+ InferenceComponentSpecification.add_member(:base_inference_component_name, Shapes::ShapeRef.new(shape: InferenceComponentName, location_name: "BaseInferenceComponentName"))
6415
6420
  InferenceComponentSpecification.struct_class = Types::InferenceComponentSpecification
6416
6421
 
6417
6422
  InferenceComponentSpecificationSummary.add_member(:model_name, Shapes::ShapeRef.new(shape: ModelName, location_name: "ModelName"))
6418
6423
  InferenceComponentSpecificationSummary.add_member(:container, Shapes::ShapeRef.new(shape: InferenceComponentContainerSpecificationSummary, location_name: "Container"))
6419
6424
  InferenceComponentSpecificationSummary.add_member(:startup_parameters, Shapes::ShapeRef.new(shape: InferenceComponentStartupParameters, location_name: "StartupParameters"))
6420
6425
  InferenceComponentSpecificationSummary.add_member(:compute_resource_requirements, Shapes::ShapeRef.new(shape: InferenceComponentComputeResourceRequirements, location_name: "ComputeResourceRequirements"))
6426
+ InferenceComponentSpecificationSummary.add_member(:base_inference_component_name, Shapes::ShapeRef.new(shape: InferenceComponentName, location_name: "BaseInferenceComponentName"))
6421
6427
  InferenceComponentSpecificationSummary.struct_class = Types::InferenceComponentSpecificationSummary
6422
6428
 
6423
6429
  InferenceComponentStartupParameters.add_member(:model_data_download_timeout_in_seconds, Shapes::ShapeRef.new(shape: ProductionVariantModelDataDownloadTimeoutInSeconds, location_name: "ModelDataDownloadTimeoutInSeconds"))
@@ -8173,6 +8179,10 @@ module Aws::SageMaker
8173
8179
  ModelRegisterSettings.add_member(:cross_account_model_register_role_arn, Shapes::ShapeRef.new(shape: RoleArn, location_name: "CrossAccountModelRegisterRoleArn"))
8174
8180
  ModelRegisterSettings.struct_class = Types::ModelRegisterSettings
8175
8181
 
8182
+ ModelShardingConfig.add_member(:image, Shapes::ShapeRef.new(shape: OptimizationContainerImage, location_name: "Image"))
8183
+ ModelShardingConfig.add_member(:override_environment, Shapes::ShapeRef.new(shape: OptimizationJobEnvironmentVariables, location_name: "OverrideEnvironment"))
8184
+ ModelShardingConfig.struct_class = Types::ModelShardingConfig
8185
+
8176
8186
  ModelStepMetadata.add_member(:arn, Shapes::ShapeRef.new(shape: String256, location_name: "Arn"))
8177
8187
  ModelStepMetadata.struct_class = Types::ModelStepMetadata
8178
8188
 
@@ -8476,9 +8486,11 @@ module Aws::SageMaker
8476
8486
 
8477
8487
  OptimizationConfig.add_member(:model_quantization_config, Shapes::ShapeRef.new(shape: ModelQuantizationConfig, location_name: "ModelQuantizationConfig"))
8478
8488
  OptimizationConfig.add_member(:model_compilation_config, Shapes::ShapeRef.new(shape: ModelCompilationConfig, location_name: "ModelCompilationConfig"))
8489
+ OptimizationConfig.add_member(:model_sharding_config, Shapes::ShapeRef.new(shape: ModelShardingConfig, location_name: "ModelShardingConfig"))
8479
8490
  OptimizationConfig.add_member(:unknown, Shapes::ShapeRef.new(shape: nil, location_name: 'unknown'))
8480
8491
  OptimizationConfig.add_member_subclass(:model_quantization_config, Types::OptimizationConfig::ModelQuantizationConfig)
8481
8492
  OptimizationConfig.add_member_subclass(:model_compilation_config, Types::OptimizationConfig::ModelCompilationConfig)
8493
+ OptimizationConfig.add_member_subclass(:model_sharding_config, Types::OptimizationConfig::ModelShardingConfig)
8482
8494
  OptimizationConfig.add_member_subclass(:unknown, Types::OptimizationConfig::Unknown)
8483
8495
  OptimizationConfig.struct_class = Types::OptimizationConfig
8484
8496
 
@@ -4227,6 +4227,18 @@ module Aws::SageMaker
4227
4227
  # when the cluster instance group is created or updated.
4228
4228
  # @return [Array<String>]
4229
4229
  #
4230
+ # @!attribute [rw] override_vpc_config
4231
+ # Specifies an Amazon Virtual Private Cloud (VPC) that your SageMaker
4232
+ # jobs, hosted models, and compute resources have access to. You can
4233
+ # control access to and from your resources by configuring a VPC. For
4234
+ # more information, see [Give SageMaker Access to Resources in your
4235
+ # Amazon VPC][1].
4236
+ #
4237
+ #
4238
+ #
4239
+ # [1]: https://docs.aws.amazon.com/sagemaker/latest/dg/infrastructure-give-access.html
4240
+ # @return [Types::VpcConfig]
4241
+ #
4230
4242
  # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/ClusterInstanceGroupDetails AWS API Documentation
4231
4243
  #
4232
4244
  class ClusterInstanceGroupDetails < Struct.new(
@@ -4238,7 +4250,8 @@ module Aws::SageMaker
4238
4250
  :execution_role,
4239
4251
  :threads_per_core,
4240
4252
  :instance_storage_configs,
4241
- :on_start_deep_health_checks)
4253
+ :on_start_deep_health_checks,
4254
+ :override_vpc_config)
4242
4255
  SENSITIVE = []
4243
4256
  include Aws::Structure
4244
4257
  end
@@ -4290,6 +4303,18 @@ module Aws::SageMaker
4290
4303
  # when the cluster instance group is created or updated.
4291
4304
  # @return [Array<String>]
4292
4305
  #
4306
+ # @!attribute [rw] override_vpc_config
4307
+ # Specifies an Amazon Virtual Private Cloud (VPC) that your SageMaker
4308
+ # jobs, hosted models, and compute resources have access to. You can
4309
+ # control access to and from your resources by configuring a VPC. For
4310
+ # more information, see [Give SageMaker Access to Resources in your
4311
+ # Amazon VPC][1].
4312
+ #
4313
+ #
4314
+ #
4315
+ # [1]: https://docs.aws.amazon.com/sagemaker/latest/dg/infrastructure-give-access.html
4316
+ # @return [Types::VpcConfig]
4317
+ #
4293
4318
  # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/ClusterInstanceGroupSpecification AWS API Documentation
4294
4319
  #
4295
4320
  class ClusterInstanceGroupSpecification < Struct.new(
@@ -4300,7 +4325,8 @@ module Aws::SageMaker
4300
4325
  :execution_role,
4301
4326
  :threads_per_core,
4302
4327
  :instance_storage_configs,
4303
- :on_start_deep_health_checks)
4328
+ :on_start_deep_health_checks,
4329
+ :override_vpc_config)
4304
4330
  SENSITIVE = []
4305
4331
  include Aws::Structure
4306
4332
  end
@@ -4437,6 +4463,18 @@ module Aws::SageMaker
4437
4463
  # The LifeCycle configuration applied to the instance.
4438
4464
  # @return [Types::ClusterLifeCycleConfig]
4439
4465
  #
4466
+ # @!attribute [rw] override_vpc_config
4467
+ # Specifies an Amazon Virtual Private Cloud (VPC) that your SageMaker
4468
+ # jobs, hosted models, and compute resources have access to. You can
4469
+ # control access to and from your resources by configuring a VPC. For
4470
+ # more information, see [Give SageMaker Access to Resources in your
4471
+ # Amazon VPC][1].
4472
+ #
4473
+ #
4474
+ #
4475
+ # [1]: https://docs.aws.amazon.com/sagemaker/latest/dg/infrastructure-give-access.html
4476
+ # @return [Types::VpcConfig]
4477
+ #
4440
4478
  # @!attribute [rw] threads_per_core
4441
4479
  # The number of threads per CPU core you specified under
4442
4480
  # `CreateCluster`.
@@ -4469,6 +4507,7 @@ module Aws::SageMaker
4469
4507
  :instance_type,
4470
4508
  :launch_time,
4471
4509
  :life_cycle_config,
4510
+ :override_vpc_config,
4472
4511
  :threads_per_core,
4473
4512
  :instance_storage_configs,
4474
4513
  :private_primary_ip,
@@ -24194,9 +24233,9 @@ module Aws::SageMaker
24194
24233
  include Aws::Structure
24195
24234
  end
24196
24235
 
24197
- # Defines the compute resources to allocate to run a model that you
24198
- # assign to an inference component. These resources include CPU cores,
24199
- # accelerators, and memory.
24236
+ # Defines the compute resources to allocate to run a model, plus any
24237
+ # adapter models, that you assign to an inference component. These
24238
+ # resources include CPU cores, accelerators, and memory.
24200
24239
  #
24201
24240
  # @!attribute [rw] number_of_cpu_cores_required
24202
24241
  # The number of CPU cores to allocate to run a model that you assign
@@ -24355,17 +24394,45 @@ module Aws::SageMaker
24355
24394
  # @return [Types::InferenceComponentStartupParameters]
24356
24395
  #
24357
24396
  # @!attribute [rw] compute_resource_requirements
24358
- # The compute resources allocated to run the model assigned to the
24359
- # inference component.
24397
+ # The compute resources allocated to run the model, plus any adapter
24398
+ # models, that you assign to the inference component.
24399
+ #
24400
+ # Omit this parameter if your request is meant to create an adapter
24401
+ # inference component. An adapter inference component is loaded by a
24402
+ # base inference component, and it uses the compute resources of the
24403
+ # base inference component.
24360
24404
  # @return [Types::InferenceComponentComputeResourceRequirements]
24361
24405
  #
24406
+ # @!attribute [rw] base_inference_component_name
24407
+ # The name of an existing inference component that is to contain the
24408
+ # inference component that you're creating with your request.
24409
+ #
24410
+ # Specify this parameter only if your request is meant to create an
24411
+ # adapter inference component. An adapter inference component contains
24412
+ # the path to an adapter model. The purpose of the adapter model is to
24413
+ # tailor the inference output of a base foundation model, which is
24414
+ # hosted by the base inference component. The adapter inference
24415
+ # component uses the compute resources that you assigned to the base
24416
+ # inference component.
24417
+ #
24418
+ # When you create an adapter inference component, use the `Container`
24419
+ # parameter to specify the location of the adapter artifacts. In the
24420
+ # parameter value, use the `ArtifactUrl` parameter of the
24421
+ # `InferenceComponentContainerSpecification` data type.
24422
+ #
24423
+ # Before you can create an adapter inference component, you must have
24424
+ # an existing inference component that contains the foundation model
24425
+ # that you want to adapt.
24426
+ # @return [String]
24427
+ #
24362
24428
  # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/InferenceComponentSpecification AWS API Documentation
24363
24429
  #
24364
24430
  class InferenceComponentSpecification < Struct.new(
24365
24431
  :model_name,
24366
24432
  :container,
24367
24433
  :startup_parameters,
24368
- :compute_resource_requirements)
24434
+ :compute_resource_requirements,
24435
+ :base_inference_component_name)
24369
24436
  SENSITIVE = []
24370
24437
  include Aws::Structure
24371
24438
  end
@@ -24388,17 +24455,23 @@ module Aws::SageMaker
24388
24455
  # @return [Types::InferenceComponentStartupParameters]
24389
24456
  #
24390
24457
  # @!attribute [rw] compute_resource_requirements
24391
- # The compute resources allocated to run the model assigned to the
24392
- # inference component.
24458
+ # The compute resources allocated to run the model, plus any adapter
24459
+ # models, that you assign to the inference component.
24393
24460
  # @return [Types::InferenceComponentComputeResourceRequirements]
24394
24461
  #
24462
+ # @!attribute [rw] base_inference_component_name
24463
+ # The name of the base inference component that contains this
24464
+ # inference component.
24465
+ # @return [String]
24466
+ #
24395
24467
  # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/InferenceComponentSpecificationSummary AWS API Documentation
24396
24468
  #
24397
24469
  class InferenceComponentSpecificationSummary < Struct.new(
24398
24470
  :model_name,
24399
24471
  :container,
24400
24472
  :startup_parameters,
24401
- :compute_resource_requirements)
24473
+ :compute_resource_requirements,
24474
+ :base_inference_component_name)
24402
24475
  SENSITIVE = []
24403
24476
  include Aws::Structure
24404
24477
  end
@@ -33836,6 +33909,28 @@ module Aws::SageMaker
33836
33909
  include Aws::Structure
33837
33910
  end
33838
33911
 
33912
+ # Settings for the model sharding technique that's applied by a model
33913
+ # optimization job.
33914
+ #
33915
+ # @!attribute [rw] image
33916
+ # The URI of an LMI DLC in Amazon ECR. SageMaker uses this image to
33917
+ # run the optimization.
33918
+ # @return [String]
33919
+ #
33920
+ # @!attribute [rw] override_environment
33921
+ # Environment variables that override the default ones in the model
33922
+ # container.
33923
+ # @return [Hash<String,String>]
33924
+ #
33925
+ # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/ModelShardingConfig AWS API Documentation
33926
+ #
33927
+ class ModelShardingConfig < Struct.new(
33928
+ :image,
33929
+ :override_environment)
33930
+ SENSITIVE = []
33931
+ include Aws::Structure
33932
+ end
33933
+
33839
33934
  # Metadata for Model steps.
33840
33935
  #
33841
33936
  # @!attribute [rw] arn
@@ -35415,11 +35510,17 @@ module Aws::SageMaker
35415
35510
  # model optimization job.
35416
35511
  # @return [Types::ModelCompilationConfig]
35417
35512
  #
35513
+ # @!attribute [rw] model_sharding_config
35514
+ # Settings for the model sharding technique that's applied by a model
35515
+ # optimization job.
35516
+ # @return [Types::ModelShardingConfig]
35517
+ #
35418
35518
  # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/OptimizationConfig AWS API Documentation
35419
35519
  #
35420
35520
  class OptimizationConfig < Struct.new(
35421
35521
  :model_quantization_config,
35422
35522
  :model_compilation_config,
35523
+ :model_sharding_config,
35423
35524
  :unknown)
35424
35525
  SENSITIVE = []
35425
35526
  include Aws::Structure
@@ -35427,6 +35528,7 @@ module Aws::SageMaker
35427
35528
 
35428
35529
  class ModelQuantizationConfig < OptimizationConfig; end
35429
35530
  class ModelCompilationConfig < OptimizationConfig; end
35531
+ class ModelShardingConfig < OptimizationConfig; end
35430
35532
  class Unknown < OptimizationConfig; end
35431
35533
  end
35432
35534
 
@@ -55,7 +55,7 @@ module Aws::SageMaker
55
55
  autoload :EndpointProvider, 'aws-sdk-sagemaker/endpoint_provider'
56
56
  autoload :Endpoints, 'aws-sdk-sagemaker/endpoints'
57
57
 
58
- GEM_VERSION = '1.275.0'
58
+ GEM_VERSION = '1.276.0'
59
59
 
60
60
  end
61
61