aws-sdk-sagemaker 1.275.0 → 1.276.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -1535,6 +1535,7 @@ module Aws::SageMaker
1535
1535
  ModelQuantizationConfig = Shapes::StructureShape.new(name: 'ModelQuantizationConfig')
1536
1536
  ModelRegisterSettings = Shapes::StructureShape.new(name: 'ModelRegisterSettings')
1537
1537
  ModelSetupTime = Shapes::IntegerShape.new(name: 'ModelSetupTime')
1538
+ ModelShardingConfig = Shapes::StructureShape.new(name: 'ModelShardingConfig')
1538
1539
  ModelSortKey = Shapes::StringShape.new(name: 'ModelSortKey')
1539
1540
  ModelStepMetadata = Shapes::StructureShape.new(name: 'ModelStepMetadata')
1540
1541
  ModelSummary = Shapes::StructureShape.new(name: 'ModelSummary')
@@ -3002,6 +3003,7 @@ module Aws::SageMaker
3002
3003
  ClusterInstanceGroupDetails.add_member(:threads_per_core, Shapes::ShapeRef.new(shape: ClusterThreadsPerCore, location_name: "ThreadsPerCore"))
3003
3004
  ClusterInstanceGroupDetails.add_member(:instance_storage_configs, Shapes::ShapeRef.new(shape: ClusterInstanceStorageConfigs, location_name: "InstanceStorageConfigs"))
3004
3005
  ClusterInstanceGroupDetails.add_member(:on_start_deep_health_checks, Shapes::ShapeRef.new(shape: OnStartDeepHealthChecks, location_name: "OnStartDeepHealthChecks"))
3006
+ ClusterInstanceGroupDetails.add_member(:override_vpc_config, Shapes::ShapeRef.new(shape: VpcConfig, location_name: "OverrideVpcConfig"))
3005
3007
  ClusterInstanceGroupDetails.struct_class = Types::ClusterInstanceGroupDetails
3006
3008
 
3007
3009
  ClusterInstanceGroupDetailsList.member = Shapes::ShapeRef.new(shape: ClusterInstanceGroupDetails)
@@ -3014,6 +3016,7 @@ module Aws::SageMaker
3014
3016
  ClusterInstanceGroupSpecification.add_member(:threads_per_core, Shapes::ShapeRef.new(shape: ClusterThreadsPerCore, location_name: "ThreadsPerCore"))
3015
3017
  ClusterInstanceGroupSpecification.add_member(:instance_storage_configs, Shapes::ShapeRef.new(shape: ClusterInstanceStorageConfigs, location_name: "InstanceStorageConfigs"))
3016
3018
  ClusterInstanceGroupSpecification.add_member(:on_start_deep_health_checks, Shapes::ShapeRef.new(shape: OnStartDeepHealthChecks, location_name: "OnStartDeepHealthChecks"))
3019
+ ClusterInstanceGroupSpecification.add_member(:override_vpc_config, Shapes::ShapeRef.new(shape: VpcConfig, location_name: "OverrideVpcConfig"))
3017
3020
  ClusterInstanceGroupSpecification.struct_class = Types::ClusterInstanceGroupSpecification
3018
3021
 
3019
3022
  ClusterInstanceGroupSpecifications.member = Shapes::ShapeRef.new(shape: ClusterInstanceGroupSpecification)
@@ -3044,6 +3047,7 @@ module Aws::SageMaker
3044
3047
  ClusterNodeDetails.add_member(:instance_type, Shapes::ShapeRef.new(shape: ClusterInstanceType, location_name: "InstanceType"))
3045
3048
  ClusterNodeDetails.add_member(:launch_time, Shapes::ShapeRef.new(shape: Timestamp, location_name: "LaunchTime"))
3046
3049
  ClusterNodeDetails.add_member(:life_cycle_config, Shapes::ShapeRef.new(shape: ClusterLifeCycleConfig, location_name: "LifeCycleConfig"))
3050
+ ClusterNodeDetails.add_member(:override_vpc_config, Shapes::ShapeRef.new(shape: VpcConfig, location_name: "OverrideVpcConfig"))
3047
3051
  ClusterNodeDetails.add_member(:threads_per_core, Shapes::ShapeRef.new(shape: ClusterThreadsPerCore, location_name: "ThreadsPerCore"))
3048
3052
  ClusterNodeDetails.add_member(:instance_storage_configs, Shapes::ShapeRef.new(shape: ClusterInstanceStorageConfigs, location_name: "InstanceStorageConfigs"))
3049
3053
  ClusterNodeDetails.add_member(:private_primary_ip, Shapes::ShapeRef.new(shape: ClusterPrivatePrimaryIp, location_name: "PrivatePrimaryIp"))
@@ -3535,9 +3539,9 @@ module Aws::SageMaker
3535
3539
 
3536
3540
  CreateInferenceComponentInput.add_member(:inference_component_name, Shapes::ShapeRef.new(shape: InferenceComponentName, required: true, location_name: "InferenceComponentName"))
3537
3541
  CreateInferenceComponentInput.add_member(:endpoint_name, Shapes::ShapeRef.new(shape: EndpointName, required: true, location_name: "EndpointName"))
3538
- CreateInferenceComponentInput.add_member(:variant_name, Shapes::ShapeRef.new(shape: VariantName, required: true, location_name: "VariantName"))
3542
+ CreateInferenceComponentInput.add_member(:variant_name, Shapes::ShapeRef.new(shape: VariantName, location_name: "VariantName"))
3539
3543
  CreateInferenceComponentInput.add_member(:specification, Shapes::ShapeRef.new(shape: InferenceComponentSpecification, required: true, location_name: "Specification"))
3540
- CreateInferenceComponentInput.add_member(:runtime_config, Shapes::ShapeRef.new(shape: InferenceComponentRuntimeConfig, required: true, location_name: "RuntimeConfig"))
3544
+ CreateInferenceComponentInput.add_member(:runtime_config, Shapes::ShapeRef.new(shape: InferenceComponentRuntimeConfig, location_name: "RuntimeConfig"))
3541
3545
  CreateInferenceComponentInput.add_member(:tags, Shapes::ShapeRef.new(shape: TagList, location_name: "Tags"))
3542
3546
  CreateInferenceComponentInput.struct_class = Types::CreateInferenceComponentInput
3543
3547
 
@@ -6411,13 +6415,15 @@ module Aws::SageMaker
6411
6415
  InferenceComponentSpecification.add_member(:model_name, Shapes::ShapeRef.new(shape: ModelName, location_name: "ModelName"))
6412
6416
  InferenceComponentSpecification.add_member(:container, Shapes::ShapeRef.new(shape: InferenceComponentContainerSpecification, location_name: "Container"))
6413
6417
  InferenceComponentSpecification.add_member(:startup_parameters, Shapes::ShapeRef.new(shape: InferenceComponentStartupParameters, location_name: "StartupParameters"))
6414
- InferenceComponentSpecification.add_member(:compute_resource_requirements, Shapes::ShapeRef.new(shape: InferenceComponentComputeResourceRequirements, required: true, location_name: "ComputeResourceRequirements"))
6418
+ InferenceComponentSpecification.add_member(:compute_resource_requirements, Shapes::ShapeRef.new(shape: InferenceComponentComputeResourceRequirements, location_name: "ComputeResourceRequirements"))
6419
+ InferenceComponentSpecification.add_member(:base_inference_component_name, Shapes::ShapeRef.new(shape: InferenceComponentName, location_name: "BaseInferenceComponentName"))
6415
6420
  InferenceComponentSpecification.struct_class = Types::InferenceComponentSpecification
6416
6421
 
6417
6422
  InferenceComponentSpecificationSummary.add_member(:model_name, Shapes::ShapeRef.new(shape: ModelName, location_name: "ModelName"))
6418
6423
  InferenceComponentSpecificationSummary.add_member(:container, Shapes::ShapeRef.new(shape: InferenceComponentContainerSpecificationSummary, location_name: "Container"))
6419
6424
  InferenceComponentSpecificationSummary.add_member(:startup_parameters, Shapes::ShapeRef.new(shape: InferenceComponentStartupParameters, location_name: "StartupParameters"))
6420
6425
  InferenceComponentSpecificationSummary.add_member(:compute_resource_requirements, Shapes::ShapeRef.new(shape: InferenceComponentComputeResourceRequirements, location_name: "ComputeResourceRequirements"))
6426
+ InferenceComponentSpecificationSummary.add_member(:base_inference_component_name, Shapes::ShapeRef.new(shape: InferenceComponentName, location_name: "BaseInferenceComponentName"))
6421
6427
  InferenceComponentSpecificationSummary.struct_class = Types::InferenceComponentSpecificationSummary
6422
6428
 
6423
6429
  InferenceComponentStartupParameters.add_member(:model_data_download_timeout_in_seconds, Shapes::ShapeRef.new(shape: ProductionVariantModelDataDownloadTimeoutInSeconds, location_name: "ModelDataDownloadTimeoutInSeconds"))
@@ -8173,6 +8179,10 @@ module Aws::SageMaker
8173
8179
  ModelRegisterSettings.add_member(:cross_account_model_register_role_arn, Shapes::ShapeRef.new(shape: RoleArn, location_name: "CrossAccountModelRegisterRoleArn"))
8174
8180
  ModelRegisterSettings.struct_class = Types::ModelRegisterSettings
8175
8181
 
8182
+ ModelShardingConfig.add_member(:image, Shapes::ShapeRef.new(shape: OptimizationContainerImage, location_name: "Image"))
8183
+ ModelShardingConfig.add_member(:override_environment, Shapes::ShapeRef.new(shape: OptimizationJobEnvironmentVariables, location_name: "OverrideEnvironment"))
8184
+ ModelShardingConfig.struct_class = Types::ModelShardingConfig
8185
+
8176
8186
  ModelStepMetadata.add_member(:arn, Shapes::ShapeRef.new(shape: String256, location_name: "Arn"))
8177
8187
  ModelStepMetadata.struct_class = Types::ModelStepMetadata
8178
8188
 
@@ -8476,9 +8486,11 @@ module Aws::SageMaker
8476
8486
 
8477
8487
  OptimizationConfig.add_member(:model_quantization_config, Shapes::ShapeRef.new(shape: ModelQuantizationConfig, location_name: "ModelQuantizationConfig"))
8478
8488
  OptimizationConfig.add_member(:model_compilation_config, Shapes::ShapeRef.new(shape: ModelCompilationConfig, location_name: "ModelCompilationConfig"))
8489
+ OptimizationConfig.add_member(:model_sharding_config, Shapes::ShapeRef.new(shape: ModelShardingConfig, location_name: "ModelShardingConfig"))
8479
8490
  OptimizationConfig.add_member(:unknown, Shapes::ShapeRef.new(shape: nil, location_name: 'unknown'))
8480
8491
  OptimizationConfig.add_member_subclass(:model_quantization_config, Types::OptimizationConfig::ModelQuantizationConfig)
8481
8492
  OptimizationConfig.add_member_subclass(:model_compilation_config, Types::OptimizationConfig::ModelCompilationConfig)
8493
+ OptimizationConfig.add_member_subclass(:model_sharding_config, Types::OptimizationConfig::ModelShardingConfig)
8482
8494
  OptimizationConfig.add_member_subclass(:unknown, Types::OptimizationConfig::Unknown)
8483
8495
  OptimizationConfig.struct_class = Types::OptimizationConfig
8484
8496
 
@@ -4227,6 +4227,18 @@ module Aws::SageMaker
4227
4227
  # when the cluster instance group is created or updated.
4228
4228
  # @return [Array<String>]
4229
4229
  #
4230
+ # @!attribute [rw] override_vpc_config
4231
+ # Specifies an Amazon Virtual Private Cloud (VPC) that your SageMaker
4232
+ # jobs, hosted models, and compute resources have access to. You can
4233
+ # control access to and from your resources by configuring a VPC. For
4234
+ # more information, see [Give SageMaker Access to Resources in your
4235
+ # Amazon VPC][1].
4236
+ #
4237
+ #
4238
+ #
4239
+ # [1]: https://docs.aws.amazon.com/sagemaker/latest/dg/infrastructure-give-access.html
4240
+ # @return [Types::VpcConfig]
4241
+ #
4230
4242
  # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/ClusterInstanceGroupDetails AWS API Documentation
4231
4243
  #
4232
4244
  class ClusterInstanceGroupDetails < Struct.new(
@@ -4238,7 +4250,8 @@ module Aws::SageMaker
4238
4250
  :execution_role,
4239
4251
  :threads_per_core,
4240
4252
  :instance_storage_configs,
4241
- :on_start_deep_health_checks)
4253
+ :on_start_deep_health_checks,
4254
+ :override_vpc_config)
4242
4255
  SENSITIVE = []
4243
4256
  include Aws::Structure
4244
4257
  end
@@ -4290,6 +4303,18 @@ module Aws::SageMaker
4290
4303
  # when the cluster instance group is created or updated.
4291
4304
  # @return [Array<String>]
4292
4305
  #
4306
+ # @!attribute [rw] override_vpc_config
4307
+ # Specifies an Amazon Virtual Private Cloud (VPC) that your SageMaker
4308
+ # jobs, hosted models, and compute resources have access to. You can
4309
+ # control access to and from your resources by configuring a VPC. For
4310
+ # more information, see [Give SageMaker Access to Resources in your
4311
+ # Amazon VPC][1].
4312
+ #
4313
+ #
4314
+ #
4315
+ # [1]: https://docs.aws.amazon.com/sagemaker/latest/dg/infrastructure-give-access.html
4316
+ # @return [Types::VpcConfig]
4317
+ #
4293
4318
  # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/ClusterInstanceGroupSpecification AWS API Documentation
4294
4319
  #
4295
4320
  class ClusterInstanceGroupSpecification < Struct.new(
@@ -4300,7 +4325,8 @@ module Aws::SageMaker
4300
4325
  :execution_role,
4301
4326
  :threads_per_core,
4302
4327
  :instance_storage_configs,
4303
- :on_start_deep_health_checks)
4328
+ :on_start_deep_health_checks,
4329
+ :override_vpc_config)
4304
4330
  SENSITIVE = []
4305
4331
  include Aws::Structure
4306
4332
  end
@@ -4437,6 +4463,18 @@ module Aws::SageMaker
4437
4463
  # The LifeCycle configuration applied to the instance.
4438
4464
  # @return [Types::ClusterLifeCycleConfig]
4439
4465
  #
4466
+ # @!attribute [rw] override_vpc_config
4467
+ # Specifies an Amazon Virtual Private Cloud (VPC) that your SageMaker
4468
+ # jobs, hosted models, and compute resources have access to. You can
4469
+ # control access to and from your resources by configuring a VPC. For
4470
+ # more information, see [Give SageMaker Access to Resources in your
4471
+ # Amazon VPC][1].
4472
+ #
4473
+ #
4474
+ #
4475
+ # [1]: https://docs.aws.amazon.com/sagemaker/latest/dg/infrastructure-give-access.html
4476
+ # @return [Types::VpcConfig]
4477
+ #
4440
4478
  # @!attribute [rw] threads_per_core
4441
4479
  # The number of threads per CPU core you specified under
4442
4480
  # `CreateCluster`.
@@ -4469,6 +4507,7 @@ module Aws::SageMaker
4469
4507
  :instance_type,
4470
4508
  :launch_time,
4471
4509
  :life_cycle_config,
4510
+ :override_vpc_config,
4472
4511
  :threads_per_core,
4473
4512
  :instance_storage_configs,
4474
4513
  :private_primary_ip,
@@ -24194,9 +24233,9 @@ module Aws::SageMaker
24194
24233
  include Aws::Structure
24195
24234
  end
24196
24235
 
24197
- # Defines the compute resources to allocate to run a model that you
24198
- # assign to an inference component. These resources include CPU cores,
24199
- # accelerators, and memory.
24236
+ # Defines the compute resources to allocate to run a model, plus any
24237
+ # adapter models, that you assign to an inference component. These
24238
+ # resources include CPU cores, accelerators, and memory.
24200
24239
  #
24201
24240
  # @!attribute [rw] number_of_cpu_cores_required
24202
24241
  # The number of CPU cores to allocate to run a model that you assign
@@ -24355,17 +24394,45 @@ module Aws::SageMaker
24355
24394
  # @return [Types::InferenceComponentStartupParameters]
24356
24395
  #
24357
24396
  # @!attribute [rw] compute_resource_requirements
24358
- # The compute resources allocated to run the model assigned to the
24359
- # inference component.
24397
+ # The compute resources allocated to run the model, plus any adapter
24398
+ # models, that you assign to the inference component.
24399
+ #
24400
+ # Omit this parameter if your request is meant to create an adapter
24401
+ # inference component. An adapter inference component is loaded by a
24402
+ # base inference component, and it uses the compute resources of the
24403
+ # base inference component.
24360
24404
  # @return [Types::InferenceComponentComputeResourceRequirements]
24361
24405
  #
24406
+ # @!attribute [rw] base_inference_component_name
24407
+ # The name of an existing inference component that is to contain the
24408
+ # inference component that you're creating with your request.
24409
+ #
24410
+ # Specify this parameter only if your request is meant to create an
24411
+ # adapter inference component. An adapter inference component contains
24412
+ # the path to an adapter model. The purpose of the adapter model is to
24413
+ # tailor the inference output of a base foundation model, which is
24414
+ # hosted by the base inference component. The adapter inference
24415
+ # component uses the compute resources that you assigned to the base
24416
+ # inference component.
24417
+ #
24418
+ # When you create an adapter inference component, use the `Container`
24419
+ # parameter to specify the location of the adapter artifacts. In the
24420
+ # parameter value, use the `ArtifactUrl` parameter of the
24421
+ # `InferenceComponentContainerSpecification` data type.
24422
+ #
24423
+ # Before you can create an adapter inference component, you must have
24424
+ # an existing inference component that contains the foundation model
24425
+ # that you want to adapt.
24426
+ # @return [String]
24427
+ #
24362
24428
  # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/InferenceComponentSpecification AWS API Documentation
24363
24429
  #
24364
24430
  class InferenceComponentSpecification < Struct.new(
24365
24431
  :model_name,
24366
24432
  :container,
24367
24433
  :startup_parameters,
24368
- :compute_resource_requirements)
24434
+ :compute_resource_requirements,
24435
+ :base_inference_component_name)
24369
24436
  SENSITIVE = []
24370
24437
  include Aws::Structure
24371
24438
  end
@@ -24388,17 +24455,23 @@ module Aws::SageMaker
24388
24455
  # @return [Types::InferenceComponentStartupParameters]
24389
24456
  #
24390
24457
  # @!attribute [rw] compute_resource_requirements
24391
- # The compute resources allocated to run the model assigned to the
24392
- # inference component.
24458
+ # The compute resources allocated to run the model, plus any adapter
24459
+ # models, that you assign to the inference component.
24393
24460
  # @return [Types::InferenceComponentComputeResourceRequirements]
24394
24461
  #
24462
+ # @!attribute [rw] base_inference_component_name
24463
+ # The name of the base inference component that contains this
24464
+ # inference component.
24465
+ # @return [String]
24466
+ #
24395
24467
  # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/InferenceComponentSpecificationSummary AWS API Documentation
24396
24468
  #
24397
24469
  class InferenceComponentSpecificationSummary < Struct.new(
24398
24470
  :model_name,
24399
24471
  :container,
24400
24472
  :startup_parameters,
24401
- :compute_resource_requirements)
24473
+ :compute_resource_requirements,
24474
+ :base_inference_component_name)
24402
24475
  SENSITIVE = []
24403
24476
  include Aws::Structure
24404
24477
  end
@@ -33836,6 +33909,28 @@ module Aws::SageMaker
33836
33909
  include Aws::Structure
33837
33910
  end
33838
33911
 
33912
+ # Settings for the model sharding technique that's applied by a model
33913
+ # optimization job.
33914
+ #
33915
+ # @!attribute [rw] image
33916
+ # The URI of an LMI DLC in Amazon ECR. SageMaker uses this image to
33917
+ # run the optimization.
33918
+ # @return [String]
33919
+ #
33920
+ # @!attribute [rw] override_environment
33921
+ # Environment variables that override the default ones in the model
33922
+ # container.
33923
+ # @return [Hash<String,String>]
33924
+ #
33925
+ # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/ModelShardingConfig AWS API Documentation
33926
+ #
33927
+ class ModelShardingConfig < Struct.new(
33928
+ :image,
33929
+ :override_environment)
33930
+ SENSITIVE = []
33931
+ include Aws::Structure
33932
+ end
33933
+
33839
33934
  # Metadata for Model steps.
33840
33935
  #
33841
33936
  # @!attribute [rw] arn
@@ -35415,11 +35510,17 @@ module Aws::SageMaker
35415
35510
  # model optimization job.
35416
35511
  # @return [Types::ModelCompilationConfig]
35417
35512
  #
35513
+ # @!attribute [rw] model_sharding_config
35514
+ # Settings for the model sharding technique that's applied by a model
35515
+ # optimization job.
35516
+ # @return [Types::ModelShardingConfig]
35517
+ #
35418
35518
  # @see http://docs.aws.amazon.com/goto/WebAPI/sagemaker-2017-07-24/OptimizationConfig AWS API Documentation
35419
35519
  #
35420
35520
  class OptimizationConfig < Struct.new(
35421
35521
  :model_quantization_config,
35422
35522
  :model_compilation_config,
35523
+ :model_sharding_config,
35423
35524
  :unknown)
35424
35525
  SENSITIVE = []
35425
35526
  include Aws::Structure
@@ -35427,6 +35528,7 @@ module Aws::SageMaker
35427
35528
 
35428
35529
  class ModelQuantizationConfig < OptimizationConfig; end
35429
35530
  class ModelCompilationConfig < OptimizationConfig; end
35531
+ class ModelShardingConfig < OptimizationConfig; end
35430
35532
  class Unknown < OptimizationConfig; end
35431
35533
  end
35432
35534
 
@@ -55,7 +55,7 @@ module Aws::SageMaker
55
55
  autoload :EndpointProvider, 'aws-sdk-sagemaker/endpoint_provider'
56
56
  autoload :Endpoints, 'aws-sdk-sagemaker/endpoints'
57
57
 
58
- GEM_VERSION = '1.275.0'
58
+ GEM_VERSION = '1.276.0'
59
59
 
60
60
  end
61
61