@aws-sdk/client-sagemaker 3.820.0 → 3.821.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (42)
  1. package/dist-cjs/index.js +62 -23
  2. package/dist-es/models/models_0.js +3 -0
  3. package/dist-es/models/models_2.js +0 -15
  4. package/dist-es/models/models_3.js +15 -5
  5. package/dist-es/models/models_4.js +5 -0
  6. package/dist-es/protocols/Aws_json1_1.js +36 -0
  7. package/dist-types/commands/CreateDomainCommand.d.ts +1 -0
  8. package/dist-types/commands/CreateEndpointConfigCommand.d.ts +8 -0
  9. package/dist-types/commands/DescribeDomainCommand.d.ts +1 -0
  10. package/dist-types/commands/DescribeEndpointCommand.d.ts +30 -0
  11. package/dist-types/commands/DescribeEndpointConfigCommand.d.ts +8 -0
  12. package/dist-types/commands/DescribeFlowDefinitionCommand.d.ts +2 -1
  13. package/dist-types/commands/DescribeHubCommand.d.ts +1 -2
  14. package/dist-types/commands/ListCodeRepositoriesCommand.d.ts +1 -1
  15. package/dist-types/commands/ListCompilationJobsCommand.d.ts +1 -2
  16. package/dist-types/commands/SearchCommand.d.ts +30 -0
  17. package/dist-types/commands/StopCompilationJobCommand.d.ts +1 -1
  18. package/dist-types/commands/StopEdgeDeploymentStageCommand.d.ts +1 -1
  19. package/dist-types/commands/StopEdgePackagingJobCommand.d.ts +1 -1
  20. package/dist-types/commands/StopHyperParameterTuningJobCommand.d.ts +1 -1
  21. package/dist-types/commands/UpdateDomainCommand.d.ts +1 -0
  22. package/dist-types/models/models_0.d.ts +11 -11
  23. package/dist-types/models/models_1.d.ts +38 -53
  24. package/dist-types/models/models_2.d.ts +121 -98
  25. package/dist-types/models/models_3.d.ts +99 -136
  26. package/dist-types/models/models_4.d.ts +134 -46
  27. package/dist-types/models/models_5.d.ts +45 -0
  28. package/dist-types/ts3.4/commands/DescribeFlowDefinitionCommand.d.ts +2 -4
  29. package/dist-types/ts3.4/commands/DescribeHubCommand.d.ts +1 -2
  30. package/dist-types/ts3.4/commands/ListCodeRepositoriesCommand.d.ts +1 -1
  31. package/dist-types/ts3.4/commands/ListCompilationJobsCommand.d.ts +4 -2
  32. package/dist-types/ts3.4/commands/StopCompilationJobCommand.d.ts +1 -1
  33. package/dist-types/ts3.4/commands/StopEdgeDeploymentStageCommand.d.ts +1 -1
  34. package/dist-types/ts3.4/commands/StopEdgePackagingJobCommand.d.ts +1 -1
  35. package/dist-types/ts3.4/commands/StopHyperParameterTuningJobCommand.d.ts +1 -1
  36. package/dist-types/ts3.4/models/models_0.d.ts +5 -3
  37. package/dist-types/ts3.4/models/models_1.d.ts +13 -13
  38. package/dist-types/ts3.4/models/models_2.d.ts +32 -39
  39. package/dist-types/ts3.4/models/models_3.d.ts +37 -40
  40. package/dist-types/ts3.4/models/models_4.d.ts +38 -13
  41. package/dist-types/ts3.4/models/models_5.d.ts +13 -0
  42. package/package.json +34 -34
@@ -1,6 +1,17 @@
1
1
  import { AutomaticJsonStringConversion as __AutomaticJsonStringConversion, ExceptionOptionType as __ExceptionOptionType } from "@smithy/smithy-client";
2
- import { ActionSource, ActionStatus, ActivationState, AdditionalInferenceSpecificationDefinition, AdditionalModelDataSource, AdditionalS3DataSource, AlgorithmValidationSpecification, AmazonQSettings, AnnotationConsolidationConfig, AppInstanceType, AppLifecycleManagement, AppNetworkAccessType, AppSecurityGroupManagement, AppType, ArtifactSource, AsyncInferenceConfig, AuthMode, AutoMLChannel, AutoMLComputeConfig, AutoMLDataSplitConfig, AutoMLJobChannel, AutoMLJobConfig, AutoMLJobObjective, AutoMLOutputDataConfig, AutoMLProblemTypeConfig, AutoMLSecurityConfig, AutoMountHomeEFS, AutoParameter, AutoRollbackConfig, Autotune, AwsManagedHumanLoopRequestSource, BatchTransformInput, BestObjectiveNotImproving, Bias, BlueGreenUpdatePolicy, CanvasAppSettings, CapacitySize, CaptureContentTypeHeader, CaptureOption, CategoricalParameter, CategoricalParameterRange, CategoricalParameterRangeSpecification, Channel, ChannelSpecification, CheckpointConfig, ClarifyExplainerConfig, ClusterInstanceGroupSpecification, ClusterNodeRecovery, ClusterOrchestrator, CodeEditorAppImageConfig, CodeEditorAppSettings, CodeRepository, CollectionConfig, CollectionType, CompleteOnConvergence, ComputeQuotaConfig, ComputeQuotaTarget, ContainerMode, CustomImage, FeatureStatus, GitConfig, ImageConfig, InferenceSpecification, JupyterLabAppImageConfig, KernelGatewayImageConfig, MetricDefinition, MetricsSource, ModelApprovalStatus, ModelDataSource, MultiModelConfig, OutputDataConfig, ProblemType, ProcessingS3DataDistributionType, ProcessingS3InputMode, ProductionVariantInstanceType, ResourceConfig, ResourceSpec, StoppingCondition, Tag, TargetDevice, TargetPlatformAccelerator, TargetPlatformArch, TargetPlatformOs, TrainingInputMode, TrainingInstanceType, TransformJobDefinition, VpcConfig } from "./models_0";
2
+ import { ActionSource, ActionStatus, ActivationState, AdditionalInferenceSpecificationDefinition, AdditionalModelDataSource, AdditionalS3DataSource, AlgorithmValidationSpecification, AmazonQSettings, AnnotationConsolidationConfig, AppInstanceType, AppLifecycleManagement, AppNetworkAccessType, AppSecurityGroupManagement, AppType, ArtifactSource, AsyncInferenceConfig, AuthMode, AutoMLChannel, AutoMLComputeConfig, AutoMLDataSplitConfig, AutoMLJobChannel, AutoMLJobConfig, AutoMLJobObjective, AutoMLOutputDataConfig, AutoMLProblemTypeConfig, AutoMLSecurityConfig, AutoMountHomeEFS, AutoParameter, AutoRollbackConfig, Autotune, AwsManagedHumanLoopRequestSource, BatchTransformInput, BestObjectiveNotImproving, Bias, BlueGreenUpdatePolicy, CanvasAppSettings, CapacityReservationPreference, CapacitySize, CaptureContentTypeHeader, CaptureOption, CategoricalParameter, CategoricalParameterRange, CategoricalParameterRangeSpecification, Channel, ChannelSpecification, CheckpointConfig, ClarifyExplainerConfig, ClusterInstanceGroupSpecification, ClusterNodeRecovery, ClusterOrchestrator, CodeEditorAppImageConfig, CodeEditorAppSettings, CodeRepository, CollectionConfig, CollectionType, CompleteOnConvergence, ComputeQuotaConfig, ComputeQuotaTarget, ContainerMode, CustomImage, FeatureStatus, GitConfig, ImageConfig, InferenceSpecification, JupyterLabAppImageConfig, KernelGatewayImageConfig, MetricDefinition, MetricsSource, ModelApprovalStatus, ModelCacheSetting, ModelDataSource, OutputDataConfig, ProblemType, ProcessingS3DataDistributionType, ProcessingS3InputMode, ProductionVariantInstanceType, ResourceConfig, ResourceSpec, StoppingCondition, Tag, TargetDevice, TargetPlatformAccelerator, TargetPlatformArch, TargetPlatformOs, TrainingInputMode, TrainingInstanceType, TransformJobDefinition, VpcConfig } from "./models_0";
3
3
  import { SageMakerServiceException as __BaseException } from "./SageMakerServiceException";
4
+ /**
5
+ * <p>Specifies additional configuration for hosting multi-model endpoints.</p>
6
+ * @public
7
+ */
8
+ export interface MultiModelConfig {
9
+ /**
10
+ * <p>Whether to cache models for a multi-model endpoint. By default, multi-model endpoints cache models so that a model does not have to be loaded into memory each time it is invoked. Some use cases do not benefit from model caching. For example, if an endpoint hosts a large number of models that are each invoked infrequently, the endpoint might perform better if you disable model caching. To disable model caching, set the value of this parameter to <code>Disabled</code>.</p>
11
+ * @public
12
+ */
13
+ ModelCacheSetting?: ModelCacheSetting | undefined;
14
+ }
4
15
  /**
5
16
  * <p>Describes the container, as part of model definition.</p>
6
17
  * @public
@@ -2408,6 +2419,11 @@ export interface UnifiedStudioSettings {
2408
2419
  * @public
2409
2420
  */
2410
2421
  ProjectS3Path?: string | undefined;
2422
+ /**
2423
+ * <p>The ARN of the application managed by SageMaker AI and SageMaker Unified Studio in the Amazon Web Services IAM Identity Center.</p>
2424
+ * @public
2425
+ */
2426
+ SingleSignOnApplicationArn?: string | undefined;
2411
2427
  }
2412
2428
  /**
2413
2429
  * <p>A collection of settings that apply to the <code>SageMaker Domain</code>. These settings are specified through the <code>CreateDomain</code> API call.</p>
@@ -2893,6 +2909,22 @@ export declare const ProductionVariantAcceleratorType: {
2893
2909
  * @public
2894
2910
  */
2895
2911
  export type ProductionVariantAcceleratorType = (typeof ProductionVariantAcceleratorType)[keyof typeof ProductionVariantAcceleratorType];
2912
+ /**
2913
+ * <p>Settings for the capacity reservation for the compute instances that SageMaker AI reserves for an endpoint. </p>
2914
+ * @public
2915
+ */
2916
+ export interface ProductionVariantCapacityReservationConfig {
2917
+ /**
2918
+ * <p>Options that you can choose for the capacity reservation. SageMaker AI supports the following options:</p> <dl> <dt>capacity-reservations-only</dt> <dd> <p>SageMaker AI launches instances only into an ML capacity reservation. If no capacity is available, the instances fail to launch.</p> </dd> </dl>
2919
+ * @public
2920
+ */
2921
+ CapacityReservationPreference?: CapacityReservationPreference | undefined;
2922
+ /**
2923
+ * <p>The Amazon Resource Name (ARN) that uniquely identifies the ML capacity reservation that SageMaker AI applies when it deploys the endpoint.</p>
2924
+ * @public
2925
+ */
2926
+ MlReservationArn?: string | undefined;
2927
+ }
2896
2928
  /**
2897
2929
  * <p>Specifies configuration for a core dump from the model container when the process crashes.</p>
2898
2930
  * @public
@@ -3080,6 +3112,11 @@ export interface ProductionVariant {
3080
3112
  * @public
3081
3113
  */
3082
3114
  InferenceAmiVersion?: ProductionVariantInferenceAmiVersion | undefined;
3115
+ /**
3116
+ * <p>Settings for the capacity reservation for the compute instances that SageMaker AI reserves for an endpoint. </p>
3117
+ * @public
3118
+ */
3119
+ CapacityReservationConfig?: ProductionVariantCapacityReservationConfig | undefined;
3083
3120
  }
3084
3121
  /**
3085
3122
  * @public
@@ -6849,58 +6886,6 @@ export interface CreateModelQualityJobDefinitionResponse {
6849
6886
  */
6850
6887
  JobDefinitionArn: string | undefined;
6851
6888
  }
6852
- /**
6853
- * <p>Configuration for monitoring constraints and monitoring statistics. These baseline resources are compared against the results of the current job from the series of jobs scheduled to collect data periodically.</p>
6854
- * @public
6855
- */
6856
- export interface MonitoringBaselineConfig {
6857
- /**
6858
- * <p>The name of the job that performs baselining for the monitoring job.</p>
6859
- * @public
6860
- */
6861
- BaseliningJobName?: string | undefined;
6862
- /**
6863
- * <p>The baseline constraint file in Amazon S3 that the current monitoring job should be validated against.</p>
6864
- * @public
6865
- */
6866
- ConstraintsResource?: MonitoringConstraintsResource | undefined;
6867
- /**
6868
- * <p>The baseline statistics file in Amazon S3 that the current monitoring job should be validated against.</p>
6869
- * @public
6870
- */
6871
- StatisticsResource?: MonitoringStatisticsResource | undefined;
6872
- }
6873
- /**
6874
- * <p>Container image configuration object for the monitoring job.</p>
6875
- * @public
6876
- */
6877
- export interface MonitoringAppSpecification {
6878
- /**
6879
- * <p>The container image to be run by the monitoring job.</p>
6880
- * @public
6881
- */
6882
- ImageUri: string | undefined;
6883
- /**
6884
- * <p>Specifies the entrypoint for a container used to run the monitoring job.</p>
6885
- * @public
6886
- */
6887
- ContainerEntrypoint?: string[] | undefined;
6888
- /**
6889
- * <p>An array of arguments for the container used to run the monitoring job.</p>
6890
- * @public
6891
- */
6892
- ContainerArguments?: string[] | undefined;
6893
- /**
6894
- * <p>An Amazon S3 URI to a script that is called per row prior to running analysis. It can base64 decode the payload and convert it into a flattened JSON so that the built-in container can use the converted data. Applicable only for the built-in (first party) containers.</p>
6895
- * @public
6896
- */
6897
- RecordPreprocessorSourceUri?: string | undefined;
6898
- /**
6899
- * <p>An Amazon S3 URI to a script that is called after analysis has been performed. Applicable only for the built-in (first party) containers.</p>
6900
- * @public
6901
- */
6902
- PostAnalyticsProcessorSourceUri?: string | undefined;
6903
- }
6904
6889
  /**
6905
6890
  * @internal
6906
6891
  */
@@ -1,5 +1,57 @@
1
- import { ActionSource, ActionStatus, ActivationState, AlgorithmSpecification, AlgorithmStatus, AlgorithmStatusDetails, AlgorithmValidationSpecification, AppNetworkAccessType, AppSecurityGroupManagement, AppSpecification, AppStatus, AppType, ArtifactSource, AsyncInferenceConfig, AthenaDatasetDefinition, AuthMode, AutoMLCandidate, AutoMLChannel, AutoMLComputeConfig, AutoMLDataSplitConfig, AutoMLJobArtifacts, AutoMLJobChannel, AutoMLJobCompletionCriteria, AutoMLJobConfig, AutoMLJobObjective, AutoMLJobSecondaryStatus, AutoMLJobStatus, AutoMLOutputDataConfig, AutoMLPartialFailureReason, AutoMLProblemTypeConfig, AutoMLProblemTypeConfigName, AutoMLResolvedAttributes, AutoMLSecurityConfig, BatchDataCaptureConfig, BatchStrategy, BatchTransformInput, CaptureStatus, Channel, CheckpointConfig, ClusterInstanceGroupDetails, ClusterNodeDetails, ClusterNodeRecovery, ClusterOrchestrator, ClusterStatus, CodeEditorAppImageConfig, CodeRepository, CognitoConfig, CognitoMemberDefinition, CollectionConfiguration, CompilationJobStatus, ComputeQuotaConfig, ComputeQuotaTarget, FeatureStatus, GitConfig, InferenceSpecification, JupyterLabAppImageConfig, KernelGatewayImageConfig, OutputDataConfig, ProblemType, ProcessingS3DataDistributionType, ProcessingS3InputMode, ProductionVariantInstanceType, ResourceConfig, ResourceSpec, SchedulerResourceStatus, StoppingCondition, Tag, TransformInput, TransformOutput, TransformResources, UserContext, VpcConfig } from "./models_0";
2
- import { _InstanceType, ContextSource, DataCaptureConfig, DataQualityAppSpecification, DataQualityBaselineConfig, DataQualityJobInput, DefaultSpaceSettings, DeploymentConfig, DeviceSelectionConfig, DomainSettings, EdgeDeploymentConfig, EdgeDeploymentModelConfig, EdgeOutputConfig, EdgePresetDeploymentType, EndpointInput, ExplainerConfig, FeatureDefinition, FeatureType, FlowDefinitionOutputConfig, HumanLoopActivationConfig, HumanLoopConfig, HumanLoopRequestSource, InputConfig, JupyterServerAppSettings, KernelGatewayAppSettings, MetadataProperties, ModelDeployConfig, MonitoringAppSpecification, MonitoringBaselineConfig, MonitoringNetworkConfig, MonitoringOutputConfig, MonitoringResources, MonitoringStoppingCondition, NeoVpcConfig, OfflineStoreConfig, OnlineStoreConfig, OutputConfig, ProcessingInstanceType, ProcessingS3UploadMode, ProductionVariant, ProductionVariantAcceleratorType, ProductionVariantManagedInstanceScaling, ProductionVariantRoutingConfig, ProductionVariantServerlessConfig, RetryStrategy, SchedulerConfig, TagPropagation, ThroughputMode, TrainingSpecification, UserSettings } from "./models_1";
1
+ import { ActionSource, ActionStatus, ActivationState, AlgorithmSpecification, AlgorithmStatus, AlgorithmStatusDetails, AlgorithmValidationSpecification, AppNetworkAccessType, AppSecurityGroupManagement, AppSpecification, AppStatus, AppType, ArtifactSource, AsyncInferenceConfig, AthenaDatasetDefinition, AuthMode, AutoMLCandidate, AutoMLChannel, AutoMLComputeConfig, AutoMLDataSplitConfig, AutoMLJobArtifacts, AutoMLJobChannel, AutoMLJobCompletionCriteria, AutoMLJobConfig, AutoMLJobObjective, AutoMLJobSecondaryStatus, AutoMLJobStatus, AutoMLOutputDataConfig, AutoMLPartialFailureReason, AutoMLProblemTypeConfig, AutoMLProblemTypeConfigName, AutoMLResolvedAttributes, AutoMLSecurityConfig, BatchDataCaptureConfig, BatchStrategy, BatchTransformInput, CapacityReservationPreference, CaptureStatus, Channel, CheckpointConfig, ClusterInstanceGroupDetails, ClusterNodeDetails, ClusterNodeRecovery, ClusterOrchestrator, ClusterStatus, CodeEditorAppImageConfig, CodeRepository, CognitoConfig, CognitoMemberDefinition, CollectionConfiguration, CompilationJobStatus, ComputeQuotaConfig, ComputeQuotaTarget, FeatureStatus, GitConfig, InferenceSpecification, JupyterLabAppImageConfig, KernelGatewayImageConfig, OutputDataConfig, ProblemType, ProcessingS3DataDistributionType, ProcessingS3InputMode, ProductionVariantInstanceType, ResourceConfig, ResourceSpec, SchedulerResourceStatus, StoppingCondition, Tag, TransformInput, TransformOutput, TransformResources, UserContext, VpcConfig } from "./models_0";
2
+ import { _InstanceType, ContextSource, DataCaptureConfig, DataQualityAppSpecification, DataQualityBaselineConfig, DataQualityJobInput, DefaultSpaceSettings, DeploymentConfig, DeviceSelectionConfig, DomainSettings, EdgeDeploymentConfig, EdgeDeploymentModelConfig, EdgeOutputConfig, EdgePresetDeploymentType, EndpointInput, ExplainerConfig, FeatureDefinition, FeatureType, InputConfig, JupyterServerAppSettings, KernelGatewayAppSettings, MetadataProperties, ModelDeployConfig, MonitoringConstraintsResource, MonitoringNetworkConfig, MonitoringOutputConfig, MonitoringResources, MonitoringStatisticsResource, MonitoringStoppingCondition, NeoVpcConfig, OfflineStoreConfig, OnlineStoreConfig, OutputConfig, ProcessingInstanceType, ProcessingS3UploadMode, ProductionVariant, ProductionVariantAcceleratorType, ProductionVariantManagedInstanceScaling, ProductionVariantRoutingConfig, ProductionVariantServerlessConfig, RetryStrategy, SchedulerConfig, TagPropagation, ThroughputMode, TrainingSpecification, UserSettings } from "./models_1";
3
+ /**
4
+ * <p>Configuration for monitoring constraints and monitoring statistics. These baseline resources are compared against the results of the current job from the series of jobs scheduled to collect data periodically.</p>
5
+ * @public
6
+ */
7
+ export interface MonitoringBaselineConfig {
8
+ /**
9
+ * <p>The name of the job that performs baselining for the monitoring job.</p>
10
+ * @public
11
+ */
12
+ BaseliningJobName?: string | undefined;
13
+ /**
14
+ * <p>The baseline constraint file in Amazon S3 that the current monitoring job should be validated against.</p>
15
+ * @public
16
+ */
17
+ ConstraintsResource?: MonitoringConstraintsResource | undefined;
18
+ /**
19
+ * <p>The baseline statistics file in Amazon S3 that the current monitoring job should be validated against.</p>
20
+ * @public
21
+ */
22
+ StatisticsResource?: MonitoringStatisticsResource | undefined;
23
+ }
24
+ /**
25
+ * <p>Container image configuration object for the monitoring job.</p>
26
+ * @public
27
+ */
28
+ export interface MonitoringAppSpecification {
29
+ /**
30
+ * <p>The container image to be run by the monitoring job.</p>
31
+ * @public
32
+ */
33
+ ImageUri: string | undefined;
34
+ /**
35
+ * <p>Specifies the entrypoint for a container used to run the monitoring job.</p>
36
+ * @public
37
+ */
38
+ ContainerEntrypoint?: string[] | undefined;
39
+ /**
40
+ * <p>An array of arguments for the container used to run the monitoring job.</p>
41
+ * @public
42
+ */
43
+ ContainerArguments?: string[] | undefined;
44
+ /**
45
+ * <p>An Amazon S3 URI to a script that is called per row prior to running analysis. It can base64 decode the payload and convert it into a flattened JSON so that the built-in container can use the converted data. Applicable only for the built-in (first party) containers.</p>
46
+ * @public
47
+ */
48
+ RecordPreprocessorSourceUri?: string | undefined;
49
+ /**
50
+ * <p>An Amazon S3 URI to a script that is called after analysis has been performed. Applicable only for the built-in (first party) containers.</p>
51
+ * @public
52
+ */
53
+ PostAnalyticsProcessorSourceUri?: string | undefined;
54
+ }
3
55
  /**
4
56
  * <p>The inputs for a monitoring job.</p>
5
57
  * @public
@@ -5918,6 +5970,68 @@ export interface PendingDeploymentSummary {
5918
5970
  */
5919
5971
  ShadowProductionVariants?: PendingProductionVariantSummary[] | undefined;
5920
5972
  }
5973
+ /**
5974
+ * <p>The EC2 capacity reservations that are shared to an ML capacity reservation.</p>
5975
+ * @public
5976
+ */
5977
+ export interface Ec2CapacityReservation {
5978
+ /**
5979
+ * <p>The unique identifier for an EC2 capacity reservation that's part of the ML capacity reservation.</p>
5980
+ * @public
5981
+ */
5982
+ Ec2CapacityReservationId?: string | undefined;
5983
+ /**
5984
+ * <p>The number of instances that you allocated to the EC2 capacity reservation.</p>
5985
+ * @public
5986
+ */
5987
+ TotalInstanceCount?: number | undefined;
5988
+ /**
5989
+ * <p>The number of instances that are currently available in the EC2 capacity reservation.</p>
5990
+ * @public
5991
+ */
5992
+ AvailableInstanceCount?: number | undefined;
5993
+ /**
5994
+ * <p>The number of instances from the EC2 capacity reservation that are being used by the endpoint.</p>
5995
+ * @public
5996
+ */
5997
+ UsedByCurrentEndpoint?: number | undefined;
5998
+ }
5999
+ /**
6000
+ * <p>Details about an ML capacity reservation.</p>
6001
+ * @public
6002
+ */
6003
+ export interface ProductionVariantCapacityReservationSummary {
6004
+ /**
6005
+ * <p>The Amazon Resource Name (ARN) that uniquely identifies the ML capacity reservation that SageMaker AI applies when it deploys the endpoint.</p>
6006
+ * @public
6007
+ */
6008
+ MlReservationArn?: string | undefined;
6009
+ /**
6010
+ * <p>The option that you chose for the capacity reservation. SageMaker AI supports the following options:</p> <dl> <dt>capacity-reservations-only</dt> <dd> <p>SageMaker AI launches instances only into an ML capacity reservation. If no capacity is available, the instances fail to launch.</p> </dd> </dl>
6011
+ * @public
6012
+ */
6013
+ CapacityReservationPreference?: CapacityReservationPreference | undefined;
6014
+ /**
6015
+ * <p>The number of instances that you allocated to the ML capacity reservation.</p>
6016
+ * @public
6017
+ */
6018
+ TotalInstanceCount?: number | undefined;
6019
+ /**
6020
+ * <p>The number of instances that are currently available in the ML capacity reservation.</p>
6021
+ * @public
6022
+ */
6023
+ AvailableInstanceCount?: number | undefined;
6024
+ /**
6025
+ * <p>The number of instances from the ML capacity reservation that are being used by the endpoint.</p>
6026
+ * @public
6027
+ */
6028
+ UsedByCurrentEndpoint?: number | undefined;
6029
+ /**
6030
+ * <p>The EC2 capacity reservations that are shared to this ML capacity reservation, if any.</p>
6031
+ * @public
6032
+ */
6033
+ Ec2CapacityReservations?: Ec2CapacityReservation[] | undefined;
6034
+ }
5921
6035
  /**
5922
6036
  * <p>Describes weight and capacities for a production variant associated with an endpoint. If you sent a request to the <code>UpdateEndpointWeightsAndCapacities</code> API and the endpoint status is <code>Updating</code>, you get different desired and current values. </p>
5923
6037
  * @public
@@ -5978,6 +6092,11 @@ export interface ProductionVariantSummary {
5978
6092
  * @public
5979
6093
  */
5980
6094
  RoutingConfig?: ProductionVariantRoutingConfig | undefined;
6095
+ /**
6096
+ * <p>Settings for the capacity reservation for the compute instances that SageMaker AI reserves for an endpoint. </p>
6097
+ * @public
6098
+ */
6099
+ CapacityReservationConfig?: ProductionVariantCapacityReservationSummary | undefined;
5981
6100
  }
5982
6101
  /**
5983
6102
  * @public
@@ -6495,102 +6614,6 @@ export interface DescribeFlowDefinitionRequest {
6495
6614
  */
6496
6615
  FlowDefinitionName: string | undefined;
6497
6616
  }
6498
- /**
6499
- * @public
6500
- * @enum
6501
- */
6502
- export declare const FlowDefinitionStatus: {
6503
- readonly ACTIVE: "Active";
6504
- readonly DELETING: "Deleting";
6505
- readonly FAILED: "Failed";
6506
- readonly INITIALIZING: "Initializing";
6507
- };
6508
- /**
6509
- * @public
6510
- */
6511
- export type FlowDefinitionStatus = (typeof FlowDefinitionStatus)[keyof typeof FlowDefinitionStatus];
6512
- /**
6513
- * @public
6514
- */
6515
- export interface DescribeFlowDefinitionResponse {
6516
- /**
6517
- * <p>The Amazon Resource Name (ARN) of the flow definition.</p>
6518
- * @public
6519
- */
6520
- FlowDefinitionArn: string | undefined;
6521
- /**
6522
- * <p>The name of the flow definition.</p>
6523
- * @public
6524
- */
6525
- FlowDefinitionName: string | undefined;
6526
- /**
6527
- * <p>The status of the flow definition. Valid values are listed below.</p>
6528
- * @public
6529
- */
6530
- FlowDefinitionStatus: FlowDefinitionStatus | undefined;
6531
- /**
6532
- * <p>The timestamp when the flow definition was created.</p>
6533
- * @public
6534
- */
6535
- CreationTime: Date | undefined;
6536
- /**
6537
- * <p>Container for configuring the source of human task requests. Used to specify if Amazon Rekognition or Amazon Textract is used as an integration source.</p>
6538
- * @public
6539
- */
6540
- HumanLoopRequestSource?: HumanLoopRequestSource | undefined;
6541
- /**
6542
- * <p>An object containing information about what triggers a human review workflow.</p>
6543
- * @public
6544
- */
6545
- HumanLoopActivationConfig?: HumanLoopActivationConfig | undefined;
6546
- /**
6547
- * <p>An object containing information about who works on the task, the workforce task price, and other task details.</p>
6548
- * @public
6549
- */
6550
- HumanLoopConfig?: HumanLoopConfig | undefined;
6551
- /**
6552
- * <p>An object containing information about the output file.</p>
6553
- * @public
6554
- */
6555
- OutputConfig: FlowDefinitionOutputConfig | undefined;
6556
- /**
6557
- * <p>The Amazon Resource Name (ARN) of the Amazon Web Services Identity and Access Management (IAM) execution role for the flow definition.</p>
6558
- * @public
6559
- */
6560
- RoleArn: string | undefined;
6561
- /**
6562
- * <p>The reason your flow definition failed.</p>
6563
- * @public
6564
- */
6565
- FailureReason?: string | undefined;
6566
- }
6567
- /**
6568
- * @public
6569
- */
6570
- export interface DescribeHubRequest {
6571
- /**
6572
- * <p>The name of the hub to describe.</p>
6573
- * @public
6574
- */
6575
- HubName: string | undefined;
6576
- }
6577
- /**
6578
- * @public
6579
- * @enum
6580
- */
6581
- export declare const HubStatus: {
6582
- readonly CREATE_FAILED: "CreateFailed";
6583
- readonly CREATING: "Creating";
6584
- readonly DELETE_FAILED: "DeleteFailed";
6585
- readonly DELETING: "Deleting";
6586
- readonly IN_SERVICE: "InService";
6587
- readonly UPDATE_FAILED: "UpdateFailed";
6588
- readonly UPDATING: "Updating";
6589
- };
6590
- /**
6591
- * @public
6592
- */
6593
- export type HubStatus = (typeof HubStatus)[keyof typeof HubStatus];
6594
6617
  /**
6595
6618
  * @internal
6596
6619
  */
@@ -1,6 +1,102 @@
1
- import { ActionSummary, AdditionalInferenceSpecificationDefinition, AgentVersion, AlgorithmSortBy, AlgorithmSpecification, AlgorithmSummary, AmazonQSettings, AppDetails, AppImageConfigDetails, AppImageConfigSortKey, AppSortKey, AppSpecification, ArtifactSummary, AssociationEdgeType, AssociationSummary, AutoMLCandidate, AutoMLJobStatus, AutoMLJobSummary, AutoMLSortBy, AutoMLSortOrder, AutoRollbackConfig, Autotune, BatchDataCaptureConfig, BatchStrategy, CandidateSortBy, CandidateStatus, Channel, CheckpointConfig, ClusterNodeSummary, ClusterSchedulerConfigSummary, ClusterSortBy, ClusterSummary, CodeRepositorySortBy, CodeRepositorySortOrder, CodeRepositorySummary, CognitoConfig, CompilationJobStatus, InferenceSpecification, ModelApprovalStatus, ModelPackageStatus, ObjectiveStatus, OutputDataConfig, OutputParameter, ProductionVariantInstanceType, ResourceConfig, ResourceSpec, SchedulerResourceStatus, StoppingCondition, Tag, TransformInput, TransformOutput, TransformResources, UserContext, VpcConfig } from "./models_0";
2
- import { _InstanceType, ContainerDefinition, DockerSettings, DriftCheckBaselines, EdgeOutputConfig, EndpointInfo, ExecutionRoleIdentityConfig, FeatureDefinition, FeatureType, HubS3StorageConfig, HumanTaskConfig, HyperParameterTrainingJobDefinition, HyperParameterTuningJobConfig, HyperParameterTuningJobObjectiveType, HyperParameterTuningJobStrategyType, HyperParameterTuningJobWarmStartConfig, InferenceComponentComputeResourceRequirements, InferenceComponentStartupParameters, InferenceExecutionConfig, InferenceExperimentDataStorageConfig, InferenceExperimentSchedule, InferenceExperimentType, JobType, LabelingJobAlgorithmsConfig, LabelingJobInputConfig, LabelingJobOutputConfig, LabelingJobStoppingConditions, MetadataProperties, ModelBiasAppSpecification, ModelBiasBaselineConfig, ModelBiasJobInput, ModelCardExportOutputConfig, ModelCardSecurityConfig, ModelCardStatus, ModelExplainabilityAppSpecification, ModelExplainabilityBaselineConfig, ModelExplainabilityJobInput, ModelInfrastructureConfig, ModelLifeCycle, ModelMetrics, ModelPackageModelCard, ModelPackageSecurityConfig, ModelPackageValidationSpecification, ModelQualityAppSpecification, ModelQualityBaselineConfig, ModelQualityJobInput, MonitoringNetworkConfig, MonitoringOutputConfig, MonitoringResources, MonitoringStoppingCondition, OfflineStoreConfig, OnlineStoreConfig, Processor, ProductionVariantServerlessConfig, RecommendationJobInputConfig, RecommendationJobStoppingConditions, RecommendationJobType, ResourceLimits, RetryStrategy, ShadowModeConfig, SkipModelValidation, SourceAlgorithmSpecification, TrackingServerSize, UnifiedStudioSettings, UserSettings, VendorGuidance } from "./models_1";
3
- import { CustomizedMetricSpecification, DataCaptureConfigSummary, DataProcessing, DebugHookConfig, DebugRuleConfiguration, DebugRuleEvaluationStatus, DeployedImage, DeploymentRecommendation, DirectInternetAccess, DomainStatus, EdgePackagingJobStatus, EndpointStatus, ExperimentConfig, ExperimentSource, FeatureGroupStatus, FeatureParameter, FlowDefinitionStatus, HubContentType, HubStatus, InfraCheckConfig, InstanceMetadataServiceConfiguration, LastUpdateStatus, MemberDefinition, ModelArtifacts, ModelClientConfig, MonitoringScheduleConfig, MonitoringType, NetworkConfig, NotebookInstanceAcceleratorType, NotebookInstanceLifecycleHook, NotificationConfiguration, OfflineStoreStatus, OptimizationConfig, OptimizationJobDeploymentInstanceType, OptimizationJobModelSource, OptimizationJobOutputConfig, OptimizationVpcConfig, OwnershipSettings, ParallelismConfiguration, PartnerAppAuthType, PartnerAppConfig, PartnerAppMaintenanceConfig, PartnerAppType, ProcessingInput, ProcessingOutputConfig, ProcessingResources, ProcessingStoppingCondition, ProductionVariantSummary, ProfilerConfig, ProfilerRuleConfiguration, RemoteDebugConfig, RootAccess, RuleEvaluationStatus, ServiceCatalogProvisioningDetails, SourceIpConfig, SpaceSettings, SpaceSharingSettings, StudioLifecycleConfigAppType, TensorBoardOutputConfig, TrialComponentArtifact, TrialComponentParameterValue, TrialComponentStatus, WorkerAccessConfiguration } from "./models_2";
1
+ import { ActionSummary, AdditionalInferenceSpecificationDefinition, AgentVersion, AlgorithmSortBy, AlgorithmSpecification, AlgorithmSummary, AmazonQSettings, AppDetails, AppImageConfigDetails, AppImageConfigSortKey, AppSortKey, AppSpecification, ArtifactSummary, AssociationEdgeType, AssociationSummary, AutoMLCandidate, AutoMLJobStatus, AutoMLJobSummary, AutoMLSortBy, AutoMLSortOrder, AutoRollbackConfig, Autotune, BatchDataCaptureConfig, BatchStrategy, CandidateSortBy, CandidateStatus, Channel, CheckpointConfig, ClusterNodeSummary, ClusterSchedulerConfigSummary, ClusterSortBy, ClusterSummary, CognitoConfig, InferenceSpecification, ModelApprovalStatus, ModelPackageStatus, ObjectiveStatus, OutputDataConfig, OutputParameter, ProductionVariantInstanceType, ResourceConfig, ResourceSpec, SchedulerResourceStatus, StoppingCondition, Tag, TransformInput, TransformOutput, TransformResources, UserContext, VpcConfig } from "./models_0";
2
+ import { _InstanceType, ContainerDefinition, DockerSettings, DriftCheckBaselines, EdgeOutputConfig, EndpointInfo, ExecutionRoleIdentityConfig, FeatureDefinition, FeatureType, FlowDefinitionOutputConfig, HubS3StorageConfig, HumanLoopActivationConfig, HumanLoopConfig, HumanLoopRequestSource, HumanTaskConfig, HyperParameterTrainingJobDefinition, HyperParameterTuningJobConfig, HyperParameterTuningJobObjectiveType, HyperParameterTuningJobStrategyType, HyperParameterTuningJobWarmStartConfig, InferenceComponentComputeResourceRequirements, InferenceComponentStartupParameters, InferenceExecutionConfig, InferenceExperimentDataStorageConfig, InferenceExperimentSchedule, InferenceExperimentType, JobType, LabelingJobAlgorithmsConfig, LabelingJobInputConfig, LabelingJobOutputConfig, LabelingJobStoppingConditions, MetadataProperties, ModelBiasAppSpecification, ModelBiasBaselineConfig, ModelBiasJobInput, ModelCardExportOutputConfig, ModelCardSecurityConfig, ModelCardStatus, ModelExplainabilityAppSpecification, ModelExplainabilityBaselineConfig, ModelExplainabilityJobInput, ModelInfrastructureConfig, ModelLifeCycle, ModelMetrics, ModelPackageModelCard, ModelPackageSecurityConfig, ModelPackageValidationSpecification, ModelQualityAppSpecification, ModelQualityBaselineConfig, ModelQualityJobInput, MonitoringNetworkConfig, MonitoringOutputConfig, MonitoringResources, MonitoringStoppingCondition, OfflineStoreConfig, OnlineStoreConfig, Processor, ProductionVariantServerlessConfig, RecommendationJobInputConfig, RecommendationJobStoppingConditions, RecommendationJobType, ResourceLimits, RetryStrategy, ShadowModeConfig, SkipModelValidation, SourceAlgorithmSpecification, TrackingServerSize, UnifiedStudioSettings, UserSettings, VendorGuidance } from "./models_1";
3
+ import { CustomizedMetricSpecification, DataCaptureConfigSummary, DataProcessing, DebugHookConfig, DebugRuleConfiguration, DebugRuleEvaluationStatus, DeployedImage, DeploymentRecommendation, DirectInternetAccess, DomainStatus, EdgePackagingJobStatus, EndpointStatus, ExperimentConfig, ExperimentSource, FeatureGroupStatus, FeatureParameter, HubContentType, InfraCheckConfig, InstanceMetadataServiceConfiguration, LastUpdateStatus, MemberDefinition, ModelArtifacts, ModelClientConfig, MonitoringScheduleConfig, MonitoringType, NetworkConfig, NotebookInstanceAcceleratorType, NotebookInstanceLifecycleHook, NotificationConfiguration, OfflineStoreStatus, OptimizationConfig, OptimizationJobDeploymentInstanceType, OptimizationJobModelSource, OptimizationJobOutputConfig, OptimizationVpcConfig, OwnershipSettings, ParallelismConfiguration, PartnerAppAuthType, PartnerAppConfig, PartnerAppMaintenanceConfig, PartnerAppType, ProcessingInput, ProcessingOutputConfig, ProcessingResources, ProcessingStoppingCondition, ProductionVariantSummary, ProfilerConfig, ProfilerRuleConfiguration, RemoteDebugConfig, RootAccess, RuleEvaluationStatus, ServiceCatalogProvisioningDetails, SourceIpConfig, SpaceSettings, SpaceSharingSettings, StudioLifecycleConfigAppType, TensorBoardOutputConfig, TrialComponentArtifact, TrialComponentParameterValue, TrialComponentStatus, WorkerAccessConfiguration } from "./models_2";
4
+ /**
5
+ * @public
6
+ * @enum
7
+ */
8
+ export declare const FlowDefinitionStatus: {
9
+ readonly ACTIVE: "Active";
10
+ readonly DELETING: "Deleting";
11
+ readonly FAILED: "Failed";
12
+ readonly INITIALIZING: "Initializing";
13
+ };
14
+ /**
15
+ * @public
16
+ */
17
+ export type FlowDefinitionStatus = (typeof FlowDefinitionStatus)[keyof typeof FlowDefinitionStatus];
18
+ /**
19
+ * @public
20
+ */
21
+ export interface DescribeFlowDefinitionResponse {
22
+ /**
23
+ * <p>The Amazon Resource Name (ARN) of the flow definition.</p>
24
+ * @public
25
+ */
26
+ FlowDefinitionArn: string | undefined;
27
+ /**
28
+ * <p>The name of the flow definition.</p>
29
+ * @public
30
+ */
31
+ FlowDefinitionName: string | undefined;
32
+ /**
33
+ * <p>The status of the flow definition. Valid values are listed below.</p>
34
+ * @public
35
+ */
36
+ FlowDefinitionStatus: FlowDefinitionStatus | undefined;
37
+ /**
38
+ * <p>The timestamp when the flow definition was created.</p>
39
+ * @public
40
+ */
41
+ CreationTime: Date | undefined;
42
+ /**
43
+ * <p>Container for configuring the source of human task requests. Used to specify if Amazon Rekognition or Amazon Textract is used as an integration source.</p>
44
+ * @public
45
+ */
46
+ HumanLoopRequestSource?: HumanLoopRequestSource | undefined;
47
+ /**
48
+ * <p>An object containing information about what triggers a human review workflow.</p>
49
+ * @public
50
+ */
51
+ HumanLoopActivationConfig?: HumanLoopActivationConfig | undefined;
52
+ /**
53
+ * <p>An object containing information about who works on the task, the workforce task price, and other task details.</p>
54
+ * @public
55
+ */
56
+ HumanLoopConfig?: HumanLoopConfig | undefined;
57
+ /**
58
+ * <p>An object containing information about the output file.</p>
59
+ * @public
60
+ */
61
+ OutputConfig: FlowDefinitionOutputConfig | undefined;
62
+ /**
63
+ * <p>The Amazon Resource Name (ARN) of the Amazon Web Services Identity and Access Management (IAM) execution role for the flow definition.</p>
64
+ * @public
65
+ */
66
+ RoleArn: string | undefined;
67
+ /**
68
+ * <p>The reason your flow definition failed.</p>
69
+ * @public
70
+ */
71
+ FailureReason?: string | undefined;
72
+ }
73
+ /**
74
+ * @public
75
+ */
76
+ export interface DescribeHubRequest {
77
+ /**
78
+ * <p>The name of the hub to describe.</p>
79
+ * @public
80
+ */
81
+ HubName: string | undefined;
82
+ }
83
+ /**
84
+ * @public
85
+ * @enum
86
+ */
87
+ export declare const HubStatus: {
88
+ readonly CREATE_FAILED: "CreateFailed";
89
+ readonly CREATING: "Creating";
90
+ readonly DELETE_FAILED: "DeleteFailed";
91
+ readonly DELETING: "Deleting";
92
+ readonly IN_SERVICE: "InService";
93
+ readonly UPDATE_FAILED: "UpdateFailed";
94
+ readonly UPDATING: "Updating";
95
+ };
96
+ /**
97
+ * @public
98
+ */
99
+ export type HubStatus = (typeof HubStatus)[keyof typeof HubStatus];
4
100
  /**
5
101
  * @public
6
102
  */
@@ -8626,139 +8722,6 @@ export interface ListClusterSchedulerConfigsResponse {
8626
8722
  */
8627
8723
  NextToken?: string | undefined;
8628
8724
  }
8629
- /**
8630
- * @public
8631
- */
8632
- export interface ListCodeRepositoriesInput {
8633
- /**
8634
- * <p>A filter that returns only Git repositories that were created after the specified time.</p>
8635
- * @public
8636
- */
8637
- CreationTimeAfter?: Date | undefined;
8638
- /**
8639
- * <p>A filter that returns only Git repositories that were created before the specified time.</p>
8640
- * @public
8641
- */
8642
- CreationTimeBefore?: Date | undefined;
8643
- /**
8644
- * <p>A filter that returns only Git repositories that were last modified after the specified time.</p>
8645
- * @public
8646
- */
8647
- LastModifiedTimeAfter?: Date | undefined;
8648
- /**
8649
- * <p>A filter that returns only Git repositories that were last modified before the specified time.</p>
8650
- * @public
8651
- */
8652
- LastModifiedTimeBefore?: Date | undefined;
8653
- /**
8654
- * <p>The maximum number of Git repositories to return in the response.</p>
8655
- * @public
8656
- */
8657
- MaxResults?: number | undefined;
8658
- /**
8659
- * <p>A string in the Git repository's name. This filter returns only repositories whose name contains the specified string.</p>
8660
- * @public
8661
- */
8662
- NameContains?: string | undefined;
8663
- /**
8664
- * <p>If the result of a <code>ListCodeRepositoriesOutput</code> request was truncated, the response includes a <code>NextToken</code>. To get the next set of Git repositories, use the token in the next request.</p>
8665
- * @public
8666
- */
8667
- NextToken?: string | undefined;
8668
- /**
8669
- * <p>The field to sort results by. The default is <code>Name</code>.</p>
8670
- * @public
8671
- */
8672
- SortBy?: CodeRepositorySortBy | undefined;
8673
- /**
8674
- * <p>The sort order for results. The default is <code>Ascending</code>.</p>
8675
- * @public
8676
- */
8677
- SortOrder?: CodeRepositorySortOrder | undefined;
8678
- }
8679
- /**
8680
- * @public
8681
- */
8682
- export interface ListCodeRepositoriesOutput {
8683
- /**
8684
- * <p>Gets a list of summaries of the Git repositories. Each summary specifies the following values for the repository: </p> <ul> <li> <p>Name</p> </li> <li> <p>Amazon Resource Name (ARN)</p> </li> <li> <p>Creation time</p> </li> <li> <p>Last modified time</p> </li> <li> <p>Configuration information, including the URL location of the repository and the ARN of the Amazon Web Services Secrets Manager secret that contains the credentials used to access the repository.</p> </li> </ul>
8685
- * @public
8686
- */
8687
- CodeRepositorySummaryList: CodeRepositorySummary[] | undefined;
8688
- /**
8689
- * <p>If the result of a <code>ListCodeRepositoriesOutput</code> request was truncated, the response includes a <code>NextToken</code>. To get the next set of Git repositories, use the token in the next request.</p>
8690
- * @public
8691
- */
8692
- NextToken?: string | undefined;
8693
- }
8694
- /**
8695
- * @public
8696
- * @enum
8697
- */
8698
- export declare const ListCompilationJobsSortBy: {
8699
- readonly CREATION_TIME: "CreationTime";
8700
- readonly NAME: "Name";
8701
- readonly STATUS: "Status";
8702
- };
8703
- /**
8704
- * @public
8705
- */
8706
- export type ListCompilationJobsSortBy = (typeof ListCompilationJobsSortBy)[keyof typeof ListCompilationJobsSortBy];
8707
- /**
8708
- * @public
8709
- */
8710
- export interface ListCompilationJobsRequest {
8711
- /**
8712
- * <p>If the result of the previous <code>ListCompilationJobs</code> request was truncated, the response includes a <code>NextToken</code>. To retrieve the next set of model compilation jobs, use the token in the next request.</p>
8713
- * @public
8714
- */
8715
- NextToken?: string | undefined;
8716
- /**
8717
- * <p>The maximum number of model compilation jobs to return in the response.</p>
8718
- * @public
8719
- */
8720
- MaxResults?: number | undefined;
8721
- /**
8722
- * <p>A filter that returns the model compilation jobs that were created after a specified time. </p>
8723
- * @public
8724
- */
8725
- CreationTimeAfter?: Date | undefined;
8726
- /**
8727
- * <p>A filter that returns the model compilation jobs that were created before a specified time.</p>
8728
- * @public
8729
- */
8730
- CreationTimeBefore?: Date | undefined;
8731
- /**
8732
- * <p>A filter that returns the model compilation jobs that were modified after a specified time.</p>
8733
- * @public
8734
- */
8735
- LastModifiedTimeAfter?: Date | undefined;
8736
- /**
8737
- * <p>A filter that returns the model compilation jobs that were modified before a specified time.</p>
8738
- * @public
8739
- */
8740
- LastModifiedTimeBefore?: Date | undefined;
8741
- /**
8742
- * <p>A filter that returns the model compilation jobs whose name contains a specified string.</p>
8743
- * @public
8744
- */
8745
- NameContains?: string | undefined;
8746
- /**
8747
- * <p>A filter that retrieves model compilation jobs with a specific <code>CompilationJobStatus</code> status.</p>
8748
- * @public
8749
- */
8750
- StatusEquals?: CompilationJobStatus | undefined;
8751
- /**
8752
- * <p>The field by which to sort results. The default is <code>CreationTime</code>.</p>
8753
- * @public
8754
- */
8755
- SortBy?: ListCompilationJobsSortBy | undefined;
8756
- /**
8757
- * <p>The sort order for results. The default is <code>Ascending</code>.</p>
8758
- * @public
8759
- */
8760
- SortOrder?: SortOrder | undefined;
8761
- }
8762
8725
  /**
8763
8726
  * @internal
8764
8727
  */