@aws-sdk/client-sagemaker 3.817.0 → 3.821.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (45)
  1. package/dist-cjs/index.js +70 -23
  2. package/dist-es/models/models_0.js +3 -0
  3. package/dist-es/models/models_2.js +0 -15
  4. package/dist-es/models/models_3.js +20 -5
  5. package/dist-es/models/models_4.js +5 -0
  6. package/dist-es/protocols/Aws_json1_1.js +37 -0
  7. package/dist-types/commands/CreateDomainCommand.d.ts +1 -0
  8. package/dist-types/commands/CreateEndpointConfigCommand.d.ts +8 -0
  9. package/dist-types/commands/DescribeDomainCommand.d.ts +1 -0
  10. package/dist-types/commands/DescribeEndpointCommand.d.ts +30 -0
  11. package/dist-types/commands/DescribeEndpointConfigCommand.d.ts +8 -0
  12. package/dist-types/commands/DescribeFlowDefinitionCommand.d.ts +2 -1
  13. package/dist-types/commands/DescribeHubCommand.d.ts +1 -2
  14. package/dist-types/commands/DescribeMlflowTrackingServerCommand.d.ts +1 -0
  15. package/dist-types/commands/ListCodeRepositoriesCommand.d.ts +1 -1
  16. package/dist-types/commands/ListCompilationJobsCommand.d.ts +1 -1
  17. package/dist-types/commands/SearchCommand.d.ts +30 -0
  18. package/dist-types/commands/StopCompilationJobCommand.d.ts +1 -1
  19. package/dist-types/commands/StopEdgeDeploymentStageCommand.d.ts +1 -1
  20. package/dist-types/commands/StopEdgePackagingJobCommand.d.ts +1 -1
  21. package/dist-types/commands/StopHyperParameterTuningJobCommand.d.ts +1 -1
  22. package/dist-types/commands/StopInferenceExperimentCommand.d.ts +1 -2
  23. package/dist-types/commands/UpdateDomainCommand.d.ts +1 -0
  24. package/dist-types/models/models_0.d.ts +11 -11
  25. package/dist-types/models/models_1.d.ts +38 -53
  26. package/dist-types/models/models_2.d.ts +121 -98
  27. package/dist-types/models/models_3.d.ts +117 -151
  28. package/dist-types/models/models_4.d.ts +151 -78
  29. package/dist-types/models/models_5.d.ts +77 -2
  30. package/dist-types/ts3.4/commands/DescribeFlowDefinitionCommand.d.ts +2 -4
  31. package/dist-types/ts3.4/commands/DescribeHubCommand.d.ts +1 -2
  32. package/dist-types/ts3.4/commands/ListCodeRepositoriesCommand.d.ts +1 -1
  33. package/dist-types/ts3.4/commands/ListCompilationJobsCommand.d.ts +1 -1
  34. package/dist-types/ts3.4/commands/StopCompilationJobCommand.d.ts +1 -1
  35. package/dist-types/ts3.4/commands/StopEdgeDeploymentStageCommand.d.ts +1 -1
  36. package/dist-types/ts3.4/commands/StopEdgePackagingJobCommand.d.ts +1 -1
  37. package/dist-types/ts3.4/commands/StopHyperParameterTuningJobCommand.d.ts +1 -1
  38. package/dist-types/ts3.4/commands/StopInferenceExperimentCommand.d.ts +4 -2
  39. package/dist-types/ts3.4/models/models_0.d.ts +5 -3
  40. package/dist-types/ts3.4/models/models_1.d.ts +13 -13
  41. package/dist-types/ts3.4/models/models_2.d.ts +32 -39
  42. package/dist-types/ts3.4/models/models_3.d.ts +45 -45
  43. package/dist-types/ts3.4/models/models_4.d.ts +43 -22
  44. package/dist-types/ts3.4/models/models_5.d.ts +22 -0
  45. package/package.json +34 -34
@@ -4884,6 +4884,17 @@ export interface CanvasAppSettings {
4884
4884
  */
4885
4885
  EmrServerlessSettings?: EmrServerlessSettings | undefined;
4886
4886
  }
4887
+ /**
4888
+ * @public
4889
+ * @enum
4890
+ */
4891
+ export declare const CapacityReservationPreference: {
4892
+ readonly CAPACITY_RESERVATIONS_ONLY: "capacity-reservations-only";
4893
+ };
4894
+ /**
4895
+ * @public
4896
+ */
4897
+ export type CapacityReservationPreference = (typeof CapacityReservationPreference)[keyof typeof CapacityReservationPreference];
4887
4898
  /**
4888
4899
  * @public
4889
4900
  * @enum
@@ -6748,14 +6759,3 @@ export declare const ModelCacheSetting: {
6748
6759
  * @public
6749
6760
  */
6750
6761
  export type ModelCacheSetting = (typeof ModelCacheSetting)[keyof typeof ModelCacheSetting];
6751
- /**
6752
- * <p>Specifies additional configuration for hosting multi-model endpoints.</p>
6753
- * @public
6754
- */
6755
- export interface MultiModelConfig {
6756
- /**
6757
- * <p>Whether to cache models for a multi-model endpoint. By default, multi-model endpoints cache models so that a model does not have to be loaded into memory each time it is invoked. Some use cases do not benefit from model caching. For example, if an endpoint hosts a large number of models that are each invoked infrequently, the endpoint might perform better if you disable model caching. To disable model caching, set the value of this parameter to <code>Disabled</code>.</p>
6758
- * @public
6759
- */
6760
- ModelCacheSetting?: ModelCacheSetting | undefined;
6761
- }
@@ -1,6 +1,17 @@
1
1
  import { AutomaticJsonStringConversion as __AutomaticJsonStringConversion, ExceptionOptionType as __ExceptionOptionType } from "@smithy/smithy-client";
2
- import { ActionSource, ActionStatus, ActivationState, AdditionalInferenceSpecificationDefinition, AdditionalModelDataSource, AdditionalS3DataSource, AlgorithmValidationSpecification, AmazonQSettings, AnnotationConsolidationConfig, AppInstanceType, AppLifecycleManagement, AppNetworkAccessType, AppSecurityGroupManagement, AppType, ArtifactSource, AsyncInferenceConfig, AuthMode, AutoMLChannel, AutoMLComputeConfig, AutoMLDataSplitConfig, AutoMLJobChannel, AutoMLJobConfig, AutoMLJobObjective, AutoMLOutputDataConfig, AutoMLProblemTypeConfig, AutoMLSecurityConfig, AutoMountHomeEFS, AutoParameter, AutoRollbackConfig, Autotune, AwsManagedHumanLoopRequestSource, BatchTransformInput, BestObjectiveNotImproving, Bias, BlueGreenUpdatePolicy, CanvasAppSettings, CapacitySize, CaptureContentTypeHeader, CaptureOption, CategoricalParameter, CategoricalParameterRange, CategoricalParameterRangeSpecification, Channel, ChannelSpecification, CheckpointConfig, ClarifyExplainerConfig, ClusterInstanceGroupSpecification, ClusterNodeRecovery, ClusterOrchestrator, CodeEditorAppImageConfig, CodeEditorAppSettings, CodeRepository, CollectionConfig, CollectionType, CompleteOnConvergence, ComputeQuotaConfig, ComputeQuotaTarget, ContainerMode, CustomImage, FeatureStatus, GitConfig, ImageConfig, InferenceSpecification, JupyterLabAppImageConfig, KernelGatewayImageConfig, MetricDefinition, MetricsSource, ModelApprovalStatus, ModelDataSource, MultiModelConfig, OutputDataConfig, ProblemType, ProcessingS3DataDistributionType, ProcessingS3InputMode, ProductionVariantInstanceType, ResourceConfig, ResourceSpec, StoppingCondition, Tag, TargetDevice, TargetPlatformAccelerator, TargetPlatformArch, TargetPlatformOs, TrainingInputMode, TrainingInstanceType, TransformJobDefinition, VpcConfig } from "./models_0";
2
+ import { ActionSource, ActionStatus, ActivationState, AdditionalInferenceSpecificationDefinition, AdditionalModelDataSource, AdditionalS3DataSource, AlgorithmValidationSpecification, AmazonQSettings, AnnotationConsolidationConfig, AppInstanceType, AppLifecycleManagement, AppNetworkAccessType, AppSecurityGroupManagement, AppType, ArtifactSource, AsyncInferenceConfig, AuthMode, AutoMLChannel, AutoMLComputeConfig, AutoMLDataSplitConfig, AutoMLJobChannel, AutoMLJobConfig, AutoMLJobObjective, AutoMLOutputDataConfig, AutoMLProblemTypeConfig, AutoMLSecurityConfig, AutoMountHomeEFS, AutoParameter, AutoRollbackConfig, Autotune, AwsManagedHumanLoopRequestSource, BatchTransformInput, BestObjectiveNotImproving, Bias, BlueGreenUpdatePolicy, CanvasAppSettings, CapacityReservationPreference, CapacitySize, CaptureContentTypeHeader, CaptureOption, CategoricalParameter, CategoricalParameterRange, CategoricalParameterRangeSpecification, Channel, ChannelSpecification, CheckpointConfig, ClarifyExplainerConfig, ClusterInstanceGroupSpecification, ClusterNodeRecovery, ClusterOrchestrator, CodeEditorAppImageConfig, CodeEditorAppSettings, CodeRepository, CollectionConfig, CollectionType, CompleteOnConvergence, ComputeQuotaConfig, ComputeQuotaTarget, ContainerMode, CustomImage, FeatureStatus, GitConfig, ImageConfig, InferenceSpecification, JupyterLabAppImageConfig, KernelGatewayImageConfig, MetricDefinition, MetricsSource, ModelApprovalStatus, ModelCacheSetting, ModelDataSource, OutputDataConfig, ProblemType, ProcessingS3DataDistributionType, ProcessingS3InputMode, ProductionVariantInstanceType, ResourceConfig, ResourceSpec, StoppingCondition, Tag, TargetDevice, TargetPlatformAccelerator, TargetPlatformArch, TargetPlatformOs, TrainingInputMode, TrainingInstanceType, TransformJobDefinition, VpcConfig } from "./models_0";
3
3
  import { SageMakerServiceException as __BaseException } from "./SageMakerServiceException";
4
+ /**
5
+ * <p>Specifies additional configuration for hosting multi-model endpoints.</p>
6
+ * @public
7
+ */
8
+ export interface MultiModelConfig {
9
+ /**
10
+ * <p>Whether to cache models for a multi-model endpoint. By default, multi-model endpoints cache models so that a model does not have to be loaded into memory each time it is invoked. Some use cases do not benefit from model caching. For example, if an endpoint hosts a large number of models that are each invoked infrequently, the endpoint might perform better if you disable model caching. To disable model caching, set the value of this parameter to <code>Disabled</code>.</p>
11
+ * @public
12
+ */
13
+ ModelCacheSetting?: ModelCacheSetting | undefined;
14
+ }
4
15
  /**
5
16
  * <p>Describes the container, as part of model definition.</p>
6
17
  * @public
@@ -2408,6 +2419,11 @@ export interface UnifiedStudioSettings {
2408
2419
  * @public
2409
2420
  */
2410
2421
  ProjectS3Path?: string | undefined;
2422
+ /**
2423
+ * <p>The ARN of the application managed by SageMaker AI and SageMaker Unified Studio in the Amazon Web Services IAM Identity Center.</p>
2424
+ * @public
2425
+ */
2426
+ SingleSignOnApplicationArn?: string | undefined;
2411
2427
  }
2412
2428
  /**
2413
2429
  * <p>A collection of settings that apply to the <code>SageMaker Domain</code>. These settings are specified through the <code>CreateDomain</code> API call.</p>
@@ -2893,6 +2909,22 @@ export declare const ProductionVariantAcceleratorType: {
2893
2909
  * @public
2894
2910
  */
2895
2911
  export type ProductionVariantAcceleratorType = (typeof ProductionVariantAcceleratorType)[keyof typeof ProductionVariantAcceleratorType];
2912
+ /**
2913
+ * <p>Settings for the capacity reservation for the compute instances that SageMaker AI reserves for an endpoint. </p>
2914
+ * @public
2915
+ */
2916
+ export interface ProductionVariantCapacityReservationConfig {
2917
+ /**
2918
+ * <p>Options that you can choose for the capacity reservation. SageMaker AI supports the following options:</p> <dl> <dt>capacity-reservations-only</dt> <dd> <p>SageMaker AI launches instances only into an ML capacity reservation. If no capacity is available, the instances fail to launch.</p> </dd> </dl>
2919
+ * @public
2920
+ */
2921
+ CapacityReservationPreference?: CapacityReservationPreference | undefined;
2922
+ /**
2923
+ * <p>The Amazon Resource Name (ARN) that uniquely identifies the ML capacity reservation that SageMaker AI applies when it deploys the endpoint.</p>
2924
+ * @public
2925
+ */
2926
+ MlReservationArn?: string | undefined;
2927
+ }
2896
2928
  /**
2897
2929
  * <p>Specifies configuration for a core dump from the model container when the process crashes.</p>
2898
2930
  * @public
@@ -3080,6 +3112,11 @@ export interface ProductionVariant {
3080
3112
  * @public
3081
3113
  */
3082
3114
  InferenceAmiVersion?: ProductionVariantInferenceAmiVersion | undefined;
3115
+ /**
3116
+ * <p>Settings for the capacity reservation for the compute instances that SageMaker AI reserves for an endpoint. </p>
3117
+ * @public
3118
+ */
3119
+ CapacityReservationConfig?: ProductionVariantCapacityReservationConfig | undefined;
3083
3120
  }
3084
3121
  /**
3085
3122
  * @public
@@ -6849,58 +6886,6 @@ export interface CreateModelQualityJobDefinitionResponse {
6849
6886
  */
6850
6887
  JobDefinitionArn: string | undefined;
6851
6888
  }
6852
- /**
6853
- * <p>Configuration for monitoring constraints and monitoring statistics. These baseline resources are compared against the results of the current job from the series of jobs scheduled to collect data periodically.</p>
6854
- * @public
6855
- */
6856
- export interface MonitoringBaselineConfig {
6857
- /**
6858
- * <p>The name of the job that performs baselining for the monitoring job.</p>
6859
- * @public
6860
- */
6861
- BaseliningJobName?: string | undefined;
6862
- /**
6863
- * <p>The baseline constraint file in Amazon S3 that the current monitoring job should be validated against.</p>
6864
- * @public
6865
- */
6866
- ConstraintsResource?: MonitoringConstraintsResource | undefined;
6867
- /**
6868
- * <p>The baseline statistics file in Amazon S3 that the current monitoring job should be validated against.</p>
6869
- * @public
6870
- */
6871
- StatisticsResource?: MonitoringStatisticsResource | undefined;
6872
- }
6873
- /**
6874
- * <p>Container image configuration object for the monitoring job.</p>
6875
- * @public
6876
- */
6877
- export interface MonitoringAppSpecification {
6878
- /**
6879
- * <p>The container image to be run by the monitoring job.</p>
6880
- * @public
6881
- */
6882
- ImageUri: string | undefined;
6883
- /**
6884
- * <p>Specifies the entrypoint for a container used to run the monitoring job.</p>
6885
- * @public
6886
- */
6887
- ContainerEntrypoint?: string[] | undefined;
6888
- /**
6889
- * <p>An array of arguments for the container used to run the monitoring job.</p>
6890
- * @public
6891
- */
6892
- ContainerArguments?: string[] | undefined;
6893
- /**
6894
- * <p>An Amazon S3 URI to a script that is called per row prior to running analysis. It can base64 decode the payload and convert it into a flattened JSON so that the built-in container can use the converted data. Applicable only for the built-in (first party) containers.</p>
6895
- * @public
6896
- */
6897
- RecordPreprocessorSourceUri?: string | undefined;
6898
- /**
6899
- * <p>An Amazon S3 URI to a script that is called after analysis has been performed. Applicable only for the built-in (first party) containers.</p>
6900
- * @public
6901
- */
6902
- PostAnalyticsProcessorSourceUri?: string | undefined;
6903
- }
6904
6889
  /**
6905
6890
  * @internal
6906
6891
  */
@@ -1,5 +1,57 @@
1
- import { ActionSource, ActionStatus, ActivationState, AlgorithmSpecification, AlgorithmStatus, AlgorithmStatusDetails, AlgorithmValidationSpecification, AppNetworkAccessType, AppSecurityGroupManagement, AppSpecification, AppStatus, AppType, ArtifactSource, AsyncInferenceConfig, AthenaDatasetDefinition, AuthMode, AutoMLCandidate, AutoMLChannel, AutoMLComputeConfig, AutoMLDataSplitConfig, AutoMLJobArtifacts, AutoMLJobChannel, AutoMLJobCompletionCriteria, AutoMLJobConfig, AutoMLJobObjective, AutoMLJobSecondaryStatus, AutoMLJobStatus, AutoMLOutputDataConfig, AutoMLPartialFailureReason, AutoMLProblemTypeConfig, AutoMLProblemTypeConfigName, AutoMLResolvedAttributes, AutoMLSecurityConfig, BatchDataCaptureConfig, BatchStrategy, BatchTransformInput, CaptureStatus, Channel, CheckpointConfig, ClusterInstanceGroupDetails, ClusterNodeDetails, ClusterNodeRecovery, ClusterOrchestrator, ClusterStatus, CodeEditorAppImageConfig, CodeRepository, CognitoConfig, CognitoMemberDefinition, CollectionConfiguration, CompilationJobStatus, ComputeQuotaConfig, ComputeQuotaTarget, FeatureStatus, GitConfig, InferenceSpecification, JupyterLabAppImageConfig, KernelGatewayImageConfig, OutputDataConfig, ProblemType, ProcessingS3DataDistributionType, ProcessingS3InputMode, ProductionVariantInstanceType, ResourceConfig, ResourceSpec, SchedulerResourceStatus, StoppingCondition, Tag, TransformInput, TransformOutput, TransformResources, UserContext, VpcConfig } from "./models_0";
2
- import { _InstanceType, ContextSource, DataCaptureConfig, DataQualityAppSpecification, DataQualityBaselineConfig, DataQualityJobInput, DefaultSpaceSettings, DeploymentConfig, DeviceSelectionConfig, DomainSettings, EdgeDeploymentConfig, EdgeDeploymentModelConfig, EdgeOutputConfig, EdgePresetDeploymentType, EndpointInput, ExplainerConfig, FeatureDefinition, FeatureType, FlowDefinitionOutputConfig, HumanLoopActivationConfig, HumanLoopConfig, HumanLoopRequestSource, InputConfig, JupyterServerAppSettings, KernelGatewayAppSettings, MetadataProperties, ModelDeployConfig, MonitoringAppSpecification, MonitoringBaselineConfig, MonitoringNetworkConfig, MonitoringOutputConfig, MonitoringResources, MonitoringStoppingCondition, NeoVpcConfig, OfflineStoreConfig, OnlineStoreConfig, OutputConfig, ProcessingInstanceType, ProcessingS3UploadMode, ProductionVariant, ProductionVariantAcceleratorType, ProductionVariantManagedInstanceScaling, ProductionVariantRoutingConfig, ProductionVariantServerlessConfig, RetryStrategy, SchedulerConfig, TagPropagation, ThroughputMode, TrainingSpecification, UserSettings } from "./models_1";
1
+ import { ActionSource, ActionStatus, ActivationState, AlgorithmSpecification, AlgorithmStatus, AlgorithmStatusDetails, AlgorithmValidationSpecification, AppNetworkAccessType, AppSecurityGroupManagement, AppSpecification, AppStatus, AppType, ArtifactSource, AsyncInferenceConfig, AthenaDatasetDefinition, AuthMode, AutoMLCandidate, AutoMLChannel, AutoMLComputeConfig, AutoMLDataSplitConfig, AutoMLJobArtifacts, AutoMLJobChannel, AutoMLJobCompletionCriteria, AutoMLJobConfig, AutoMLJobObjective, AutoMLJobSecondaryStatus, AutoMLJobStatus, AutoMLOutputDataConfig, AutoMLPartialFailureReason, AutoMLProblemTypeConfig, AutoMLProblemTypeConfigName, AutoMLResolvedAttributes, AutoMLSecurityConfig, BatchDataCaptureConfig, BatchStrategy, BatchTransformInput, CapacityReservationPreference, CaptureStatus, Channel, CheckpointConfig, ClusterInstanceGroupDetails, ClusterNodeDetails, ClusterNodeRecovery, ClusterOrchestrator, ClusterStatus, CodeEditorAppImageConfig, CodeRepository, CognitoConfig, CognitoMemberDefinition, CollectionConfiguration, CompilationJobStatus, ComputeQuotaConfig, ComputeQuotaTarget, FeatureStatus, GitConfig, InferenceSpecification, JupyterLabAppImageConfig, KernelGatewayImageConfig, OutputDataConfig, ProblemType, ProcessingS3DataDistributionType, ProcessingS3InputMode, ProductionVariantInstanceType, ResourceConfig, ResourceSpec, SchedulerResourceStatus, StoppingCondition, Tag, TransformInput, TransformOutput, TransformResources, UserContext, VpcConfig } from "./models_0";
2
+ import { _InstanceType, ContextSource, DataCaptureConfig, DataQualityAppSpecification, DataQualityBaselineConfig, DataQualityJobInput, DefaultSpaceSettings, DeploymentConfig, DeviceSelectionConfig, DomainSettings, EdgeDeploymentConfig, EdgeDeploymentModelConfig, EdgeOutputConfig, EdgePresetDeploymentType, EndpointInput, ExplainerConfig, FeatureDefinition, FeatureType, InputConfig, JupyterServerAppSettings, KernelGatewayAppSettings, MetadataProperties, ModelDeployConfig, MonitoringConstraintsResource, MonitoringNetworkConfig, MonitoringOutputConfig, MonitoringResources, MonitoringStatisticsResource, MonitoringStoppingCondition, NeoVpcConfig, OfflineStoreConfig, OnlineStoreConfig, OutputConfig, ProcessingInstanceType, ProcessingS3UploadMode, ProductionVariant, ProductionVariantAcceleratorType, ProductionVariantManagedInstanceScaling, ProductionVariantRoutingConfig, ProductionVariantServerlessConfig, RetryStrategy, SchedulerConfig, TagPropagation, ThroughputMode, TrainingSpecification, UserSettings } from "./models_1";
3
+ /**
4
+ * <p>Configuration for monitoring constraints and monitoring statistics. These baseline resources are compared against the results of the current job from the series of jobs scheduled to collect data periodically.</p>
5
+ * @public
6
+ */
7
+ export interface MonitoringBaselineConfig {
8
+ /**
9
+ * <p>The name of the job that performs baselining for the monitoring job.</p>
10
+ * @public
11
+ */
12
+ BaseliningJobName?: string | undefined;
13
+ /**
14
+ * <p>The baseline constraint file in Amazon S3 that the current monitoring job should be validated against.</p>
15
+ * @public
16
+ */
17
+ ConstraintsResource?: MonitoringConstraintsResource | undefined;
18
+ /**
19
+ * <p>The baseline statistics file in Amazon S3 that the current monitoring job should be validated against.</p>
20
+ * @public
21
+ */
22
+ StatisticsResource?: MonitoringStatisticsResource | undefined;
23
+ }
24
+ /**
25
+ * <p>Container image configuration object for the monitoring job.</p>
26
+ * @public
27
+ */
28
+ export interface MonitoringAppSpecification {
29
+ /**
30
+ * <p>The container image to be run by the monitoring job.</p>
31
+ * @public
32
+ */
33
+ ImageUri: string | undefined;
34
+ /**
35
+ * <p>Specifies the entrypoint for a container used to run the monitoring job.</p>
36
+ * @public
37
+ */
38
+ ContainerEntrypoint?: string[] | undefined;
39
+ /**
40
+ * <p>An array of arguments for the container used to run the monitoring job.</p>
41
+ * @public
42
+ */
43
+ ContainerArguments?: string[] | undefined;
44
+ /**
45
+ * <p>An Amazon S3 URI to a script that is called per row prior to running analysis. It can base64 decode the payload and convert it into a flattened JSON so that the built-in container can use the converted data. Applicable only for the built-in (first party) containers.</p>
46
+ * @public
47
+ */
48
+ RecordPreprocessorSourceUri?: string | undefined;
49
+ /**
50
+ * <p>An Amazon S3 URI to a script that is called after analysis has been performed. Applicable only for the built-in (first party) containers.</p>
51
+ * @public
52
+ */
53
+ PostAnalyticsProcessorSourceUri?: string | undefined;
54
+ }
3
55
  /**
4
56
  * <p>The inputs for a monitoring job.</p>
5
57
  * @public
@@ -5918,6 +5970,68 @@ export interface PendingDeploymentSummary {
5918
5970
  */
5919
5971
  ShadowProductionVariants?: PendingProductionVariantSummary[] | undefined;
5920
5972
  }
5973
+ /**
5974
+ * <p>The EC2 capacity reservations that are shared to an ML capacity reservation.</p>
5975
+ * @public
5976
+ */
5977
+ export interface Ec2CapacityReservation {
5978
+ /**
5979
+ * <p>The unique identifier for an EC2 capacity reservation that's part of the ML capacity reservation.</p>
5980
+ * @public
5981
+ */
5982
+ Ec2CapacityReservationId?: string | undefined;
5983
+ /**
5984
+ * <p>The number of instances that you allocated to the EC2 capacity reservation.</p>
5985
+ * @public
5986
+ */
5987
+ TotalInstanceCount?: number | undefined;
5988
+ /**
5989
+ * <p>The number of instances that are currently available in the EC2 capacity reservation.</p>
5990
+ * @public
5991
+ */
5992
+ AvailableInstanceCount?: number | undefined;
5993
+ /**
5994
+ * <p>The number of instances from the EC2 capacity reservation that are being used by the endpoint.</p>
5995
+ * @public
5996
+ */
5997
+ UsedByCurrentEndpoint?: number | undefined;
5998
+ }
5999
+ /**
6000
+ * <p>Details about an ML capacity reservation.</p>
6001
+ * @public
6002
+ */
6003
+ export interface ProductionVariantCapacityReservationSummary {
6004
+ /**
6005
+ * <p>The Amazon Resource Name (ARN) that uniquely identifies the ML capacity reservation that SageMaker AI applies when it deploys the endpoint.</p>
6006
+ * @public
6007
+ */
6008
+ MlReservationArn?: string | undefined;
6009
+ /**
6010
+ * <p>The option that you chose for the capacity reservation. SageMaker AI supports the following options:</p> <dl> <dt>capacity-reservations-only</dt> <dd> <p>SageMaker AI launches instances only into an ML capacity reservation. If no capacity is available, the instances fail to launch.</p> </dd> </dl>
6011
+ * @public
6012
+ */
6013
+ CapacityReservationPreference?: CapacityReservationPreference | undefined;
6014
+ /**
6015
+ * <p>The number of instances that you allocated to the ML capacity reservation.</p>
6016
+ * @public
6017
+ */
6018
+ TotalInstanceCount?: number | undefined;
6019
+ /**
6020
+ * <p>The number of instances that are currently available in the ML capacity reservation.</p>
6021
+ * @public
6022
+ */
6023
+ AvailableInstanceCount?: number | undefined;
6024
+ /**
6025
+ * <p>The number of instances from the ML capacity reservation that are being used by the endpoint.</p>
6026
+ * @public
6027
+ */
6028
+ UsedByCurrentEndpoint?: number | undefined;
6029
+ /**
6030
+ * <p>The EC2 capacity reservations that are shared to this ML capacity reservation, if any.</p>
6031
+ * @public
6032
+ */
6033
+ Ec2CapacityReservations?: Ec2CapacityReservation[] | undefined;
6034
+ }
5921
6035
  /**
5922
6036
  * <p>Describes weight and capacities for a production variant associated with an endpoint. If you sent a request to the <code>UpdateEndpointWeightsAndCapacities</code> API and the endpoint status is <code>Updating</code>, you get different desired and current values. </p>
5923
6037
  * @public
@@ -5978,6 +6092,11 @@ export interface ProductionVariantSummary {
5978
6092
  * @public
5979
6093
  */
5980
6094
  RoutingConfig?: ProductionVariantRoutingConfig | undefined;
6095
+ /**
6096
+ * <p>Settings for the capacity reservation for the compute instances that SageMaker AI reserves for an endpoint. </p>
6097
+ * @public
6098
+ */
6099
+ CapacityReservationConfig?: ProductionVariantCapacityReservationSummary | undefined;
5981
6100
  }
5982
6101
  /**
5983
6102
  * @public
@@ -6495,102 +6614,6 @@ export interface DescribeFlowDefinitionRequest {
6495
6614
  */
6496
6615
  FlowDefinitionName: string | undefined;
6497
6616
  }
6498
- /**
6499
- * @public
6500
- * @enum
6501
- */
6502
- export declare const FlowDefinitionStatus: {
6503
- readonly ACTIVE: "Active";
6504
- readonly DELETING: "Deleting";
6505
- readonly FAILED: "Failed";
6506
- readonly INITIALIZING: "Initializing";
6507
- };
6508
- /**
6509
- * @public
6510
- */
6511
- export type FlowDefinitionStatus = (typeof FlowDefinitionStatus)[keyof typeof FlowDefinitionStatus];
6512
- /**
6513
- * @public
6514
- */
6515
- export interface DescribeFlowDefinitionResponse {
6516
- /**
6517
- * <p>The Amazon Resource Name (ARN) of the flow definition.</p>
6518
- * @public
6519
- */
6520
- FlowDefinitionArn: string | undefined;
6521
- /**
6522
- * <p>The name of the flow definition.</p>
6523
- * @public
6524
- */
6525
- FlowDefinitionName: string | undefined;
6526
- /**
6527
- * <p>The status of the flow definition. Valid values are listed below.</p>
6528
- * @public
6529
- */
6530
- FlowDefinitionStatus: FlowDefinitionStatus | undefined;
6531
- /**
6532
- * <p>The timestamp when the flow definition was created.</p>
6533
- * @public
6534
- */
6535
- CreationTime: Date | undefined;
6536
- /**
6537
- * <p>Container for configuring the source of human task requests. Used to specify if Amazon Rekognition or Amazon Textract is used as an integration source.</p>
6538
- * @public
6539
- */
6540
- HumanLoopRequestSource?: HumanLoopRequestSource | undefined;
6541
- /**
6542
- * <p>An object containing information about what triggers a human review workflow.</p>
6543
- * @public
6544
- */
6545
- HumanLoopActivationConfig?: HumanLoopActivationConfig | undefined;
6546
- /**
6547
- * <p>An object containing information about who works on the task, the workforce task price, and other task details.</p>
6548
- * @public
6549
- */
6550
- HumanLoopConfig?: HumanLoopConfig | undefined;
6551
- /**
6552
- * <p>An object containing information about the output file.</p>
6553
- * @public
6554
- */
6555
- OutputConfig: FlowDefinitionOutputConfig | undefined;
6556
- /**
6557
- * <p>The Amazon Resource Name (ARN) of the Amazon Web Services Identity and Access Management (IAM) execution role for the flow definition.</p>
6558
- * @public
6559
- */
6560
- RoleArn: string | undefined;
6561
- /**
6562
- * <p>The reason your flow definition failed.</p>
6563
- * @public
6564
- */
6565
- FailureReason?: string | undefined;
6566
- }
6567
- /**
6568
- * @public
6569
- */
6570
- export interface DescribeHubRequest {
6571
- /**
6572
- * <p>The name of the hub to describe.</p>
6573
- * @public
6574
- */
6575
- HubName: string | undefined;
6576
- }
6577
- /**
6578
- * @public
6579
- * @enum
6580
- */
6581
- export declare const HubStatus: {
6582
- readonly CREATE_FAILED: "CreateFailed";
6583
- readonly CREATING: "Creating";
6584
- readonly DELETE_FAILED: "DeleteFailed";
6585
- readonly DELETING: "Deleting";
6586
- readonly IN_SERVICE: "InService";
6587
- readonly UPDATE_FAILED: "UpdateFailed";
6588
- readonly UPDATING: "Updating";
6589
- };
6590
- /**
6591
- * @public
6592
- */
6593
- export type HubStatus = (typeof HubStatus)[keyof typeof HubStatus];
6594
6617
  /**
6595
6618
  * @internal
6596
6619
  */