@aws-sdk/client-sagemaker 3.862.0 → 3.864.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (66)
  1. package/README.md +16 -0
  2. package/dist-cjs/index.js +575 -392
  3. package/dist-es/SageMaker.js +4 -0
  4. package/dist-es/commands/DescribeReservedCapacityCommand.js +22 -0
  5. package/dist-es/commands/ListUltraServersByReservedCapacityCommand.js +22 -0
  6. package/dist-es/commands/index.js +2 -0
  7. package/dist-es/models/models_0.js +1 -13
  8. package/dist-es/models/models_1.js +13 -0
  9. package/dist-es/models/models_3.js +22 -33
  10. package/dist-es/models/models_4.js +21 -14
  11. package/dist-es/models/models_5.js +12 -1
  12. package/dist-es/pagination/ListUltraServersByReservedCapacityPaginator.js +4 -0
  13. package/dist-es/pagination/index.js +1 -0
  14. package/dist-es/protocols/Aws_json1_1.js +133 -0
  15. package/dist-types/SageMaker.d.ts +14 -0
  16. package/dist-types/SageMakerClient.d.ts +4 -2
  17. package/dist-types/commands/AttachClusterNodeVolumeCommand.d.ts +1 -1
  18. package/dist-types/commands/CreateAlgorithmCommand.d.ts +12 -3
  19. package/dist-types/commands/CreateHyperParameterTuningJobCommand.d.ts +26 -8
  20. package/dist-types/commands/CreateModelBiasJobDefinitionCommand.d.ts +1 -2
  21. package/dist-types/commands/CreateTrainingJobCommand.d.ts +11 -2
  22. package/dist-types/commands/CreateTrainingPlanCommand.d.ts +1 -0
  23. package/dist-types/commands/DescribeAlgorithmCommand.d.ts +12 -3
  24. package/dist-types/commands/DescribeClusterNodeCommand.d.ts +3 -0
  25. package/dist-types/commands/DescribeComputeQuotaCommand.d.ts +1 -1
  26. package/dist-types/commands/DescribeContextCommand.d.ts +1 -2
  27. package/dist-types/commands/DescribeHyperParameterTuningJobCommand.d.ts +26 -8
  28. package/dist-types/commands/DescribeReservedCapacityCommand.d.ts +93 -0
  29. package/dist-types/commands/DescribeTrainingJobCommand.d.ts +11 -2
  30. package/dist-types/commands/DescribeTrainingPlanCommand.d.ts +7 -1
  31. package/dist-types/commands/DetachClusterNodeVolumeCommand.d.ts +1 -1
  32. package/dist-types/commands/ListClusterNodesCommand.d.ts +3 -0
  33. package/dist-types/commands/ListTrainingPlansCommand.d.ts +5 -1
  34. package/dist-types/commands/ListUltraServersByReservedCapacityCommand.d.ts +92 -0
  35. package/dist-types/commands/ListWorkteamsCommand.d.ts +1 -1
  36. package/dist-types/commands/SearchCommand.d.ts +26 -8
  37. package/dist-types/commands/SearchTrainingPlanOfferingsCommand.d.ts +7 -2
  38. package/dist-types/commands/index.d.ts +2 -0
  39. package/dist-types/models/models_0.d.ts +71 -87
  40. package/dist-types/models/models_1.d.ts +77 -89
  41. package/dist-types/models/models_2.d.ts +94 -107
  42. package/dist-types/models/models_3.d.ts +295 -295
  43. package/dist-types/models/models_4.d.ts +374 -674
  44. package/dist-types/models/models_5.d.ts +703 -5
  45. package/dist-types/pagination/ListUltraServersByReservedCapacityPaginator.d.ts +7 -0
  46. package/dist-types/pagination/index.d.ts +1 -0
  47. package/dist-types/protocols/Aws_json1_1.d.ts +18 -0
  48. package/dist-types/ts3.4/SageMaker.d.ts +40 -0
  49. package/dist-types/ts3.4/SageMakerClient.d.ts +12 -0
  50. package/dist-types/ts3.4/commands/CreateModelBiasJobDefinitionCommand.d.ts +4 -2
  51. package/dist-types/ts3.4/commands/DescribeComputeQuotaCommand.d.ts +1 -1
  52. package/dist-types/ts3.4/commands/DescribeContextCommand.d.ts +4 -2
  53. package/dist-types/ts3.4/commands/DescribeReservedCapacityCommand.d.ts +51 -0
  54. package/dist-types/ts3.4/commands/ListUltraServersByReservedCapacityCommand.d.ts +51 -0
  55. package/dist-types/ts3.4/commands/ListWorkteamsCommand.d.ts +1 -1
  56. package/dist-types/ts3.4/commands/index.d.ts +2 -0
  57. package/dist-types/ts3.4/models/models_0.d.ts +15 -25
  58. package/dist-types/ts3.4/models/models_1.d.ts +25 -21
  59. package/dist-types/ts3.4/models/models_2.d.ts +24 -29
  60. package/dist-types/ts3.4/models/models_3.d.ts +88 -93
  61. package/dist-types/ts3.4/models/models_4.d.ts +112 -184
  62. package/dist-types/ts3.4/models/models_5.d.ts +183 -5
  63. package/dist-types/ts3.4/pagination/ListUltraServersByReservedCapacityPaginator.d.ts +11 -0
  64. package/dist-types/ts3.4/pagination/index.d.ts +1 -0
  65. package/dist-types/ts3.4/protocols/Aws_json1_1.d.ts +24 -0
  66. package/package.json +5 -5
@@ -1533,6 +1533,7 @@ export declare const TrainingInstanceType: {
1533
1533
  readonly ML_P5EN_48XLARGE: "ml.p5en.48xlarge";
1534
1534
  readonly ML_P5E_48XLARGE: "ml.p5e.48xlarge";
1535
1535
  readonly ML_P5_48XLARGE: "ml.p5.48xlarge";
1536
+ readonly ML_P6E_GB200_36XLARGE: "ml.p6e-gb200.36xlarge";
1536
1537
  readonly ML_P6_B200_48XLARGE: "ml.p6-b200.48xlarge";
1537
1538
  readonly ML_R5D_12XLARGE: "ml.r5d.12xlarge";
1538
1539
  readonly ML_R5D_16XLARGE: "ml.r5d.16xlarge";
@@ -1593,6 +1594,38 @@ export interface InstanceGroup {
1593
1594
  */
1594
1595
  InstanceGroupName: string | undefined;
1595
1596
  }
1597
+ /**
1598
+ * <p>Specifies how instances should be placed on a specific UltraServer.</p>
1599
+ * @public
1600
+ */
1601
+ export interface PlacementSpecification {
1602
+ /**
1603
+ * <p>The unique identifier of the UltraServer where instances should be placed.</p>
1604
+ * @public
1605
+ */
1606
+ UltraServerId?: string | undefined;
1607
+ /**
1608
+ * <p>The number of ML compute instances required to be placed together on the same UltraServer. Minimum value of 1.</p>
1609
+ * @public
1610
+ */
1611
+ InstanceCount: number | undefined;
1612
+ }
1613
+ /**
1614
+ * <p>Configuration for how instances are placed and allocated within UltraServers. This is only applicable for UltraServer capacity.</p>
1615
+ * @public
1616
+ */
1617
+ export interface InstancePlacementConfig {
1618
+ /**
1619
+ * <p>If set to true, allows multiple jobs to share the same UltraServer instances. If set to false, ensures this job's instances are placed on an UltraServer exclusively, with no other jobs sharing the same UltraServer. Default is false.</p>
1620
+ * @public
1621
+ */
1622
+ EnableMultipleJobs?: boolean | undefined;
1623
+ /**
1624
+ * <p>A list of specifications for how instances should be placed on specific UltraServers. Maximum of 10 items is supported.</p>
1625
+ * @public
1626
+ */
1627
+ PlacementSpecifications?: PlacementSpecification[] | undefined;
1628
+ }
1596
1629
  /**
1597
1630
  * <p>Describes the resources, including machine learning (ML) compute instances and ML storage volumes, to use for model training. </p>
1598
1631
  * @public
@@ -1633,6 +1666,11 @@ export interface ResourceConfig {
1633
1666
  * @public
1634
1667
  */
1635
1668
  TrainingPlanArn?: string | undefined;
1669
+ /**
1670
+ * <p>Configuration for how training job instances are placed and allocated within UltraServers. Only applicable for UltraServer capacity.</p>
1671
+ * @public
1672
+ */
1673
+ InstancePlacementConfig?: InstancePlacementConfig | undefined;
1636
1674
  }
1637
1675
  /**
1638
1676
  * <p>Specifies a limit to how long a job can run. When the job reaches the time limit, SageMaker ends the job. Use this API to cap costs.</p> <p>To stop a training job, SageMaker sends the algorithm the <code>SIGTERM</code> signal, which delays job termination for 120 seconds. Algorithms can use this 120-second window to save the model artifacts, so the results of training are not lost. </p> <p>The training algorithms provided by SageMaker automatically save the intermediate results of a model training job when possible. This attempt to save artifacts is only a best effort case as model might not be in a state from which it can be saved. For example, if training has just started, the model might not be ready to save. When saved, this intermediate data is a valid model artifact. You can use it to create a model with <code>CreateModel</code>.</p> <note> <p>The Neural Topic Model (NTM) currently does not support saving intermediate model artifacts. When training NTMs, make sure that the maximum runtime is sufficient for the training job to complete.</p> </note>
@@ -5877,7 +5915,7 @@ export interface ClusterEbsVolumeConfig {
5877
5915
  VolumeSizeInGB?: number | undefined;
5878
5916
  }
5879
5917
  /**
5880
- * <p>Metadata information about a SageMaker HyperPod cluster showing information about the cluster level operations, such as creating, updating, and deleting.</p>
5918
+ * <p>Metadata information about a HyperPod cluster showing information about the cluster level operations, such as creating, updating, and deleting.</p>
5881
5919
  * @public
5882
5920
  */
5883
5921
  export interface ClusterMetadata {
@@ -5887,12 +5925,12 @@ export interface ClusterMetadata {
5887
5925
  */
5888
5926
  FailureMessage?: string | undefined;
5889
5927
  /**
5890
- * <p>A list of Amazon EKS IAM role ARNs associated with the cluster. This is created by SageMaker HyperPod on your behalf and only applies for EKS-orchestrated clusters.</p>
5928
+ * <p>A list of Amazon EKS IAM role ARNs associated with the cluster. This is created by HyperPod on your behalf and only applies for EKS orchestrated clusters.</p>
5891
5929
  * @public
5892
5930
  */
5893
5931
  EksRoleAccessEntries?: string[] | undefined;
5894
5932
  /**
5895
- * <p>The Service-Linked Role (SLR) associated with the cluster. This is created by SageMaker HyperPod on your behalf and only applies for EKS-orchestrated clusters.</p>
5933
+ * <p>The Service-Linked Role (SLR) associated with the cluster. This is created by HyperPod on your behalf and only applies for EKS orchestrated clusters.</p>
5896
5934
  * @public
5897
5935
  */
5898
5936
  SlrAccessEntry?: string | undefined;
@@ -5934,7 +5972,7 @@ export interface InstanceMetadata {
5934
5972
  NodeLogicalId?: string | undefined;
5935
5973
  }
5936
5974
  /**
5937
- * <p>Metadata information about an instance group in a SageMaker HyperPod cluster.</p>
5975
+ * <p>Metadata information about an instance group in a HyperPod cluster.</p>
5938
5976
  * @public
5939
5977
  */
5940
5978
  export interface InstanceGroupMetadata {
@@ -6097,12 +6135,12 @@ export interface ClusterEventDetail {
6097
6135
  */
6098
6136
  EventId: string | undefined;
6099
6137
  /**
6100
- * <p>The Amazon Resource Name (ARN) of the SageMaker HyperPod cluster associated with the event.</p>
6138
+ * <p>The Amazon Resource Name (ARN) of the HyperPod cluster associated with the event.</p>
6101
6139
  * @public
6102
6140
  */
6103
6141
  ClusterArn: string | undefined;
6104
6142
  /**
6105
- * <p>The name of the SageMaker HyperPod cluster associated with the event.</p>
6143
+ * <p>The name of the HyperPod cluster associated with the event.</p>
6106
6144
  * @public
6107
6145
  */
6108
6146
  ClusterName: string | undefined;
@@ -6117,7 +6155,7 @@ export interface ClusterEventDetail {
6117
6155
  */
6118
6156
  InstanceId?: string | undefined;
6119
6157
  /**
6120
- * <p>The type of resource associated with the event. Valid values are "Cluster", "InstanceGroup", or "Instance".</p>
6158
+ * <p>The type of resource associated with the event. Valid values are <code>Cluster</code>, <code>InstanceGroup</code>, or <code>Instance</code>.</p>
6121
6159
  * @public
6122
6160
  */
6123
6161
  ResourceType: ClusterEventResourceType | undefined;
@@ -6138,7 +6176,7 @@ export interface ClusterEventDetail {
6138
6176
  Description?: string | undefined;
6139
6177
  }
6140
6178
  /**
6141
- * <p>A summary of an event in a SageMaker HyperPod cluster.</p>
6179
+ * <p>A summary of an event in a HyperPod cluster.</p>
6142
6180
  * @public
6143
6181
  */
6144
6182
  export interface ClusterEventSummary {
@@ -6148,12 +6186,12 @@ export interface ClusterEventSummary {
6148
6186
  */
6149
6187
  EventId: string | undefined;
6150
6188
  /**
6151
- * <p>The Amazon Resource Name (ARN) of the SageMaker HyperPod cluster associated with the event.</p>
6189
+ * <p>The Amazon Resource Name (ARN) of the HyperPod cluster associated with the event.</p>
6152
6190
  * @public
6153
6191
  */
6154
6192
  ClusterArn: string | undefined;
6155
6193
  /**
6156
- * <p>The name of the SageMaker HyperPod cluster associated with the event.</p>
6194
+ * <p>The name of the HyperPod cluster associated with the event.</p>
6157
6195
  * @public
6158
6196
  */
6159
6197
  ClusterName: string | undefined;
@@ -6163,12 +6201,12 @@ export interface ClusterEventSummary {
6163
6201
  */
6164
6202
  InstanceGroupName?: string | undefined;
6165
6203
  /**
6166
- * <p>The EC2 instance ID associated with the event, if applicable.</p>
6204
+ * <p>The Amazon Elastic Compute Cloud (EC2) instance ID associated with the event, if applicable.</p>
6167
6205
  * @public
6168
6206
  */
6169
6207
  InstanceId?: string | undefined;
6170
6208
  /**
6171
- * <p>The type of resource associated with the event. Valid values are "Cluster", "InstanceGroup", or "Instance".</p>
6209
+ * <p>The type of resource associated with the event. Valid values are <code>Cluster</code>, <code>InstanceGroup</code>, or <code>Instance</code>.</p>
6172
6210
  * @public
6173
6211
  */
6174
6212
  ResourceType: ClusterEventResourceType | undefined;
@@ -6617,6 +6655,17 @@ export interface ClusterInstanceStatusDetails {
6617
6655
  */
6618
6656
  Message?: string | undefined;
6619
6657
  }
6658
+ /**
6659
+ * <p>Contains information about the UltraServer object.</p>
6660
+ * @public
6661
+ */
6662
+ export interface UltraServerInfo {
6663
+ /**
6664
+ * <p>The unique identifier of the UltraServer.</p>
6665
+ * @public
6666
+ */
6667
+ Id?: string | undefined;
6668
+ }
6620
6669
  /**
6621
6670
  * <p>Details of an instance (also called a <i>node</i> interchangeably) in a SageMaker HyperPod cluster.</p>
6622
6671
  * @public
@@ -6707,6 +6756,11 @@ export interface ClusterNodeDetails {
6707
6756
  * @public
6708
6757
  */
6709
6758
  DesiredImageId?: string | undefined;
6759
+ /**
6760
+ * <p>Contains information about the UltraServer.</p>
6761
+ * @public
6762
+ */
6763
+ UltraServerInfo?: UltraServerInfo | undefined;
6710
6764
  }
6711
6765
  /**
6712
6766
  * @public
@@ -6771,6 +6825,11 @@ export interface ClusterNodeSummary {
6771
6825
  * @public
6772
6826
  */
6773
6827
  InstanceStatus: ClusterInstanceStatusDetails | undefined;
6828
+ /**
6829
+ * <p>Contains information about the UltraServer.</p>
6830
+ * @public
6831
+ */
6832
+ UltraServerInfo?: UltraServerInfo | undefined;
6774
6833
  }
6775
6834
  /**
6776
6835
  * <p>The configuration settings for the Amazon EKS cluster used as the orchestrator for the SageMaker HyperPod cluster.</p>
@@ -6996,78 +7055,3 @@ export declare const SchedulerResourceStatus: {
6996
7055
  * @public
6997
7056
  */
6998
7057
  export type SchedulerResourceStatus = (typeof SchedulerResourceStatus)[keyof typeof SchedulerResourceStatus];
6999
- /**
7000
- * <p>Summary of the cluster policy.</p>
7001
- * @public
7002
- */
7003
- export interface ClusterSchedulerConfigSummary {
7004
- /**
7005
- * <p>ARN of the cluster policy.</p>
7006
- * @public
7007
- */
7008
- ClusterSchedulerConfigArn: string | undefined;
7009
- /**
7010
- * <p>ID of the cluster policy.</p>
7011
- * @public
7012
- */
7013
- ClusterSchedulerConfigId: string | undefined;
7014
- /**
7015
- * <p>Version of the cluster policy.</p>
7016
- * @public
7017
- */
7018
- ClusterSchedulerConfigVersion?: number | undefined;
7019
- /**
7020
- * <p>Name of the cluster policy.</p>
7021
- * @public
7022
- */
7023
- Name: string | undefined;
7024
- /**
7025
- * <p>Creation time of the cluster policy.</p>
7026
- * @public
7027
- */
7028
- CreationTime: Date | undefined;
7029
- /**
7030
- * <p>Last modified time of the cluster policy.</p>
7031
- * @public
7032
- */
7033
- LastModifiedTime?: Date | undefined;
7034
- /**
7035
- * <p>Status of the cluster policy.</p>
7036
- * @public
7037
- */
7038
- Status: SchedulerResourceStatus | undefined;
7039
- /**
7040
- * <p>ARN of the cluster.</p>
7041
- * @public
7042
- */
7043
- ClusterArn?: string | undefined;
7044
- }
7045
- /**
7046
- * @public
7047
- * @enum
7048
- */
7049
- export declare const ClusterSortBy: {
7050
- readonly CREATION_TIME: "CREATION_TIME";
7051
- readonly NAME: "NAME";
7052
- };
7053
- /**
7054
- * @public
7055
- */
7056
- export type ClusterSortBy = (typeof ClusterSortBy)[keyof typeof ClusterSortBy];
7057
- /**
7058
- * @public
7059
- * @enum
7060
- */
7061
- export declare const ClusterStatus: {
7062
- readonly CREATING: "Creating";
7063
- readonly DELETING: "Deleting";
7064
- readonly FAILED: "Failed";
7065
- readonly INSERVICE: "InService";
7066
- readonly ROLLINGBACK: "RollingBack";
7067
- readonly SYSTEMUPDATING: "SystemUpdating";
7068
- readonly UPDATING: "Updating";
7069
- };
7070
- /**
7071
- * @public
7072
- */
7073
- export type ClusterStatus = (typeof ClusterStatus)[keyof typeof ClusterStatus];
@@ -1,6 +1,81 @@
1
1
  import { AutomaticJsonStringConversion as __AutomaticJsonStringConversion, ExceptionOptionType as __ExceptionOptionType } from "@smithy/smithy-client";
2
- import { ActionSource, ActionStatus, ActivationState, AdditionalModelDataSource, AdditionalS3DataSource, AlgorithmValidationSpecification, AmazonQSettings, AnnotationConsolidationConfig, AppInstanceType, AppLifecycleManagement, AppNetworkAccessType, AppSecurityGroupManagement, AppType, ArtifactSource, AsyncInferenceConfig, AuthMode, AuthorizedUrl, AutoMLChannel, AutoMLComputeConfig, AutoMLDataSplitConfig, AutoMLJobChannel, AutoMLJobConfig, AutoMLJobObjective, AutoMLOutputDataConfig, AutoMLProblemTypeConfig, AutoMLSecurityConfig, AutoMountHomeEFS, AutoParameter, AutoRollbackConfig, Autotune, AwsManagedHumanLoopRequestSource, BatchTransformInput, BestObjectiveNotImproving, BlueGreenUpdatePolicy, CanvasAppSettings, CapacityReservationPreference, CapacitySize, CaptureContentTypeHeader, CaptureOption, CategoricalParameter, CategoricalParameterRange, CategoricalParameterRangeSpecification, Channel, ChannelSpecification, CheckpointConfig, ClarifyExplainerConfig, ClusterInstanceGroupSpecification, ClusterInstanceType, ClusterNodeProvisioningMode, ClusterNodeRecovery, ClusterOrchestrator, ClusterRestrictedInstanceGroupSpecification, ClusterStatus, CodeEditorAppImageConfig, FeatureStatus, InferenceSpecification, JupyterLabAppImageConfig, KernelGatewayImageConfig, MetricDefinition, ModelDataSource, OutputDataConfig, ProblemType, ProcessingS3DataDistributionType, ProcessingS3InputMode, ProductionVariantInstanceType, ResourceConfig, ResourceSpec, SchedulerResourceStatus, StoppingCondition, Tag, TrainingInputMode, TrainingInstanceType, VpcConfig } from "./models_0";
2
+ import { ActionSource, ActionStatus, ActivationState, AdditionalModelDataSource, AdditionalS3DataSource, AlgorithmValidationSpecification, AmazonQSettings, AnnotationConsolidationConfig, AppInstanceType, AppLifecycleManagement, AppNetworkAccessType, AppSecurityGroupManagement, AppType, ArtifactSource, AsyncInferenceConfig, AuthMode, AuthorizedUrl, AutoMLChannel, AutoMLComputeConfig, AutoMLDataSplitConfig, AutoMLJobChannel, AutoMLJobConfig, AutoMLJobObjective, AutoMLOutputDataConfig, AutoMLProblemTypeConfig, AutoMLSecurityConfig, AutoMountHomeEFS, AutoParameter, AutoRollbackConfig, Autotune, AwsManagedHumanLoopRequestSource, BatchTransformInput, BestObjectiveNotImproving, BlueGreenUpdatePolicy, CanvasAppSettings, CapacityReservationPreference, CapacitySize, CaptureContentTypeHeader, CaptureOption, CategoricalParameter, CategoricalParameterRange, CategoricalParameterRangeSpecification, Channel, ChannelSpecification, CheckpointConfig, ClarifyExplainerConfig, ClusterInstanceGroupSpecification, ClusterInstanceType, ClusterNodeProvisioningMode, ClusterNodeRecovery, ClusterOrchestrator, ClusterRestrictedInstanceGroupSpecification, CodeEditorAppImageConfig, FeatureStatus, InferenceSpecification, JupyterLabAppImageConfig, KernelGatewayImageConfig, MetricDefinition, ModelDataSource, OutputDataConfig, ProblemType, ProcessingS3DataDistributionType, ProcessingS3InputMode, ProductionVariantInstanceType, ResourceConfig, ResourceSpec, SchedulerResourceStatus, StoppingCondition, Tag, TrainingInputMode, TrainingInstanceType, VpcConfig } from "./models_0";
3
3
  import { SageMakerServiceException as __BaseException } from "./SageMakerServiceException";
4
+ /**
5
+ * <p>Summary of the cluster policy.</p>
6
+ * @public
7
+ */
8
+ export interface ClusterSchedulerConfigSummary {
9
+ /**
10
+ * <p>ARN of the cluster policy.</p>
11
+ * @public
12
+ */
13
+ ClusterSchedulerConfigArn: string | undefined;
14
+ /**
15
+ * <p>ID of the cluster policy.</p>
16
+ * @public
17
+ */
18
+ ClusterSchedulerConfigId: string | undefined;
19
+ /**
20
+ * <p>Version of the cluster policy.</p>
21
+ * @public
22
+ */
23
+ ClusterSchedulerConfigVersion?: number | undefined;
24
+ /**
25
+ * <p>Name of the cluster policy.</p>
26
+ * @public
27
+ */
28
+ Name: string | undefined;
29
+ /**
30
+ * <p>Creation time of the cluster policy.</p>
31
+ * @public
32
+ */
33
+ CreationTime: Date | undefined;
34
+ /**
35
+ * <p>Last modified time of the cluster policy.</p>
36
+ * @public
37
+ */
38
+ LastModifiedTime?: Date | undefined;
39
+ /**
40
+ * <p>Status of the cluster policy.</p>
41
+ * @public
42
+ */
43
+ Status: SchedulerResourceStatus | undefined;
44
+ /**
45
+ * <p>ARN of the cluster.</p>
46
+ * @public
47
+ */
48
+ ClusterArn?: string | undefined;
49
+ }
50
+ /**
51
+ * @public
52
+ * @enum
53
+ */
54
+ export declare const ClusterSortBy: {
55
+ readonly CREATION_TIME: "CREATION_TIME";
56
+ readonly NAME: "NAME";
57
+ };
58
+ /**
59
+ * @public
60
+ */
61
+ export type ClusterSortBy = (typeof ClusterSortBy)[keyof typeof ClusterSortBy];
62
+ /**
63
+ * @public
64
+ * @enum
65
+ */
66
+ export declare const ClusterStatus: {
67
+ readonly CREATING: "Creating";
68
+ readonly DELETING: "Deleting";
69
+ readonly FAILED: "Failed";
70
+ readonly INSERVICE: "InService";
71
+ readonly ROLLINGBACK: "RollingBack";
72
+ readonly SYSTEMUPDATING: "SystemUpdating";
73
+ readonly UPDATING: "Updating";
74
+ };
75
+ /**
76
+ * @public
77
+ */
78
+ export type ClusterStatus = (typeof ClusterStatus)[keyof typeof ClusterStatus];
4
79
  /**
5
80
  * <p>Lists a summary of the properties of a SageMaker HyperPod cluster.</p>
6
81
  * @public
@@ -1554,7 +1629,7 @@ export interface CreateClusterRequest {
1554
1629
  */
1555
1630
  Tags?: Tag[] | undefined;
1556
1631
  /**
1557
- * <p>The type of orchestrator to use for the SageMaker HyperPod cluster. Currently, the only supported value is <code>"eks"</code>, which is to use an Amazon Elastic Kubernetes Service (EKS) cluster as the orchestrator.</p>
1632
+ * <p>The type of orchestrator to use for the SageMaker HyperPod cluster. Currently, the only supported value is <code>"eks"</code>, which is to use an Amazon Elastic Kubernetes Service cluster as the orchestrator.</p>
1558
1633
  * @public
1559
1634
  */
1560
1635
  Orchestrator?: ClusterOrchestrator | undefined;
@@ -6790,90 +6865,3 @@ export interface ModelBiasBaselineConfig {
6790
6865
  */
6791
6866
  ConstraintsResource?: MonitoringConstraintsResource | undefined;
6792
6867
  }
6793
- /**
6794
- * <p>The ground truth labels for the dataset used for the monitoring job.</p>
6795
- * @public
6796
- */
6797
- export interface MonitoringGroundTruthS3Input {
6798
- /**
6799
- * <p>The address of the Amazon S3 location of the ground truth labels.</p>
6800
- * @public
6801
- */
6802
- S3Uri?: string | undefined;
6803
- }
6804
- /**
6805
- * <p>Inputs for the model bias job.</p>
6806
- * @public
6807
- */
6808
- export interface ModelBiasJobInput {
6809
- /**
6810
- * <p>Input object for the endpoint</p>
6811
- * @public
6812
- */
6813
- EndpointInput?: EndpointInput | undefined;
6814
- /**
6815
- * <p>Input object for the batch transform job.</p>
6816
- * @public
6817
- */
6818
- BatchTransformInput?: BatchTransformInput | undefined;
6819
- /**
6820
- * <p>Location of ground truth labels to use in model bias job.</p>
6821
- * @public
6822
- */
6823
- GroundTruthS3Input: MonitoringGroundTruthS3Input | undefined;
6824
- }
6825
- /**
6826
- * @public
6827
- */
6828
- export interface CreateModelBiasJobDefinitionRequest {
6829
- /**
6830
- * <p>The name of the bias job definition. The name must be unique within an Amazon Web Services Region in the Amazon Web Services account.</p>
6831
- * @public
6832
- */
6833
- JobDefinitionName: string | undefined;
6834
- /**
6835
- * <p>The baseline configuration for a model bias job.</p>
6836
- * @public
6837
- */
6838
- ModelBiasBaselineConfig?: ModelBiasBaselineConfig | undefined;
6839
- /**
6840
- * <p>Configures the model bias job to run a specified Docker container image.</p>
6841
- * @public
6842
- */
6843
- ModelBiasAppSpecification: ModelBiasAppSpecification | undefined;
6844
- /**
6845
- * <p>Inputs for the model bias job.</p>
6846
- * @public
6847
- */
6848
- ModelBiasJobInput: ModelBiasJobInput | undefined;
6849
- /**
6850
- * <p>The output configuration for monitoring jobs.</p>
6851
- * @public
6852
- */
6853
- ModelBiasJobOutputConfig: MonitoringOutputConfig | undefined;
6854
- /**
6855
- * <p>Identifies the resources to deploy for a monitoring job.</p>
6856
- * @public
6857
- */
6858
- JobResources: MonitoringResources | undefined;
6859
- /**
6860
- * <p>Networking options for a model bias job.</p>
6861
- * @public
6862
- */
6863
- NetworkConfig?: MonitoringNetworkConfig | undefined;
6864
- /**
6865
- * <p>The Amazon Resource Name (ARN) of an IAM role that Amazon SageMaker AI can assume to perform tasks on your behalf.</p>
6866
- * @public
6867
- */
6868
- RoleArn: string | undefined;
6869
- /**
6870
- * <p>A time limit for how long the monitoring job is allowed to run before stopping.</p>
6871
- * @public
6872
- */
6873
- StoppingCondition?: MonitoringStoppingCondition | undefined;
6874
- /**
6875
- * <p>(Optional) An array of key-value pairs. For more information, see <a href="https://docs.aws.amazon.com/awsaccountbilling/latest/aboutv2/cost-alloc-tags.html#allocation-whatURL"> Using Cost Allocation Tags</a> in the <i>Amazon Web Services Billing and Cost Management User Guide</i>.</p>
6876
- * @public
6877
- */
6878
- Tags?: Tag[] | undefined;
6879
- }
@@ -1,5 +1,92 @@
1
- import { ActionSource, ActionStatus, ActivationState, AdditionalInferenceSpecificationDefinition, AlgorithmSpecification, AlgorithmStatus, AlgorithmStatusDetails, AlgorithmValidationSpecification, AppSpecification, AppStatus, AppType, ArtifactSource, AthenaDatasetDefinition, AutoMLCandidate, AutoMLChannel, AutoMLComputeConfig, AutoMLDataSplitConfig, AutoMLJobArtifacts, AutoMLJobChannel, AutoMLJobCompletionCriteria, AutoMLJobConfig, AutoMLJobObjective, AutoMLJobSecondaryStatus, AutoMLJobStatus, AutoMLOutputDataConfig, AutoMLPartialFailureReason, AutoMLProblemTypeConfig, AutoMLProblemTypeConfigName, AutoMLResolvedAttributes, AutoMLSecurityConfig, BatchDataCaptureConfig, BatchStrategy, BatchTransformInput, Bias, CaptureStatus, CfnCreateTemplateProvider, Channel, CheckpointConfig, ClusterEventDetail, ClusterInstanceGroupDetails, ClusterNodeDetails, ClusterNodeProvisioningMode, ClusterNodeRecovery, ClusterOrchestrator, ClusterRestrictedInstanceGroupDetails, ClusterStatus, CodeEditorAppImageConfig, FeatureStatus, InferenceSpecification, JupyterLabAppImageConfig, KernelGatewayImageConfig, MetricsSource, ModelApprovalStatus, ModelDataSource, OutputDataConfig, ProblemType, ProcessingS3DataDistributionType, ProcessingS3InputMode, ProductionVariantInstanceType, ResourceConfig, ResourceSpec, SchedulerResourceStatus, StoppingCondition, Tag, TransformInput, TransformJobDefinition, TransformOutput, TransformResources, UserContext, VpcConfig } from "./models_0";
2
- import { _InstanceType, CodeRepository, CognitoConfig, CognitoMemberDefinition, CollectionConfiguration, CompilationJobStatus, ComputeQuotaConfig, ComputeQuotaTarget, DeviceSelectionConfig, EdgeDeploymentConfig, EndpointInput, GitConfig, HubContentType, InputConfig, JupyterServerAppSettings, KernelGatewayAppSettings, MetadataProperties, ModelDeployConfig, MonitoringConstraintsResource, MonitoringGroundTruthS3Input, MonitoringNetworkConfig, MonitoringOutputConfig, MonitoringResources, MonitoringStatisticsResource, MonitoringStoppingCondition, NeoVpcConfig, OutputConfig, ProcessingInstanceType, ProcessingS3UploadMode, RetryStrategy, SchedulerConfig, TrainingSpecification, UserSettings } from "./models_1";
1
+ import { ActionSource, ActionStatus, AdditionalInferenceSpecificationDefinition, AlgorithmSpecification, AlgorithmStatus, AlgorithmStatusDetails, AlgorithmValidationSpecification, AppSpecification, AppStatus, AppType, ArtifactSource, AthenaDatasetDefinition, AutoMLCandidate, AutoMLChannel, AutoMLComputeConfig, AutoMLDataSplitConfig, AutoMLJobArtifacts, AutoMLJobChannel, AutoMLJobCompletionCriteria, AutoMLJobConfig, AutoMLJobObjective, AutoMLJobSecondaryStatus, AutoMLJobStatus, AutoMLOutputDataConfig, AutoMLPartialFailureReason, AutoMLProblemTypeConfig, AutoMLProblemTypeConfigName, AutoMLResolvedAttributes, AutoMLSecurityConfig, BatchDataCaptureConfig, BatchStrategy, BatchTransformInput, Bias, CaptureStatus, CfnCreateTemplateProvider, Channel, CheckpointConfig, ClusterEventDetail, ClusterInstanceGroupDetails, ClusterNodeDetails, ClusterNodeProvisioningMode, ClusterNodeRecovery, ClusterOrchestrator, ClusterRestrictedInstanceGroupDetails, CodeEditorAppImageConfig, FeatureStatus, InferenceSpecification, JupyterLabAppImageConfig, KernelGatewayImageConfig, MetricsSource, ModelApprovalStatus, ModelDataSource, OutputDataConfig, ProblemType, ProcessingS3DataDistributionType, ProcessingS3InputMode, ProductionVariantInstanceType, ResourceConfig, ResourceSpec, SchedulerResourceStatus, StoppingCondition, Tag, TransformInput, TransformJobDefinition, TransformOutput, TransformResources, UserContext, VpcConfig } from "./models_0";
2
+ import { _InstanceType, ClusterStatus, CodeRepository, CognitoConfig, CognitoMemberDefinition, CollectionConfiguration, CompilationJobStatus, DeviceSelectionConfig, EdgeDeploymentConfig, EndpointInput, GitConfig, HubContentType, InputConfig, JupyterServerAppSettings, KernelGatewayAppSettings, MetadataProperties, ModelBiasAppSpecification, ModelBiasBaselineConfig, ModelDeployConfig, MonitoringConstraintsResource, MonitoringNetworkConfig, MonitoringOutputConfig, MonitoringResources, MonitoringStatisticsResource, MonitoringStoppingCondition, NeoVpcConfig, OutputConfig, ProcessingInstanceType, ProcessingS3UploadMode, RetryStrategy, SchedulerConfig, TrainingSpecification, UserSettings } from "./models_1";
3
+ /**
4
+ * <p>The ground truth labels for the dataset used for the monitoring job.</p>
5
+ * @public
6
+ */
7
+ export interface MonitoringGroundTruthS3Input {
8
+ /**
9
+ * <p>The address of the Amazon S3 location of the ground truth labels.</p>
10
+ * @public
11
+ */
12
+ S3Uri?: string | undefined;
13
+ }
14
+ /**
15
+ * <p>Inputs for the model bias job.</p>
16
+ * @public
17
+ */
18
+ export interface ModelBiasJobInput {
19
+ /**
20
+ * <p>Input object for the endpoint</p>
21
+ * @public
22
+ */
23
+ EndpointInput?: EndpointInput | undefined;
24
+ /**
25
+ * <p>Input object for the batch transform job.</p>
26
+ * @public
27
+ */
28
+ BatchTransformInput?: BatchTransformInput | undefined;
29
+ /**
30
+ * <p>Location of ground truth labels to use in model bias job.</p>
31
+ * @public
32
+ */
33
+ GroundTruthS3Input: MonitoringGroundTruthS3Input | undefined;
34
+ }
35
+ /**
36
+ * @public
37
+ */
38
+ export interface CreateModelBiasJobDefinitionRequest {
39
+ /**
40
+ * <p>The name of the bias job definition. The name must be unique within an Amazon Web Services Region in the Amazon Web Services account.</p>
41
+ * @public
42
+ */
43
+ JobDefinitionName: string | undefined;
44
+ /**
45
+ * <p>The baseline configuration for a model bias job.</p>
46
+ * @public
47
+ */
48
+ ModelBiasBaselineConfig?: ModelBiasBaselineConfig | undefined;
49
+ /**
50
+ * <p>Configures the model bias job to run a specified Docker container image.</p>
51
+ * @public
52
+ */
53
+ ModelBiasAppSpecification: ModelBiasAppSpecification | undefined;
54
+ /**
55
+ * <p>Inputs for the model bias job.</p>
56
+ * @public
57
+ */
58
+ ModelBiasJobInput: ModelBiasJobInput | undefined;
59
+ /**
60
+ * <p>The output configuration for monitoring jobs.</p>
61
+ * @public
62
+ */
63
+ ModelBiasJobOutputConfig: MonitoringOutputConfig | undefined;
64
+ /**
65
+ * <p>Identifies the resources to deploy for a monitoring job.</p>
66
+ * @public
67
+ */
68
+ JobResources: MonitoringResources | undefined;
69
+ /**
70
+ * <p>Networking options for a model bias job.</p>
71
+ * @public
72
+ */
73
+ NetworkConfig?: MonitoringNetworkConfig | undefined;
74
+ /**
75
+ * <p>The Amazon Resource Name (ARN) of an IAM role that Amazon SageMaker AI can assume to perform tasks on your behalf.</p>
76
+ * @public
77
+ */
78
+ RoleArn: string | undefined;
79
+ /**
80
+ * <p>A time limit for how long the monitoring job is allowed to run before stopping.</p>
81
+ * @public
82
+ */
83
+ StoppingCondition?: MonitoringStoppingCondition | undefined;
84
+ /**
85
+ * <p>(Optional) An array of key-value pairs. For more information, see <a href="https://docs.aws.amazon.com/awsaccountbilling/latest/aboutv2/cost-alloc-tags.html#allocation-whatURL"> Using Cost Allocation Tags</a> in the <i>Amazon Web Services Billing and Cost Management User Guide</i>.</p>
86
+ * @public
87
+ */
88
+ Tags?: Tag[] | undefined;
89
+ }
3
90
  /**
4
91
  * @public
5
92
  */
@@ -3145,6 +3232,11 @@ export interface CreateTrainingPlanRequest {
3145
3232
  * @public
3146
3233
  */
3147
3234
  TrainingPlanOfferingId: string | undefined;
3235
+ /**
3236
+ * <p>Number of spare instances to reserve per UltraServer for enhanced resiliency. Default is 1.</p>
3237
+ * @public
3238
+ */
3239
+ SpareInstanceCountPerUltraServer?: number | undefined;
3148
3240
  /**
3149
3241
  * <p>An array of key-value pairs to apply to this training plan.</p>
3150
3242
  * @public
@@ -5998,111 +6090,6 @@ export interface DescribeCompilationJobResponse {
5998
6090
  */
5999
6091
  DerivedInformation?: DerivedInformation | undefined;
6000
6092
  }
6001
- /**
6002
- * @public
6003
- */
6004
- export interface DescribeComputeQuotaRequest {
6005
- /**
6006
- * <p>ID of the compute allocation definition.</p>
6007
- * @public
6008
- */
6009
- ComputeQuotaId: string | undefined;
6010
- /**
6011
- * <p>Version of the compute allocation definition.</p>
6012
- * @public
6013
- */
6014
- ComputeQuotaVersion?: number | undefined;
6015
- }
6016
- /**
6017
- * @public
6018
- */
6019
- export interface DescribeComputeQuotaResponse {
6020
- /**
6021
- * <p>ARN of the compute allocation definition.</p>
6022
- * @public
6023
- */
6024
- ComputeQuotaArn: string | undefined;
6025
- /**
6026
- * <p>ID of the compute allocation definition.</p>
6027
- * @public
6028
- */
6029
- ComputeQuotaId: string | undefined;
6030
- /**
6031
- * <p>Name of the compute allocation definition.</p>
6032
- * @public
6033
- */
6034
- Name: string | undefined;
6035
- /**
6036
- * <p>Description of the compute allocation definition.</p>
6037
- * @public
6038
- */
6039
- Description?: string | undefined;
6040
- /**
6041
- * <p>Version of the compute allocation definition.</p>
6042
- * @public
6043
- */
6044
- ComputeQuotaVersion: number | undefined;
6045
- /**
6046
- * <p>Status of the compute allocation definition.</p>
6047
- * @public
6048
- */
6049
- Status: SchedulerResourceStatus | undefined;
6050
- /**
6051
- * <p>Failure reason of the compute allocation definition.</p>
6052
- * @public
6053
- */
6054
- FailureReason?: string | undefined;
6055
- /**
6056
- * <p>ARN of the cluster.</p>
6057
- * @public
6058
- */
6059
- ClusterArn?: string | undefined;
6060
- /**
6061
- * <p>Configuration of the compute allocation definition. This includes the resource sharing option, and the setting to preempt low priority tasks.</p>
6062
- * @public
6063
- */
6064
- ComputeQuotaConfig?: ComputeQuotaConfig | undefined;
6065
- /**
6066
- * <p>The target entity to allocate compute resources to.</p>
6067
- * @public
6068
- */
6069
- ComputeQuotaTarget: ComputeQuotaTarget | undefined;
6070
- /**
6071
- * <p>The state of the compute allocation being described. Use to enable or disable compute allocation.</p> <p>Default is <code>Enabled</code>.</p>
6072
- * @public
6073
- */
6074
- ActivationState?: ActivationState | undefined;
6075
- /**
6076
- * <p>Creation time of the compute allocation configuration.</p>
6077
- * @public
6078
- */
6079
- CreationTime: Date | undefined;
6080
- /**
6081
- * <p>Information about the user who created or modified a SageMaker resource.</p>
6082
- * @public
6083
- */
6084
- CreatedBy?: UserContext | undefined;
6085
- /**
6086
- * <p>Last modified time of the compute allocation configuration.</p>
6087
- * @public
6088
- */
6089
- LastModifiedTime?: Date | undefined;
6090
- /**
6091
- * <p>Information about the user who created or modified a SageMaker resource.</p>
6092
- * @public
6093
- */
6094
- LastModifiedBy?: UserContext | undefined;
6095
- }
6096
- /**
6097
- * @public
6098
- */
6099
- export interface DescribeContextRequest {
6100
- /**
6101
- * <p>The name of the context to describe.</p>
6102
- * @public
6103
- */
6104
- ContextName: string | undefined;
6105
- }
6106
6093
  /**
6107
6094
  * @internal
6108
6095
  */