@aws-sdk/client-sagemaker 3.1062.0 → 3.1063.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (27) hide show
  1. package/dist-cjs/schemas/schemas_0.js +64 -58
  2. package/dist-es/schemas/schemas_0.js +25 -19
  3. package/dist-types/commands/CreateAIBenchmarkJobCommand.d.ts +5 -0
  4. package/dist-types/commands/CreateAIRecommendationJobCommand.d.ts +5 -0
  5. package/dist-types/commands/DescribeAIBenchmarkJobCommand.d.ts +5 -0
  6. package/dist-types/commands/DescribeAIRecommendationJobCommand.d.ts +5 -0
  7. package/dist-types/commands/DescribeInferenceComponentCommand.d.ts +1 -2
  8. package/dist-types/commands/ListInferenceRecommendationsJobStepsCommand.d.ts +1 -2
  9. package/dist-types/commands/UpdateNotebookInstanceCommand.d.ts +2 -1
  10. package/dist-types/models/models_0.d.ts +41 -16
  11. package/dist-types/models/models_1.d.ts +17 -17
  12. package/dist-types/models/models_2.d.ts +18 -12
  13. package/dist-types/models/models_3.d.ts +10 -30
  14. package/dist-types/models/models_4.d.ts +33 -8
  15. package/dist-types/models/models_5.d.ts +5 -0
  16. package/dist-types/schemas/schemas_0.d.ts +1 -0
  17. package/dist-types/ts3.4/commands/DescribeInferenceComponentCommand.d.ts +4 -2
  18. package/dist-types/ts3.4/commands/ListInferenceRecommendationsJobStepsCommand.d.ts +4 -2
  19. package/dist-types/ts3.4/commands/UpdateNotebookInstanceCommand.d.ts +2 -4
  20. package/dist-types/ts3.4/models/models_0.d.ts +9 -4
  21. package/dist-types/ts3.4/models/models_1.d.ts +4 -5
  22. package/dist-types/ts3.4/models/models_2.d.ts +5 -5
  23. package/dist-types/ts3.4/models/models_3.d.ts +3 -7
  24. package/dist-types/ts3.4/models/models_4.d.ts +10 -2
  25. package/dist-types/ts3.4/models/models_5.d.ts +1 -0
  26. package/dist-types/ts3.4/schemas/schemas_0.d.ts +1 -0
  27. package/package.json +5 -5
@@ -66,6 +66,7 @@ const _AICp = "AppImageConfigs";
66
66
  const _AICv = "AvailableInstanceCount";
67
67
  const _AIDC = "AIDatasetConfig";
68
68
  const _AIL = "AssociationInfoList";
69
+ const _AIMC = "AIMlflowConfig";
69
70
  const _AIMS = "AIModelSource";
70
71
  const _AIMSS = "AIModelSourceS3";
71
72
  const _AINC = "AsyncInferenceNotificationConfig";
@@ -2263,7 +2264,7 @@ const _MBC = "MonitoringBaselineConfig";
2263
2264
  const _MBJI = "ModelBiasJobInput";
2264
2265
  const _MBJOC = "ModelBiasJobOutputConfig";
2265
2266
  const _MBS = "MaximumBatchSize";
2266
- const _MC = "MaxCandidates";
2267
+ const _MC = "MlflowConfig";
2267
2268
  const _MCA = "ModelCardArn";
2268
2269
  const _MCC = "ModelCardContent";
2269
2270
  const _MCCo = "ModelClientConfig";
@@ -2293,14 +2294,14 @@ const _MCTC = "MaxConcurrentTaskCount";
2293
2294
  const _MCV = "ModelCardVersion";
2294
2295
  const _MCVS = "ModelCardVersionSummary";
2295
2296
  const _MCVSL = "ModelCardVersionSummaryList";
2296
- const _MCa = "ManagedConfiguration";
2297
+ const _MCa = "MaxCandidates";
2297
2298
  const _MCai = "MaintenanceConfig";
2299
+ const _MCan = "ManagedConfiguration";
2298
2300
  const _MCax = "MaxCapacity";
2299
2301
  const _MCaxo = "MaxConcurrency";
2300
2302
  const _MCe = "MetricsConfig";
2301
2303
  const _MCi = "MinCount";
2302
2304
  const _MCin = "MinCapacity";
2303
- const _MCl = "MlflowConfig";
2304
2305
  const _MCo = "ModelConfigs";
2305
2306
  const _MCod = "ModelCard";
2306
2307
  const _MCode = "ModelConfiguration";
@@ -3820,13 +3821,13 @@ export var AIBenchmarkNetworkConfig$ = [3, n0, _AIBNC,
3820
3821
  ];
3821
3822
  export var AIBenchmarkOutputConfig$ = [3, n0, _AIBOC,
3822
3823
  0,
3823
- [_SOL],
3824
- [0], 1
3824
+ [_SOL, _MC],
3825
+ [0, () => AIMlflowConfig$], 1
3825
3826
  ];
3826
3827
  export var AIBenchmarkOutputResult$ = [3, n0, _AIBOR,
3827
3828
  0,
3828
- [_SOL, _CWL],
3829
- [0, () => AICloudWatchLogsList], 1
3829
+ [_SOL, _CWL, _MC],
3830
+ [0, () => AICloudWatchLogsList, () => AIMlflowConfig$], 1
3830
3831
  ];
3831
3832
  export var AICapacityReservationConfig$ = [3, n0, _AICRC,
3832
3833
  0,
@@ -3838,6 +3839,11 @@ export var AICloudWatchLogs$ = [3, n0, _AICWL,
3838
3839
  [_LGA, _LSN],
3839
3840
  [0, 0]
3840
3841
  ];
3842
+ export var AIMlflowConfig$ = [3, n0, _AIMC,
3843
+ 0,
3844
+ [_MRAl, _MEN, _MRN],
3845
+ [0, 0, 0], 1
3846
+ ];
3841
3847
  export var AIModelSourceS3$ = [3, n0, _AIMSS,
3842
3848
  0,
3843
3849
  [_SUr],
@@ -3895,13 +3901,13 @@ export var AIRecommendationOptimizationDetail$ = [3, n0, _AIROD,
3895
3901
  ];
3896
3902
  export var AIRecommendationOutputConfig$ = [3, n0, _AIROC,
3897
3903
  0,
3898
- [_SOL, _MPGI],
3899
- [0, 0]
3904
+ [_SOL, _MPGI, _MC],
3905
+ [0, 0, () => AIMlflowConfig$]
3900
3906
  ];
3901
3907
  export var AIRecommendationOutputResult$ = [3, n0, _AIROR,
3902
3908
  0,
3903
- [_SOL, _MPGI],
3904
- [0, 0], 1
3909
+ [_SOL, _MPGI, _MC],
3910
+ [0, 0, () => AIMlflowConfig$], 1
3905
3911
  ];
3906
3912
  export var AIRecommendationPerformanceMetric$ = [3, n0, _AIRPM,
3907
3913
  0,
@@ -4140,7 +4146,7 @@ export var AutoMLJobChannel$ = [3, n0, _AMLJC,
4140
4146
  ];
4141
4147
  export var AutoMLJobCompletionCriteria$ = [3, n0, _AMLJCC,
4142
4148
  0,
4143
- [_MC, _MRPTJIS, _MAMLJRIS],
4149
+ [_MCa, _MRPTJIS, _MAMLJRIS],
4144
4150
  [1, 1, 1]
4145
4151
  ];
4146
4152
  export var AutoMLJobConfig$ = [3, n0, _AMLJCu,
@@ -5255,7 +5261,7 @@ export var CreateModelOutput$ = [3, n0, _CMO,
5255
5261
  ];
5256
5262
  export var CreateModelPackageGroupInput$ = [3, n0, _CMPGI,
5257
5263
  0,
5258
- [_MPGN, _MPGD, _Ta, _MCa],
5264
+ [_MPGN, _MPGD, _Ta, _MCan],
5259
5265
  [0, 0, () => TagList, () => ManagedConfiguration$], 1
5260
5266
  ];
5261
5267
  export var CreateModelPackageGroupOutput$ = [3, n0, _CMPGO,
@@ -5440,7 +5446,7 @@ export var CreateTemplateProvider$ = [3, n0, _CTP,
5440
5446
  ];
5441
5447
  export var CreateTrainingJobRequest$ = [3, n0, _CTJR,
5442
5448
  0,
5443
- [_TJN, _RAo, _ODC, _HP, _ASl, _IDC, _RCe, _VC, _SCt, _Ta, _ENI, _EICTE, _EMST, _CCh, _DHC, _DRC, _TBOC, _ECxp, _PCr, _PRC, _E, _RSe, _RDC, _ICC, _SCC, _SJC, _MCl, _MPC],
5449
+ [_TJN, _RAo, _ODC, _HP, _ASl, _IDC, _RCe, _VC, _SCt, _Ta, _ENI, _EICTE, _EMST, _CCh, _DHC, _DRC, _TBOC, _ECxp, _PCr, _PRC, _E, _RSe, _RDC, _ICC, _SCC, _SJC, _MC, _MPC],
5444
5450
  [0, 0, () => OutputDataConfig$, 128 | 0, () => AlgorithmSpecification$, () => InputDataConfig, () => ResourceConfig$, () => VpcConfig$, () => StoppingCondition$, () => TagList, 2, 2, 2, () => CheckpointConfig$, () => DebugHookConfig$, () => DebugRuleConfigurations, () => TensorBoardOutputConfig$, () => ExperimentConfig$, () => ProfilerConfig$, () => ProfilerRuleConfigurations, 128 | 0, () => RetryStrategy$, () => RemoteDebugConfig$, () => InfraCheckConfig$, () => SessionChainingConfig$, () => ServerlessJobConfig$, () => MlflowConfig$, () => ModelPackageConfig$], 3
5445
5451
  ];
5446
5452
  export var CreateTrainingJobResponse$ = [3, n0, _CTJRr,
@@ -6590,7 +6596,7 @@ export var DescribeModelPackageGroupInput$ = [3, n0, _DMPGIe,
6590
6596
  ];
6591
6597
  export var DescribeModelPackageGroupOutput$ = [3, n0, _DMPGO,
6592
6598
  0,
6593
- [_MPGN, _MPGA, _CT, _CB, _MPGS, _MPGD, _MCa],
6599
+ [_MPGN, _MPGA, _CT, _CB, _MPGS, _MPGD, _MCan],
6594
6600
  [0, 0, 4, () => UserContext$, 0, 0, () => ManagedConfiguration$], 5
6595
6601
  ];
6596
6602
  export var DescribeModelPackageInput$ = [3, n0, _DMPIe,
@@ -6760,7 +6766,7 @@ export var DescribeTrainingJobRequest$ = [3, n0, _DTJRe,
6760
6766
  ];
6761
6767
  export var DescribeTrainingJobResponse$ = [3, n0, _DTJRes,
6762
6768
  0,
6763
- [_TJN, _TJA, _MAo, _TJS, _SSe, _SCt, _CT, _TJAu, _LJA, _AMLJAu, _FR, _HP, _ASl, _RAo, _IDC, _ODC, _RCe, _WPS, _VC, _TST, _TET, _LMT, _SST, _FMDL, _ENI, _EICTE, _EMST, _CCh, _TTIS, _BTIS, _BTC, _DHC, _ECxp, _DRC, _TBOC, _DRESe, _PCr, _PRC, _PRES, _PSro, _E, _RSe, _RDC, _ICC, _SJC, _MCl, _MPC, _MDl, _PIrog, _OMPA],
6769
+ [_TJN, _TJA, _MAo, _TJS, _SSe, _SCt, _CT, _TJAu, _LJA, _AMLJAu, _FR, _HP, _ASl, _RAo, _IDC, _ODC, _RCe, _WPS, _VC, _TST, _TET, _LMT, _SST, _FMDL, _ENI, _EICTE, _EMST, _CCh, _TTIS, _BTIS, _BTC, _DHC, _ECxp, _DRC, _TBOC, _DRESe, _PCr, _PRC, _PRES, _PSro, _E, _RSe, _RDC, _ICC, _SJC, _MC, _MPC, _MDl, _PIrog, _OMPA],
6764
6770
  [0, 0, () => ModelArtifacts$, 0, 0, () => StoppingCondition$, 4, 0, 0, 0, 0, 128 | 0, () => AlgorithmSpecification$, 0, () => InputDataConfig, () => OutputDataConfig$, () => ResourceConfig$, () => WarmPoolStatus$, () => VpcConfig$, 4, 4, 4, () => SecondaryStatusTransitions, () => FinalMetricDataList, 2, 2, 2, () => CheckpointConfig$, 1, 1, 1, () => DebugHookConfig$, () => ExperimentConfig$, () => DebugRuleConfigurations, () => TensorBoardOutputConfig$, () => DebugRuleEvaluationStatuses, () => ProfilerConfig$, () => ProfilerRuleConfigurations, () => ProfilerRuleEvaluationStatuses, 0, 128 | 0, () => RetryStrategy$, () => RemoteDebugConfig$, () => InfraCheckConfig$, () => ServerlessJobConfig$, () => MlflowConfig$, () => ModelPackageConfig$, () => MlflowDetails$, () => TrainingProgressInfo$, 0], 7
6765
6771
  ];
6766
6772
  export var DescribeTrainingPlanExtensionHistoryRequest$ = [3, n0, _DTPEHR,
@@ -8803,7 +8809,7 @@ export var ListWorkteamsResponse$ = [3, n0, _LWRist,
8803
8809
  [_Work, _NTe],
8804
8810
  [() => Workteams, 0], 1
8805
8811
  ];
8806
- export var ManagedConfiguration$ = [3, n0, _MCa,
8812
+ export var ManagedConfiguration$ = [3, n0, _MCan,
8807
8813
  0,
8808
8814
  [_MST],
8809
8815
  [0]
@@ -8848,7 +8854,7 @@ export var MlflowAppSummary$ = [3, n0, _MASl,
8848
8854
  [_Ar, _N, _St, _CT, _LMT, _MVl],
8849
8855
  [0, 0, 0, 4, 4, 0]
8850
8856
  ];
8851
- export var MlflowConfig$ = [3, n0, _MCl,
8857
+ export var MlflowConfig$ = [3, n0, _MC,
8852
8858
  0,
8853
8859
  [_MRAl, _MEN, _MRN],
8854
8860
  [0, 0, 0], 1
@@ -9070,7 +9076,7 @@ export var ModelPackageGroup$ = [3, n0, _MPG,
9070
9076
  ];
9071
9077
  export var ModelPackageGroupSummary$ = [3, n0, _MPGSo,
9072
9078
  0,
9073
- [_MPGN, _MPGA, _CT, _MPGS, _MPGD, _MCa],
9079
+ [_MPGN, _MPGA, _CT, _MPGS, _MPGD, _MCan],
9074
9080
  [0, 0, 4, 0, 0, () => ManagedConfiguration$], 4
9075
9081
  ];
9076
9082
  export var ModelPackageModelCard$ = [3, n0, _MPMC,
@@ -53,6 +53,11 @@ declare const CreateAIBenchmarkJobCommand_base: {
53
53
  * },
54
54
  * OutputConfig: { // AIBenchmarkOutputConfig
55
55
  * S3OutputLocation: "STRING_VALUE", // required
56
+ * MlflowConfig: { // AIMlflowConfig
57
+ * MlflowResourceArn: "STRING_VALUE", // required
58
+ * MlflowExperimentName: "STRING_VALUE",
59
+ * MlflowRunName: "STRING_VALUE",
60
+ * },
56
61
  * },
57
62
  * AIWorkloadConfigIdentifier: "STRING_VALUE", // required
58
63
  * RoleArn: "STRING_VALUE", // required
@@ -48,6 +48,11 @@ declare const CreateAIRecommendationJobCommand_base: {
48
48
  * OutputConfig: { // AIRecommendationOutputConfig
49
49
  * S3OutputLocation: "STRING_VALUE",
50
50
  * ModelPackageGroupIdentifier: "STRING_VALUE",
51
+ * MlflowConfig: { // AIMlflowConfig
52
+ * MlflowResourceArn: "STRING_VALUE", // required
53
+ * MlflowExperimentName: "STRING_VALUE",
54
+ * MlflowRunName: "STRING_VALUE",
55
+ * },
51
56
  * },
52
57
  * AIWorkloadConfigIdentifier: "STRING_VALUE", // required
53
58
  * PerformanceTarget: { // AIRecommendationPerformanceTarget
@@ -67,6 +67,11 @@ declare const DescribeAIBenchmarkJobCommand_base: {
67
67
  * // LogStreamName: "STRING_VALUE",
68
68
  * // },
69
69
  * // ],
70
+ * // MlflowConfig: { // AIMlflowConfig
71
+ * // MlflowResourceArn: "STRING_VALUE", // required
72
+ * // MlflowExperimentName: "STRING_VALUE",
73
+ * // MlflowRunName: "STRING_VALUE",
74
+ * // },
70
75
  * // },
71
76
  * // AIWorkloadConfigIdentifier: "STRING_VALUE", // required
72
77
  * // RoleArn: "STRING_VALUE", // required
@@ -56,6 +56,11 @@ declare const DescribeAIRecommendationJobCommand_base: {
56
56
  * // OutputConfig: { // AIRecommendationOutputResult
57
57
  * // S3OutputLocation: "STRING_VALUE", // required
58
58
  * // ModelPackageGroupIdentifier: "STRING_VALUE",
59
+ * // MlflowConfig: { // AIMlflowConfig
60
+ * // MlflowResourceArn: "STRING_VALUE", // required
61
+ * // MlflowExperimentName: "STRING_VALUE",
62
+ * // MlflowRunName: "STRING_VALUE",
63
+ * // },
59
64
  * // },
60
65
  * // InferenceSpecification: { // AIRecommendationInferenceSpecification
61
66
  * // Framework: "LMI" || "VLLM",
@@ -1,7 +1,6 @@
1
1
  import { Command as $Command } from "@smithy/core/client";
2
2
  import type { MetadataBearer as __MetadataBearer } from "@smithy/types";
3
- import type { DescribeInferenceComponentInput } from "../models/models_2";
4
- import type { DescribeInferenceComponentOutput } from "../models/models_3";
3
+ import type { DescribeInferenceComponentInput, DescribeInferenceComponentOutput } from "../models/models_3";
5
4
  import type { SageMakerClientResolvedConfig, ServiceInputTypes, ServiceOutputTypes } from "../SageMakerClient";
6
5
  /**
7
6
  * @public
@@ -1,7 +1,6 @@
1
1
  import { Command as $Command } from "@smithy/core/client";
2
2
  import type { MetadataBearer as __MetadataBearer } from "@smithy/types";
3
- import type { ListInferenceRecommendationsJobStepsRequest } from "../models/models_3";
4
- import type { ListInferenceRecommendationsJobStepsResponse } from "../models/models_4";
3
+ import type { ListInferenceRecommendationsJobStepsRequest, ListInferenceRecommendationsJobStepsResponse } from "../models/models_4";
5
4
  import type { SageMakerClientResolvedConfig, ServiceInputTypes, ServiceOutputTypes } from "../SageMakerClient";
6
5
  /**
7
6
  * @public
@@ -1,6 +1,7 @@
1
1
  import { Command as $Command } from "@smithy/core/client";
2
2
  import type { MetadataBearer as __MetadataBearer } from "@smithy/types";
3
- import type { UpdateNotebookInstanceInput, UpdateNotebookInstanceOutput } from "../models/models_4";
3
+ import type { UpdateNotebookInstanceInput } from "../models/models_4";
4
+ import type { UpdateNotebookInstanceOutput } from "../models/models_5";
4
5
  import type { SageMakerClientResolvedConfig, ServiceInputTypes, ServiceOutputTypes } from "../SageMakerClient";
5
6
  /**
6
7
  * @public
@@ -617,6 +617,27 @@ export interface AIBenchmarkNetworkConfig {
617
617
  */
618
618
  VpcConfig?: VpcConfig | undefined;
619
619
  }
620
+ /**
621
+ * <p>The MLflow tracking configuration for logging metrics and parameters to a SageMaker managed MLflow tracking server.</p>
622
+ * @public
623
+ */
624
+ export interface AIMlflowConfig {
625
+ /**
626
+ * <p>The Amazon Resource Name (ARN) of the SageMaker managed MLflow resource.</p>
627
+ * @public
628
+ */
629
+ MlflowResourceArn: string | undefined;
630
+ /**
631
+ * <p>The MLflow experiment name used for tracking.</p>
632
+ * @public
633
+ */
634
+ MlflowExperimentName?: string | undefined;
635
+ /**
636
+ * <p>The MLflow run name used for tracking.</p>
637
+ * @public
638
+ */
639
+ MlflowRunName?: string | undefined;
640
+ }
620
641
  /**
621
642
  * <p>The output configuration for an AI benchmark job.</p>
622
643
  * @public
@@ -627,6 +648,11 @@ export interface AIBenchmarkOutputConfig {
627
648
  * @public
628
649
  */
629
650
  S3OutputLocation: string | undefined;
651
+ /**
652
+ * <p>The MLflow tracking configuration for the job. If you don't specify this parameter, MLflow tracking is disabled.</p>
653
+ * @public
654
+ */
655
+ MlflowConfig?: AIMlflowConfig | undefined;
630
656
  }
631
657
  /**
632
658
  * <p>CloudWatch log information for an AI benchmark or recommendation job.</p>
@@ -659,6 +685,11 @@ export interface AIBenchmarkOutputResult {
659
685
  * @public
660
686
  */
661
687
  CloudWatchLogs?: AICloudWatchLogs[] | undefined;
688
+ /**
689
+ * <p>The MLflow tracking configuration for the job.</p>
690
+ * @public
691
+ */
692
+ MlflowConfig?: AIMlflowConfig | undefined;
662
693
  }
663
694
  /**
664
695
  * <p>The target for an AI benchmark job. This is a union type — specify one of the members.</p>
@@ -1080,6 +1111,11 @@ export interface AIRecommendationOutputConfig {
1080
1111
  * @public
1081
1112
  */
1082
1113
  ModelPackageGroupIdentifier?: string | undefined;
1114
+ /**
1115
+ * <p>The MLflow tracking configuration for the job. If you don't specify this parameter, MLflow tracking is disabled.</p>
1116
+ * @public
1117
+ */
1118
+ MlflowConfig?: AIMlflowConfig | undefined;
1083
1119
  }
1084
1120
  /**
1085
1121
  * <p>The output configuration for an AI recommendation job, including the S3 location for results and the model package group for deployment.</p>
@@ -1096,6 +1132,11 @@ export interface AIRecommendationOutputResult {
1096
1132
  * @public
1097
1133
  */
1098
1134
  ModelPackageGroupIdentifier?: string | undefined;
1135
+ /**
1136
+ * <p>The MLflow tracking configuration for the job.</p>
1137
+ * @public
1138
+ */
1139
+ MlflowConfig?: AIMlflowConfig | undefined;
1099
1140
  }
1100
1141
  /**
1101
1142
  * <p>The performance targets for an AI recommendation job.</p>
@@ -7008,19 +7049,3 @@ export interface ComputeQuotaConfig {
7008
7049
  */
7009
7050
  PreemptTeamTasks?: PreemptTeamTasks | undefined;
7010
7051
  }
7011
- /**
7012
- * <p>The target entity to allocate compute resources to.</p>
7013
- * @public
7014
- */
7015
- export interface ComputeQuotaTarget {
7016
- /**
7017
- * <p>Name of the team to allocate compute resources to.</p>
7018
- * @public
7019
- */
7020
- TeamName: string | undefined;
7021
- /**
7022
- * <p>Assigned entity fair-share weight. Idle compute will be shared across entities based on these assigned weights. This weight is only used when <code>FairShare</code> is enabled.</p> <p>A weight of 0 is the lowest priority and 100 is the highest. Weight 0 is the default.</p>
7023
- * @public
7024
- */
7025
- FairShareWeight?: number | undefined;
7026
- }
@@ -1,6 +1,22 @@
1
1
  import { AutomaticJsonStringConversion as __AutomaticJsonStringConversion } from "@smithy/core/serde";
2
2
  import type { _InstanceType, AccountDefaultStatus, ActionStatus, ActivationState, AppInstanceType, AppNetworkAccessType, AppSecurityGroupManagement, AppType, AuthMode, AutoMountHomeEFS, AvailabilityZoneBalanceEnforcementMode, AwsManagedHumanLoopRequestSource, CapacityReservationPreference, ClusterNodeProvisioningMode, ClusterNodeRecovery, CollectionType, CompleteOnConvergence, ConditionOutcome, ContainerMode, ContentClassifier, DeviceSubsetType, DirectInternetAccess, EdgePresetDeploymentType, ExecutionRoleIdentityConfig, ExecutionRoleSessionNameMode, FailureHandlingPolicy, FairShare, FeatureStatus, FeatureType, FlatInvocations, Framework, HomeEfsFileSystemCreation, HubContentType, HyperParameterScalingType, HyperParameterTuningAllocationStrategy, HyperParameterTuningJobObjectiveType, HyperParameterTuningJobStrategyType, HyperParameterTuningJobWarmStartType, IdleResourceSharing, InferenceComponentPlacementStrategy, InferenceExecutionMode, InferenceExperimentType, IPAddressType, JobCategory, JobType, ManagedInstanceScalingScaleInStrategy, ManagedInstanceScalingStatus, ManagedStorageType, MetricPublishFrequencyInSeconds, MlTools, ModelApprovalStatus, ModelCacheSetting, ModelCardStatus, ModelInfrastructureType, ModelPackageRegistrationType, ModelRegistrationMode, MonitoringProblemType, MonitoringType, NotebookInstanceAcceleratorType, NotebookOutputOption, ParameterType, ProblemType, ProcessingInstanceType, ProcessingS3DataDistributionType, ProcessingS3InputMode, ProcessingS3UploadMode, Processor, ProductionVariantAcceleratorType, ProductionVariantInferenceAmiVersion, ProductionVariantInstanceType, RecommendationJobSupportedEndpointType, RecommendationJobType, RepositoryAccessMode, RootAccess, RoutingStrategy, RStudioServerProAccessStatus, RStudioServerProUserGroup, SageMakerImageName, SchedulerResourceStatus, SkipModelValidation, StorageType, StudioWebPortal, TableFormat, TagPropagation, TargetDevice, TargetPlatformAccelerator, TargetPlatformArch, TargetPlatformOs, ThroughputMode, TrackingServerSize, TrafficType, TrainingInputMode, TrainingInstanceType, TrainingJobEarlyStoppingType, TtlDurationUnit, VendorGuidance } from "./enums";
3
- import type { ActionSource, AdditionalInferenceSpecificationDefinition, AdditionalModelDataSource, AdditionalS3DataSource, AIBenchmarkNetworkConfig, AIBenchmarkOutputConfig, AIBenchmarkTarget, AIDatasetConfig, AIModelSource, AIRecommendationComputeSpec, AIRecommendationInferenceSpecification, AIRecommendationOutputConfig, AIRecommendationPerformanceTarget, AIWorkloadConfigs, AlgorithmValidationSpecification, AmazonQSettings, AnnotationConsolidationConfig, AppLifecycleManagement, ArtifactSource, AsyncInferenceConfig, AuthorizedUrl, AutoMLChannel, AutoMLComputeConfig, AutoMLDataSplitConfig, AutoMLJobChannel, AutoMLJobConfig, AutoMLJobObjective, AutoMLOutputDataConfig, AutoMLProblemTypeConfig, AutoMLSecurityConfig, AutoParameter, AutoRollbackConfig, Autotune, BatchTransformInput, BestObjectiveNotImproving, Bias, BlueGreenUpdatePolicy, CanvasAppSettings, CapacitySize, CaptureContentTypeHeader, CaptureOption, CategoricalParameter, CategoricalParameterRange, CategoricalParameterRangeSpecification, Channel, ChannelSpecification, CheckpointConfig, ClarifyExplainerConfig, ClusterAutoScalingConfig, ClusterInstanceGroupSpecification, ClusterOrchestrator, ClusterRestrictedInstanceGroupsConfig, ClusterRestrictedInstanceGroupSpecification, ClusterTieredStorageConfig, CodeEditorAppImageConfig, CodeEditorAppSettings, CodeRepository, CollectionConfig, ComputeQuotaConfig, ComputeQuotaTarget, CustomImage, GitConfig, InferenceSpecification, JupyterLabAppImageConfig, KernelGatewayImageConfig, MetricDefinition, MetricsSource, ModelDataSource, OutputDataConfig, ResourceConfig, ResourceSpec, StoppingCondition, Tag, TransformJobDefinition, VpcConfig } from "./models_0";
3
+ import type { ActionSource, AdditionalInferenceSpecificationDefinition, AdditionalModelDataSource, AdditionalS3DataSource, AIBenchmarkNetworkConfig, AIBenchmarkOutputConfig, AIBenchmarkTarget, AIDatasetConfig, AIModelSource, AIRecommendationComputeSpec, AIRecommendationInferenceSpecification, AIRecommendationOutputConfig, AIRecommendationPerformanceTarget, AIWorkloadConfigs, AlgorithmValidationSpecification, AmazonQSettings, AnnotationConsolidationConfig, AppLifecycleManagement, ArtifactSource, AsyncInferenceConfig, AuthorizedUrl, AutoMLChannel, AutoMLComputeConfig, AutoMLDataSplitConfig, AutoMLJobChannel, AutoMLJobConfig, AutoMLJobObjective, AutoMLOutputDataConfig, AutoMLProblemTypeConfig, AutoMLSecurityConfig, AutoParameter, AutoRollbackConfig, Autotune, BatchTransformInput, BestObjectiveNotImproving, Bias, BlueGreenUpdatePolicy, CanvasAppSettings, CapacitySize, CaptureContentTypeHeader, CaptureOption, CategoricalParameter, CategoricalParameterRange, CategoricalParameterRangeSpecification, Channel, ChannelSpecification, CheckpointConfig, ClarifyExplainerConfig, ClusterAutoScalingConfig, ClusterInstanceGroupSpecification, ClusterOrchestrator, ClusterRestrictedInstanceGroupsConfig, ClusterRestrictedInstanceGroupSpecification, ClusterTieredStorageConfig, CodeEditorAppImageConfig, CodeEditorAppSettings, CodeRepository, CollectionConfig, ComputeQuotaConfig, CustomImage, GitConfig, InferenceSpecification, JupyterLabAppImageConfig, KernelGatewayImageConfig, MetricDefinition, MetricsSource, ModelDataSource, OutputDataConfig, ResourceConfig, ResourceSpec, StoppingCondition, Tag, TransformJobDefinition, VpcConfig } from "./models_0";
4
+ /**
5
+ * <p>The target entity to allocate compute resources to.</p>
6
+ * @public
7
+ */
8
+ export interface ComputeQuotaTarget {
9
+ /**
10
+ * <p>Name of the team to allocate compute resources to.</p>
11
+ * @public
12
+ */
13
+ TeamName: string | undefined;
14
+ /**
15
+ * <p>Assigned entity fair-share weight. Idle compute will be shared across entities based on these assigned weights. This weight is only used when <code>FairShare</code> is enabled.</p> <p>A weight of 0 is the lowest priority and 100 is the highest. Weight 0 is the default.</p>
16
+ * @public
17
+ */
18
+ FairShareWeight?: number | undefined;
19
+ }
4
20
  /**
5
21
  * <p>Summary of the compute allocation definition.</p>
6
22
  * @public
@@ -7164,19 +7180,3 @@ export interface ModelQuantizationConfig {
7164
7180
  */
7165
7181
  OverrideEnvironment?: Record<string, string> | undefined;
7166
7182
  }
7167
- /**
7168
- * <p>Settings for the model sharding technique that's applied by a model optimization job.</p>
7169
- * @public
7170
- */
7171
- export interface ModelShardingConfig {
7172
- /**
7173
- * <p>The URI of an LMI DLC in Amazon ECR. SageMaker uses this image to run the optimization.</p>
7174
- * @public
7175
- */
7176
- Image?: string | undefined;
7177
- /**
7178
- * <p>Environment variables that override the default ones in the model container.</p>
7179
- * @public
7180
- */
7181
- OverrideEnvironment?: Record<string, string> | undefined;
7182
- }
@@ -1,6 +1,22 @@
1
1
  import type { ActionStatus, ActivationState, AIBenchmarkJobStatus, AIRecommendationJobStatus, AlgorithmStatus, AppNetworkAccessType, AppSecurityGroupManagement, AppStatus, AppType, AuthMode, AutoMLJobSecondaryStatus, AutoMLJobStatus, AutoMLProblemTypeConfigName, BatchStrategy, CapacityReservationPreference, CaptureStatus, ClusterNodeProvisioningMode, ClusterNodeRecovery, ClusterStatus, CompilationJobStatus, CustomizationTechnique, DataDistributionType, DeepHealthCheckType, DomainStatus, EdgePackagingJobStatus, EdgePresetDeploymentStatus, EdgePresetDeploymentType, EnabledOrDisabled, EndpointStatus, EvaluationType, FeatureGroupStatus, FeatureStatus, FeatureType, FlowDefinitionStatus, HomeEfsFileSystemCreation, HubContentStatus, HubContentSupportStatus, HubContentType, HubStatus, HumanTaskUiStatus, HyperParameterTuningJobObjectiveType, HyperParameterTuningJobStatus, ImageStatus, ImageVersionStatus, InputMode, JobCategory, JobType, JoinSource, LastUpdateStatusValue, ModelSpeculativeDecodingS3DataType, ModelSpeculativeDecodingTechnique, ObjectiveStatus, OfflineStoreStatusValue, OptimizationJobDeploymentInstanceType, PartnerAppAuthType, PartnerAppType, Peft, ProblemType, ProcessingInstanceType, ProcessingS3CompressionType, ProcessingS3DataDistributionType, ProcessingS3DataType, ProcessingS3InputMode, ProcessingS3UploadMode, Processor, ProductionVariantAcceleratorType, ProductionVariantInstanceType, RecommendationStatus, RedshiftResultCompressionType, RedshiftResultFormat, RetentionType, RuleEvaluationStatus, SchedulerConfigComponent, SchedulerResourceStatus, ServerlessJobType, SharingType, StageStatus, Statistic, StudioLifecycleConfigAppType, TagPropagation, ThroughputMode, TrainingJobStatus, TrialComponentPrimaryStatus, VariantStatus, VendorGuidance, WorkforceIpAddressType } from "./enums";
2
- import type { ActionSource, AIBenchmarkNetworkConfig, AIBenchmarkOutputResult, AIBenchmarkTarget, AIDatasetConfig, AIModelSource, AIRecommendation, AIRecommendationComputeSpec, AIRecommendationInferenceSpecification, AIRecommendationOutputResult, AIRecommendationPerformanceTarget, AIWorkloadConfigs, AlgorithmSpecification, AlgorithmStatusDetails, AlgorithmValidationSpecification, AppSpecification, ArtifactSource, AsyncInferenceConfig, AthenaDatasetDefinition, AutoMLCandidate, AutoMLChannel, AutoMLComputeConfig, AutoMLDataSplitConfig, AutoMLJobArtifacts, AutoMLJobChannel, AutoMLJobCompletionCriteria, AutoMLJobConfig, AutoMLJobObjective, AutoMLOutputDataConfig, AutoMLPartialFailureReason, AutoMLProblemTypeConfig, AutoMLResolvedAttributes, AutoMLSecurityConfig, Autotune, BatchDataCaptureConfig, CfnCreateTemplateProvider, Channel, CheckpointConfig, ClusterAutoScalingConfigOutput, ClusterEventDetail, ClusterInstanceGroupDetails, ClusterNodeDetails, ClusterOrchestrator, ClusterRestrictedInstanceGroupDetails, ClusterRestrictedInstanceGroupsConfigOutput, ClusterTieredStorageConfig, CodeEditorAppImageConfig, CodeRepository, CognitoConfig, CognitoMemberDefinition, CollectionConfiguration, ComputeQuotaConfig, ComputeQuotaTarget, GitConfig, InferenceSpecification, JupyterLabAppImageConfig, KernelGatewayImageConfig, OutputDataConfig, ResourceConfig, ResourceSpec, StoppingCondition, Tag, TransformInput, TransformOutput, TransformResources, UserContext, VpcConfig } from "./models_0";
3
- import type { ContextSource, DataCaptureConfig, DataQualityAppSpecification, DataQualityBaselineConfig, DataQualityJobInput, DefaultSpaceSettings, DeploymentConfig, DeviceSelectionConfig, DomainSettings, EdgeDeploymentConfig, EdgeDeploymentModelConfig, EdgeOutputConfig, ExplainerConfig, FeatureDefinition, FlowDefinitionOutputConfig, HubS3StorageConfig, HumanLoopActivationConfig, HumanLoopConfig, HumanLoopRequestSource, HyperParameterTrainingJobDefinition, HyperParameterTuningJobConfig, HyperParameterTuningJobWarmStartConfig, InputConfig, JupyterServerAppSettings, KernelGatewayAppSettings, MetadataProperties, MetricsConfig, ModelCompilationConfig, ModelDeployConfig, ModelQuantizationConfig, ModelShardingConfig, MonitoringNetworkConfig, MonitoringOutputConfig, MonitoringResources, MonitoringStoppingCondition, NeoVpcConfig, NetworkConfig, OfflineStoreConfig, OnlineStoreConfig, OptimizationJobModelSource, OptimizationSageMakerModel, OutputConfig, ProductionVariant, ProductionVariantManagedInstanceScaling, ProductionVariantRoutingConfig, ProductionVariantServerlessConfig, RetryStrategy, SchedulerConfig, TrainingSpecification, UserSettings } from "./models_1";
2
+ import type { ActionSource, AIBenchmarkNetworkConfig, AIBenchmarkOutputResult, AIBenchmarkTarget, AIDatasetConfig, AIModelSource, AIRecommendation, AIRecommendationComputeSpec, AIRecommendationInferenceSpecification, AIRecommendationOutputResult, AIRecommendationPerformanceTarget, AIWorkloadConfigs, AlgorithmSpecification, AlgorithmStatusDetails, AlgorithmValidationSpecification, AppSpecification, ArtifactSource, AsyncInferenceConfig, AthenaDatasetDefinition, AutoMLCandidate, AutoMLChannel, AutoMLComputeConfig, AutoMLDataSplitConfig, AutoMLJobArtifacts, AutoMLJobChannel, AutoMLJobCompletionCriteria, AutoMLJobConfig, AutoMLJobObjective, AutoMLOutputDataConfig, AutoMLPartialFailureReason, AutoMLProblemTypeConfig, AutoMLResolvedAttributes, AutoMLSecurityConfig, Autotune, BatchDataCaptureConfig, CfnCreateTemplateProvider, Channel, CheckpointConfig, ClusterAutoScalingConfigOutput, ClusterEventDetail, ClusterInstanceGroupDetails, ClusterNodeDetails, ClusterOrchestrator, ClusterRestrictedInstanceGroupDetails, ClusterRestrictedInstanceGroupsConfigOutput, ClusterTieredStorageConfig, CodeEditorAppImageConfig, CodeRepository, CognitoConfig, CognitoMemberDefinition, CollectionConfiguration, ComputeQuotaConfig, GitConfig, InferenceSpecification, JupyterLabAppImageConfig, KernelGatewayImageConfig, OutputDataConfig, ResourceConfig, ResourceSpec, StoppingCondition, Tag, TransformInput, TransformOutput, TransformResources, UserContext, VpcConfig } from "./models_0";
3
+ import type { ComputeQuotaTarget, ContextSource, DataCaptureConfig, DataQualityAppSpecification, DataQualityBaselineConfig, DataQualityJobInput, DefaultSpaceSettings, DeploymentConfig, DeviceSelectionConfig, DomainSettings, EdgeDeploymentConfig, EdgeDeploymentModelConfig, EdgeOutputConfig, ExplainerConfig, FeatureDefinition, FlowDefinitionOutputConfig, HubS3StorageConfig, HumanLoopActivationConfig, HumanLoopConfig, HumanLoopRequestSource, HyperParameterTrainingJobDefinition, HyperParameterTuningJobConfig, HyperParameterTuningJobWarmStartConfig, InputConfig, JupyterServerAppSettings, KernelGatewayAppSettings, MetadataProperties, MetricsConfig, ModelCompilationConfig, ModelDeployConfig, ModelQuantizationConfig, MonitoringNetworkConfig, MonitoringOutputConfig, MonitoringResources, MonitoringStoppingCondition, NeoVpcConfig, NetworkConfig, OfflineStoreConfig, OnlineStoreConfig, OptimizationJobModelSource, OptimizationSageMakerModel, OutputConfig, ProductionVariant, ProductionVariantManagedInstanceScaling, ProductionVariantRoutingConfig, ProductionVariantServerlessConfig, RetryStrategy, SchedulerConfig, TrainingSpecification, UserSettings } from "./models_1";
4
+ /**
5
+ * <p>Settings for the model sharding technique that's applied by a model optimization job.</p>
6
+ * @public
7
+ */
8
+ export interface ModelShardingConfig {
9
+ /**
10
+ * <p>The URI of an LMI DLC in Amazon ECR. SageMaker uses this image to run the optimization.</p>
11
+ * @public
12
+ */
13
+ Image?: string | undefined;
14
+ /**
15
+ * <p>Environment variables that override the default ones in the model container.</p>
16
+ * @public
17
+ */
18
+ OverrideEnvironment?: Record<string, string> | undefined;
19
+ }
4
20
  /**
5
21
  * <p>Contains information about the training data source for speculative decoding.</p>
6
22
  * @public
@@ -7189,13 +7205,3 @@ export interface DescribeImageVersionResponse {
7189
7205
  */
7190
7206
  ReleaseNotes?: string | undefined;
7191
7207
  }
7192
- /**
7193
- * @public
7194
- */
7195
- export interface DescribeInferenceComponentInput {
7196
- /**
7197
- * <p>The name of the inference component.</p>
7198
- * @public
7199
- */
7200
- InferenceComponentName: string | undefined;
7201
- }
@@ -2,6 +2,16 @@ import type { _InstanceType, AccountDefaultStatus, AIBenchmarkJobStatus, AIRecom
2
2
  import type { ActionSummary, AdditionalInferenceSpecificationDefinition, AgentVersion, AIBenchmarkJobSummary, AIRecommendationJobSummary, AIWorkloadConfigSummary, AlgorithmSpecification, AlgorithmSummary, AmazonQSettings, AppDetails, AppImageConfigDetails, AppSpecification, ArtifactSummary, AssociationInfo, AssociationSummary, AutoMLCandidate, AutoMLJobSummary, AutoRollbackConfig, AvailableUpgrade, BatchDataCaptureConfig, CfnTemplateProviderDetail, Channel, CheckpointConfig, ClusterEventSummary, ClusterNodeSummary, ClusterSchedulerConfigSummary, ClusterSummary, CodeRepositorySummary, CognitoConfig, CompilationJobSummary, InferenceSpecification, OutputDataConfig, OutputParameter, ResourceConfig, ResourceSpec, StoppingCondition, Tag, TransformInput, TransformOutput, TransformResources, UserContext, VpcConfig } from "./models_0";
3
3
  import type { ComputeQuotaSummary, ContainerDefinition, ContextSummary, DockerSettings, DriftCheckBaselines, EdgeOutputConfig, EndpointInfo, FeatureDefinition, HumanTaskConfig, HyperParameterTrainingJobDefinition, HyperParameterTuningJobConfig, HyperParameterTuningJobWarmStartConfig, InferenceComponentComputeResourceRequirements, InferenceComponentSchedulingConfig, InferenceComponentStartupParameters, InferenceExecutionConfig, InferenceExperimentDataStorageConfig, InferenceExperimentSchedule, InstanceMetadataServiceConfiguration, LabelingJobAlgorithmsConfig, LabelingJobInputConfig, LabelingJobOutputConfig, LabelingJobStoppingConditions, ManagedConfiguration, MetadataProperties, ModelBiasAppSpecification, ModelBiasBaselineConfig, ModelBiasJobInput, ModelCardExportOutputConfig, ModelCardSecurityConfig, ModelExplainabilityAppSpecification, ModelExplainabilityBaselineConfig, ModelExplainabilityJobInput, ModelInfrastructureConfig, ModelLifeCycle, ModelMetrics, ModelPackageModelCard, ModelPackageSecurityConfig, ModelPackageValidationSpecification, ModelQualityAppSpecification, ModelQualityBaselineConfig, ModelQualityJobInput, MonitoringNetworkConfig, MonitoringOutputConfig, MonitoringResources, MonitoringScheduleConfig, MonitoringStoppingCondition, NetworkConfig, NotebookInstanceLifecycleHook, OfflineStoreConfig, OnlineStoreConfig, OptimizationJobModelSource, ProductionVariantServerlessConfig, RecommendationJobInputConfig, RecommendationJobStoppingConditions, ResourceLimits, RetryStrategy, ShadowModeConfig, SourceAlgorithmSpecification, TrustedIdentityPropagationSettings, UnifiedStudioSettings, UserSettings } from "./models_1";
4
4
  import type { CustomizedMetricSpecification, DataCaptureConfigSummary, DataProcessing, DebugHookConfig, DebugRuleConfiguration, DebugRuleEvaluationStatus, DeployedImage, DeploymentRecommendation, ExperimentConfig, ExperimentSource, FeatureParameter, HyperParameterTrainingJobSummary, HyperParameterTuningJobCompletionDetails, HyperParameterTuningJobConsumedResources, InfraCheckConfig, LastUpdateStatus, MemberDefinition, MlflowConfig, ModelArtifacts, ModelClientConfig, ModelPackageConfig, NotificationConfiguration, ObjectiveStatusCounters, OfflineStoreStatus, OptimizationConfig, OptimizationJobOutputConfig, OptimizationVpcConfig, OwnershipSettings, ParallelismConfiguration, PartnerAppConfig, PartnerAppMaintenanceConfig, ProcessingInput, ProcessingOutputConfig, ProcessingResources, ProcessingStoppingCondition, ProductionVariantSummary, ProfilerConfig, ProfilerRuleConfiguration, RemoteDebugConfig, ServerlessJobConfig, ServiceCatalogProvisioningDetails, SourceIpConfig, SpaceSettings, SpaceSharingSettings, TensorBoardOutputConfig, TrainingJobStatusCounters, TrialComponentArtifact, TrialComponentParameterValue, TrialComponentStatus, WorkerAccessConfiguration } from "./models_2";
5
+ /**
6
+ * @public
7
+ */
8
+ export interface DescribeInferenceComponentInput {
9
+ /**
10
+ * <p>The name of the inference component.</p>
11
+ * @public
12
+ */
13
+ InferenceComponentName: string | undefined;
14
+ }
5
15
  /**
6
16
  * <p>Specifies the type and size of the endpoint capacity to activate for a rolling deployment or a rollback strategy. You can specify your batches as either of the following:</p> <ul> <li> <p>A count of inference component copies </p> </li> <li> <p>The overall percentage or your fleet </p> </li> </ul> <p>For a rollback strategy, if you don't specify the fields in this object, or if you set the <code>Value</code> parameter to 100%, then SageMaker AI uses a blue/green rollback strategy and rolls all traffic back to the blue fleet.</p>
7
17
  * @public
@@ -9823,33 +9833,3 @@ export interface ListInferenceRecommendationsJobsResponse {
9823
9833
  */
9824
9834
  NextToken?: string | undefined;
9825
9835
  }
9826
- /**
9827
- * @public
9828
- */
9829
- export interface ListInferenceRecommendationsJobStepsRequest {
9830
- /**
9831
- * <p>The name for the Inference Recommender job.</p>
9832
- * @public
9833
- */
9834
- JobName: string | undefined;
9835
- /**
9836
- * <p>A filter to return benchmarks of a specified status. If this field is left empty, then all benchmarks are returned.</p>
9837
- * @public
9838
- */
9839
- Status?: RecommendationJobStatus | undefined;
9840
- /**
9841
- * <p>A filter to return details about the specified type of subtask.</p> <p> <code>BENCHMARK</code>: Evaluate the performance of your model on different instance types.</p>
9842
- * @public
9843
- */
9844
- StepType?: RecommendationStepType | undefined;
9845
- /**
9846
- * <p>The maximum number of results to return.</p>
9847
- * @public
9848
- */
9849
- MaxResults?: number | undefined;
9850
- /**
9851
- * <p>A token that you can specify to return more results from the list. Specify this field if you have a token that was returned from a previous request.</p>
9852
- * @public
9853
- */
9854
- NextToken?: string | undefined;
9855
- }
@@ -1,8 +1,38 @@
1
- import type { _InstanceType, AccountDefaultStatus, ActionStatus, ActivationState, AppNetworkAccessType, AppSecurityGroupManagement, AppType, BatchStrategy, ClusterNodeProvisioningMode, ClusterNodeRecovery, CrossAccountFilterOption, Direction, EndpointStatus, ExecutionStatus, FeatureStatus, HomeEfsFileSystemCreation, HubContentSupportStatus, HubContentType, InferenceExperimentStopDesiredState, IPAddressType, IsTrackingServerActive, JobCategory, JobStatus, JobType, LabelingJobStatus, LineageType, ListLabelingJobsForWorkteamSortByOptions, ListOptimizationJobsSortBy, ListWorkforcesSortByOptions, ListWorkteamsSortByOptions, MlflowAppStatus, ModelApprovalStatus, ModelCardExportJobSortBy, ModelCardExportJobSortOrder, ModelCardExportJobStatus, ModelCardSortBy, ModelCardSortOrder, ModelCardStatus, ModelCardVersionSortBy, ModelMetadataFilterType, ModelPackageGroupSortBy, ModelPackageGroupStatus, ModelPackageRegistrationType, ModelPackageSortBy, ModelPackageStatus, ModelPackageType, ModelRegistrationMode, ModelSortKey, ModelVariantAction, MonitoringAlertHistorySortKey, MonitoringAlertStatus, MonitoringExecutionSortKey, MonitoringJobDefinitionSortKey, MonitoringScheduleSortKey, MonitoringType, NotebookInstanceAcceleratorType, NotebookInstanceLifecycleConfigSortKey, NotebookInstanceLifecycleConfigSortOrder, NotebookInstanceSortKey, NotebookInstanceSortOrder, NotebookInstanceStatus, OptimizationJobDeploymentInstanceType, OptimizationJobStatus, OrderKey, PartnerAppStatus, PartnerAppType, PipelineExecutionStatus, PipelineStatus, ProcessingJobStatus, Processor, ProjectSortBy, ProjectSortOrder, ProjectStatus, Relation, ReservedCapacityInstanceType, ReservedCapacityType, ResourceCatalogSortBy, ResourceCatalogSortOrder, RootAccess, SageMakerResourceName, ScheduleStatus, SecondaryStatus, SharingType, SkipModelValidation, SortBy, SortLineageGroupsBy, SortMlflowAppBy, SortOrder, SortPipelineExecutionsBy, SortPipelinesBy, SortTrackingServerBy, SortTrialComponentsBy, SortTrialsBy, SpaceSortKey, SpaceStatus, StepStatus, StudioLifecycleConfigAppType, StudioLifecycleConfigSortKey, TagPropagation, ThroughputMode, TrackingServerSize, TrackingServerStatus, TrainingJobSortByOptions, TrainingJobStatus, TrainingPlanFilterName, TrainingPlanSortBy, TrainingPlanSortOrder, TrainingPlanStatus, TransformJobStatus, UltraServerHealthStatus, UserProfileSortKey, UserProfileStatus, VariantPropertyType, VendorGuidance, WarmPoolResourceStatus } from "./enums";
2
- import type { AdditionalInferenceSpecificationDefinition, AlgorithmSpecification, AppSpecification, AutoMLJobStepMetadata, BatchDataCaptureConfig, BatchTransformInput, BedrockCustomModelDeploymentMetadata, BedrockCustomModelMetadata, BedrockModelImportMetadata, BedrockProvisionedModelThroughputMetadata, CacheHitResult, CallbackStepMetadata, Channel, CheckpointConfig, ClarifyCheckStepMetadata, ClusterAutoScalingConfig, ClusterInstanceGroupSpecification, ClusterOrchestrator, ClusterRestrictedInstanceGroupsConfig, ClusterRestrictedInstanceGroupSpecification, ClusterTieredStorageConfig, CodeEditorAppImageConfig, ComputeQuotaConfig, ComputeQuotaTarget, DeploymentConfiguration, InferenceSpecification, JupyterLabAppImageConfig, KernelGatewayImageConfig, OutputDataConfig, OutputParameter, ResourceConfig, StoppingCondition, Tag, TransformInput, TransformOutput, TransformResources, UserContext, VpcConfig } from "./models_0";
3
- import type { ConditionStepMetadata, ContainerDefinition, DefaultSpaceSettings, DeploymentConfig, DriftCheckBaselines, EdgeOutputConfig, FeatureDefinition, InferenceComponentRuntimeConfig, InferenceComponentSpecification, InferenceExecutionConfig, InferenceExperimentDataStorageConfig, InferenceExperimentSchedule, InstanceMetadataServiceConfiguration, ManagedConfiguration, MetadataProperties, ModelCardSecurityConfig, ModelLifeCycle, ModelMetrics, ModelPackageModelCard, ModelPackageSecurityConfig, ModelPackageValidationSpecification, ModelVariantConfig, MonitoringScheduleConfig, NetworkConfig, RetryStrategy, SchedulerConfig, ShadowModeConfig, SourceAlgorithmSpecification, TtlDuration, UiTemplate, UserSettings } from "./models_1";
1
+ import type { _InstanceType, AccountDefaultStatus, ActionStatus, ActivationState, AppNetworkAccessType, AppSecurityGroupManagement, AppType, BatchStrategy, ClusterNodeProvisioningMode, ClusterNodeRecovery, CrossAccountFilterOption, Direction, EndpointStatus, ExecutionStatus, FeatureStatus, HomeEfsFileSystemCreation, HubContentSupportStatus, HubContentType, InferenceExperimentStopDesiredState, IPAddressType, IsTrackingServerActive, JobCategory, JobStatus, JobType, LabelingJobStatus, LineageType, ListLabelingJobsForWorkteamSortByOptions, ListOptimizationJobsSortBy, ListWorkforcesSortByOptions, ListWorkteamsSortByOptions, MlflowAppStatus, ModelApprovalStatus, ModelCardExportJobSortBy, ModelCardExportJobSortOrder, ModelCardExportJobStatus, ModelCardSortBy, ModelCardSortOrder, ModelCardStatus, ModelCardVersionSortBy, ModelMetadataFilterType, ModelPackageGroupSortBy, ModelPackageGroupStatus, ModelPackageRegistrationType, ModelPackageSortBy, ModelPackageStatus, ModelPackageType, ModelRegistrationMode, ModelSortKey, ModelVariantAction, MonitoringAlertHistorySortKey, MonitoringAlertStatus, MonitoringExecutionSortKey, MonitoringJobDefinitionSortKey, MonitoringScheduleSortKey, MonitoringType, NotebookInstanceAcceleratorType, NotebookInstanceLifecycleConfigSortKey, NotebookInstanceLifecycleConfigSortOrder, NotebookInstanceSortKey, NotebookInstanceSortOrder, NotebookInstanceStatus, OptimizationJobDeploymentInstanceType, OptimizationJobStatus, OrderKey, PartnerAppStatus, PartnerAppType, PipelineExecutionStatus, PipelineStatus, ProcessingJobStatus, Processor, ProjectSortBy, ProjectSortOrder, ProjectStatus, RecommendationJobStatus, RecommendationStepType, Relation, ReservedCapacityInstanceType, ReservedCapacityType, ResourceCatalogSortBy, ResourceCatalogSortOrder, RootAccess, SageMakerResourceName, ScheduleStatus, SecondaryStatus, SharingType, SkipModelValidation, SortBy, SortLineageGroupsBy, SortMlflowAppBy, SortOrder, SortPipelineExecutionsBy, SortPipelinesBy, SortTrackingServerBy, SortTrialComponentsBy, SortTrialsBy, SpaceSortKey, SpaceStatus, StepStatus, StudioLifecycleConfigAppType, StudioLifecycleConfigSortKey, TagPropagation, ThroughputMode, TrackingServerSize, TrackingServerStatus, TrainingJobSortByOptions, TrainingJobStatus, TrainingPlanFilterName, TrainingPlanSortBy, TrainingPlanSortOrder, TrainingPlanStatus, TransformJobStatus, UltraServerHealthStatus, UserProfileSortKey, UserProfileStatus, VariantPropertyType, VendorGuidance, WarmPoolResourceStatus } from "./enums";
2
+ import type { AdditionalInferenceSpecificationDefinition, AlgorithmSpecification, AppSpecification, AutoMLJobStepMetadata, BatchDataCaptureConfig, BatchTransformInput, BedrockCustomModelDeploymentMetadata, BedrockCustomModelMetadata, BedrockModelImportMetadata, BedrockProvisionedModelThroughputMetadata, CacheHitResult, CallbackStepMetadata, Channel, CheckpointConfig, ClarifyCheckStepMetadata, ClusterAutoScalingConfig, ClusterInstanceGroupSpecification, ClusterOrchestrator, ClusterRestrictedInstanceGroupsConfig, ClusterRestrictedInstanceGroupSpecification, ClusterTieredStorageConfig, CodeEditorAppImageConfig, ComputeQuotaConfig, DeploymentConfiguration, InferenceSpecification, JupyterLabAppImageConfig, KernelGatewayImageConfig, OutputDataConfig, OutputParameter, ResourceConfig, StoppingCondition, Tag, TransformInput, TransformOutput, TransformResources, UserContext, VpcConfig } from "./models_0";
3
+ import type { ComputeQuotaTarget, ConditionStepMetadata, ContainerDefinition, DefaultSpaceSettings, DeploymentConfig, DriftCheckBaselines, EdgeOutputConfig, FeatureDefinition, InferenceComponentRuntimeConfig, InferenceComponentSpecification, InferenceExecutionConfig, InferenceExperimentDataStorageConfig, InferenceExperimentSchedule, InstanceMetadataServiceConfiguration, ManagedConfiguration, MetadataProperties, ModelCardSecurityConfig, ModelLifeCycle, ModelMetrics, ModelPackageModelCard, ModelPackageSecurityConfig, ModelPackageValidationSpecification, ModelVariantConfig, MonitoringScheduleConfig, NetworkConfig, RetryStrategy, SchedulerConfig, ShadowModeConfig, SourceAlgorithmSpecification, TtlDuration, UiTemplate, UserSettings } from "./models_1";
4
4
  import type { DataProcessing, DebugHookConfig, DebugRuleConfiguration, DebugRuleEvaluationStatus, DeploymentRecommendation, ExperimentConfig, FeatureParameter, HyperParameterTrainingJobSummary, InstanceGroupHealthCheckConfiguration, ModelArtifacts, ModelClientConfig, ModelPackageConfig, ParallelismConfiguration, ProcessingInput, ProcessingOutputConfig, ProcessingResources, ProcessingStoppingCondition, ProfilerConfig, ServiceCatalogProvisioningDetails, SpaceStorageSettings, TensorBoardOutputConfig, TrialComponentArtifact, TrialComponentParameterValue, TrialComponentStatus } from "./models_2";
5
5
  import type { DesiredWeightAndCapacity, Device, DeviceDeploymentSummary, DomainSettingsForUpdate, Edge, EMRStepMetadata, Endpoint, EndpointConfigStepMetadata, EndpointStepMetadata, Experiment, FailStepMetadata, FeatureGroup, FeatureMetadata, Filter, GitConfigForUpdate, HyperParameterTuningJobSearchEntity, InferenceComponentDeploymentConfig, InferenceComponentMetadata, InferenceRecommendationsJobStep, Job, JobConfigSchemaVersionSummary, JobStepMetadata, JobSummary, LabelingJobForWorkteamSummary, LabelingJobSummary, LambdaStepMetadata, LineageGroupSummary, LineageMetadata, MetricData, ModelPackageStatusDetails, MonitoringExecutionSummary, MonitoringJobDefinitionSummary, PipelineExperimentConfig, ReservedCapacitySummary, SecondaryStatusTransition, SelectiveExecutionConfig, ServiceCatalogProvisionedProductDetails, SubscribedWorkteam, TemplateProviderDetail, TrialComponentMetricSummary, TrialComponentSource, TrialSource, WarmPoolStatus, Workforce, Workteam } from "./models_3";
6
+ /**
7
+ * @public
8
+ */
9
+ export interface ListInferenceRecommendationsJobStepsRequest {
10
+ /**
11
+ * <p>The name for the Inference Recommender job.</p>
12
+ * @public
13
+ */
14
+ JobName: string | undefined;
15
+ /**
16
+ * <p>A filter to return benchmarks of a specified status. If this field is left empty, then all benchmarks are returned.</p>
17
+ * @public
18
+ */
19
+ Status?: RecommendationJobStatus | undefined;
20
+ /**
21
+ * <p>A filter to return details about the specified type of subtask.</p> <p> <code>BENCHMARK</code>: Evaluate the performance of your model on different instance types.</p>
22
+ * @public
23
+ */
24
+ StepType?: RecommendationStepType | undefined;
25
+ /**
26
+ * <p>The maximum number of results to return.</p>
27
+ * @public
28
+ */
29
+ MaxResults?: number | undefined;
30
+ /**
31
+ * <p>A token that you can specify to return more results from the list. Specify this field if you have a token that was returned from a previous request.</p>
32
+ * @public
33
+ */
34
+ NextToken?: string | undefined;
35
+ }
6
36
  /**
7
37
  * @public
8
38
  */
@@ -8652,8 +8682,3 @@ export interface UpdateNotebookInstanceInput {
8652
8682
  */
8653
8683
  InstanceMetadataServiceConfiguration?: InstanceMetadataServiceConfiguration | undefined;
8654
8684
  }
8655
- /**
8656
- * @public
8657
- */
8658
- export interface UpdateNotebookInstanceOutput {
8659
- }
@@ -4,6 +4,11 @@ import type { NotebookInstanceLifecycleHook, UserSettings } from "./models_1";
4
4
  import type { MemberDefinition, NotificationConfiguration, OidcConfig, ParallelismConfiguration, PartnerAppConfig, PartnerAppMaintenanceConfig, PipelineDefinitionS3Location, ProfilerRuleConfiguration, ProvisioningParameter, SourceIpConfig, SpaceSettings, TrialComponentArtifact, TrialComponentParameterValue, TrialComponentStatus, WorkerAccessConfiguration, WorkforceVpcConfigRequest } from "./models_2";
5
5
  import type { Filter, Workforce, Workteam } from "./models_3";
6
6
  import type { NestedFilters, ProfilerConfigForUpdate, RemoteDebugConfigForUpdate, ResourceConfigForUpdate, VisibilityConditions } from "./models_4";
7
+ /**
8
+ * @public
9
+ */
10
+ export interface UpdateNotebookInstanceOutput {
11
+ }
7
12
  /**
8
13
  * @public
9
14
  */
@@ -32,6 +32,7 @@ export declare var AIBenchmarkOutputConfig$: StaticStructureSchema;
32
32
  export declare var AIBenchmarkOutputResult$: StaticStructureSchema;
33
33
  export declare var AICapacityReservationConfig$: StaticStructureSchema;
34
34
  export declare var AICloudWatchLogs$: StaticStructureSchema;
35
+ export declare var AIMlflowConfig$: StaticStructureSchema;
35
36
  export declare var AIModelSourceS3$: StaticStructureSchema;
36
37
  export declare var AIRecommendation$: StaticStructureSchema;
37
38
  export declare var AIRecommendationComputeSpec$: StaticStructureSchema;
@@ -1,7 +1,9 @@
1
1
  import { Command as $Command } from "@smithy/core/client";
2
2
  import { MetadataBearer as __MetadataBearer } from "@smithy/types";
3
- import { DescribeInferenceComponentInput } from "../models/models_2";
4
- import { DescribeInferenceComponentOutput } from "../models/models_3";
3
+ import {
4
+ DescribeInferenceComponentInput,
5
+ DescribeInferenceComponentOutput,
6
+ } from "../models/models_3";
5
7
  import {
6
8
  SageMakerClientResolvedConfig,
7
9
  ServiceInputTypes,
@@ -1,7 +1,9 @@
1
1
  import { Command as $Command } from "@smithy/core/client";
2
2
  import { MetadataBearer as __MetadataBearer } from "@smithy/types";
3
- import { ListInferenceRecommendationsJobStepsRequest } from "../models/models_3";
4
- import { ListInferenceRecommendationsJobStepsResponse } from "../models/models_4";
3
+ import {
4
+ ListInferenceRecommendationsJobStepsRequest,
5
+ ListInferenceRecommendationsJobStepsResponse,
6
+ } from "../models/models_4";
5
7
  import {
6
8
  SageMakerClientResolvedConfig,
7
9
  ServiceInputTypes,
@@ -1,9 +1,7 @@
1
1
  import { Command as $Command } from "@smithy/core/client";
2
2
  import { MetadataBearer as __MetadataBearer } from "@smithy/types";
3
- import {
4
- UpdateNotebookInstanceInput,
5
- UpdateNotebookInstanceOutput,
6
- } from "../models/models_4";
3
+ import { UpdateNotebookInstanceInput } from "../models/models_4";
4
+ import { UpdateNotebookInstanceOutput } from "../models/models_5";
7
5
  import {
8
6
  SageMakerClientResolvedConfig,
9
7
  ServiceInputTypes,