@aws-sdk/client-sagemaker 3.1061.0 → 3.1063.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (37)
  1. package/dist-cjs/index.js +6 -0
  2. package/dist-cjs/schemas/schemas_0.js +80 -68
  3. package/dist-es/models/enums.js +5 -0
  4. package/dist-es/schemas/schemas_0.js +41 -29
  5. package/dist-types/commands/CreateAIBenchmarkJobCommand.d.ts +5 -0
  6. package/dist-types/commands/CreateAIRecommendationJobCommand.d.ts +5 -0
  7. package/dist-types/commands/DescribeAIBenchmarkJobCommand.d.ts +5 -0
  8. package/dist-types/commands/DescribeAIRecommendationJobCommand.d.ts +5 -0
  9. package/dist-types/commands/DescribeInferenceComponentCommand.d.ts +1 -2
  10. package/dist-types/commands/DescribeModelCardCommand.d.ts +2 -1
  11. package/dist-types/commands/DescribeModelPackageCommand.d.ts +2 -1
  12. package/dist-types/commands/GetSearchSuggestionsCommand.d.ts +1 -1
  13. package/dist-types/commands/ListInferenceRecommendationsJobStepsCommand.d.ts +1 -1
  14. package/dist-types/commands/SearchCommand.d.ts +24 -1
  15. package/dist-types/commands/UpdateNotebookInstanceCommand.d.ts +2 -1
  16. package/dist-types/commands/UpdateNotebookInstanceLifecycleConfigCommand.d.ts +1 -2
  17. package/dist-types/models/enums.d.ts +13 -0
  18. package/dist-types/models/models_0.d.ts +41 -16
  19. package/dist-types/models/models_1.d.ts +17 -17
  20. package/dist-types/models/models_2.d.ts +18 -12
  21. package/dist-types/models/models_3.d.ts +100 -48
  22. package/dist-types/models/models_4.d.ts +55 -29
  23. package/dist-types/models/models_5.d.ts +26 -1
  24. package/dist-types/schemas/schemas_0.d.ts +2 -0
  25. package/dist-types/ts3.4/commands/DescribeInferenceComponentCommand.d.ts +4 -2
  26. package/dist-types/ts3.4/commands/ListInferenceRecommendationsJobStepsCommand.d.ts +1 -1
  27. package/dist-types/ts3.4/commands/UpdateNotebookInstanceCommand.d.ts +2 -4
  28. package/dist-types/ts3.4/commands/UpdateNotebookInstanceLifecycleConfigCommand.d.ts +4 -2
  29. package/dist-types/ts3.4/models/enums.d.ts +6 -0
  30. package/dist-types/ts3.4/models/models_0.d.ts +9 -4
  31. package/dist-types/ts3.4/models/models_1.d.ts +4 -5
  32. package/dist-types/ts3.4/models/models_2.d.ts +5 -5
  33. package/dist-types/ts3.4/models/models_3.d.ts +22 -11
  34. package/dist-types/ts3.4/models/models_4.d.ts +17 -8
  35. package/dist-types/ts3.4/models/models_5.d.ts +7 -1
  36. package/dist-types/ts3.4/schemas/schemas_0.d.ts +2 -0
  37. package/package.json +5 -5
@@ -1,6 +1,22 @@
1
1
  import type { ActionStatus, ActivationState, AIBenchmarkJobStatus, AIRecommendationJobStatus, AlgorithmStatus, AppNetworkAccessType, AppSecurityGroupManagement, AppStatus, AppType, AuthMode, AutoMLJobSecondaryStatus, AutoMLJobStatus, AutoMLProblemTypeConfigName, BatchStrategy, CapacityReservationPreference, CaptureStatus, ClusterNodeProvisioningMode, ClusterNodeRecovery, ClusterStatus, CompilationJobStatus, CustomizationTechnique, DataDistributionType, DeepHealthCheckType, DomainStatus, EdgePackagingJobStatus, EdgePresetDeploymentStatus, EdgePresetDeploymentType, EnabledOrDisabled, EndpointStatus, EvaluationType, FeatureGroupStatus, FeatureStatus, FeatureType, FlowDefinitionStatus, HomeEfsFileSystemCreation, HubContentStatus, HubContentSupportStatus, HubContentType, HubStatus, HumanTaskUiStatus, HyperParameterTuningJobObjectiveType, HyperParameterTuningJobStatus, ImageStatus, ImageVersionStatus, InputMode, JobCategory, JobType, JoinSource, LastUpdateStatusValue, ModelSpeculativeDecodingS3DataType, ModelSpeculativeDecodingTechnique, ObjectiveStatus, OfflineStoreStatusValue, OptimizationJobDeploymentInstanceType, PartnerAppAuthType, PartnerAppType, Peft, ProblemType, ProcessingInstanceType, ProcessingS3CompressionType, ProcessingS3DataDistributionType, ProcessingS3DataType, ProcessingS3InputMode, ProcessingS3UploadMode, Processor, ProductionVariantAcceleratorType, ProductionVariantInstanceType, RecommendationStatus, RedshiftResultCompressionType, RedshiftResultFormat, RetentionType, RuleEvaluationStatus, SchedulerConfigComponent, SchedulerResourceStatus, ServerlessJobType, SharingType, StageStatus, Statistic, StudioLifecycleConfigAppType, TagPropagation, ThroughputMode, TrainingJobStatus, TrialComponentPrimaryStatus, VariantStatus, VendorGuidance, WorkforceIpAddressType } from "./enums";
2
- import type { ActionSource, AIBenchmarkNetworkConfig, AIBenchmarkOutputResult, AIBenchmarkTarget, AIDatasetConfig, AIModelSource, AIRecommendation, AIRecommendationComputeSpec, AIRecommendationInferenceSpecification, AIRecommendationOutputResult, AIRecommendationPerformanceTarget, AIWorkloadConfigs, AlgorithmSpecification, AlgorithmStatusDetails, AlgorithmValidationSpecification, AppSpecification, ArtifactSource, AsyncInferenceConfig, AthenaDatasetDefinition, AutoMLCandidate, AutoMLChannel, AutoMLComputeConfig, AutoMLDataSplitConfig, AutoMLJobArtifacts, AutoMLJobChannel, AutoMLJobCompletionCriteria, AutoMLJobConfig, AutoMLJobObjective, AutoMLOutputDataConfig, AutoMLPartialFailureReason, AutoMLProblemTypeConfig, AutoMLResolvedAttributes, AutoMLSecurityConfig, Autotune, BatchDataCaptureConfig, CfnCreateTemplateProvider, Channel, CheckpointConfig, ClusterAutoScalingConfigOutput, ClusterEventDetail, ClusterInstanceGroupDetails, ClusterNodeDetails, ClusterOrchestrator, ClusterRestrictedInstanceGroupDetails, ClusterRestrictedInstanceGroupsConfigOutput, ClusterTieredStorageConfig, CodeEditorAppImageConfig, CodeRepository, CognitoConfig, CognitoMemberDefinition, CollectionConfiguration, ComputeQuotaConfig, ComputeQuotaTarget, GitConfig, InferenceSpecification, JupyterLabAppImageConfig, KernelGatewayImageConfig, OutputDataConfig, ResourceConfig, ResourceSpec, StoppingCondition, Tag, TransformInput, TransformOutput, TransformResources, UserContext, VpcConfig } from "./models_0";
3
- import type { ContextSource, DataCaptureConfig, DataQualityAppSpecification, DataQualityBaselineConfig, DataQualityJobInput, DefaultSpaceSettings, DeploymentConfig, DeviceSelectionConfig, DomainSettings, EdgeDeploymentConfig, EdgeDeploymentModelConfig, EdgeOutputConfig, ExplainerConfig, FeatureDefinition, FlowDefinitionOutputConfig, HubS3StorageConfig, HumanLoopActivationConfig, HumanLoopConfig, HumanLoopRequestSource, HyperParameterTrainingJobDefinition, HyperParameterTuningJobConfig, HyperParameterTuningJobWarmStartConfig, InputConfig, JupyterServerAppSettings, KernelGatewayAppSettings, MetadataProperties, MetricsConfig, ModelCompilationConfig, ModelDeployConfig, ModelQuantizationConfig, ModelShardingConfig, MonitoringNetworkConfig, MonitoringOutputConfig, MonitoringResources, MonitoringStoppingCondition, NeoVpcConfig, NetworkConfig, OfflineStoreConfig, OnlineStoreConfig, OptimizationJobModelSource, OptimizationSageMakerModel, OutputConfig, ProductionVariant, ProductionVariantManagedInstanceScaling, ProductionVariantRoutingConfig, ProductionVariantServerlessConfig, RetryStrategy, SchedulerConfig, TrainingSpecification, UserSettings } from "./models_1";
2
+ import type { ActionSource, AIBenchmarkNetworkConfig, AIBenchmarkOutputResult, AIBenchmarkTarget, AIDatasetConfig, AIModelSource, AIRecommendation, AIRecommendationComputeSpec, AIRecommendationInferenceSpecification, AIRecommendationOutputResult, AIRecommendationPerformanceTarget, AIWorkloadConfigs, AlgorithmSpecification, AlgorithmStatusDetails, AlgorithmValidationSpecification, AppSpecification, ArtifactSource, AsyncInferenceConfig, AthenaDatasetDefinition, AutoMLCandidate, AutoMLChannel, AutoMLComputeConfig, AutoMLDataSplitConfig, AutoMLJobArtifacts, AutoMLJobChannel, AutoMLJobCompletionCriteria, AutoMLJobConfig, AutoMLJobObjective, AutoMLOutputDataConfig, AutoMLPartialFailureReason, AutoMLProblemTypeConfig, AutoMLResolvedAttributes, AutoMLSecurityConfig, Autotune, BatchDataCaptureConfig, CfnCreateTemplateProvider, Channel, CheckpointConfig, ClusterAutoScalingConfigOutput, ClusterEventDetail, ClusterInstanceGroupDetails, ClusterNodeDetails, ClusterOrchestrator, ClusterRestrictedInstanceGroupDetails, ClusterRestrictedInstanceGroupsConfigOutput, ClusterTieredStorageConfig, CodeEditorAppImageConfig, CodeRepository, CognitoConfig, CognitoMemberDefinition, CollectionConfiguration, ComputeQuotaConfig, GitConfig, InferenceSpecification, JupyterLabAppImageConfig, KernelGatewayImageConfig, OutputDataConfig, ResourceConfig, ResourceSpec, StoppingCondition, Tag, TransformInput, TransformOutput, TransformResources, UserContext, VpcConfig } from "./models_0";
3
+ import type { ComputeQuotaTarget, ContextSource, DataCaptureConfig, DataQualityAppSpecification, DataQualityBaselineConfig, DataQualityJobInput, DefaultSpaceSettings, DeploymentConfig, DeviceSelectionConfig, DomainSettings, EdgeDeploymentConfig, EdgeDeploymentModelConfig, EdgeOutputConfig, ExplainerConfig, FeatureDefinition, FlowDefinitionOutputConfig, HubS3StorageConfig, HumanLoopActivationConfig, HumanLoopConfig, HumanLoopRequestSource, HyperParameterTrainingJobDefinition, HyperParameterTuningJobConfig, HyperParameterTuningJobWarmStartConfig, InputConfig, JupyterServerAppSettings, KernelGatewayAppSettings, MetadataProperties, MetricsConfig, ModelCompilationConfig, ModelDeployConfig, ModelQuantizationConfig, MonitoringNetworkConfig, MonitoringOutputConfig, MonitoringResources, MonitoringStoppingCondition, NeoVpcConfig, NetworkConfig, OfflineStoreConfig, OnlineStoreConfig, OptimizationJobModelSource, OptimizationSageMakerModel, OutputConfig, ProductionVariant, ProductionVariantManagedInstanceScaling, ProductionVariantRoutingConfig, ProductionVariantServerlessConfig, RetryStrategy, SchedulerConfig, TrainingSpecification, UserSettings } from "./models_1";
4
+ /**
5
+ * <p>Settings for the model sharding technique that's applied by a model optimization job.</p>
6
+ * @public
7
+ */
8
+ export interface ModelShardingConfig {
9
+ /**
10
+ * <p>The URI of an LMI DLC in Amazon ECR. SageMaker uses this image to run the optimization.</p>
11
+ * @public
12
+ */
13
+ Image?: string | undefined;
14
+ /**
15
+ * <p>Environment variables that override the default ones in the model container.</p>
16
+ * @public
17
+ */
18
+ OverrideEnvironment?: Record<string, string> | undefined;
19
+ }
4
20
  /**
5
21
  * <p>Contains information about the training data source for speculative decoding.</p>
6
22
  * @public
@@ -7189,13 +7205,3 @@ export interface DescribeImageVersionResponse {
7189
7205
  */
7190
7206
  ReleaseNotes?: string | undefined;
7191
7207
  }
7192
- /**
7193
- * @public
7194
- */
7195
- export interface DescribeInferenceComponentInput {
7196
- /**
7197
- * <p>The name of the inference component.</p>
7198
- * @public
7199
- */
7200
- InferenceComponentName: string | undefined;
7201
- }
@@ -1,7 +1,17 @@
1
- import type { _InstanceType, AccountDefaultStatus, AIBenchmarkJobStatus, AIRecommendationJobStatus, AlgorithmSortBy, AppImageConfigSortKey, AppSortKey, AssociationEdgeType, AutoMLJobStatus, AutoMLSortBy, AutoMLSortOrder, BatchStrategy, CandidateSortBy, CandidateStatus, ClusterEventResourceType, ClusterSortBy, CodeRepositorySortBy, CodeRepositorySortOrder, CompilationJobStatus, DetailedModelPackageStatus, DeviceDeploymentStatus, DirectInternetAccess, DomainStatus, EdgePackagingJobStatus, EndpointConfigSortKey, EndpointSortKey, EndpointStatus, EventSortBy, ExecutionRoleIdentityConfig, ExecutionStatus, FeatureGroupSortBy, FeatureGroupSortOrder, FeatureGroupStatus, FeatureType, FlowDefinitionStatus, HubContentSortBy, HubContentStatus, HubContentSupportStatus, HubContentType, HubSortBy, HubStatus, HyperParameterTuningJobSortByOptions, HyperParameterTuningJobStatus, HyperParameterTuningJobStrategyType, ImageSortBy, ImageSortOrder, ImageStatus, ImageVersionSortBy, ImageVersionSortOrder, ImageVersionStatus, InferenceComponentCapacitySizeType, InferenceComponentSortKey, InferenceComponentStatus, InferenceExperimentStatus, InferenceExperimentType, IPAddressType, IsTrackingServerActive, JobCategory, JobSecondaryStatus, JobStatus, LabelingJobStatus, ListAIBenchmarkJobsSortBy, ListAIRecommendationJobsSortBy, ListAIWorkloadConfigsSortBy, ListCompilationJobsSortBy, ListDeviceFleetsSortBy, ListEdgeDeploymentPlansSortBy, ListEdgePackagingJobsSortBy, ListInferenceRecommendationsJobsSortBy, MaintenanceStatus, ManagedStorageType, MlflowAppStatus, ModelApprovalStatus, ModelCardExportJobStatus, ModelCardProcessingStatus, ModelCardStatus, ModelPackageGroupStatus, ModelPackageRegistrationType, ModelPackageStatus, ModelRegistrationMode, ModelVariantStatus, MonitoringJobDefinitionSortKey, MonitoringType, NotebookInstanceAcceleratorType, NotebookInstanceStatus, OfflineStoreStatusValue, Operator, OptimizationJobDeploymentInstanceType, OptimizationJobStatus, OrderKey, PartnerAppAuthType, 
PartnerAppStatus, PartnerAppType, PipelineExecutionStatus, PipelineStatus, ProcessingJobStatus, ProductionVariantInstanceType, ProfilingStatus, ProjectStatus, RecommendationJobStatus, RecommendationJobType, RecommendationStepType, ReservedCapacityInstanceType, ReservedCapacityStatus, ReservedCapacityType, ResourceType, RootAccess, RuleEvaluationStatus, SageMakerResourceName, SagemakerServicecatalogStatus, SchedulerResourceStatus, ScheduleStatus, SecondaryStatus, SkipModelValidation, SortActionsBy, SortArtifactsBy, SortAssociationsBy, SortClusterSchedulerConfigBy, SortContextsBy, SortExperimentsBy, SortInferenceExperimentsBy, SortOrder, SortQuotaBy, SpaceStatus, StudioLifecycleConfigAppType, TrackingServerMaintenanceStatus, TrackingServerSize, TrackingServerStatus, TrainingJobStatus, TrainingPlanStatus, TransformJobStatus, UserProfileStatus, VolumeAttachmentStatus, WarmPoolResourceStatus, WorkforceIpAddressType, WorkforceStatus } from "./enums";
1
+ import type { _InstanceType, AccountDefaultStatus, AIBenchmarkJobStatus, AIRecommendationJobStatus, AlgorithmSortBy, AppImageConfigSortKey, AppSortKey, AssociationEdgeType, AutoMLJobStatus, AutoMLSortBy, AutoMLSortOrder, BatchStrategy, CandidateSortBy, CandidateStatus, ClusterEventResourceType, ClusterSortBy, CodeRepositorySortBy, CodeRepositorySortOrder, CompilationJobStatus, DetailedModelPackageStatus, DeviceDeploymentStatus, DirectInternetAccess, DomainStatus, EdgePackagingJobStatus, EndpointConfigSortKey, EndpointSortKey, EndpointStatus, EventSortBy, ExecutionRoleIdentityConfig, ExecutionStatus, FeatureGroupSortBy, FeatureGroupSortOrder, FeatureGroupStatus, FeatureType, FlowDefinitionStatus, HubContentSortBy, HubContentStatus, HubContentSupportStatus, HubContentType, HubSortBy, HubStatus, HyperParameterTuningJobSortByOptions, HyperParameterTuningJobStatus, HyperParameterTuningJobStrategyType, ImageSortBy, ImageSortOrder, ImageStatus, ImageVersionSortBy, ImageVersionSortOrder, ImageVersionStatus, IncludedData, InferenceComponentCapacitySizeType, InferenceComponentSortKey, InferenceComponentStatus, InferenceExperimentStatus, InferenceExperimentType, IPAddressType, IsTrackingServerActive, JobCategory, JobSecondaryStatus, JobStatus, LabelingJobStatus, ListAIBenchmarkJobsSortBy, ListAIRecommendationJobsSortBy, ListAIWorkloadConfigsSortBy, ListCompilationJobsSortBy, ListDeviceFleetsSortBy, ListEdgeDeploymentPlansSortBy, ListEdgePackagingJobsSortBy, ListInferenceRecommendationsJobsSortBy, MaintenanceStatus, ManagedStorageType, MlflowAppStatus, ModelApprovalStatus, ModelCardExportJobStatus, ModelCardProcessingStatus, ModelCardStatus, ModelPackageGroupStatus, ModelPackageRegistrationType, ModelPackageStatus, ModelRegistrationMode, ModelVariantStatus, MonitoringJobDefinitionSortKey, MonitoringType, NotebookInstanceAcceleratorType, NotebookInstanceStatus, OfflineStoreStatusValue, Operator, OptimizationJobDeploymentInstanceType, OptimizationJobStatus, OrderKey, 
PartnerAppAuthType, PartnerAppStatus, PartnerAppType, PipelineExecutionStatus, PipelineStatus, ProcessingJobStatus, ProductionVariantInstanceType, ProfilingStatus, ProjectStatus, RecommendationJobStatus, RecommendationJobType, RecommendationStepType, ReservedCapacityInstanceType, ReservedCapacityStatus, ReservedCapacityType, ResourceType, RootAccess, RuleEvaluationStatus, SageMakerResourceName, SagemakerServicecatalogStatus, SchedulerResourceStatus, ScheduleStatus, SecondaryStatus, SkipModelValidation, SortActionsBy, SortArtifactsBy, SortAssociationsBy, SortClusterSchedulerConfigBy, SortContextsBy, SortExperimentsBy, SortInferenceExperimentsBy, SortOrder, SortQuotaBy, SpaceStatus, StudioLifecycleConfigAppType, TrackingServerMaintenanceStatus, TrackingServerSize, TrackingServerStatus, TrainingJobStatus, TrainingPlanStatus, TransformJobStatus, UserProfileStatus, VolumeAttachmentStatus, WarmPoolResourceStatus, WorkforceIpAddressType, WorkforceStatus } from "./enums";
2
2
  import type { ActionSummary, AdditionalInferenceSpecificationDefinition, AgentVersion, AIBenchmarkJobSummary, AIRecommendationJobSummary, AIWorkloadConfigSummary, AlgorithmSpecification, AlgorithmSummary, AmazonQSettings, AppDetails, AppImageConfigDetails, AppSpecification, ArtifactSummary, AssociationInfo, AssociationSummary, AutoMLCandidate, AutoMLJobSummary, AutoRollbackConfig, AvailableUpgrade, BatchDataCaptureConfig, CfnTemplateProviderDetail, Channel, CheckpointConfig, ClusterEventSummary, ClusterNodeSummary, ClusterSchedulerConfigSummary, ClusterSummary, CodeRepositorySummary, CognitoConfig, CompilationJobSummary, InferenceSpecification, OutputDataConfig, OutputParameter, ResourceConfig, ResourceSpec, StoppingCondition, Tag, TransformInput, TransformOutput, TransformResources, UserContext, VpcConfig } from "./models_0";
3
3
  import type { ComputeQuotaSummary, ContainerDefinition, ContextSummary, DockerSettings, DriftCheckBaselines, EdgeOutputConfig, EndpointInfo, FeatureDefinition, HumanTaskConfig, HyperParameterTrainingJobDefinition, HyperParameterTuningJobConfig, HyperParameterTuningJobWarmStartConfig, InferenceComponentComputeResourceRequirements, InferenceComponentSchedulingConfig, InferenceComponentStartupParameters, InferenceExecutionConfig, InferenceExperimentDataStorageConfig, InferenceExperimentSchedule, InstanceMetadataServiceConfiguration, LabelingJobAlgorithmsConfig, LabelingJobInputConfig, LabelingJobOutputConfig, LabelingJobStoppingConditions, ManagedConfiguration, MetadataProperties, ModelBiasAppSpecification, ModelBiasBaselineConfig, ModelBiasJobInput, ModelCardExportOutputConfig, ModelCardSecurityConfig, ModelExplainabilityAppSpecification, ModelExplainabilityBaselineConfig, ModelExplainabilityJobInput, ModelInfrastructureConfig, ModelLifeCycle, ModelMetrics, ModelPackageModelCard, ModelPackageSecurityConfig, ModelPackageValidationSpecification, ModelQualityAppSpecification, ModelQualityBaselineConfig, ModelQualityJobInput, MonitoringNetworkConfig, MonitoringOutputConfig, MonitoringResources, MonitoringScheduleConfig, MonitoringStoppingCondition, NetworkConfig, NotebookInstanceLifecycleHook, OfflineStoreConfig, OnlineStoreConfig, OptimizationJobModelSource, ProductionVariantServerlessConfig, RecommendationJobInputConfig, RecommendationJobStoppingConditions, ResourceLimits, RetryStrategy, ShadowModeConfig, SourceAlgorithmSpecification, TrustedIdentityPropagationSettings, UnifiedStudioSettings, UserSettings } from "./models_1";
4
4
  import type { CustomizedMetricSpecification, DataCaptureConfigSummary, DataProcessing, DebugHookConfig, DebugRuleConfiguration, DebugRuleEvaluationStatus, DeployedImage, DeploymentRecommendation, ExperimentConfig, ExperimentSource, FeatureParameter, HyperParameterTrainingJobSummary, HyperParameterTuningJobCompletionDetails, HyperParameterTuningJobConsumedResources, InfraCheckConfig, LastUpdateStatus, MemberDefinition, MlflowConfig, ModelArtifacts, ModelClientConfig, ModelPackageConfig, NotificationConfiguration, ObjectiveStatusCounters, OfflineStoreStatus, OptimizationConfig, OptimizationJobOutputConfig, OptimizationVpcConfig, OwnershipSettings, ParallelismConfiguration, PartnerAppConfig, PartnerAppMaintenanceConfig, ProcessingInput, ProcessingOutputConfig, ProcessingResources, ProcessingStoppingCondition, ProductionVariantSummary, ProfilerConfig, ProfilerRuleConfiguration, RemoteDebugConfig, ServerlessJobConfig, ServiceCatalogProvisioningDetails, SourceIpConfig, SpaceSettings, SpaceSharingSettings, TensorBoardOutputConfig, TrainingJobStatusCounters, TrialComponentArtifact, TrialComponentParameterValue, TrialComponentStatus, WorkerAccessConfiguration } from "./models_2";
5
+ /**
6
+ * @public
7
+ */
8
+ export interface DescribeInferenceComponentInput {
9
+ /**
10
+ * <p>The name of the inference component.</p>
11
+ * @public
12
+ */
13
+ InferenceComponentName: string | undefined;
14
+ }
5
15
  /**
6
16
  * <p>Specifies the type and size of the endpoint capacity to activate for a rolling deployment or a rollback strategy. You can specify your batches as either of the following:</p> <ul> <li> <p>A count of inference component copies </p> </li> <li> <p>The overall percentage of your fleet </p> </li> </ul> <p>For a rollback strategy, if you don't specify the fields in this object, or if you set the <code>Value</code> parameter to 100%, then SageMaker AI uses a blue/green rollback strategy and rolls all traffic back to the blue fleet.</p>
7
17
  * @public
@@ -1361,6 +1371,11 @@ export interface DescribeModelCardRequest {
1361
1371
  * @public
1362
1372
  */
1363
1373
  ModelCardVersion?: number | undefined;
1374
+ /**
1375
+ * <p>Specifies the level of model card data to include in the response. Use this parameter to call <code>DescribeModelCard</code> without requiring <code>kms:Decrypt</code> permission on the customer-managed Amazon Web Services KMS key.</p> <ul> <li> <p> <code>AllData</code>: Returns the full model card <code>Content</code>. This option requires <code>kms:Decrypt</code> permission on the customer-managed key, if one is associated with the model card. This is the default.</p> </li> <li> <p> <code>MetadataOnly</code>: Returns the model card with sanitized <code>Content</code> that includes only a small set of unencrypted metadata fields. This option does not require <code>kms:Decrypt</code> permission. For the list of fields preserved in the response, see <code>Content</code>.</p> </li> </ul> <p>If you don't specify a value, SageMaker returns <code>AllData</code>.</p>
1376
+ * @public
1377
+ */
1378
+ IncludedData?: IncludedData | undefined;
1364
1379
  }
1365
1380
  /**
1366
1381
  * @public
@@ -1382,7 +1397,7 @@ export interface DescribeModelCardResponse {
1382
1397
  */
1383
1398
  ModelCardVersion: number | undefined;
1384
1399
  /**
1385
- * <p>The content of the model card.</p>
1400
+ * <p>The content of the model card. Content is provided as a string in the <a href="https://docs.aws.amazon.com/sagemaker/latest/dg/model-cards.html#model-cards-json-schema">model card JSON schema</a>.</p> <p>When you set <code>IncludedData</code> to <code>MetadataOnly</code> in the request, SageMaker returns a sanitized version of <code>Content</code> that includes only the following JSON paths, when present in the model card:</p> <ul> <li> <p> <code>model_overview.model_id</code> </p> </li> <li> <p> <code>model_overview.model_name</code> </p> </li> <li> <p> <code>intended_uses.risk_rating</code> </p> </li> <li> <p> <code>model_package_details.model_package_group_name</code> </p> </li> <li> <p> <code>model_package_details.model_package_arn</code> </p> </li> </ul> <p>All other fields are removed from <code>Content</code> when <code>IncludedData</code> is <code>MetadataOnly</code>, including model description, training details, evaluation details, business details, and additional information. To retrieve the complete <code>Content</code>, set <code>IncludedData</code> to <code>AllData</code> or omit the parameter.</p>
1386
1401
  * @public
1387
1402
  */
1388
1403
  Content: string | undefined;
@@ -1577,6 +1592,11 @@ export interface DescribeModelPackageInput {
1577
1592
  * @public
1578
1593
  */
1579
1594
  ModelPackageName: string | undefined;
1595
+ /**
1596
+ * <p>Specifies the level of model package data to include in the response. Use this parameter to call <code>DescribeModelPackage</code> on a model package that has an associated model card without requiring <code>kms:Decrypt</code> permission on the customer-managed KMS key associated with the embedded model card.</p> <ul> <li> <p> <code>AllData</code>: Returns the full model package response, including the unredacted <code>ModelCard.ModelCardContent</code>. This option requires <code>kms:Decrypt</code> permission on the customer-managed key, if one is associated with the embedded model card. This is the default.</p> </li> <li> <p> <code>MetadataOnly</code>: Returns the full model package response, but with the embedded <code>ModelCard.ModelCardContent</code> sanitized to include only a small set of unencrypted metadata fields. This option does not require <code>kms:Decrypt</code> permission. All other top-level response fields, including <code>InferenceSpecification</code>, <code>ModelMetrics</code>, <code>DriftCheckBaselines</code>, and <code>SecurityConfig</code>, are returned unchanged. For the list of fields preserved within <code>ModelCardContent</code>, see <a href="https://docs.aws.amazon.com/sagemaker/latest/APIReference/API_DescribeModelPackage.html#sagemaker-DescribeModelPackage-response-ModelCard">ModelCard</a>.</p> </li> </ul> <p>If you don't specify a value, SageMaker returns <code>AllData</code>.</p>
1597
+ * @public
1598
+ */
1599
+ IncludedData?: IncludedData | undefined;
1580
1600
  }
1581
1601
  /**
1582
1602
  * <p>Represents the overall status of a model package.</p>
@@ -1765,7 +1785,7 @@ export interface DescribeModelPackageOutput {
1765
1785
  */
1766
1786
  SecurityConfig?: ModelPackageSecurityConfig | undefined;
1767
1787
  /**
1768
- * <p>The model card associated with the model package. Since <code>ModelPackageModelCard</code> is tied to a model package, it is a specific usage of a model card and its schema is simplified compared to the schema of <code>ModelCard</code>. The <code>ModelPackageModelCard</code> schema does not include <code>model_package_details</code>, and <code>model_overview</code> is composed of the <code>model_creator</code> and <code>model_artifact</code> properties. For more information about the model package model card schema, see <a href="https://docs.aws.amazon.com/sagemaker/latest/dg/model-registry-details.html#model-card-schema">Model package model card schema</a>. For more information about the model card associated with the model package, see <a href="https://docs.aws.amazon.com/sagemaker/latest/dg/model-registry-details.html">View the Details of a Model Version</a>.</p>
1788
+ * <p>The model card associated with the model package. Since <code>ModelPackageModelCard</code> is tied to a model package, it is a specific usage of a model card and its schema is simplified compared to the schema of <code>ModelCard</code>. The <code>ModelPackageModelCard</code> schema does not include <code>model_package_details</code>, and <code>model_overview</code> is composed of the <code>model_creator</code> and <code>model_artifact</code> properties. For more information about the model package model card schema, see <a href="https://docs.aws.amazon.com/sagemaker/latest/dg/model-registry-details.html#model-card-schema">Model package model card schema</a>. For more information about the model card associated with the model package, see <a href="https://docs.aws.amazon.com/sagemaker/latest/dg/model-registry-details.html">View the Details of a Model Version</a>.</p> <p>When you set <code>IncludedData</code> to <code>MetadataOnly</code> in the request, <code>ModelCardStatus</code> is preserved and <code>ModelCardContent</code> is sanitized to include only the following JSON paths, when present in the model card:</p> <ul> <li> <p> <code>model_overview.model_id</code> </p> </li> <li> <p> <code>model_overview.model_name</code> </p> </li> <li> <p> <code>intended_uses.risk_rating</code> </p> </li> <li> <p> <code>model_package_details.model_package_group_name</code> </p> </li> <li> <p> <code>model_package_details.model_package_arn</code> </p> </li> </ul> <p>Because the <code>ModelPackageModelCard</code> schema does not include <code>model_package_details</code> and limits <code>model_overview</code> to <code>model_creator</code> and <code>model_artifact</code>, the sanitized <code>ModelCardContent</code> for a model package typically contains only <code>intended_uses.risk_rating</code> if it was provided when the model card was created. 
To retrieve the complete <code>ModelCardContent</code>, set <code>IncludedData</code> to <code>AllData</code> or omit the parameter.</p>
1769
1789
  * @public
1770
1790
  */
1771
1791
  ModelCard?: ModelPackageModelCard | undefined;
@@ -6891,6 +6911,83 @@ export interface InferenceRecommendationsJobStep {
6891
6911
  */
6892
6912
  InferenceBenchmark?: RecommendationJobInferenceBenchmark | undefined;
6893
6913
  }
6914
+ /**
6915
+ * Search shape for Job. Mirrors DescribeJobResponse fields.
6916
+ * If you update DescribeJobResponse, update this structure as well.
6917
+ * @public
6918
+ */
6919
+ export interface Job {
6920
+ /**
6921
+ * <p>The name of the job.</p>
6922
+ * @public
6923
+ */
6924
+ JobName?: string | undefined;
6925
+ /**
6926
+ * <p>The Amazon Resource Name (ARN) of the job.</p>
6927
+ * @public
6928
+ */
6929
+ JobArn?: string | undefined;
6930
+ /**
6931
+ * <p>The ARN of the IAM role associated with the job.</p>
6932
+ * @public
6933
+ */
6934
+ RoleArn?: string | undefined;
6935
+ /**
6936
+ * <p>The category of the job.</p>
6937
+ * @public
6938
+ */
6939
+ JobCategory?: JobCategory | undefined;
6940
+ /**
6941
+ * <p>The schema version used for the job configuration document.</p>
6942
+ * @public
6943
+ */
6944
+ JobConfigSchemaVersion?: string | undefined;
6945
+ /**
6946
+ * <p>The JSON configuration document for the job.</p>
6947
+ * @public
6948
+ */
6949
+ JobConfigDocument?: string | undefined;
6950
+ /**
6951
+ * <p>The date and time that the job was created.</p>
6952
+ * @public
6953
+ */
6954
+ CreationTime?: Date | undefined;
6955
+ /**
6956
+ * <p>The date and time that the job was last modified.</p>
6957
+ * @public
6958
+ */
6959
+ LastModifiedTime?: Date | undefined;
6960
+ /**
6961
+ * <p>The date and time that the job ended.</p>
6962
+ * @public
6963
+ */
6964
+ EndTime?: Date | undefined;
6965
+ /**
6966
+ * <p>The current status of the job.</p>
6967
+ * @public
6968
+ */
6969
+ JobStatus?: JobStatus | undefined;
6970
+ /**
6971
+ * <p>The detailed secondary status of the job, providing more granular information about the job's progress.</p>
6972
+ * @public
6973
+ */
6974
+ SecondaryStatus?: JobSecondaryStatus | undefined;
6975
+ /**
6976
+ * <p>A list of secondary status transitions for the job, with timestamps and optional status messages.</p>
6977
+ * @public
6978
+ */
6979
+ SecondaryStatusTransitions?: JobSecondaryStatusTransition[] | undefined;
6980
+ /**
6981
+ * <p>If the job failed, the reason it failed.</p>
6982
+ * @public
6983
+ */
6984
+ FailureReason?: string | undefined;
6985
+ /**
6986
+ * <p>The tags associated with the job.</p>
6987
+ * @public
6988
+ */
6989
+ Tags?: Tag[] | undefined;
6990
+ }
6894
6991
  /**
6895
6992
  * <p>Provides summary information about a job configuration schema version.</p>
6896
6993
  * @public
@@ -9736,48 +9833,3 @@ export interface ListInferenceRecommendationsJobsResponse {
9736
9833
  */
9737
9834
  NextToken?: string | undefined;
9738
9835
  }
9739
- /**
9740
- * @public
9741
- */
9742
- export interface ListInferenceRecommendationsJobStepsRequest {
9743
- /**
9744
- * <p>The name for the Inference Recommender job.</p>
9745
- * @public
9746
- */
9747
- JobName: string | undefined;
9748
- /**
9749
- * <p>A filter to return benchmarks of a specified status. If this field is left empty, then all benchmarks are returned.</p>
9750
- * @public
9751
- */
9752
- Status?: RecommendationJobStatus | undefined;
9753
- /**
9754
- * <p>A filter to return details about the specified type of subtask.</p> <p> <code>BENCHMARK</code>: Evaluate the performance of your model on different instance types.</p>
9755
- * @public
9756
- */
9757
- StepType?: RecommendationStepType | undefined;
9758
- /**
9759
- * <p>The maximum number of results to return.</p>
9760
- * @public
9761
- */
9762
- MaxResults?: number | undefined;
9763
- /**
9764
- * <p>A token that you can specify to return more results from the list. Specify this field if you have a token that was returned from a previous request.</p>
9765
- * @public
9766
- */
9767
- NextToken?: string | undefined;
9768
- }
9769
- /**
9770
- * @public
9771
- */
9772
- export interface ListInferenceRecommendationsJobStepsResponse {
9773
- /**
9774
- * <p>A list of all subtask details in Inference Recommender.</p>
9775
- * @public
9776
- */
9777
- Steps?: InferenceRecommendationsJobStep[] | undefined;
9778
- /**
9779
- * <p>A token that you can specify in your next request to return more results from the list.</p>
9780
- * @public
9781
- */
9782
- NextToken?: string | undefined;
9783
- }
@@ -1,8 +1,53 @@
1
- import type { _InstanceType, AccountDefaultStatus, ActionStatus, ActivationState, AppNetworkAccessType, AppSecurityGroupManagement, AppType, BatchStrategy, ClusterNodeProvisioningMode, ClusterNodeRecovery, CrossAccountFilterOption, Direction, EndpointStatus, ExecutionStatus, FeatureStatus, HomeEfsFileSystemCreation, HubContentSupportStatus, HubContentType, InferenceExperimentStopDesiredState, IPAddressType, IsTrackingServerActive, JobCategory, JobStatus, JobType, LabelingJobStatus, LineageType, ListLabelingJobsForWorkteamSortByOptions, ListOptimizationJobsSortBy, ListWorkforcesSortByOptions, ListWorkteamsSortByOptions, MlflowAppStatus, ModelApprovalStatus, ModelCardExportJobSortBy, ModelCardExportJobSortOrder, ModelCardExportJobStatus, ModelCardSortBy, ModelCardSortOrder, ModelCardStatus, ModelCardVersionSortBy, ModelMetadataFilterType, ModelPackageGroupSortBy, ModelPackageGroupStatus, ModelPackageRegistrationType, ModelPackageSortBy, ModelPackageStatus, ModelPackageType, ModelRegistrationMode, ModelSortKey, ModelVariantAction, MonitoringAlertHistorySortKey, MonitoringAlertStatus, MonitoringExecutionSortKey, MonitoringJobDefinitionSortKey, MonitoringScheduleSortKey, MonitoringType, NotebookInstanceAcceleratorType, NotebookInstanceLifecycleConfigSortKey, NotebookInstanceLifecycleConfigSortOrder, NotebookInstanceSortKey, NotebookInstanceSortOrder, NotebookInstanceStatus, OptimizationJobDeploymentInstanceType, OptimizationJobStatus, OrderKey, PartnerAppStatus, PartnerAppType, PipelineExecutionStatus, PipelineStatus, ProcessingJobStatus, Processor, ProjectSortBy, ProjectSortOrder, ProjectStatus, Relation, ReservedCapacityInstanceType, ReservedCapacityType, ResourceCatalogSortBy, ResourceCatalogSortOrder, RootAccess, SageMakerResourceName, ScheduleStatus, SecondaryStatus, SharingType, SkipModelValidation, SortBy, SortLineageGroupsBy, SortMlflowAppBy, SortOrder, SortPipelineExecutionsBy, SortPipelinesBy, SortTrackingServerBy, SortTrialComponentsBy, SortTrialsBy, 
SpaceSortKey, SpaceStatus, StepStatus, StudioLifecycleConfigAppType, StudioLifecycleConfigSortKey, TagPropagation, ThroughputMode, TrackingServerSize, TrackingServerStatus, TrainingJobSortByOptions, TrainingJobStatus, TrainingPlanFilterName, TrainingPlanSortBy, TrainingPlanSortOrder, TrainingPlanStatus, TransformJobStatus, UltraServerHealthStatus, UserProfileSortKey, UserProfileStatus, VariantPropertyType, VendorGuidance, WarmPoolResourceStatus } from "./enums";
2
- import type { AdditionalInferenceSpecificationDefinition, AlgorithmSpecification, AppSpecification, AutoMLJobStepMetadata, BatchDataCaptureConfig, BatchTransformInput, BedrockCustomModelDeploymentMetadata, BedrockCustomModelMetadata, BedrockModelImportMetadata, BedrockProvisionedModelThroughputMetadata, CacheHitResult, CallbackStepMetadata, Channel, CheckpointConfig, ClarifyCheckStepMetadata, ClusterAutoScalingConfig, ClusterInstanceGroupSpecification, ClusterOrchestrator, ClusterRestrictedInstanceGroupsConfig, ClusterRestrictedInstanceGroupSpecification, ClusterTieredStorageConfig, CodeEditorAppImageConfig, ComputeQuotaConfig, ComputeQuotaTarget, DeploymentConfiguration, InferenceSpecification, JupyterLabAppImageConfig, KernelGatewayImageConfig, OutputDataConfig, OutputParameter, ResourceConfig, StoppingCondition, Tag, TransformInput, TransformOutput, TransformResources, UserContext, VpcConfig } from "./models_0";
3
- import type { ConditionStepMetadata, ContainerDefinition, DefaultSpaceSettings, DeploymentConfig, DriftCheckBaselines, EdgeOutputConfig, FeatureDefinition, InferenceComponentRuntimeConfig, InferenceComponentSpecification, InferenceExecutionConfig, InferenceExperimentDataStorageConfig, InferenceExperimentSchedule, InstanceMetadataServiceConfiguration, ManagedConfiguration, MetadataProperties, ModelCardSecurityConfig, ModelLifeCycle, ModelMetrics, ModelPackageModelCard, ModelPackageSecurityConfig, ModelPackageValidationSpecification, ModelVariantConfig, MonitoringScheduleConfig, NetworkConfig, NotebookInstanceLifecycleHook, RetryStrategy, SchedulerConfig, ShadowModeConfig, SourceAlgorithmSpecification, TtlDuration, UiTemplate, UserSettings } from "./models_1";
1
+ import type { _InstanceType, AccountDefaultStatus, ActionStatus, ActivationState, AppNetworkAccessType, AppSecurityGroupManagement, AppType, BatchStrategy, ClusterNodeProvisioningMode, ClusterNodeRecovery, CrossAccountFilterOption, Direction, EndpointStatus, ExecutionStatus, FeatureStatus, HomeEfsFileSystemCreation, HubContentSupportStatus, HubContentType, InferenceExperimentStopDesiredState, IPAddressType, IsTrackingServerActive, JobCategory, JobStatus, JobType, LabelingJobStatus, LineageType, ListLabelingJobsForWorkteamSortByOptions, ListOptimizationJobsSortBy, ListWorkforcesSortByOptions, ListWorkteamsSortByOptions, MlflowAppStatus, ModelApprovalStatus, ModelCardExportJobSortBy, ModelCardExportJobSortOrder, ModelCardExportJobStatus, ModelCardSortBy, ModelCardSortOrder, ModelCardStatus, ModelCardVersionSortBy, ModelMetadataFilterType, ModelPackageGroupSortBy, ModelPackageGroupStatus, ModelPackageRegistrationType, ModelPackageSortBy, ModelPackageStatus, ModelPackageType, ModelRegistrationMode, ModelSortKey, ModelVariantAction, MonitoringAlertHistorySortKey, MonitoringAlertStatus, MonitoringExecutionSortKey, MonitoringJobDefinitionSortKey, MonitoringScheduleSortKey, MonitoringType, NotebookInstanceAcceleratorType, NotebookInstanceLifecycleConfigSortKey, NotebookInstanceLifecycleConfigSortOrder, NotebookInstanceSortKey, NotebookInstanceSortOrder, NotebookInstanceStatus, OptimizationJobDeploymentInstanceType, OptimizationJobStatus, OrderKey, PartnerAppStatus, PartnerAppType, PipelineExecutionStatus, PipelineStatus, ProcessingJobStatus, Processor, ProjectSortBy, ProjectSortOrder, ProjectStatus, RecommendationJobStatus, RecommendationStepType, Relation, ReservedCapacityInstanceType, ReservedCapacityType, ResourceCatalogSortBy, ResourceCatalogSortOrder, RootAccess, SageMakerResourceName, ScheduleStatus, SecondaryStatus, SharingType, SkipModelValidation, SortBy, SortLineageGroupsBy, SortMlflowAppBy, SortOrder, SortPipelineExecutionsBy, SortPipelinesBy, 
SortTrackingServerBy, SortTrialComponentsBy, SortTrialsBy, SpaceSortKey, SpaceStatus, StepStatus, StudioLifecycleConfigAppType, StudioLifecycleConfigSortKey, TagPropagation, ThroughputMode, TrackingServerSize, TrackingServerStatus, TrainingJobSortByOptions, TrainingJobStatus, TrainingPlanFilterName, TrainingPlanSortBy, TrainingPlanSortOrder, TrainingPlanStatus, TransformJobStatus, UltraServerHealthStatus, UserProfileSortKey, UserProfileStatus, VariantPropertyType, VendorGuidance, WarmPoolResourceStatus } from "./enums";
2
+ import type { AdditionalInferenceSpecificationDefinition, AlgorithmSpecification, AppSpecification, AutoMLJobStepMetadata, BatchDataCaptureConfig, BatchTransformInput, BedrockCustomModelDeploymentMetadata, BedrockCustomModelMetadata, BedrockModelImportMetadata, BedrockProvisionedModelThroughputMetadata, CacheHitResult, CallbackStepMetadata, Channel, CheckpointConfig, ClarifyCheckStepMetadata, ClusterAutoScalingConfig, ClusterInstanceGroupSpecification, ClusterOrchestrator, ClusterRestrictedInstanceGroupsConfig, ClusterRestrictedInstanceGroupSpecification, ClusterTieredStorageConfig, CodeEditorAppImageConfig, ComputeQuotaConfig, DeploymentConfiguration, InferenceSpecification, JupyterLabAppImageConfig, KernelGatewayImageConfig, OutputDataConfig, OutputParameter, ResourceConfig, StoppingCondition, Tag, TransformInput, TransformOutput, TransformResources, UserContext, VpcConfig } from "./models_0";
3
+ import type { ComputeQuotaTarget, ConditionStepMetadata, ContainerDefinition, DefaultSpaceSettings, DeploymentConfig, DriftCheckBaselines, EdgeOutputConfig, FeatureDefinition, InferenceComponentRuntimeConfig, InferenceComponentSpecification, InferenceExecutionConfig, InferenceExperimentDataStorageConfig, InferenceExperimentSchedule, InstanceMetadataServiceConfiguration, ManagedConfiguration, MetadataProperties, ModelCardSecurityConfig, ModelLifeCycle, ModelMetrics, ModelPackageModelCard, ModelPackageSecurityConfig, ModelPackageValidationSpecification, ModelVariantConfig, MonitoringScheduleConfig, NetworkConfig, RetryStrategy, SchedulerConfig, ShadowModeConfig, SourceAlgorithmSpecification, TtlDuration, UiTemplate, UserSettings } from "./models_1";
4
4
  import type { DataProcessing, DebugHookConfig, DebugRuleConfiguration, DebugRuleEvaluationStatus, DeploymentRecommendation, ExperimentConfig, FeatureParameter, HyperParameterTrainingJobSummary, InstanceGroupHealthCheckConfiguration, ModelArtifacts, ModelClientConfig, ModelPackageConfig, ParallelismConfiguration, ProcessingInput, ProcessingOutputConfig, ProcessingResources, ProcessingStoppingCondition, ProfilerConfig, ServiceCatalogProvisioningDetails, SpaceStorageSettings, TensorBoardOutputConfig, TrialComponentArtifact, TrialComponentParameterValue, TrialComponentStatus } from "./models_2";
5
- import type { DesiredWeightAndCapacity, Device, DeviceDeploymentSummary, DomainSettingsForUpdate, Edge, EMRStepMetadata, Endpoint, EndpointConfigStepMetadata, EndpointStepMetadata, Experiment, FailStepMetadata, FeatureGroup, FeatureMetadata, Filter, GitConfigForUpdate, HyperParameterTuningJobSearchEntity, InferenceComponentDeploymentConfig, InferenceComponentMetadata, JobConfigSchemaVersionSummary, JobStepMetadata, JobSummary, LabelingJobForWorkteamSummary, LabelingJobSummary, LambdaStepMetadata, LineageGroupSummary, LineageMetadata, MetricData, ModelPackageStatusDetails, MonitoringExecutionSummary, MonitoringJobDefinitionSummary, PipelineExperimentConfig, ReservedCapacitySummary, SecondaryStatusTransition, SelectiveExecutionConfig, ServiceCatalogProvisionedProductDetails, SubscribedWorkteam, TemplateProviderDetail, TrialComponentMetricSummary, TrialComponentSource, TrialSource, WarmPoolStatus, Workforce, Workteam } from "./models_3";
5
+ import type { DesiredWeightAndCapacity, Device, DeviceDeploymentSummary, DomainSettingsForUpdate, Edge, EMRStepMetadata, Endpoint, EndpointConfigStepMetadata, EndpointStepMetadata, Experiment, FailStepMetadata, FeatureGroup, FeatureMetadata, Filter, GitConfigForUpdate, HyperParameterTuningJobSearchEntity, InferenceComponentDeploymentConfig, InferenceComponentMetadata, InferenceRecommendationsJobStep, Job, JobConfigSchemaVersionSummary, JobStepMetadata, JobSummary, LabelingJobForWorkteamSummary, LabelingJobSummary, LambdaStepMetadata, LineageGroupSummary, LineageMetadata, MetricData, ModelPackageStatusDetails, MonitoringExecutionSummary, MonitoringJobDefinitionSummary, PipelineExperimentConfig, ReservedCapacitySummary, SecondaryStatusTransition, SelectiveExecutionConfig, ServiceCatalogProvisionedProductDetails, SubscribedWorkteam, TemplateProviderDetail, TrialComponentMetricSummary, TrialComponentSource, TrialSource, WarmPoolStatus, Workforce, Workteam } from "./models_3";
6
+ /**
7
+ * @public
8
+ */
9
+ export interface ListInferenceRecommendationsJobStepsRequest {
10
+ /**
11
+ * <p>The name for the Inference Recommender job.</p>
12
+ * @public
13
+ */
14
+ JobName: string | undefined;
15
+ /**
16
+ * <p>A filter to return benchmarks of a specified status. If this field is left empty, then all benchmarks are returned.</p>
17
+ * @public
18
+ */
19
+ Status?: RecommendationJobStatus | undefined;
20
+ /**
21
+ * <p>A filter to return details about the specified type of subtask.</p> <p> <code>BENCHMARK</code>: Evaluate the performance of your model on different instance types.</p>
22
+ * @public
23
+ */
24
+ StepType?: RecommendationStepType | undefined;
25
+ /**
26
+ * <p>The maximum number of results to return.</p>
27
+ * @public
28
+ */
29
+ MaxResults?: number | undefined;
30
+ /**
31
+ * <p>A token that you can specify to return more results from the list. Specify this field if you have a token that was returned from a previous request.</p>
32
+ * @public
33
+ */
34
+ NextToken?: string | undefined;
35
+ }
36
+ /**
37
+ * @public
38
+ */
39
+ export interface ListInferenceRecommendationsJobStepsResponse {
40
+ /**
41
+ * <p>A list of all subtask details in Inference Recommender.</p>
42
+ * @public
43
+ */
44
+ Steps?: InferenceRecommendationsJobStep[] | undefined;
45
+ /**
46
+ * <p>A token that you can specify in your next request to return more results from the list.</p>
47
+ * @public
48
+ */
49
+ NextToken?: string | undefined;
50
+ }
6
51
  /**
7
52
  * @public
8
53
  */
@@ -6504,6 +6549,12 @@ export interface SearchRecord {
6504
6549
  * @public
6505
6550
  */
6506
6551
  Model?: ModelDashboardModel | undefined;
6552
+ /**
6553
+ * Search shape for Job. Mirrors DescribeJobResponse fields.
6554
+ * If you update DescribeJobResponse, update this structure as well.
6555
+ * @public
6556
+ */
6557
+ Job?: Job | undefined;
6507
6558
  }
6508
6559
  /**
6509
6560
  * <p>Represents the total number of matching results and indicates how accurate that count is.</p> <p>The <code>Value</code> field provides the count, which may be exact or estimated. The <code>Relation</code> field indicates whether it's an exact figure or a lower bound. This helps understand the full scope of search results, especially when dealing with large result sets.</p>
@@ -8631,28 +8682,3 @@ export interface UpdateNotebookInstanceInput {
8631
8682
  */
8632
8683
  InstanceMetadataServiceConfiguration?: InstanceMetadataServiceConfiguration | undefined;
8633
8684
  }
8634
- /**
8635
- * @public
8636
- */
8637
- export interface UpdateNotebookInstanceOutput {
8638
- }
8639
- /**
8640
- * @public
8641
- */
8642
- export interface UpdateNotebookInstanceLifecycleConfigInput {
8643
- /**
8644
- * <p>The name of the lifecycle configuration.</p>
8645
- * @public
8646
- */
8647
- NotebookInstanceLifecycleConfigName: string | undefined;
8648
- /**
8649
- * <p>The shell script that runs only once, when you create a notebook instance. The shell script must be a base64-encoded string.</p>
8650
- * @public
8651
- */
8652
- OnCreate?: NotebookInstanceLifecycleHook[] | undefined;
8653
- /**
8654
- * <p>The shell script that runs every time you start a notebook instance, including when you create the notebook instance. The shell script must be a base64-encoded string.</p>
8655
- * @public
8656
- */
8657
- OnStart?: NotebookInstanceLifecycleHook[] | undefined;
8658
- }
@@ -1,9 +1,34 @@
1
1
  import type { BooleanOperator, CrossAccountFilterOption, ResourceType, SearchSortOrder, WorkforceIpAddressType } from "./enums";
2
2
  import type { CfnUpdateTemplateProvider, Tag } from "./models_0";
3
- import type { UserSettings } from "./models_1";
3
+ import type { NotebookInstanceLifecycleHook, UserSettings } from "./models_1";
4
4
  import type { MemberDefinition, NotificationConfiguration, OidcConfig, ParallelismConfiguration, PartnerAppConfig, PartnerAppMaintenanceConfig, PipelineDefinitionS3Location, ProfilerRuleConfiguration, ProvisioningParameter, SourceIpConfig, SpaceSettings, TrialComponentArtifact, TrialComponentParameterValue, TrialComponentStatus, WorkerAccessConfiguration, WorkforceVpcConfigRequest } from "./models_2";
5
5
  import type { Filter, Workforce, Workteam } from "./models_3";
6
6
  import type { NestedFilters, ProfilerConfigForUpdate, RemoteDebugConfigForUpdate, ResourceConfigForUpdate, VisibilityConditions } from "./models_4";
7
+ /**
8
+ * @public
9
+ */
10
+ export interface UpdateNotebookInstanceOutput {
11
+ }
12
+ /**
13
+ * @public
14
+ */
15
+ export interface UpdateNotebookInstanceLifecycleConfigInput {
16
+ /**
17
+ * <p>The name of the lifecycle configuration.</p>
18
+ * @public
19
+ */
20
+ NotebookInstanceLifecycleConfigName: string | undefined;
21
+ /**
22
+ * <p>The shell script that runs only once, when you create a notebook instance. The shell script must be a base64-encoded string.</p>
23
+ * @public
24
+ */
25
+ OnCreate?: NotebookInstanceLifecycleHook[] | undefined;
26
+ /**
27
+ * <p>The shell script that runs every time you start a notebook instance, including when you create the notebook instance. The shell script must be a base64-encoded string.</p>
28
+ * @public
29
+ */
30
+ OnStart?: NotebookInstanceLifecycleHook[] | undefined;
31
+ }
7
32
  /**
8
33
  * @public
9
34
  */
@@ -32,6 +32,7 @@ export declare var AIBenchmarkOutputConfig$: StaticStructureSchema;
32
32
  export declare var AIBenchmarkOutputResult$: StaticStructureSchema;
33
33
  export declare var AICapacityReservationConfig$: StaticStructureSchema;
34
34
  export declare var AICloudWatchLogs$: StaticStructureSchema;
35
+ export declare var AIMlflowConfig$: StaticStructureSchema;
35
36
  export declare var AIModelSourceS3$: StaticStructureSchema;
36
37
  export declare var AIRecommendation$: StaticStructureSchema;
37
38
  export declare var AIRecommendationComputeSpec$: StaticStructureSchema;
@@ -815,6 +816,7 @@ export declare var InstancePoolSummary$: StaticStructureSchema;
815
816
  export declare var InstanceRequirementsEniConfiguration$: StaticStructureSchema;
816
817
  export declare var IntegerParameterRange$: StaticStructureSchema;
817
818
  export declare var IntegerParameterRangeSpecification$: StaticStructureSchema;
819
+ export declare var Job$: StaticStructureSchema;
818
820
  export declare var JobConfigSchemaVersionSummary$: StaticStructureSchema;
819
821
  export declare var JobSecondaryStatusTransition$: StaticStructureSchema;
820
822
  export declare var JobStepMetadata$: StaticStructureSchema;
@@ -1,7 +1,9 @@
1
1
  import { Command as $Command } from "@smithy/core/client";
2
2
  import { MetadataBearer as __MetadataBearer } from "@smithy/types";
3
- import { DescribeInferenceComponentInput } from "../models/models_2";
4
- import { DescribeInferenceComponentOutput } from "../models/models_3";
3
+ import {
4
+ DescribeInferenceComponentInput,
5
+ DescribeInferenceComponentOutput,
6
+ } from "../models/models_3";
5
7
  import {
6
8
  SageMakerClientResolvedConfig,
7
9
  ServiceInputTypes,
@@ -3,7 +3,7 @@ import { MetadataBearer as __MetadataBearer } from "@smithy/types";
3
3
  import {
4
4
  ListInferenceRecommendationsJobStepsRequest,
5
5
  ListInferenceRecommendationsJobStepsResponse,
6
- } from "../models/models_3";
6
+ } from "../models/models_4";
7
7
  import {
8
8
  SageMakerClientResolvedConfig,
9
9
  ServiceInputTypes,
@@ -1,9 +1,7 @@
1
1
  import { Command as $Command } from "@smithy/core/client";
2
2
  import { MetadataBearer as __MetadataBearer } from "@smithy/types";
3
- import {
4
- UpdateNotebookInstanceInput,
5
- UpdateNotebookInstanceOutput,
6
- } from "../models/models_4";
3
+ import { UpdateNotebookInstanceInput } from "../models/models_4";
4
+ import { UpdateNotebookInstanceOutput } from "../models/models_5";
7
5
  import {
8
6
  SageMakerClientResolvedConfig,
9
7
  ServiceInputTypes,
@@ -1,7 +1,9 @@
1
1
  import { Command as $Command } from "@smithy/core/client";
2
2
  import { MetadataBearer as __MetadataBearer } from "@smithy/types";
3
- import { UpdateNotebookInstanceLifecycleConfigInput } from "../models/models_4";
4
- import { UpdateNotebookInstanceLifecycleConfigOutput } from "../models/models_5";
3
+ import {
4
+ UpdateNotebookInstanceLifecycleConfigInput,
5
+ UpdateNotebookInstanceLifecycleConfigOutput,
6
+ } from "../models/models_5";
5
7
  import {
6
8
  SageMakerClientResolvedConfig,
7
9
  ServiceInputTypes,
@@ -3163,6 +3163,11 @@ export declare const TrackingServerStatus: {
3163
3163
  };
3164
3164
  export type TrackingServerStatus =
3165
3165
  (typeof TrackingServerStatus)[keyof typeof TrackingServerStatus];
3166
+ export declare const IncludedData: {
3167
+ readonly ALL_DATA: "AllData";
3168
+ readonly METADATA_ONLY: "MetadataOnly";
3169
+ };
3170
+ export type IncludedData = (typeof IncludedData)[keyof typeof IncludedData];
3166
3171
  export declare const ModelCardProcessingStatus: {
3167
3172
  readonly CONTENT_DELETED: "ContentDeleted";
3168
3173
  readonly DELETE_COMPLETED: "DeleteCompleted";
@@ -3483,6 +3488,7 @@ export declare const ResourceType: {
3483
3488
  readonly HYPER_PARAMETER_TUNING_JOB: "HyperParameterTuningJob";
3484
3489
  readonly IMAGE: "Image";
3485
3490
  readonly IMAGE_VERSION: "ImageVersion";
3491
+ readonly JOB: "Job";
3486
3492
  readonly MODEL: "Model";
3487
3493
  readonly MODEL_CARD: "ModelCard";
3488
3494
  readonly MODEL_PACKAGE: "ModelPackage";
@@ -252,8 +252,14 @@ export interface VpcConfig {
252
252
  export interface AIBenchmarkNetworkConfig {
253
253
  VpcConfig?: VpcConfig | undefined;
254
254
  }
255
+ export interface AIMlflowConfig {
256
+ MlflowResourceArn: string | undefined;
257
+ MlflowExperimentName?: string | undefined;
258
+ MlflowRunName?: string | undefined;
259
+ }
255
260
  export interface AIBenchmarkOutputConfig {
256
261
  S3OutputLocation: string | undefined;
262
+ MlflowConfig?: AIMlflowConfig | undefined;
257
263
  }
258
264
  export interface AICloudWatchLogs {
259
265
  LogGroupArn?: string | undefined;
@@ -262,6 +268,7 @@ export interface AICloudWatchLogs {
262
268
  export interface AIBenchmarkOutputResult {
263
269
  S3OutputLocation: string | undefined;
264
270
  CloudWatchLogs?: AICloudWatchLogs[] | undefined;
271
+ MlflowConfig?: AIMlflowConfig | undefined;
265
272
  }
266
273
  export type AIBenchmarkTarget =
267
274
  | AIBenchmarkTarget.EndpointMember
@@ -391,10 +398,12 @@ export interface AIRecommendationJobSummary {
391
398
  export interface AIRecommendationOutputConfig {
392
399
  S3OutputLocation?: string | undefined;
393
400
  ModelPackageGroupIdentifier?: string | undefined;
401
+ MlflowConfig?: AIMlflowConfig | undefined;
394
402
  }
395
403
  export interface AIRecommendationOutputResult {
396
404
  S3OutputLocation: string | undefined;
397
405
  ModelPackageGroupIdentifier?: string | undefined;
406
+ MlflowConfig?: AIMlflowConfig | undefined;
398
407
  }
399
408
  export interface AIRecommendationPerformanceTarget {
400
409
  Constraints: AIRecommendationConstraint[] | undefined;
@@ -1934,7 +1943,3 @@ export interface ComputeQuotaConfig {
1934
1943
  ResourceSharingConfig?: ResourceSharingConfig | undefined;
1935
1944
  PreemptTeamTasks?: PreemptTeamTasks | undefined;
1936
1945
  }
1937
- export interface ComputeQuotaTarget {
1938
- TeamName: string | undefined;
1939
- FairShareWeight?: number | undefined;
1940
- }
@@ -157,7 +157,6 @@ import {
157
157
  CodeRepository,
158
158
  CollectionConfig,
159
159
  ComputeQuotaConfig,
160
- ComputeQuotaTarget,
161
160
  CustomImage,
162
161
  GitConfig,
163
162
  InferenceSpecification,
@@ -174,6 +173,10 @@ import {
174
173
  TransformJobDefinition,
175
174
  VpcConfig,
176
175
  } from "./models_0";
176
+ export interface ComputeQuotaTarget {
177
+ TeamName: string | undefined;
178
+ FairShareWeight?: number | undefined;
179
+ }
177
180
  export interface ComputeQuotaSummary {
178
181
  ComputeQuotaArn: string | undefined;
179
182
  ComputeQuotaId: string | undefined;
@@ -1931,7 +1934,3 @@ export interface ModelQuantizationConfig {
1931
1934
  Image?: string | undefined;
1932
1935
  OverrideEnvironment?: Record<string, string> | undefined;
1933
1936
  }
1934
- export interface ModelShardingConfig {
1935
- Image?: string | undefined;
1936
- OverrideEnvironment?: Record<string, string> | undefined;
1937
- }
@@ -139,7 +139,6 @@ import {
139
139
  CognitoMemberDefinition,
140
140
  CollectionConfiguration,
141
141
  ComputeQuotaConfig,
142
- ComputeQuotaTarget,
143
142
  GitConfig,
144
143
  InferenceSpecification,
145
144
  JupyterLabAppImageConfig,
@@ -156,6 +155,7 @@ import {
156
155
  VpcConfig,
157
156
  } from "./models_0";
158
157
  import {
158
+ ComputeQuotaTarget,
159
159
  ContextSource,
160
160
  DataCaptureConfig,
161
161
  DataQualityAppSpecification,
@@ -186,7 +186,6 @@ import {
186
186
  ModelCompilationConfig,
187
187
  ModelDeployConfig,
188
188
  ModelQuantizationConfig,
189
- ModelShardingConfig,
190
189
  MonitoringNetworkConfig,
191
190
  MonitoringOutputConfig,
192
191
  MonitoringResources,
@@ -207,6 +206,10 @@ import {
207
206
  TrainingSpecification,
208
207
  UserSettings,
209
208
  } from "./models_1";
209
+ export interface ModelShardingConfig {
210
+ Image?: string | undefined;
211
+ OverrideEnvironment?: Record<string, string> | undefined;
212
+ }
210
213
  export interface ModelSpeculativeDecodingTrainingDataSource {
211
214
  S3Uri: string | undefined;
212
215
  S3DataType: ModelSpeculativeDecodingS3DataType | undefined;
@@ -2009,6 +2012,3 @@ export interface DescribeImageVersionResponse {
2009
2012
  Horovod?: boolean | undefined;
2010
2013
  ReleaseNotes?: string | undefined;
2011
2014
  }
2012
- export interface DescribeInferenceComponentInput {
2013
- InferenceComponentName: string | undefined;
2014
- }