@aws-sdk/client-sagemaker 3.1057.0 → 3.1059.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (87)
  1. package/README.md +49 -0
  2. package/dist-cjs/index.js +139 -0
  3. package/dist-cjs/schemas/schemas_0.js +191 -36
  4. package/dist-es/SageMaker.js +18 -0
  5. package/dist-es/commands/CreateJobCommand.js +16 -0
  6. package/dist-es/commands/DeleteJobCommand.js +16 -0
  7. package/dist-es/commands/DescribeJobCommand.js +16 -0
  8. package/dist-es/commands/DescribeJobSchemaVersionCommand.js +16 -0
  9. package/dist-es/commands/ListJobSchemaVersionsCommand.js +16 -0
  10. package/dist-es/commands/ListJobsCommand.js +16 -0
  11. package/dist-es/commands/StopJobCommand.js +16 -0
  12. package/dist-es/commands/index.js +7 -0
  13. package/dist-es/models/enums.js +30 -0
  14. package/dist-es/pagination/ListJobSchemaVersionsPaginator.js +4 -0
  15. package/dist-es/pagination/ListJobsPaginator.js +4 -0
  16. package/dist-es/pagination/index.js +2 -0
  17. package/dist-es/schemas/schemas_0.js +157 -2
  18. package/dist-types/SageMaker.d.ts +63 -0
  19. package/dist-types/SageMakerClient.d.ts +9 -2
  20. package/dist-types/commands/CreateJobCommand.d.ts +95 -0
  21. package/dist-types/commands/DeleteJobCommand.d.ts +81 -0
  22. package/dist-types/commands/DescribeJobCommand.d.ts +105 -0
  23. package/dist-types/commands/DescribeJobSchemaVersionCommand.d.ts +82 -0
  24. package/dist-types/commands/ListJobSchemaVersionsCommand.d.ts +86 -0
  25. package/dist-types/commands/ListJobsCommand.d.ts +98 -0
  26. package/dist-types/commands/ListLabelingJobsCommand.d.ts +1 -1
  27. package/dist-types/commands/ListLabelingJobsForWorkteamCommand.d.ts +1 -1
  28. package/dist-types/commands/ListLineageGroupsCommand.d.ts +1 -1
  29. package/dist-types/commands/ListMlflowAppsCommand.d.ts +1 -1
  30. package/dist-types/commands/ListMlflowTrackingServersCommand.d.ts +1 -1
  31. package/dist-types/commands/ListPipelineExecutionStepsCommand.d.ts +3 -0
  32. package/dist-types/commands/StopJobCommand.d.ts +78 -0
  33. package/dist-types/commands/UpdateNotebookInstanceLifecycleConfigCommand.d.ts +2 -1
  34. package/dist-types/commands/UpdatePartnerAppCommand.d.ts +1 -1
  35. package/dist-types/commands/UpdatePipelineCommand.d.ts +1 -1
  36. package/dist-types/commands/UpdatePipelineExecutionCommand.d.ts +1 -1
  37. package/dist-types/commands/UpdatePipelineVersionCommand.d.ts +1 -1
  38. package/dist-types/commands/UpdateProjectCommand.d.ts +1 -1
  39. package/dist-types/commands/UpdateSpaceCommand.d.ts +1 -1
  40. package/dist-types/commands/UpdateTrainingJobCommand.d.ts +1 -1
  41. package/dist-types/commands/UpdateTrialCommand.d.ts +1 -2
  42. package/dist-types/commands/index.d.ts +7 -0
  43. package/dist-types/models/enums.d.ts +54 -0
  44. package/dist-types/models/models_1.d.ts +46 -33
  45. package/dist-types/models/models_2.d.ts +55 -77
  46. package/dist-types/models/models_3.d.ts +296 -390
  47. package/dist-types/models/models_4.d.ts +3902 -3732
  48. package/dist-types/models/models_5.d.ts +355 -2
  49. package/dist-types/pagination/ListJobSchemaVersionsPaginator.d.ts +7 -0
  50. package/dist-types/pagination/ListJobsPaginator.d.ts +7 -0
  51. package/dist-types/pagination/index.d.ts +2 -0
  52. package/dist-types/schemas/schemas_0.d.ts +25 -0
  53. package/dist-types/ts3.4/SageMaker.d.ts +133 -0
  54. package/dist-types/ts3.4/SageMakerClient.d.ts +42 -0
  55. package/dist-types/ts3.4/commands/CreateJobCommand.d.ts +45 -0
  56. package/dist-types/ts3.4/commands/DeleteJobCommand.d.ts +45 -0
  57. package/dist-types/ts3.4/commands/DescribeJobCommand.d.ts +49 -0
  58. package/dist-types/ts3.4/commands/DescribeJobSchemaVersionCommand.d.ts +53 -0
  59. package/dist-types/ts3.4/commands/ListJobSchemaVersionsCommand.d.ts +53 -0
  60. package/dist-types/ts3.4/commands/ListJobsCommand.d.ts +45 -0
  61. package/dist-types/ts3.4/commands/ListLabelingJobsCommand.d.ts +1 -1
  62. package/dist-types/ts3.4/commands/ListLabelingJobsForWorkteamCommand.d.ts +1 -1
  63. package/dist-types/ts3.4/commands/ListLineageGroupsCommand.d.ts +1 -1
  64. package/dist-types/ts3.4/commands/ListMlflowAppsCommand.d.ts +1 -1
  65. package/dist-types/ts3.4/commands/ListMlflowTrackingServersCommand.d.ts +1 -1
  66. package/dist-types/ts3.4/commands/StopJobCommand.d.ts +45 -0
  67. package/dist-types/ts3.4/commands/UpdateNotebookInstanceLifecycleConfigCommand.d.ts +2 -4
  68. package/dist-types/ts3.4/commands/UpdatePartnerAppCommand.d.ts +1 -1
  69. package/dist-types/ts3.4/commands/UpdatePipelineCommand.d.ts +1 -1
  70. package/dist-types/ts3.4/commands/UpdatePipelineExecutionCommand.d.ts +1 -1
  71. package/dist-types/ts3.4/commands/UpdatePipelineVersionCommand.d.ts +1 -1
  72. package/dist-types/ts3.4/commands/UpdateProjectCommand.d.ts +1 -1
  73. package/dist-types/ts3.4/commands/UpdateSpaceCommand.d.ts +1 -1
  74. package/dist-types/ts3.4/commands/UpdateTrainingJobCommand.d.ts +1 -1
  75. package/dist-types/ts3.4/commands/UpdateTrialCommand.d.ts +1 -2
  76. package/dist-types/ts3.4/commands/index.d.ts +7 -0
  77. package/dist-types/ts3.4/models/enums.d.ts +34 -0
  78. package/dist-types/ts3.4/models/models_1.d.ts +12 -10
  79. package/dist-types/ts3.4/models/models_2.d.ts +16 -21
  80. package/dist-types/ts3.4/models/models_3.d.ts +74 -96
  81. package/dist-types/ts3.4/models/models_4.d.ts +138 -97
  82. package/dist-types/ts3.4/models/models_5.d.ts +104 -1
  83. package/dist-types/ts3.4/pagination/ListJobSchemaVersionsPaginator.d.ts +11 -0
  84. package/dist-types/ts3.4/pagination/ListJobsPaginator.d.ts +11 -0
  85. package/dist-types/ts3.4/pagination/index.d.ts +2 -0
  86. package/dist-types/ts3.4/schemas/schemas_0.d.ts +25 -0
  87. package/package.json +9 -9
@@ -1,5 +1,5 @@
1
1
  import { AutomaticJsonStringConversion as __AutomaticJsonStringConversion } from "@smithy/core/serde";
2
- import type { _InstanceType, AccountDefaultStatus, ActionStatus, ActivationState, AppInstanceType, AppNetworkAccessType, AppSecurityGroupManagement, AppType, AuthMode, AutoMountHomeEFS, AvailabilityZoneBalanceEnforcementMode, AwsManagedHumanLoopRequestSource, CapacityReservationPreference, ClusterNodeProvisioningMode, ClusterNodeRecovery, CollectionType, CompleteOnConvergence, ConditionOutcome, ContainerMode, ContentClassifier, DeviceSubsetType, DirectInternetAccess, EdgePresetDeploymentType, ExecutionRoleIdentityConfig, ExecutionRoleSessionNameMode, FailureHandlingPolicy, FairShare, FeatureStatus, FeatureType, FlatInvocations, Framework, HomeEfsFileSystemCreation, HubContentType, HyperParameterScalingType, HyperParameterTuningAllocationStrategy, HyperParameterTuningJobObjectiveType, HyperParameterTuningJobStrategyType, HyperParameterTuningJobWarmStartType, IdleResourceSharing, InferenceComponentPlacementStrategy, InferenceExecutionMode, InferenceExperimentType, IPAddressType, JobType, ManagedInstanceScalingScaleInStrategy, ManagedInstanceScalingStatus, ManagedStorageType, MetricPublishFrequencyInSeconds, MlTools, ModelApprovalStatus, ModelCacheSetting, ModelCardStatus, ModelInfrastructureType, ModelPackageRegistrationType, ModelRegistrationMode, ModelSpeculativeDecodingS3DataType, ModelSpeculativeDecodingTechnique, MonitoringProblemType, MonitoringType, NotebookInstanceAcceleratorType, NotebookOutputOption, ParameterType, ProblemType, ProcessingInstanceType, ProcessingS3DataDistributionType, ProcessingS3InputMode, ProcessingS3UploadMode, Processor, ProductionVariantAcceleratorType, ProductionVariantInferenceAmiVersion, ProductionVariantInstanceType, RecommendationJobSupportedEndpointType, RecommendationJobType, RepositoryAccessMode, RootAccess, RoutingStrategy, RStudioServerProAccessStatus, RStudioServerProUserGroup, SageMakerImageName, SchedulerResourceStatus, SkipModelValidation, StorageType, StudioWebPortal, TableFormat, TagPropagation, TargetDevice, 
TargetPlatformAccelerator, TargetPlatformArch, TargetPlatformOs, ThroughputMode, TrackingServerSize, TrafficType, TrainingInputMode, TrainingInstanceType, TrainingJobEarlyStoppingType, TtlDurationUnit, VendorGuidance } from "./enums";
2
+ import type { _InstanceType, AccountDefaultStatus, ActionStatus, ActivationState, AppInstanceType, AppNetworkAccessType, AppSecurityGroupManagement, AppType, AuthMode, AutoMountHomeEFS, AvailabilityZoneBalanceEnforcementMode, AwsManagedHumanLoopRequestSource, CapacityReservationPreference, ClusterNodeProvisioningMode, ClusterNodeRecovery, CollectionType, CompleteOnConvergence, ConditionOutcome, ContainerMode, ContentClassifier, DeviceSubsetType, DirectInternetAccess, EdgePresetDeploymentType, ExecutionRoleIdentityConfig, ExecutionRoleSessionNameMode, FailureHandlingPolicy, FairShare, FeatureStatus, FeatureType, FlatInvocations, Framework, HomeEfsFileSystemCreation, HubContentType, HyperParameterScalingType, HyperParameterTuningAllocationStrategy, HyperParameterTuningJobObjectiveType, HyperParameterTuningJobStrategyType, HyperParameterTuningJobWarmStartType, IdleResourceSharing, InferenceComponentPlacementStrategy, InferenceExecutionMode, InferenceExperimentType, IPAddressType, JobCategory, JobType, ManagedInstanceScalingScaleInStrategy, ManagedInstanceScalingStatus, ManagedStorageType, MetricPublishFrequencyInSeconds, MlTools, ModelApprovalStatus, ModelCacheSetting, ModelCardStatus, ModelInfrastructureType, ModelPackageRegistrationType, ModelRegistrationMode, MonitoringProblemType, MonitoringType, NotebookInstanceAcceleratorType, NotebookOutputOption, ParameterType, ProblemType, ProcessingInstanceType, ProcessingS3DataDistributionType, ProcessingS3InputMode, ProcessingS3UploadMode, Processor, ProductionVariantAcceleratorType, ProductionVariantInferenceAmiVersion, ProductionVariantInstanceType, RecommendationJobSupportedEndpointType, RecommendationJobType, RepositoryAccessMode, RootAccess, RoutingStrategy, RStudioServerProAccessStatus, RStudioServerProUserGroup, SageMakerImageName, SchedulerResourceStatus, SkipModelValidation, StorageType, StudioWebPortal, TableFormat, TagPropagation, TargetDevice, TargetPlatformAccelerator, TargetPlatformArch, TargetPlatformOs, 
ThroughputMode, TrackingServerSize, TrafficType, TrainingInputMode, TrainingInstanceType, TrainingJobEarlyStoppingType, TtlDurationUnit, VendorGuidance } from "./enums";
3
3
  import type { ActionSource, AdditionalInferenceSpecificationDefinition, AdditionalModelDataSource, AdditionalS3DataSource, AIBenchmarkNetworkConfig, AIBenchmarkOutputConfig, AIBenchmarkTarget, AIDatasetConfig, AIModelSource, AIRecommendationComputeSpec, AIRecommendationInferenceSpecification, AIRecommendationOutputConfig, AIRecommendationPerformanceTarget, AIWorkloadConfigs, AlgorithmValidationSpecification, AmazonQSettings, AnnotationConsolidationConfig, AppLifecycleManagement, ArtifactSource, AsyncInferenceConfig, AuthorizedUrl, AutoMLChannel, AutoMLComputeConfig, AutoMLDataSplitConfig, AutoMLJobChannel, AutoMLJobConfig, AutoMLJobObjective, AutoMLOutputDataConfig, AutoMLProblemTypeConfig, AutoMLSecurityConfig, AutoParameter, AutoRollbackConfig, Autotune, BatchTransformInput, BestObjectiveNotImproving, Bias, BlueGreenUpdatePolicy, CanvasAppSettings, CapacitySize, CaptureContentTypeHeader, CaptureOption, CategoricalParameter, CategoricalParameterRange, CategoricalParameterRangeSpecification, Channel, ChannelSpecification, CheckpointConfig, ClarifyExplainerConfig, ClusterAutoScalingConfig, ClusterInstanceGroupSpecification, ClusterOrchestrator, ClusterRestrictedInstanceGroupsConfig, ClusterRestrictedInstanceGroupSpecification, ClusterTieredStorageConfig, CodeEditorAppImageConfig, CodeEditorAppSettings, CodeRepository, CollectionConfig, ComputeQuotaConfig, ComputeQuotaTarget, CustomImage, GitConfig, InferenceSpecification, JupyterLabAppImageConfig, KernelGatewayImageConfig, MetricDefinition, MetricsSource, ModelDataSource, OutputDataConfig, ResourceConfig, ResourceSpec, StoppingCondition, Tag, TransformJobDefinition, VpcConfig } from "./models_0";
4
4
  /**
5
5
  * <p>Summary of the compute allocation definition.</p>
@@ -5207,6 +5207,51 @@ export interface CreateInferenceRecommendationsJobResponse {
5207
5207
  */
5208
5208
  JobArn: string | undefined;
5209
5209
  }
5210
+ /**
5211
+ * @public
5212
+ */
5213
+ export interface CreateJobRequest {
5214
+ /**
5215
+ * <p>The name of the job. The name must be unique within your account and Amazon Web Services Region.</p>
5216
+ * @public
5217
+ */
5218
+ JobName: string | undefined;
5219
+ /**
5220
+ * <p>The Amazon Resource Name (ARN) of the IAM role that Amazon SageMaker assumes to perform the job. The role must have the necessary permissions to access the resources required by the job configuration.</p>
5221
+ * @public
5222
+ */
5223
+ RoleArn: string | undefined;
5224
+ /**
5225
+ * <p>The category of the job. The category determines the type of workload that the job runs.</p>
5226
+ * @public
5227
+ */
5228
+ JobCategory: JobCategory | undefined;
5229
+ /**
5230
+ * <p>The version of the configuration schema to use for the job configuration document. Use <code>ListJobSchemaVersions</code> to get available schema versions for a job category.</p>
5231
+ * @public
5232
+ */
5233
+ JobConfigSchemaVersion: string | undefined;
5234
+ /**
5235
+ * <p>The JSON configuration document for the job. The document must conform to the schema specified by <code>JobConfigSchemaVersion</code>. Use <code>DescribeJobSchemaVersion</code> to retrieve the schema for validation.</p>
5236
+ * @public
5237
+ */
5238
+ JobConfigDocument: string | undefined;
5239
+ /**
5240
+ * <p>An array of key-value pairs to apply to the job as tags. For more information, see <a href="https://docs.aws.amazon.com/general/latest/gr/aws_tagging.html">Tagging Amazon Web Services Resources</a>.</p>
5241
+ * @public
5242
+ */
5243
+ Tags?: Tag[] | undefined;
5244
+ }
5245
+ /**
5246
+ * @public
5247
+ */
5248
+ export interface CreateJobResponse {
5249
+ /**
5250
+ * <p>The Amazon Resource Name (ARN) of the job.</p>
5251
+ * @public
5252
+ */
5253
+ JobArn: string | undefined;
5254
+ }
5210
5255
  /**
5211
5256
  * <p>Provided configuration information for the worker UI for a labeling job. Provide either <code>HumanTaskUiArn</code> or <code>UiTemplateS3Uri</code>.</p> <p>For named entity recognition, 3D point cloud and video frame labeling jobs, use <code>HumanTaskUiArn</code>.</p> <p>For all other Ground Truth built-in task types and custom task types, use <code>UiTemplateS3Uri</code> to specify the location of a worker task template in Amazon S3.</p>
5212
5257
  * @public
@@ -7135,35 +7180,3 @@ export interface ModelShardingConfig {
7135
7180
  */
7136
7181
  OverrideEnvironment?: Record<string, string> | undefined;
7137
7182
  }
7138
- /**
7139
- * <p>Contains information about the training data source for speculative decoding.</p>
7140
- * @public
7141
- */
7142
- export interface ModelSpeculativeDecodingTrainingDataSource {
7143
- /**
7144
- * <p>The Amazon S3 URI that points to the training data for speculative decoding.</p>
7145
- * @public
7146
- */
7147
- S3Uri: string | undefined;
7148
- /**
7149
- * <p>The type of data stored in the Amazon S3 location. Valid values are <code>S3Prefix</code> or <code>ManifestFile</code>.</p>
7150
- * @public
7151
- */
7152
- S3DataType: ModelSpeculativeDecodingS3DataType | undefined;
7153
- }
7154
- /**
7155
- * <p>Settings for the model speculative decoding technique that's applied by a model optimization job.</p>
7156
- * @public
7157
- */
7158
- export interface ModelSpeculativeDecodingConfig {
7159
- /**
7160
- * <p>The speculative decoding technique to apply during model optimization.</p>
7161
- * @public
7162
- */
7163
- Technique: ModelSpeculativeDecodingTechnique | undefined;
7164
- /**
7165
- * <p>The location of the training data to use for speculative decoding. The data must be formatted as ShareGPT, OpenAI Completions or OpenAI Chat Completions. The input can also be unencrypted captured data from a SageMaker endpoint as long as the endpoint uses one of the above formats.</p>
7166
- * @public
7167
- */
7168
- TrainingDataSource?: ModelSpeculativeDecodingTrainingDataSource | undefined;
7169
- }
@@ -1,6 +1,38 @@
1
- import type { ActionStatus, ActivationState, AIBenchmarkJobStatus, AIRecommendationJobStatus, AlgorithmStatus, AppNetworkAccessType, AppSecurityGroupManagement, AppStatus, AppType, AuthMode, AutoMLJobSecondaryStatus, AutoMLJobStatus, AutoMLProblemTypeConfigName, BatchStrategy, CapacityReservationPreference, CaptureStatus, ClusterNodeProvisioningMode, ClusterNodeRecovery, ClusterStatus, CompilationJobStatus, CustomizationTechnique, DataDistributionType, DeepHealthCheckType, DomainStatus, EdgePackagingJobStatus, EdgePresetDeploymentStatus, EdgePresetDeploymentType, EnabledOrDisabled, EndpointStatus, EvaluationType, FeatureGroupStatus, FeatureStatus, FeatureType, FlowDefinitionStatus, HomeEfsFileSystemCreation, HubContentStatus, HubContentSupportStatus, HubContentType, HubStatus, HumanTaskUiStatus, HyperParameterTuningJobObjectiveType, HyperParameterTuningJobStatus, ImageStatus, ImageVersionStatus, InferenceComponentCapacitySizeType, InputMode, JobType, JoinSource, LastUpdateStatusValue, ObjectiveStatus, OfflineStoreStatusValue, OptimizationJobDeploymentInstanceType, PartnerAppAuthType, PartnerAppType, Peft, ProblemType, ProcessingInstanceType, ProcessingS3CompressionType, ProcessingS3DataDistributionType, ProcessingS3DataType, ProcessingS3InputMode, ProcessingS3UploadMode, Processor, ProductionVariantAcceleratorType, ProductionVariantInstanceType, RecommendationStatus, RedshiftResultCompressionType, RedshiftResultFormat, RetentionType, RuleEvaluationStatus, SchedulerConfigComponent, SchedulerResourceStatus, ServerlessJobType, SharingType, StageStatus, Statistic, StudioLifecycleConfigAppType, TagPropagation, ThroughputMode, TrainingJobStatus, TrialComponentPrimaryStatus, VariantStatus, VendorGuidance, WorkforceIpAddressType } from "./enums";
2
- import type { ActionSource, AIBenchmarkNetworkConfig, AIBenchmarkOutputResult, AIBenchmarkTarget, AIDatasetConfig, AIModelSource, AIRecommendation, AIRecommendationComputeSpec, AIRecommendationInferenceSpecification, AIRecommendationOutputResult, AIRecommendationPerformanceTarget, AIWorkloadConfigs, AlgorithmSpecification, AlgorithmStatusDetails, AlgorithmValidationSpecification, AppSpecification, ArtifactSource, AsyncInferenceConfig, AthenaDatasetDefinition, AutoMLCandidate, AutoMLChannel, AutoMLComputeConfig, AutoMLDataSplitConfig, AutoMLJobArtifacts, AutoMLJobChannel, AutoMLJobCompletionCriteria, AutoMLJobConfig, AutoMLJobObjective, AutoMLOutputDataConfig, AutoMLPartialFailureReason, AutoMLProblemTypeConfig, AutoMLResolvedAttributes, AutoMLSecurityConfig, AutoRollbackConfig, Autotune, BatchDataCaptureConfig, CfnCreateTemplateProvider, Channel, CheckpointConfig, ClusterAutoScalingConfigOutput, ClusterEventDetail, ClusterInstanceGroupDetails, ClusterNodeDetails, ClusterOrchestrator, ClusterRestrictedInstanceGroupDetails, ClusterRestrictedInstanceGroupsConfigOutput, ClusterTieredStorageConfig, CodeEditorAppImageConfig, CodeRepository, CognitoConfig, CognitoMemberDefinition, CollectionConfiguration, ComputeQuotaConfig, ComputeQuotaTarget, GitConfig, InferenceSpecification, JupyterLabAppImageConfig, KernelGatewayImageConfig, OutputDataConfig, ResourceConfig, ResourceSpec, StoppingCondition, Tag, TransformInput, TransformOutput, TransformResources, UserContext, VpcConfig } from "./models_0";
3
- import type { ContextSource, DataCaptureConfig, DataQualityAppSpecification, DataQualityBaselineConfig, DataQualityJobInput, DefaultSpaceSettings, DeploymentConfig, DeviceSelectionConfig, DomainSettings, EdgeDeploymentConfig, EdgeDeploymentModelConfig, EdgeOutputConfig, ExplainerConfig, FeatureDefinition, FlowDefinitionOutputConfig, HubS3StorageConfig, HumanLoopActivationConfig, HumanLoopConfig, HumanLoopRequestSource, HyperParameterTrainingJobDefinition, HyperParameterTuningJobConfig, HyperParameterTuningJobWarmStartConfig, InputConfig, JupyterServerAppSettings, KernelGatewayAppSettings, MetadataProperties, MetricsConfig, ModelCompilationConfig, ModelDeployConfig, ModelQuantizationConfig, ModelShardingConfig, ModelSpeculativeDecodingConfig, MonitoringNetworkConfig, MonitoringOutputConfig, MonitoringResources, MonitoringStoppingCondition, NeoVpcConfig, NetworkConfig, OfflineStoreConfig, OnlineStoreConfig, OptimizationJobModelSource, OptimizationSageMakerModel, OutputConfig, ProductionVariant, ProductionVariantManagedInstanceScaling, ProductionVariantRoutingConfig, ProductionVariantServerlessConfig, RetryStrategy, SchedulerConfig, TrainingSpecification, UserSettings } from "./models_1";
1
+ import type { ActionStatus, ActivationState, AIBenchmarkJobStatus, AIRecommendationJobStatus, AlgorithmStatus, AppNetworkAccessType, AppSecurityGroupManagement, AppStatus, AppType, AuthMode, AutoMLJobSecondaryStatus, AutoMLJobStatus, AutoMLProblemTypeConfigName, BatchStrategy, CapacityReservationPreference, CaptureStatus, ClusterNodeProvisioningMode, ClusterNodeRecovery, ClusterStatus, CompilationJobStatus, CustomizationTechnique, DataDistributionType, DeepHealthCheckType, DomainStatus, EdgePackagingJobStatus, EdgePresetDeploymentStatus, EdgePresetDeploymentType, EnabledOrDisabled, EndpointStatus, EvaluationType, FeatureGroupStatus, FeatureStatus, FeatureType, FlowDefinitionStatus, HomeEfsFileSystemCreation, HubContentStatus, HubContentSupportStatus, HubContentType, HubStatus, HumanTaskUiStatus, HyperParameterTuningJobObjectiveType, HyperParameterTuningJobStatus, ImageStatus, ImageVersionStatus, InputMode, JobCategory, JobType, JoinSource, LastUpdateStatusValue, ModelSpeculativeDecodingS3DataType, ModelSpeculativeDecodingTechnique, ObjectiveStatus, OfflineStoreStatusValue, OptimizationJobDeploymentInstanceType, PartnerAppAuthType, PartnerAppType, Peft, ProblemType, ProcessingInstanceType, ProcessingS3CompressionType, ProcessingS3DataDistributionType, ProcessingS3DataType, ProcessingS3InputMode, ProcessingS3UploadMode, Processor, ProductionVariantAcceleratorType, ProductionVariantInstanceType, RecommendationStatus, RedshiftResultCompressionType, RedshiftResultFormat, RetentionType, RuleEvaluationStatus, SchedulerConfigComponent, SchedulerResourceStatus, ServerlessJobType, SharingType, StageStatus, Statistic, StudioLifecycleConfigAppType, TagPropagation, ThroughputMode, TrainingJobStatus, TrialComponentPrimaryStatus, VariantStatus, VendorGuidance, WorkforceIpAddressType } from "./enums";
2
+ import type { ActionSource, AIBenchmarkNetworkConfig, AIBenchmarkOutputResult, AIBenchmarkTarget, AIDatasetConfig, AIModelSource, AIRecommendation, AIRecommendationComputeSpec, AIRecommendationInferenceSpecification, AIRecommendationOutputResult, AIRecommendationPerformanceTarget, AIWorkloadConfigs, AlgorithmSpecification, AlgorithmStatusDetails, AlgorithmValidationSpecification, AppSpecification, ArtifactSource, AsyncInferenceConfig, AthenaDatasetDefinition, AutoMLCandidate, AutoMLChannel, AutoMLComputeConfig, AutoMLDataSplitConfig, AutoMLJobArtifacts, AutoMLJobChannel, AutoMLJobCompletionCriteria, AutoMLJobConfig, AutoMLJobObjective, AutoMLOutputDataConfig, AutoMLPartialFailureReason, AutoMLProblemTypeConfig, AutoMLResolvedAttributes, AutoMLSecurityConfig, Autotune, BatchDataCaptureConfig, CfnCreateTemplateProvider, Channel, CheckpointConfig, ClusterAutoScalingConfigOutput, ClusterEventDetail, ClusterInstanceGroupDetails, ClusterNodeDetails, ClusterOrchestrator, ClusterRestrictedInstanceGroupDetails, ClusterRestrictedInstanceGroupsConfigOutput, ClusterTieredStorageConfig, CodeEditorAppImageConfig, CodeRepository, CognitoConfig, CognitoMemberDefinition, CollectionConfiguration, ComputeQuotaConfig, ComputeQuotaTarget, GitConfig, InferenceSpecification, JupyterLabAppImageConfig, KernelGatewayImageConfig, OutputDataConfig, ResourceConfig, ResourceSpec, StoppingCondition, Tag, TransformInput, TransformOutput, TransformResources, UserContext, VpcConfig } from "./models_0";
3
+ import type { ContextSource, DataCaptureConfig, DataQualityAppSpecification, DataQualityBaselineConfig, DataQualityJobInput, DefaultSpaceSettings, DeploymentConfig, DeviceSelectionConfig, DomainSettings, EdgeDeploymentConfig, EdgeDeploymentModelConfig, EdgeOutputConfig, ExplainerConfig, FeatureDefinition, FlowDefinitionOutputConfig, HubS3StorageConfig, HumanLoopActivationConfig, HumanLoopConfig, HumanLoopRequestSource, HyperParameterTrainingJobDefinition, HyperParameterTuningJobConfig, HyperParameterTuningJobWarmStartConfig, InputConfig, JupyterServerAppSettings, KernelGatewayAppSettings, MetadataProperties, MetricsConfig, ModelCompilationConfig, ModelDeployConfig, ModelQuantizationConfig, ModelShardingConfig, MonitoringNetworkConfig, MonitoringOutputConfig, MonitoringResources, MonitoringStoppingCondition, NeoVpcConfig, NetworkConfig, OfflineStoreConfig, OnlineStoreConfig, OptimizationJobModelSource, OptimizationSageMakerModel, OutputConfig, ProductionVariant, ProductionVariantManagedInstanceScaling, ProductionVariantRoutingConfig, ProductionVariantServerlessConfig, RetryStrategy, SchedulerConfig, TrainingSpecification, UserSettings } from "./models_1";
4
+ /**
5
+ * <p>Contains information about the training data source for speculative decoding.</p>
6
+ * @public
7
+ */
8
+ export interface ModelSpeculativeDecodingTrainingDataSource {
9
+ /**
10
+ * <p>The Amazon S3 URI that points to the training data for speculative decoding.</p>
11
+ * @public
12
+ */
13
+ S3Uri: string | undefined;
14
+ /**
15
+ * <p>The type of data stored in the Amazon S3 location. Valid values are <code>S3Prefix</code> or <code>ManifestFile</code>.</p>
16
+ * @public
17
+ */
18
+ S3DataType: ModelSpeculativeDecodingS3DataType | undefined;
19
+ }
20
+ /**
21
+ * <p>Settings for the model speculative decoding technique that's applied by a model optimization job.</p>
22
+ * @public
23
+ */
24
+ export interface ModelSpeculativeDecodingConfig {
25
+ /**
26
+ * <p>The speculative decoding technique to apply during model optimization.</p>
27
+ * @public
28
+ */
29
+ Technique: ModelSpeculativeDecodingTechnique | undefined;
30
+ /**
31
+ * <p>The location of the training data to use for speculative decoding. The data must be formatted as ShareGPT, OpenAI Completions or OpenAI Chat Completions. The input can also be unencrypted captured data from a SageMaker endpoint as long as the endpoint uses one of the above formats.</p>
32
+ * @public
33
+ */
34
+ TrainingDataSource?: ModelSpeculativeDecodingTrainingDataSource | undefined;
35
+ }
4
36
  /**
5
37
  * <p>Settings for an optimization technique that you apply with a model optimization job.</p>
6
38
  * @public
@@ -3073,6 +3105,26 @@ export interface DeleteInferenceExperimentResponse {
3073
3105
  */
3074
3106
  InferenceExperimentArn: string | undefined;
3075
3107
  }
3108
+ /**
3109
+ * @public
3110
+ */
3111
+ export interface DeleteJobRequest {
3112
+ /**
3113
+ * <p>The name of the job to delete.</p>
3114
+ * @public
3115
+ */
3116
+ JobName: string | undefined;
3117
+ /**
3118
+ * <p>The category of the job to delete.</p>
3119
+ * @public
3120
+ */
3121
+ JobCategory: JobCategory | undefined;
3122
+ }
3123
+ /**
3124
+ * @public
3125
+ */
3126
+ export interface DeleteJobResponse {
3127
+ }
3076
3128
  /**
3077
3129
  * @public
3078
3130
  */
@@ -7147,77 +7199,3 @@ export interface DescribeInferenceComponentInput {
7147
7199
  */
7148
7200
  InferenceComponentName: string | undefined;
7149
7201
  }
7150
- /**
7151
- * <p>Specifies the type and size of the endpoint capacity to activate for a rolling deployment or a rollback strategy. You can specify your batches as either of the following:</p> <ul> <li> <p>A count of inference component copies </p> </li> <li> <p>The overall percentage or your fleet </p> </li> </ul> <p>For a rollback strategy, if you don't specify the fields in this object, or if you set the <code>Value</code> parameter to 100%, then SageMaker AI uses a blue/green rollback strategy and rolls all traffic back to the blue fleet.</p>
7152
- * @public
7153
- */
7154
- export interface InferenceComponentCapacitySize {
7155
- /**
7156
- * <p>Specifies the endpoint capacity type.</p> <dl> <dt>COPY_COUNT</dt> <dd> <p>The endpoint activates based on the number of inference component copies.</p> </dd> <dt>CAPACITY_PERCENT</dt> <dd> <p>The endpoint activates based on the specified percentage of capacity.</p> </dd> </dl>
7157
- * @public
7158
- */
7159
- Type: InferenceComponentCapacitySizeType | undefined;
7160
- /**
7161
- * <p>Defines the capacity size, either as a number of inference component copies or a capacity percentage.</p>
7162
- * @public
7163
- */
7164
- Value: number | undefined;
7165
- }
7166
- /**
7167
- * <p>Specifies a rolling deployment strategy for updating a SageMaker AI inference component.</p>
7168
- * @public
7169
- */
7170
- export interface InferenceComponentRollingUpdatePolicy {
7171
- /**
7172
- * <p>The batch size for each rolling step in the deployment process. For each step, SageMaker AI provisions capacity on the new endpoint fleet, routes traffic to that fleet, and terminates capacity on the old endpoint fleet. The value must be between 5% to 50% of the copy count of the inference component.</p>
7173
- * @public
7174
- */
7175
- MaximumBatchSize: InferenceComponentCapacitySize | undefined;
7176
- /**
7177
- * <p>The length of the baking period, during which SageMaker AI monitors alarms for each batch on the new fleet.</p>
7178
- * @public
7179
- */
7180
- WaitIntervalInSeconds: number | undefined;
7181
- /**
7182
- * <p>The time limit for the total deployment. Exceeding this limit causes a timeout.</p>
7183
- * @public
7184
- */
7185
- MaximumExecutionTimeoutInSeconds?: number | undefined;
7186
- /**
7187
- * <p>The batch size for a rollback to the old endpoint fleet. If this field is absent, the value is set to the default, which is 100% of the total capacity. When the default is used, SageMaker AI provisions the entire capacity of the old fleet at once during rollback.</p>
7188
- * @public
7189
- */
7190
- RollbackMaximumBatchSize?: InferenceComponentCapacitySize | undefined;
7191
- }
7192
- /**
7193
- * <p>The deployment configuration for an endpoint that hosts inference components. The configuration includes the desired deployment strategy and rollback settings.</p>
7194
- * @public
7195
- */
7196
- export interface InferenceComponentDeploymentConfig {
7197
- /**
7198
- * <p>Specifies a rolling deployment strategy for updating a SageMaker AI endpoint.</p>
7199
- * @public
7200
- */
7201
- RollingUpdatePolicy: InferenceComponentRollingUpdatePolicy | undefined;
7202
- /**
7203
- * <p>Automatic rollback configuration for handling endpoint deployment failures and recovery.</p>
7204
- * @public
7205
- */
7206
- AutoRollbackConfiguration?: AutoRollbackConfig | undefined;
7207
- }
7208
- /**
7209
- * <p>The placement status of an inference component on a specific instance type. Shows the number of inference component copies currently placed on instances of a given type.</p>
7210
- * @public
7211
- */
7212
- export interface InferenceComponentPlacementStatus {
7213
- /**
7214
- * <p>The ML compute instance type where the inference component copies are placed.</p>
7215
- * @public
7216
- */
7217
- InstanceType: ProductionVariantInstanceType | undefined;
7218
- /**
7219
- * <p>The number of inference component copies currently placed on instances of this type.</p>
7220
- * @public
7221
- */
7222
- CurrentCopyCount: number | undefined;
7223
- }