@aws-sdk/client-sagemaker 3.1057.0 → 3.1059.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +49 -0
- package/dist-cjs/index.js +139 -0
- package/dist-cjs/schemas/schemas_0.js +191 -36
- package/dist-es/SageMaker.js +18 -0
- package/dist-es/commands/CreateJobCommand.js +16 -0
- package/dist-es/commands/DeleteJobCommand.js +16 -0
- package/dist-es/commands/DescribeJobCommand.js +16 -0
- package/dist-es/commands/DescribeJobSchemaVersionCommand.js +16 -0
- package/dist-es/commands/ListJobSchemaVersionsCommand.js +16 -0
- package/dist-es/commands/ListJobsCommand.js +16 -0
- package/dist-es/commands/StopJobCommand.js +16 -0
- package/dist-es/commands/index.js +7 -0
- package/dist-es/models/enums.js +30 -0
- package/dist-es/pagination/ListJobSchemaVersionsPaginator.js +4 -0
- package/dist-es/pagination/ListJobsPaginator.js +4 -0
- package/dist-es/pagination/index.js +2 -0
- package/dist-es/schemas/schemas_0.js +157 -2
- package/dist-types/SageMaker.d.ts +63 -0
- package/dist-types/SageMakerClient.d.ts +9 -2
- package/dist-types/commands/CreateJobCommand.d.ts +95 -0
- package/dist-types/commands/DeleteJobCommand.d.ts +81 -0
- package/dist-types/commands/DescribeJobCommand.d.ts +105 -0
- package/dist-types/commands/DescribeJobSchemaVersionCommand.d.ts +82 -0
- package/dist-types/commands/ListJobSchemaVersionsCommand.d.ts +86 -0
- package/dist-types/commands/ListJobsCommand.d.ts +98 -0
- package/dist-types/commands/ListLabelingJobsCommand.d.ts +1 -1
- package/dist-types/commands/ListLabelingJobsForWorkteamCommand.d.ts +1 -1
- package/dist-types/commands/ListLineageGroupsCommand.d.ts +1 -1
- package/dist-types/commands/ListMlflowAppsCommand.d.ts +1 -1
- package/dist-types/commands/ListMlflowTrackingServersCommand.d.ts +1 -1
- package/dist-types/commands/ListPipelineExecutionStepsCommand.d.ts +3 -0
- package/dist-types/commands/StopJobCommand.d.ts +78 -0
- package/dist-types/commands/UpdateNotebookInstanceLifecycleConfigCommand.d.ts +2 -1
- package/dist-types/commands/UpdatePartnerAppCommand.d.ts +1 -1
- package/dist-types/commands/UpdatePipelineCommand.d.ts +1 -1
- package/dist-types/commands/UpdatePipelineExecutionCommand.d.ts +1 -1
- package/dist-types/commands/UpdatePipelineVersionCommand.d.ts +1 -1
- package/dist-types/commands/UpdateProjectCommand.d.ts +1 -1
- package/dist-types/commands/UpdateSpaceCommand.d.ts +1 -1
- package/dist-types/commands/UpdateTrainingJobCommand.d.ts +1 -1
- package/dist-types/commands/UpdateTrialCommand.d.ts +1 -2
- package/dist-types/commands/index.d.ts +7 -0
- package/dist-types/models/enums.d.ts +54 -0
- package/dist-types/models/models_1.d.ts +46 -33
- package/dist-types/models/models_2.d.ts +55 -77
- package/dist-types/models/models_3.d.ts +296 -390
- package/dist-types/models/models_4.d.ts +3902 -3732
- package/dist-types/models/models_5.d.ts +355 -2
- package/dist-types/pagination/ListJobSchemaVersionsPaginator.d.ts +7 -0
- package/dist-types/pagination/ListJobsPaginator.d.ts +7 -0
- package/dist-types/pagination/index.d.ts +2 -0
- package/dist-types/schemas/schemas_0.d.ts +25 -0
- package/dist-types/ts3.4/SageMaker.d.ts +133 -0
- package/dist-types/ts3.4/SageMakerClient.d.ts +42 -0
- package/dist-types/ts3.4/commands/CreateJobCommand.d.ts +45 -0
- package/dist-types/ts3.4/commands/DeleteJobCommand.d.ts +45 -0
- package/dist-types/ts3.4/commands/DescribeJobCommand.d.ts +49 -0
- package/dist-types/ts3.4/commands/DescribeJobSchemaVersionCommand.d.ts +53 -0
- package/dist-types/ts3.4/commands/ListJobSchemaVersionsCommand.d.ts +53 -0
- package/dist-types/ts3.4/commands/ListJobsCommand.d.ts +45 -0
- package/dist-types/ts3.4/commands/ListLabelingJobsCommand.d.ts +1 -1
- package/dist-types/ts3.4/commands/ListLabelingJobsForWorkteamCommand.d.ts +1 -1
- package/dist-types/ts3.4/commands/ListLineageGroupsCommand.d.ts +1 -1
- package/dist-types/ts3.4/commands/ListMlflowAppsCommand.d.ts +1 -1
- package/dist-types/ts3.4/commands/ListMlflowTrackingServersCommand.d.ts +1 -1
- package/dist-types/ts3.4/commands/StopJobCommand.d.ts +45 -0
- package/dist-types/ts3.4/commands/UpdateNotebookInstanceLifecycleConfigCommand.d.ts +2 -4
- package/dist-types/ts3.4/commands/UpdatePartnerAppCommand.d.ts +1 -1
- package/dist-types/ts3.4/commands/UpdatePipelineCommand.d.ts +1 -1
- package/dist-types/ts3.4/commands/UpdatePipelineExecutionCommand.d.ts +1 -1
- package/dist-types/ts3.4/commands/UpdatePipelineVersionCommand.d.ts +1 -1
- package/dist-types/ts3.4/commands/UpdateProjectCommand.d.ts +1 -1
- package/dist-types/ts3.4/commands/UpdateSpaceCommand.d.ts +1 -1
- package/dist-types/ts3.4/commands/UpdateTrainingJobCommand.d.ts +1 -1
- package/dist-types/ts3.4/commands/UpdateTrialCommand.d.ts +1 -2
- package/dist-types/ts3.4/commands/index.d.ts +7 -0
- package/dist-types/ts3.4/models/enums.d.ts +34 -0
- package/dist-types/ts3.4/models/models_1.d.ts +12 -10
- package/dist-types/ts3.4/models/models_2.d.ts +16 -21
- package/dist-types/ts3.4/models/models_3.d.ts +74 -96
- package/dist-types/ts3.4/models/models_4.d.ts +138 -97
- package/dist-types/ts3.4/models/models_5.d.ts +104 -1
- package/dist-types/ts3.4/pagination/ListJobSchemaVersionsPaginator.d.ts +11 -0
- package/dist-types/ts3.4/pagination/ListJobsPaginator.d.ts +11 -0
- package/dist-types/ts3.4/pagination/index.d.ts +2 -0
- package/dist-types/ts3.4/schemas/schemas_0.d.ts +25 -0
- package/package.json +9 -9
|
@@ -1,5 +1,5 @@
|
|
|
1
1
|
import { AutomaticJsonStringConversion as __AutomaticJsonStringConversion } from "@smithy/core/serde";
|
|
2
|
-
import type { _InstanceType, AccountDefaultStatus, ActionStatus, ActivationState, AppInstanceType, AppNetworkAccessType, AppSecurityGroupManagement, AppType, AuthMode, AutoMountHomeEFS, AvailabilityZoneBalanceEnforcementMode, AwsManagedHumanLoopRequestSource, CapacityReservationPreference, ClusterNodeProvisioningMode, ClusterNodeRecovery, CollectionType, CompleteOnConvergence, ConditionOutcome, ContainerMode, ContentClassifier, DeviceSubsetType, DirectInternetAccess, EdgePresetDeploymentType, ExecutionRoleIdentityConfig, ExecutionRoleSessionNameMode, FailureHandlingPolicy, FairShare, FeatureStatus, FeatureType, FlatInvocations, Framework, HomeEfsFileSystemCreation, HubContentType, HyperParameterScalingType, HyperParameterTuningAllocationStrategy, HyperParameterTuningJobObjectiveType, HyperParameterTuningJobStrategyType, HyperParameterTuningJobWarmStartType, IdleResourceSharing, InferenceComponentPlacementStrategy, InferenceExecutionMode, InferenceExperimentType, IPAddressType, JobType, ManagedInstanceScalingScaleInStrategy, ManagedInstanceScalingStatus, ManagedStorageType, MetricPublishFrequencyInSeconds, MlTools, ModelApprovalStatus, ModelCacheSetting, ModelCardStatus, ModelInfrastructureType, ModelPackageRegistrationType, ModelRegistrationMode,
|
|
2
|
+
import type { _InstanceType, AccountDefaultStatus, ActionStatus, ActivationState, AppInstanceType, AppNetworkAccessType, AppSecurityGroupManagement, AppType, AuthMode, AutoMountHomeEFS, AvailabilityZoneBalanceEnforcementMode, AwsManagedHumanLoopRequestSource, CapacityReservationPreference, ClusterNodeProvisioningMode, ClusterNodeRecovery, CollectionType, CompleteOnConvergence, ConditionOutcome, ContainerMode, ContentClassifier, DeviceSubsetType, DirectInternetAccess, EdgePresetDeploymentType, ExecutionRoleIdentityConfig, ExecutionRoleSessionNameMode, FailureHandlingPolicy, FairShare, FeatureStatus, FeatureType, FlatInvocations, Framework, HomeEfsFileSystemCreation, HubContentType, HyperParameterScalingType, HyperParameterTuningAllocationStrategy, HyperParameterTuningJobObjectiveType, HyperParameterTuningJobStrategyType, HyperParameterTuningJobWarmStartType, IdleResourceSharing, InferenceComponentPlacementStrategy, InferenceExecutionMode, InferenceExperimentType, IPAddressType, JobCategory, JobType, ManagedInstanceScalingScaleInStrategy, ManagedInstanceScalingStatus, ManagedStorageType, MetricPublishFrequencyInSeconds, MlTools, ModelApprovalStatus, ModelCacheSetting, ModelCardStatus, ModelInfrastructureType, ModelPackageRegistrationType, ModelRegistrationMode, MonitoringProblemType, MonitoringType, NotebookInstanceAcceleratorType, NotebookOutputOption, ParameterType, ProblemType, ProcessingInstanceType, ProcessingS3DataDistributionType, ProcessingS3InputMode, ProcessingS3UploadMode, Processor, ProductionVariantAcceleratorType, ProductionVariantInferenceAmiVersion, ProductionVariantInstanceType, RecommendationJobSupportedEndpointType, RecommendationJobType, RepositoryAccessMode, RootAccess, RoutingStrategy, RStudioServerProAccessStatus, RStudioServerProUserGroup, SageMakerImageName, SchedulerResourceStatus, SkipModelValidation, StorageType, StudioWebPortal, TableFormat, TagPropagation, TargetDevice, TargetPlatformAccelerator, TargetPlatformArch, TargetPlatformOs, 
ThroughputMode, TrackingServerSize, TrafficType, TrainingInputMode, TrainingInstanceType, TrainingJobEarlyStoppingType, TtlDurationUnit, VendorGuidance } from "./enums";
|
|
3
3
|
import type { ActionSource, AdditionalInferenceSpecificationDefinition, AdditionalModelDataSource, AdditionalS3DataSource, AIBenchmarkNetworkConfig, AIBenchmarkOutputConfig, AIBenchmarkTarget, AIDatasetConfig, AIModelSource, AIRecommendationComputeSpec, AIRecommendationInferenceSpecification, AIRecommendationOutputConfig, AIRecommendationPerformanceTarget, AIWorkloadConfigs, AlgorithmValidationSpecification, AmazonQSettings, AnnotationConsolidationConfig, AppLifecycleManagement, ArtifactSource, AsyncInferenceConfig, AuthorizedUrl, AutoMLChannel, AutoMLComputeConfig, AutoMLDataSplitConfig, AutoMLJobChannel, AutoMLJobConfig, AutoMLJobObjective, AutoMLOutputDataConfig, AutoMLProblemTypeConfig, AutoMLSecurityConfig, AutoParameter, AutoRollbackConfig, Autotune, BatchTransformInput, BestObjectiveNotImproving, Bias, BlueGreenUpdatePolicy, CanvasAppSettings, CapacitySize, CaptureContentTypeHeader, CaptureOption, CategoricalParameter, CategoricalParameterRange, CategoricalParameterRangeSpecification, Channel, ChannelSpecification, CheckpointConfig, ClarifyExplainerConfig, ClusterAutoScalingConfig, ClusterInstanceGroupSpecification, ClusterOrchestrator, ClusterRestrictedInstanceGroupsConfig, ClusterRestrictedInstanceGroupSpecification, ClusterTieredStorageConfig, CodeEditorAppImageConfig, CodeEditorAppSettings, CodeRepository, CollectionConfig, ComputeQuotaConfig, ComputeQuotaTarget, CustomImage, GitConfig, InferenceSpecification, JupyterLabAppImageConfig, KernelGatewayImageConfig, MetricDefinition, MetricsSource, ModelDataSource, OutputDataConfig, ResourceConfig, ResourceSpec, StoppingCondition, Tag, TransformJobDefinition, VpcConfig } from "./models_0";
|
|
4
4
|
/**
|
|
5
5
|
* <p>Summary of the compute allocation definition.</p>
|
|
@@ -5207,6 +5207,51 @@ export interface CreateInferenceRecommendationsJobResponse {
|
|
|
5207
5207
|
*/
|
|
5208
5208
|
JobArn: string | undefined;
|
|
5209
5209
|
}
|
|
5210
|
+
/**
|
|
5211
|
+
* @public
|
|
5212
|
+
*/
|
|
5213
|
+
export interface CreateJobRequest {
|
|
5214
|
+
/**
|
|
5215
|
+
* <p>The name of the job. The name must be unique within your account and Amazon Web Services Region.</p>
|
|
5216
|
+
* @public
|
|
5217
|
+
*/
|
|
5218
|
+
JobName: string | undefined;
|
|
5219
|
+
/**
|
|
5220
|
+
* <p>The Amazon Resource Name (ARN) of the IAM role that Amazon SageMaker assumes to perform the job. The role must have the necessary permissions to access the resources required by the job configuration.</p>
|
|
5221
|
+
* @public
|
|
5222
|
+
*/
|
|
5223
|
+
RoleArn: string | undefined;
|
|
5224
|
+
/**
|
|
5225
|
+
* <p>The category of the job. The category determines the type of workload that the job runs.</p>
|
|
5226
|
+
* @public
|
|
5227
|
+
*/
|
|
5228
|
+
JobCategory: JobCategory | undefined;
|
|
5229
|
+
/**
|
|
5230
|
+
* <p>The version of the configuration schema to use for the job configuration document. Use <code>ListJobSchemaVersions</code> to get available schema versions for a job category.</p>
|
|
5231
|
+
* @public
|
|
5232
|
+
*/
|
|
5233
|
+
JobConfigSchemaVersion: string | undefined;
|
|
5234
|
+
/**
|
|
5235
|
+
* <p>The JSON configuration document for the job. The document must conform to the schema specified by <code>JobConfigSchemaVersion</code>. Use <code>DescribeJobSchemaVersion</code> to retrieve the schema for validation.</p>
|
|
5236
|
+
* @public
|
|
5237
|
+
*/
|
|
5238
|
+
JobConfigDocument: string | undefined;
|
|
5239
|
+
/**
|
|
5240
|
+
* <p>An array of key-value pairs to apply to the job as tags. For more information, see <a href="https://docs.aws.amazon.com/general/latest/gr/aws_tagging.html">Tagging Amazon Web Services Resources</a>.</p>
|
|
5241
|
+
* @public
|
|
5242
|
+
*/
|
|
5243
|
+
Tags?: Tag[] | undefined;
|
|
5244
|
+
}
|
|
5245
|
+
/**
|
|
5246
|
+
* @public
|
|
5247
|
+
*/
|
|
5248
|
+
export interface CreateJobResponse {
|
|
5249
|
+
/**
|
|
5250
|
+
* <p>The Amazon Resource Name (ARN) of the job.</p>
|
|
5251
|
+
* @public
|
|
5252
|
+
*/
|
|
5253
|
+
JobArn: string | undefined;
|
|
5254
|
+
}
|
|
5210
5255
|
/**
|
|
5211
5256
|
* <p>Provided configuration information for the worker UI for a labeling job. Provide either <code>HumanTaskUiArn</code> or <code>UiTemplateS3Uri</code>.</p> <p>For named entity recognition, 3D point cloud and video frame labeling jobs, use <code>HumanTaskUiArn</code>.</p> <p>For all other Ground Truth built-in task types and custom task types, use <code>UiTemplateS3Uri</code> to specify the location of a worker task template in Amazon S3.</p>
|
|
5212
5257
|
* @public
|
|
@@ -7135,35 +7180,3 @@ export interface ModelShardingConfig {
|
|
|
7135
7180
|
*/
|
|
7136
7181
|
OverrideEnvironment?: Record<string, string> | undefined;
|
|
7137
7182
|
}
|
|
7138
|
-
/**
|
|
7139
|
-
* <p>Contains information about the training data source for speculative decoding.</p>
|
|
7140
|
-
* @public
|
|
7141
|
-
*/
|
|
7142
|
-
export interface ModelSpeculativeDecodingTrainingDataSource {
|
|
7143
|
-
/**
|
|
7144
|
-
* <p>The Amazon S3 URI that points to the training data for speculative decoding.</p>
|
|
7145
|
-
* @public
|
|
7146
|
-
*/
|
|
7147
|
-
S3Uri: string | undefined;
|
|
7148
|
-
/**
|
|
7149
|
-
* <p>The type of data stored in the Amazon S3 location. Valid values are <code>S3Prefix</code> or <code>ManifestFile</code>.</p>
|
|
7150
|
-
* @public
|
|
7151
|
-
*/
|
|
7152
|
-
S3DataType: ModelSpeculativeDecodingS3DataType | undefined;
|
|
7153
|
-
}
|
|
7154
|
-
/**
|
|
7155
|
-
* <p>Settings for the model speculative decoding technique that's applied by a model optimization job.</p>
|
|
7156
|
-
* @public
|
|
7157
|
-
*/
|
|
7158
|
-
export interface ModelSpeculativeDecodingConfig {
|
|
7159
|
-
/**
|
|
7160
|
-
* <p>The speculative decoding technique to apply during model optimization.</p>
|
|
7161
|
-
* @public
|
|
7162
|
-
*/
|
|
7163
|
-
Technique: ModelSpeculativeDecodingTechnique | undefined;
|
|
7164
|
-
/**
|
|
7165
|
-
* <p>The location of the training data to use for speculative decoding. The data must be formatted as ShareGPT, OpenAI Completions or OpenAI Chat Completions. The input can also be unencrypted captured data from a SageMaker endpoint as long as the endpoint uses one of the above formats.</p>
|
|
7166
|
-
* @public
|
|
7167
|
-
*/
|
|
7168
|
-
TrainingDataSource?: ModelSpeculativeDecodingTrainingDataSource | undefined;
|
|
7169
|
-
}
|
|
@@ -1,6 +1,38 @@
|
|
|
1
|
-
import type { ActionStatus, ActivationState, AIBenchmarkJobStatus, AIRecommendationJobStatus, AlgorithmStatus, AppNetworkAccessType, AppSecurityGroupManagement, AppStatus, AppType, AuthMode, AutoMLJobSecondaryStatus, AutoMLJobStatus, AutoMLProblemTypeConfigName, BatchStrategy, CapacityReservationPreference, CaptureStatus, ClusterNodeProvisioningMode, ClusterNodeRecovery, ClusterStatus, CompilationJobStatus, CustomizationTechnique, DataDistributionType, DeepHealthCheckType, DomainStatus, EdgePackagingJobStatus, EdgePresetDeploymentStatus, EdgePresetDeploymentType, EnabledOrDisabled, EndpointStatus, EvaluationType, FeatureGroupStatus, FeatureStatus, FeatureType, FlowDefinitionStatus, HomeEfsFileSystemCreation, HubContentStatus, HubContentSupportStatus, HubContentType, HubStatus, HumanTaskUiStatus, HyperParameterTuningJobObjectiveType, HyperParameterTuningJobStatus, ImageStatus, ImageVersionStatus,
|
|
2
|
-
import type { ActionSource, AIBenchmarkNetworkConfig, AIBenchmarkOutputResult, AIBenchmarkTarget, AIDatasetConfig, AIModelSource, AIRecommendation, AIRecommendationComputeSpec, AIRecommendationInferenceSpecification, AIRecommendationOutputResult, AIRecommendationPerformanceTarget, AIWorkloadConfigs, AlgorithmSpecification, AlgorithmStatusDetails, AlgorithmValidationSpecification, AppSpecification, ArtifactSource, AsyncInferenceConfig, AthenaDatasetDefinition, AutoMLCandidate, AutoMLChannel, AutoMLComputeConfig, AutoMLDataSplitConfig, AutoMLJobArtifacts, AutoMLJobChannel, AutoMLJobCompletionCriteria, AutoMLJobConfig, AutoMLJobObjective, AutoMLOutputDataConfig, AutoMLPartialFailureReason, AutoMLProblemTypeConfig, AutoMLResolvedAttributes, AutoMLSecurityConfig,
|
|
3
|
-
import type { ContextSource, DataCaptureConfig, DataQualityAppSpecification, DataQualityBaselineConfig, DataQualityJobInput, DefaultSpaceSettings, DeploymentConfig, DeviceSelectionConfig, DomainSettings, EdgeDeploymentConfig, EdgeDeploymentModelConfig, EdgeOutputConfig, ExplainerConfig, FeatureDefinition, FlowDefinitionOutputConfig, HubS3StorageConfig, HumanLoopActivationConfig, HumanLoopConfig, HumanLoopRequestSource, HyperParameterTrainingJobDefinition, HyperParameterTuningJobConfig, HyperParameterTuningJobWarmStartConfig, InputConfig, JupyterServerAppSettings, KernelGatewayAppSettings, MetadataProperties, MetricsConfig, ModelCompilationConfig, ModelDeployConfig, ModelQuantizationConfig, ModelShardingConfig,
|
|
1
|
+
import type { ActionStatus, ActivationState, AIBenchmarkJobStatus, AIRecommendationJobStatus, AlgorithmStatus, AppNetworkAccessType, AppSecurityGroupManagement, AppStatus, AppType, AuthMode, AutoMLJobSecondaryStatus, AutoMLJobStatus, AutoMLProblemTypeConfigName, BatchStrategy, CapacityReservationPreference, CaptureStatus, ClusterNodeProvisioningMode, ClusterNodeRecovery, ClusterStatus, CompilationJobStatus, CustomizationTechnique, DataDistributionType, DeepHealthCheckType, DomainStatus, EdgePackagingJobStatus, EdgePresetDeploymentStatus, EdgePresetDeploymentType, EnabledOrDisabled, EndpointStatus, EvaluationType, FeatureGroupStatus, FeatureStatus, FeatureType, FlowDefinitionStatus, HomeEfsFileSystemCreation, HubContentStatus, HubContentSupportStatus, HubContentType, HubStatus, HumanTaskUiStatus, HyperParameterTuningJobObjectiveType, HyperParameterTuningJobStatus, ImageStatus, ImageVersionStatus, InputMode, JobCategory, JobType, JoinSource, LastUpdateStatusValue, ModelSpeculativeDecodingS3DataType, ModelSpeculativeDecodingTechnique, ObjectiveStatus, OfflineStoreStatusValue, OptimizationJobDeploymentInstanceType, PartnerAppAuthType, PartnerAppType, Peft, ProblemType, ProcessingInstanceType, ProcessingS3CompressionType, ProcessingS3DataDistributionType, ProcessingS3DataType, ProcessingS3InputMode, ProcessingS3UploadMode, Processor, ProductionVariantAcceleratorType, ProductionVariantInstanceType, RecommendationStatus, RedshiftResultCompressionType, RedshiftResultFormat, RetentionType, RuleEvaluationStatus, SchedulerConfigComponent, SchedulerResourceStatus, ServerlessJobType, SharingType, StageStatus, Statistic, StudioLifecycleConfigAppType, TagPropagation, ThroughputMode, TrainingJobStatus, TrialComponentPrimaryStatus, VariantStatus, VendorGuidance, WorkforceIpAddressType } from "./enums";
|
|
2
|
+
import type { ActionSource, AIBenchmarkNetworkConfig, AIBenchmarkOutputResult, AIBenchmarkTarget, AIDatasetConfig, AIModelSource, AIRecommendation, AIRecommendationComputeSpec, AIRecommendationInferenceSpecification, AIRecommendationOutputResult, AIRecommendationPerformanceTarget, AIWorkloadConfigs, AlgorithmSpecification, AlgorithmStatusDetails, AlgorithmValidationSpecification, AppSpecification, ArtifactSource, AsyncInferenceConfig, AthenaDatasetDefinition, AutoMLCandidate, AutoMLChannel, AutoMLComputeConfig, AutoMLDataSplitConfig, AutoMLJobArtifacts, AutoMLJobChannel, AutoMLJobCompletionCriteria, AutoMLJobConfig, AutoMLJobObjective, AutoMLOutputDataConfig, AutoMLPartialFailureReason, AutoMLProblemTypeConfig, AutoMLResolvedAttributes, AutoMLSecurityConfig, Autotune, BatchDataCaptureConfig, CfnCreateTemplateProvider, Channel, CheckpointConfig, ClusterAutoScalingConfigOutput, ClusterEventDetail, ClusterInstanceGroupDetails, ClusterNodeDetails, ClusterOrchestrator, ClusterRestrictedInstanceGroupDetails, ClusterRestrictedInstanceGroupsConfigOutput, ClusterTieredStorageConfig, CodeEditorAppImageConfig, CodeRepository, CognitoConfig, CognitoMemberDefinition, CollectionConfiguration, ComputeQuotaConfig, ComputeQuotaTarget, GitConfig, InferenceSpecification, JupyterLabAppImageConfig, KernelGatewayImageConfig, OutputDataConfig, ResourceConfig, ResourceSpec, StoppingCondition, Tag, TransformInput, TransformOutput, TransformResources, UserContext, VpcConfig } from "./models_0";
|
|
3
|
+
import type { ContextSource, DataCaptureConfig, DataQualityAppSpecification, DataQualityBaselineConfig, DataQualityJobInput, DefaultSpaceSettings, DeploymentConfig, DeviceSelectionConfig, DomainSettings, EdgeDeploymentConfig, EdgeDeploymentModelConfig, EdgeOutputConfig, ExplainerConfig, FeatureDefinition, FlowDefinitionOutputConfig, HubS3StorageConfig, HumanLoopActivationConfig, HumanLoopConfig, HumanLoopRequestSource, HyperParameterTrainingJobDefinition, HyperParameterTuningJobConfig, HyperParameterTuningJobWarmStartConfig, InputConfig, JupyterServerAppSettings, KernelGatewayAppSettings, MetadataProperties, MetricsConfig, ModelCompilationConfig, ModelDeployConfig, ModelQuantizationConfig, ModelShardingConfig, MonitoringNetworkConfig, MonitoringOutputConfig, MonitoringResources, MonitoringStoppingCondition, NeoVpcConfig, NetworkConfig, OfflineStoreConfig, OnlineStoreConfig, OptimizationJobModelSource, OptimizationSageMakerModel, OutputConfig, ProductionVariant, ProductionVariantManagedInstanceScaling, ProductionVariantRoutingConfig, ProductionVariantServerlessConfig, RetryStrategy, SchedulerConfig, TrainingSpecification, UserSettings } from "./models_1";
|
|
4
|
+
/**
|
|
5
|
+
* <p>Contains information about the training data source for speculative decoding.</p>
|
|
6
|
+
* @public
|
|
7
|
+
*/
|
|
8
|
+
export interface ModelSpeculativeDecodingTrainingDataSource {
|
|
9
|
+
/**
|
|
10
|
+
* <p>The Amazon S3 URI that points to the training data for speculative decoding.</p>
|
|
11
|
+
* @public
|
|
12
|
+
*/
|
|
13
|
+
S3Uri: string | undefined;
|
|
14
|
+
/**
|
|
15
|
+
* <p>The type of data stored in the Amazon S3 location. Valid values are <code>S3Prefix</code> or <code>ManifestFile</code>.</p>
|
|
16
|
+
* @public
|
|
17
|
+
*/
|
|
18
|
+
S3DataType: ModelSpeculativeDecodingS3DataType | undefined;
|
|
19
|
+
}
|
|
20
|
+
/**
|
|
21
|
+
* <p>Settings for the model speculative decoding technique that's applied by a model optimization job.</p>
|
|
22
|
+
* @public
|
|
23
|
+
*/
|
|
24
|
+
export interface ModelSpeculativeDecodingConfig {
|
|
25
|
+
/**
|
|
26
|
+
* <p>The speculative decoding technique to apply during model optimization.</p>
|
|
27
|
+
* @public
|
|
28
|
+
*/
|
|
29
|
+
Technique: ModelSpeculativeDecodingTechnique | undefined;
|
|
30
|
+
/**
|
|
31
|
+
* <p>The location of the training data to use for speculative decoding. The data must be formatted as ShareGPT, OpenAI Completions or OpenAI Chat Completions. The input can also be unencrypted captured data from a SageMaker endpoint as long as the endpoint uses one of the above formats.</p>
|
|
32
|
+
* @public
|
|
33
|
+
*/
|
|
34
|
+
TrainingDataSource?: ModelSpeculativeDecodingTrainingDataSource | undefined;
|
|
35
|
+
}
|
|
4
36
|
/**
|
|
5
37
|
* <p>Settings for an optimization technique that you apply with a model optimization job.</p>
|
|
6
38
|
* @public
|
|
@@ -3073,6 +3105,26 @@ export interface DeleteInferenceExperimentResponse {
|
|
|
3073
3105
|
*/
|
|
3074
3106
|
InferenceExperimentArn: string | undefined;
|
|
3075
3107
|
}
|
|
3108
|
+
/**
|
|
3109
|
+
* @public
|
|
3110
|
+
*/
|
|
3111
|
+
export interface DeleteJobRequest {
|
|
3112
|
+
/**
|
|
3113
|
+
* <p>The name of the job to delete.</p>
|
|
3114
|
+
* @public
|
|
3115
|
+
*/
|
|
3116
|
+
JobName: string | undefined;
|
|
3117
|
+
/**
|
|
3118
|
+
* <p>The category of the job to delete.</p>
|
|
3119
|
+
* @public
|
|
3120
|
+
*/
|
|
3121
|
+
JobCategory: JobCategory | undefined;
|
|
3122
|
+
}
|
|
3123
|
+
/**
|
|
3124
|
+
* @public
|
|
3125
|
+
*/
|
|
3126
|
+
export interface DeleteJobResponse {
|
|
3127
|
+
}
|
|
3076
3128
|
/**
|
|
3077
3129
|
* @public
|
|
3078
3130
|
*/
|
|
@@ -7147,77 +7199,3 @@ export interface DescribeInferenceComponentInput {
|
|
|
7147
7199
|
*/
|
|
7148
7200
|
InferenceComponentName: string | undefined;
|
|
7149
7201
|
}
|
|
7150
|
-
/**
|
|
7151
|
-
* <p>Specifies the type and size of the endpoint capacity to activate for a rolling deployment or a rollback strategy. You can specify your batches as either of the following:</p> <ul> <li> <p>A count of inference component copies </p> </li> <li> <p>The overall percentage of your fleet </p> </li> </ul> <p>For a rollback strategy, if you don't specify the fields in this object, or if you set the <code>Value</code> parameter to 100%, then SageMaker AI uses a blue/green rollback strategy and rolls all traffic back to the blue fleet.</p>
|
|
7152
|
-
* @public
|
|
7153
|
-
*/
|
|
7154
|
-
export interface InferenceComponentCapacitySize {
|
|
7155
|
-
/**
|
|
7156
|
-
* <p>Specifies the endpoint capacity type.</p> <dl> <dt>COPY_COUNT</dt> <dd> <p>The endpoint activates based on the number of inference component copies.</p> </dd> <dt>CAPACITY_PERCENT</dt> <dd> <p>The endpoint activates based on the specified percentage of capacity.</p> </dd> </dl>
|
|
7157
|
-
* @public
|
|
7158
|
-
*/
|
|
7159
|
-
Type: InferenceComponentCapacitySizeType | undefined;
|
|
7160
|
-
/**
|
|
7161
|
-
* <p>Defines the capacity size, either as a number of inference component copies or a capacity percentage.</p>
|
|
7162
|
-
* @public
|
|
7163
|
-
*/
|
|
7164
|
-
Value: number | undefined;
|
|
7165
|
-
}
|
|
7166
|
-
/**
|
|
7167
|
-
* <p>Specifies a rolling deployment strategy for updating a SageMaker AI inference component.</p>
|
|
7168
|
-
* @public
|
|
7169
|
-
*/
|
|
7170
|
-
export interface InferenceComponentRollingUpdatePolicy {
|
|
7171
|
-
/**
|
|
7172
|
-
* <p>The batch size for each rolling step in the deployment process. For each step, SageMaker AI provisions capacity on the new endpoint fleet, routes traffic to that fleet, and terminates capacity on the old endpoint fleet. The value must be between 5% and 50% of the copy count of the inference component.</p>
|
|
7173
|
-
* @public
|
|
7174
|
-
*/
|
|
7175
|
-
MaximumBatchSize: InferenceComponentCapacitySize | undefined;
|
|
7176
|
-
/**
|
|
7177
|
-
* <p>The length of the baking period, during which SageMaker AI monitors alarms for each batch on the new fleet.</p>
|
|
7178
|
-
* @public
|
|
7179
|
-
*/
|
|
7180
|
-
WaitIntervalInSeconds: number | undefined;
|
|
7181
|
-
/**
|
|
7182
|
-
* <p>The time limit for the total deployment. Exceeding this limit causes a timeout.</p>
|
|
7183
|
-
* @public
|
|
7184
|
-
*/
|
|
7185
|
-
MaximumExecutionTimeoutInSeconds?: number | undefined;
|
|
7186
|
-
/**
|
|
7187
|
-
* <p>The batch size for a rollback to the old endpoint fleet. If this field is absent, the value is set to the default, which is 100% of the total capacity. When the default is used, SageMaker AI provisions the entire capacity of the old fleet at once during rollback.</p>
|
|
7188
|
-
* @public
|
|
7189
|
-
*/
|
|
7190
|
-
RollbackMaximumBatchSize?: InferenceComponentCapacitySize | undefined;
|
|
7191
|
-
}
|
|
7192
|
-
/**
|
|
7193
|
-
* <p>The deployment configuration for an endpoint that hosts inference components. The configuration includes the desired deployment strategy and rollback settings.</p>
|
|
7194
|
-
* @public
|
|
7195
|
-
*/
|
|
7196
|
-
export interface InferenceComponentDeploymentConfig {
|
|
7197
|
-
/**
|
|
7198
|
-
* <p>Specifies a rolling deployment strategy for updating a SageMaker AI endpoint.</p>
|
|
7199
|
-
* @public
|
|
7200
|
-
*/
|
|
7201
|
-
RollingUpdatePolicy: InferenceComponentRollingUpdatePolicy | undefined;
|
|
7202
|
-
/**
|
|
7203
|
-
* <p>Automatic rollback configuration for handling endpoint deployment failures and recovery.</p>
|
|
7204
|
-
* @public
|
|
7205
|
-
*/
|
|
7206
|
-
AutoRollbackConfiguration?: AutoRollbackConfig | undefined;
|
|
7207
|
-
}
|
|
7208
|
-
/**
|
|
7209
|
-
* <p>The placement status of an inference component on a specific instance type. Shows the number of inference component copies currently placed on instances of a given type.</p>
|
|
7210
|
-
* @public
|
|
7211
|
-
*/
|
|
7212
|
-
export interface InferenceComponentPlacementStatus {
|
|
7213
|
-
/**
|
|
7214
|
-
* <p>The ML compute instance type where the inference component copies are placed.</p>
|
|
7215
|
-
* @public
|
|
7216
|
-
*/
|
|
7217
|
-
InstanceType: ProductionVariantInstanceType | undefined;
|
|
7218
|
-
/**
|
|
7219
|
-
* <p>The number of inference component copies currently placed on instances of this type.</p>
|
|
7220
|
-
* @public
|
|
7221
|
-
*/
|
|
7222
|
-
CurrentCopyCount: number | undefined;
|
|
7223
|
-
}
|