@aws-sdk/client-sagemaker 3.1018.0 → 3.1020.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist-cjs/auth/httpAuthSchemeProvider.js +2 -2
- package/dist-cjs/index.js +14 -0
- package/dist-cjs/runtimeConfig.js +4 -3
- package/dist-cjs/runtimeConfig.shared.js +2 -2
- package/dist-cjs/schemas/schemas_0.js +69 -43
- package/dist-es/SageMaker.js +22 -22
- package/dist-es/auth/httpAuthSchemeProvider.js +1 -1
- package/dist-es/models/enums.js +11 -0
- package/dist-es/runtimeConfig.js +2 -1
- package/dist-es/runtimeConfig.shared.js +1 -1
- package/dist-es/schemas/schemas_0.js +46 -20
- package/dist-es/waiters/waitForEndpointDeleted.js +1 -1
- package/dist-es/waiters/waitForEndpointInService.js +1 -1
- package/dist-es/waiters/waitForImageCreated.js +1 -1
- package/dist-es/waiters/waitForImageDeleted.js +1 -1
- package/dist-es/waiters/waitForImageUpdated.js +1 -1
- package/dist-es/waiters/waitForImageVersionCreated.js +2 -2
- package/dist-es/waiters/waitForImageVersionDeleted.js +2 -2
- package/dist-es/waiters/waitForNotebookInstanceDeleted.js +1 -1
- package/dist-es/waiters/waitForNotebookInstanceInService.js +1 -1
- package/dist-es/waiters/waitForNotebookInstanceStopped.js +1 -1
- package/dist-es/waiters/waitForProcessingJobCompletedOrStopped.js +1 -1
- package/dist-es/waiters/waitForTrainingJobCompletedOrStopped.js +2 -2
- package/dist-es/waiters/waitForTransformJobCompletedOrStopped.js +2 -2
- package/dist-types/SageMaker.d.ts +381 -381
- package/dist-types/SageMakerClient.d.ts +384 -384
- package/dist-types/auth/httpAuthExtensionConfiguration.d.ts +1 -1
- package/dist-types/auth/httpAuthSchemeProvider.d.ts +1 -1
- package/dist-types/commands/CreateEndpointConfigCommand.d.ts +10 -0
- package/dist-types/commands/CreateInferenceComponentCommand.d.ts +7 -0
- package/dist-types/commands/DescribeEndpointCommand.d.ts +20 -0
- package/dist-types/commands/DescribeEndpointConfigCommand.d.ts +10 -0
- package/dist-types/commands/DescribeInferenceComponentCommand.d.ts +7 -0
- package/dist-types/commands/ListPipelineParametersForExecutionCommand.d.ts +2 -1
- package/dist-types/commands/ListPipelinesCommand.d.ts +1 -2
- package/dist-types/commands/SearchCommand.d.ts +10 -0
- package/dist-types/commands/UpdateInferenceComponentCommand.d.ts +7 -0
- package/dist-types/index.d.ts +1 -1
- package/dist-types/models/enums.d.ts +35 -0
- package/dist-types/models/models_0.d.ts +1 -1
- package/dist-types/models/models_1.d.ts +65 -93
- package/dist-types/models/models_2.d.ts +99 -46
- package/dist-types/models/models_3.d.ts +47 -105
- package/dist-types/models/models_4.d.ts +106 -5
- package/dist-types/pagination/CreateHubContentPresignedUrlsPaginator.d.ts +1 -1
- package/dist-types/pagination/DescribeTrainingPlanExtensionHistoryPaginator.d.ts +1 -1
- package/dist-types/pagination/ListActionsPaginator.d.ts +1 -1
- package/dist-types/pagination/ListAlgorithmsPaginator.d.ts +1 -1
- package/dist-types/pagination/ListAliasesPaginator.d.ts +1 -1
- package/dist-types/pagination/ListAppImageConfigsPaginator.d.ts +1 -1
- package/dist-types/pagination/ListAppsPaginator.d.ts +1 -1
- package/dist-types/pagination/ListArtifactsPaginator.d.ts +1 -1
- package/dist-types/pagination/ListAssociationsPaginator.d.ts +1 -1
- package/dist-types/pagination/ListAutoMLJobsPaginator.d.ts +1 -1
- package/dist-types/pagination/ListCandidatesForAutoMLJobPaginator.d.ts +1 -1
- package/dist-types/pagination/ListClusterEventsPaginator.d.ts +1 -1
- package/dist-types/pagination/ListClusterNodesPaginator.d.ts +1 -1
- package/dist-types/pagination/ListClusterSchedulerConfigsPaginator.d.ts +1 -1
- package/dist-types/pagination/ListClustersPaginator.d.ts +1 -1
- package/dist-types/pagination/ListCodeRepositoriesPaginator.d.ts +1 -1
- package/dist-types/pagination/ListCompilationJobsPaginator.d.ts +1 -1
- package/dist-types/pagination/ListComputeQuotasPaginator.d.ts +1 -1
- package/dist-types/pagination/ListContextsPaginator.d.ts +1 -1
- package/dist-types/pagination/ListDataQualityJobDefinitionsPaginator.d.ts +1 -1
- package/dist-types/pagination/ListDeviceFleetsPaginator.d.ts +1 -1
- package/dist-types/pagination/ListDevicesPaginator.d.ts +1 -1
- package/dist-types/pagination/ListDomainsPaginator.d.ts +1 -1
- package/dist-types/pagination/ListEdgeDeploymentPlansPaginator.d.ts +1 -1
- package/dist-types/pagination/ListEdgePackagingJobsPaginator.d.ts +1 -1
- package/dist-types/pagination/ListEndpointConfigsPaginator.d.ts +1 -1
- package/dist-types/pagination/ListEndpointsPaginator.d.ts +1 -1
- package/dist-types/pagination/ListExperimentsPaginator.d.ts +1 -1
- package/dist-types/pagination/ListFeatureGroupsPaginator.d.ts +1 -1
- package/dist-types/pagination/ListFlowDefinitionsPaginator.d.ts +1 -1
- package/dist-types/pagination/ListHumanTaskUisPaginator.d.ts +1 -1
- package/dist-types/pagination/ListHyperParameterTuningJobsPaginator.d.ts +1 -1
- package/dist-types/pagination/ListImageVersionsPaginator.d.ts +1 -1
- package/dist-types/pagination/ListImagesPaginator.d.ts +1 -1
- package/dist-types/pagination/ListInferenceComponentsPaginator.d.ts +1 -1
- package/dist-types/pagination/ListInferenceExperimentsPaginator.d.ts +1 -1
- package/dist-types/pagination/ListInferenceRecommendationsJobStepsPaginator.d.ts +1 -1
- package/dist-types/pagination/ListInferenceRecommendationsJobsPaginator.d.ts +1 -1
- package/dist-types/pagination/ListLabelingJobsForWorkteamPaginator.d.ts +1 -1
- package/dist-types/pagination/ListLabelingJobsPaginator.d.ts +1 -1
- package/dist-types/pagination/ListLineageGroupsPaginator.d.ts +1 -1
- package/dist-types/pagination/ListMlflowAppsPaginator.d.ts +1 -1
- package/dist-types/pagination/ListMlflowTrackingServersPaginator.d.ts +1 -1
- package/dist-types/pagination/ListModelBiasJobDefinitionsPaginator.d.ts +1 -1
- package/dist-types/pagination/ListModelCardExportJobsPaginator.d.ts +1 -1
- package/dist-types/pagination/ListModelCardVersionsPaginator.d.ts +1 -1
- package/dist-types/pagination/ListModelCardsPaginator.d.ts +1 -1
- package/dist-types/pagination/ListModelExplainabilityJobDefinitionsPaginator.d.ts +1 -1
- package/dist-types/pagination/ListModelMetadataPaginator.d.ts +1 -1
- package/dist-types/pagination/ListModelPackageGroupsPaginator.d.ts +1 -1
- package/dist-types/pagination/ListModelPackagesPaginator.d.ts +1 -1
- package/dist-types/pagination/ListModelQualityJobDefinitionsPaginator.d.ts +1 -1
- package/dist-types/pagination/ListModelsPaginator.d.ts +1 -1
- package/dist-types/pagination/ListMonitoringAlertHistoryPaginator.d.ts +1 -1
- package/dist-types/pagination/ListMonitoringAlertsPaginator.d.ts +1 -1
- package/dist-types/pagination/ListMonitoringExecutionsPaginator.d.ts +1 -1
- package/dist-types/pagination/ListMonitoringSchedulesPaginator.d.ts +1 -1
- package/dist-types/pagination/ListNotebookInstanceLifecycleConfigsPaginator.d.ts +1 -1
- package/dist-types/pagination/ListNotebookInstancesPaginator.d.ts +1 -1
- package/dist-types/pagination/ListOptimizationJobsPaginator.d.ts +1 -1
- package/dist-types/pagination/ListPartnerAppsPaginator.d.ts +1 -1
- package/dist-types/pagination/ListPipelineExecutionStepsPaginator.d.ts +1 -1
- package/dist-types/pagination/ListPipelineExecutionsPaginator.d.ts +1 -1
- package/dist-types/pagination/ListPipelineParametersForExecutionPaginator.d.ts +1 -1
- package/dist-types/pagination/ListPipelineVersionsPaginator.d.ts +1 -1
- package/dist-types/pagination/ListPipelinesPaginator.d.ts +1 -1
- package/dist-types/pagination/ListProcessingJobsPaginator.d.ts +1 -1
- package/dist-types/pagination/ListProjectsPaginator.d.ts +1 -1
- package/dist-types/pagination/ListResourceCatalogsPaginator.d.ts +1 -1
- package/dist-types/pagination/ListSpacesPaginator.d.ts +1 -1
- package/dist-types/pagination/ListStageDevicesPaginator.d.ts +1 -1
- package/dist-types/pagination/ListStudioLifecycleConfigsPaginator.d.ts +1 -1
- package/dist-types/pagination/ListSubscribedWorkteamsPaginator.d.ts +1 -1
- package/dist-types/pagination/ListTagsPaginator.d.ts +1 -1
- package/dist-types/pagination/ListTrainingJobsForHyperParameterTuningJobPaginator.d.ts +1 -1
- package/dist-types/pagination/ListTrainingJobsPaginator.d.ts +1 -1
- package/dist-types/pagination/ListTrainingPlansPaginator.d.ts +1 -1
- package/dist-types/pagination/ListTransformJobsPaginator.d.ts +1 -1
- package/dist-types/pagination/ListTrialComponentsPaginator.d.ts +1 -1
- package/dist-types/pagination/ListTrialsPaginator.d.ts +1 -1
- package/dist-types/pagination/ListUltraServersByReservedCapacityPaginator.d.ts +1 -1
- package/dist-types/pagination/ListUserProfilesPaginator.d.ts +1 -1
- package/dist-types/pagination/ListWorkforcesPaginator.d.ts +1 -1
- package/dist-types/pagination/ListWorkteamsPaginator.d.ts +1 -1
- package/dist-types/pagination/QueryLineagePaginator.d.ts +1 -1
- package/dist-types/pagination/SearchPaginator.d.ts +1 -1
- package/dist-types/runtimeConfig.browser.d.ts +1 -1
- package/dist-types/runtimeConfig.d.ts +1 -1
- package/dist-types/runtimeConfig.native.d.ts +1 -1
- package/dist-types/schemas/schemas_0.d.ts +3 -0
- package/dist-types/ts3.4/SageMakerClient.d.ts +2 -3
- package/dist-types/ts3.4/auth/httpAuthExtensionConfiguration.d.ts +1 -1
- package/dist-types/ts3.4/auth/httpAuthSchemeProvider.d.ts +1 -1
- package/dist-types/ts3.4/commands/ListPipelineParametersForExecutionCommand.d.ts +2 -4
- package/dist-types/ts3.4/commands/ListPipelinesCommand.d.ts +4 -2
- package/dist-types/ts3.4/models/enums.d.ts +17 -0
- package/dist-types/ts3.4/models/models_1.d.ts +35 -58
- package/dist-types/ts3.4/models/models_2.d.ts +68 -30
- package/dist-types/ts3.4/models/models_3.d.ts +45 -61
- package/dist-types/ts3.4/models/models_4.d.ts +55 -32
- package/dist-types/ts3.4/runtimeConfig.browser.d.ts +1 -1
- package/dist-types/ts3.4/runtimeConfig.d.ts +1 -1
- package/dist-types/ts3.4/runtimeConfig.native.d.ts +1 -1
- package/dist-types/ts3.4/schemas/schemas_0.d.ts +3 -0
- package/dist-types/waiters/waitForEndpointDeleted.d.ts +3 -3
- package/dist-types/waiters/waitForEndpointInService.d.ts +3 -3
- package/dist-types/waiters/waitForImageCreated.d.ts +3 -3
- package/dist-types/waiters/waitForImageDeleted.d.ts +3 -3
- package/dist-types/waiters/waitForImageUpdated.d.ts +3 -3
- package/dist-types/waiters/waitForImageVersionCreated.d.ts +3 -3
- package/dist-types/waiters/waitForImageVersionDeleted.d.ts +3 -3
- package/dist-types/waiters/waitForNotebookInstanceDeleted.d.ts +3 -3
- package/dist-types/waiters/waitForNotebookInstanceInService.d.ts +3 -3
- package/dist-types/waiters/waitForNotebookInstanceStopped.d.ts +3 -3
- package/dist-types/waiters/waitForProcessingJobCompletedOrStopped.d.ts +3 -3
- package/dist-types/waiters/waitForTrainingJobCompletedOrStopped.d.ts +3 -3
- package/dist-types/waiters/waitForTransformJobCompletedOrStopped.d.ts +3 -3
- package/package.json +15 -15
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
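import { type HttpAuthScheme, AwsCredentialIdentity, AwsCredentialIdentityProvider } from "@smithy/types";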
|
|
1
|
+
import type { AwsCredentialIdentity, AwsCredentialIdentityProvider, HttpAuthScheme } from "@smithy/types";
|
|
2
2
|
import type { SageMakerHttpAuthSchemeProvider } from "./httpAuthSchemeProvider";
|
|
3
3
|
/**
|
|
4
4
|
* @internal
|
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
import { AwsSdkSigV4AuthInputConfig, AwsSdkSigV4AuthResolvedConfig, AwsSdkSigV4PreviouslyResolved } from "@aws-sdk/core";
|
|
1
|
+
import { AwsSdkSigV4AuthInputConfig, AwsSdkSigV4AuthResolvedConfig, AwsSdkSigV4PreviouslyResolved } from "@aws-sdk/core/httpAuthSchemes";
|
|
2
2
|
import type { HandlerExecutionContext, HttpAuthScheme, HttpAuthSchemeParameters, HttpAuthSchemeParametersProvider, HttpAuthSchemeProvider, Provider } from "@smithy/types";
|
|
3
3
|
import { type SageMakerClientResolvedConfig } from "../SageMakerClient";
|
|
4
4
|
/**
|
|
@@ -63,6 +63,11 @@ declare const CreateEndpointConfigCommand_base: {
|
|
|
63
63
|
* Status: "ENABLED" || "DISABLED",
|
|
64
64
|
* MinInstanceCount: Number("int"),
|
|
65
65
|
* MaxInstanceCount: Number("int"),
|
|
66
|
+
* ScaleInPolicy: { // ProductionVariantManagedInstanceScalingScaleInPolicy
|
|
67
|
+
* Strategy: "IDLE_RELEASE" || "CONSOLIDATION", // required
|
|
68
|
+
* MaximumStepSize: Number("int"),
|
|
69
|
+
* CooldownInMinutes: Number("int"),
|
|
70
|
+
* },
|
|
66
71
|
* },
|
|
67
72
|
* RoutingConfig: { // ProductionVariantRoutingConfig
|
|
68
73
|
* RoutingStrategy: "LEAST_OUTSTANDING_REQUESTS" || "RANDOM", // required
|
|
@@ -180,6 +185,11 @@ declare const CreateEndpointConfigCommand_base: {
|
|
|
180
185
|
* Status: "ENABLED" || "DISABLED",
|
|
181
186
|
* MinInstanceCount: Number("int"),
|
|
182
187
|
* MaxInstanceCount: Number("int"),
|
|
188
|
+
* ScaleInPolicy: {
|
|
189
|
+
* Strategy: "IDLE_RELEASE" || "CONSOLIDATION", // required
|
|
190
|
+
* MaximumStepSize: Number("int"),
|
|
191
|
+
* CooldownInMinutes: Number("int"),
|
|
192
|
+
* },
|
|
183
193
|
* },
|
|
184
194
|
* RoutingConfig: {
|
|
185
195
|
* RoutingStrategy: "LEAST_OUTSTANDING_REQUESTS" || "RANDOM", // required
|
|
@@ -63,6 +63,13 @@ declare const CreateInferenceComponentCommand_base: {
|
|
|
63
63
|
* DataCacheConfig: { // InferenceComponentDataCacheConfig
|
|
64
64
|
* EnableCaching: true || false, // required
|
|
65
65
|
* },
|
|
66
|
+
* SchedulingConfig: { // InferenceComponentSchedulingConfig
|
|
67
|
+
* PlacementStrategy: "SPREAD" || "BINPACK", // required
|
|
68
|
+
* AvailabilityZoneBalance: { // InferenceComponentAvailabilityZoneBalance
|
|
69
|
+
* EnforcementMode: "PERMISSIVE", // required
|
|
70
|
+
* MaxImbalance: Number("int"),
|
|
71
|
+
* },
|
|
72
|
+
* },
|
|
66
73
|
* },
|
|
67
74
|
* RuntimeConfig: { // InferenceComponentRuntimeConfig
|
|
68
75
|
* CopyCount: Number("int"), // required
|
|
@@ -80,6 +80,11 @@ declare const DescribeEndpointCommand_base: {
|
|
|
80
80
|
* // Status: "ENABLED" || "DISABLED",
|
|
81
81
|
* // MinInstanceCount: Number("int"),
|
|
82
82
|
* // MaxInstanceCount: Number("int"),
|
|
83
|
+
* // ScaleInPolicy: { // ProductionVariantManagedInstanceScalingScaleInPolicy
|
|
84
|
+
* // Strategy: "IDLE_RELEASE" || "CONSOLIDATION", // required
|
|
85
|
+
* // MaximumStepSize: Number("int"),
|
|
86
|
+
* // CooldownInMinutes: Number("int"),
|
|
87
|
+
* // },
|
|
83
88
|
* // },
|
|
84
89
|
* // RoutingConfig: { // ProductionVariantRoutingConfig
|
|
85
90
|
* // RoutingStrategy: "LEAST_OUTSTANDING_REQUESTS" || "RANDOM", // required
|
|
@@ -205,6 +210,11 @@ declare const DescribeEndpointCommand_base: {
|
|
|
205
210
|
* // Status: "ENABLED" || "DISABLED",
|
|
206
211
|
* // MinInstanceCount: Number("int"),
|
|
207
212
|
* // MaxInstanceCount: Number("int"),
|
|
213
|
+
* // ScaleInPolicy: {
|
|
214
|
+
* // Strategy: "IDLE_RELEASE" || "CONSOLIDATION", // required
|
|
215
|
+
* // MaximumStepSize: Number("int"),
|
|
216
|
+
* // CooldownInMinutes: Number("int"),
|
|
217
|
+
* // },
|
|
208
218
|
* // },
|
|
209
219
|
* // RoutingConfig: {
|
|
210
220
|
* // RoutingStrategy: "LEAST_OUTSTANDING_REQUESTS" || "RANDOM", // required
|
|
@@ -245,6 +255,11 @@ declare const DescribeEndpointCommand_base: {
|
|
|
245
255
|
* // Status: "ENABLED" || "DISABLED",
|
|
246
256
|
* // MinInstanceCount: Number("int"),
|
|
247
257
|
* // MaxInstanceCount: Number("int"),
|
|
258
|
+
* // ScaleInPolicy: {
|
|
259
|
+
* // Strategy: "IDLE_RELEASE" || "CONSOLIDATION", // required
|
|
260
|
+
* // MaximumStepSize: Number("int"),
|
|
261
|
+
* // CooldownInMinutes: Number("int"),
|
|
262
|
+
* // },
|
|
248
263
|
* // },
|
|
249
264
|
* // RoutingConfig: {
|
|
250
265
|
* // RoutingStrategy: "LEAST_OUTSTANDING_REQUESTS" || "RANDOM", // required
|
|
@@ -317,6 +332,11 @@ declare const DescribeEndpointCommand_base: {
|
|
|
317
332
|
* // Status: "ENABLED" || "DISABLED",
|
|
318
333
|
* // MinInstanceCount: Number("int"),
|
|
319
334
|
* // MaxInstanceCount: Number("int"),
|
|
335
|
+
* // ScaleInPolicy: {
|
|
336
|
+
* // Strategy: "IDLE_RELEASE" || "CONSOLIDATION", // required
|
|
337
|
+
* // MaximumStepSize: Number("int"),
|
|
338
|
+
* // CooldownInMinutes: Number("int"),
|
|
339
|
+
* // },
|
|
320
340
|
* // },
|
|
321
341
|
* // RoutingConfig: {
|
|
322
342
|
* // RoutingStrategy: "LEAST_OUTSTANDING_REQUESTS" || "RANDOM", // required
|
|
@@ -69,6 +69,11 @@ declare const DescribeEndpointConfigCommand_base: {
|
|
|
69
69
|
* // Status: "ENABLED" || "DISABLED",
|
|
70
70
|
* // MinInstanceCount: Number("int"),
|
|
71
71
|
* // MaxInstanceCount: Number("int"),
|
|
72
|
+
* // ScaleInPolicy: { // ProductionVariantManagedInstanceScalingScaleInPolicy
|
|
73
|
+
* // Strategy: "IDLE_RELEASE" || "CONSOLIDATION", // required
|
|
74
|
+
* // MaximumStepSize: Number("int"),
|
|
75
|
+
* // CooldownInMinutes: Number("int"),
|
|
76
|
+
* // },
|
|
72
77
|
* // },
|
|
73
78
|
* // RoutingConfig: { // ProductionVariantRoutingConfig
|
|
74
79
|
* // RoutingStrategy: "LEAST_OUTSTANDING_REQUESTS" || "RANDOM", // required
|
|
@@ -181,6 +186,11 @@ declare const DescribeEndpointConfigCommand_base: {
|
|
|
181
186
|
* // Status: "ENABLED" || "DISABLED",
|
|
182
187
|
* // MinInstanceCount: Number("int"),
|
|
183
188
|
* // MaxInstanceCount: Number("int"),
|
|
189
|
+
* // ScaleInPolicy: {
|
|
190
|
+
* // Strategy: "IDLE_RELEASE" || "CONSOLIDATION", // required
|
|
191
|
+
* // MaximumStepSize: Number("int"),
|
|
192
|
+
* // CooldownInMinutes: Number("int"),
|
|
193
|
+
* // },
|
|
184
194
|
* // },
|
|
185
195
|
* // RoutingConfig: {
|
|
186
196
|
* // RoutingStrategy: "LEAST_OUTSTANDING_REQUESTS" || "RANDOM", // required
|
|
@@ -75,6 +75,13 @@ declare const DescribeInferenceComponentCommand_base: {
|
|
|
75
75
|
* // DataCacheConfig: { // InferenceComponentDataCacheConfigSummary
|
|
76
76
|
* // EnableCaching: true || false, // required
|
|
77
77
|
* // },
|
|
78
|
+
* // SchedulingConfig: { // InferenceComponentSchedulingConfig
|
|
79
|
+
* // PlacementStrategy: "SPREAD" || "BINPACK", // required
|
|
80
|
+
* // AvailabilityZoneBalance: { // InferenceComponentAvailabilityZoneBalance
|
|
81
|
+
* // EnforcementMode: "PERMISSIVE", // required
|
|
82
|
+
* // MaxImbalance: Number("int"),
|
|
83
|
+
* // },
|
|
84
|
+
* // },
|
|
78
85
|
* // },
|
|
79
86
|
* // RuntimeConfig: { // InferenceComponentRuntimeConfigSummary
|
|
80
87
|
* // DesiredCopyCount: Number("int"),
|
|
@@ -1,6 +1,7 @@
|
|
|
1
1
|
import { Command as $Command } from "@smithy/smithy-client";
|
|
2
2
|
import type { MetadataBearer as __MetadataBearer } from "@smithy/types";
|
|
3
|
-
import type { ListPipelineParametersForExecutionRequest, ListPipelineParametersForExecutionResponse } from "../models/models_3";
|
|
3
|
+
import type { ListPipelineParametersForExecutionRequest } from "../models/models_3";
|
|
4
|
+
import type { ListPipelineParametersForExecutionResponse } from "../models/models_4";
|
|
4
5
|
import type { SageMakerClientResolvedConfig, ServiceInputTypes, ServiceOutputTypes } from "../SageMakerClient";
|
|
5
6
|
/**
|
|
6
7
|
* @public
|
|
@@ -1,7 +1,6 @@
|
|
|
1
1
|
import { Command as $Command } from "@smithy/smithy-client";
|
|
2
2
|
import type { MetadataBearer as __MetadataBearer } from "@smithy/types";
|
|
3
|
-
import type { ListPipelinesRequest } from "../models/models_3";
|
|
4
|
-
import type { ListPipelinesResponse } from "../models/models_4";
|
|
3
|
+
import type { ListPipelinesRequest, ListPipelinesResponse } from "../models/models_4";
|
|
5
4
|
import type { SageMakerClientResolvedConfig, ServiceInputTypes, ServiceOutputTypes } from "../SageMakerClient";
|
|
6
5
|
/**
|
|
7
6
|
* @public
|
|
@@ -928,6 +928,11 @@ declare const SearchCommand_base: {
|
|
|
928
928
|
* // Status: "ENABLED" || "DISABLED",
|
|
929
929
|
* // MinInstanceCount: Number("int"),
|
|
930
930
|
* // MaxInstanceCount: Number("int"),
|
|
931
|
+
* // ScaleInPolicy: { // ProductionVariantManagedInstanceScalingScaleInPolicy
|
|
932
|
+
* // Strategy: "IDLE_RELEASE" || "CONSOLIDATION", // required
|
|
933
|
+
* // MaximumStepSize: Number("int"),
|
|
934
|
+
* // CooldownInMinutes: Number("int"),
|
|
935
|
+
* // },
|
|
931
936
|
* // },
|
|
932
937
|
* // RoutingConfig: { // ProductionVariantRoutingConfig
|
|
933
938
|
* // RoutingStrategy: "LEAST_OUTSTANDING_REQUESTS" || "RANDOM", // required
|
|
@@ -1123,6 +1128,11 @@ declare const SearchCommand_base: {
|
|
|
1123
1128
|
* // Status: "ENABLED" || "DISABLED",
|
|
1124
1129
|
* // MinInstanceCount: Number("int"),
|
|
1125
1130
|
* // MaxInstanceCount: Number("int"),
|
|
1131
|
+
* // ScaleInPolicy: {
|
|
1132
|
+
* // Strategy: "IDLE_RELEASE" || "CONSOLIDATION", // required
|
|
1133
|
+
* // MaximumStepSize: Number("int"),
|
|
1134
|
+
* // CooldownInMinutes: Number("int"),
|
|
1135
|
+
* // },
|
|
1126
1136
|
* // },
|
|
1127
1137
|
* // RoutingConfig: {
|
|
1128
1138
|
* // RoutingStrategy: "LEAST_OUTSTANDING_REQUESTS" || "RANDOM", // required
|
|
@@ -61,6 +61,13 @@ declare const UpdateInferenceComponentCommand_base: {
|
|
|
61
61
|
* DataCacheConfig: { // InferenceComponentDataCacheConfig
|
|
62
62
|
* EnableCaching: true || false, // required
|
|
63
63
|
* },
|
|
64
|
+
* SchedulingConfig: { // InferenceComponentSchedulingConfig
|
|
65
|
+
* PlacementStrategy: "SPREAD" || "BINPACK", // required
|
|
66
|
+
* AvailabilityZoneBalance: { // InferenceComponentAvailabilityZoneBalance
|
|
67
|
+
* EnforcementMode: "PERMISSIVE", // required
|
|
68
|
+
* MaxImbalance: Number("int"),
|
|
69
|
+
* },
|
|
70
|
+
* },
|
|
64
71
|
* },
|
|
65
72
|
* RuntimeConfig: { // InferenceComponentRuntimeConfig
|
|
66
73
|
* CopyCount: Number("int"), // required
|
package/dist-types/index.d.ts
CHANGED
|
@@ -5,7 +5,7 @@
|
|
|
5
5
|
*/
|
|
6
6
|
export * from "./SageMakerClient";
|
|
7
7
|
export * from "./SageMaker";
|
|
8
|
-
export { ClientInputEndpointParameters } from "./endpoint/EndpointParameters";
|
|
8
|
+
export type { ClientInputEndpointParameters } from "./endpoint/EndpointParameters";
|
|
9
9
|
export type { RuntimeExtension } from "./runtimeExtensions";
|
|
10
10
|
export type { SageMakerExtensionConfiguration } from "./extensionConfiguration";
|
|
11
11
|
export * from "./commands";
|
|
@@ -1727,6 +1727,17 @@ export declare const AutotuneMode: {
|
|
|
1727
1727
|
* @public
|
|
1728
1728
|
*/
|
|
1729
1729
|
export type AutotuneMode = (typeof AutotuneMode)[keyof typeof AutotuneMode];
|
|
1730
|
+
/**
|
|
1731
|
+
* @public
|
|
1732
|
+
* @enum
|
|
1733
|
+
*/
|
|
1734
|
+
export declare const AvailabilityZoneBalanceEnforcementMode: {
|
|
1735
|
+
readonly PERMISSIVE: "PERMISSIVE";
|
|
1736
|
+
};
|
|
1737
|
+
/**
|
|
1738
|
+
* @public
|
|
1739
|
+
*/
|
|
1740
|
+
export type AvailabilityZoneBalanceEnforcementMode = (typeof AvailabilityZoneBalanceEnforcementMode)[keyof typeof AvailabilityZoneBalanceEnforcementMode];
|
|
1730
1741
|
/**
|
|
1731
1742
|
* @public
|
|
1732
1743
|
* @enum
|
|
@@ -2998,6 +3009,18 @@ export declare const ProductionVariantInferenceAmiVersion: {
|
|
|
2998
3009
|
* @public
|
|
2999
3010
|
*/
|
|
3000
3011
|
export type ProductionVariantInferenceAmiVersion = (typeof ProductionVariantInferenceAmiVersion)[keyof typeof ProductionVariantInferenceAmiVersion];
|
|
3012
|
+
/**
|
|
3013
|
+
* @public
|
|
3014
|
+
* @enum
|
|
3015
|
+
*/
|
|
3016
|
+
export declare const ManagedInstanceScalingScaleInStrategy: {
|
|
3017
|
+
readonly CONSOLIDATION: "CONSOLIDATION";
|
|
3018
|
+
readonly IDLE_RELEASE: "IDLE_RELEASE";
|
|
3019
|
+
};
|
|
3020
|
+
/**
|
|
3021
|
+
* @public
|
|
3022
|
+
*/
|
|
3023
|
+
export type ManagedInstanceScalingScaleInStrategy = (typeof ManagedInstanceScalingScaleInStrategy)[keyof typeof ManagedInstanceScalingScaleInStrategy];
|
|
3001
3024
|
/**
|
|
3002
3025
|
* @public
|
|
3003
3026
|
* @enum
|
|
@@ -3190,6 +3213,18 @@ export declare const VendorGuidance: {
|
|
|
3190
3213
|
* @public
|
|
3191
3214
|
*/
|
|
3192
3215
|
export type VendorGuidance = (typeof VendorGuidance)[keyof typeof VendorGuidance];
|
|
3216
|
+
/**
|
|
3217
|
+
* @public
|
|
3218
|
+
* @enum
|
|
3219
|
+
*/
|
|
3220
|
+
export declare const InferenceComponentPlacementStrategy: {
|
|
3221
|
+
readonly BINPACK: "BINPACK";
|
|
3222
|
+
readonly SPREAD: "SPREAD";
|
|
3223
|
+
};
|
|
3224
|
+
/**
|
|
3225
|
+
* @public
|
|
3226
|
+
*/
|
|
3227
|
+
export type InferenceComponentPlacementStrategy = (typeof InferenceComponentPlacementStrategy)[keyof typeof InferenceComponentPlacementStrategy];
|
|
3193
3228
|
/**
|
|
3194
3229
|
* @public
|
|
3195
3230
|
* @enum
|
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
import { ActionStatus, ActivationState, ActiveClusterOperationName, AdditionalS3DataSourceDataType, AggregationTransformationValue, AlgorithmStatus, AppInstanceType, AppStatus, AppType, ArtifactSourceIdType, AssemblyType, AssociationEdgeType, AsyncNotificationTopicTypes, AthenaResultCompressionType, AthenaResultFormat, AutoMLAlgorithm, AutoMLChannelType, AutoMLJobObjectiveType, AutoMLJobSecondaryStatus, AutoMLJobStatus, AutoMLMetricEnum, AutoMLMetricExtendedEnum, AutoMLMode, AutoMLProcessingUnit, AutoMLS3DataType, AutotuneMode, BatchAddClusterNodesErrorCode, BatchDeleteClusterNodesErrorCode, BatchRebootClusterNodesErrorCode, BatchReplaceClusterNodesErrorCode, BatchStrategy, CandidateStatus, CandidateStepType, CapacityReservationType, CapacitySizeType, CaptureMode, ClarifyFeatureType, ClarifyTextGranularity, ClarifyTextLanguage, ClusterAutoScalerType, ClusterAutoScalingMode, ClusterAutoScalingStatus, ClusterCapacityType, ClusterConfigMode, ClusterEventResourceType, ClusterInstanceStatus, ClusterInstanceType, ClusterKubernetesTaintEffect, ClusterNodeProvisioningMode, ClusterNodeRecovery, ClusterSlurmConfigStrategy, ClusterSlurmNodeType, ClusterStatus, CompilationJobStatus, CompleteOnConvergence, CompressionType, ConditionOutcome, ContainerMode, DataSourceName, DeepHealthCheckType, DetailedAlgorithmStatus, FairShare, FeatureStatus, FileSystemAccessMode, FileSystemType, FillingType, Framework, HyperParameterScalingType, HyperParameterTuningJobObjectiveType, IdleResourceSharing, InstanceGroupStatus, LifecycleManagement, MetricSetSource, MIGProfileType, ModelApprovalStatus, ModelCacheSetting, ModelCompressionType, ModelPackageRegistrationType, ModelPackageStatus, NodeUnavailabilityType, ObjectiveStatus, OutputCompressionType, ParameterType, PreemptTeamTasks, ProblemType, ProcessingS3DataDistributionType, ProcessingS3InputMode, ProductionVariantInstanceType, RecordWrapper, RepositoryAccessMode, ResourceSharingStrategy, S3DataDistribution, S3DataType, S3ModelDataType, 
SchedulerResourceStatus, SoftwareUpdateStatus, SplitType, TargetDevice, TargetPlatformAccelerator, TargetPlatformArch, TargetPlatformOs, TrafficRoutingConfigType, TrainingInputMode, TrainingInstanceType, TrainingRepositoryAccessMode, TransformInstanceType, VolumeAttachmentStatus } from "./enums";
|
|
1
|
+
import type { ActionStatus, ActivationState, ActiveClusterOperationName, AdditionalS3DataSourceDataType, AggregationTransformationValue, AlgorithmStatus, AppInstanceType, AppStatus, AppType, ArtifactSourceIdType, AssemblyType, AssociationEdgeType, AsyncNotificationTopicTypes, AthenaResultCompressionType, AthenaResultFormat, AutoMLAlgorithm, AutoMLChannelType, AutoMLJobObjectiveType, AutoMLJobSecondaryStatus, AutoMLJobStatus, AutoMLMetricEnum, AutoMLMetricExtendedEnum, AutoMLMode, AutoMLProcessingUnit, AutoMLS3DataType, AutotuneMode, BatchAddClusterNodesErrorCode, BatchDeleteClusterNodesErrorCode, BatchRebootClusterNodesErrorCode, BatchReplaceClusterNodesErrorCode, BatchStrategy, CandidateStatus, CandidateStepType, CapacityReservationType, CapacitySizeType, CaptureMode, ClarifyFeatureType, ClarifyTextGranularity, ClarifyTextLanguage, ClusterAutoScalerType, ClusterAutoScalingMode, ClusterAutoScalingStatus, ClusterCapacityType, ClusterConfigMode, ClusterEventResourceType, ClusterInstanceStatus, ClusterInstanceType, ClusterKubernetesTaintEffect, ClusterNodeProvisioningMode, ClusterNodeRecovery, ClusterSlurmConfigStrategy, ClusterSlurmNodeType, ClusterStatus, CompilationJobStatus, CompleteOnConvergence, CompressionType, ConditionOutcome, ContainerMode, DataSourceName, DeepHealthCheckType, DetailedAlgorithmStatus, FairShare, FeatureStatus, FileSystemAccessMode, FileSystemType, FillingType, Framework, HyperParameterScalingType, HyperParameterTuningJobObjectiveType, IdleResourceSharing, InstanceGroupStatus, LifecycleManagement, MetricSetSource, MIGProfileType, ModelApprovalStatus, ModelCacheSetting, ModelCompressionType, ModelPackageRegistrationType, ModelPackageStatus, NodeUnavailabilityType, ObjectiveStatus, OutputCompressionType, ParameterType, PreemptTeamTasks, ProblemType, ProcessingS3DataDistributionType, ProcessingS3InputMode, ProductionVariantInstanceType, RecordWrapper, RepositoryAccessMode, ResourceSharingStrategy, S3DataDistribution, S3DataType, S3ModelDataType, 
SchedulerResourceStatus, SoftwareUpdateStatus, SplitType, TargetDevice, TargetPlatformAccelerator, TargetPlatformArch, TargetPlatformOs, TrafficRoutingConfigType, TrainingInputMode, TrainingInstanceType, TrainingRepositoryAccessMode, TransformInstanceType, VolumeAttachmentStatus } from "./enums";
|
|
2
2
|
/**
|
|
3
3
|
* <p>Configuration for allocating accelerator partitions.</p>
|
|
4
4
|
* @public
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
import { AutomaticJsonStringConversion as __AutomaticJsonStringConversion } from "@smithy/smithy-client";
|
|
2
|
-
import { _InstanceType, AccountDefaultStatus, ActivationState, AppInstanceType, AppNetworkAccessType, AppSecurityGroupManagement, AppType, AuthMode, AutoMountHomeEFS, AwsManagedHumanLoopRequestSource, CapacityReservationPreference, CollectionType, ContentClassifier, DataDistributionType, DeviceSubsetType, DirectInternetAccess, EdgePresetDeploymentType, ExecutionRoleIdentityConfig, FailureHandlingPolicy, FeatureStatus, FeatureType, FlatInvocations, HubContentType, HyperParameterScalingType, HyperParameterTuningAllocationStrategy, HyperParameterTuningJobStrategyType, HyperParameterTuningJobWarmStartType, InferenceExecutionMode, InferenceExperimentType, InputMode, IPAddressType, JobType, ManagedInstanceScalingStatus, MetricPublishFrequencyInSeconds, MlTools, ModelApprovalStatus, ModelCardStatus, ModelInfrastructureType, ModelPackageRegistrationType, ModelRegistrationMode, ModelSpeculativeDecodingS3DataType, ModelSpeculativeDecodingTechnique, MonitoringProblemType, MonitoringType, NotebookInstanceAcceleratorType, NotebookOutputOption, OptimizationJobDeploymentInstanceType, PartnerAppAuthType, PartnerAppType, ProcessingInstanceType, ProcessingS3CompressionType, ProcessingS3DataDistributionType, ProcessingS3DataType, ProcessingS3InputMode, ProcessingS3UploadMode, Processor, ProductionVariantAcceleratorType, ProductionVariantInferenceAmiVersion, ProductionVariantInstanceType, RecommendationJobSupportedEndpointType, RecommendationJobType, RedshiftResultCompressionType, RedshiftResultFormat, RootAccess, RoutingStrategy, RStudioServerProAccessStatus, RStudioServerProUserGroup, SageMakerImageName, SkipModelValidation, StorageType, StudioWebPortal, TableFormat, TagPropagation, TargetDevice, ThroughputMode, TrackingServerSize, TrafficType, TrainingInputMode, TrainingInstanceType, TrainingJobEarlyStoppingType, TtlDurationUnit, VendorGuidance } from "./enums";
|
|
3
|
-
import {
|
|
2
|
+
import type { _InstanceType, AccountDefaultStatus, ActivationState, AppInstanceType, AppNetworkAccessType, AppSecurityGroupManagement, AppType, AuthMode, AutoMountHomeEFS, AvailabilityZoneBalanceEnforcementMode, AwsManagedHumanLoopRequestSource, CapacityReservationPreference, CollectionType, ContentClassifier, DataDistributionType, DeviceSubsetType, DirectInternetAccess, EdgePresetDeploymentType, ExecutionRoleIdentityConfig, FailureHandlingPolicy, FeatureStatus, FeatureType, FlatInvocations, HubContentType, HyperParameterScalingType, HyperParameterTuningAllocationStrategy, HyperParameterTuningJobStrategyType, HyperParameterTuningJobWarmStartType, InferenceComponentPlacementStrategy, InferenceExecutionMode, InferenceExperimentType, InputMode, IPAddressType, JobType, ManagedInstanceScalingScaleInStrategy, ManagedInstanceScalingStatus, MetricPublishFrequencyInSeconds, MlTools, ModelApprovalStatus, ModelCardStatus, ModelInfrastructureType, ModelPackageRegistrationType, ModelRegistrationMode, ModelSpeculativeDecodingS3DataType, ModelSpeculativeDecodingTechnique, MonitoringProblemType, MonitoringType, NotebookInstanceAcceleratorType, NotebookOutputOption, OptimizationJobDeploymentInstanceType, PartnerAppAuthType, PartnerAppType, ProcessingInstanceType, ProcessingS3CompressionType, ProcessingS3DataDistributionType, ProcessingS3DataType, ProcessingS3InputMode, ProcessingS3UploadMode, Processor, ProductionVariantAcceleratorType, ProductionVariantInferenceAmiVersion, ProductionVariantInstanceType, RecommendationJobSupportedEndpointType, RecommendationJobType, RedshiftResultCompressionType, RedshiftResultFormat, RootAccess, RoutingStrategy, RStudioServerProAccessStatus, RStudioServerProUserGroup, SageMakerImageName, SkipModelValidation, StorageType, StudioWebPortal, TableFormat, TagPropagation, TargetDevice, ThroughputMode, TrackingServerSize, TrafficType, TrainingInputMode, TrainingInstanceType, TrainingJobEarlyStoppingType, TtlDurationUnit, VendorGuidance } from "./enums";
|
|
3
|
+
import type { AdditionalInferenceSpecificationDefinition, AmazonQSettings, AnnotationConsolidationConfig, AppLifecycleManagement, AppSpecification, AsyncInferenceConfig, AthenaDatasetDefinition, AuthorizedUrl, AutoParameter, AutoRollbackConfig, Autotune, BatchTransformInput, BestObjectiveNotImproving, Bias, BlueGreenUpdatePolicy, CanvasAppSettings, CapacitySize, CaptureContentTypeHeader, CaptureOption, CategoricalParameter, CategoricalParameterRange, CfnCreateTemplateProvider, Channel, CheckpointConfig, ClarifyExplainerConfig, CodeEditorAppSettings, CodeRepository, CollectionConfig, ComputeQuotaConfig, ComputeQuotaTarget, ContainerDefinition, ContextSource, ContinuousParameterRange, ConvergenceDetected, CustomImage, HyperParameterTuningJobObjective, InferenceSpecification, InputConfig, MetadataProperties, MetricDefinition, MetricsSource, ModelDataSource, OutputDataConfig, ResourceConfig, ResourceSpec, StoppingCondition, Tag, TargetPlatform, TransformJobDefinition, VpcConfig } from "./models_0";
|
|
4
4
|
/**
|
|
5
5
|
* <p>Contains information about the output location for the compiled model and the target device that the model runs on. <code>TargetDevice</code> and <code>TargetPlatform</code> are mutually exclusive, so you need to choose one between the two to specify your target device or platform. If you cannot find your device you want to use from the <code>TargetDevice</code> list, use <code>TargetPlatform</code> to describe the platform of your edge device and <code>CompilerOptions</code> if there are specific settings that are required or recommended to use for particular TargetPlatform.</p>
|
|
6
6
|
* @public
|
|
@@ -1692,6 +1692,27 @@ export interface ProductionVariantCoreDumpConfig {
|
|
|
1692
1692
|
*/
|
|
1693
1693
|
KmsKeyId?: string | undefined;
|
|
1694
1694
|
}
|
|
1695
|
+
/**
|
|
1696
|
+
* <p>Configures the scale-in behavior for managed instance scaling.</p>
|
|
1697
|
+
* @public
|
|
1698
|
+
*/
|
|
1699
|
+
export interface ProductionVariantManagedInstanceScalingScaleInPolicy {
|
|
1700
|
+
/**
|
|
1701
|
+
* <p>The strategy for scaling in instances.</p> <dl> <dt>IDLE_RELEASE</dt> <dd> <p>Releases instances that have no hosted inference component copies.</p> </dd> <dt>CONSOLIDATION</dt> <dd> <p>Consolidates inference component copies onto fewer instances to release more instances. Consolidation honors the scheduling configuration of each inference component. For example, if an inference component specifies Availability Zone balance, consolidation only proceeds when the resulting distribution does not increase the imbalance.</p> </dd> </dl>
|
|
1702
|
+
* @public
|
|
1703
|
+
*/
|
|
1704
|
+
Strategy: ManagedInstanceScalingScaleInStrategy | undefined;
|
|
1705
|
+
/**
|
|
1706
|
+
* <p>The maximum number of instances that the endpoint can terminate at a time during a consolidation scale-in operation.</p> <p>Default value: <code>1</code>.</p>
|
|
1707
|
+
* @public
|
|
1708
|
+
*/
|
|
1709
|
+
MaximumStepSize?: number | undefined;
|
|
1710
|
+
/**
|
|
1711
|
+
* <p>The cooldown period, in minutes, after the last endpoint operation before the endpoint evaluates consolidation scale-in opportunities.</p> <p>Default value: <code>20</code>.</p>
|
|
1712
|
+
* @public
|
|
1713
|
+
*/
|
|
1714
|
+
CooldownInMinutes?: number | undefined;
|
|
1715
|
+
}
|
|
1695
1716
|
/**
|
|
1696
1717
|
* <p>Settings that control the range in the number of instances that the endpoint provisions as it scales up or down to accommodate traffic. </p>
|
|
1697
1718
|
* @public
|
|
@@ -1712,6 +1733,11 @@ export interface ProductionVariantManagedInstanceScaling {
|
|
|
1712
1733
|
* @public
|
|
1713
1734
|
*/
|
|
1714
1735
|
MaxInstanceCount?: number | undefined;
|
|
1736
|
+
/**
|
|
1737
|
+
* <p>Configures the scale-in behavior for managed instance scaling.</p>
|
|
1738
|
+
* @public
|
|
1739
|
+
*/
|
|
1740
|
+
ScaleInPolicy?: ProductionVariantManagedInstanceScalingScaleInPolicy | undefined;
|
|
1715
1741
|
}
|
|
1716
1742
|
/**
|
|
1717
1743
|
* <p>Settings that control how the endpoint routes incoming traffic to the instances that the endpoint hosts.</p>
|
|
@@ -3182,6 +3208,38 @@ export interface InferenceComponentDataCacheConfig {
|
|
|
3182
3208
|
*/
|
|
3183
3209
|
EnableCaching: boolean | undefined;
|
|
3184
3210
|
}
|
|
3211
|
+
/**
|
|
3212
|
+
* <p>Configuration for balancing inference component copies across Availability Zones.</p>
|
|
3213
|
+
* @public
|
|
3214
|
+
*/
|
|
3215
|
+
export interface InferenceComponentAvailabilityZoneBalance {
|
|
3216
|
+
/**
|
|
3217
|
+
* <p>Determines how strictly the Availability Zone balance constraint is enforced.</p> <dl> <dt>PERMISSIVE</dt> <dd> <p>The endpoint attempts to balance copies across Availability Zones but proceeds with scheduling even if balance can't be achieved due to available capacity or instance distribution across Availability Zones.</p> </dd> </dl>
|
|
3218
|
+
* @public
|
|
3219
|
+
*/
|
|
3220
|
+
EnforcementMode: AvailabilityZoneBalanceEnforcementMode | undefined;
|
|
3221
|
+
/**
|
|
3222
|
+
* <p>The maximum allowed difference in the number of inference component copies between any two Availability Zones. This parameter applies only when the endpoint has instances across two or more Availability Zones. A copy placement is allowed if it reduces imbalance or the resulting imbalance is within this value.</p> <p>Default value: <code>0</code>.</p>
|
|
3223
|
+
* @public
|
|
3224
|
+
*/
|
|
3225
|
+
MaxImbalance?: number | undefined;
|
|
3226
|
+
}
|
|
3227
|
+
/**
|
|
3228
|
+
* <p>The scheduling configuration that determines how inference component copies are placed across available instances when copies are added or removed.</p>
|
|
3229
|
+
* @public
|
|
3230
|
+
*/
|
|
3231
|
+
export interface InferenceComponentSchedulingConfig {
|
|
3232
|
+
/**
|
|
3233
|
+
* <p>The strategy for placing inference component copies across available instances. If you also set <code>AvailabilityZoneBalance</code>, this strategy applies to placement within each Availability Zone.</p> <dl> <dt>SPREAD</dt> <dd> <p>Distributes copies evenly across available instances for better resilience.</p> </dd> <dt>BINPACK</dt> <dd> <p>Packs copies onto fewer instances to optimize resource utilization.</p> </dd> </dl>
|
|
3234
|
+
* @public
|
|
3235
|
+
*/
|
|
3236
|
+
PlacementStrategy: InferenceComponentPlacementStrategy | undefined;
|
|
3237
|
+
/**
|
|
3238
|
+
* <p>Configuration for balancing inference component copies across Availability Zones.</p>
|
|
3239
|
+
* @public
|
|
3240
|
+
*/
|
|
3241
|
+
AvailabilityZoneBalance?: InferenceComponentAvailabilityZoneBalance | undefined;
|
|
3242
|
+
}
|
|
3185
3243
|
/**
|
|
3186
3244
|
* <p>Settings that take effect while the model container starts up.</p>
|
|
3187
3245
|
* @public
|
|
@@ -3233,6 +3291,11 @@ export interface InferenceComponentSpecification {
|
|
|
3233
3291
|
* @public
|
|
3234
3292
|
*/
|
|
3235
3293
|
DataCacheConfig?: InferenceComponentDataCacheConfig | undefined;
|
|
3294
|
+
/**
|
|
3295
|
+
* <p>The scheduling configuration that determines how inference component copies are placed across available instances when copies are added or removed.</p>
|
|
3296
|
+
* @public
|
|
3297
|
+
*/
|
|
3298
|
+
SchedulingConfig?: InferenceComponentSchedulingConfig | undefined;
|
|
3236
3299
|
}
|
|
3237
3300
|
/**
|
|
3238
3301
|
* @public
|
|
@@ -6904,94 +6967,3 @@ export interface S3FileSystem {
|
|
|
6904
6967
|
*/
|
|
6905
6968
|
S3Uri: string | undefined;
|
|
6906
6969
|
}
|
|
6907
|
-
/**
|
|
6908
|
-
* <p>A file system, created by you, that you assign to a user profile or space for an Amazon SageMaker AI Domain. Permitted users can access this file system in Amazon SageMaker AI Studio.</p>
|
|
6909
|
-
* @public
|
|
6910
|
-
*/
|
|
6911
|
-
export type CustomFileSystem = CustomFileSystem.EFSFileSystemMember | CustomFileSystem.FSxLustreFileSystemMember | CustomFileSystem.S3FileSystemMember | CustomFileSystem.$UnknownMember;
|
|
6912
|
-
/**
|
|
6913
|
-
* @public
|
|
6914
|
-
*/
|
|
6915
|
-
export declare namespace CustomFileSystem {
|
|
6916
|
-
/**
|
|
6917
|
-
* <p>A custom file system in Amazon EFS.</p>
|
|
6918
|
-
* @public
|
|
6919
|
-
*/
|
|
6920
|
-
interface EFSFileSystemMember {
|
|
6921
|
-
EFSFileSystem: EFSFileSystem;
|
|
6922
|
-
FSxLustreFileSystem?: never;
|
|
6923
|
-
S3FileSystem?: never;
|
|
6924
|
-
$unknown?: never;
|
|
6925
|
-
}
|
|
6926
|
-
/**
|
|
6927
|
-
* <p>A custom file system in Amazon FSx for Lustre.</p>
|
|
6928
|
-
* @public
|
|
6929
|
-
*/
|
|
6930
|
-
interface FSxLustreFileSystemMember {
|
|
6931
|
-
EFSFileSystem?: never;
|
|
6932
|
-
FSxLustreFileSystem: FSxLustreFileSystem;
|
|
6933
|
-
S3FileSystem?: never;
|
|
6934
|
-
$unknown?: never;
|
|
6935
|
-
}
|
|
6936
|
-
/**
|
|
6937
|
-
* <p>A custom file system in Amazon S3. This is only supported in Amazon SageMaker Unified Studio.</p>
|
|
6938
|
-
* @public
|
|
6939
|
-
*/
|
|
6940
|
-
interface S3FileSystemMember {
|
|
6941
|
-
EFSFileSystem?: never;
|
|
6942
|
-
FSxLustreFileSystem?: never;
|
|
6943
|
-
S3FileSystem: S3FileSystem;
|
|
6944
|
-
$unknown?: never;
|
|
6945
|
-
}
|
|
6946
|
-
/**
|
|
6947
|
-
* @public
|
|
6948
|
-
*/
|
|
6949
|
-
interface $UnknownMember {
|
|
6950
|
-
EFSFileSystem?: never;
|
|
6951
|
-
FSxLustreFileSystem?: never;
|
|
6952
|
-
S3FileSystem?: never;
|
|
6953
|
-
$unknown: [string, any];
|
|
6954
|
-
}
|
|
6955
|
-
/**
|
|
6956
|
-
* @deprecated unused in schema-serde mode.
|
|
6957
|
-
*
|
|
6958
|
-
*/
|
|
6959
|
-
interface Visitor<T> {
|
|
6960
|
-
EFSFileSystem: (value: EFSFileSystem) => T;
|
|
6961
|
-
FSxLustreFileSystem: (value: FSxLustreFileSystem) => T;
|
|
6962
|
-
S3FileSystem: (value: S3FileSystem) => T;
|
|
6963
|
-
_: (name: string, value: any) => T;
|
|
6964
|
-
}
|
|
6965
|
-
}
|
|
6966
|
-
/**
|
|
6967
|
-
* <p>The settings for the JupyterLab application within a space.</p>
|
|
6968
|
-
* @public
|
|
6969
|
-
*/
|
|
6970
|
-
export interface SpaceJupyterLabAppSettings {
|
|
6971
|
-
/**
|
|
6972
|
-
* <p>Specifies the ARN's of a SageMaker AI image and SageMaker AI image version, and the instance type that the version runs on.</p> <note> <p>When both <code>SageMakerImageVersionArn</code> and <code>SageMakerImageArn</code> are passed, <code>SageMakerImageVersionArn</code> is used. Any updates to <code>SageMakerImageArn</code> will not take effect if <code>SageMakerImageVersionArn</code> already exists in the <code>ResourceSpec</code> because <code>SageMakerImageVersionArn</code> always takes precedence. To clear the value set for <code>SageMakerImageVersionArn</code>, pass <code>None</code> as the value.</p> </note>
|
|
6973
|
-
* @public
|
|
6974
|
-
*/
|
|
6975
|
-
DefaultResourceSpec?: ResourceSpec | undefined;
|
|
6976
|
-
/**
|
|
6977
|
-
* <p>A list of Git repositories that SageMaker automatically displays to users for cloning in the JupyterLab application.</p>
|
|
6978
|
-
* @public
|
|
6979
|
-
*/
|
|
6980
|
-
CodeRepositories?: CodeRepository[] | undefined;
|
|
6981
|
-
/**
|
|
6982
|
-
* <p>Settings that are used to configure and manage the lifecycle of JupyterLab applications in a space.</p>
|
|
6983
|
-
* @public
|
|
6984
|
-
*/
|
|
6985
|
-
AppLifecycleManagement?: SpaceAppLifecycleManagement | undefined;
|
|
6986
|
-
}
|
|
6987
|
-
/**
|
|
6988
|
-
* <p>A collection of EBS storage settings that apply to both private and shared spaces.</p>
|
|
6989
|
-
* @public
|
|
6990
|
-
*/
|
|
6991
|
-
export interface EbsStorageSettings {
|
|
6992
|
-
/**
|
|
6993
|
-
* <p>The size of an EBS storage volume for a space.</p>
|
|
6994
|
-
* @public
|
|
6995
|
-
*/
|
|
6996
|
-
EbsVolumeSizeInGb: number | undefined;
|
|
6997
|
-
}
|