sagemaker-core 1.0.3__py3-none-any.whl → 1.0.5__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of sagemaker-core might be problematic. Click here for more details.
- sagemaker_core/main/code_injection/shape_dag.py +180 -2
- sagemaker_core/main/resources.py +457 -158
- sagemaker_core/main/shapes.py +405 -170
- sagemaker_core/main/utils.py +22 -37
- sagemaker_core/tools/constants.py +4 -0
- sagemaker_core/tools/data_extractor.py +20 -3
- sagemaker_core/tools/resources_codegen.py +2 -197
- sagemaker_core/tools/resources_extractor.py +1 -1
- sagemaker_core/tools/templates.py +1 -72
- {sagemaker_core-1.0.3.dist-info → sagemaker_core-1.0.5.dist-info}/METADATA +1 -1
- {sagemaker_core-1.0.3.dist-info → sagemaker_core-1.0.5.dist-info}/RECORD +14 -14
- {sagemaker_core-1.0.3.dist-info → sagemaker_core-1.0.5.dist-info}/WHEEL +1 -1
- {sagemaker_core-1.0.3.dist-info → sagemaker_core-1.0.5.dist-info}/LICENSE +0 -0
- {sagemaker_core-1.0.3.dist-info → sagemaker_core-1.0.5.dist-info}/top_level.txt +0 -0
sagemaker_core/main/shapes.py
CHANGED
|
@@ -21,6 +21,381 @@ class Base(BaseModel):
|
|
|
21
21
|
model_config = ConfigDict(protected_namespaces=(), validate_assignment=True, extra="forbid")
|
|
22
22
|
|
|
23
23
|
|
|
24
|
+
class InternalDependencyException(Base):
|
|
25
|
+
"""
|
|
26
|
+
InternalDependencyException
|
|
27
|
+
Your request caused an exception with an internal dependency. Contact customer support.
|
|
28
|
+
|
|
29
|
+
Attributes
|
|
30
|
+
----------------------
|
|
31
|
+
message
|
|
32
|
+
"""
|
|
33
|
+
|
|
34
|
+
message: Optional[str] = Unassigned()
|
|
35
|
+
|
|
36
|
+
|
|
37
|
+
class InternalFailure(Base):
|
|
38
|
+
"""
|
|
39
|
+
InternalFailure
|
|
40
|
+
An internal failure occurred. Try your request again. If the problem persists, contact Amazon Web Services customer support.
|
|
41
|
+
|
|
42
|
+
Attributes
|
|
43
|
+
----------------------
|
|
44
|
+
message
|
|
45
|
+
"""
|
|
46
|
+
|
|
47
|
+
message: Optional[str] = Unassigned()
|
|
48
|
+
|
|
49
|
+
|
|
50
|
+
class InternalStreamFailure(Base):
|
|
51
|
+
"""
|
|
52
|
+
InternalStreamFailure
|
|
53
|
+
The stream processing failed because of an unknown error, exception or failure. Try your request again.
|
|
54
|
+
|
|
55
|
+
Attributes
|
|
56
|
+
----------------------
|
|
57
|
+
message
|
|
58
|
+
"""
|
|
59
|
+
|
|
60
|
+
message: Optional[str] = Unassigned()
|
|
61
|
+
|
|
62
|
+
|
|
63
|
+
class InvokeEndpointAsyncOutput(Base):
|
|
64
|
+
"""
|
|
65
|
+
InvokeEndpointAsyncOutput
|
|
66
|
+
|
|
67
|
+
Attributes
|
|
68
|
+
----------------------
|
|
69
|
+
inference_id: Identifier for an inference request. This will be the same as the InferenceId specified in the input. Amazon SageMaker will generate an identifier for you if you do not specify one.
|
|
70
|
+
output_location: The Amazon S3 URI where the inference response payload is stored.
|
|
71
|
+
failure_location: The Amazon S3 URI where the inference failure response payload is stored.
|
|
72
|
+
"""
|
|
73
|
+
|
|
74
|
+
inference_id: Optional[str] = Unassigned()
|
|
75
|
+
output_location: Optional[str] = Unassigned()
|
|
76
|
+
failure_location: Optional[str] = Unassigned()
|
|
77
|
+
|
|
78
|
+
|
|
79
|
+
class InvokeEndpointOutput(Base):
|
|
80
|
+
"""
|
|
81
|
+
InvokeEndpointOutput
|
|
82
|
+
|
|
83
|
+
Attributes
|
|
84
|
+
----------------------
|
|
85
|
+
body: Includes the inference provided by the model. For information about the format of the response body, see Common Data Formats-Inference. If the explainer is activated, the body includes the explanations provided by the model. For more information, see the Response section under Invoke the Endpoint in the Developer Guide.
|
|
86
|
+
content_type: The MIME type of the inference returned from the model container.
|
|
87
|
+
invoked_production_variant: Identifies the production variant that was invoked.
|
|
88
|
+
custom_attributes: Provides additional information in the response about the inference returned by a model hosted at an Amazon SageMaker endpoint. The information is an opaque value that is forwarded verbatim. You could use this value, for example, to return an ID received in the CustomAttributes header of a request or other metadata that a service endpoint was programmed to produce. The value must consist of no more than 1024 visible US-ASCII characters as specified in Section 3.3.6. Field Value Components of the Hypertext Transfer Protocol (HTTP/1.1). If the customer wants the custom attribute returned, the model must set the custom attribute to be included on the way back. The code in your model is responsible for setting or updating any custom attributes in the response. If your code does not set this value in the response, an empty value is returned. For example, if a custom attribute represents the trace ID, your model can prepend the custom attribute with Trace ID: in your post-processing function. This feature is currently supported in the Amazon Web Services SDKs but not in the Amazon SageMaker Python SDK.
|
|
89
|
+
new_session_id: If you created a stateful session with your request, the ID and expiration time that the model assigns to that session.
|
|
90
|
+
closed_session_id: If you closed a stateful session with your request, the ID of that session.
|
|
91
|
+
"""
|
|
92
|
+
|
|
93
|
+
body: Any
|
|
94
|
+
content_type: Optional[str] = Unassigned()
|
|
95
|
+
invoked_production_variant: Optional[str] = Unassigned()
|
|
96
|
+
custom_attributes: Optional[str] = Unassigned()
|
|
97
|
+
new_session_id: Optional[str] = Unassigned()
|
|
98
|
+
closed_session_id: Optional[str] = Unassigned()
|
|
99
|
+
|
|
100
|
+
|
|
101
|
+
class PayloadPart(Base):
|
|
102
|
+
"""
|
|
103
|
+
PayloadPart
|
|
104
|
+
A wrapper for pieces of the payload that's returned in response to a streaming inference request. A streaming inference response consists of one or more payload parts.
|
|
105
|
+
|
|
106
|
+
Attributes
|
|
107
|
+
----------------------
|
|
108
|
+
bytes: A blob that contains part of the response for your streaming inference request.
|
|
109
|
+
"""
|
|
110
|
+
|
|
111
|
+
bytes: Optional[Any] = Unassigned()
|
|
112
|
+
|
|
113
|
+
|
|
114
|
+
class ModelStreamError(Base):
|
|
115
|
+
"""
|
|
116
|
+
ModelStreamError
|
|
117
|
+
An error occurred while streaming the response body. This error can have the following error codes: ModelInvocationTimeExceeded The model failed to finish sending the response within the timeout period allowed by Amazon SageMaker. StreamBroken The Transmission Control Protocol (TCP) connection between the client and the model was reset or closed.
|
|
118
|
+
|
|
119
|
+
Attributes
|
|
120
|
+
----------------------
|
|
121
|
+
message
|
|
122
|
+
error_code: This error can have the following error codes: ModelInvocationTimeExceeded The model failed to finish sending the response within the timeout period allowed by Amazon SageMaker. StreamBroken The Transmission Control Protocol (TCP) connection between the client and the model was reset or closed.
|
|
123
|
+
"""
|
|
124
|
+
|
|
125
|
+
message: Optional[str] = Unassigned()
|
|
126
|
+
error_code: Optional[str] = Unassigned()
|
|
127
|
+
|
|
128
|
+
|
|
129
|
+
class ResponseStream(Base):
|
|
130
|
+
"""
|
|
131
|
+
ResponseStream
|
|
132
|
+
A stream of payload parts. Each part contains a portion of the response for a streaming inference request.
|
|
133
|
+
|
|
134
|
+
Attributes
|
|
135
|
+
----------------------
|
|
136
|
+
payload_part: A wrapper for pieces of the payload that's returned in response to a streaming inference request. A streaming inference response consists of one or more payload parts.
|
|
137
|
+
model_stream_error: An error occurred while streaming the response body. This error can have the following error codes: ModelInvocationTimeExceeded The model failed to finish sending the response within the timeout period allowed by Amazon SageMaker. StreamBroken The Transmission Control Protocol (TCP) connection between the client and the model was reset or closed.
|
|
138
|
+
internal_stream_failure: The stream processing failed because of an unknown error, exception or failure. Try your request again.
|
|
139
|
+
"""
|
|
140
|
+
|
|
141
|
+
payload_part: Optional[PayloadPart] = Unassigned()
|
|
142
|
+
model_stream_error: Optional[ModelStreamError] = Unassigned()
|
|
143
|
+
internal_stream_failure: Optional[InternalStreamFailure] = Unassigned()
|
|
144
|
+
|
|
145
|
+
|
|
146
|
+
class InvokeEndpointWithResponseStreamOutput(Base):
|
|
147
|
+
"""
|
|
148
|
+
InvokeEndpointWithResponseStreamOutput
|
|
149
|
+
|
|
150
|
+
Attributes
|
|
151
|
+
----------------------
|
|
152
|
+
body
|
|
153
|
+
content_type: The MIME type of the inference returned from the model container.
|
|
154
|
+
invoked_production_variant: Identifies the production variant that was invoked.
|
|
155
|
+
custom_attributes: Provides additional information in the response about the inference returned by a model hosted at an Amazon SageMaker endpoint. The information is an opaque value that is forwarded verbatim. You could use this value, for example, to return an ID received in the CustomAttributes header of a request or other metadata that a service endpoint was programmed to produce. The value must consist of no more than 1024 visible US-ASCII characters as specified in Section 3.3.6. Field Value Components of the Hypertext Transfer Protocol (HTTP/1.1). If the customer wants the custom attribute returned, the model must set the custom attribute to be included on the way back. The code in your model is responsible for setting or updating any custom attributes in the response. If your code does not set this value in the response, an empty value is returned. For example, if a custom attribute represents the trace ID, your model can prepend the custom attribute with Trace ID: in your post-processing function. This feature is currently supported in the Amazon Web Services SDKs but not in the Amazon SageMaker Python SDK.
|
|
156
|
+
"""
|
|
157
|
+
|
|
158
|
+
body: ResponseStream
|
|
159
|
+
content_type: Optional[str] = Unassigned()
|
|
160
|
+
invoked_production_variant: Optional[str] = Unassigned()
|
|
161
|
+
custom_attributes: Optional[str] = Unassigned()
|
|
162
|
+
|
|
163
|
+
|
|
164
|
+
class ModelError(Base):
|
|
165
|
+
"""
|
|
166
|
+
ModelError
|
|
167
|
+
Model (owned by the customer in the container) returned 4xx or 5xx error code.
|
|
168
|
+
|
|
169
|
+
Attributes
|
|
170
|
+
----------------------
|
|
171
|
+
message
|
|
172
|
+
original_status_code: Original status code.
|
|
173
|
+
original_message: Original message.
|
|
174
|
+
log_stream_arn: The Amazon Resource Name (ARN) of the log stream.
|
|
175
|
+
"""
|
|
176
|
+
|
|
177
|
+
message: Optional[str] = Unassigned()
|
|
178
|
+
original_status_code: Optional[int] = Unassigned()
|
|
179
|
+
original_message: Optional[str] = Unassigned()
|
|
180
|
+
log_stream_arn: Optional[str] = Unassigned()
|
|
181
|
+
|
|
182
|
+
|
|
183
|
+
class ModelNotReadyException(Base):
|
|
184
|
+
"""
|
|
185
|
+
ModelNotReadyException
|
|
186
|
+
Either a serverless endpoint variant's resources are still being provisioned, or a multi-model endpoint is still downloading or loading the target model. Wait and try your request again.
|
|
187
|
+
|
|
188
|
+
Attributes
|
|
189
|
+
----------------------
|
|
190
|
+
message
|
|
191
|
+
"""
|
|
192
|
+
|
|
193
|
+
message: Optional[str] = Unassigned()
|
|
194
|
+
|
|
195
|
+
|
|
196
|
+
class ServiceUnavailable(Base):
|
|
197
|
+
"""
|
|
198
|
+
ServiceUnavailable
|
|
199
|
+
The service is currently unavailable.
|
|
200
|
+
|
|
201
|
+
Attributes
|
|
202
|
+
----------------------
|
|
203
|
+
message
|
|
204
|
+
"""
|
|
205
|
+
|
|
206
|
+
message: Optional[str] = Unassigned()
|
|
207
|
+
|
|
208
|
+
|
|
209
|
+
class ValidationError(Base):
|
|
210
|
+
"""
|
|
211
|
+
ValidationError
|
|
212
|
+
There was an error validating your request.
|
|
213
|
+
|
|
214
|
+
Attributes
|
|
215
|
+
----------------------
|
|
216
|
+
message
|
|
217
|
+
"""
|
|
218
|
+
|
|
219
|
+
message: Optional[str] = Unassigned()
|
|
220
|
+
|
|
221
|
+
|
|
222
|
+
class AccessForbidden(Base):
|
|
223
|
+
"""
|
|
224
|
+
AccessForbidden
|
|
225
|
+
You do not have permission to perform an action.
|
|
226
|
+
|
|
227
|
+
Attributes
|
|
228
|
+
----------------------
|
|
229
|
+
message
|
|
230
|
+
"""
|
|
231
|
+
|
|
232
|
+
message: Optional[str] = Unassigned()
|
|
233
|
+
|
|
234
|
+
|
|
235
|
+
class BatchGetRecordError(Base):
|
|
236
|
+
"""
|
|
237
|
+
BatchGetRecordError
|
|
238
|
+
The error that has occurred when attempting to retrieve a batch of Records.
|
|
239
|
+
|
|
240
|
+
Attributes
|
|
241
|
+
----------------------
|
|
242
|
+
feature_group_name: The name of the feature group that the record belongs to.
|
|
243
|
+
record_identifier_value_as_string: The value for the RecordIdentifier in string format of a Record from a FeatureGroup that is causing an error when attempting to be retrieved.
|
|
244
|
+
error_code: The error code of an error that has occurred when attempting to retrieve a batch of Records. For more information on errors, see Errors.
|
|
245
|
+
error_message: The error message of an error that has occurred when attempting to retrieve a record in the batch.
|
|
246
|
+
"""
|
|
247
|
+
|
|
248
|
+
feature_group_name: Union[str, object]
|
|
249
|
+
record_identifier_value_as_string: str
|
|
250
|
+
error_code: str
|
|
251
|
+
error_message: str
|
|
252
|
+
|
|
253
|
+
|
|
254
|
+
class BatchGetRecordIdentifier(Base):
|
|
255
|
+
"""
|
|
256
|
+
BatchGetRecordIdentifier
|
|
257
|
+
The identifier that identifies the batch of Records you are retrieving in a batch.
|
|
258
|
+
|
|
259
|
+
Attributes
|
|
260
|
+
----------------------
|
|
261
|
+
feature_group_name: The name or Amazon Resource Name (ARN) of the FeatureGroup containing the records you are retrieving in a batch.
|
|
262
|
+
record_identifiers_value_as_string: The value for a list of record identifiers in string format.
|
|
263
|
+
feature_names: List of names of Features to be retrieved. If not specified, the latest value for all the Features are returned.
|
|
264
|
+
"""
|
|
265
|
+
|
|
266
|
+
feature_group_name: Union[str, object]
|
|
267
|
+
record_identifiers_value_as_string: List[str]
|
|
268
|
+
feature_names: Optional[List[str]] = Unassigned()
|
|
269
|
+
|
|
270
|
+
|
|
271
|
+
class FeatureValue(Base):
|
|
272
|
+
"""
|
|
273
|
+
FeatureValue
|
|
274
|
+
The value associated with a feature.
|
|
275
|
+
|
|
276
|
+
Attributes
|
|
277
|
+
----------------------
|
|
278
|
+
feature_name: The name of a feature that a feature value corresponds to.
|
|
279
|
+
value_as_string: The value in string format associated with a feature. Used when your CollectionType is None. Note that features types can be String, Integral, or Fractional. This value represents all three types as a string.
|
|
280
|
+
value_as_string_list: The list of values in string format associated with a feature. Used when your CollectionType is a List, Set, or Vector. Note that features types can be String, Integral, or Fractional. These values represents all three types as a string.
|
|
281
|
+
"""
|
|
282
|
+
|
|
283
|
+
feature_name: str
|
|
284
|
+
value_as_string: Optional[str] = Unassigned()
|
|
285
|
+
value_as_string_list: Optional[List[str]] = Unassigned()
|
|
286
|
+
|
|
287
|
+
|
|
288
|
+
class BatchGetRecordResultDetail(Base):
|
|
289
|
+
"""
|
|
290
|
+
BatchGetRecordResultDetail
|
|
291
|
+
The output of records that have been retrieved in a batch.
|
|
292
|
+
|
|
293
|
+
Attributes
|
|
294
|
+
----------------------
|
|
295
|
+
feature_group_name: The FeatureGroupName containing Records you retrieved in a batch.
|
|
296
|
+
record_identifier_value_as_string: The value of the record identifier in string format.
|
|
297
|
+
record: The Record retrieved.
|
|
298
|
+
expires_at: The ExpiresAt ISO string of the requested record.
|
|
299
|
+
"""
|
|
300
|
+
|
|
301
|
+
feature_group_name: Union[str, object]
|
|
302
|
+
record_identifier_value_as_string: str
|
|
303
|
+
record: List[FeatureValue]
|
|
304
|
+
expires_at: Optional[str] = Unassigned()
|
|
305
|
+
|
|
306
|
+
|
|
307
|
+
class BatchGetRecordResponse(Base):
|
|
308
|
+
"""
|
|
309
|
+
BatchGetRecordResponse
|
|
310
|
+
|
|
311
|
+
Attributes
|
|
312
|
+
----------------------
|
|
313
|
+
records: A list of Records you requested to be retrieved in batch.
|
|
314
|
+
errors: A list of errors that have occurred when retrieving a batch of Records.
|
|
315
|
+
unprocessed_identifiers: A unprocessed list of FeatureGroup names, with their corresponding RecordIdentifier value, and Feature name.
|
|
316
|
+
"""
|
|
317
|
+
|
|
318
|
+
records: List[BatchGetRecordResultDetail]
|
|
319
|
+
errors: List[BatchGetRecordError]
|
|
320
|
+
unprocessed_identifiers: List[BatchGetRecordIdentifier]
|
|
321
|
+
|
|
322
|
+
|
|
323
|
+
class GetRecordResponse(Base):
|
|
324
|
+
"""
|
|
325
|
+
GetRecordResponse
|
|
326
|
+
|
|
327
|
+
Attributes
|
|
328
|
+
----------------------
|
|
329
|
+
record: The record you requested. A list of FeatureValues.
|
|
330
|
+
expires_at: The ExpiresAt ISO string of the requested record.
|
|
331
|
+
"""
|
|
332
|
+
|
|
333
|
+
record: Optional[List[FeatureValue]] = Unassigned()
|
|
334
|
+
expires_at: Optional[str] = Unassigned()
|
|
335
|
+
|
|
336
|
+
|
|
337
|
+
class TtlDuration(Base):
|
|
338
|
+
"""
|
|
339
|
+
TtlDuration
|
|
340
|
+
Time to live duration, where the record is hard deleted after the expiration time is reached; ExpiresAt = EventTime + TtlDuration. For information on HardDelete, see the DeleteRecord API in the Amazon SageMaker API Reference guide.
|
|
341
|
+
|
|
342
|
+
Attributes
|
|
343
|
+
----------------------
|
|
344
|
+
unit: TtlDuration time unit.
|
|
345
|
+
value: TtlDuration time value.
|
|
346
|
+
"""
|
|
347
|
+
|
|
348
|
+
unit: Optional[str] = Unassigned()
|
|
349
|
+
value: Optional[int] = Unassigned()
|
|
350
|
+
|
|
351
|
+
|
|
352
|
+
class ResourceNotFound(Base):
|
|
353
|
+
"""
|
|
354
|
+
ResourceNotFound
|
|
355
|
+
Resource being access is not found.
|
|
356
|
+
|
|
357
|
+
Attributes
|
|
358
|
+
----------------------
|
|
359
|
+
message
|
|
360
|
+
"""
|
|
361
|
+
|
|
362
|
+
message: Optional[str] = Unassigned()
|
|
363
|
+
|
|
364
|
+
|
|
365
|
+
class BatchPutMetricsError(Base):
|
|
366
|
+
"""
|
|
367
|
+
BatchPutMetricsError
|
|
368
|
+
An error that occured when putting the metric data.
|
|
369
|
+
|
|
370
|
+
Attributes
|
|
371
|
+
----------------------
|
|
372
|
+
code: The error code of an error that occured when attempting to put metrics. METRIC_LIMIT_EXCEEDED: The maximum amount of metrics per resource is exceeded. INTERNAL_ERROR: An internal error occured. VALIDATION_ERROR: The metric data failed validation. CONFLICT_ERROR: Multiple requests attempted to modify the same data simultaneously.
|
|
373
|
+
metric_index: An index that corresponds to the metric in the request.
|
|
374
|
+
"""
|
|
375
|
+
|
|
376
|
+
code: Optional[str] = Unassigned()
|
|
377
|
+
metric_index: Optional[int] = Unassigned()
|
|
378
|
+
|
|
379
|
+
|
|
380
|
+
class RawMetricData(Base):
|
|
381
|
+
"""
|
|
382
|
+
RawMetricData
|
|
383
|
+
The raw metric data to associate with the resource.
|
|
384
|
+
|
|
385
|
+
Attributes
|
|
386
|
+
----------------------
|
|
387
|
+
metric_name: The name of the metric.
|
|
388
|
+
timestamp: The time that the metric was recorded.
|
|
389
|
+
step: The metric step (epoch).
|
|
390
|
+
value: The metric value.
|
|
391
|
+
"""
|
|
392
|
+
|
|
393
|
+
metric_name: str
|
|
394
|
+
timestamp: datetime.datetime
|
|
395
|
+
value: float
|
|
396
|
+
step: Optional[int] = Unassigned()
|
|
397
|
+
|
|
398
|
+
|
|
24
399
|
class ActionSource(Base):
|
|
25
400
|
"""
|
|
26
401
|
ActionSource
|
|
@@ -2675,6 +3050,7 @@ class ClusterInstanceGroupDetails(Base):
|
|
|
2675
3050
|
execution_role: The execution role for the instance group to assume.
|
|
2676
3051
|
threads_per_core: The number you specified to TreadsPerCore in CreateCluster for enabling or disabling multithreading. For instance types that support multithreading, you can specify 1 for disabling multithreading and 2 for enabling multithreading. For more information, see the reference table of CPU cores and threads per CPU core per instance type in the Amazon Elastic Compute Cloud User Guide.
|
|
2677
3052
|
instance_storage_configs: The additional storage configurations for the instances in the SageMaker HyperPod cluster instance group.
|
|
3053
|
+
on_start_deep_health_checks: A flag indicating whether deep health checks should be performed when the cluster instance group is created or updated.
|
|
2678
3054
|
"""
|
|
2679
3055
|
|
|
2680
3056
|
current_count: Optional[int] = Unassigned()
|
|
@@ -2685,6 +3061,7 @@ class ClusterInstanceGroupDetails(Base):
|
|
|
2685
3061
|
execution_role: Optional[str] = Unassigned()
|
|
2686
3062
|
threads_per_core: Optional[int] = Unassigned()
|
|
2687
3063
|
instance_storage_configs: Optional[List[ClusterInstanceStorageConfig]] = Unassigned()
|
|
3064
|
+
on_start_deep_health_checks: Optional[List[str]] = Unassigned()
|
|
2688
3065
|
|
|
2689
3066
|
|
|
2690
3067
|
class ClusterInstanceGroupSpecification(Base):
|
|
@@ -2701,6 +3078,7 @@ class ClusterInstanceGroupSpecification(Base):
|
|
|
2701
3078
|
execution_role: Specifies an IAM execution role to be assumed by the instance group.
|
|
2702
3079
|
threads_per_core: Specifies the value for Threads per core. For instance types that support multithreading, you can specify 1 for disabling multithreading and 2 for enabling multithreading. For instance types that doesn't support multithreading, specify 1. For more information, see the reference table of CPU cores and threads per CPU core per instance type in the Amazon Elastic Compute Cloud User Guide.
|
|
2703
3080
|
instance_storage_configs: Specifies the additional storage configurations for the instances in the SageMaker HyperPod cluster instance group.
|
|
3081
|
+
on_start_deep_health_checks: A flag indicating whether deep health checks should be performed when the cluster instance group is created or updated.
|
|
2704
3082
|
"""
|
|
2705
3083
|
|
|
2706
3084
|
instance_count: int
|
|
@@ -2710,6 +3088,7 @@ class ClusterInstanceGroupSpecification(Base):
|
|
|
2710
3088
|
execution_role: str
|
|
2711
3089
|
threads_per_core: Optional[int] = Unassigned()
|
|
2712
3090
|
instance_storage_configs: Optional[List[ClusterInstanceStorageConfig]] = Unassigned()
|
|
3091
|
+
on_start_deep_health_checks: Optional[List[str]] = Unassigned()
|
|
2713
3092
|
|
|
2714
3093
|
|
|
2715
3094
|
class ClusterInstancePlacement(Base):
|
|
@@ -2796,6 +3175,32 @@ class ClusterNodeSummary(Base):
|
|
|
2796
3175
|
instance_status: ClusterInstanceStatusDetails
|
|
2797
3176
|
|
|
2798
3177
|
|
|
3178
|
+
class ClusterOrchestratorEksConfig(Base):
|
|
3179
|
+
"""
|
|
3180
|
+
ClusterOrchestratorEksConfig
|
|
3181
|
+
The configuration settings for the Amazon EKS cluster used as the orchestrator for the SageMaker HyperPod cluster.
|
|
3182
|
+
|
|
3183
|
+
Attributes
|
|
3184
|
+
----------------------
|
|
3185
|
+
cluster_arn: The Amazon Resource Name (ARN) of the Amazon EKS cluster associated with the SageMaker HyperPod cluster.
|
|
3186
|
+
"""
|
|
3187
|
+
|
|
3188
|
+
cluster_arn: str
|
|
3189
|
+
|
|
3190
|
+
|
|
3191
|
+
class ClusterOrchestrator(Base):
|
|
3192
|
+
"""
|
|
3193
|
+
ClusterOrchestrator
|
|
3194
|
+
The type of orchestrator used for the SageMaker HyperPod cluster.
|
|
3195
|
+
|
|
3196
|
+
Attributes
|
|
3197
|
+
----------------------
|
|
3198
|
+
eks: The Amazon EKS cluster used as the orchestrator for the SageMaker HyperPod cluster.
|
|
3199
|
+
"""
|
|
3200
|
+
|
|
3201
|
+
eks: ClusterOrchestratorEksConfig
|
|
3202
|
+
|
|
3203
|
+
|
|
2799
3204
|
class ClusterSummary(Base):
|
|
2800
3205
|
"""
|
|
2801
3206
|
ClusterSummary
|
|
@@ -4268,21 +4673,6 @@ class OnlineStoreSecurityConfig(Base):
|
|
|
4268
4673
|
kms_key_id: Optional[str] = Unassigned()
|
|
4269
4674
|
|
|
4270
4675
|
|
|
4271
|
-
class TtlDuration(Base):
|
|
4272
|
-
"""
|
|
4273
|
-
TtlDuration
|
|
4274
|
-
Time to live duration, where the record is hard deleted after the expiration time is reached; ExpiresAt = EventTime + TtlDuration. For information on HardDelete, see the DeleteRecord API in the Amazon SageMaker API Reference guide.
|
|
4275
|
-
|
|
4276
|
-
Attributes
|
|
4277
|
-
----------------------
|
|
4278
|
-
unit: TtlDuration time unit.
|
|
4279
|
-
value: TtlDuration time value.
|
|
4280
|
-
"""
|
|
4281
|
-
|
|
4282
|
-
unit: Optional[str] = Unassigned()
|
|
4283
|
-
value: Optional[int] = Unassigned()
|
|
4284
|
-
|
|
4285
|
-
|
|
4286
4676
|
class OnlineStoreConfig(Base):
|
|
4287
4677
|
"""
|
|
4288
4678
|
OnlineStoreConfig
|
|
@@ -11228,19 +11618,6 @@ class ResourceLimitExceeded(Base):
|
|
|
11228
11618
|
message: Optional[str] = Unassigned()
|
|
11229
11619
|
|
|
11230
11620
|
|
|
11231
|
-
class ResourceNotFound(Base):
|
|
11232
|
-
"""
|
|
11233
|
-
ResourceNotFound
|
|
11234
|
-
Resource being access is not found.
|
|
11235
|
-
|
|
11236
|
-
Attributes
|
|
11237
|
-
----------------------
|
|
11238
|
-
message
|
|
11239
|
-
"""
|
|
11240
|
-
|
|
11241
|
-
message: Optional[str] = Unassigned()
|
|
11242
|
-
|
|
11243
|
-
|
|
11244
11621
|
class SearchExpression(Base):
|
|
11245
11622
|
"""
|
|
11246
11623
|
SearchExpression
|
|
@@ -11574,145 +11951,3 @@ class VariantProperty(Base):
|
|
|
11574
11951
|
"""
|
|
11575
11952
|
|
|
11576
11953
|
variant_property_type: str
|
|
11577
|
-
|
|
11578
|
-
|
|
11579
|
-
class InternalDependencyException(Base):
|
|
11580
|
-
"""
|
|
11581
|
-
InternalDependencyException
|
|
11582
|
-
Your request caused an exception with an internal dependency. Contact customer support.
|
|
11583
|
-
|
|
11584
|
-
Attributes
|
|
11585
|
-
----------------------
|
|
11586
|
-
message
|
|
11587
|
-
"""
|
|
11588
|
-
|
|
11589
|
-
message: Optional[str] = Unassigned()
|
|
11590
|
-
|
|
11591
|
-
|
|
11592
|
-
class InternalFailure(Base):
|
|
11593
|
-
"""
|
|
11594
|
-
InternalFailure
|
|
11595
|
-
An internal failure occurred.
|
|
11596
|
-
|
|
11597
|
-
Attributes
|
|
11598
|
-
----------------------
|
|
11599
|
-
message
|
|
11600
|
-
"""
|
|
11601
|
-
|
|
11602
|
-
message: Optional[str] = Unassigned()
|
|
11603
|
-
|
|
11604
|
-
|
|
11605
|
-
class InternalStreamFailure(Base):
|
|
11606
|
-
"""
|
|
11607
|
-
InternalStreamFailure
|
|
11608
|
-
The stream processing failed because of an unknown error, exception or failure. Try your request again.
|
|
11609
|
-
|
|
11610
|
-
Attributes
|
|
11611
|
-
----------------------
|
|
11612
|
-
message
|
|
11613
|
-
"""
|
|
11614
|
-
|
|
11615
|
-
message: Optional[str] = Unassigned()
|
|
11616
|
-
|
|
11617
|
-
|
|
11618
|
-
class PayloadPart(Base):
|
|
11619
|
-
"""
|
|
11620
|
-
PayloadPart
|
|
11621
|
-
A wrapper for pieces of the payload that's returned in response to a streaming inference request. A streaming inference response consists of one or more payload parts.
|
|
11622
|
-
|
|
11623
|
-
Attributes
|
|
11624
|
-
----------------------
|
|
11625
|
-
bytes: A blob that contains part of the response for your streaming inference request.
|
|
11626
|
-
"""
|
|
11627
|
-
|
|
11628
|
-
bytes: Optional[Any] = Unassigned()
|
|
11629
|
-
|
|
11630
|
-
|
|
11631
|
-
class ModelStreamError(Base):
|
|
11632
|
-
"""
|
|
11633
|
-
ModelStreamError
|
|
11634
|
-
An error occurred while streaming the response body. This error can have the following error codes: ModelInvocationTimeExceeded The model failed to finish sending the response within the timeout period allowed by Amazon SageMaker. StreamBroken The Transmission Control Protocol (TCP) connection between the client and the model was reset or closed.
|
|
11635
|
-
|
|
11636
|
-
Attributes
|
|
11637
|
-
----------------------
|
|
11638
|
-
message
|
|
11639
|
-
error_code: This error can have the following error codes: ModelInvocationTimeExceeded The model failed to finish sending the response within the timeout period allowed by Amazon SageMaker. StreamBroken The Transmission Control Protocol (TCP) connection between the client and the model was reset or closed.
|
|
11640
|
-
"""
|
|
11641
|
-
|
|
11642
|
-
message: Optional[str] = Unassigned()
|
|
11643
|
-
error_code: Optional[str] = Unassigned()
|
|
11644
|
-
|
|
11645
|
-
|
|
11646
|
-
class ResponseStream(Base):
|
|
11647
|
-
"""
|
|
11648
|
-
ResponseStream
|
|
11649
|
-
A stream of payload parts. Each part contains a portion of the response for a streaming inference request.
|
|
11650
|
-
|
|
11651
|
-
Attributes
|
|
11652
|
-
----------------------
|
|
11653
|
-
payload_part: A wrapper for pieces of the payload that's returned in response to a streaming inference request. A streaming inference response consists of one or more payload parts.
|
|
11654
|
-
model_stream_error: An error occurred while streaming the response body. This error can have the following error codes: ModelInvocationTimeExceeded The model failed to finish sending the response within the timeout period allowed by Amazon SageMaker. StreamBroken The Transmission Control Protocol (TCP) connection between the client and the model was reset or closed.
|
|
11655
|
-
internal_stream_failure: The stream processing failed because of an unknown error, exception or failure. Try your request again.
|
|
11656
|
-
"""
|
|
11657
|
-
|
|
11658
|
-
payload_part: Optional[PayloadPart] = Unassigned()
|
|
11659
|
-
model_stream_error: Optional[ModelStreamError] = Unassigned()
|
|
11660
|
-
internal_stream_failure: Optional[InternalStreamFailure] = Unassigned()
|
|
11661
|
-
|
|
11662
|
-
|
|
11663
|
-
class ModelError(Base):
|
|
11664
|
-
"""
|
|
11665
|
-
ModelError
|
|
11666
|
-
Model (owned by the customer in the container) returned 4xx or 5xx error code.
|
|
11667
|
-
|
|
11668
|
-
Attributes
|
|
11669
|
-
----------------------
|
|
11670
|
-
message
|
|
11671
|
-
original_status_code: Original status code.
|
|
11672
|
-
original_message: Original message.
|
|
11673
|
-
log_stream_arn: The Amazon Resource Name (ARN) of the log stream.
|
|
11674
|
-
"""
|
|
11675
|
-
|
|
11676
|
-
message: Optional[str] = Unassigned()
|
|
11677
|
-
original_status_code: Optional[int] = Unassigned()
|
|
11678
|
-
original_message: Optional[str] = Unassigned()
|
|
11679
|
-
log_stream_arn: Optional[str] = Unassigned()
|
|
11680
|
-
|
|
11681
|
-
|
|
11682
|
-
class ModelNotReadyException(Base):
|
|
11683
|
-
"""
|
|
11684
|
-
ModelNotReadyException
|
|
11685
|
-
Either a serverless endpoint variant's resources are still being provisioned, or a multi-model endpoint is still downloading or loading the target model. Wait and try your request again.
|
|
11686
|
-
|
|
11687
|
-
Attributes
|
|
11688
|
-
----------------------
|
|
11689
|
-
message
|
|
11690
|
-
"""
|
|
11691
|
-
|
|
11692
|
-
message: Optional[str] = Unassigned()
|
|
11693
|
-
|
|
11694
|
-
|
|
11695
|
-
class ServiceUnavailable(Base):
|
|
11696
|
-
"""
|
|
11697
|
-
ServiceUnavailable
|
|
11698
|
-
The service is unavailable. Try your call again.
|
|
11699
|
-
|
|
11700
|
-
Attributes
|
|
11701
|
-
----------------------
|
|
11702
|
-
message
|
|
11703
|
-
"""
|
|
11704
|
-
|
|
11705
|
-
message: Optional[str] = Unassigned()
|
|
11706
|
-
|
|
11707
|
-
|
|
11708
|
-
class ValidationError(Base):
|
|
11709
|
-
"""
|
|
11710
|
-
ValidationError
|
|
11711
|
-
Inspect your request and try again.
|
|
11712
|
-
|
|
11713
|
-
Attributes
|
|
11714
|
-
----------------------
|
|
11715
|
-
message
|
|
11716
|
-
"""
|
|
11717
|
-
|
|
11718
|
-
message: Optional[str] = Unassigned()
|