sagemaker-core 1.0.14__py3-none-any.whl → 1.0.16__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of sagemaker-core might be problematic. Click here for more details.

@@ -1263,6 +1263,7 @@ SHAPE_DAG = {
1263
1263
  "type": "list",
1264
1264
  },
1265
1265
  {"name": "OnStartDeepHealthChecks", "shape": "OnStartDeepHealthChecks", "type": "list"},
1266
+ {"name": "OverrideVpcConfig", "shape": "VpcConfig", "type": "structure"},
1266
1267
  ],
1267
1268
  "type": "structure",
1268
1269
  },
@@ -1285,6 +1286,7 @@ SHAPE_DAG = {
1285
1286
  "type": "list",
1286
1287
  },
1287
1288
  {"name": "OnStartDeepHealthChecks", "shape": "OnStartDeepHealthChecks", "type": "list"},
1289
+ {"name": "OverrideVpcConfig", "shape": "VpcConfig", "type": "structure"},
1288
1290
  ],
1289
1291
  "type": "structure",
1290
1292
  },
@@ -1337,6 +1339,7 @@ SHAPE_DAG = {
1337
1339
  {"name": "InstanceType", "shape": "ClusterInstanceType", "type": "string"},
1338
1340
  {"name": "LaunchTime", "shape": "Timestamp", "type": "timestamp"},
1339
1341
  {"name": "LifeCycleConfig", "shape": "ClusterLifeCycleConfig", "type": "structure"},
1342
+ {"name": "OverrideVpcConfig", "shape": "VpcConfig", "type": "structure"},
1340
1343
  {"name": "ThreadsPerCore", "shape": "ClusterThreadsPerCore", "type": "integer"},
1341
1344
  {
1342
1345
  "name": "InstanceStorageConfigs",
@@ -7360,6 +7363,11 @@ SHAPE_DAG = {
7360
7363
  "shape": "InferenceComponentComputeResourceRequirements",
7361
7364
  "type": "structure",
7362
7365
  },
7366
+ {
7367
+ "name": "BaseInferenceComponentName",
7368
+ "shape": "InferenceComponentName",
7369
+ "type": "string",
7370
+ },
7363
7371
  ],
7364
7372
  "type": "structure",
7365
7373
  },
@@ -7381,6 +7389,11 @@ SHAPE_DAG = {
7381
7389
  "shape": "InferenceComponentComputeResourceRequirements",
7382
7390
  "type": "structure",
7383
7391
  },
7392
+ {
7393
+ "name": "BaseInferenceComponentName",
7394
+ "shape": "InferenceComponentName",
7395
+ "type": "string",
7396
+ },
7384
7397
  ],
7385
7398
  "type": "structure",
7386
7399
  },
@@ -10457,6 +10470,17 @@ SHAPE_DAG = {
10457
10470
  ],
10458
10471
  "type": "structure",
10459
10472
  },
10473
+ "ModelShardingConfig": {
10474
+ "members": [
10475
+ {"name": "Image", "shape": "OptimizationContainerImage", "type": "string"},
10476
+ {
10477
+ "name": "OverrideEnvironment",
10478
+ "shape": "OptimizationJobEnvironmentVariables",
10479
+ "type": "map",
10480
+ },
10481
+ ],
10482
+ "type": "structure",
10483
+ },
10460
10484
  "ModelStepMetadata": {
10461
10485
  "members": [{"name": "Arn", "shape": "String256", "type": "string"}],
10462
10486
  "type": "structure",
@@ -11060,6 +11084,7 @@ SHAPE_DAG = {
11060
11084
  "shape": "ModelCompilationConfig",
11061
11085
  "type": "structure",
11062
11086
  },
11087
+ {"name": "ModelShardingConfig", "shape": "ModelShardingConfig", "type": "structure"},
11063
11088
  ],
11064
11089
  "type": "structure",
11065
11090
  },
@@ -13786,9 +13786,9 @@ class InferenceComponent(Base):
13786
13786
  cls,
13787
13787
  inference_component_name: str,
13788
13788
  endpoint_name: Union[str, object],
13789
- variant_name: str,
13790
13789
  specification: InferenceComponentSpecification,
13791
- runtime_config: InferenceComponentRuntimeConfig,
13790
+ variant_name: Optional[str] = Unassigned(),
13791
+ runtime_config: Optional[InferenceComponentRuntimeConfig] = Unassigned(),
13792
13792
  tags: Optional[List[Tag]] = Unassigned(),
13793
13793
  session: Optional[Session] = None,
13794
13794
  region: Optional[str] = None,
@@ -13799,8 +13799,8 @@ class InferenceComponent(Base):
13799
13799
  Parameters:
13800
13800
  inference_component_name: A unique name to assign to the inference component.
13801
13801
  endpoint_name: The name of an existing endpoint where you host the inference component.
13802
- variant_name: The name of an existing production variant where you host the inference component.
13803
13802
  specification: Details about the resources to deploy with this inference component, including the model, container, and compute resources.
13803
+ variant_name: The name of an existing production variant where you host the inference component.
13804
13804
  runtime_config: Runtime settings for a model that is deployed with an inference component.
13805
13805
  tags: A list of key-value pairs associated with the model. For more information, see Tagging Amazon Web Services resources in the Amazon Web Services General Reference.
13806
13806
  session: Boto3 session.
@@ -3140,6 +3140,7 @@ class ClusterInstanceGroupDetails(Base):
3140
3140
  threads_per_core: The number you specified to ThreadsPerCore in CreateCluster for enabling or disabling multithreading. For instance types that support multithreading, you can specify 1 for disabling multithreading and 2 for enabling multithreading. For more information, see the reference table of CPU cores and threads per CPU core per instance type in the Amazon Elastic Compute Cloud User Guide.
3141
3141
  instance_storage_configs: The additional storage configurations for the instances in the SageMaker HyperPod cluster instance group.
3142
3142
  on_start_deep_health_checks: A flag indicating whether deep health checks should be performed when the cluster instance group is created or updated.
3143
+ override_vpc_config
3143
3144
  """
3144
3145
 
3145
3146
  current_count: Optional[int] = Unassigned()
@@ -3151,6 +3152,7 @@ class ClusterInstanceGroupDetails(Base):
3151
3152
  threads_per_core: Optional[int] = Unassigned()
3152
3153
  instance_storage_configs: Optional[List[ClusterInstanceStorageConfig]] = Unassigned()
3153
3154
  on_start_deep_health_checks: Optional[List[str]] = Unassigned()
3155
+ override_vpc_config: Optional[VpcConfig] = Unassigned()
3154
3156
 
3155
3157
 
3156
3158
  class ClusterInstanceGroupSpecification(Base):
@@ -3168,6 +3170,7 @@ class ClusterInstanceGroupSpecification(Base):
3168
3170
  threads_per_core: Specifies the value for Threads per core. For instance types that support multithreading, you can specify 1 for disabling multithreading and 2 for enabling multithreading. For instance types that don't support multithreading, specify 1. For more information, see the reference table of CPU cores and threads per CPU core per instance type in the Amazon Elastic Compute Cloud User Guide.
3169
3171
  instance_storage_configs: Specifies the additional storage configurations for the instances in the SageMaker HyperPod cluster instance group.
3170
3172
  on_start_deep_health_checks: A flag indicating whether deep health checks should be performed when the cluster instance group is created or updated.
3173
+ override_vpc_config
3171
3174
  """
3172
3175
 
3173
3176
  instance_count: int
@@ -3178,6 +3181,7 @@ class ClusterInstanceGroupSpecification(Base):
3178
3181
  threads_per_core: Optional[int] = Unassigned()
3179
3182
  instance_storage_configs: Optional[List[ClusterInstanceStorageConfig]] = Unassigned()
3180
3183
  on_start_deep_health_checks: Optional[List[str]] = Unassigned()
3184
+ override_vpc_config: Optional[VpcConfig] = Unassigned()
3181
3185
 
3182
3186
 
3183
3187
  class ClusterInstancePlacement(Base):
@@ -3223,6 +3227,7 @@ class ClusterNodeDetails(Base):
3223
3227
  instance_type: The type of the instance.
3224
3228
  launch_time: The time when the instance is launched.
3225
3229
  life_cycle_config: The LifeCycle configuration applied to the instance.
3230
+ override_vpc_config
3226
3231
  threads_per_core: The number of threads per CPU core you specified under CreateCluster.
3227
3232
  instance_storage_configs: The configurations of additional storage specified to the instance group where the instance (node) is launched.
3228
3233
  private_primary_ip: The private primary IP address of the SageMaker HyperPod cluster node.
@@ -3236,6 +3241,7 @@ class ClusterNodeDetails(Base):
3236
3241
  instance_type: Optional[str] = Unassigned()
3237
3242
  launch_time: Optional[datetime.datetime] = Unassigned()
3238
3243
  life_cycle_config: Optional[ClusterLifeCycleConfig] = Unassigned()
3244
+ override_vpc_config: Optional[VpcConfig] = Unassigned()
3239
3245
  threads_per_core: Optional[int] = Unassigned()
3240
3246
  instance_storage_configs: Optional[List[ClusterInstanceStorageConfig]] = Unassigned()
3241
3247
  private_primary_ip: Optional[str] = Unassigned()
@@ -5324,7 +5330,7 @@ class InferenceComponentStartupParameters(Base):
5324
5330
  class InferenceComponentComputeResourceRequirements(Base):
5325
5331
  """
5326
5332
  InferenceComponentComputeResourceRequirements
5327
- Defines the compute resources to allocate to run a model that you assign to an inference component. These resources include CPU cores, accelerators, and memory.
5333
+ Defines the compute resources to allocate to run a model, plus any adapter models, that you assign to an inference component. These resources include CPU cores, accelerators, and memory.
5328
5334
 
5329
5335
  Attributes
5330
5336
  ----------------------
@@ -5350,13 +5356,17 @@ class InferenceComponentSpecification(Base):
5350
5356
  model_name: The name of an existing SageMaker model object in your account that you want to deploy with the inference component.
5351
5357
  container: Defines a container that provides the runtime environment for a model that you deploy with an inference component.
5352
5358
  startup_parameters: Settings that take effect while the model container starts up.
5353
- compute_resource_requirements: The compute resources allocated to run the model assigned to the inference component.
5359
+ compute_resource_requirements: The compute resources allocated to run the model, plus any adapter models, that you assign to the inference component. Omit this parameter if your request is meant to create an adapter inference component. An adapter inference component is loaded by a base inference component, and it uses the compute resources of the base inference component.
5360
+ base_inference_component_name: The name of an existing inference component that is to contain the inference component that you're creating with your request. Specify this parameter only if your request is meant to create an adapter inference component. An adapter inference component contains the path to an adapter model. The purpose of the adapter model is to tailor the inference output of a base foundation model, which is hosted by the base inference component. The adapter inference component uses the compute resources that you assigned to the base inference component. When you create an adapter inference component, use the Container parameter to specify the location of the adapter artifacts. In the parameter value, use the ArtifactUrl parameter of the InferenceComponentContainerSpecification data type. Before you can create an adapter inference component, you must have an existing inference component that contains the foundation model that you want to adapt.
5354
5361
  """
5355
5362
 
5356
- compute_resource_requirements: InferenceComponentComputeResourceRequirements
5357
5363
  model_name: Optional[Union[str, object]] = Unassigned()
5358
5364
  container: Optional[InferenceComponentContainerSpecification] = Unassigned()
5359
5365
  startup_parameters: Optional[InferenceComponentStartupParameters] = Unassigned()
5366
+ compute_resource_requirements: Optional[InferenceComponentComputeResourceRequirements] = (
5367
+ Unassigned()
5368
+ )
5369
+ base_inference_component_name: Optional[str] = Unassigned()
5360
5370
 
5361
5371
 
5362
5372
  class InferenceComponentRuntimeConfig(Base):
@@ -6629,6 +6639,21 @@ class ModelCompilationConfig(Base):
6629
6639
  override_environment: Optional[Dict[str, str]] = Unassigned()
6630
6640
 
6631
6641
 
6642
+ class ModelShardingConfig(Base):
6643
+ """
6644
+ ModelShardingConfig
6645
+ Settings for the model sharding technique that's applied by a model optimization job.
6646
+
6647
+ Attributes
6648
+ ----------------------
6649
+ image: The URI of an LMI DLC in Amazon ECR. SageMaker uses this image to run the optimization.
6650
+ override_environment: Environment variables that override the default ones in the model container.
6651
+ """
6652
+
6653
+ image: Optional[str] = Unassigned()
6654
+ override_environment: Optional[Dict[str, str]] = Unassigned()
6655
+
6656
+
6632
6657
  class OptimizationConfig(Base):
6633
6658
  """
6634
6659
  OptimizationConfig
@@ -6638,10 +6663,12 @@ class OptimizationConfig(Base):
6638
6663
  ----------------------
6639
6664
  model_quantization_config: Settings for the model quantization technique that's applied by a model optimization job.
6640
6665
  model_compilation_config: Settings for the model compilation technique that's applied by a model optimization job.
6666
+ model_sharding_config: Settings for the model sharding technique that's applied by a model optimization job.
6641
6667
  """
6642
6668
 
6643
6669
  model_quantization_config: Optional[ModelQuantizationConfig] = Unassigned()
6644
6670
  model_compilation_config: Optional[ModelCompilationConfig] = Unassigned()
6671
+ model_sharding_config: Optional[ModelShardingConfig] = Unassigned()
6645
6672
 
6646
6673
 
6647
6674
  class OptimizationJobOutputConfig(Base):
@@ -8113,7 +8140,8 @@ class InferenceComponentSpecificationSummary(Base):
8113
8140
  model_name: The name of the SageMaker model object that is deployed with the inference component.
8114
8141
  container: Details about the container that provides the runtime environment for the model that is deployed with the inference component.
8115
8142
  startup_parameters: Settings that take effect while the model container starts up.
8116
- compute_resource_requirements: The compute resources allocated to run the model assigned to the inference component.
8143
+ compute_resource_requirements: The compute resources allocated to run the model, plus any adapter models, that you assign to the inference component.
8144
+ base_inference_component_name: The name of the base inference component that contains this inference component.
8117
8145
  """
8118
8146
 
8119
8147
  model_name: Optional[Union[str, object]] = Unassigned()
@@ -8122,6 +8150,7 @@ class InferenceComponentSpecificationSummary(Base):
8122
8150
  compute_resource_requirements: Optional[InferenceComponentComputeResourceRequirements] = (
8123
8151
  Unassigned()
8124
8152
  )
8153
+ base_inference_component_name: Optional[str] = Unassigned()
8125
8154
 
8126
8155
 
8127
8156
  class InferenceComponentRuntimeConfigSummary(Base):
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: sagemaker-core
3
- Version: 1.0.14
3
+ Version: 1.0.16
4
4
  Summary: An python package for sagemaker core functionalities
5
5
  Author-email: AWS <sagemaker-interests@amazon.com>
6
6
  Project-URL: Repository, https://github.com/aws/sagemaker-core.git
@@ -15,19 +15,19 @@ Classifier: Programming Language :: Python :: 3.12
15
15
  Requires-Python: >=3.8
16
16
  Description-Content-Type: text/x-rst
17
17
  License-File: LICENSE
18
- Requires-Dist: boto3 <2.0.0,>=1.34.0
19
- Requires-Dist: pydantic <3.0.0,>=1.7.0
20
- Requires-Dist: PyYAML <7.0,>=6.0
21
- Requires-Dist: jsonschema <5.0.0
22
- Requires-Dist: platformdirs <5.0.0,>=4.0.0
23
- Requires-Dist: rich <14.0.0,>=13.0.0
24
- Requires-Dist: mock <5.0,>4.0
25
- Requires-Dist: importlib-metadata <7.0,>=1.4.0
18
+ Requires-Dist: boto3<2.0.0,>=1.34.0
19
+ Requires-Dist: pydantic<3.0.0,>=2.0.0
20
+ Requires-Dist: PyYAML<7.0,>=6.0
21
+ Requires-Dist: jsonschema<5.0.0
22
+ Requires-Dist: platformdirs<5.0.0,>=4.0.0
23
+ Requires-Dist: rich<14.0.0,>=13.0.0
24
+ Requires-Dist: mock<5.0,>4.0
25
+ Requires-Dist: importlib-metadata<7.0,>=1.4.0
26
26
  Provides-Extra: codegen
27
- Requires-Dist: black <25.0.0,>=24.3.0 ; extra == 'codegen'
28
- Requires-Dist: pandas <3.0.0,>=2.0.0 ; extra == 'codegen'
29
- Requires-Dist: pytest <9.0.0,>=8.0.0 ; extra == 'codegen'
30
- Requires-Dist: pylint <4.0.0,>=3.0.0 ; extra == 'codegen'
27
+ Requires-Dist: black<25.0.0,>=24.3.0; extra == "codegen"
28
+ Requires-Dist: pandas<3.0.0,>=2.0.0; extra == "codegen"
29
+ Requires-Dist: pytest<9.0.0,>=8.0.0; extra == "codegen"
30
+ Requires-Dist: pylint<4.0.0,>=3.0.0; extra == "codegen"
31
31
 
32
32
  .. image:: https://github.com/aws/sagemaker-python-sdk/raw/master/branding/icon/sagemaker-banner.png
33
33
  :height: 100px
@@ -7,15 +7,15 @@ sagemaker_core/main/config_schema.py,sha256=TeGoTobT4yotEVyfguLF0IdKYlOymsDZ45yS
7
7
  sagemaker_core/main/exceptions.py,sha256=87DUlrmHxaWoiYNlpNY9ixxFMPRk_dIGPsA2e_xdVwQ,5602
8
8
  sagemaker_core/main/intelligent_defaults_helper.py,sha256=5SDM6UavZtp-k5LhqRL7GRIDgzFB5UsC_p7YuiSPK9A,8334
9
9
  sagemaker_core/main/logs.py,sha256=yfEH7uP91nbE1lefymOlBr81ziBzsDSIOF2Qyd54FJE,6241
10
- sagemaker_core/main/resources.py,sha256=idwGeRbSSO7Acwtd0y_zOkIxOrMlJvwxx-gL0k7GlS8,1323921
11
- sagemaker_core/main/shapes.py,sha256=Vge1sJb41xqpOFdCnzl8JNdIOwPflgr0Ioy2IKhP01g,699286
10
+ sagemaker_core/main/resources.py,sha256=FZZrBi0q2mDraCsRFNohUeAJMpt8wnyqmu05gVJG3sI,1323971
11
+ sagemaker_core/main/shapes.py,sha256=qKNfazplYk4w9PDYLlG0WLD4WDb3b_SFvcrZ84qVmIw,701824
12
12
  sagemaker_core/main/user_agent.py,sha256=4sZybDXkzRoZnOnVDQ8p8zFTfiRJdsH7amDWInVQ4xU,2708
13
13
  sagemaker_core/main/utils.py,sha256=LCFDM6oxf6_e1i-_Dgtkm3ehl7YfoEpJ2kTTFTL6iOU,18471
14
14
  sagemaker_core/main/code_injection/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
15
15
  sagemaker_core/main/code_injection/base.py,sha256=11_Jif0nOzfbLGlXaacKf-wcizzfS64U0OSZGoVffFU,1733
16
16
  sagemaker_core/main/code_injection/codec.py,sha256=2DjmeD2uND307UqDefvVEpE0rZ8yfFU3Bi3TvQCQveI,7658
17
17
  sagemaker_core/main/code_injection/constants.py,sha256=2ICExGge8vAWx7lSTW0JGh-bH1korkvpOpDu5M63eI4,980
18
- sagemaker_core/main/code_injection/shape_dag.py,sha256=Akn-5sH0T8ujXuiXEOJtq5agJuRk-tKoFP04qwFx-NM,660663
18
+ sagemaker_core/main/code_injection/shape_dag.py,sha256=2FAuvJCSOQc3MaU7nQi0SnTkdNDYUBZ81ve9BcOJeSk,661711
19
19
  sagemaker_core/resources/__init__.py,sha256=EAYTFMN-nPjnPjjBbhIUeaL67FLKNPd7qbcbl9VIrws,31
20
20
  sagemaker_core/shapes/__init__.py,sha256=RnbIu9eTxKt-DNsOFJabrWIgrrtS9_SdAozP9JBl_ic,28
21
21
  sagemaker_core/tools/__init__.py,sha256=xX79JImxCVzrWMnjgntLCve2G5I-R4pRar5s20kT9Rs,56
@@ -28,8 +28,8 @@ sagemaker_core/tools/resources_extractor.py,sha256=hN61ehZbPnhFW-2FIVDi7NsEz4rLv
28
28
  sagemaker_core/tools/shapes_codegen.py,sha256=_ve959bwH8usZ6dPlpXxi2on9t0hLpcmhRWnaWHCWMQ,11745
29
29
  sagemaker_core/tools/shapes_extractor.py,sha256=4KjgDmhlPM4G1f1NeYbORKlXs1s7Q_sm_NK31S_ROQ0,11950
30
30
  sagemaker_core/tools/templates.py,sha256=yX2RQKeClgYwKS5Qu_mDpnWJIBCuj0yELrdm95aiTpk,23262
31
- sagemaker_core-1.0.14.dist-info/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
32
- sagemaker_core-1.0.14.dist-info/METADATA,sha256=626z-hexHS0uj3CGQtc_f02Obevywo2OdAUISjfogz8,4878
33
- sagemaker_core-1.0.14.dist-info/WHEEL,sha256=R06PA3UVYHThwHvxuRWMqaGcr-PuniXahwjmQRFMEkY,91
34
- sagemaker_core-1.0.14.dist-info/top_level.txt,sha256=R3GAZZ1zC5JxqdE_0x2Lu_WYi2Xfke7VsiP3L5zngfA,15
35
- sagemaker_core-1.0.14.dist-info/RECORD,,
31
+ sagemaker_core-1.0.16.dist-info/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
32
+ sagemaker_core-1.0.16.dist-info/METADATA,sha256=SR6taP7cmz3IMYc5EaF8ThhHuwvAAG5PYfgtyFVVYfw,4862
33
+ sagemaker_core-1.0.16.dist-info/WHEEL,sha256=PZUExdf71Ui_so67QXpySuHtCi3-J3wvF4ORK6k_S8U,91
34
+ sagemaker_core-1.0.16.dist-info/top_level.txt,sha256=R3GAZZ1zC5JxqdE_0x2Lu_WYi2Xfke7VsiP3L5zngfA,15
35
+ sagemaker_core-1.0.16.dist-info/RECORD,,
@@ -1,5 +1,5 @@
1
1
  Wheel-Version: 1.0
2
- Generator: setuptools (75.5.0)
2
+ Generator: setuptools (75.6.0)
3
3
  Root-Is-Purelib: true
4
4
  Tag: py3-none-any
5
5