PyPI - gcore - Versions diffs - 0.3.0__py3-none-any.whl → 0.5.0__py3-none-any.whl - Mend

gcore-0.3.0-py3-none-any.whl → gcore-0.5.0-py3-none-any.whl

This diff shows the changes between two publicly available versions of a package, as released to one of the supported registries. It is provided for informational purposes only and reflects the package contents exactly as they appear in their respective public registries.

Potentially problematic release.

This version of gcore might be problematic. Click here for more details.

Files changed (226)

gcore/__init__.py +2 -1
gcore/_base_client.py +31 -2
gcore/_client.py +18 -0
gcore/_constants.py +2 -2
gcore/_models.py +8 -5
gcore/_version.py +1 -1
gcore/pagination.py +252 -1
gcore/resources/__init__.py +28 -0
gcore/resources/cloud/baremetal/flavors.py +11 -137
gcore/resources/cloud/baremetal/images.py +10 -12
gcore/resources/cloud/baremetal/servers.py +33 -30
gcore/resources/cloud/billing_reservations.py +2 -2
gcore/resources/cloud/file_shares/file_shares.py +7 -8
gcore/resources/cloud/floating_ips.py +7 -12
gcore/resources/cloud/gpu_baremetal_clusters/gpu_baremetal_clusters.py +33 -22
gcore/resources/cloud/gpu_baremetal_clusters/images.py +9 -10
gcore/resources/cloud/gpu_baremetal_clusters/interfaces.py +2 -2
gcore/resources/cloud/gpu_baremetal_clusters/servers.py +8 -4
gcore/resources/cloud/inference/deployments/deployments.py +76 -35
gcore/resources/cloud/inference/deployments/logs.py +7 -7
gcore/resources/cloud/inference/inference.py +5 -5
gcore/resources/cloud/inference/models.py +16 -15
gcore/resources/cloud/inference/registry_credentials.py +18 -18
gcore/resources/cloud/inference/secrets.py +12 -13
gcore/resources/cloud/instances/flavors.py +9 -233
gcore/resources/cloud/instances/images.py +47 -37
gcore/resources/cloud/instances/instances.py +49 -34
gcore/resources/cloud/instances/interfaces.py +2 -2
gcore/resources/cloud/ip_ranges.py +34 -2
gcore/resources/cloud/load_balancers/l7_policies/l7_policies.py +10 -2
gcore/resources/cloud/load_balancers/listeners.py +17 -8
gcore/resources/cloud/load_balancers/load_balancers.py +73 -21
gcore/resources/cloud/load_balancers/metrics.py +2 -2
gcore/resources/cloud/load_balancers/pools/health_monitors.py +2 -2
gcore/resources/cloud/load_balancers/pools/members.py +6 -2
gcore/resources/cloud/networks/networks.py +81 -17
gcore/resources/cloud/networks/routers.py +18 -18
gcore/resources/cloud/networks/subnets.py +51 -11
gcore/resources/cloud/projects.py +38 -24
gcore/resources/cloud/quotas/quotas.py +6 -6
gcore/resources/cloud/quotas/requests.py +8 -8
gcore/resources/cloud/registries/artifacts.py +4 -4
gcore/resources/cloud/registries/registries.py +14 -16
gcore/resources/cloud/registries/repositories.py +4 -4
gcore/resources/cloud/registries/tags.py +2 -2
gcore/resources/cloud/registries/users.py +21 -22
gcore/resources/cloud/reserved_fixed_ips/reserved_fixed_ips.py +20 -20
gcore/resources/cloud/reserved_fixed_ips/vip.py +10 -10
gcore/resources/cloud/secrets.py +14 -224
gcore/resources/cloud/security_groups/rules.py +6 -6
gcore/resources/cloud/security_groups/security_groups.py +70 -31
gcore/resources/cloud/tasks.py +34 -32
gcore/resources/cloud/users/role_assignments.py +12 -14
gcore/resources/cloud/volumes.py +139 -49
gcore/resources/fastedge/__init__.py +103 -0
gcore/resources/fastedge/apps/__init__.py +33 -0
gcore/resources/fastedge/apps/apps.py +932 -0
gcore/resources/fastedge/apps/logs.py +248 -0
gcore/resources/fastedge/binaries.py +286 -0
gcore/resources/fastedge/fastedge.py +327 -0
gcore/resources/fastedge/kv_stores.py +523 -0
gcore/resources/fastedge/secrets.py +687 -0
gcore/resources/fastedge/statistics.py +347 -0
gcore/resources/fastedge/templates.py +652 -0
gcore/resources/iam/__init__.py +47 -0
gcore/resources/iam/api_tokens.py +521 -0
gcore/resources/iam/iam.py +199 -0
gcore/resources/iam/users.py +642 -0
gcore/resources/waap/__init__.py +0 -14
gcore/resources/waap/waap.py +0 -32
gcore/types/cloud/__init__.py +2 -28
gcore/types/cloud/baremetal/__init__.py +0 -1
gcore/types/cloud/baremetal/image_list_params.py +1 -5
gcore/types/cloud/baremetal/server_create_params.py +5 -9
gcore/types/cloud/baremetal/server_list_params.py +1 -5
gcore/types/cloud/ddos_profile.py +9 -3
gcore/types/cloud/file_share_create_params.py +3 -5
gcore/types/cloud/floating_ip_create_params.py +2 -4
gcore/types/cloud/floating_ip_list_params.py +1 -5
gcore/types/cloud/gpu_baremetal_cluster_create_params.py +3 -4
gcore/types/cloud/gpu_baremetal_clusters/image_upload_params.py +2 -4
gcore/types/cloud/health_monitor.py +6 -1
gcore/types/cloud/inference/__init__.py +12 -8
gcore/types/cloud/inference/deployment_create_params.py +224 -7
gcore/types/cloud/inference/deployment_update_params.py +24 -3
gcore/types/cloud/inference/deployments/__init__.py +1 -0
gcore/types/cloud/inference/{inference_log.py → deployments/inference_deployment_log.py} +3 -3
gcore/types/cloud/inference/inference_deployment.py +266 -0
gcore/types/cloud/inference/{inference_apikey_secret.py → inference_deployment_api_key.py} +2 -2
gcore/types/cloud/inference/{mlcatalog_model_card.py → inference_model.py} +2 -2
gcore/types/cloud/inference/{inference_registry_credential.py → inference_registry_credentials.py} +2 -2
gcore/types/cloud/inference/{inference_registry_credential_full.py → inference_registry_credentials_create.py} +2 -2
gcore/types/cloud/inference/inference_secret.py +10 -3
gcore/types/cloud/inference/model_list_params.py +2 -4
gcore/types/cloud/{container_probe.py → inference/probe.py} +9 -9
gcore/types/cloud/{container_probe_config.py → inference/probe_config.py} +5 -5
gcore/types/cloud/{container_probe_exec.py → inference/probe_exec.py} +3 -3
gcore/types/cloud/{container_probe_http_get.py → inference/probe_http_get.py} +3 -3
gcore/types/cloud/{container_probe_tcp_socket.py → inference/probe_tcp_socket.py} +3 -3
gcore/types/cloud/inference/secret_create_params.py +10 -4
gcore/types/cloud/inference/secret_replace_params.py +10 -4
gcore/types/cloud/{region_capacity.py → inference_region_capacity.py} +10 -3
gcore/types/cloud/{region_capacity_list.py → inference_region_capacity_list.py} +4 -4
gcore/types/cloud/instance_create_params.py +8 -9
gcore/types/cloud/instance_list_params.py +1 -5
gcore/types/cloud/instances/__init__.py +0 -2
gcore/types/cloud/instances/image_create_from_volume_params.py +2 -4
gcore/types/cloud/instances/image_list_params.py +1 -5
gcore/types/cloud/instances/image_upload_params.py +2 -4
gcore/types/cloud/load_balancer_create_params.py +8 -4
gcore/types/cloud/load_balancer_list_params.py +1 -5
gcore/types/cloud/load_balancer_update_params.py +24 -0
gcore/types/cloud/load_balancers/pool_create_params.py +6 -1
gcore/types/cloud/load_balancers/pool_update_params.py +6 -1
gcore/types/cloud/load_balancers/pools/member_add_params.py +6 -1
gcore/types/cloud/member.py +6 -1
gcore/types/cloud/network_create_params.py +2 -3
gcore/types/cloud/network_list_params.py +4 -5
gcore/types/cloud/network_update_params.py +28 -2
gcore/types/cloud/networks/router_list_params.py +2 -2
gcore/types/cloud/networks/subnet_create_params.py +2 -3
gcore/types/cloud/networks/subnet_list_params.py +1 -5
gcore/types/cloud/networks/subnet_update_params.py +25 -0
gcore/types/cloud/registries/__init__.py +1 -0
gcore/types/cloud/registries/user_refresh_secret_response.py +31 -0
gcore/types/cloud/reserved_fixed_ip_list_params.py +2 -2
gcore/types/cloud/security_group_list_params.py +3 -7
gcore/types/cloud/security_group_update_params.py +25 -0
gcore/types/cloud/tag_update_map_param.py +2 -2
gcore/types/cloud/task_list_params.py +15 -14
gcore/types/cloud/volume_list_params.py +1 -5
gcore/types/cloud/volume_update_params.py +29 -3
gcore/types/fastedge/__init__.py +48 -0
gcore/types/fastedge/app.py +81 -0
gcore/types/fastedge/app_create_params.py +56 -0
gcore/types/fastedge/app_list_params.py +50 -0
gcore/types/fastedge/app_param.py +56 -0
gcore/types/fastedge/app_replace_params.py +17 -0
gcore/types/fastedge/app_short.py +60 -0
gcore/types/fastedge/app_update_params.py +56 -0
gcore/types/fastedge/apps/__init__.py +6 -0
gcore/types/fastedge/apps/log.py +28 -0
gcore/types/fastedge/apps/log_list_params.py +37 -0
gcore/types/fastedge/binary.py +40 -0
gcore/types/fastedge/binary_list_response.py +12 -0
gcore/types/fastedge/binary_short.py +32 -0
gcore/types/fastedge/call_status.py +24 -0
gcore/types/fastedge/client.py +57 -0
gcore/types/fastedge/duration_stats.py +30 -0
gcore/types/fastedge/kv_store.py +33 -0
gcore/types/fastedge/kv_store_create_params.py +23 -0
gcore/types/fastedge/kv_store_get_response.py +10 -0
gcore/types/fastedge/kv_store_list_params.py +12 -0
gcore/types/fastedge/kv_store_list_response.py +15 -0
gcore/types/fastedge/kv_store_replace_params.py +23 -0
gcore/types/fastedge/kv_store_short.py +19 -0
gcore/types/fastedge/kv_store_stats.py +26 -0
gcore/types/fastedge/secret.py +29 -0
gcore/types/fastedge/secret_create_params.py +27 -0
gcore/types/fastedge/secret_create_response.py +12 -0
gcore/types/fastedge/secret_delete_params.py +12 -0
gcore/types/fastedge/secret_list_params.py +15 -0
gcore/types/{cloud → fastedge}/secret_list_response.py +2 -6
gcore/types/fastedge/secret_replace_params.py +27 -0
gcore/types/fastedge/secret_short.py +21 -0
gcore/types/fastedge/secret_update_params.py +27 -0
gcore/types/fastedge/statistic_get_call_series_params.py +28 -0
gcore/types/fastedge/statistic_get_call_series_response.py +12 -0
gcore/types/fastedge/statistic_get_duration_series_params.py +28 -0
gcore/types/fastedge/statistic_get_duration_series_response.py +12 -0
gcore/types/fastedge/template.py +31 -0
gcore/types/fastedge/template_create_params.py +30 -0
gcore/types/fastedge/template_delete_params.py +12 -0
gcore/types/fastedge/template_list_params.py +25 -0
gcore/types/fastedge/template_parameter.py +22 -0
gcore/types/fastedge/template_parameter_param.py +21 -0
gcore/types/fastedge/template_replace_params.py +30 -0
gcore/types/fastedge/template_short.py +27 -0
gcore/types/iam/__init__.py +17 -0
gcore/types/iam/account_overview.py +488 -0
gcore/types/iam/api_token.py +78 -0
gcore/types/iam/api_token_create.py +15 -0
gcore/types/iam/api_token_create_params.py +42 -0
gcore/types/iam/api_token_list.py +81 -0
gcore/types/iam/api_token_list_params.py +41 -0
gcore/types/iam/user.py +86 -0
gcore/types/iam/user_detailed.py +104 -0
gcore/types/iam/user_invite.py +15 -0
gcore/types/iam/user_invite_params.py +37 -0
gcore/types/iam/user_list_params.py +15 -0
gcore/types/iam/user_update.py +104 -0
gcore/types/iam/user_update_params.py +52 -0
gcore/types/waap/__init__.py +0 -1
gcore/types/waap/domains/custom_rule_create_params.py +7 -3
gcore/types/waap/domains/custom_rule_update_params.py +7 -3
gcore/types/waap/waap_custom_rule.py +7 -3
{gcore-0.3.0.dist-info → gcore-0.5.0.dist-info}/METADATA +44 -5
{gcore-0.3.0.dist-info → gcore-0.5.0.dist-info}/RECORD +200 -151
gcore/resources/waap/clients.py +0 -135
gcore/types/cloud/aws_iam_data.py +0 -13
gcore/types/cloud/aws_iam_data_param.py +0 -15
gcore/types/cloud/baremetal/flavor_list_suitable_params.py +0 -22
gcore/types/cloud/capacity.py +0 -13
gcore/types/cloud/container_probe_config_create_param.py +0 -17
gcore/types/cloud/container_probe_create_param.py +0 -38
gcore/types/cloud/container_probe_exec_create_param.py +0 -13
gcore/types/cloud/container_probe_http_get_create_param.py +0 -25
gcore/types/cloud/container_probe_tcp_socket_create_param.py +0 -12
gcore/types/cloud/container_scale.py +0 -25
gcore/types/cloud/container_scale_trigger_rate.py +0 -13
gcore/types/cloud/container_scale_trigger_sqs.py +0 -33
gcore/types/cloud/container_scale_trigger_threshold.py +0 -10
gcore/types/cloud/container_scale_triggers.py +0 -36
gcore/types/cloud/deploy_status.py +0 -13
gcore/types/cloud/inference/container.py +0 -26
gcore/types/cloud/inference/inference.py +0 -95
gcore/types/cloud/inference/mlcatalog_order_by_choices.py +0 -7
gcore/types/cloud/inference_probes.py +0 -19
gcore/types/cloud/ingress_opts_out.py +0 -16
gcore/types/cloud/ingress_opts_param.py +0 -18
gcore/types/cloud/instances/flavor_list_for_resize_params.py +0 -16
gcore/types/cloud/instances/flavor_list_suitable_params.py +0 -59
gcore/types/cloud/secret_create_params.py +0 -66
gcore/types/waap/client_me_response.py +0 -34
{gcore-0.3.0.dist-info → gcore-0.5.0.dist-info}/WHEEL +0 -0
{gcore-0.3.0.dist-info → gcore-0.5.0.dist-info}/licenses/LICENSE +0 -0

gcore/resources/cloud/inference/deployments/deployments.py CHANGED Viewed

@@ -28,9 +28,8 @@ from .....pagination import SyncOffsetPage, AsyncOffsetPage
 from ....._base_client import AsyncPaginator, make_request_options
 from .....types.cloud.inference import deployment_list_params, deployment_create_params, deployment_update_params
 from .....types.cloud.task_id_list import TaskIDList
-from .....types.cloud.ingress_opts_param import IngressOptsParam
-from .....types.cloud.inference.inference import Inference
-from .....types.cloud.inference.inference_apikey_secret import InferenceApikeySecret
+from .....types.cloud.inference.inference_deployment import InferenceDeployment
+from .....types.cloud.inference.inference_deployment_api_key import InferenceDeploymentAPIKey
 __all__ = ["DeploymentsResource", "AsyncDeploymentsResource"]
@@ -68,12 +67,13 @@ class DeploymentsResource(SyncAPIResource):
         image: str,
         listening_port: int,
         name: str,
+        api_keys: List[str] | NotGiven = NOT_GIVEN,
         auth_enabled: bool | NotGiven = NOT_GIVEN,
         command: Optional[List[str]] | NotGiven = NOT_GIVEN,
         credentials_name: Optional[str] | NotGiven = NOT_GIVEN,
         description: Optional[str] | NotGiven = NOT_GIVEN,
         envs: Dict[str, str] | NotGiven = NOT_GIVEN,
-        ingress_opts: Optional[IngressOptsParam] | NotGiven = NOT_GIVEN,
+        ingress_opts: Optional[deployment_create_params.IngressOpts] | NotGiven = NOT_GIVEN,
         logging: Optional[deployment_create_params.Logging] | NotGiven = NOT_GIVEN,
         probes: Optional[deployment_create_params.Probes] | NotGiven = NOT_GIVEN,
         api_timeout: Optional[int] | NotGiven = NOT_GIVEN,
@@ -103,9 +103,15 @@ class DeploymentsResource(SyncAPIResource):
           name: Inference instance name.
+          api_keys: List of API keys for the inference instance. Multiple keys can be attached to
+              one deployment.If `auth_enabled` and `api_keys` are both specified, a
+              ValidationError will be raised.
           auth_enabled: Set to `true` to enable API key authentication for the inference instance.
               `"Authorization": "Bearer ****\\**"` or `"X-Api-Key": "****\\**"` header is required
-              for the requests to the instance if enabled
+              for the requests to the instance if enabled. This field is deprecated and will
+              be removed in the future. Use `api_keys` field instead.If `auth_enabled` and
+              `api_keys` are both specified, a ValidationError will be raised.
           command: Command to be executed when running a container from an image.
@@ -148,6 +154,7 @@ class DeploymentsResource(SyncAPIResource):
                     "image": image,
                     "listening_port": listening_port,
                     "name": name,
+                    "api_keys": api_keys,
                     "auth_enabled": auth_enabled,
                     "command": command,
                     "credentials_name": credentials_name,
@@ -171,6 +178,7 @@ class DeploymentsResource(SyncAPIResource):
         deployment_name: str,
         *,
         project_id: int | None = None,
+        api_keys: Optional[List[str]] | NotGiven = NOT_GIVEN,
         auth_enabled: bool | NotGiven = NOT_GIVEN,
         command: Optional[List[str]] | NotGiven = NOT_GIVEN,
         containers: Optional[Iterable[deployment_update_params.Container]] | NotGiven = NOT_GIVEN,
@@ -179,7 +187,7 @@ class DeploymentsResource(SyncAPIResource):
         envs: Optional[Dict[str, str]] | NotGiven = NOT_GIVEN,
         flavor_name: str | NotGiven = NOT_GIVEN,
         image: Optional[str] | NotGiven = NOT_GIVEN,
-        ingress_opts: Optional[IngressOptsParam] | NotGiven = NOT_GIVEN,
+        ingress_opts: Optional[deployment_update_params.IngressOpts] | NotGiven = NOT_GIVEN,
         listening_port: Optional[int] | NotGiven = NOT_GIVEN,
         logging: Optional[deployment_update_params.Logging] | NotGiven = NOT_GIVEN,
         probes: Optional[deployment_update_params.Probes] | NotGiven = NOT_GIVEN,
@@ -199,9 +207,16 @@ class DeploymentsResource(SyncAPIResource):
           deployment_name: Inference instance name.
+          api_keys: List of API keys for the inference instance. Multiple keys can be attached to
+              one deployment.If `auth_enabled` and `api_keys` are both specified, a
+              ValidationError will be raised.If `[]` is provided, the API keys will be removed
+              and auth will be disabled on the deployment.
           auth_enabled: Set to `true` to enable API key authentication for the inference instance.
               `"Authorization": "Bearer ****\\**"` or `"X-Api-Key": "****\\**"` header is required
-              for the requests to the instance if enabled
+              for the requests to the instance if enabled. This field is deprecated and will
+              be removed in the future. Use `api_keys` field instead.If `auth_enabled` and
+              `api_keys` are both specified, a ValidationError will be raised.
           command: Command to be executed when running a container from an image.
@@ -250,6 +265,7 @@ class DeploymentsResource(SyncAPIResource):
             f"/cloud/v3/inference/{project_id}/deployments/{deployment_name}",
             body=maybe_transform(
                 {
+                    "api_keys": api_keys,
                     "auth_enabled": auth_enabled,
                     "command": command,
                     "containers": containers,
@@ -284,7 +300,7 @@ class DeploymentsResource(SyncAPIResource):
         extra_query: Query | None = None,
         extra_body: Body | None = None,
         timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
-    ) -> SyncOffsetPage[Inference]:
+    ) -> SyncOffsetPage[InferenceDeployment]:
         """List inference deployments
         Args:
@@ -309,7 +325,7 @@ class DeploymentsResource(SyncAPIResource):
             project_id = self._client._get_cloud_project_id_path_param()
         return self._get_api_list(
             f"/cloud/v3/inference/{project_id}/deployments",
-            page=SyncOffsetPage[Inference],
+            page=SyncOffsetPage[InferenceDeployment],
             options=make_request_options(
                 extra_headers=extra_headers,
                 extra_query=extra_query,
@@ -323,7 +339,7 @@ class DeploymentsResource(SyncAPIResource):
                     deployment_list_params.DeploymentListParams,
                 ),
             ),
-            model=Inference,
+            model=InferenceDeployment,
         )
     def delete(
@@ -377,7 +393,7 @@ class DeploymentsResource(SyncAPIResource):
         extra_query: Query | None = None,
         extra_body: Body | None = None,
         timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
-    ) -> Inference:
+    ) -> InferenceDeployment:
         """
         Get inference deployment
@@ -403,7 +419,7 @@ class DeploymentsResource(SyncAPIResource):
             options=make_request_options(
                 extra_headers=extra_headers, extra_query=extra_query, extra_body=extra_body, timeout=timeout
             ),
-            cast_to=Inference,
+            cast_to=InferenceDeployment,
         )
     def get_api_key(
@@ -417,7 +433,7 @@ class DeploymentsResource(SyncAPIResource):
         extra_query: Query | None = None,
         extra_body: Body | None = None,
         timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
-    ) -> InferenceApikeySecret:
+    ) -> InferenceDeploymentAPIKey:
         """
         Get inference deployment API key
@@ -443,7 +459,7 @@ class DeploymentsResource(SyncAPIResource):
             options=make_request_options(
                 extra_headers=extra_headers, extra_query=extra_query, extra_body=extra_body, timeout=timeout
             ),
-            cast_to=InferenceApikeySecret,
+            cast_to=InferenceDeploymentAPIKey,
         )
     def start(
@@ -556,7 +572,7 @@ class DeploymentsResource(SyncAPIResource):
         credentials_name: Optional[str] | NotGiven = NOT_GIVEN,
         description: Optional[str] | NotGiven = NOT_GIVEN,
         envs: Dict[str, str] | NotGiven = NOT_GIVEN,
-        ingress_opts: Optional[IngressOptsParam] | NotGiven = NOT_GIVEN,
+        ingress_opts: Optional[deployment_create_params.IngressOpts] | NotGiven = NOT_GIVEN,
         logging: Optional[deployment_create_params.Logging] | NotGiven = NOT_GIVEN,
         probes: Optional[deployment_create_params.Probes] | NotGiven = NOT_GIVEN,
         api_timeout: Optional[int] | NotGiven = NOT_GIVEN,
@@ -567,7 +583,7 @@ class DeploymentsResource(SyncAPIResource):
         extra_headers: Headers | None = None,
         extra_query: Query | None = None,
         extra_body: Body | None = None,
-    ) -> Inference:
+    ) -> InferenceDeployment:
         response = self.create(
             project_id=project_id,
             containers=containers,
@@ -596,7 +612,11 @@ class DeploymentsResource(SyncAPIResource):
             extra_headers=extra_headers,
             polling_interval_seconds=polling_interval_seconds,
         )
-        if not task.created_resources or not task.created_resources.inference_instances or len(task.created_resources.inference_instances) != 1:
+        if (
+            not task.created_resources
+            or not task.created_resources.inference_instances
+            or len(task.created_resources.inference_instances) != 1
+        ):
             raise ValueError(f"Expected exactly one resource to be created in a task")
         return self.get(
             deployment_name=task.created_resources.inference_instances[0],
@@ -618,7 +638,7 @@ class DeploymentsResource(SyncAPIResource):
         envs: Optional[Dict[str, str]] | NotGiven = NOT_GIVEN,
         flavor_name: str | NotGiven = NOT_GIVEN,
         image: Optional[str] | NotGiven = NOT_GIVEN,
-        ingress_opts: Optional[IngressOptsParam] | NotGiven = NOT_GIVEN,
+        ingress_opts: Optional[deployment_update_params.IngressOpts] | NotGiven = NOT_GIVEN,
         listening_port: Optional[int] | NotGiven = NOT_GIVEN,
         logging: Optional[deployment_update_params.Logging] | NotGiven = NOT_GIVEN,
         probes: Optional[deployment_update_params.Probes] | NotGiven = NOT_GIVEN,
@@ -630,7 +650,7 @@ class DeploymentsResource(SyncAPIResource):
         extra_headers: Headers | None = None,
         extra_query: Query | None = None,
         extra_body: Body | None = None,
-    ) -> Inference:
+    ) -> InferenceDeployment:
         """
         Update inference deployment and poll for the result. Only the first task will be polled. If you need to poll more tasks, use the `tasks.poll` method.
         """
@@ -735,12 +755,13 @@ class AsyncDeploymentsResource(AsyncAPIResource):
         image: str,
         listening_port: int,
         name: str,
+        api_keys: List[str] | NotGiven = NOT_GIVEN,
         auth_enabled: bool | NotGiven = NOT_GIVEN,
         command: Optional[List[str]] | NotGiven = NOT_GIVEN,
         credentials_name: Optional[str] | NotGiven = NOT_GIVEN,
         description: Optional[str] | NotGiven = NOT_GIVEN,
         envs: Dict[str, str] | NotGiven = NOT_GIVEN,
-        ingress_opts: Optional[IngressOptsParam] | NotGiven = NOT_GIVEN,
+        ingress_opts: Optional[deployment_create_params.IngressOpts] | NotGiven = NOT_GIVEN,
         logging: Optional[deployment_create_params.Logging] | NotGiven = NOT_GIVEN,
         probes: Optional[deployment_create_params.Probes] | NotGiven = NOT_GIVEN,
         api_timeout: Optional[int] | NotGiven = NOT_GIVEN,
@@ -770,9 +791,15 @@ class AsyncDeploymentsResource(AsyncAPIResource):
           name: Inference instance name.
+          api_keys: List of API keys for the inference instance. Multiple keys can be attached to
+              one deployment.If `auth_enabled` and `api_keys` are both specified, a
+              ValidationError will be raised.
           auth_enabled: Set to `true` to enable API key authentication for the inference instance.
               `"Authorization": "Bearer ****\\**"` or `"X-Api-Key": "****\\**"` header is required
-              for the requests to the instance if enabled
+              for the requests to the instance if enabled. This field is deprecated and will
+              be removed in the future. Use `api_keys` field instead.If `auth_enabled` and
+              `api_keys` are both specified, a ValidationError will be raised.
           command: Command to be executed when running a container from an image.
@@ -815,6 +842,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
                     "image": image,
                     "listening_port": listening_port,
                     "name": name,
+                    "api_keys": api_keys,
                     "auth_enabled": auth_enabled,
                     "command": command,
                     "credentials_name": credentials_name,
@@ -838,6 +866,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
         deployment_name: str,
         *,
         project_id: int | None = None,
+        api_keys: Optional[List[str]] | NotGiven = NOT_GIVEN,
         auth_enabled: bool | NotGiven = NOT_GIVEN,
         command: Optional[List[str]] | NotGiven = NOT_GIVEN,
         containers: Optional[Iterable[deployment_update_params.Container]] | NotGiven = NOT_GIVEN,
@@ -846,7 +875,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
         envs: Optional[Dict[str, str]] | NotGiven = NOT_GIVEN,
         flavor_name: str | NotGiven = NOT_GIVEN,
         image: Optional[str] | NotGiven = NOT_GIVEN,
-        ingress_opts: Optional[IngressOptsParam] | NotGiven = NOT_GIVEN,
+        ingress_opts: Optional[deployment_update_params.IngressOpts] | NotGiven = NOT_GIVEN,
         listening_port: Optional[int] | NotGiven = NOT_GIVEN,
         logging: Optional[deployment_update_params.Logging] | NotGiven = NOT_GIVEN,
         probes: Optional[deployment_update_params.Probes] | NotGiven = NOT_GIVEN,
@@ -866,9 +895,16 @@ class AsyncDeploymentsResource(AsyncAPIResource):
           deployment_name: Inference instance name.
+          api_keys: List of API keys for the inference instance. Multiple keys can be attached to
+              one deployment.If `auth_enabled` and `api_keys` are both specified, a
+              ValidationError will be raised.If `[]` is provided, the API keys will be removed
+              and auth will be disabled on the deployment.
           auth_enabled: Set to `true` to enable API key authentication for the inference instance.
               `"Authorization": "Bearer ****\\**"` or `"X-Api-Key": "****\\**"` header is required
-              for the requests to the instance if enabled
+              for the requests to the instance if enabled. This field is deprecated and will
+              be removed in the future. Use `api_keys` field instead.If `auth_enabled` and
+              `api_keys` are both specified, a ValidationError will be raised.
           command: Command to be executed when running a container from an image.
@@ -917,6 +953,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
             f"/cloud/v3/inference/{project_id}/deployments/{deployment_name}",
             body=await async_maybe_transform(
                 {
+                    "api_keys": api_keys,
                     "auth_enabled": auth_enabled,
                     "command": command,
                     "containers": containers,
@@ -951,7 +988,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
         extra_query: Query | None = None,
         extra_body: Body | None = None,
         timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
-    ) -> AsyncPaginator[Inference, AsyncOffsetPage[Inference]]:
+    ) -> AsyncPaginator[InferenceDeployment, AsyncOffsetPage[InferenceDeployment]]:
         """List inference deployments
         Args:
@@ -976,7 +1013,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
             project_id = self._client._get_cloud_project_id_path_param()
         return self._get_api_list(
             f"/cloud/v3/inference/{project_id}/deployments",
-            page=AsyncOffsetPage[Inference],
+            page=AsyncOffsetPage[InferenceDeployment],
             options=make_request_options(
                 extra_headers=extra_headers,
                 extra_query=extra_query,
@@ -990,7 +1027,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
                     deployment_list_params.DeploymentListParams,
                 ),
             ),
-            model=Inference,
+            model=InferenceDeployment,
         )
     async def delete(
@@ -1044,7 +1081,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
         extra_query: Query | None = None,
         extra_body: Body | None = None,
         timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
-    ) -> Inference:
+    ) -> InferenceDeployment:
         """
         Get inference deployment
@@ -1070,7 +1107,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
             options=make_request_options(
                 extra_headers=extra_headers, extra_query=extra_query, extra_body=extra_body, timeout=timeout
             ),
-            cast_to=Inference,
+            cast_to=InferenceDeployment,
         )
     async def get_api_key(
@@ -1084,7 +1121,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
         extra_query: Query | None = None,
         extra_body: Body | None = None,
         timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
-    ) -> InferenceApikeySecret:
+    ) -> InferenceDeploymentAPIKey:
         """
         Get inference deployment API key
@@ -1110,7 +1147,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
             options=make_request_options(
                 extra_headers=extra_headers, extra_query=extra_query, extra_body=extra_body, timeout=timeout
             ),
-            cast_to=InferenceApikeySecret,
+            cast_to=InferenceDeploymentAPIKey,
         )
     async def start(
@@ -1223,7 +1260,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
         credentials_name: Optional[str] | NotGiven = NOT_GIVEN,
         description: Optional[str] | NotGiven = NOT_GIVEN,
         envs: Dict[str, str] | NotGiven = NOT_GIVEN,
-        ingress_opts: Optional[IngressOptsParam] | NotGiven = NOT_GIVEN,
+        ingress_opts: Optional[deployment_create_params.IngressOpts] | NotGiven = NOT_GIVEN,
         logging: Optional[deployment_create_params.Logging] | NotGiven = NOT_GIVEN,
         probes: Optional[deployment_create_params.Probes] | NotGiven = NOT_GIVEN,
         api_timeout: Optional[int] | NotGiven = NOT_GIVEN,
@@ -1234,7 +1271,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
         extra_headers: Headers | None = None,
         extra_query: Query | None = None,
         extra_body: Body | None = None,
-    ) -> Inference:
+    ) -> InferenceDeployment:
         response = await self.create(
             project_id=project_id,
             containers=containers,
@@ -1263,7 +1300,11 @@ class AsyncDeploymentsResource(AsyncAPIResource):
             extra_headers=extra_headers,
             polling_interval_seconds=polling_interval_seconds,
         )
-        if not task.created_resources or not task.created_resources.inference_instances or len(task.created_resources.inference_instances) != 1:
+        if (
+            not task.created_resources
+            or not task.created_resources.inference_instances
+            or len(task.created_resources.inference_instances) != 1
+        ):
             raise ValueError(f"Expected exactly one resource to be created in a task")
         return await self.get(
             deployment_name=task.created_resources.inference_instances[0],
@@ -1285,7 +1326,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
         envs: Optional[Dict[str, str]] | NotGiven = NOT_GIVEN,
         flavor_name: str | NotGiven = NOT_GIVEN,
         image: Optional[str] | NotGiven = NOT_GIVEN,
-        ingress_opts: Optional[IngressOptsParam] | NotGiven = NOT_GIVEN,
+        ingress_opts: Optional[deployment_update_params.IngressOpts] | NotGiven = NOT_GIVEN,
         listening_port: Optional[int] | NotGiven = NOT_GIVEN,
         logging: Optional[deployment_update_params.Logging] | NotGiven = NOT_GIVEN,
         probes: Optional[deployment_update_params.Probes] | NotGiven = NOT_GIVEN,
@@ -1297,7 +1338,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
         extra_headers: Headers | None = None,
         extra_query: Query | None = None,
         extra_body: Body | None = None,
-    ) -> Inference:
+    ) -> InferenceDeployment:
         """
         Update inference deployment and poll for the result. Only the first task will be polled. If you need to poll more tasks, use the `tasks.poll` method.
         """

gcore/resources/cloud/inference/deployments/logs.py CHANGED Viewed

@@ -20,7 +20,7 @@ from ....._response import (
 from .....pagination import SyncOffsetPage, AsyncOffsetPage
 from ....._base_client import AsyncPaginator, make_request_options
 from .....types.cloud.inference.deployments import log_list_params
-from .....types.cloud.inference.inference_log import InferenceLog
+from .....types.cloud.inference.deployments.inference_deployment_log import InferenceDeploymentLog
 __all__ = ["LogsResource", "AsyncLogsResource"]
@@ -60,7 +60,7 @@ class LogsResource(SyncAPIResource):
         extra_query: Query | None = None,
         extra_body: Body | None = None,
         timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
-    ) -> SyncOffsetPage[InferenceLog]:
+    ) -> SyncOffsetPage[InferenceDeploymentLog]:
         """
         Get inference deployment logs
@@ -92,7 +92,7 @@ class LogsResource(SyncAPIResource):
             raise ValueError(f"Expected a non-empty value for `deployment_name` but received {deployment_name!r}")
         return self._get_api_list(
             f"/cloud/v3/inference/{project_id}/deployments/{deployment_name}/logs",
-            page=SyncOffsetPage[InferenceLog],
+            page=SyncOffsetPage[InferenceDeploymentLog],
             options=make_request_options(
                 extra_headers=extra_headers,
                 extra_query=extra_query,
@@ -108,7 +108,7 @@ class LogsResource(SyncAPIResource):
                     log_list_params.LogListParams,
                 ),
             ),
-            model=InferenceLog,
+            model=InferenceDeploymentLog,
         )
@@ -147,7 +147,7 @@ class AsyncLogsResource(AsyncAPIResource):
         extra_query: Query | None = None,
         extra_body: Body | None = None,
         timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
-    ) -> AsyncPaginator[InferenceLog, AsyncOffsetPage[InferenceLog]]:
+    ) -> AsyncPaginator[InferenceDeploymentLog, AsyncOffsetPage[InferenceDeploymentLog]]:
         """
         Get inference deployment logs
@@ -179,7 +179,7 @@ class AsyncLogsResource(AsyncAPIResource):
             raise ValueError(f"Expected a non-empty value for `deployment_name` but received {deployment_name!r}")
         return self._get_api_list(
             f"/cloud/v3/inference/{project_id}/deployments/{deployment_name}/logs",
-            page=AsyncOffsetPage[InferenceLog],
+            page=AsyncOffsetPage[InferenceDeploymentLog],
             options=make_request_options(
                 extra_headers=extra_headers,
                 extra_query=extra_query,
@@ -195,7 +195,7 @@ class AsyncLogsResource(AsyncAPIResource):
                     log_list_params.LogListParams,
                 ),
             ),
-            model=InferenceLog,
+            model=InferenceDeploymentLog,
         )

gcore/resources/cloud/inference/inference.py CHANGED Viewed

@@ -54,7 +54,7 @@ from .deployments.deployments import (
     DeploymentsResourceWithStreamingResponse,
     AsyncDeploymentsResourceWithStreamingResponse,
 )
-from ....types.cloud.region_capacity_list import RegionCapacityList
+from ....types.cloud.inference_region_capacity_list import InferenceRegionCapacityList
 __all__ = ["InferenceResource", "AsyncInferenceResource"]
@@ -108,14 +108,14 @@ class InferenceResource(SyncAPIResource):
         extra_query: Query | None = None,
         extra_body: Body | None = None,
         timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
-    ) -> RegionCapacityList:
+    ) -> InferenceRegionCapacityList:
         """Get inference capacity by region"""
         return self._get(
             "/cloud/v3/inference/capacity",
             options=make_request_options(
                 extra_headers=extra_headers, extra_query=extra_query, extra_body=extra_body, timeout=timeout
             ),
-            cast_to=RegionCapacityList,
+            cast_to=InferenceRegionCapacityList,
         )
@@ -168,14 +168,14 @@ class AsyncInferenceResource(AsyncAPIResource):
         extra_query: Query | None = None,
         extra_body: Body | None = None,
         timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
-    ) -> RegionCapacityList:
+    ) -> InferenceRegionCapacityList:
         """Get inference capacity by region"""
         return await self._get(
             "/cloud/v3/inference/capacity",
             options=make_request_options(
                 extra_headers=extra_headers, extra_query=extra_query, extra_body=extra_body, timeout=timeout
             ),
-            cast_to=RegionCapacityList,
+            cast_to=InferenceRegionCapacityList,
         )

gcore/resources/cloud/inference/models.py CHANGED Viewed

@@ -2,6 +2,8 @@
 from __future__ import annotations
+from typing_extensions import Literal
 import httpx
 from ...._types import NOT_GIVEN, Body, Query, Headers, NotGiven
@@ -16,9 +18,8 @@ from ...._response import (
 )
 from ....pagination import SyncOffsetPage, AsyncOffsetPage
 from ...._base_client import AsyncPaginator, make_request_options
-from ....types.cloud.inference import MlcatalogOrderByChoices, model_list_params
-from ....types.cloud.inference.mlcatalog_model_card import MlcatalogModelCard
-from ....types.cloud.inference.mlcatalog_order_by_choices import MlcatalogOrderByChoices
+from ....types.cloud.inference import model_list_params
+from ....types.cloud.inference.inference_model import InferenceModel
 __all__ = ["ModelsResource", "AsyncModelsResource"]
@@ -48,14 +49,14 @@ class ModelsResource(SyncAPIResource):
         *,
         limit: int | NotGiven = NOT_GIVEN,
         offset: int | NotGiven = NOT_GIVEN,
-        order_by: MlcatalogOrderByChoices | NotGiven = NOT_GIVEN,
+        order_by: Literal["name.asc", "name.desc"] | NotGiven = NOT_GIVEN,
         # Use the following arguments if you need to pass additional parameters to the API that aren't available via kwargs.
         # The extra values given here take precedence over values defined on the client or passed to this method.
         extra_headers: Headers | None = None,
         extra_query: Query | None = None,
         extra_body: Body | None = None,
         timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
-    ) -> SyncOffsetPage[MlcatalogModelCard]:
+    ) -> SyncOffsetPage[InferenceModel]:
         """List models from catalog
         Args:
@@ -78,7 +79,7 @@ class ModelsResource(SyncAPIResource):
         """
         return self._get_api_list(
             "/cloud/v3/inference/models",
-            page=SyncOffsetPage[MlcatalogModelCard],
+            page=SyncOffsetPage[InferenceModel],
             options=make_request_options(
                 extra_headers=extra_headers,
                 extra_query=extra_query,
@@ -93,7 +94,7 @@ class ModelsResource(SyncAPIResource):
                     model_list_params.ModelListParams,
                 ),
             ),
-            model=MlcatalogModelCard,
+            model=InferenceModel,
         )
     def get(
@@ -106,7 +107,7 @@ class ModelsResource(SyncAPIResource):
         extra_query: Query | None = None,
         extra_body: Body | None = None,
         timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
-    ) -> MlcatalogModelCard:
+    ) -> InferenceModel:
         """
         Get model from catalog
@@ -128,7 +129,7 @@ class ModelsResource(SyncAPIResource):
             options=make_request_options(
                 extra_headers=extra_headers, extra_query=extra_query, extra_body=extra_body, timeout=timeout
             ),
-            cast_to=MlcatalogModelCard,
+            cast_to=InferenceModel,
         )
@@ -157,14 +158,14 @@ class AsyncModelsResource(AsyncAPIResource):
         *,
         limit: int | NotGiven = NOT_GIVEN,
         offset: int | NotGiven = NOT_GIVEN,
-        order_by: MlcatalogOrderByChoices | NotGiven = NOT_GIVEN,
+        order_by: Literal["name.asc", "name.desc"] | NotGiven = NOT_GIVEN,
         # Use the following arguments if you need to pass additional parameters to the API that aren't available via kwargs.
         # The extra values given here take precedence over values defined on the client or passed to this method.
         extra_headers: Headers | None = None,
         extra_query: Query | None = None,
         extra_body: Body | None = None,
         timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
-    ) -> AsyncPaginator[MlcatalogModelCard, AsyncOffsetPage[MlcatalogModelCard]]:
+    ) -> AsyncPaginator[InferenceModel, AsyncOffsetPage[InferenceModel]]:
         """List models from catalog
         Args:
@@ -187,7 +188,7 @@ class AsyncModelsResource(AsyncAPIResource):
         """
         return self._get_api_list(
             "/cloud/v3/inference/models",
-            page=AsyncOffsetPage[MlcatalogModelCard],
+            page=AsyncOffsetPage[InferenceModel],
             options=make_request_options(
                 extra_headers=extra_headers,
                 extra_query=extra_query,
@@ -202,7 +203,7 @@ class AsyncModelsResource(AsyncAPIResource):
                     model_list_params.ModelListParams,
                 ),
             ),
-            model=MlcatalogModelCard,
+            model=InferenceModel,
         )
     async def get(
@@ -215,7 +216,7 @@ class AsyncModelsResource(AsyncAPIResource):
         extra_query: Query | None = None,
         extra_body: Body | None = None,
         timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
-    ) -> MlcatalogModelCard:
+    ) -> InferenceModel:
         """
         Get model from catalog
@@ -237,7 +238,7 @@ class AsyncModelsResource(AsyncAPIResource):
             options=make_request_options(
                 extra_headers=extra_headers, extra_query=extra_query, extra_body=extra_body, timeout=timeout
             ),
-            cast_to=MlcatalogModelCard,
+            cast_to=InferenceModel,
         )

gcore 0.3.0__py3-none-any.whl → 0.5.0__py3-none-any.whl

Potentially problematic release.

gcore 0.3.0__py3-none-any.whl → 0.5.0__py3-none-any.whl