PyPI - gcore - Versions diffs - 0.4.0__py3-none-any.whl → 0.6.0__py3-none-any.whl - Mend

gcore-0.4.0-py3-none-any.whl → gcore-0.6.0-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of gcore might be problematic. Click here for more details.

Files changed (145)

gcore/_base_client.py +9 -2
gcore/_client.py +9 -0
gcore/_constants.py +2 -2
gcore/_models.py +8 -5
gcore/_version.py +1 -1
gcore/pagination.py +192 -1
gcore/resources/__init__.py +14 -0
gcore/resources/cloud/__init__.py +14 -0
gcore/resources/cloud/audit_logs.py +480 -0
gcore/resources/cloud/baremetal/servers.py +2 -2
gcore/resources/cloud/cloud.py +32 -0
gcore/resources/cloud/file_shares/file_shares.py +64 -9
gcore/resources/cloud/gpu_baremetal_clusters/gpu_baremetal_clusters.py +2 -2
gcore/resources/cloud/inference/__init__.py +14 -0
gcore/resources/cloud/inference/api_keys.py +621 -0
gcore/resources/cloud/inference/deployments/deployments.py +66 -33
gcore/resources/cloud/inference/deployments/logs.py +7 -7
gcore/resources/cloud/inference/inference.py +37 -5
gcore/resources/cloud/inference/models.py +16 -15
gcore/resources/cloud/inference/registry_credentials.py +16 -16
gcore/resources/cloud/inference/secrets.py +4 -5
gcore/resources/cloud/instances/instances.py +2 -2
gcore/resources/cloud/load_balancers/pools/members.py +22 -6
gcore/resources/cloud/secrets.py +14 -224
gcore/resources/cloud/tasks.py +30 -28
gcore/resources/fastedge/__init__.py +103 -0
gcore/resources/fastedge/apps/__init__.py +33 -0
gcore/resources/fastedge/apps/apps.py +932 -0
gcore/resources/fastedge/apps/logs.py +248 -0
gcore/resources/fastedge/binaries.py +286 -0
gcore/resources/fastedge/fastedge.py +327 -0
gcore/resources/fastedge/kv_stores.py +523 -0
gcore/resources/fastedge/secrets.py +687 -0
gcore/resources/fastedge/statistics.py +347 -0
gcore/resources/fastedge/templates.py +652 -0
gcore/types/cloud/__init__.py +4 -28
gcore/types/cloud/audit_log_entry.py +254 -0
gcore/types/cloud/audit_log_list_params.py +158 -0
gcore/types/cloud/baremetal/server_create_params.py +1 -1
gcore/types/cloud/file_share_update_params.py +29 -3
gcore/types/cloud/gpu_baremetal_cluster_create_params.py +1 -1
gcore/types/cloud/inference/__init__.py +17 -8
gcore/types/cloud/inference/api_key_create_params.py +21 -0
gcore/types/cloud/inference/api_key_list_params.py +21 -0
gcore/types/cloud/inference/api_key_update_params.py +16 -0
gcore/types/cloud/inference/deployment_create_params.py +224 -7
gcore/types/cloud/inference/deployment_update_params.py +24 -3
gcore/types/cloud/inference/deployments/__init__.py +1 -0
gcore/types/cloud/inference/{inference_log.py → deployments/inference_deployment_log.py} +3 -3
gcore/types/cloud/inference/inference_api_key.py +24 -0
gcore/types/cloud/inference/inference_api_key_create.py +27 -0
gcore/types/cloud/inference/inference_deployment.py +266 -0
gcore/types/cloud/inference/{inference_apikey_secret.py → inference_deployment_api_key.py} +2 -2
gcore/types/cloud/inference/{mlcatalog_model_card.py → inference_model.py} +2 -2
gcore/types/cloud/inference/{inference_registry_credential.py → inference_registry_credentials.py} +2 -2
gcore/types/cloud/inference/{inference_registry_credential_full.py → inference_registry_credentials_create.py} +2 -2
gcore/types/cloud/inference/inference_secret.py +10 -3
gcore/types/cloud/inference/model_list_params.py +2 -4
gcore/types/cloud/{container_probe.py → inference/probe.py} +9 -9
gcore/types/cloud/{container_probe_config.py → inference/probe_config.py} +5 -5
gcore/types/cloud/{container_probe_exec.py → inference/probe_exec.py} +3 -3
gcore/types/cloud/{container_probe_http_get.py → inference/probe_http_get.py} +3 -3
gcore/types/cloud/{container_probe_tcp_socket.py → inference/probe_tcp_socket.py} +3 -3
gcore/types/cloud/inference/secret_create_params.py +10 -4
gcore/types/cloud/inference/secret_replace_params.py +10 -4
gcore/types/cloud/{region_capacity.py → inference_region_capacity.py} +10 -3
gcore/types/cloud/{region_capacity_list.py → inference_region_capacity_list.py} +4 -4
gcore/types/cloud/instance_create_params.py +1 -1
gcore/types/cloud/load_balancer_create_params.py +14 -3
gcore/types/cloud/load_balancers/pool_create_params.py +14 -3
gcore/types/cloud/load_balancers/pool_update_params.py +14 -3
gcore/types/cloud/load_balancers/pools/member_add_params.py +14 -3
gcore/types/cloud/member.py +12 -4
gcore/types/cloud/task_list_params.py +15 -14
gcore/types/fastedge/__init__.py +48 -0
gcore/types/fastedge/app.py +81 -0
gcore/types/fastedge/app_create_params.py +56 -0
gcore/types/fastedge/app_list_params.py +50 -0
gcore/types/fastedge/app_param.py +56 -0
gcore/types/fastedge/app_replace_params.py +17 -0
gcore/types/fastedge/app_short.py +60 -0
gcore/types/fastedge/app_update_params.py +56 -0
gcore/types/fastedge/apps/__init__.py +6 -0
gcore/types/fastedge/apps/log.py +28 -0
gcore/types/fastedge/apps/log_list_params.py +37 -0
gcore/types/fastedge/binary.py +40 -0
gcore/types/fastedge/binary_list_response.py +12 -0
gcore/types/fastedge/binary_short.py +32 -0
gcore/types/fastedge/call_status.py +24 -0
gcore/types/fastedge/client.py +57 -0
gcore/types/fastedge/duration_stats.py +30 -0
gcore/types/fastedge/kv_store.py +33 -0
gcore/types/fastedge/kv_store_create_params.py +23 -0
gcore/types/fastedge/kv_store_get_response.py +10 -0
gcore/types/fastedge/kv_store_list_params.py +12 -0
gcore/types/fastedge/kv_store_list_response.py +15 -0
gcore/types/fastedge/kv_store_replace_params.py +23 -0
gcore/types/fastedge/kv_store_short.py +19 -0
gcore/types/fastedge/kv_store_stats.py +26 -0
gcore/types/fastedge/secret.py +29 -0
gcore/types/fastedge/secret_create_params.py +27 -0
gcore/types/fastedge/secret_create_response.py +12 -0
gcore/types/fastedge/secret_delete_params.py +12 -0
gcore/types/fastedge/secret_list_params.py +15 -0
gcore/types/{cloud → fastedge}/secret_list_response.py +2 -6
gcore/types/fastedge/secret_replace_params.py +27 -0
gcore/types/fastedge/secret_short.py +21 -0
gcore/types/fastedge/secret_update_params.py +27 -0
gcore/types/fastedge/statistic_get_call_series_params.py +28 -0
gcore/types/fastedge/statistic_get_call_series_response.py +12 -0
gcore/types/fastedge/statistic_get_duration_series_params.py +28 -0
gcore/types/fastedge/statistic_get_duration_series_response.py +12 -0
gcore/types/fastedge/template.py +31 -0
gcore/types/fastedge/template_create_params.py +30 -0
gcore/types/fastedge/template_delete_params.py +12 -0
gcore/types/fastedge/template_list_params.py +25 -0
gcore/types/fastedge/template_parameter.py +22 -0
gcore/types/fastedge/template_parameter_param.py +21 -0
gcore/types/fastedge/template_replace_params.py +30 -0
gcore/types/fastedge/template_short.py +27 -0
{gcore-0.4.0.dist-info → gcore-0.6.0.dist-info}/METADATA +8 -7
{gcore-0.4.0.dist-info → gcore-0.6.0.dist-info}/RECORD +124 -80
gcore/types/cloud/aws_iam_data.py +0 -13
gcore/types/cloud/aws_iam_data_param.py +0 -15
gcore/types/cloud/capacity.py +0 -13
gcore/types/cloud/container_probe_config_create_param.py +0 -17
gcore/types/cloud/container_probe_create_param.py +0 -38
gcore/types/cloud/container_probe_exec_create_param.py +0 -13
gcore/types/cloud/container_probe_http_get_create_param.py +0 -25
gcore/types/cloud/container_probe_tcp_socket_create_param.py +0 -12
gcore/types/cloud/container_scale.py +0 -25
gcore/types/cloud/container_scale_trigger_rate.py +0 -13
gcore/types/cloud/container_scale_trigger_sqs.py +0 -33
gcore/types/cloud/container_scale_trigger_threshold.py +0 -10
gcore/types/cloud/container_scale_triggers.py +0 -36
gcore/types/cloud/deploy_status.py +0 -13
gcore/types/cloud/inference/container.py +0 -26
gcore/types/cloud/inference/inference.py +0 -95
gcore/types/cloud/inference/mlcatalog_order_by_choices.py +0 -7
gcore/types/cloud/inference_probes.py +0 -19
gcore/types/cloud/ingress_opts_out.py +0 -16
gcore/types/cloud/ingress_opts_param.py +0 -18
gcore/types/cloud/secret_create_params.py +0 -66
{gcore-0.4.0.dist-info → gcore-0.6.0.dist-info}/WHEEL +0 -0
{gcore-0.4.0.dist-info → gcore-0.6.0.dist-info}/licenses/LICENSE +0 -0

gcore/resources/cloud/inference/deployments/deployments.py CHANGED Viewed

@@ -28,9 +28,8 @@ from .....pagination import SyncOffsetPage, AsyncOffsetPage
 from ....._base_client import AsyncPaginator, make_request_options
 from .....types.cloud.inference import deployment_list_params, deployment_create_params, deployment_update_params
 from .....types.cloud.task_id_list import TaskIDList
-from .....types.cloud.ingress_opts_param import IngressOptsParam
-from .....types.cloud.inference.inference import Inference
-from .....types.cloud.inference.inference_apikey_secret import InferenceApikeySecret
+from .....types.cloud.inference.inference_deployment import InferenceDeployment
+from .....types.cloud.inference.inference_deployment_api_key import InferenceDeploymentAPIKey
 __all__ = ["DeploymentsResource", "AsyncDeploymentsResource"]
@@ -68,12 +67,13 @@ class DeploymentsResource(SyncAPIResource):
         image: str,
         listening_port: int,
         name: str,
+        api_keys: List[str] | NotGiven = NOT_GIVEN,
         auth_enabled: bool | NotGiven = NOT_GIVEN,
         command: Optional[List[str]] | NotGiven = NOT_GIVEN,
         credentials_name: Optional[str] | NotGiven = NOT_GIVEN,
         description: Optional[str] | NotGiven = NOT_GIVEN,
         envs: Dict[str, str] | NotGiven = NOT_GIVEN,
-        ingress_opts: Optional[IngressOptsParam] | NotGiven = NOT_GIVEN,
+        ingress_opts: Optional[deployment_create_params.IngressOpts] | NotGiven = NOT_GIVEN,
         logging: Optional[deployment_create_params.Logging] | NotGiven = NOT_GIVEN,
         probes: Optional[deployment_create_params.Probes] | NotGiven = NOT_GIVEN,
         api_timeout: Optional[int] | NotGiven = NOT_GIVEN,
@@ -103,9 +103,15 @@ class DeploymentsResource(SyncAPIResource):
           name: Inference instance name.
+          api_keys: List of API keys for the inference instance. Multiple keys can be attached to
+              one deployment.If `auth_enabled` and `api_keys` are both specified, a
+              ValidationError will be raised.
           auth_enabled: Set to `true` to enable API key authentication for the inference instance.
               `"Authorization": "Bearer ****\\**"` or `"X-Api-Key": "****\\**"` header is required
-              for the requests to the instance if enabled
+              for the requests to the instance if enabled. This field is deprecated and will
+              be removed in the future. Use `api_keys` field instead.If `auth_enabled` and
+              `api_keys` are both specified, a ValidationError will be raised.
           command: Command to be executed when running a container from an image.
@@ -148,6 +154,7 @@ class DeploymentsResource(SyncAPIResource):
                     "image": image,
                     "listening_port": listening_port,
                     "name": name,
+                    "api_keys": api_keys,
                     "auth_enabled": auth_enabled,
                     "command": command,
                     "credentials_name": credentials_name,
@@ -171,6 +178,7 @@ class DeploymentsResource(SyncAPIResource):
         deployment_name: str,
         *,
         project_id: int | None = None,
+        api_keys: Optional[List[str]] | NotGiven = NOT_GIVEN,
         auth_enabled: bool | NotGiven = NOT_GIVEN,
         command: Optional[List[str]] | NotGiven = NOT_GIVEN,
         containers: Optional[Iterable[deployment_update_params.Container]] | NotGiven = NOT_GIVEN,
@@ -179,7 +187,7 @@ class DeploymentsResource(SyncAPIResource):
         envs: Optional[Dict[str, str]] | NotGiven = NOT_GIVEN,
         flavor_name: str | NotGiven = NOT_GIVEN,
         image: Optional[str] | NotGiven = NOT_GIVEN,
-        ingress_opts: Optional[IngressOptsParam] | NotGiven = NOT_GIVEN,
+        ingress_opts: Optional[deployment_update_params.IngressOpts] | NotGiven = NOT_GIVEN,
         listening_port: Optional[int] | NotGiven = NOT_GIVEN,
         logging: Optional[deployment_update_params.Logging] | NotGiven = NOT_GIVEN,
         probes: Optional[deployment_update_params.Probes] | NotGiven = NOT_GIVEN,
@@ -199,9 +207,16 @@ class DeploymentsResource(SyncAPIResource):
           deployment_name: Inference instance name.
+          api_keys: List of API keys for the inference instance. Multiple keys can be attached to
+              one deployment.If `auth_enabled` and `api_keys` are both specified, a
+              ValidationError will be raised.If `[]` is provided, the API keys will be removed
+              and auth will be disabled on the deployment.
           auth_enabled: Set to `true` to enable API key authentication for the inference instance.
               `"Authorization": "Bearer ****\\**"` or `"X-Api-Key": "****\\**"` header is required
-              for the requests to the instance if enabled
+              for the requests to the instance if enabled. This field is deprecated and will
+              be removed in the future. Use `api_keys` field instead.If `auth_enabled` and
+              `api_keys` are both specified, a ValidationError will be raised.
           command: Command to be executed when running a container from an image.
@@ -250,6 +265,7 @@ class DeploymentsResource(SyncAPIResource):
             f"/cloud/v3/inference/{project_id}/deployments/{deployment_name}",
             body=maybe_transform(
                 {
+                    "api_keys": api_keys,
                     "auth_enabled": auth_enabled,
                     "command": command,
                     "containers": containers,
@@ -284,7 +300,7 @@ class DeploymentsResource(SyncAPIResource):
         extra_query: Query | None = None,
         extra_body: Body | None = None,
         timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
-    ) -> SyncOffsetPage[Inference]:
+    ) -> SyncOffsetPage[InferenceDeployment]:
         """List inference deployments
         Args:
@@ -309,7 +325,7 @@ class DeploymentsResource(SyncAPIResource):
             project_id = self._client._get_cloud_project_id_path_param()
         return self._get_api_list(
             f"/cloud/v3/inference/{project_id}/deployments",
-            page=SyncOffsetPage[Inference],
+            page=SyncOffsetPage[InferenceDeployment],
             options=make_request_options(
                 extra_headers=extra_headers,
                 extra_query=extra_query,
@@ -323,7 +339,7 @@ class DeploymentsResource(SyncAPIResource):
                     deployment_list_params.DeploymentListParams,
                 ),
             ),
-            model=Inference,
+            model=InferenceDeployment,
         )
     def delete(
@@ -377,7 +393,7 @@ class DeploymentsResource(SyncAPIResource):
         extra_query: Query | None = None,
         extra_body: Body | None = None,
         timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
-    ) -> Inference:
+    ) -> InferenceDeployment:
         """
         Get inference deployment
@@ -403,7 +419,7 @@ class DeploymentsResource(SyncAPIResource):
             options=make_request_options(
                 extra_headers=extra_headers, extra_query=extra_query, extra_body=extra_body, timeout=timeout
             ),
-            cast_to=Inference,
+            cast_to=InferenceDeployment,
         )
     def get_api_key(
@@ -417,7 +433,7 @@ class DeploymentsResource(SyncAPIResource):
         extra_query: Query | None = None,
         extra_body: Body | None = None,
         timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
-    ) -> InferenceApikeySecret:
+    ) -> InferenceDeploymentAPIKey:
         """
         Get inference deployment API key
@@ -443,7 +459,7 @@ class DeploymentsResource(SyncAPIResource):
             options=make_request_options(
                 extra_headers=extra_headers, extra_query=extra_query, extra_body=extra_body, timeout=timeout
             ),
-            cast_to=InferenceApikeySecret,
+            cast_to=InferenceDeploymentAPIKey,
         )
     def start(
@@ -556,7 +572,7 @@ class DeploymentsResource(SyncAPIResource):
         credentials_name: Optional[str] | NotGiven = NOT_GIVEN,
         description: Optional[str] | NotGiven = NOT_GIVEN,
         envs: Dict[str, str] | NotGiven = NOT_GIVEN,
-        ingress_opts: Optional[IngressOptsParam] | NotGiven = NOT_GIVEN,
+        ingress_opts: Optional[deployment_create_params.IngressOpts] | NotGiven = NOT_GIVEN,
         logging: Optional[deployment_create_params.Logging] | NotGiven = NOT_GIVEN,
         probes: Optional[deployment_create_params.Probes] | NotGiven = NOT_GIVEN,
         api_timeout: Optional[int] | NotGiven = NOT_GIVEN,
@@ -567,7 +583,7 @@ class DeploymentsResource(SyncAPIResource):
         extra_headers: Headers | None = None,
         extra_query: Query | None = None,
         extra_body: Body | None = None,
-    ) -> Inference:
+    ) -> InferenceDeployment:
         response = self.create(
             project_id=project_id,
             containers=containers,
@@ -622,7 +638,7 @@ class DeploymentsResource(SyncAPIResource):
         envs: Optional[Dict[str, str]] | NotGiven = NOT_GIVEN,
         flavor_name: str | NotGiven = NOT_GIVEN,
         image: Optional[str] | NotGiven = NOT_GIVEN,
-        ingress_opts: Optional[IngressOptsParam] | NotGiven = NOT_GIVEN,
+        ingress_opts: Optional[deployment_update_params.IngressOpts] | NotGiven = NOT_GIVEN,
         listening_port: Optional[int] | NotGiven = NOT_GIVEN,
         logging: Optional[deployment_update_params.Logging] | NotGiven = NOT_GIVEN,
         probes: Optional[deployment_update_params.Probes] | NotGiven = NOT_GIVEN,
@@ -634,7 +650,7 @@ class DeploymentsResource(SyncAPIResource):
         extra_headers: Headers | None = None,
         extra_query: Query | None = None,
         extra_body: Body | None = None,
-    ) -> Inference:
+    ) -> InferenceDeployment:
         """
         Update inference deployment and poll for the result. Only the first task will be polled. If you need to poll more tasks, use the `tasks.poll` method.
         """
@@ -739,12 +755,13 @@ class AsyncDeploymentsResource(AsyncAPIResource):
         image: str,
         listening_port: int,
         name: str,
+        api_keys: List[str] | NotGiven = NOT_GIVEN,
         auth_enabled: bool | NotGiven = NOT_GIVEN,
         command: Optional[List[str]] | NotGiven = NOT_GIVEN,
         credentials_name: Optional[str] | NotGiven = NOT_GIVEN,
         description: Optional[str] | NotGiven = NOT_GIVEN,
         envs: Dict[str, str] | NotGiven = NOT_GIVEN,
-        ingress_opts: Optional[IngressOptsParam] | NotGiven = NOT_GIVEN,
+        ingress_opts: Optional[deployment_create_params.IngressOpts] | NotGiven = NOT_GIVEN,
         logging: Optional[deployment_create_params.Logging] | NotGiven = NOT_GIVEN,
         probes: Optional[deployment_create_params.Probes] | NotGiven = NOT_GIVEN,
         api_timeout: Optional[int] | NotGiven = NOT_GIVEN,
@@ -774,9 +791,15 @@ class AsyncDeploymentsResource(AsyncAPIResource):
           name: Inference instance name.
+          api_keys: List of API keys for the inference instance. Multiple keys can be attached to
+              one deployment.If `auth_enabled` and `api_keys` are both specified, a
+              ValidationError will be raised.
           auth_enabled: Set to `true` to enable API key authentication for the inference instance.
               `"Authorization": "Bearer ****\\**"` or `"X-Api-Key": "****\\**"` header is required
-              for the requests to the instance if enabled
+              for the requests to the instance if enabled. This field is deprecated and will
+              be removed in the future. Use `api_keys` field instead.If `auth_enabled` and
+              `api_keys` are both specified, a ValidationError will be raised.
           command: Command to be executed when running a container from an image.
@@ -819,6 +842,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
                     "image": image,
                     "listening_port": listening_port,
                     "name": name,
+                    "api_keys": api_keys,
                     "auth_enabled": auth_enabled,
                     "command": command,
                     "credentials_name": credentials_name,
@@ -842,6 +866,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
         deployment_name: str,
         *,
         project_id: int | None = None,
+        api_keys: Optional[List[str]] | NotGiven = NOT_GIVEN,
         auth_enabled: bool | NotGiven = NOT_GIVEN,
         command: Optional[List[str]] | NotGiven = NOT_GIVEN,
         containers: Optional[Iterable[deployment_update_params.Container]] | NotGiven = NOT_GIVEN,
@@ -850,7 +875,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
         envs: Optional[Dict[str, str]] | NotGiven = NOT_GIVEN,
         flavor_name: str | NotGiven = NOT_GIVEN,
         image: Optional[str] | NotGiven = NOT_GIVEN,
-        ingress_opts: Optional[IngressOptsParam] | NotGiven = NOT_GIVEN,
+        ingress_opts: Optional[deployment_update_params.IngressOpts] | NotGiven = NOT_GIVEN,
         listening_port: Optional[int] | NotGiven = NOT_GIVEN,
         logging: Optional[deployment_update_params.Logging] | NotGiven = NOT_GIVEN,
         probes: Optional[deployment_update_params.Probes] | NotGiven = NOT_GIVEN,
@@ -870,9 +895,16 @@ class AsyncDeploymentsResource(AsyncAPIResource):
           deployment_name: Inference instance name.
+          api_keys: List of API keys for the inference instance. Multiple keys can be attached to
+              one deployment.If `auth_enabled` and `api_keys` are both specified, a
+              ValidationError will be raised.If `[]` is provided, the API keys will be removed
+              and auth will be disabled on the deployment.
           auth_enabled: Set to `true` to enable API key authentication for the inference instance.
               `"Authorization": "Bearer ****\\**"` or `"X-Api-Key": "****\\**"` header is required
-              for the requests to the instance if enabled
+              for the requests to the instance if enabled. This field is deprecated and will
+              be removed in the future. Use `api_keys` field instead.If `auth_enabled` and
+              `api_keys` are both specified, a ValidationError will be raised.
           command: Command to be executed when running a container from an image.
@@ -921,6 +953,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
             f"/cloud/v3/inference/{project_id}/deployments/{deployment_name}",
             body=await async_maybe_transform(
                 {
+                    "api_keys": api_keys,
                     "auth_enabled": auth_enabled,
                     "command": command,
                     "containers": containers,
@@ -955,7 +988,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
         extra_query: Query | None = None,
         extra_body: Body | None = None,
         timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
-    ) -> AsyncPaginator[Inference, AsyncOffsetPage[Inference]]:
+    ) -> AsyncPaginator[InferenceDeployment, AsyncOffsetPage[InferenceDeployment]]:
         """List inference deployments
         Args:
@@ -980,7 +1013,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
             project_id = self._client._get_cloud_project_id_path_param()
         return self._get_api_list(
             f"/cloud/v3/inference/{project_id}/deployments",
-            page=AsyncOffsetPage[Inference],
+            page=AsyncOffsetPage[InferenceDeployment],
             options=make_request_options(
                 extra_headers=extra_headers,
                 extra_query=extra_query,
@@ -994,7 +1027,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
                     deployment_list_params.DeploymentListParams,
                 ),
             ),
-            model=Inference,
+            model=InferenceDeployment,
         )
     async def delete(
@@ -1048,7 +1081,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
         extra_query: Query | None = None,
         extra_body: Body | None = None,
         timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
-    ) -> Inference:
+    ) -> InferenceDeployment:
         """
         Get inference deployment
@@ -1074,7 +1107,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
             options=make_request_options(
                 extra_headers=extra_headers, extra_query=extra_query, extra_body=extra_body, timeout=timeout
             ),
-            cast_to=Inference,
+            cast_to=InferenceDeployment,
         )
     async def get_api_key(
@@ -1088,7 +1121,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
         extra_query: Query | None = None,
         extra_body: Body | None = None,
         timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
-    ) -> InferenceApikeySecret:
+    ) -> InferenceDeploymentAPIKey:
         """
         Get inference deployment API key
@@ -1114,7 +1147,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
             options=make_request_options(
                 extra_headers=extra_headers, extra_query=extra_query, extra_body=extra_body, timeout=timeout
             ),
-            cast_to=InferenceApikeySecret,
+            cast_to=InferenceDeploymentAPIKey,
         )
     async def start(
@@ -1227,7 +1260,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
         credentials_name: Optional[str] | NotGiven = NOT_GIVEN,
         description: Optional[str] | NotGiven = NOT_GIVEN,
         envs: Dict[str, str] | NotGiven = NOT_GIVEN,
-        ingress_opts: Optional[IngressOptsParam] | NotGiven = NOT_GIVEN,
+        ingress_opts: Optional[deployment_create_params.IngressOpts] | NotGiven = NOT_GIVEN,
         logging: Optional[deployment_create_params.Logging] | NotGiven = NOT_GIVEN,
         probes: Optional[deployment_create_params.Probes] | NotGiven = NOT_GIVEN,
         api_timeout: Optional[int] | NotGiven = NOT_GIVEN,
@@ -1238,7 +1271,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
         extra_headers: Headers | None = None,
         extra_query: Query | None = None,
         extra_body: Body | None = None,
-    ) -> Inference:
+    ) -> InferenceDeployment:
         response = await self.create(
             project_id=project_id,
             containers=containers,
@@ -1293,7 +1326,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
         envs: Optional[Dict[str, str]] | NotGiven = NOT_GIVEN,
         flavor_name: str | NotGiven = NOT_GIVEN,
         image: Optional[str] | NotGiven = NOT_GIVEN,
-        ingress_opts: Optional[IngressOptsParam] | NotGiven = NOT_GIVEN,
+        ingress_opts: Optional[deployment_update_params.IngressOpts] | NotGiven = NOT_GIVEN,
         listening_port: Optional[int] | NotGiven = NOT_GIVEN,
         logging: Optional[deployment_update_params.Logging] | NotGiven = NOT_GIVEN,
         probes: Optional[deployment_update_params.Probes] | NotGiven = NOT_GIVEN,
@@ -1305,7 +1338,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
         extra_headers: Headers | None = None,
         extra_query: Query | None = None,
         extra_body: Body | None = None,
-    ) -> Inference:
+    ) -> InferenceDeployment:
         """
         Update inference deployment and poll for the result. Only the first task will be polled. If you need to poll more tasks, use the `tasks.poll` method.
         """

gcore/resources/cloud/inference/deployments/logs.py CHANGED Viewed

@@ -20,7 +20,7 @@ from ....._response import (
 from .....pagination import SyncOffsetPage, AsyncOffsetPage
 from ....._base_client import AsyncPaginator, make_request_options
 from .....types.cloud.inference.deployments import log_list_params
-from .....types.cloud.inference.inference_log import InferenceLog
+from .....types.cloud.inference.deployments.inference_deployment_log import InferenceDeploymentLog
 __all__ = ["LogsResource", "AsyncLogsResource"]
@@ -60,7 +60,7 @@ class LogsResource(SyncAPIResource):
         extra_query: Query | None = None,
         extra_body: Body | None = None,
         timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
-    ) -> SyncOffsetPage[InferenceLog]:
+    ) -> SyncOffsetPage[InferenceDeploymentLog]:
         """
         Get inference deployment logs
@@ -92,7 +92,7 @@ class LogsResource(SyncAPIResource):
             raise ValueError(f"Expected a non-empty value for `deployment_name` but received {deployment_name!r}")
         return self._get_api_list(
             f"/cloud/v3/inference/{project_id}/deployments/{deployment_name}/logs",
-            page=SyncOffsetPage[InferenceLog],
+            page=SyncOffsetPage[InferenceDeploymentLog],
             options=make_request_options(
                 extra_headers=extra_headers,
                 extra_query=extra_query,
@@ -108,7 +108,7 @@ class LogsResource(SyncAPIResource):
                     log_list_params.LogListParams,
                 ),
             ),
-            model=InferenceLog,
+            model=InferenceDeploymentLog,
         )
@@ -147,7 +147,7 @@ class AsyncLogsResource(AsyncAPIResource):
         extra_query: Query | None = None,
         extra_body: Body | None = None,
         timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
-    ) -> AsyncPaginator[InferenceLog, AsyncOffsetPage[InferenceLog]]:
+    ) -> AsyncPaginator[InferenceDeploymentLog, AsyncOffsetPage[InferenceDeploymentLog]]:
         """
         Get inference deployment logs
@@ -179,7 +179,7 @@ class AsyncLogsResource(AsyncAPIResource):
             raise ValueError(f"Expected a non-empty value for `deployment_name` but received {deployment_name!r}")
         return self._get_api_list(
             f"/cloud/v3/inference/{project_id}/deployments/{deployment_name}/logs",
-            page=AsyncOffsetPage[InferenceLog],
+            page=AsyncOffsetPage[InferenceDeploymentLog],
             options=make_request_options(
                 extra_headers=extra_headers,
                 extra_query=extra_query,
@@ -195,7 +195,7 @@ class AsyncLogsResource(AsyncAPIResource):
                     log_list_params.LogListParams,
                 ),
             ),
-            model=InferenceLog,
+            model=InferenceDeploymentLog,
         )

gcore/resources/cloud/inference/inference.py CHANGED Viewed

@@ -28,6 +28,14 @@ from .secrets import (
     SecretsResourceWithStreamingResponse,
     AsyncSecretsResourceWithStreamingResponse,
 )
+from .api_keys import (
+    APIKeysResource,
+    AsyncAPIKeysResource,
+    APIKeysResourceWithRawResponse,
+    AsyncAPIKeysResourceWithRawResponse,
+    APIKeysResourceWithStreamingResponse,
+    AsyncAPIKeysResourceWithStreamingResponse,
+)
 from ...._types import NOT_GIVEN, Body, Query, Headers, NotGiven
 from ...._compat import cached_property
 from ...._resource import SyncAPIResource, AsyncAPIResource
@@ -54,7 +62,7 @@ from .deployments.deployments import (
     DeploymentsResourceWithStreamingResponse,
     AsyncDeploymentsResourceWithStreamingResponse,
 )
-from ....types.cloud.region_capacity_list import RegionCapacityList
+from ....types.cloud.inference_region_capacity_list import InferenceRegionCapacityList
 __all__ = ["InferenceResource", "AsyncInferenceResource"]
@@ -80,6 +88,10 @@ class InferenceResource(SyncAPIResource):
     def secrets(self) -> SecretsResource:
         return SecretsResource(self._client)
+    @cached_property
+    def api_keys(self) -> APIKeysResource:
+        return APIKeysResource(self._client)
     @cached_property
     def with_raw_response(self) -> InferenceResourceWithRawResponse:
         """
@@ -108,14 +120,14 @@ class InferenceResource(SyncAPIResource):
         extra_query: Query | None = None,
         extra_body: Body | None = None,
         timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
-    ) -> RegionCapacityList:
+    ) -> InferenceRegionCapacityList:
         """Get inference capacity by region"""
         return self._get(
             "/cloud/v3/inference/capacity",
             options=make_request_options(
                 extra_headers=extra_headers, extra_query=extra_query, extra_body=extra_body, timeout=timeout
             ),
-            cast_to=RegionCapacityList,
+            cast_to=InferenceRegionCapacityList,
         )
@@ -140,6 +152,10 @@ class AsyncInferenceResource(AsyncAPIResource):
     def secrets(self) -> AsyncSecretsResource:
         return AsyncSecretsResource(self._client)
+    @cached_property
+    def api_keys(self) -> AsyncAPIKeysResource:
+        return AsyncAPIKeysResource(self._client)
     @cached_property
     def with_raw_response(self) -> AsyncInferenceResourceWithRawResponse:
         """
@@ -168,14 +184,14 @@ class AsyncInferenceResource(AsyncAPIResource):
         extra_query: Query | None = None,
         extra_body: Body | None = None,
         timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
-    ) -> RegionCapacityList:
+    ) -> InferenceRegionCapacityList:
         """Get inference capacity by region"""
         return await self._get(
             "/cloud/v3/inference/capacity",
             options=make_request_options(
                 extra_headers=extra_headers, extra_query=extra_query, extra_body=extra_body, timeout=timeout
             ),
-            cast_to=RegionCapacityList,
+            cast_to=InferenceRegionCapacityList,
         )
@@ -207,6 +223,10 @@ class InferenceResourceWithRawResponse:
     def secrets(self) -> SecretsResourceWithRawResponse:
         return SecretsResourceWithRawResponse(self._inference.secrets)
+    @cached_property
+    def api_keys(self) -> APIKeysResourceWithRawResponse:
+        return APIKeysResourceWithRawResponse(self._inference.api_keys)
 class AsyncInferenceResourceWithRawResponse:
     def __init__(self, inference: AsyncInferenceResource) -> None:
@@ -236,6 +256,10 @@ class AsyncInferenceResourceWithRawResponse:
     def secrets(self) -> AsyncSecretsResourceWithRawResponse:
         return AsyncSecretsResourceWithRawResponse(self._inference.secrets)
+    @cached_property
+    def api_keys(self) -> AsyncAPIKeysResourceWithRawResponse:
+        return AsyncAPIKeysResourceWithRawResponse(self._inference.api_keys)
 class InferenceResourceWithStreamingResponse:
     def __init__(self, inference: InferenceResource) -> None:
@@ -265,6 +289,10 @@ class InferenceResourceWithStreamingResponse:
     def secrets(self) -> SecretsResourceWithStreamingResponse:
         return SecretsResourceWithStreamingResponse(self._inference.secrets)
+    @cached_property
+    def api_keys(self) -> APIKeysResourceWithStreamingResponse:
+        return APIKeysResourceWithStreamingResponse(self._inference.api_keys)
 class AsyncInferenceResourceWithStreamingResponse:
     def __init__(self, inference: AsyncInferenceResource) -> None:
@@ -293,3 +321,7 @@ class AsyncInferenceResourceWithStreamingResponse:
     @cached_property
     def secrets(self) -> AsyncSecretsResourceWithStreamingResponse:
         return AsyncSecretsResourceWithStreamingResponse(self._inference.secrets)
+    @cached_property
+    def api_keys(self) -> AsyncAPIKeysResourceWithStreamingResponse:
+        return AsyncAPIKeysResourceWithStreamingResponse(self._inference.api_keys)

gcore/resources/cloud/inference/models.py CHANGED Viewed

@@ -2,6 +2,8 @@
 from __future__ import annotations
+from typing_extensions import Literal
 import httpx
 from ...._types import NOT_GIVEN, Body, Query, Headers, NotGiven
@@ -16,9 +18,8 @@ from ...._response import (
 )
 from ....pagination import SyncOffsetPage, AsyncOffsetPage
 from ...._base_client import AsyncPaginator, make_request_options
-from ....types.cloud.inference import MlcatalogOrderByChoices, model_list_params
-from ....types.cloud.inference.mlcatalog_model_card import MlcatalogModelCard
-from ....types.cloud.inference.mlcatalog_order_by_choices import MlcatalogOrderByChoices
+from ....types.cloud.inference import model_list_params
+from ....types.cloud.inference.inference_model import InferenceModel
 __all__ = ["ModelsResource", "AsyncModelsResource"]
@@ -48,14 +49,14 @@ class ModelsResource(SyncAPIResource):
         *,
         limit: int | NotGiven = NOT_GIVEN,
         offset: int | NotGiven = NOT_GIVEN,
-        order_by: MlcatalogOrderByChoices | NotGiven = NOT_GIVEN,
+        order_by: Literal["name.asc", "name.desc"] | NotGiven = NOT_GIVEN,
         # Use the following arguments if you need to pass additional parameters to the API that aren't available via kwargs.
         # The extra values given here take precedence over values defined on the client or passed to this method.
         extra_headers: Headers | None = None,
         extra_query: Query | None = None,
         extra_body: Body | None = None,
         timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
-    ) -> SyncOffsetPage[MlcatalogModelCard]:
+    ) -> SyncOffsetPage[InferenceModel]:
         """List models from catalog
         Args:
@@ -78,7 +79,7 @@ class ModelsResource(SyncAPIResource):
         """
         return self._get_api_list(
             "/cloud/v3/inference/models",
-            page=SyncOffsetPage[MlcatalogModelCard],
+            page=SyncOffsetPage[InferenceModel],
             options=make_request_options(
                 extra_headers=extra_headers,
                 extra_query=extra_query,
@@ -93,7 +94,7 @@ class ModelsResource(SyncAPIResource):
                     model_list_params.ModelListParams,
                 ),
             ),
-            model=MlcatalogModelCard,
+            model=InferenceModel,
         )
     def get(
@@ -106,7 +107,7 @@ class ModelsResource(SyncAPIResource):
         extra_query: Query | None = None,
         extra_body: Body | None = None,
         timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
-    ) -> MlcatalogModelCard:
+    ) -> InferenceModel:
         """
         Get model from catalog
@@ -128,7 +129,7 @@ class ModelsResource(SyncAPIResource):
             options=make_request_options(
                 extra_headers=extra_headers, extra_query=extra_query, extra_body=extra_body, timeout=timeout
             ),
-            cast_to=MlcatalogModelCard,
+            cast_to=InferenceModel,
         )
@@ -157,14 +158,14 @@ class AsyncModelsResource(AsyncAPIResource):
         *,
         limit: int | NotGiven = NOT_GIVEN,
         offset: int | NotGiven = NOT_GIVEN,
-        order_by: MlcatalogOrderByChoices | NotGiven = NOT_GIVEN,
+        order_by: Literal["name.asc", "name.desc"] | NotGiven = NOT_GIVEN,
         # Use the following arguments if you need to pass additional parameters to the API that aren't available via kwargs.
         # The extra values given here take precedence over values defined on the client or passed to this method.
         extra_headers: Headers | None = None,
         extra_query: Query | None = None,
         extra_body: Body | None = None,
         timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
-    ) -> AsyncPaginator[MlcatalogModelCard, AsyncOffsetPage[MlcatalogModelCard]]:
+    ) -> AsyncPaginator[InferenceModel, AsyncOffsetPage[InferenceModel]]:
         """List models from catalog
         Args:
@@ -187,7 +188,7 @@ class AsyncModelsResource(AsyncAPIResource):
         """
         return self._get_api_list(
             "/cloud/v3/inference/models",
-            page=AsyncOffsetPage[MlcatalogModelCard],
+            page=AsyncOffsetPage[InferenceModel],
             options=make_request_options(
                 extra_headers=extra_headers,
                 extra_query=extra_query,
@@ -202,7 +203,7 @@ class AsyncModelsResource(AsyncAPIResource):
                     model_list_params.ModelListParams,
                 ),
             ),
-            model=MlcatalogModelCard,
+            model=InferenceModel,
         )
     async def get(
@@ -215,7 +216,7 @@ class AsyncModelsResource(AsyncAPIResource):
         extra_query: Query | None = None,
         extra_body: Body | None = None,
         timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
-    ) -> MlcatalogModelCard:
+    ) -> InferenceModel:
         """
         Get model from catalog
@@ -237,7 +238,7 @@ class AsyncModelsResource(AsyncAPIResource):
             options=make_request_options(
                 extra_headers=extra_headers, extra_query=extra_query, extra_body=extra_body, timeout=timeout
             ),
-            cast_to=MlcatalogModelCard,
+            cast_to=InferenceModel,
         )

gcore 0.4.0__py3-none-any.whl → 0.6.0__py3-none-any.whl

Potentially problematic release.

gcore 0.4.0py3-none-any.whl → 0.6.0py3-none-any.whl