gcore 0.3.0__py3-none-any.whl → 0.5.0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of gcore might be problematic. Click here for more details.
- gcore/__init__.py +2 -1
- gcore/_base_client.py +31 -2
- gcore/_client.py +18 -0
- gcore/_constants.py +2 -2
- gcore/_models.py +8 -5
- gcore/_version.py +1 -1
- gcore/pagination.py +252 -1
- gcore/resources/__init__.py +28 -0
- gcore/resources/cloud/baremetal/flavors.py +11 -137
- gcore/resources/cloud/baremetal/images.py +10 -12
- gcore/resources/cloud/baremetal/servers.py +33 -30
- gcore/resources/cloud/billing_reservations.py +2 -2
- gcore/resources/cloud/file_shares/file_shares.py +7 -8
- gcore/resources/cloud/floating_ips.py +7 -12
- gcore/resources/cloud/gpu_baremetal_clusters/gpu_baremetal_clusters.py +33 -22
- gcore/resources/cloud/gpu_baremetal_clusters/images.py +9 -10
- gcore/resources/cloud/gpu_baremetal_clusters/interfaces.py +2 -2
- gcore/resources/cloud/gpu_baremetal_clusters/servers.py +8 -4
- gcore/resources/cloud/inference/deployments/deployments.py +76 -35
- gcore/resources/cloud/inference/deployments/logs.py +7 -7
- gcore/resources/cloud/inference/inference.py +5 -5
- gcore/resources/cloud/inference/models.py +16 -15
- gcore/resources/cloud/inference/registry_credentials.py +18 -18
- gcore/resources/cloud/inference/secrets.py +12 -13
- gcore/resources/cloud/instances/flavors.py +9 -233
- gcore/resources/cloud/instances/images.py +47 -37
- gcore/resources/cloud/instances/instances.py +49 -34
- gcore/resources/cloud/instances/interfaces.py +2 -2
- gcore/resources/cloud/ip_ranges.py +34 -2
- gcore/resources/cloud/load_balancers/l7_policies/l7_policies.py +10 -2
- gcore/resources/cloud/load_balancers/listeners.py +17 -8
- gcore/resources/cloud/load_balancers/load_balancers.py +73 -21
- gcore/resources/cloud/load_balancers/metrics.py +2 -2
- gcore/resources/cloud/load_balancers/pools/health_monitors.py +2 -2
- gcore/resources/cloud/load_balancers/pools/members.py +6 -2
- gcore/resources/cloud/networks/networks.py +81 -17
- gcore/resources/cloud/networks/routers.py +18 -18
- gcore/resources/cloud/networks/subnets.py +51 -11
- gcore/resources/cloud/projects.py +38 -24
- gcore/resources/cloud/quotas/quotas.py +6 -6
- gcore/resources/cloud/quotas/requests.py +8 -8
- gcore/resources/cloud/registries/artifacts.py +4 -4
- gcore/resources/cloud/registries/registries.py +14 -16
- gcore/resources/cloud/registries/repositories.py +4 -4
- gcore/resources/cloud/registries/tags.py +2 -2
- gcore/resources/cloud/registries/users.py +21 -22
- gcore/resources/cloud/reserved_fixed_ips/reserved_fixed_ips.py +20 -20
- gcore/resources/cloud/reserved_fixed_ips/vip.py +10 -10
- gcore/resources/cloud/secrets.py +14 -224
- gcore/resources/cloud/security_groups/rules.py +6 -6
- gcore/resources/cloud/security_groups/security_groups.py +70 -31
- gcore/resources/cloud/tasks.py +34 -32
- gcore/resources/cloud/users/role_assignments.py +12 -14
- gcore/resources/cloud/volumes.py +139 -49
- gcore/resources/fastedge/__init__.py +103 -0
- gcore/resources/fastedge/apps/__init__.py +33 -0
- gcore/resources/fastedge/apps/apps.py +932 -0
- gcore/resources/fastedge/apps/logs.py +248 -0
- gcore/resources/fastedge/binaries.py +286 -0
- gcore/resources/fastedge/fastedge.py +327 -0
- gcore/resources/fastedge/kv_stores.py +523 -0
- gcore/resources/fastedge/secrets.py +687 -0
- gcore/resources/fastedge/statistics.py +347 -0
- gcore/resources/fastedge/templates.py +652 -0
- gcore/resources/iam/__init__.py +47 -0
- gcore/resources/iam/api_tokens.py +521 -0
- gcore/resources/iam/iam.py +199 -0
- gcore/resources/iam/users.py +642 -0
- gcore/resources/waap/__init__.py +0 -14
- gcore/resources/waap/waap.py +0 -32
- gcore/types/cloud/__init__.py +2 -28
- gcore/types/cloud/baremetal/__init__.py +0 -1
- gcore/types/cloud/baremetal/image_list_params.py +1 -5
- gcore/types/cloud/baremetal/server_create_params.py +5 -9
- gcore/types/cloud/baremetal/server_list_params.py +1 -5
- gcore/types/cloud/ddos_profile.py +9 -3
- gcore/types/cloud/file_share_create_params.py +3 -5
- gcore/types/cloud/floating_ip_create_params.py +2 -4
- gcore/types/cloud/floating_ip_list_params.py +1 -5
- gcore/types/cloud/gpu_baremetal_cluster_create_params.py +3 -4
- gcore/types/cloud/gpu_baremetal_clusters/image_upload_params.py +2 -4
- gcore/types/cloud/health_monitor.py +6 -1
- gcore/types/cloud/inference/__init__.py +12 -8
- gcore/types/cloud/inference/deployment_create_params.py +224 -7
- gcore/types/cloud/inference/deployment_update_params.py +24 -3
- gcore/types/cloud/inference/deployments/__init__.py +1 -0
- gcore/types/cloud/inference/{inference_log.py → deployments/inference_deployment_log.py} +3 -3
- gcore/types/cloud/inference/inference_deployment.py +266 -0
- gcore/types/cloud/inference/{inference_apikey_secret.py → inference_deployment_api_key.py} +2 -2
- gcore/types/cloud/inference/{mlcatalog_model_card.py → inference_model.py} +2 -2
- gcore/types/cloud/inference/{inference_registry_credential.py → inference_registry_credentials.py} +2 -2
- gcore/types/cloud/inference/{inference_registry_credential_full.py → inference_registry_credentials_create.py} +2 -2
- gcore/types/cloud/inference/inference_secret.py +10 -3
- gcore/types/cloud/inference/model_list_params.py +2 -4
- gcore/types/cloud/{container_probe.py → inference/probe.py} +9 -9
- gcore/types/cloud/{container_probe_config.py → inference/probe_config.py} +5 -5
- gcore/types/cloud/{container_probe_exec.py → inference/probe_exec.py} +3 -3
- gcore/types/cloud/{container_probe_http_get.py → inference/probe_http_get.py} +3 -3
- gcore/types/cloud/{container_probe_tcp_socket.py → inference/probe_tcp_socket.py} +3 -3
- gcore/types/cloud/inference/secret_create_params.py +10 -4
- gcore/types/cloud/inference/secret_replace_params.py +10 -4
- gcore/types/cloud/{region_capacity.py → inference_region_capacity.py} +10 -3
- gcore/types/cloud/{region_capacity_list.py → inference_region_capacity_list.py} +4 -4
- gcore/types/cloud/instance_create_params.py +8 -9
- gcore/types/cloud/instance_list_params.py +1 -5
- gcore/types/cloud/instances/__init__.py +0 -2
- gcore/types/cloud/instances/image_create_from_volume_params.py +2 -4
- gcore/types/cloud/instances/image_list_params.py +1 -5
- gcore/types/cloud/instances/image_upload_params.py +2 -4
- gcore/types/cloud/load_balancer_create_params.py +8 -4
- gcore/types/cloud/load_balancer_list_params.py +1 -5
- gcore/types/cloud/load_balancer_update_params.py +24 -0
- gcore/types/cloud/load_balancers/pool_create_params.py +6 -1
- gcore/types/cloud/load_balancers/pool_update_params.py +6 -1
- gcore/types/cloud/load_balancers/pools/member_add_params.py +6 -1
- gcore/types/cloud/member.py +6 -1
- gcore/types/cloud/network_create_params.py +2 -3
- gcore/types/cloud/network_list_params.py +4 -5
- gcore/types/cloud/network_update_params.py +28 -2
- gcore/types/cloud/networks/router_list_params.py +2 -2
- gcore/types/cloud/networks/subnet_create_params.py +2 -3
- gcore/types/cloud/networks/subnet_list_params.py +1 -5
- gcore/types/cloud/networks/subnet_update_params.py +25 -0
- gcore/types/cloud/registries/__init__.py +1 -0
- gcore/types/cloud/registries/user_refresh_secret_response.py +31 -0
- gcore/types/cloud/reserved_fixed_ip_list_params.py +2 -2
- gcore/types/cloud/security_group_list_params.py +3 -7
- gcore/types/cloud/security_group_update_params.py +25 -0
- gcore/types/cloud/tag_update_map_param.py +2 -2
- gcore/types/cloud/task_list_params.py +15 -14
- gcore/types/cloud/volume_list_params.py +1 -5
- gcore/types/cloud/volume_update_params.py +29 -3
- gcore/types/fastedge/__init__.py +48 -0
- gcore/types/fastedge/app.py +81 -0
- gcore/types/fastedge/app_create_params.py +56 -0
- gcore/types/fastedge/app_list_params.py +50 -0
- gcore/types/fastedge/app_param.py +56 -0
- gcore/types/fastedge/app_replace_params.py +17 -0
- gcore/types/fastedge/app_short.py +60 -0
- gcore/types/fastedge/app_update_params.py +56 -0
- gcore/types/fastedge/apps/__init__.py +6 -0
- gcore/types/fastedge/apps/log.py +28 -0
- gcore/types/fastedge/apps/log_list_params.py +37 -0
- gcore/types/fastedge/binary.py +40 -0
- gcore/types/fastedge/binary_list_response.py +12 -0
- gcore/types/fastedge/binary_short.py +32 -0
- gcore/types/fastedge/call_status.py +24 -0
- gcore/types/fastedge/client.py +57 -0
- gcore/types/fastedge/duration_stats.py +30 -0
- gcore/types/fastedge/kv_store.py +33 -0
- gcore/types/fastedge/kv_store_create_params.py +23 -0
- gcore/types/fastedge/kv_store_get_response.py +10 -0
- gcore/types/fastedge/kv_store_list_params.py +12 -0
- gcore/types/fastedge/kv_store_list_response.py +15 -0
- gcore/types/fastedge/kv_store_replace_params.py +23 -0
- gcore/types/fastedge/kv_store_short.py +19 -0
- gcore/types/fastedge/kv_store_stats.py +26 -0
- gcore/types/fastedge/secret.py +29 -0
- gcore/types/fastedge/secret_create_params.py +27 -0
- gcore/types/fastedge/secret_create_response.py +12 -0
- gcore/types/fastedge/secret_delete_params.py +12 -0
- gcore/types/fastedge/secret_list_params.py +15 -0
- gcore/types/{cloud → fastedge}/secret_list_response.py +2 -6
- gcore/types/fastedge/secret_replace_params.py +27 -0
- gcore/types/fastedge/secret_short.py +21 -0
- gcore/types/fastedge/secret_update_params.py +27 -0
- gcore/types/fastedge/statistic_get_call_series_params.py +28 -0
- gcore/types/fastedge/statistic_get_call_series_response.py +12 -0
- gcore/types/fastedge/statistic_get_duration_series_params.py +28 -0
- gcore/types/fastedge/statistic_get_duration_series_response.py +12 -0
- gcore/types/fastedge/template.py +31 -0
- gcore/types/fastedge/template_create_params.py +30 -0
- gcore/types/fastedge/template_delete_params.py +12 -0
- gcore/types/fastedge/template_list_params.py +25 -0
- gcore/types/fastedge/template_parameter.py +22 -0
- gcore/types/fastedge/template_parameter_param.py +21 -0
- gcore/types/fastedge/template_replace_params.py +30 -0
- gcore/types/fastedge/template_short.py +27 -0
- gcore/types/iam/__init__.py +17 -0
- gcore/types/iam/account_overview.py +488 -0
- gcore/types/iam/api_token.py +78 -0
- gcore/types/iam/api_token_create.py +15 -0
- gcore/types/iam/api_token_create_params.py +42 -0
- gcore/types/iam/api_token_list.py +81 -0
- gcore/types/iam/api_token_list_params.py +41 -0
- gcore/types/iam/user.py +86 -0
- gcore/types/iam/user_detailed.py +104 -0
- gcore/types/iam/user_invite.py +15 -0
- gcore/types/iam/user_invite_params.py +37 -0
- gcore/types/iam/user_list_params.py +15 -0
- gcore/types/iam/user_update.py +104 -0
- gcore/types/iam/user_update_params.py +52 -0
- gcore/types/waap/__init__.py +0 -1
- gcore/types/waap/domains/custom_rule_create_params.py +7 -3
- gcore/types/waap/domains/custom_rule_update_params.py +7 -3
- gcore/types/waap/waap_custom_rule.py +7 -3
- {gcore-0.3.0.dist-info → gcore-0.5.0.dist-info}/METADATA +44 -5
- {gcore-0.3.0.dist-info → gcore-0.5.0.dist-info}/RECORD +200 -151
- gcore/resources/waap/clients.py +0 -135
- gcore/types/cloud/aws_iam_data.py +0 -13
- gcore/types/cloud/aws_iam_data_param.py +0 -15
- gcore/types/cloud/baremetal/flavor_list_suitable_params.py +0 -22
- gcore/types/cloud/capacity.py +0 -13
- gcore/types/cloud/container_probe_config_create_param.py +0 -17
- gcore/types/cloud/container_probe_create_param.py +0 -38
- gcore/types/cloud/container_probe_exec_create_param.py +0 -13
- gcore/types/cloud/container_probe_http_get_create_param.py +0 -25
- gcore/types/cloud/container_probe_tcp_socket_create_param.py +0 -12
- gcore/types/cloud/container_scale.py +0 -25
- gcore/types/cloud/container_scale_trigger_rate.py +0 -13
- gcore/types/cloud/container_scale_trigger_sqs.py +0 -33
- gcore/types/cloud/container_scale_trigger_threshold.py +0 -10
- gcore/types/cloud/container_scale_triggers.py +0 -36
- gcore/types/cloud/deploy_status.py +0 -13
- gcore/types/cloud/inference/container.py +0 -26
- gcore/types/cloud/inference/inference.py +0 -95
- gcore/types/cloud/inference/mlcatalog_order_by_choices.py +0 -7
- gcore/types/cloud/inference_probes.py +0 -19
- gcore/types/cloud/ingress_opts_out.py +0 -16
- gcore/types/cloud/ingress_opts_param.py +0 -18
- gcore/types/cloud/instances/flavor_list_for_resize_params.py +0 -16
- gcore/types/cloud/instances/flavor_list_suitable_params.py +0 -59
- gcore/types/cloud/secret_create_params.py +0 -66
- gcore/types/waap/client_me_response.py +0 -34
- {gcore-0.3.0.dist-info → gcore-0.5.0.dist-info}/WHEEL +0 -0
- {gcore-0.3.0.dist-info → gcore-0.5.0.dist-info}/licenses/LICENSE +0 -0
|
@@ -28,9 +28,8 @@ from .....pagination import SyncOffsetPage, AsyncOffsetPage
|
|
|
28
28
|
from ....._base_client import AsyncPaginator, make_request_options
|
|
29
29
|
from .....types.cloud.inference import deployment_list_params, deployment_create_params, deployment_update_params
|
|
30
30
|
from .....types.cloud.task_id_list import TaskIDList
|
|
31
|
-
from .....types.cloud.
|
|
32
|
-
from .....types.cloud.inference.
|
|
33
|
-
from .....types.cloud.inference.inference_apikey_secret import InferenceApikeySecret
|
|
31
|
+
from .....types.cloud.inference.inference_deployment import InferenceDeployment
|
|
32
|
+
from .....types.cloud.inference.inference_deployment_api_key import InferenceDeploymentAPIKey
|
|
34
33
|
|
|
35
34
|
__all__ = ["DeploymentsResource", "AsyncDeploymentsResource"]
|
|
36
35
|
|
|
@@ -68,12 +67,13 @@ class DeploymentsResource(SyncAPIResource):
|
|
|
68
67
|
image: str,
|
|
69
68
|
listening_port: int,
|
|
70
69
|
name: str,
|
|
70
|
+
api_keys: List[str] | NotGiven = NOT_GIVEN,
|
|
71
71
|
auth_enabled: bool | NotGiven = NOT_GIVEN,
|
|
72
72
|
command: Optional[List[str]] | NotGiven = NOT_GIVEN,
|
|
73
73
|
credentials_name: Optional[str] | NotGiven = NOT_GIVEN,
|
|
74
74
|
description: Optional[str] | NotGiven = NOT_GIVEN,
|
|
75
75
|
envs: Dict[str, str] | NotGiven = NOT_GIVEN,
|
|
76
|
-
ingress_opts: Optional[
|
|
76
|
+
ingress_opts: Optional[deployment_create_params.IngressOpts] | NotGiven = NOT_GIVEN,
|
|
77
77
|
logging: Optional[deployment_create_params.Logging] | NotGiven = NOT_GIVEN,
|
|
78
78
|
probes: Optional[deployment_create_params.Probes] | NotGiven = NOT_GIVEN,
|
|
79
79
|
api_timeout: Optional[int] | NotGiven = NOT_GIVEN,
|
|
@@ -103,9 +103,15 @@ class DeploymentsResource(SyncAPIResource):
|
|
|
103
103
|
|
|
104
104
|
name: Inference instance name.
|
|
105
105
|
|
|
106
|
+
api_keys: List of API keys for the inference instance. Multiple keys can be attached to
|
|
107
|
+
one deployment.If `auth_enabled` and `api_keys` are both specified, a
|
|
108
|
+
ValidationError will be raised.
|
|
109
|
+
|
|
106
110
|
auth_enabled: Set to `true` to enable API key authentication for the inference instance.
|
|
107
111
|
`"Authorization": "Bearer ****\\**"` or `"X-Api-Key": "****\\**"` header is required
|
|
108
|
-
for the requests to the instance if enabled
|
|
112
|
+
for the requests to the instance if enabled. This field is deprecated and will
|
|
113
|
+
be removed in the future. Use `api_keys` field instead.If `auth_enabled` and
|
|
114
|
+
`api_keys` are both specified, a ValidationError will be raised.
|
|
109
115
|
|
|
110
116
|
command: Command to be executed when running a container from an image.
|
|
111
117
|
|
|
@@ -148,6 +154,7 @@ class DeploymentsResource(SyncAPIResource):
|
|
|
148
154
|
"image": image,
|
|
149
155
|
"listening_port": listening_port,
|
|
150
156
|
"name": name,
|
|
157
|
+
"api_keys": api_keys,
|
|
151
158
|
"auth_enabled": auth_enabled,
|
|
152
159
|
"command": command,
|
|
153
160
|
"credentials_name": credentials_name,
|
|
@@ -171,6 +178,7 @@ class DeploymentsResource(SyncAPIResource):
|
|
|
171
178
|
deployment_name: str,
|
|
172
179
|
*,
|
|
173
180
|
project_id: int | None = None,
|
|
181
|
+
api_keys: Optional[List[str]] | NotGiven = NOT_GIVEN,
|
|
174
182
|
auth_enabled: bool | NotGiven = NOT_GIVEN,
|
|
175
183
|
command: Optional[List[str]] | NotGiven = NOT_GIVEN,
|
|
176
184
|
containers: Optional[Iterable[deployment_update_params.Container]] | NotGiven = NOT_GIVEN,
|
|
@@ -179,7 +187,7 @@ class DeploymentsResource(SyncAPIResource):
|
|
|
179
187
|
envs: Optional[Dict[str, str]] | NotGiven = NOT_GIVEN,
|
|
180
188
|
flavor_name: str | NotGiven = NOT_GIVEN,
|
|
181
189
|
image: Optional[str] | NotGiven = NOT_GIVEN,
|
|
182
|
-
ingress_opts: Optional[
|
|
190
|
+
ingress_opts: Optional[deployment_update_params.IngressOpts] | NotGiven = NOT_GIVEN,
|
|
183
191
|
listening_port: Optional[int] | NotGiven = NOT_GIVEN,
|
|
184
192
|
logging: Optional[deployment_update_params.Logging] | NotGiven = NOT_GIVEN,
|
|
185
193
|
probes: Optional[deployment_update_params.Probes] | NotGiven = NOT_GIVEN,
|
|
@@ -199,9 +207,16 @@ class DeploymentsResource(SyncAPIResource):
|
|
|
199
207
|
|
|
200
208
|
deployment_name: Inference instance name.
|
|
201
209
|
|
|
210
|
+
api_keys: List of API keys for the inference instance. Multiple keys can be attached to
|
|
211
|
+
one deployment.If `auth_enabled` and `api_keys` are both specified, a
|
|
212
|
+
ValidationError will be raised.If `[]` is provided, the API keys will be removed
|
|
213
|
+
and auth will be disabled on the deployment.
|
|
214
|
+
|
|
202
215
|
auth_enabled: Set to `true` to enable API key authentication for the inference instance.
|
|
203
216
|
`"Authorization": "Bearer ****\\**"` or `"X-Api-Key": "****\\**"` header is required
|
|
204
|
-
for the requests to the instance if enabled
|
|
217
|
+
for the requests to the instance if enabled. This field is deprecated and will
|
|
218
|
+
be removed in the future. Use `api_keys` field instead.If `auth_enabled` and
|
|
219
|
+
`api_keys` are both specified, a ValidationError will be raised.
|
|
205
220
|
|
|
206
221
|
command: Command to be executed when running a container from an image.
|
|
207
222
|
|
|
@@ -250,6 +265,7 @@ class DeploymentsResource(SyncAPIResource):
|
|
|
250
265
|
f"/cloud/v3/inference/{project_id}/deployments/{deployment_name}",
|
|
251
266
|
body=maybe_transform(
|
|
252
267
|
{
|
|
268
|
+
"api_keys": api_keys,
|
|
253
269
|
"auth_enabled": auth_enabled,
|
|
254
270
|
"command": command,
|
|
255
271
|
"containers": containers,
|
|
@@ -284,7 +300,7 @@ class DeploymentsResource(SyncAPIResource):
|
|
|
284
300
|
extra_query: Query | None = None,
|
|
285
301
|
extra_body: Body | None = None,
|
|
286
302
|
timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
|
|
287
|
-
) -> SyncOffsetPage[
|
|
303
|
+
) -> SyncOffsetPage[InferenceDeployment]:
|
|
288
304
|
"""List inference deployments
|
|
289
305
|
|
|
290
306
|
Args:
|
|
@@ -309,7 +325,7 @@ class DeploymentsResource(SyncAPIResource):
|
|
|
309
325
|
project_id = self._client._get_cloud_project_id_path_param()
|
|
310
326
|
return self._get_api_list(
|
|
311
327
|
f"/cloud/v3/inference/{project_id}/deployments",
|
|
312
|
-
page=SyncOffsetPage[
|
|
328
|
+
page=SyncOffsetPage[InferenceDeployment],
|
|
313
329
|
options=make_request_options(
|
|
314
330
|
extra_headers=extra_headers,
|
|
315
331
|
extra_query=extra_query,
|
|
@@ -323,7 +339,7 @@ class DeploymentsResource(SyncAPIResource):
|
|
|
323
339
|
deployment_list_params.DeploymentListParams,
|
|
324
340
|
),
|
|
325
341
|
),
|
|
326
|
-
model=
|
|
342
|
+
model=InferenceDeployment,
|
|
327
343
|
)
|
|
328
344
|
|
|
329
345
|
def delete(
|
|
@@ -377,7 +393,7 @@ class DeploymentsResource(SyncAPIResource):
|
|
|
377
393
|
extra_query: Query | None = None,
|
|
378
394
|
extra_body: Body | None = None,
|
|
379
395
|
timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
|
|
380
|
-
) ->
|
|
396
|
+
) -> InferenceDeployment:
|
|
381
397
|
"""
|
|
382
398
|
Get inference deployment
|
|
383
399
|
|
|
@@ -403,7 +419,7 @@ class DeploymentsResource(SyncAPIResource):
|
|
|
403
419
|
options=make_request_options(
|
|
404
420
|
extra_headers=extra_headers, extra_query=extra_query, extra_body=extra_body, timeout=timeout
|
|
405
421
|
),
|
|
406
|
-
cast_to=
|
|
422
|
+
cast_to=InferenceDeployment,
|
|
407
423
|
)
|
|
408
424
|
|
|
409
425
|
def get_api_key(
|
|
@@ -417,7 +433,7 @@ class DeploymentsResource(SyncAPIResource):
|
|
|
417
433
|
extra_query: Query | None = None,
|
|
418
434
|
extra_body: Body | None = None,
|
|
419
435
|
timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
|
|
420
|
-
) ->
|
|
436
|
+
) -> InferenceDeploymentAPIKey:
|
|
421
437
|
"""
|
|
422
438
|
Get inference deployment API key
|
|
423
439
|
|
|
@@ -443,7 +459,7 @@ class DeploymentsResource(SyncAPIResource):
|
|
|
443
459
|
options=make_request_options(
|
|
444
460
|
extra_headers=extra_headers, extra_query=extra_query, extra_body=extra_body, timeout=timeout
|
|
445
461
|
),
|
|
446
|
-
cast_to=
|
|
462
|
+
cast_to=InferenceDeploymentAPIKey,
|
|
447
463
|
)
|
|
448
464
|
|
|
449
465
|
def start(
|
|
@@ -556,7 +572,7 @@ class DeploymentsResource(SyncAPIResource):
|
|
|
556
572
|
credentials_name: Optional[str] | NotGiven = NOT_GIVEN,
|
|
557
573
|
description: Optional[str] | NotGiven = NOT_GIVEN,
|
|
558
574
|
envs: Dict[str, str] | NotGiven = NOT_GIVEN,
|
|
559
|
-
ingress_opts: Optional[
|
|
575
|
+
ingress_opts: Optional[deployment_create_params.IngressOpts] | NotGiven = NOT_GIVEN,
|
|
560
576
|
logging: Optional[deployment_create_params.Logging] | NotGiven = NOT_GIVEN,
|
|
561
577
|
probes: Optional[deployment_create_params.Probes] | NotGiven = NOT_GIVEN,
|
|
562
578
|
api_timeout: Optional[int] | NotGiven = NOT_GIVEN,
|
|
@@ -567,7 +583,7 @@ class DeploymentsResource(SyncAPIResource):
|
|
|
567
583
|
extra_headers: Headers | None = None,
|
|
568
584
|
extra_query: Query | None = None,
|
|
569
585
|
extra_body: Body | None = None,
|
|
570
|
-
) ->
|
|
586
|
+
) -> InferenceDeployment:
|
|
571
587
|
response = self.create(
|
|
572
588
|
project_id=project_id,
|
|
573
589
|
containers=containers,
|
|
@@ -596,7 +612,11 @@ class DeploymentsResource(SyncAPIResource):
|
|
|
596
612
|
extra_headers=extra_headers,
|
|
597
613
|
polling_interval_seconds=polling_interval_seconds,
|
|
598
614
|
)
|
|
599
|
-
if
|
|
615
|
+
if (
|
|
616
|
+
not task.created_resources
|
|
617
|
+
or not task.created_resources.inference_instances
|
|
618
|
+
or len(task.created_resources.inference_instances) != 1
|
|
619
|
+
):
|
|
600
620
|
raise ValueError(f"Expected exactly one resource to be created in a task")
|
|
601
621
|
return self.get(
|
|
602
622
|
deployment_name=task.created_resources.inference_instances[0],
|
|
@@ -618,7 +638,7 @@ class DeploymentsResource(SyncAPIResource):
|
|
|
618
638
|
envs: Optional[Dict[str, str]] | NotGiven = NOT_GIVEN,
|
|
619
639
|
flavor_name: str | NotGiven = NOT_GIVEN,
|
|
620
640
|
image: Optional[str] | NotGiven = NOT_GIVEN,
|
|
621
|
-
ingress_opts: Optional[
|
|
641
|
+
ingress_opts: Optional[deployment_update_params.IngressOpts] | NotGiven = NOT_GIVEN,
|
|
622
642
|
listening_port: Optional[int] | NotGiven = NOT_GIVEN,
|
|
623
643
|
logging: Optional[deployment_update_params.Logging] | NotGiven = NOT_GIVEN,
|
|
624
644
|
probes: Optional[deployment_update_params.Probes] | NotGiven = NOT_GIVEN,
|
|
@@ -630,7 +650,7 @@ class DeploymentsResource(SyncAPIResource):
|
|
|
630
650
|
extra_headers: Headers | None = None,
|
|
631
651
|
extra_query: Query | None = None,
|
|
632
652
|
extra_body: Body | None = None,
|
|
633
|
-
) ->
|
|
653
|
+
) -> InferenceDeployment:
|
|
634
654
|
"""
|
|
635
655
|
Update inference deployment and poll for the result. Only the first task will be polled. If you need to poll more tasks, use the `tasks.poll` method.
|
|
636
656
|
"""
|
|
@@ -735,12 +755,13 @@ class AsyncDeploymentsResource(AsyncAPIResource):
|
|
|
735
755
|
image: str,
|
|
736
756
|
listening_port: int,
|
|
737
757
|
name: str,
|
|
758
|
+
api_keys: List[str] | NotGiven = NOT_GIVEN,
|
|
738
759
|
auth_enabled: bool | NotGiven = NOT_GIVEN,
|
|
739
760
|
command: Optional[List[str]] | NotGiven = NOT_GIVEN,
|
|
740
761
|
credentials_name: Optional[str] | NotGiven = NOT_GIVEN,
|
|
741
762
|
description: Optional[str] | NotGiven = NOT_GIVEN,
|
|
742
763
|
envs: Dict[str, str] | NotGiven = NOT_GIVEN,
|
|
743
|
-
ingress_opts: Optional[
|
|
764
|
+
ingress_opts: Optional[deployment_create_params.IngressOpts] | NotGiven = NOT_GIVEN,
|
|
744
765
|
logging: Optional[deployment_create_params.Logging] | NotGiven = NOT_GIVEN,
|
|
745
766
|
probes: Optional[deployment_create_params.Probes] | NotGiven = NOT_GIVEN,
|
|
746
767
|
api_timeout: Optional[int] | NotGiven = NOT_GIVEN,
|
|
@@ -770,9 +791,15 @@ class AsyncDeploymentsResource(AsyncAPIResource):
|
|
|
770
791
|
|
|
771
792
|
name: Inference instance name.
|
|
772
793
|
|
|
794
|
+
api_keys: List of API keys for the inference instance. Multiple keys can be attached to
|
|
795
|
+
one deployment.If `auth_enabled` and `api_keys` are both specified, a
|
|
796
|
+
ValidationError will be raised.
|
|
797
|
+
|
|
773
798
|
auth_enabled: Set to `true` to enable API key authentication for the inference instance.
|
|
774
799
|
`"Authorization": "Bearer ****\\**"` or `"X-Api-Key": "****\\**"` header is required
|
|
775
|
-
for the requests to the instance if enabled
|
|
800
|
+
for the requests to the instance if enabled. This field is deprecated and will
|
|
801
|
+
be removed in the future. Use `api_keys` field instead.If `auth_enabled` and
|
|
802
|
+
`api_keys` are both specified, a ValidationError will be raised.
|
|
776
803
|
|
|
777
804
|
command: Command to be executed when running a container from an image.
|
|
778
805
|
|
|
@@ -815,6 +842,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
|
|
|
815
842
|
"image": image,
|
|
816
843
|
"listening_port": listening_port,
|
|
817
844
|
"name": name,
|
|
845
|
+
"api_keys": api_keys,
|
|
818
846
|
"auth_enabled": auth_enabled,
|
|
819
847
|
"command": command,
|
|
820
848
|
"credentials_name": credentials_name,
|
|
@@ -838,6 +866,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
|
|
|
838
866
|
deployment_name: str,
|
|
839
867
|
*,
|
|
840
868
|
project_id: int | None = None,
|
|
869
|
+
api_keys: Optional[List[str]] | NotGiven = NOT_GIVEN,
|
|
841
870
|
auth_enabled: bool | NotGiven = NOT_GIVEN,
|
|
842
871
|
command: Optional[List[str]] | NotGiven = NOT_GIVEN,
|
|
843
872
|
containers: Optional[Iterable[deployment_update_params.Container]] | NotGiven = NOT_GIVEN,
|
|
@@ -846,7 +875,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
|
|
|
846
875
|
envs: Optional[Dict[str, str]] | NotGiven = NOT_GIVEN,
|
|
847
876
|
flavor_name: str | NotGiven = NOT_GIVEN,
|
|
848
877
|
image: Optional[str] | NotGiven = NOT_GIVEN,
|
|
849
|
-
ingress_opts: Optional[
|
|
878
|
+
ingress_opts: Optional[deployment_update_params.IngressOpts] | NotGiven = NOT_GIVEN,
|
|
850
879
|
listening_port: Optional[int] | NotGiven = NOT_GIVEN,
|
|
851
880
|
logging: Optional[deployment_update_params.Logging] | NotGiven = NOT_GIVEN,
|
|
852
881
|
probes: Optional[deployment_update_params.Probes] | NotGiven = NOT_GIVEN,
|
|
@@ -866,9 +895,16 @@ class AsyncDeploymentsResource(AsyncAPIResource):
|
|
|
866
895
|
|
|
867
896
|
deployment_name: Inference instance name.
|
|
868
897
|
|
|
898
|
+
api_keys: List of API keys for the inference instance. Multiple keys can be attached to
|
|
899
|
+
one deployment.If `auth_enabled` and `api_keys` are both specified, a
|
|
900
|
+
ValidationError will be raised.If `[]` is provided, the API keys will be removed
|
|
901
|
+
and auth will be disabled on the deployment.
|
|
902
|
+
|
|
869
903
|
auth_enabled: Set to `true` to enable API key authentication for the inference instance.
|
|
870
904
|
`"Authorization": "Bearer ****\\**"` or `"X-Api-Key": "****\\**"` header is required
|
|
871
|
-
for the requests to the instance if enabled
|
|
905
|
+
for the requests to the instance if enabled. This field is deprecated and will
|
|
906
|
+
be removed in the future. Use `api_keys` field instead.If `auth_enabled` and
|
|
907
|
+
`api_keys` are both specified, a ValidationError will be raised.
|
|
872
908
|
|
|
873
909
|
command: Command to be executed when running a container from an image.
|
|
874
910
|
|
|
@@ -917,6 +953,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
|
|
|
917
953
|
f"/cloud/v3/inference/{project_id}/deployments/{deployment_name}",
|
|
918
954
|
body=await async_maybe_transform(
|
|
919
955
|
{
|
|
956
|
+
"api_keys": api_keys,
|
|
920
957
|
"auth_enabled": auth_enabled,
|
|
921
958
|
"command": command,
|
|
922
959
|
"containers": containers,
|
|
@@ -951,7 +988,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
|
|
|
951
988
|
extra_query: Query | None = None,
|
|
952
989
|
extra_body: Body | None = None,
|
|
953
990
|
timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
|
|
954
|
-
) -> AsyncPaginator[
|
|
991
|
+
) -> AsyncPaginator[InferenceDeployment, AsyncOffsetPage[InferenceDeployment]]:
|
|
955
992
|
"""List inference deployments
|
|
956
993
|
|
|
957
994
|
Args:
|
|
@@ -976,7 +1013,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
|
|
|
976
1013
|
project_id = self._client._get_cloud_project_id_path_param()
|
|
977
1014
|
return self._get_api_list(
|
|
978
1015
|
f"/cloud/v3/inference/{project_id}/deployments",
|
|
979
|
-
page=AsyncOffsetPage[
|
|
1016
|
+
page=AsyncOffsetPage[InferenceDeployment],
|
|
980
1017
|
options=make_request_options(
|
|
981
1018
|
extra_headers=extra_headers,
|
|
982
1019
|
extra_query=extra_query,
|
|
@@ -990,7 +1027,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
|
|
|
990
1027
|
deployment_list_params.DeploymentListParams,
|
|
991
1028
|
),
|
|
992
1029
|
),
|
|
993
|
-
model=
|
|
1030
|
+
model=InferenceDeployment,
|
|
994
1031
|
)
|
|
995
1032
|
|
|
996
1033
|
async def delete(
|
|
@@ -1044,7 +1081,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
|
|
|
1044
1081
|
extra_query: Query | None = None,
|
|
1045
1082
|
extra_body: Body | None = None,
|
|
1046
1083
|
timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
|
|
1047
|
-
) ->
|
|
1084
|
+
) -> InferenceDeployment:
|
|
1048
1085
|
"""
|
|
1049
1086
|
Get inference deployment
|
|
1050
1087
|
|
|
@@ -1070,7 +1107,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
|
|
|
1070
1107
|
options=make_request_options(
|
|
1071
1108
|
extra_headers=extra_headers, extra_query=extra_query, extra_body=extra_body, timeout=timeout
|
|
1072
1109
|
),
|
|
1073
|
-
cast_to=
|
|
1110
|
+
cast_to=InferenceDeployment,
|
|
1074
1111
|
)
|
|
1075
1112
|
|
|
1076
1113
|
async def get_api_key(
|
|
@@ -1084,7 +1121,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
|
|
|
1084
1121
|
extra_query: Query | None = None,
|
|
1085
1122
|
extra_body: Body | None = None,
|
|
1086
1123
|
timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
|
|
1087
|
-
) ->
|
|
1124
|
+
) -> InferenceDeploymentAPIKey:
|
|
1088
1125
|
"""
|
|
1089
1126
|
Get inference deployment API key
|
|
1090
1127
|
|
|
@@ -1110,7 +1147,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
|
|
|
1110
1147
|
options=make_request_options(
|
|
1111
1148
|
extra_headers=extra_headers, extra_query=extra_query, extra_body=extra_body, timeout=timeout
|
|
1112
1149
|
),
|
|
1113
|
-
cast_to=
|
|
1150
|
+
cast_to=InferenceDeploymentAPIKey,
|
|
1114
1151
|
)
|
|
1115
1152
|
|
|
1116
1153
|
async def start(
|
|
@@ -1223,7 +1260,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
|
|
|
1223
1260
|
credentials_name: Optional[str] | NotGiven = NOT_GIVEN,
|
|
1224
1261
|
description: Optional[str] | NotGiven = NOT_GIVEN,
|
|
1225
1262
|
envs: Dict[str, str] | NotGiven = NOT_GIVEN,
|
|
1226
|
-
ingress_opts: Optional[
|
|
1263
|
+
ingress_opts: Optional[deployment_create_params.IngressOpts] | NotGiven = NOT_GIVEN,
|
|
1227
1264
|
logging: Optional[deployment_create_params.Logging] | NotGiven = NOT_GIVEN,
|
|
1228
1265
|
probes: Optional[deployment_create_params.Probes] | NotGiven = NOT_GIVEN,
|
|
1229
1266
|
api_timeout: Optional[int] | NotGiven = NOT_GIVEN,
|
|
@@ -1234,7 +1271,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
|
|
|
1234
1271
|
extra_headers: Headers | None = None,
|
|
1235
1272
|
extra_query: Query | None = None,
|
|
1236
1273
|
extra_body: Body | None = None,
|
|
1237
|
-
) ->
|
|
1274
|
+
) -> InferenceDeployment:
|
|
1238
1275
|
response = await self.create(
|
|
1239
1276
|
project_id=project_id,
|
|
1240
1277
|
containers=containers,
|
|
@@ -1263,7 +1300,11 @@ class AsyncDeploymentsResource(AsyncAPIResource):
|
|
|
1263
1300
|
extra_headers=extra_headers,
|
|
1264
1301
|
polling_interval_seconds=polling_interval_seconds,
|
|
1265
1302
|
)
|
|
1266
|
-
if
|
|
1303
|
+
if (
|
|
1304
|
+
not task.created_resources
|
|
1305
|
+
or not task.created_resources.inference_instances
|
|
1306
|
+
or len(task.created_resources.inference_instances) != 1
|
|
1307
|
+
):
|
|
1267
1308
|
raise ValueError(f"Expected exactly one resource to be created in a task")
|
|
1268
1309
|
return await self.get(
|
|
1269
1310
|
deployment_name=task.created_resources.inference_instances[0],
|
|
@@ -1285,7 +1326,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
|
|
|
1285
1326
|
envs: Optional[Dict[str, str]] | NotGiven = NOT_GIVEN,
|
|
1286
1327
|
flavor_name: str | NotGiven = NOT_GIVEN,
|
|
1287
1328
|
image: Optional[str] | NotGiven = NOT_GIVEN,
|
|
1288
|
-
ingress_opts: Optional[
|
|
1329
|
+
ingress_opts: Optional[deployment_update_params.IngressOpts] | NotGiven = NOT_GIVEN,
|
|
1289
1330
|
listening_port: Optional[int] | NotGiven = NOT_GIVEN,
|
|
1290
1331
|
logging: Optional[deployment_update_params.Logging] | NotGiven = NOT_GIVEN,
|
|
1291
1332
|
probes: Optional[deployment_update_params.Probes] | NotGiven = NOT_GIVEN,
|
|
@@ -1297,7 +1338,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
|
|
|
1297
1338
|
extra_headers: Headers | None = None,
|
|
1298
1339
|
extra_query: Query | None = None,
|
|
1299
1340
|
extra_body: Body | None = None,
|
|
1300
|
-
) ->
|
|
1341
|
+
) -> InferenceDeployment:
|
|
1301
1342
|
"""
|
|
1302
1343
|
Update inference deployment and poll for the result. Only the first task will be polled. If you need to poll more tasks, use the `tasks.poll` method.
|
|
1303
1344
|
"""
|
|
@@ -20,7 +20,7 @@ from ....._response import (
|
|
|
20
20
|
from .....pagination import SyncOffsetPage, AsyncOffsetPage
|
|
21
21
|
from ....._base_client import AsyncPaginator, make_request_options
|
|
22
22
|
from .....types.cloud.inference.deployments import log_list_params
|
|
23
|
-
from .....types.cloud.inference.
|
|
23
|
+
from .....types.cloud.inference.deployments.inference_deployment_log import InferenceDeploymentLog
|
|
24
24
|
|
|
25
25
|
__all__ = ["LogsResource", "AsyncLogsResource"]
|
|
26
26
|
|
|
@@ -60,7 +60,7 @@ class LogsResource(SyncAPIResource):
|
|
|
60
60
|
extra_query: Query | None = None,
|
|
61
61
|
extra_body: Body | None = None,
|
|
62
62
|
timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
|
|
63
|
-
) -> SyncOffsetPage[
|
|
63
|
+
) -> SyncOffsetPage[InferenceDeploymentLog]:
|
|
64
64
|
"""
|
|
65
65
|
Get inference deployment logs
|
|
66
66
|
|
|
@@ -92,7 +92,7 @@ class LogsResource(SyncAPIResource):
|
|
|
92
92
|
raise ValueError(f"Expected a non-empty value for `deployment_name` but received {deployment_name!r}")
|
|
93
93
|
return self._get_api_list(
|
|
94
94
|
f"/cloud/v3/inference/{project_id}/deployments/{deployment_name}/logs",
|
|
95
|
-
page=SyncOffsetPage[
|
|
95
|
+
page=SyncOffsetPage[InferenceDeploymentLog],
|
|
96
96
|
options=make_request_options(
|
|
97
97
|
extra_headers=extra_headers,
|
|
98
98
|
extra_query=extra_query,
|
|
@@ -108,7 +108,7 @@ class LogsResource(SyncAPIResource):
|
|
|
108
108
|
log_list_params.LogListParams,
|
|
109
109
|
),
|
|
110
110
|
),
|
|
111
|
-
model=
|
|
111
|
+
model=InferenceDeploymentLog,
|
|
112
112
|
)
|
|
113
113
|
|
|
114
114
|
|
|
@@ -147,7 +147,7 @@ class AsyncLogsResource(AsyncAPIResource):
|
|
|
147
147
|
extra_query: Query | None = None,
|
|
148
148
|
extra_body: Body | None = None,
|
|
149
149
|
timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
|
|
150
|
-
) -> AsyncPaginator[
|
|
150
|
+
) -> AsyncPaginator[InferenceDeploymentLog, AsyncOffsetPage[InferenceDeploymentLog]]:
|
|
151
151
|
"""
|
|
152
152
|
Get inference deployment logs
|
|
153
153
|
|
|
@@ -179,7 +179,7 @@ class AsyncLogsResource(AsyncAPIResource):
|
|
|
179
179
|
raise ValueError(f"Expected a non-empty value for `deployment_name` but received {deployment_name!r}")
|
|
180
180
|
return self._get_api_list(
|
|
181
181
|
f"/cloud/v3/inference/{project_id}/deployments/{deployment_name}/logs",
|
|
182
|
-
page=AsyncOffsetPage[
|
|
182
|
+
page=AsyncOffsetPage[InferenceDeploymentLog],
|
|
183
183
|
options=make_request_options(
|
|
184
184
|
extra_headers=extra_headers,
|
|
185
185
|
extra_query=extra_query,
|
|
@@ -195,7 +195,7 @@ class AsyncLogsResource(AsyncAPIResource):
|
|
|
195
195
|
log_list_params.LogListParams,
|
|
196
196
|
),
|
|
197
197
|
),
|
|
198
|
-
model=
|
|
198
|
+
model=InferenceDeploymentLog,
|
|
199
199
|
)
|
|
200
200
|
|
|
201
201
|
|
|
@@ -54,7 +54,7 @@ from .deployments.deployments import (
|
|
|
54
54
|
DeploymentsResourceWithStreamingResponse,
|
|
55
55
|
AsyncDeploymentsResourceWithStreamingResponse,
|
|
56
56
|
)
|
|
57
|
-
from ....types.cloud.
|
|
57
|
+
from ....types.cloud.inference_region_capacity_list import InferenceRegionCapacityList
|
|
58
58
|
|
|
59
59
|
__all__ = ["InferenceResource", "AsyncInferenceResource"]
|
|
60
60
|
|
|
@@ -108,14 +108,14 @@ class InferenceResource(SyncAPIResource):
|
|
|
108
108
|
extra_query: Query | None = None,
|
|
109
109
|
extra_body: Body | None = None,
|
|
110
110
|
timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
|
|
111
|
-
) ->
|
|
111
|
+
) -> InferenceRegionCapacityList:
|
|
112
112
|
"""Get inference capacity by region"""
|
|
113
113
|
return self._get(
|
|
114
114
|
"/cloud/v3/inference/capacity",
|
|
115
115
|
options=make_request_options(
|
|
116
116
|
extra_headers=extra_headers, extra_query=extra_query, extra_body=extra_body, timeout=timeout
|
|
117
117
|
),
|
|
118
|
-
cast_to=
|
|
118
|
+
cast_to=InferenceRegionCapacityList,
|
|
119
119
|
)
|
|
120
120
|
|
|
121
121
|
|
|
@@ -168,14 +168,14 @@ class AsyncInferenceResource(AsyncAPIResource):
|
|
|
168
168
|
extra_query: Query | None = None,
|
|
169
169
|
extra_body: Body | None = None,
|
|
170
170
|
timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
|
|
171
|
-
) ->
|
|
171
|
+
) -> InferenceRegionCapacityList:
|
|
172
172
|
"""Get inference capacity by region"""
|
|
173
173
|
return await self._get(
|
|
174
174
|
"/cloud/v3/inference/capacity",
|
|
175
175
|
options=make_request_options(
|
|
176
176
|
extra_headers=extra_headers, extra_query=extra_query, extra_body=extra_body, timeout=timeout
|
|
177
177
|
),
|
|
178
|
-
cast_to=
|
|
178
|
+
cast_to=InferenceRegionCapacityList,
|
|
179
179
|
)
|
|
180
180
|
|
|
181
181
|
|
|
@@ -2,6 +2,8 @@
|
|
|
2
2
|
|
|
3
3
|
from __future__ import annotations
|
|
4
4
|
|
|
5
|
+
from typing_extensions import Literal
|
|
6
|
+
|
|
5
7
|
import httpx
|
|
6
8
|
|
|
7
9
|
from ...._types import NOT_GIVEN, Body, Query, Headers, NotGiven
|
|
@@ -16,9 +18,8 @@ from ...._response import (
|
|
|
16
18
|
)
|
|
17
19
|
from ....pagination import SyncOffsetPage, AsyncOffsetPage
|
|
18
20
|
from ...._base_client import AsyncPaginator, make_request_options
|
|
19
|
-
from ....types.cloud.inference import
|
|
20
|
-
from ....types.cloud.inference.
|
|
21
|
-
from ....types.cloud.inference.mlcatalog_order_by_choices import MlcatalogOrderByChoices
|
|
21
|
+
from ....types.cloud.inference import model_list_params
|
|
22
|
+
from ....types.cloud.inference.inference_model import InferenceModel
|
|
22
23
|
|
|
23
24
|
__all__ = ["ModelsResource", "AsyncModelsResource"]
|
|
24
25
|
|
|
@@ -48,14 +49,14 @@ class ModelsResource(SyncAPIResource):
|
|
|
48
49
|
*,
|
|
49
50
|
limit: int | NotGiven = NOT_GIVEN,
|
|
50
51
|
offset: int | NotGiven = NOT_GIVEN,
|
|
51
|
-
order_by:
|
|
52
|
+
order_by: Literal["name.asc", "name.desc"] | NotGiven = NOT_GIVEN,
|
|
52
53
|
# Use the following arguments if you need to pass additional parameters to the API that aren't available via kwargs.
|
|
53
54
|
# The extra values given here take precedence over values defined on the client or passed to this method.
|
|
54
55
|
extra_headers: Headers | None = None,
|
|
55
56
|
extra_query: Query | None = None,
|
|
56
57
|
extra_body: Body | None = None,
|
|
57
58
|
timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
|
|
58
|
-
) -> SyncOffsetPage[
|
|
59
|
+
) -> SyncOffsetPage[InferenceModel]:
|
|
59
60
|
"""List models from catalog
|
|
60
61
|
|
|
61
62
|
Args:
|
|
@@ -78,7 +79,7 @@ class ModelsResource(SyncAPIResource):
|
|
|
78
79
|
"""
|
|
79
80
|
return self._get_api_list(
|
|
80
81
|
"/cloud/v3/inference/models",
|
|
81
|
-
page=SyncOffsetPage[
|
|
82
|
+
page=SyncOffsetPage[InferenceModel],
|
|
82
83
|
options=make_request_options(
|
|
83
84
|
extra_headers=extra_headers,
|
|
84
85
|
extra_query=extra_query,
|
|
@@ -93,7 +94,7 @@ class ModelsResource(SyncAPIResource):
|
|
|
93
94
|
model_list_params.ModelListParams,
|
|
94
95
|
),
|
|
95
96
|
),
|
|
96
|
-
model=
|
|
97
|
+
model=InferenceModel,
|
|
97
98
|
)
|
|
98
99
|
|
|
99
100
|
def get(
|
|
@@ -106,7 +107,7 @@ class ModelsResource(SyncAPIResource):
|
|
|
106
107
|
extra_query: Query | None = None,
|
|
107
108
|
extra_body: Body | None = None,
|
|
108
109
|
timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
|
|
109
|
-
) ->
|
|
110
|
+
) -> InferenceModel:
|
|
110
111
|
"""
|
|
111
112
|
Get model from catalog
|
|
112
113
|
|
|
@@ -128,7 +129,7 @@ class ModelsResource(SyncAPIResource):
|
|
|
128
129
|
options=make_request_options(
|
|
129
130
|
extra_headers=extra_headers, extra_query=extra_query, extra_body=extra_body, timeout=timeout
|
|
130
131
|
),
|
|
131
|
-
cast_to=
|
|
132
|
+
cast_to=InferenceModel,
|
|
132
133
|
)
|
|
133
134
|
|
|
134
135
|
|
|
@@ -157,14 +158,14 @@ class AsyncModelsResource(AsyncAPIResource):
|
|
|
157
158
|
*,
|
|
158
159
|
limit: int | NotGiven = NOT_GIVEN,
|
|
159
160
|
offset: int | NotGiven = NOT_GIVEN,
|
|
160
|
-
order_by:
|
|
161
|
+
order_by: Literal["name.asc", "name.desc"] | NotGiven = NOT_GIVEN,
|
|
161
162
|
# Use the following arguments if you need to pass additional parameters to the API that aren't available via kwargs.
|
|
162
163
|
# The extra values given here take precedence over values defined on the client or passed to this method.
|
|
163
164
|
extra_headers: Headers | None = None,
|
|
164
165
|
extra_query: Query | None = None,
|
|
165
166
|
extra_body: Body | None = None,
|
|
166
167
|
timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
|
|
167
|
-
) -> AsyncPaginator[
|
|
168
|
+
) -> AsyncPaginator[InferenceModel, AsyncOffsetPage[InferenceModel]]:
|
|
168
169
|
"""List models from catalog
|
|
169
170
|
|
|
170
171
|
Args:
|
|
@@ -187,7 +188,7 @@ class AsyncModelsResource(AsyncAPIResource):
|
|
|
187
188
|
"""
|
|
188
189
|
return self._get_api_list(
|
|
189
190
|
"/cloud/v3/inference/models",
|
|
190
|
-
page=AsyncOffsetPage[
|
|
191
|
+
page=AsyncOffsetPage[InferenceModel],
|
|
191
192
|
options=make_request_options(
|
|
192
193
|
extra_headers=extra_headers,
|
|
193
194
|
extra_query=extra_query,
|
|
@@ -202,7 +203,7 @@ class AsyncModelsResource(AsyncAPIResource):
|
|
|
202
203
|
model_list_params.ModelListParams,
|
|
203
204
|
),
|
|
204
205
|
),
|
|
205
|
-
model=
|
|
206
|
+
model=InferenceModel,
|
|
206
207
|
)
|
|
207
208
|
|
|
208
209
|
async def get(
|
|
@@ -215,7 +216,7 @@ class AsyncModelsResource(AsyncAPIResource):
|
|
|
215
216
|
extra_query: Query | None = None,
|
|
216
217
|
extra_body: Body | None = None,
|
|
217
218
|
timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
|
|
218
|
-
) ->
|
|
219
|
+
) -> InferenceModel:
|
|
219
220
|
"""
|
|
220
221
|
Get model from catalog
|
|
221
222
|
|
|
@@ -237,7 +238,7 @@ class AsyncModelsResource(AsyncAPIResource):
|
|
|
237
238
|
options=make_request_options(
|
|
238
239
|
extra_headers=extra_headers, extra_query=extra_query, extra_body=extra_body, timeout=timeout
|
|
239
240
|
),
|
|
240
|
-
cast_to=
|
|
241
|
+
cast_to=InferenceModel,
|
|
241
242
|
)
|
|
242
243
|
|
|
243
244
|
|