gcore-0.3.0-py3-none-any.whl → gcore-0.5.0-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of gcore might be problematic. Click here for more details.

Files changed (226):
  1. gcore/__init__.py +2 -1
  2. gcore/_base_client.py +31 -2
  3. gcore/_client.py +18 -0
  4. gcore/_constants.py +2 -2
  5. gcore/_models.py +8 -5
  6. gcore/_version.py +1 -1
  7. gcore/pagination.py +252 -1
  8. gcore/resources/__init__.py +28 -0
  9. gcore/resources/cloud/baremetal/flavors.py +11 -137
  10. gcore/resources/cloud/baremetal/images.py +10 -12
  11. gcore/resources/cloud/baremetal/servers.py +33 -30
  12. gcore/resources/cloud/billing_reservations.py +2 -2
  13. gcore/resources/cloud/file_shares/file_shares.py +7 -8
  14. gcore/resources/cloud/floating_ips.py +7 -12
  15. gcore/resources/cloud/gpu_baremetal_clusters/gpu_baremetal_clusters.py +33 -22
  16. gcore/resources/cloud/gpu_baremetal_clusters/images.py +9 -10
  17. gcore/resources/cloud/gpu_baremetal_clusters/interfaces.py +2 -2
  18. gcore/resources/cloud/gpu_baremetal_clusters/servers.py +8 -4
  19. gcore/resources/cloud/inference/deployments/deployments.py +76 -35
  20. gcore/resources/cloud/inference/deployments/logs.py +7 -7
  21. gcore/resources/cloud/inference/inference.py +5 -5
  22. gcore/resources/cloud/inference/models.py +16 -15
  23. gcore/resources/cloud/inference/registry_credentials.py +18 -18
  24. gcore/resources/cloud/inference/secrets.py +12 -13
  25. gcore/resources/cloud/instances/flavors.py +9 -233
  26. gcore/resources/cloud/instances/images.py +47 -37
  27. gcore/resources/cloud/instances/instances.py +49 -34
  28. gcore/resources/cloud/instances/interfaces.py +2 -2
  29. gcore/resources/cloud/ip_ranges.py +34 -2
  30. gcore/resources/cloud/load_balancers/l7_policies/l7_policies.py +10 -2
  31. gcore/resources/cloud/load_balancers/listeners.py +17 -8
  32. gcore/resources/cloud/load_balancers/load_balancers.py +73 -21
  33. gcore/resources/cloud/load_balancers/metrics.py +2 -2
  34. gcore/resources/cloud/load_balancers/pools/health_monitors.py +2 -2
  35. gcore/resources/cloud/load_balancers/pools/members.py +6 -2
  36. gcore/resources/cloud/networks/networks.py +81 -17
  37. gcore/resources/cloud/networks/routers.py +18 -18
  38. gcore/resources/cloud/networks/subnets.py +51 -11
  39. gcore/resources/cloud/projects.py +38 -24
  40. gcore/resources/cloud/quotas/quotas.py +6 -6
  41. gcore/resources/cloud/quotas/requests.py +8 -8
  42. gcore/resources/cloud/registries/artifacts.py +4 -4
  43. gcore/resources/cloud/registries/registries.py +14 -16
  44. gcore/resources/cloud/registries/repositories.py +4 -4
  45. gcore/resources/cloud/registries/tags.py +2 -2
  46. gcore/resources/cloud/registries/users.py +21 -22
  47. gcore/resources/cloud/reserved_fixed_ips/reserved_fixed_ips.py +20 -20
  48. gcore/resources/cloud/reserved_fixed_ips/vip.py +10 -10
  49. gcore/resources/cloud/secrets.py +14 -224
  50. gcore/resources/cloud/security_groups/rules.py +6 -6
  51. gcore/resources/cloud/security_groups/security_groups.py +70 -31
  52. gcore/resources/cloud/tasks.py +34 -32
  53. gcore/resources/cloud/users/role_assignments.py +12 -14
  54. gcore/resources/cloud/volumes.py +139 -49
  55. gcore/resources/fastedge/__init__.py +103 -0
  56. gcore/resources/fastedge/apps/__init__.py +33 -0
  57. gcore/resources/fastedge/apps/apps.py +932 -0
  58. gcore/resources/fastedge/apps/logs.py +248 -0
  59. gcore/resources/fastedge/binaries.py +286 -0
  60. gcore/resources/fastedge/fastedge.py +327 -0
  61. gcore/resources/fastedge/kv_stores.py +523 -0
  62. gcore/resources/fastedge/secrets.py +687 -0
  63. gcore/resources/fastedge/statistics.py +347 -0
  64. gcore/resources/fastedge/templates.py +652 -0
  65. gcore/resources/iam/__init__.py +47 -0
  66. gcore/resources/iam/api_tokens.py +521 -0
  67. gcore/resources/iam/iam.py +199 -0
  68. gcore/resources/iam/users.py +642 -0
  69. gcore/resources/waap/__init__.py +0 -14
  70. gcore/resources/waap/waap.py +0 -32
  71. gcore/types/cloud/__init__.py +2 -28
  72. gcore/types/cloud/baremetal/__init__.py +0 -1
  73. gcore/types/cloud/baremetal/image_list_params.py +1 -5
  74. gcore/types/cloud/baremetal/server_create_params.py +5 -9
  75. gcore/types/cloud/baremetal/server_list_params.py +1 -5
  76. gcore/types/cloud/ddos_profile.py +9 -3
  77. gcore/types/cloud/file_share_create_params.py +3 -5
  78. gcore/types/cloud/floating_ip_create_params.py +2 -4
  79. gcore/types/cloud/floating_ip_list_params.py +1 -5
  80. gcore/types/cloud/gpu_baremetal_cluster_create_params.py +3 -4
  81. gcore/types/cloud/gpu_baremetal_clusters/image_upload_params.py +2 -4
  82. gcore/types/cloud/health_monitor.py +6 -1
  83. gcore/types/cloud/inference/__init__.py +12 -8
  84. gcore/types/cloud/inference/deployment_create_params.py +224 -7
  85. gcore/types/cloud/inference/deployment_update_params.py +24 -3
  86. gcore/types/cloud/inference/deployments/__init__.py +1 -0
  87. gcore/types/cloud/inference/{inference_log.py → deployments/inference_deployment_log.py} +3 -3
  88. gcore/types/cloud/inference/inference_deployment.py +266 -0
  89. gcore/types/cloud/inference/{inference_apikey_secret.py → inference_deployment_api_key.py} +2 -2
  90. gcore/types/cloud/inference/{mlcatalog_model_card.py → inference_model.py} +2 -2
  91. gcore/types/cloud/inference/{inference_registry_credential.py → inference_registry_credentials.py} +2 -2
  92. gcore/types/cloud/inference/{inference_registry_credential_full.py → inference_registry_credentials_create.py} +2 -2
  93. gcore/types/cloud/inference/inference_secret.py +10 -3
  94. gcore/types/cloud/inference/model_list_params.py +2 -4
  95. gcore/types/cloud/{container_probe.py → inference/probe.py} +9 -9
  96. gcore/types/cloud/{container_probe_config.py → inference/probe_config.py} +5 -5
  97. gcore/types/cloud/{container_probe_exec.py → inference/probe_exec.py} +3 -3
  98. gcore/types/cloud/{container_probe_http_get.py → inference/probe_http_get.py} +3 -3
  99. gcore/types/cloud/{container_probe_tcp_socket.py → inference/probe_tcp_socket.py} +3 -3
  100. gcore/types/cloud/inference/secret_create_params.py +10 -4
  101. gcore/types/cloud/inference/secret_replace_params.py +10 -4
  102. gcore/types/cloud/{region_capacity.py → inference_region_capacity.py} +10 -3
  103. gcore/types/cloud/{region_capacity_list.py → inference_region_capacity_list.py} +4 -4
  104. gcore/types/cloud/instance_create_params.py +8 -9
  105. gcore/types/cloud/instance_list_params.py +1 -5
  106. gcore/types/cloud/instances/__init__.py +0 -2
  107. gcore/types/cloud/instances/image_create_from_volume_params.py +2 -4
  108. gcore/types/cloud/instances/image_list_params.py +1 -5
  109. gcore/types/cloud/instances/image_upload_params.py +2 -4
  110. gcore/types/cloud/load_balancer_create_params.py +8 -4
  111. gcore/types/cloud/load_balancer_list_params.py +1 -5
  112. gcore/types/cloud/load_balancer_update_params.py +24 -0
  113. gcore/types/cloud/load_balancers/pool_create_params.py +6 -1
  114. gcore/types/cloud/load_balancers/pool_update_params.py +6 -1
  115. gcore/types/cloud/load_balancers/pools/member_add_params.py +6 -1
  116. gcore/types/cloud/member.py +6 -1
  117. gcore/types/cloud/network_create_params.py +2 -3
  118. gcore/types/cloud/network_list_params.py +4 -5
  119. gcore/types/cloud/network_update_params.py +28 -2
  120. gcore/types/cloud/networks/router_list_params.py +2 -2
  121. gcore/types/cloud/networks/subnet_create_params.py +2 -3
  122. gcore/types/cloud/networks/subnet_list_params.py +1 -5
  123. gcore/types/cloud/networks/subnet_update_params.py +25 -0
  124. gcore/types/cloud/registries/__init__.py +1 -0
  125. gcore/types/cloud/registries/user_refresh_secret_response.py +31 -0
  126. gcore/types/cloud/reserved_fixed_ip_list_params.py +2 -2
  127. gcore/types/cloud/security_group_list_params.py +3 -7
  128. gcore/types/cloud/security_group_update_params.py +25 -0
  129. gcore/types/cloud/tag_update_map_param.py +2 -2
  130. gcore/types/cloud/task_list_params.py +15 -14
  131. gcore/types/cloud/volume_list_params.py +1 -5
  132. gcore/types/cloud/volume_update_params.py +29 -3
  133. gcore/types/fastedge/__init__.py +48 -0
  134. gcore/types/fastedge/app.py +81 -0
  135. gcore/types/fastedge/app_create_params.py +56 -0
  136. gcore/types/fastedge/app_list_params.py +50 -0
  137. gcore/types/fastedge/app_param.py +56 -0
  138. gcore/types/fastedge/app_replace_params.py +17 -0
  139. gcore/types/fastedge/app_short.py +60 -0
  140. gcore/types/fastedge/app_update_params.py +56 -0
  141. gcore/types/fastedge/apps/__init__.py +6 -0
  142. gcore/types/fastedge/apps/log.py +28 -0
  143. gcore/types/fastedge/apps/log_list_params.py +37 -0
  144. gcore/types/fastedge/binary.py +40 -0
  145. gcore/types/fastedge/binary_list_response.py +12 -0
  146. gcore/types/fastedge/binary_short.py +32 -0
  147. gcore/types/fastedge/call_status.py +24 -0
  148. gcore/types/fastedge/client.py +57 -0
  149. gcore/types/fastedge/duration_stats.py +30 -0
  150. gcore/types/fastedge/kv_store.py +33 -0
  151. gcore/types/fastedge/kv_store_create_params.py +23 -0
  152. gcore/types/fastedge/kv_store_get_response.py +10 -0
  153. gcore/types/fastedge/kv_store_list_params.py +12 -0
  154. gcore/types/fastedge/kv_store_list_response.py +15 -0
  155. gcore/types/fastedge/kv_store_replace_params.py +23 -0
  156. gcore/types/fastedge/kv_store_short.py +19 -0
  157. gcore/types/fastedge/kv_store_stats.py +26 -0
  158. gcore/types/fastedge/secret.py +29 -0
  159. gcore/types/fastedge/secret_create_params.py +27 -0
  160. gcore/types/fastedge/secret_create_response.py +12 -0
  161. gcore/types/fastedge/secret_delete_params.py +12 -0
  162. gcore/types/fastedge/secret_list_params.py +15 -0
  163. gcore/types/{cloud → fastedge}/secret_list_response.py +2 -6
  164. gcore/types/fastedge/secret_replace_params.py +27 -0
  165. gcore/types/fastedge/secret_short.py +21 -0
  166. gcore/types/fastedge/secret_update_params.py +27 -0
  167. gcore/types/fastedge/statistic_get_call_series_params.py +28 -0
  168. gcore/types/fastedge/statistic_get_call_series_response.py +12 -0
  169. gcore/types/fastedge/statistic_get_duration_series_params.py +28 -0
  170. gcore/types/fastedge/statistic_get_duration_series_response.py +12 -0
  171. gcore/types/fastedge/template.py +31 -0
  172. gcore/types/fastedge/template_create_params.py +30 -0
  173. gcore/types/fastedge/template_delete_params.py +12 -0
  174. gcore/types/fastedge/template_list_params.py +25 -0
  175. gcore/types/fastedge/template_parameter.py +22 -0
  176. gcore/types/fastedge/template_parameter_param.py +21 -0
  177. gcore/types/fastedge/template_replace_params.py +30 -0
  178. gcore/types/fastedge/template_short.py +27 -0
  179. gcore/types/iam/__init__.py +17 -0
  180. gcore/types/iam/account_overview.py +488 -0
  181. gcore/types/iam/api_token.py +78 -0
  182. gcore/types/iam/api_token_create.py +15 -0
  183. gcore/types/iam/api_token_create_params.py +42 -0
  184. gcore/types/iam/api_token_list.py +81 -0
  185. gcore/types/iam/api_token_list_params.py +41 -0
  186. gcore/types/iam/user.py +86 -0
  187. gcore/types/iam/user_detailed.py +104 -0
  188. gcore/types/iam/user_invite.py +15 -0
  189. gcore/types/iam/user_invite_params.py +37 -0
  190. gcore/types/iam/user_list_params.py +15 -0
  191. gcore/types/iam/user_update.py +104 -0
  192. gcore/types/iam/user_update_params.py +52 -0
  193. gcore/types/waap/__init__.py +0 -1
  194. gcore/types/waap/domains/custom_rule_create_params.py +7 -3
  195. gcore/types/waap/domains/custom_rule_update_params.py +7 -3
  196. gcore/types/waap/waap_custom_rule.py +7 -3
  197. {gcore-0.3.0.dist-info → gcore-0.5.0.dist-info}/METADATA +44 -5
  198. {gcore-0.3.0.dist-info → gcore-0.5.0.dist-info}/RECORD +200 -151
  199. gcore/resources/waap/clients.py +0 -135
  200. gcore/types/cloud/aws_iam_data.py +0 -13
  201. gcore/types/cloud/aws_iam_data_param.py +0 -15
  202. gcore/types/cloud/baremetal/flavor_list_suitable_params.py +0 -22
  203. gcore/types/cloud/capacity.py +0 -13
  204. gcore/types/cloud/container_probe_config_create_param.py +0 -17
  205. gcore/types/cloud/container_probe_create_param.py +0 -38
  206. gcore/types/cloud/container_probe_exec_create_param.py +0 -13
  207. gcore/types/cloud/container_probe_http_get_create_param.py +0 -25
  208. gcore/types/cloud/container_probe_tcp_socket_create_param.py +0 -12
  209. gcore/types/cloud/container_scale.py +0 -25
  210. gcore/types/cloud/container_scale_trigger_rate.py +0 -13
  211. gcore/types/cloud/container_scale_trigger_sqs.py +0 -33
  212. gcore/types/cloud/container_scale_trigger_threshold.py +0 -10
  213. gcore/types/cloud/container_scale_triggers.py +0 -36
  214. gcore/types/cloud/deploy_status.py +0 -13
  215. gcore/types/cloud/inference/container.py +0 -26
  216. gcore/types/cloud/inference/inference.py +0 -95
  217. gcore/types/cloud/inference/mlcatalog_order_by_choices.py +0 -7
  218. gcore/types/cloud/inference_probes.py +0 -19
  219. gcore/types/cloud/ingress_opts_out.py +0 -16
  220. gcore/types/cloud/ingress_opts_param.py +0 -18
  221. gcore/types/cloud/instances/flavor_list_for_resize_params.py +0 -16
  222. gcore/types/cloud/instances/flavor_list_suitable_params.py +0 -59
  223. gcore/types/cloud/secret_create_params.py +0 -66
  224. gcore/types/waap/client_me_response.py +0 -34
  225. {gcore-0.3.0.dist-info → gcore-0.5.0.dist-info}/WHEEL +0 -0
  226. {gcore-0.3.0.dist-info → gcore-0.5.0.dist-info}/licenses/LICENSE +0 -0
@@ -28,9 +28,8 @@ from .....pagination import SyncOffsetPage, AsyncOffsetPage
28
28
  from ....._base_client import AsyncPaginator, make_request_options
29
29
  from .....types.cloud.inference import deployment_list_params, deployment_create_params, deployment_update_params
30
30
  from .....types.cloud.task_id_list import TaskIDList
31
- from .....types.cloud.ingress_opts_param import IngressOptsParam
32
- from .....types.cloud.inference.inference import Inference
33
- from .....types.cloud.inference.inference_apikey_secret import InferenceApikeySecret
31
+ from .....types.cloud.inference.inference_deployment import InferenceDeployment
32
+ from .....types.cloud.inference.inference_deployment_api_key import InferenceDeploymentAPIKey
34
33
 
35
34
  __all__ = ["DeploymentsResource", "AsyncDeploymentsResource"]
36
35
 
@@ -68,12 +67,13 @@ class DeploymentsResource(SyncAPIResource):
68
67
  image: str,
69
68
  listening_port: int,
70
69
  name: str,
70
+ api_keys: List[str] | NotGiven = NOT_GIVEN,
71
71
  auth_enabled: bool | NotGiven = NOT_GIVEN,
72
72
  command: Optional[List[str]] | NotGiven = NOT_GIVEN,
73
73
  credentials_name: Optional[str] | NotGiven = NOT_GIVEN,
74
74
  description: Optional[str] | NotGiven = NOT_GIVEN,
75
75
  envs: Dict[str, str] | NotGiven = NOT_GIVEN,
76
- ingress_opts: Optional[IngressOptsParam] | NotGiven = NOT_GIVEN,
76
+ ingress_opts: Optional[deployment_create_params.IngressOpts] | NotGiven = NOT_GIVEN,
77
77
  logging: Optional[deployment_create_params.Logging] | NotGiven = NOT_GIVEN,
78
78
  probes: Optional[deployment_create_params.Probes] | NotGiven = NOT_GIVEN,
79
79
  api_timeout: Optional[int] | NotGiven = NOT_GIVEN,
@@ -103,9 +103,15 @@ class DeploymentsResource(SyncAPIResource):
103
103
 
104
104
  name: Inference instance name.
105
105
 
106
+ api_keys: List of API keys for the inference instance. Multiple keys can be attached to
107
+ one deployment.If `auth_enabled` and `api_keys` are both specified, a
108
+ ValidationError will be raised.
109
+
106
110
  auth_enabled: Set to `true` to enable API key authentication for the inference instance.
107
111
  `"Authorization": "Bearer ****\\**"` or `"X-Api-Key": "****\\**"` header is required
108
- for the requests to the instance if enabled
112
+ for the requests to the instance if enabled. This field is deprecated and will
113
+ be removed in the future. Use `api_keys` field instead.If `auth_enabled` and
114
+ `api_keys` are both specified, a ValidationError will be raised.
109
115
 
110
116
  command: Command to be executed when running a container from an image.
111
117
 
@@ -148,6 +154,7 @@ class DeploymentsResource(SyncAPIResource):
148
154
  "image": image,
149
155
  "listening_port": listening_port,
150
156
  "name": name,
157
+ "api_keys": api_keys,
151
158
  "auth_enabled": auth_enabled,
152
159
  "command": command,
153
160
  "credentials_name": credentials_name,
@@ -171,6 +178,7 @@ class DeploymentsResource(SyncAPIResource):
171
178
  deployment_name: str,
172
179
  *,
173
180
  project_id: int | None = None,
181
+ api_keys: Optional[List[str]] | NotGiven = NOT_GIVEN,
174
182
  auth_enabled: bool | NotGiven = NOT_GIVEN,
175
183
  command: Optional[List[str]] | NotGiven = NOT_GIVEN,
176
184
  containers: Optional[Iterable[deployment_update_params.Container]] | NotGiven = NOT_GIVEN,
@@ -179,7 +187,7 @@ class DeploymentsResource(SyncAPIResource):
179
187
  envs: Optional[Dict[str, str]] | NotGiven = NOT_GIVEN,
180
188
  flavor_name: str | NotGiven = NOT_GIVEN,
181
189
  image: Optional[str] | NotGiven = NOT_GIVEN,
182
- ingress_opts: Optional[IngressOptsParam] | NotGiven = NOT_GIVEN,
190
+ ingress_opts: Optional[deployment_update_params.IngressOpts] | NotGiven = NOT_GIVEN,
183
191
  listening_port: Optional[int] | NotGiven = NOT_GIVEN,
184
192
  logging: Optional[deployment_update_params.Logging] | NotGiven = NOT_GIVEN,
185
193
  probes: Optional[deployment_update_params.Probes] | NotGiven = NOT_GIVEN,
@@ -199,9 +207,16 @@ class DeploymentsResource(SyncAPIResource):
199
207
 
200
208
  deployment_name: Inference instance name.
201
209
 
210
+ api_keys: List of API keys for the inference instance. Multiple keys can be attached to
211
+ one deployment.If `auth_enabled` and `api_keys` are both specified, a
212
+ ValidationError will be raised.If `[]` is provided, the API keys will be removed
213
+ and auth will be disabled on the deployment.
214
+
202
215
  auth_enabled: Set to `true` to enable API key authentication for the inference instance.
203
216
  `"Authorization": "Bearer ****\\**"` or `"X-Api-Key": "****\\**"` header is required
204
- for the requests to the instance if enabled
217
+ for the requests to the instance if enabled. This field is deprecated and will
218
+ be removed in the future. Use `api_keys` field instead.If `auth_enabled` and
219
+ `api_keys` are both specified, a ValidationError will be raised.
205
220
 
206
221
  command: Command to be executed when running a container from an image.
207
222
 
@@ -250,6 +265,7 @@ class DeploymentsResource(SyncAPIResource):
250
265
  f"/cloud/v3/inference/{project_id}/deployments/{deployment_name}",
251
266
  body=maybe_transform(
252
267
  {
268
+ "api_keys": api_keys,
253
269
  "auth_enabled": auth_enabled,
254
270
  "command": command,
255
271
  "containers": containers,
@@ -284,7 +300,7 @@ class DeploymentsResource(SyncAPIResource):
284
300
  extra_query: Query | None = None,
285
301
  extra_body: Body | None = None,
286
302
  timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
287
- ) -> SyncOffsetPage[Inference]:
303
+ ) -> SyncOffsetPage[InferenceDeployment]:
288
304
  """List inference deployments
289
305
 
290
306
  Args:
@@ -309,7 +325,7 @@ class DeploymentsResource(SyncAPIResource):
309
325
  project_id = self._client._get_cloud_project_id_path_param()
310
326
  return self._get_api_list(
311
327
  f"/cloud/v3/inference/{project_id}/deployments",
312
- page=SyncOffsetPage[Inference],
328
+ page=SyncOffsetPage[InferenceDeployment],
313
329
  options=make_request_options(
314
330
  extra_headers=extra_headers,
315
331
  extra_query=extra_query,
@@ -323,7 +339,7 @@ class DeploymentsResource(SyncAPIResource):
323
339
  deployment_list_params.DeploymentListParams,
324
340
  ),
325
341
  ),
326
- model=Inference,
342
+ model=InferenceDeployment,
327
343
  )
328
344
 
329
345
  def delete(
@@ -377,7 +393,7 @@ class DeploymentsResource(SyncAPIResource):
377
393
  extra_query: Query | None = None,
378
394
  extra_body: Body | None = None,
379
395
  timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
380
- ) -> Inference:
396
+ ) -> InferenceDeployment:
381
397
  """
382
398
  Get inference deployment
383
399
 
@@ -403,7 +419,7 @@ class DeploymentsResource(SyncAPIResource):
403
419
  options=make_request_options(
404
420
  extra_headers=extra_headers, extra_query=extra_query, extra_body=extra_body, timeout=timeout
405
421
  ),
406
- cast_to=Inference,
422
+ cast_to=InferenceDeployment,
407
423
  )
408
424
 
409
425
  def get_api_key(
@@ -417,7 +433,7 @@ class DeploymentsResource(SyncAPIResource):
417
433
  extra_query: Query | None = None,
418
434
  extra_body: Body | None = None,
419
435
  timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
420
- ) -> InferenceApikeySecret:
436
+ ) -> InferenceDeploymentAPIKey:
421
437
  """
422
438
  Get inference deployment API key
423
439
 
@@ -443,7 +459,7 @@ class DeploymentsResource(SyncAPIResource):
443
459
  options=make_request_options(
444
460
  extra_headers=extra_headers, extra_query=extra_query, extra_body=extra_body, timeout=timeout
445
461
  ),
446
- cast_to=InferenceApikeySecret,
462
+ cast_to=InferenceDeploymentAPIKey,
447
463
  )
448
464
 
449
465
  def start(
@@ -556,7 +572,7 @@ class DeploymentsResource(SyncAPIResource):
556
572
  credentials_name: Optional[str] | NotGiven = NOT_GIVEN,
557
573
  description: Optional[str] | NotGiven = NOT_GIVEN,
558
574
  envs: Dict[str, str] | NotGiven = NOT_GIVEN,
559
- ingress_opts: Optional[IngressOptsParam] | NotGiven = NOT_GIVEN,
575
+ ingress_opts: Optional[deployment_create_params.IngressOpts] | NotGiven = NOT_GIVEN,
560
576
  logging: Optional[deployment_create_params.Logging] | NotGiven = NOT_GIVEN,
561
577
  probes: Optional[deployment_create_params.Probes] | NotGiven = NOT_GIVEN,
562
578
  api_timeout: Optional[int] | NotGiven = NOT_GIVEN,
@@ -567,7 +583,7 @@ class DeploymentsResource(SyncAPIResource):
567
583
  extra_headers: Headers | None = None,
568
584
  extra_query: Query | None = None,
569
585
  extra_body: Body | None = None,
570
- ) -> Inference:
586
+ ) -> InferenceDeployment:
571
587
  response = self.create(
572
588
  project_id=project_id,
573
589
  containers=containers,
@@ -596,7 +612,11 @@ class DeploymentsResource(SyncAPIResource):
596
612
  extra_headers=extra_headers,
597
613
  polling_interval_seconds=polling_interval_seconds,
598
614
  )
599
- if not task.created_resources or not task.created_resources.inference_instances or len(task.created_resources.inference_instances) != 1:
615
+ if (
616
+ not task.created_resources
617
+ or not task.created_resources.inference_instances
618
+ or len(task.created_resources.inference_instances) != 1
619
+ ):
600
620
  raise ValueError(f"Expected exactly one resource to be created in a task")
601
621
  return self.get(
602
622
  deployment_name=task.created_resources.inference_instances[0],
@@ -618,7 +638,7 @@ class DeploymentsResource(SyncAPIResource):
618
638
  envs: Optional[Dict[str, str]] | NotGiven = NOT_GIVEN,
619
639
  flavor_name: str | NotGiven = NOT_GIVEN,
620
640
  image: Optional[str] | NotGiven = NOT_GIVEN,
621
- ingress_opts: Optional[IngressOptsParam] | NotGiven = NOT_GIVEN,
641
+ ingress_opts: Optional[deployment_update_params.IngressOpts] | NotGiven = NOT_GIVEN,
622
642
  listening_port: Optional[int] | NotGiven = NOT_GIVEN,
623
643
  logging: Optional[deployment_update_params.Logging] | NotGiven = NOT_GIVEN,
624
644
  probes: Optional[deployment_update_params.Probes] | NotGiven = NOT_GIVEN,
@@ -630,7 +650,7 @@ class DeploymentsResource(SyncAPIResource):
630
650
  extra_headers: Headers | None = None,
631
651
  extra_query: Query | None = None,
632
652
  extra_body: Body | None = None,
633
- ) -> Inference:
653
+ ) -> InferenceDeployment:
634
654
  """
635
655
  Update inference deployment and poll for the result. Only the first task will be polled. If you need to poll more tasks, use the `tasks.poll` method.
636
656
  """
@@ -735,12 +755,13 @@ class AsyncDeploymentsResource(AsyncAPIResource):
735
755
  image: str,
736
756
  listening_port: int,
737
757
  name: str,
758
+ api_keys: List[str] | NotGiven = NOT_GIVEN,
738
759
  auth_enabled: bool | NotGiven = NOT_GIVEN,
739
760
  command: Optional[List[str]] | NotGiven = NOT_GIVEN,
740
761
  credentials_name: Optional[str] | NotGiven = NOT_GIVEN,
741
762
  description: Optional[str] | NotGiven = NOT_GIVEN,
742
763
  envs: Dict[str, str] | NotGiven = NOT_GIVEN,
743
- ingress_opts: Optional[IngressOptsParam] | NotGiven = NOT_GIVEN,
764
+ ingress_opts: Optional[deployment_create_params.IngressOpts] | NotGiven = NOT_GIVEN,
744
765
  logging: Optional[deployment_create_params.Logging] | NotGiven = NOT_GIVEN,
745
766
  probes: Optional[deployment_create_params.Probes] | NotGiven = NOT_GIVEN,
746
767
  api_timeout: Optional[int] | NotGiven = NOT_GIVEN,
@@ -770,9 +791,15 @@ class AsyncDeploymentsResource(AsyncAPIResource):
770
791
 
771
792
  name: Inference instance name.
772
793
 
794
+ api_keys: List of API keys for the inference instance. Multiple keys can be attached to
795
+ one deployment.If `auth_enabled` and `api_keys` are both specified, a
796
+ ValidationError will be raised.
797
+
773
798
  auth_enabled: Set to `true` to enable API key authentication for the inference instance.
774
799
  `"Authorization": "Bearer ****\\**"` or `"X-Api-Key": "****\\**"` header is required
775
- for the requests to the instance if enabled
800
+ for the requests to the instance if enabled. This field is deprecated and will
801
+ be removed in the future. Use `api_keys` field instead.If `auth_enabled` and
802
+ `api_keys` are both specified, a ValidationError will be raised.
776
803
 
777
804
  command: Command to be executed when running a container from an image.
778
805
 
@@ -815,6 +842,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
815
842
  "image": image,
816
843
  "listening_port": listening_port,
817
844
  "name": name,
845
+ "api_keys": api_keys,
818
846
  "auth_enabled": auth_enabled,
819
847
  "command": command,
820
848
  "credentials_name": credentials_name,
@@ -838,6 +866,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
838
866
  deployment_name: str,
839
867
  *,
840
868
  project_id: int | None = None,
869
+ api_keys: Optional[List[str]] | NotGiven = NOT_GIVEN,
841
870
  auth_enabled: bool | NotGiven = NOT_GIVEN,
842
871
  command: Optional[List[str]] | NotGiven = NOT_GIVEN,
843
872
  containers: Optional[Iterable[deployment_update_params.Container]] | NotGiven = NOT_GIVEN,
@@ -846,7 +875,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
846
875
  envs: Optional[Dict[str, str]] | NotGiven = NOT_GIVEN,
847
876
  flavor_name: str | NotGiven = NOT_GIVEN,
848
877
  image: Optional[str] | NotGiven = NOT_GIVEN,
849
- ingress_opts: Optional[IngressOptsParam] | NotGiven = NOT_GIVEN,
878
+ ingress_opts: Optional[deployment_update_params.IngressOpts] | NotGiven = NOT_GIVEN,
850
879
  listening_port: Optional[int] | NotGiven = NOT_GIVEN,
851
880
  logging: Optional[deployment_update_params.Logging] | NotGiven = NOT_GIVEN,
852
881
  probes: Optional[deployment_update_params.Probes] | NotGiven = NOT_GIVEN,
@@ -866,9 +895,16 @@ class AsyncDeploymentsResource(AsyncAPIResource):
866
895
 
867
896
  deployment_name: Inference instance name.
868
897
 
898
+ api_keys: List of API keys for the inference instance. Multiple keys can be attached to
899
+ one deployment.If `auth_enabled` and `api_keys` are both specified, a
900
+ ValidationError will be raised.If `[]` is provided, the API keys will be removed
901
+ and auth will be disabled on the deployment.
902
+
869
903
  auth_enabled: Set to `true` to enable API key authentication for the inference instance.
870
904
  `"Authorization": "Bearer ****\\**"` or `"X-Api-Key": "****\\**"` header is required
871
- for the requests to the instance if enabled
905
+ for the requests to the instance if enabled. This field is deprecated and will
906
+ be removed in the future. Use `api_keys` field instead.If `auth_enabled` and
907
+ `api_keys` are both specified, a ValidationError will be raised.
872
908
 
873
909
  command: Command to be executed when running a container from an image.
874
910
 
@@ -917,6 +953,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
917
953
  f"/cloud/v3/inference/{project_id}/deployments/{deployment_name}",
918
954
  body=await async_maybe_transform(
919
955
  {
956
+ "api_keys": api_keys,
920
957
  "auth_enabled": auth_enabled,
921
958
  "command": command,
922
959
  "containers": containers,
@@ -951,7 +988,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
951
988
  extra_query: Query | None = None,
952
989
  extra_body: Body | None = None,
953
990
  timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
954
- ) -> AsyncPaginator[Inference, AsyncOffsetPage[Inference]]:
991
+ ) -> AsyncPaginator[InferenceDeployment, AsyncOffsetPage[InferenceDeployment]]:
955
992
  """List inference deployments
956
993
 
957
994
  Args:
@@ -976,7 +1013,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
976
1013
  project_id = self._client._get_cloud_project_id_path_param()
977
1014
  return self._get_api_list(
978
1015
  f"/cloud/v3/inference/{project_id}/deployments",
979
- page=AsyncOffsetPage[Inference],
1016
+ page=AsyncOffsetPage[InferenceDeployment],
980
1017
  options=make_request_options(
981
1018
  extra_headers=extra_headers,
982
1019
  extra_query=extra_query,
@@ -990,7 +1027,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
990
1027
  deployment_list_params.DeploymentListParams,
991
1028
  ),
992
1029
  ),
993
- model=Inference,
1030
+ model=InferenceDeployment,
994
1031
  )
995
1032
 
996
1033
  async def delete(
@@ -1044,7 +1081,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
1044
1081
  extra_query: Query | None = None,
1045
1082
  extra_body: Body | None = None,
1046
1083
  timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
1047
- ) -> Inference:
1084
+ ) -> InferenceDeployment:
1048
1085
  """
1049
1086
  Get inference deployment
1050
1087
 
@@ -1070,7 +1107,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
1070
1107
  options=make_request_options(
1071
1108
  extra_headers=extra_headers, extra_query=extra_query, extra_body=extra_body, timeout=timeout
1072
1109
  ),
1073
- cast_to=Inference,
1110
+ cast_to=InferenceDeployment,
1074
1111
  )
1075
1112
 
1076
1113
  async def get_api_key(
@@ -1084,7 +1121,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
1084
1121
  extra_query: Query | None = None,
1085
1122
  extra_body: Body | None = None,
1086
1123
  timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
1087
- ) -> InferenceApikeySecret:
1124
+ ) -> InferenceDeploymentAPIKey:
1088
1125
  """
1089
1126
  Get inference deployment API key
1090
1127
 
@@ -1110,7 +1147,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
1110
1147
  options=make_request_options(
1111
1148
  extra_headers=extra_headers, extra_query=extra_query, extra_body=extra_body, timeout=timeout
1112
1149
  ),
1113
- cast_to=InferenceApikeySecret,
1150
+ cast_to=InferenceDeploymentAPIKey,
1114
1151
  )
1115
1152
 
1116
1153
  async def start(
@@ -1223,7 +1260,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
1223
1260
  credentials_name: Optional[str] | NotGiven = NOT_GIVEN,
1224
1261
  description: Optional[str] | NotGiven = NOT_GIVEN,
1225
1262
  envs: Dict[str, str] | NotGiven = NOT_GIVEN,
1226
- ingress_opts: Optional[IngressOptsParam] | NotGiven = NOT_GIVEN,
1263
+ ingress_opts: Optional[deployment_create_params.IngressOpts] | NotGiven = NOT_GIVEN,
1227
1264
  logging: Optional[deployment_create_params.Logging] | NotGiven = NOT_GIVEN,
1228
1265
  probes: Optional[deployment_create_params.Probes] | NotGiven = NOT_GIVEN,
1229
1266
  api_timeout: Optional[int] | NotGiven = NOT_GIVEN,
@@ -1234,7 +1271,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
1234
1271
  extra_headers: Headers | None = None,
1235
1272
  extra_query: Query | None = None,
1236
1273
  extra_body: Body | None = None,
1237
- ) -> Inference:
1274
+ ) -> InferenceDeployment:
1238
1275
  response = await self.create(
1239
1276
  project_id=project_id,
1240
1277
  containers=containers,
@@ -1263,7 +1300,11 @@ class AsyncDeploymentsResource(AsyncAPIResource):
1263
1300
  extra_headers=extra_headers,
1264
1301
  polling_interval_seconds=polling_interval_seconds,
1265
1302
  )
1266
- if not task.created_resources or not task.created_resources.inference_instances or len(task.created_resources.inference_instances) != 1:
1303
+ if (
1304
+ not task.created_resources
1305
+ or not task.created_resources.inference_instances
1306
+ or len(task.created_resources.inference_instances) != 1
1307
+ ):
1267
1308
  raise ValueError(f"Expected exactly one resource to be created in a task")
1268
1309
  return await self.get(
1269
1310
  deployment_name=task.created_resources.inference_instances[0],
@@ -1285,7 +1326,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
1285
1326
  envs: Optional[Dict[str, str]] | NotGiven = NOT_GIVEN,
1286
1327
  flavor_name: str | NotGiven = NOT_GIVEN,
1287
1328
  image: Optional[str] | NotGiven = NOT_GIVEN,
1288
- ingress_opts: Optional[IngressOptsParam] | NotGiven = NOT_GIVEN,
1329
+ ingress_opts: Optional[deployment_update_params.IngressOpts] | NotGiven = NOT_GIVEN,
1289
1330
  listening_port: Optional[int] | NotGiven = NOT_GIVEN,
1290
1331
  logging: Optional[deployment_update_params.Logging] | NotGiven = NOT_GIVEN,
1291
1332
  probes: Optional[deployment_update_params.Probes] | NotGiven = NOT_GIVEN,
@@ -1297,7 +1338,7 @@ class AsyncDeploymentsResource(AsyncAPIResource):
1297
1338
  extra_headers: Headers | None = None,
1298
1339
  extra_query: Query | None = None,
1299
1340
  extra_body: Body | None = None,
1300
- ) -> Inference:
1341
+ ) -> InferenceDeployment:
1301
1342
  """
1302
1343
  Update inference deployment and poll for the result. Only the first task will be polled. If you need to poll more tasks, use the `tasks.poll` method.
1303
1344
  """
@@ -20,7 +20,7 @@ from ....._response import (
20
20
  from .....pagination import SyncOffsetPage, AsyncOffsetPage
21
21
  from ....._base_client import AsyncPaginator, make_request_options
22
22
  from .....types.cloud.inference.deployments import log_list_params
23
- from .....types.cloud.inference.inference_log import InferenceLog
23
+ from .....types.cloud.inference.deployments.inference_deployment_log import InferenceDeploymentLog
24
24
 
25
25
  __all__ = ["LogsResource", "AsyncLogsResource"]
26
26
 
@@ -60,7 +60,7 @@ class LogsResource(SyncAPIResource):
60
60
  extra_query: Query | None = None,
61
61
  extra_body: Body | None = None,
62
62
  timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
63
- ) -> SyncOffsetPage[InferenceLog]:
63
+ ) -> SyncOffsetPage[InferenceDeploymentLog]:
64
64
  """
65
65
  Get inference deployment logs
66
66
 
@@ -92,7 +92,7 @@ class LogsResource(SyncAPIResource):
92
92
  raise ValueError(f"Expected a non-empty value for `deployment_name` but received {deployment_name!r}")
93
93
  return self._get_api_list(
94
94
  f"/cloud/v3/inference/{project_id}/deployments/{deployment_name}/logs",
95
- page=SyncOffsetPage[InferenceLog],
95
+ page=SyncOffsetPage[InferenceDeploymentLog],
96
96
  options=make_request_options(
97
97
  extra_headers=extra_headers,
98
98
  extra_query=extra_query,
@@ -108,7 +108,7 @@ class LogsResource(SyncAPIResource):
108
108
  log_list_params.LogListParams,
109
109
  ),
110
110
  ),
111
- model=InferenceLog,
111
+ model=InferenceDeploymentLog,
112
112
  )
113
113
 
114
114
 
@@ -147,7 +147,7 @@ class AsyncLogsResource(AsyncAPIResource):
147
147
  extra_query: Query | None = None,
148
148
  extra_body: Body | None = None,
149
149
  timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
150
- ) -> AsyncPaginator[InferenceLog, AsyncOffsetPage[InferenceLog]]:
150
+ ) -> AsyncPaginator[InferenceDeploymentLog, AsyncOffsetPage[InferenceDeploymentLog]]:
151
151
  """
152
152
  Get inference deployment logs
153
153
 
@@ -179,7 +179,7 @@ class AsyncLogsResource(AsyncAPIResource):
179
179
  raise ValueError(f"Expected a non-empty value for `deployment_name` but received {deployment_name!r}")
180
180
  return self._get_api_list(
181
181
  f"/cloud/v3/inference/{project_id}/deployments/{deployment_name}/logs",
182
- page=AsyncOffsetPage[InferenceLog],
182
+ page=AsyncOffsetPage[InferenceDeploymentLog],
183
183
  options=make_request_options(
184
184
  extra_headers=extra_headers,
185
185
  extra_query=extra_query,
@@ -195,7 +195,7 @@ class AsyncLogsResource(AsyncAPIResource):
195
195
  log_list_params.LogListParams,
196
196
  ),
197
197
  ),
198
- model=InferenceLog,
198
+ model=InferenceDeploymentLog,
199
199
  )
200
200
 
201
201
 
@@ -54,7 +54,7 @@ from .deployments.deployments import (
54
54
  DeploymentsResourceWithStreamingResponse,
55
55
  AsyncDeploymentsResourceWithStreamingResponse,
56
56
  )
57
- from ....types.cloud.region_capacity_list import RegionCapacityList
57
+ from ....types.cloud.inference_region_capacity_list import InferenceRegionCapacityList
58
58
 
59
59
  __all__ = ["InferenceResource", "AsyncInferenceResource"]
60
60
 
@@ -108,14 +108,14 @@ class InferenceResource(SyncAPIResource):
108
108
  extra_query: Query | None = None,
109
109
  extra_body: Body | None = None,
110
110
  timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
111
- ) -> RegionCapacityList:
111
+ ) -> InferenceRegionCapacityList:
112
112
  """Get inference capacity by region"""
113
113
  return self._get(
114
114
  "/cloud/v3/inference/capacity",
115
115
  options=make_request_options(
116
116
  extra_headers=extra_headers, extra_query=extra_query, extra_body=extra_body, timeout=timeout
117
117
  ),
118
- cast_to=RegionCapacityList,
118
+ cast_to=InferenceRegionCapacityList,
119
119
  )
120
120
 
121
121
 
@@ -168,14 +168,14 @@ class AsyncInferenceResource(AsyncAPIResource):
168
168
  extra_query: Query | None = None,
169
169
  extra_body: Body | None = None,
170
170
  timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
171
- ) -> RegionCapacityList:
171
+ ) -> InferenceRegionCapacityList:
172
172
  """Get inference capacity by region"""
173
173
  return await self._get(
174
174
  "/cloud/v3/inference/capacity",
175
175
  options=make_request_options(
176
176
  extra_headers=extra_headers, extra_query=extra_query, extra_body=extra_body, timeout=timeout
177
177
  ),
178
- cast_to=RegionCapacityList,
178
+ cast_to=InferenceRegionCapacityList,
179
179
  )
180
180
 
181
181
 
@@ -2,6 +2,8 @@
2
2
 
3
3
  from __future__ import annotations
4
4
 
5
+ from typing_extensions import Literal
6
+
5
7
  import httpx
6
8
 
7
9
  from ...._types import NOT_GIVEN, Body, Query, Headers, NotGiven
@@ -16,9 +18,8 @@ from ...._response import (
16
18
  )
17
19
  from ....pagination import SyncOffsetPage, AsyncOffsetPage
18
20
  from ...._base_client import AsyncPaginator, make_request_options
19
- from ....types.cloud.inference import MlcatalogOrderByChoices, model_list_params
20
- from ....types.cloud.inference.mlcatalog_model_card import MlcatalogModelCard
21
- from ....types.cloud.inference.mlcatalog_order_by_choices import MlcatalogOrderByChoices
21
+ from ....types.cloud.inference import model_list_params
22
+ from ....types.cloud.inference.inference_model import InferenceModel
22
23
 
23
24
  __all__ = ["ModelsResource", "AsyncModelsResource"]
24
25
 
@@ -48,14 +49,14 @@ class ModelsResource(SyncAPIResource):
48
49
  *,
49
50
  limit: int | NotGiven = NOT_GIVEN,
50
51
  offset: int | NotGiven = NOT_GIVEN,
51
- order_by: MlcatalogOrderByChoices | NotGiven = NOT_GIVEN,
52
+ order_by: Literal["name.asc", "name.desc"] | NotGiven = NOT_GIVEN,
52
53
  # Use the following arguments if you need to pass additional parameters to the API that aren't available via kwargs.
53
54
  # The extra values given here take precedence over values defined on the client or passed to this method.
54
55
  extra_headers: Headers | None = None,
55
56
  extra_query: Query | None = None,
56
57
  extra_body: Body | None = None,
57
58
  timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
58
- ) -> SyncOffsetPage[MlcatalogModelCard]:
59
+ ) -> SyncOffsetPage[InferenceModel]:
59
60
  """List models from catalog
60
61
 
61
62
  Args:
@@ -78,7 +79,7 @@ class ModelsResource(SyncAPIResource):
78
79
  """
79
80
  return self._get_api_list(
80
81
  "/cloud/v3/inference/models",
81
- page=SyncOffsetPage[MlcatalogModelCard],
82
+ page=SyncOffsetPage[InferenceModel],
82
83
  options=make_request_options(
83
84
  extra_headers=extra_headers,
84
85
  extra_query=extra_query,
@@ -93,7 +94,7 @@ class ModelsResource(SyncAPIResource):
93
94
  model_list_params.ModelListParams,
94
95
  ),
95
96
  ),
96
- model=MlcatalogModelCard,
97
+ model=InferenceModel,
97
98
  )
98
99
 
99
100
  def get(
@@ -106,7 +107,7 @@ class ModelsResource(SyncAPIResource):
106
107
  extra_query: Query | None = None,
107
108
  extra_body: Body | None = None,
108
109
  timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
109
- ) -> MlcatalogModelCard:
110
+ ) -> InferenceModel:
110
111
  """
111
112
  Get model from catalog
112
113
 
@@ -128,7 +129,7 @@ class ModelsResource(SyncAPIResource):
128
129
  options=make_request_options(
129
130
  extra_headers=extra_headers, extra_query=extra_query, extra_body=extra_body, timeout=timeout
130
131
  ),
131
- cast_to=MlcatalogModelCard,
132
+ cast_to=InferenceModel,
132
133
  )
133
134
 
134
135
 
@@ -157,14 +158,14 @@ class AsyncModelsResource(AsyncAPIResource):
157
158
  *,
158
159
  limit: int | NotGiven = NOT_GIVEN,
159
160
  offset: int | NotGiven = NOT_GIVEN,
160
- order_by: MlcatalogOrderByChoices | NotGiven = NOT_GIVEN,
161
+ order_by: Literal["name.asc", "name.desc"] | NotGiven = NOT_GIVEN,
161
162
  # Use the following arguments if you need to pass additional parameters to the API that aren't available via kwargs.
162
163
  # The extra values given here take precedence over values defined on the client or passed to this method.
163
164
  extra_headers: Headers | None = None,
164
165
  extra_query: Query | None = None,
165
166
  extra_body: Body | None = None,
166
167
  timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
167
- ) -> AsyncPaginator[MlcatalogModelCard, AsyncOffsetPage[MlcatalogModelCard]]:
168
+ ) -> AsyncPaginator[InferenceModel, AsyncOffsetPage[InferenceModel]]:
168
169
  """List models from catalog
169
170
 
170
171
  Args:
@@ -187,7 +188,7 @@ class AsyncModelsResource(AsyncAPIResource):
187
188
  """
188
189
  return self._get_api_list(
189
190
  "/cloud/v3/inference/models",
190
- page=AsyncOffsetPage[MlcatalogModelCard],
191
+ page=AsyncOffsetPage[InferenceModel],
191
192
  options=make_request_options(
192
193
  extra_headers=extra_headers,
193
194
  extra_query=extra_query,
@@ -202,7 +203,7 @@ class AsyncModelsResource(AsyncAPIResource):
202
203
  model_list_params.ModelListParams,
203
204
  ),
204
205
  ),
205
- model=MlcatalogModelCard,
206
+ model=InferenceModel,
206
207
  )
207
208
 
208
209
  async def get(
@@ -215,7 +216,7 @@ class AsyncModelsResource(AsyncAPIResource):
215
216
  extra_query: Query | None = None,
216
217
  extra_body: Body | None = None,
217
218
  timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
218
- ) -> MlcatalogModelCard:
219
+ ) -> InferenceModel:
219
220
  """
220
221
  Get model from catalog
221
222
 
@@ -237,7 +238,7 @@ class AsyncModelsResource(AsyncAPIResource):
237
238
  options=make_request_options(
238
239
  extra_headers=extra_headers, extra_query=extra_query, extra_body=extra_body, timeout=timeout
239
240
  ),
240
- cast_to=MlcatalogModelCard,
241
+ cast_to=InferenceModel,
241
242
  )
242
243
 
243
244