databricks-sdk 0.56.0__py3-none-any.whl → 0.58.0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of databricks-sdk might be problematic. Click here for more details.
- databricks/sdk/__init__.py +38 -11
- databricks/sdk/service/aibuilder.py +122 -17
- databricks/sdk/service/apps.py +15 -45
- databricks/sdk/service/billing.py +70 -74
- databricks/sdk/service/catalog.py +1898 -557
- databricks/sdk/service/cleanrooms.py +14 -55
- databricks/sdk/service/compute.py +305 -508
- databricks/sdk/service/dashboards.py +148 -223
- databricks/sdk/service/database.py +657 -127
- databricks/sdk/service/files.py +18 -54
- databricks/sdk/service/iam.py +55 -165
- databricks/sdk/service/jobs.py +238 -214
- databricks/sdk/service/marketplace.py +47 -146
- databricks/sdk/service/ml.py +1137 -447
- databricks/sdk/service/oauth2.py +17 -46
- databricks/sdk/service/pipelines.py +93 -69
- databricks/sdk/service/provisioning.py +34 -212
- databricks/sdk/service/qualitymonitorv2.py +5 -33
- databricks/sdk/service/serving.py +69 -55
- databricks/sdk/service/settings.py +106 -434
- databricks/sdk/service/sharing.py +33 -95
- databricks/sdk/service/sql.py +164 -254
- databricks/sdk/service/vectorsearch.py +13 -62
- databricks/sdk/service/workspace.py +36 -110
- databricks/sdk/version.py +1 -1
- {databricks_sdk-0.56.0.dist-info → databricks_sdk-0.58.0.dist-info}/METADATA +1 -1
- {databricks_sdk-0.56.0.dist-info → databricks_sdk-0.58.0.dist-info}/RECORD +31 -31
- {databricks_sdk-0.56.0.dist-info → databricks_sdk-0.58.0.dist-info}/WHEEL +0 -0
- {databricks_sdk-0.56.0.dist-info → databricks_sdk-0.58.0.dist-info}/licenses/LICENSE +0 -0
- {databricks_sdk-0.56.0.dist-info → databricks_sdk-0.58.0.dist-info}/licenses/NOTICE +0 -0
- {databricks_sdk-0.56.0.dist-info → databricks_sdk-0.58.0.dist-info}/top_level.txt +0 -0
|
@@ -63,24 +63,6 @@ class AnomalyDetectionRunStatus(Enum):
|
|
|
63
63
|
ANOMALY_DETECTION_RUN_STATUS_WORKSPACE_MISMATCH_ERROR = "ANOMALY_DETECTION_RUN_STATUS_WORKSPACE_MISMATCH_ERROR"
|
|
64
64
|
|
|
65
65
|
|
|
66
|
-
@dataclass
|
|
67
|
-
class DeleteQualityMonitorResponse:
|
|
68
|
-
def as_dict(self) -> dict:
|
|
69
|
-
"""Serializes the DeleteQualityMonitorResponse into a dictionary suitable for use as a JSON request body."""
|
|
70
|
-
body = {}
|
|
71
|
-
return body
|
|
72
|
-
|
|
73
|
-
def as_shallow_dict(self) -> dict:
|
|
74
|
-
"""Serializes the DeleteQualityMonitorResponse into a shallow dictionary of its immediate attributes."""
|
|
75
|
-
body = {}
|
|
76
|
-
return body
|
|
77
|
-
|
|
78
|
-
@classmethod
|
|
79
|
-
def from_dict(cls, d: Dict[str, Any]) -> DeleteQualityMonitorResponse:
|
|
80
|
-
"""Deserializes the DeleteQualityMonitorResponse from a dictionary."""
|
|
81
|
-
return cls()
|
|
82
|
-
|
|
83
|
-
|
|
84
66
|
@dataclass
|
|
85
67
|
class ListQualityMonitorResponse:
|
|
86
68
|
next_page_token: Optional[str] = None
|
|
@@ -163,9 +145,7 @@ class QualityMonitorV2API:
|
|
|
163
145
|
self._api = api_client
|
|
164
146
|
|
|
165
147
|
def create_quality_monitor(self, quality_monitor: QualityMonitor) -> QualityMonitor:
|
|
166
|
-
"""Create a quality monitor
|
|
167
|
-
|
|
168
|
-
Create a quality monitor on UC object
|
|
148
|
+
"""Create a quality monitor on UC object
|
|
169
149
|
|
|
170
150
|
:param quality_monitor: :class:`QualityMonitor`
|
|
171
151
|
|
|
@@ -181,9 +161,7 @@ class QualityMonitorV2API:
|
|
|
181
161
|
return QualityMonitor.from_dict(res)
|
|
182
162
|
|
|
183
163
|
def delete_quality_monitor(self, object_type: str, object_id: str):
|
|
184
|
-
"""Delete a quality monitor
|
|
185
|
-
|
|
186
|
-
Delete a quality monitor on UC object
|
|
164
|
+
"""Delete a quality monitor on UC object
|
|
187
165
|
|
|
188
166
|
:param object_type: str
|
|
189
167
|
The type of the monitored object. Can be one of the following: schema.
|
|
@@ -200,9 +178,7 @@ class QualityMonitorV2API:
|
|
|
200
178
|
self._api.do("DELETE", f"/api/2.0/quality-monitors/{object_type}/{object_id}", headers=headers)
|
|
201
179
|
|
|
202
180
|
def get_quality_monitor(self, object_type: str, object_id: str) -> QualityMonitor:
|
|
203
|
-
"""Read a quality monitor
|
|
204
|
-
|
|
205
|
-
Read a quality monitor on UC object
|
|
181
|
+
"""Read a quality monitor on UC object
|
|
206
182
|
|
|
207
183
|
:param object_type: str
|
|
208
184
|
The type of the monitored object. Can be one of the following: schema.
|
|
@@ -222,9 +198,7 @@ class QualityMonitorV2API:
|
|
|
222
198
|
def list_quality_monitor(
|
|
223
199
|
self, *, page_size: Optional[int] = None, page_token: Optional[str] = None
|
|
224
200
|
) -> Iterator[QualityMonitor]:
|
|
225
|
-
"""List quality monitors
|
|
226
|
-
|
|
227
|
-
(Unimplemented) List quality monitors
|
|
201
|
+
"""(Unimplemented) List quality monitors
|
|
228
202
|
|
|
229
203
|
:param page_size: int (optional)
|
|
230
204
|
:param page_token: str (optional)
|
|
@@ -253,9 +227,7 @@ class QualityMonitorV2API:
|
|
|
253
227
|
def update_quality_monitor(
|
|
254
228
|
self, object_type: str, object_id: str, quality_monitor: QualityMonitor
|
|
255
229
|
) -> QualityMonitor:
|
|
256
|
-
"""Update a quality monitor
|
|
257
|
-
|
|
258
|
-
(Unimplemented) Update a quality monitor on UC object
|
|
230
|
+
"""(Unimplemented) Update a quality monitor on UC object
|
|
259
231
|
|
|
260
232
|
:param object_type: str
|
|
261
233
|
The type of the monitored object. Can be one of the following: schema.
|
|
@@ -306,8 +306,12 @@ class AiGatewayRateLimit:
|
|
|
306
306
|
"""Renewal period field for a rate limit. Currently, only 'minute' is supported."""
|
|
307
307
|
|
|
308
308
|
key: Optional[AiGatewayRateLimitKey] = None
|
|
309
|
-
"""Key field for a rate limit. Currently,
|
|
310
|
-
being the default if not specified."""
|
|
309
|
+
"""Key field for a rate limit. Currently, 'user', 'user_group', 'service_principal', and 'endpoint'
|
|
310
|
+
are supported, with 'endpoint' being the default if not specified."""
|
|
311
|
+
|
|
312
|
+
principal: Optional[str] = None
|
|
313
|
+
"""Principal field for a user, user group, or service principal to apply rate limiting to. Accepts
|
|
314
|
+
a user email, group name, or service principal application ID."""
|
|
311
315
|
|
|
312
316
|
def as_dict(self) -> dict:
|
|
313
317
|
"""Serializes the AiGatewayRateLimit into a dictionary suitable for use as a JSON request body."""
|
|
@@ -316,6 +320,8 @@ class AiGatewayRateLimit:
|
|
|
316
320
|
body["calls"] = self.calls
|
|
317
321
|
if self.key is not None:
|
|
318
322
|
body["key"] = self.key.value
|
|
323
|
+
if self.principal is not None:
|
|
324
|
+
body["principal"] = self.principal
|
|
319
325
|
if self.renewal_period is not None:
|
|
320
326
|
body["renewal_period"] = self.renewal_period.value
|
|
321
327
|
return body
|
|
@@ -327,6 +333,8 @@ class AiGatewayRateLimit:
|
|
|
327
333
|
body["calls"] = self.calls
|
|
328
334
|
if self.key is not None:
|
|
329
335
|
body["key"] = self.key
|
|
336
|
+
if self.principal is not None:
|
|
337
|
+
body["principal"] = self.principal
|
|
330
338
|
if self.renewal_period is not None:
|
|
331
339
|
body["renewal_period"] = self.renewal_period
|
|
332
340
|
return body
|
|
@@ -337,6 +345,7 @@ class AiGatewayRateLimit:
|
|
|
337
345
|
return cls(
|
|
338
346
|
calls=d.get("calls", None),
|
|
339
347
|
key=_enum(d, "key", AiGatewayRateLimitKey),
|
|
348
|
+
principal=d.get("principal", None),
|
|
340
349
|
renewal_period=_enum(d, "renewal_period", AiGatewayRateLimitRenewalPeriod),
|
|
341
350
|
)
|
|
342
351
|
|
|
@@ -344,7 +353,9 @@ class AiGatewayRateLimit:
|
|
|
344
353
|
class AiGatewayRateLimitKey(Enum):
|
|
345
354
|
|
|
346
355
|
ENDPOINT = "endpoint"
|
|
356
|
+
SERVICE_PRINCIPAL = "service_principal"
|
|
347
357
|
USER = "user"
|
|
358
|
+
USER_GROUP = "user_group"
|
|
348
359
|
|
|
349
360
|
|
|
350
361
|
class AiGatewayRateLimitRenewalPeriod(Enum):
|
|
@@ -919,6 +930,8 @@ class CreateServingEndpoint:
|
|
|
919
930
|
config: Optional[EndpointCoreConfigInput] = None
|
|
920
931
|
"""The core config of the serving endpoint."""
|
|
921
932
|
|
|
933
|
+
description: Optional[str] = None
|
|
934
|
+
|
|
922
935
|
rate_limits: Optional[List[RateLimit]] = None
|
|
923
936
|
"""Rate limits to be applied to the serving endpoint. NOTE: this field is deprecated, please use AI
|
|
924
937
|
Gateway to manage rate limits."""
|
|
@@ -938,6 +951,8 @@ class CreateServingEndpoint:
|
|
|
938
951
|
body["budget_policy_id"] = self.budget_policy_id
|
|
939
952
|
if self.config:
|
|
940
953
|
body["config"] = self.config.as_dict()
|
|
954
|
+
if self.description is not None:
|
|
955
|
+
body["description"] = self.description
|
|
941
956
|
if self.name is not None:
|
|
942
957
|
body["name"] = self.name
|
|
943
958
|
if self.rate_limits:
|
|
@@ -957,6 +972,8 @@ class CreateServingEndpoint:
|
|
|
957
972
|
body["budget_policy_id"] = self.budget_policy_id
|
|
958
973
|
if self.config:
|
|
959
974
|
body["config"] = self.config
|
|
975
|
+
if self.description is not None:
|
|
976
|
+
body["description"] = self.description
|
|
960
977
|
if self.name is not None:
|
|
961
978
|
body["name"] = self.name
|
|
962
979
|
if self.rate_limits:
|
|
@@ -974,6 +991,7 @@ class CreateServingEndpoint:
|
|
|
974
991
|
ai_gateway=_from_dict(d, "ai_gateway", AiGatewayConfig),
|
|
975
992
|
budget_policy_id=d.get("budget_policy_id", None),
|
|
976
993
|
config=_from_dict(d, "config", EndpointCoreConfigInput),
|
|
994
|
+
description=d.get("description", None),
|
|
977
995
|
name=d.get("name", None),
|
|
978
996
|
rate_limits=_repeated_dict(d, "rate_limits", RateLimit),
|
|
979
997
|
route_optimized=d.get("route_optimized", None),
|
|
@@ -2945,16 +2963,20 @@ class RateLimitRenewalPeriod(Enum):
|
|
|
2945
2963
|
|
|
2946
2964
|
@dataclass
|
|
2947
2965
|
class Route:
|
|
2948
|
-
served_model_name: str
|
|
2949
|
-
"""The name of the served model this route configures traffic for."""
|
|
2950
|
-
|
|
2951
2966
|
traffic_percentage: int
|
|
2952
2967
|
"""The percentage of endpoint traffic to send to this route. It must be an integer between 0 and
|
|
2953
2968
|
100 inclusive."""
|
|
2954
2969
|
|
|
2970
|
+
served_entity_name: Optional[str] = None
|
|
2971
|
+
|
|
2972
|
+
served_model_name: Optional[str] = None
|
|
2973
|
+
"""The name of the served model this route configures traffic for."""
|
|
2974
|
+
|
|
2955
2975
|
def as_dict(self) -> dict:
|
|
2956
2976
|
"""Serializes the Route into a dictionary suitable for use as a JSON request body."""
|
|
2957
2977
|
body = {}
|
|
2978
|
+
if self.served_entity_name is not None:
|
|
2979
|
+
body["served_entity_name"] = self.served_entity_name
|
|
2958
2980
|
if self.served_model_name is not None:
|
|
2959
2981
|
body["served_model_name"] = self.served_model_name
|
|
2960
2982
|
if self.traffic_percentage is not None:
|
|
@@ -2964,6 +2986,8 @@ class Route:
|
|
|
2964
2986
|
def as_shallow_dict(self) -> dict:
|
|
2965
2987
|
"""Serializes the Route into a shallow dictionary of its immediate attributes."""
|
|
2966
2988
|
body = {}
|
|
2989
|
+
if self.served_entity_name is not None:
|
|
2990
|
+
body["served_entity_name"] = self.served_entity_name
|
|
2967
2991
|
if self.served_model_name is not None:
|
|
2968
2992
|
body["served_model_name"] = self.served_model_name
|
|
2969
2993
|
if self.traffic_percentage is not None:
|
|
@@ -2974,7 +2998,9 @@ class Route:
|
|
|
2974
2998
|
def from_dict(cls, d: Dict[str, Any]) -> Route:
|
|
2975
2999
|
"""Deserializes the Route from a dictionary."""
|
|
2976
3000
|
return cls(
|
|
2977
|
-
|
|
3001
|
+
served_entity_name=d.get("served_entity_name", None),
|
|
3002
|
+
served_model_name=d.get("served_model_name", None),
|
|
3003
|
+
traffic_percentage=d.get("traffic_percentage", None),
|
|
2978
3004
|
)
|
|
2979
3005
|
|
|
2980
3006
|
|
|
@@ -3164,8 +3190,6 @@ class ServedEntityOutput:
|
|
|
3164
3190
|
external_model later. The task type of all external models within an endpoint must be the same."""
|
|
3165
3191
|
|
|
3166
3192
|
foundation_model: Optional[FoundationModel] = None
|
|
3167
|
-
"""All fields are not sensitive as they are hard-coded in the system and made available to
|
|
3168
|
-
customers."""
|
|
3169
3193
|
|
|
3170
3194
|
instance_profile_arn: Optional[str] = None
|
|
3171
3195
|
"""ARN of the instance profile that the served entity uses to access AWS resources."""
|
|
@@ -3331,8 +3355,6 @@ class ServedEntitySpec:
|
|
|
3331
3355
|
external_model: Optional[ExternalModel] = None
|
|
3332
3356
|
|
|
3333
3357
|
foundation_model: Optional[FoundationModel] = None
|
|
3334
|
-
"""All fields are not sensitive as they are hard-coded in the system and made available to
|
|
3335
|
-
customers."""
|
|
3336
3358
|
|
|
3337
3359
|
name: Optional[str] = None
|
|
3338
3360
|
|
|
@@ -3799,6 +3821,9 @@ class ServingEndpoint:
|
|
|
3799
3821
|
creator: Optional[str] = None
|
|
3800
3822
|
"""The email of the user who created the serving endpoint."""
|
|
3801
3823
|
|
|
3824
|
+
description: Optional[str] = None
|
|
3825
|
+
"""Description of the endpoint"""
|
|
3826
|
+
|
|
3802
3827
|
id: Optional[str] = None
|
|
3803
3828
|
"""System-generated ID of the endpoint, included to be used by the Permissions API."""
|
|
3804
3829
|
|
|
@@ -3830,6 +3855,8 @@ class ServingEndpoint:
|
|
|
3830
3855
|
body["creation_timestamp"] = self.creation_timestamp
|
|
3831
3856
|
if self.creator is not None:
|
|
3832
3857
|
body["creator"] = self.creator
|
|
3858
|
+
if self.description is not None:
|
|
3859
|
+
body["description"] = self.description
|
|
3833
3860
|
if self.id is not None:
|
|
3834
3861
|
body["id"] = self.id
|
|
3835
3862
|
if self.last_updated_timestamp is not None:
|
|
@@ -3857,6 +3884,8 @@ class ServingEndpoint:
|
|
|
3857
3884
|
body["creation_timestamp"] = self.creation_timestamp
|
|
3858
3885
|
if self.creator is not None:
|
|
3859
3886
|
body["creator"] = self.creator
|
|
3887
|
+
if self.description is not None:
|
|
3888
|
+
body["description"] = self.description
|
|
3860
3889
|
if self.id is not None:
|
|
3861
3890
|
body["id"] = self.id
|
|
3862
3891
|
if self.last_updated_timestamp is not None:
|
|
@@ -3880,6 +3909,7 @@ class ServingEndpoint:
|
|
|
3880
3909
|
config=_from_dict(d, "config", EndpointCoreConfigSummary),
|
|
3881
3910
|
creation_timestamp=d.get("creation_timestamp", None),
|
|
3882
3911
|
creator=d.get("creator", None),
|
|
3912
|
+
description=d.get("description", None),
|
|
3883
3913
|
id=d.get("id", None),
|
|
3884
3914
|
last_updated_timestamp=d.get("last_updated_timestamp", None),
|
|
3885
3915
|
name=d.get("name", None),
|
|
@@ -3895,7 +3925,6 @@ class ServingEndpointAccessControlRequest:
|
|
|
3895
3925
|
"""name of the group"""
|
|
3896
3926
|
|
|
3897
3927
|
permission_level: Optional[ServingEndpointPermissionLevel] = None
|
|
3898
|
-
"""Permission level"""
|
|
3899
3928
|
|
|
3900
3929
|
service_principal_name: Optional[str] = None
|
|
3901
3930
|
"""application ID of a service principal"""
|
|
@@ -4021,6 +4050,9 @@ class ServingEndpointDetailed:
|
|
|
4021
4050
|
data_plane_info: Optional[ModelDataPlaneInfo] = None
|
|
4022
4051
|
"""Information required to query DataPlane APIs."""
|
|
4023
4052
|
|
|
4053
|
+
description: Optional[str] = None
|
|
4054
|
+
"""Description of the serving model"""
|
|
4055
|
+
|
|
4024
4056
|
endpoint_url: Optional[str] = None
|
|
4025
4057
|
"""Endpoint invocation url if route optimization is enabled for endpoint"""
|
|
4026
4058
|
|
|
@@ -4067,6 +4099,8 @@ class ServingEndpointDetailed:
|
|
|
4067
4099
|
body["creator"] = self.creator
|
|
4068
4100
|
if self.data_plane_info:
|
|
4069
4101
|
body["data_plane_info"] = self.data_plane_info.as_dict()
|
|
4102
|
+
if self.description is not None:
|
|
4103
|
+
body["description"] = self.description
|
|
4070
4104
|
if self.endpoint_url is not None:
|
|
4071
4105
|
body["endpoint_url"] = self.endpoint_url
|
|
4072
4106
|
if self.id is not None:
|
|
@@ -4104,6 +4138,8 @@ class ServingEndpointDetailed:
|
|
|
4104
4138
|
body["creator"] = self.creator
|
|
4105
4139
|
if self.data_plane_info:
|
|
4106
4140
|
body["data_plane_info"] = self.data_plane_info
|
|
4141
|
+
if self.description is not None:
|
|
4142
|
+
body["description"] = self.description
|
|
4107
4143
|
if self.endpoint_url is not None:
|
|
4108
4144
|
body["endpoint_url"] = self.endpoint_url
|
|
4109
4145
|
if self.id is not None:
|
|
@@ -4136,6 +4172,7 @@ class ServingEndpointDetailed:
|
|
|
4136
4172
|
creation_timestamp=d.get("creation_timestamp", None),
|
|
4137
4173
|
creator=d.get("creator", None),
|
|
4138
4174
|
data_plane_info=_from_dict(d, "data_plane_info", ModelDataPlaneInfo),
|
|
4175
|
+
description=d.get("description", None),
|
|
4139
4176
|
endpoint_url=d.get("endpoint_url", None),
|
|
4140
4177
|
id=d.get("id", None),
|
|
4141
4178
|
last_updated_timestamp=d.get("last_updated_timestamp", None),
|
|
@@ -4163,7 +4200,6 @@ class ServingEndpointPermission:
|
|
|
4163
4200
|
inherited_from_object: Optional[List[str]] = None
|
|
4164
4201
|
|
|
4165
4202
|
permission_level: Optional[ServingEndpointPermissionLevel] = None
|
|
4166
|
-
"""Permission level"""
|
|
4167
4203
|
|
|
4168
4204
|
def as_dict(self) -> dict:
|
|
4169
4205
|
"""Serializes the ServingEndpointPermission into a dictionary suitable for use as a JSON request body."""
|
|
@@ -4250,7 +4286,6 @@ class ServingEndpointPermissionsDescription:
|
|
|
4250
4286
|
description: Optional[str] = None
|
|
4251
4287
|
|
|
4252
4288
|
permission_level: Optional[ServingEndpointPermissionLevel] = None
|
|
4253
|
-
"""Permission level"""
|
|
4254
4289
|
|
|
4255
4290
|
def as_dict(self) -> dict:
|
|
4256
4291
|
"""Serializes the ServingEndpointPermissionsDescription into a dictionary suitable for use as a JSON request body."""
|
|
@@ -4489,9 +4524,7 @@ class ServingEndpointsAPI:
|
|
|
4489
4524
|
raise TimeoutError(f"timed out after {timeout}: {status_message}")
|
|
4490
4525
|
|
|
4491
4526
|
def build_logs(self, name: str, served_model_name: str) -> BuildLogsResponse:
|
|
4492
|
-
"""
|
|
4493
|
-
|
|
4494
|
-
Retrieves the build logs associated with the provided served model.
|
|
4527
|
+
"""Retrieves the build logs associated with the provided served model.
|
|
4495
4528
|
|
|
4496
4529
|
:param name: str
|
|
4497
4530
|
The name of the serving endpoint that the served model belongs to. This field is required.
|
|
@@ -4517,6 +4550,7 @@ class ServingEndpointsAPI:
|
|
|
4517
4550
|
ai_gateway: Optional[AiGatewayConfig] = None,
|
|
4518
4551
|
budget_policy_id: Optional[str] = None,
|
|
4519
4552
|
config: Optional[EndpointCoreConfigInput] = None,
|
|
4553
|
+
description: Optional[str] = None,
|
|
4520
4554
|
rate_limits: Optional[List[RateLimit]] = None,
|
|
4521
4555
|
route_optimized: Optional[bool] = None,
|
|
4522
4556
|
tags: Optional[List[EndpointTag]] = None,
|
|
@@ -4534,6 +4568,7 @@ class ServingEndpointsAPI:
|
|
|
4534
4568
|
The budget policy to be applied to the serving endpoint.
|
|
4535
4569
|
:param config: :class:`EndpointCoreConfigInput` (optional)
|
|
4536
4570
|
The core config of the serving endpoint.
|
|
4571
|
+
:param description: str (optional)
|
|
4537
4572
|
:param rate_limits: List[:class:`RateLimit`] (optional)
|
|
4538
4573
|
Rate limits to be applied to the serving endpoint. NOTE: this field is deprecated, please use AI
|
|
4539
4574
|
Gateway to manage rate limits.
|
|
@@ -4553,6 +4588,8 @@ class ServingEndpointsAPI:
|
|
|
4553
4588
|
body["budget_policy_id"] = budget_policy_id
|
|
4554
4589
|
if config is not None:
|
|
4555
4590
|
body["config"] = config.as_dict()
|
|
4591
|
+
if description is not None:
|
|
4592
|
+
body["description"] = description
|
|
4556
4593
|
if name is not None:
|
|
4557
4594
|
body["name"] = name
|
|
4558
4595
|
if rate_limits is not None:
|
|
@@ -4580,6 +4617,7 @@ class ServingEndpointsAPI:
|
|
|
4580
4617
|
ai_gateway: Optional[AiGatewayConfig] = None,
|
|
4581
4618
|
budget_policy_id: Optional[str] = None,
|
|
4582
4619
|
config: Optional[EndpointCoreConfigInput] = None,
|
|
4620
|
+
description: Optional[str] = None,
|
|
4583
4621
|
rate_limits: Optional[List[RateLimit]] = None,
|
|
4584
4622
|
route_optimized: Optional[bool] = None,
|
|
4585
4623
|
tags: Optional[List[EndpointTag]] = None,
|
|
@@ -4589,6 +4627,7 @@ class ServingEndpointsAPI:
|
|
|
4589
4627
|
ai_gateway=ai_gateway,
|
|
4590
4628
|
budget_policy_id=budget_policy_id,
|
|
4591
4629
|
config=config,
|
|
4630
|
+
description=description,
|
|
4592
4631
|
name=name,
|
|
4593
4632
|
rate_limits=rate_limits,
|
|
4594
4633
|
route_optimized=route_optimized,
|
|
@@ -4672,9 +4711,7 @@ class ServingEndpointsAPI:
|
|
|
4672
4711
|
self._api.do("DELETE", f"/api/2.0/serving-endpoints/{name}", headers=headers)
|
|
4673
4712
|
|
|
4674
4713
|
def export_metrics(self, name: str) -> ExportMetricsResponse:
|
|
4675
|
-
"""
|
|
4676
|
-
|
|
4677
|
-
Retrieves the metrics associated with the provided serving endpoint in either Prometheus or
|
|
4714
|
+
"""Retrieves the metrics associated with the provided serving endpoint in either Prometheus or
|
|
4678
4715
|
OpenMetrics exposition format.
|
|
4679
4716
|
|
|
4680
4717
|
:param name: str
|
|
@@ -4691,9 +4728,7 @@ class ServingEndpointsAPI:
|
|
|
4691
4728
|
return ExportMetricsResponse.from_dict(res)
|
|
4692
4729
|
|
|
4693
4730
|
def get(self, name: str) -> ServingEndpointDetailed:
|
|
4694
|
-
"""
|
|
4695
|
-
|
|
4696
|
-
Retrieves the details for a single serving endpoint.
|
|
4731
|
+
"""Retrieves the details for a single serving endpoint.
|
|
4697
4732
|
|
|
4698
4733
|
:param name: str
|
|
4699
4734
|
The name of the serving endpoint. This field is required.
|
|
@@ -4709,9 +4744,7 @@ class ServingEndpointsAPI:
|
|
|
4709
4744
|
return ServingEndpointDetailed.from_dict(res)
|
|
4710
4745
|
|
|
4711
4746
|
def get_open_api(self, name: str) -> GetOpenApiResponse:
|
|
4712
|
-
"""Get the schema
|
|
4713
|
-
|
|
4714
|
-
Get the query schema of the serving endpoint in OpenAPI format. The schema contains information for
|
|
4747
|
+
"""Get the query schema of the serving endpoint in OpenAPI format. The schema contains information for
|
|
4715
4748
|
the supported paths, input and output format and datatypes.
|
|
4716
4749
|
|
|
4717
4750
|
:param name: str
|
|
@@ -4728,9 +4761,7 @@ class ServingEndpointsAPI:
|
|
|
4728
4761
|
return GetOpenApiResponse.from_dict(res)
|
|
4729
4762
|
|
|
4730
4763
|
def get_permission_levels(self, serving_endpoint_id: str) -> GetServingEndpointPermissionLevelsResponse:
|
|
4731
|
-
"""
|
|
4732
|
-
|
|
4733
|
-
Gets the permission levels that a user can have on an object.
|
|
4764
|
+
"""Gets the permission levels that a user can have on an object.
|
|
4734
4765
|
|
|
4735
4766
|
:param serving_endpoint_id: str
|
|
4736
4767
|
The serving endpoint for which to get or manage permissions.
|
|
@@ -4748,9 +4779,7 @@ class ServingEndpointsAPI:
|
|
|
4748
4779
|
return GetServingEndpointPermissionLevelsResponse.from_dict(res)
|
|
4749
4780
|
|
|
4750
4781
|
def get_permissions(self, serving_endpoint_id: str) -> ServingEndpointPermissions:
|
|
4751
|
-
"""
|
|
4752
|
-
|
|
4753
|
-
Gets the permissions of a serving endpoint. Serving endpoints can inherit permissions from their root
|
|
4782
|
+
"""Gets the permissions of a serving endpoint. Serving endpoints can inherit permissions from their root
|
|
4754
4783
|
object.
|
|
4755
4784
|
|
|
4756
4785
|
:param serving_endpoint_id: str
|
|
@@ -4818,6 +4847,7 @@ class ServingEndpointsAPI:
|
|
|
4818
4847
|
def list(self) -> Iterator[ServingEndpoint]:
|
|
4819
4848
|
"""Get all serving endpoints.
|
|
4820
4849
|
|
|
4850
|
+
|
|
4821
4851
|
:returns: Iterator over :class:`ServingEndpoint`
|
|
4822
4852
|
"""
|
|
4823
4853
|
|
|
@@ -4830,9 +4860,7 @@ class ServingEndpointsAPI:
|
|
|
4830
4860
|
return parsed if parsed is not None else []
|
|
4831
4861
|
|
|
4832
4862
|
def logs(self, name: str, served_model_name: str) -> ServerLogsResponse:
|
|
4833
|
-
"""
|
|
4834
|
-
|
|
4835
|
-
Retrieves the service logs associated with the provided served model.
|
|
4863
|
+
"""Retrieves the service logs associated with the provided served model.
|
|
4836
4864
|
|
|
4837
4865
|
:param name: str
|
|
4838
4866
|
The name of the serving endpoint that the served model belongs to. This field is required.
|
|
@@ -4854,9 +4882,7 @@ class ServingEndpointsAPI:
|
|
|
4854
4882
|
def patch(
|
|
4855
4883
|
self, name: str, *, add_tags: Optional[List[EndpointTag]] = None, delete_tags: Optional[List[str]] = None
|
|
4856
4884
|
) -> EndpointTags:
|
|
4857
|
-
"""
|
|
4858
|
-
|
|
4859
|
-
Used to batch add and delete tags from a serving endpoint with a single API call.
|
|
4885
|
+
"""Used to batch add and delete tags from a serving endpoint with a single API call.
|
|
4860
4886
|
|
|
4861
4887
|
:param name: str
|
|
4862
4888
|
The name of the serving endpoint whose tags to patch. This field is required.
|
|
@@ -4881,9 +4907,7 @@ class ServingEndpointsAPI:
|
|
|
4881
4907
|
return EndpointTags.from_dict(res)
|
|
4882
4908
|
|
|
4883
4909
|
def put(self, name: str, *, rate_limits: Optional[List[RateLimit]] = None) -> PutResponse:
|
|
4884
|
-
"""
|
|
4885
|
-
|
|
4886
|
-
Deprecated: Please use AI Gateway to manage rate limits instead.
|
|
4910
|
+
"""Deprecated: Please use AI Gateway to manage rate limits instead.
|
|
4887
4911
|
|
|
4888
4912
|
:param name: str
|
|
4889
4913
|
The name of the serving endpoint whose rate limits are being updated. This field is required.
|
|
@@ -4913,9 +4937,7 @@ class ServingEndpointsAPI:
|
|
|
4913
4937
|
rate_limits: Optional[List[AiGatewayRateLimit]] = None,
|
|
4914
4938
|
usage_tracking_config: Optional[AiGatewayUsageTrackingConfig] = None,
|
|
4915
4939
|
) -> PutAiGatewayResponse:
|
|
4916
|
-
"""
|
|
4917
|
-
|
|
4918
|
-
Used to update the AI Gateway of a serving endpoint. NOTE: External model, provisioned throughput, and
|
|
4940
|
+
"""Used to update the AI Gateway of a serving endpoint. NOTE: External model, provisioned throughput, and
|
|
4919
4941
|
pay-per-token endpoints are fully supported; agent endpoints currently only support inference tables.
|
|
4920
4942
|
|
|
4921
4943
|
:param name: str
|
|
@@ -5070,9 +5092,7 @@ class ServingEndpointsAPI:
|
|
|
5070
5092
|
*,
|
|
5071
5093
|
access_control_list: Optional[List[ServingEndpointAccessControlRequest]] = None,
|
|
5072
5094
|
) -> ServingEndpointPermissions:
|
|
5073
|
-
"""
|
|
5074
|
-
|
|
5075
|
-
Sets permissions on an object, replacing existing permissions if they exist. Deletes all direct
|
|
5095
|
+
"""Sets permissions on an object, replacing existing permissions if they exist. Deletes all direct
|
|
5076
5096
|
permissions if none are specified. Objects can inherit permissions from their root object.
|
|
5077
5097
|
|
|
5078
5098
|
:param serving_endpoint_id: str
|
|
@@ -5103,9 +5123,7 @@ class ServingEndpointsAPI:
|
|
|
5103
5123
|
served_models: Optional[List[ServedModelInput]] = None,
|
|
5104
5124
|
traffic_config: Optional[TrafficConfig] = None,
|
|
5105
5125
|
) -> Wait[ServingEndpointDetailed]:
|
|
5106
|
-
"""
|
|
5107
|
-
|
|
5108
|
-
Updates any combination of the serving endpoint's served entities, the compute configuration of those
|
|
5126
|
+
"""Updates any combination of the serving endpoint's served entities, the compute configuration of those
|
|
5109
5127
|
served entities, and the endpoint's traffic config. An endpoint that already has an update in progress
|
|
5110
5128
|
cannot be updated until the current update completes or fails.
|
|
5111
5129
|
|
|
@@ -5173,9 +5191,7 @@ class ServingEndpointsAPI:
|
|
|
5173
5191
|
*,
|
|
5174
5192
|
access_control_list: Optional[List[ServingEndpointAccessControlRequest]] = None,
|
|
5175
5193
|
) -> ServingEndpointPermissions:
|
|
5176
|
-
"""
|
|
5177
|
-
|
|
5178
|
-
Updates the permissions on a serving endpoint. Serving endpoints can inherit permissions from their
|
|
5194
|
+
"""Updates the permissions on a serving endpoint. Serving endpoints can inherit permissions from their
|
|
5179
5195
|
root object.
|
|
5180
5196
|
|
|
5181
5197
|
:param serving_endpoint_id: str
|
|
@@ -5200,9 +5216,7 @@ class ServingEndpointsAPI:
|
|
|
5200
5216
|
def update_provisioned_throughput_endpoint_config(
|
|
5201
5217
|
self, name: str, config: PtEndpointCoreConfig
|
|
5202
5218
|
) -> Wait[ServingEndpointDetailed]:
|
|
5203
|
-
"""
|
|
5204
|
-
|
|
5205
|
-
Updates any combination of the pt endpoint's served entities, the compute configuration of those
|
|
5219
|
+
"""Updates any combination of the pt endpoint's served entities, the compute configuration of those
|
|
5206
5220
|
served entities, and the endpoint's traffic config. Updates are instantaneous and endpoint should be
|
|
5207
5221
|
updated instantly
|
|
5208
5222
|
|