PyPI - gcore - Versions diffs - 0.3.0__py3-none-any.whl → 0.5.0__py3-none-any.whl - Mend

gcore 0.3.0__py3-none-any.whl → 0.5.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of gcore might be problematic. Click here for more details.

Files changed (226) hide show

gcore/__init__.py +2 -1
gcore/_base_client.py +31 -2
gcore/_client.py +18 -0
gcore/_constants.py +2 -2
gcore/_models.py +8 -5
gcore/_version.py +1 -1
gcore/pagination.py +252 -1
gcore/resources/__init__.py +28 -0
gcore/resources/cloud/baremetal/flavors.py +11 -137
gcore/resources/cloud/baremetal/images.py +10 -12
gcore/resources/cloud/baremetal/servers.py +33 -30
gcore/resources/cloud/billing_reservations.py +2 -2
gcore/resources/cloud/file_shares/file_shares.py +7 -8
gcore/resources/cloud/floating_ips.py +7 -12
gcore/resources/cloud/gpu_baremetal_clusters/gpu_baremetal_clusters.py +33 -22
gcore/resources/cloud/gpu_baremetal_clusters/images.py +9 -10
gcore/resources/cloud/gpu_baremetal_clusters/interfaces.py +2 -2
gcore/resources/cloud/gpu_baremetal_clusters/servers.py +8 -4
gcore/resources/cloud/inference/deployments/deployments.py +76 -35
gcore/resources/cloud/inference/deployments/logs.py +7 -7
gcore/resources/cloud/inference/inference.py +5 -5
gcore/resources/cloud/inference/models.py +16 -15
gcore/resources/cloud/inference/registry_credentials.py +18 -18
gcore/resources/cloud/inference/secrets.py +12 -13
gcore/resources/cloud/instances/flavors.py +9 -233
gcore/resources/cloud/instances/images.py +47 -37
gcore/resources/cloud/instances/instances.py +49 -34
gcore/resources/cloud/instances/interfaces.py +2 -2
gcore/resources/cloud/ip_ranges.py +34 -2
gcore/resources/cloud/load_balancers/l7_policies/l7_policies.py +10 -2
gcore/resources/cloud/load_balancers/listeners.py +17 -8
gcore/resources/cloud/load_balancers/load_balancers.py +73 -21
gcore/resources/cloud/load_balancers/metrics.py +2 -2
gcore/resources/cloud/load_balancers/pools/health_monitors.py +2 -2
gcore/resources/cloud/load_balancers/pools/members.py +6 -2
gcore/resources/cloud/networks/networks.py +81 -17
gcore/resources/cloud/networks/routers.py +18 -18
gcore/resources/cloud/networks/subnets.py +51 -11
gcore/resources/cloud/projects.py +38 -24
gcore/resources/cloud/quotas/quotas.py +6 -6
gcore/resources/cloud/quotas/requests.py +8 -8
gcore/resources/cloud/registries/artifacts.py +4 -4
gcore/resources/cloud/registries/registries.py +14 -16
gcore/resources/cloud/registries/repositories.py +4 -4
gcore/resources/cloud/registries/tags.py +2 -2
gcore/resources/cloud/registries/users.py +21 -22
gcore/resources/cloud/reserved_fixed_ips/reserved_fixed_ips.py +20 -20
gcore/resources/cloud/reserved_fixed_ips/vip.py +10 -10
gcore/resources/cloud/secrets.py +14 -224
gcore/resources/cloud/security_groups/rules.py +6 -6
gcore/resources/cloud/security_groups/security_groups.py +70 -31
gcore/resources/cloud/tasks.py +34 -32
gcore/resources/cloud/users/role_assignments.py +12 -14
gcore/resources/cloud/volumes.py +139 -49
gcore/resources/fastedge/__init__.py +103 -0
gcore/resources/fastedge/apps/__init__.py +33 -0
gcore/resources/fastedge/apps/apps.py +932 -0
gcore/resources/fastedge/apps/logs.py +248 -0
gcore/resources/fastedge/binaries.py +286 -0
gcore/resources/fastedge/fastedge.py +327 -0
gcore/resources/fastedge/kv_stores.py +523 -0
gcore/resources/fastedge/secrets.py +687 -0
gcore/resources/fastedge/statistics.py +347 -0
gcore/resources/fastedge/templates.py +652 -0
gcore/resources/iam/__init__.py +47 -0
gcore/resources/iam/api_tokens.py +521 -0
gcore/resources/iam/iam.py +199 -0
gcore/resources/iam/users.py +642 -0
gcore/resources/waap/__init__.py +0 -14
gcore/resources/waap/waap.py +0 -32
gcore/types/cloud/__init__.py +2 -28
gcore/types/cloud/baremetal/__init__.py +0 -1
gcore/types/cloud/baremetal/image_list_params.py +1 -5
gcore/types/cloud/baremetal/server_create_params.py +5 -9
gcore/types/cloud/baremetal/server_list_params.py +1 -5
gcore/types/cloud/ddos_profile.py +9 -3
gcore/types/cloud/file_share_create_params.py +3 -5
gcore/types/cloud/floating_ip_create_params.py +2 -4
gcore/types/cloud/floating_ip_list_params.py +1 -5
gcore/types/cloud/gpu_baremetal_cluster_create_params.py +3 -4
gcore/types/cloud/gpu_baremetal_clusters/image_upload_params.py +2 -4
gcore/types/cloud/health_monitor.py +6 -1
gcore/types/cloud/inference/__init__.py +12 -8
gcore/types/cloud/inference/deployment_create_params.py +224 -7
gcore/types/cloud/inference/deployment_update_params.py +24 -3
gcore/types/cloud/inference/deployments/__init__.py +1 -0
gcore/types/cloud/inference/{inference_log.py → deployments/inference_deployment_log.py} +3 -3
gcore/types/cloud/inference/inference_deployment.py +266 -0
gcore/types/cloud/inference/{inference_apikey_secret.py → inference_deployment_api_key.py} +2 -2
gcore/types/cloud/inference/{mlcatalog_model_card.py → inference_model.py} +2 -2
gcore/types/cloud/inference/{inference_registry_credential.py → inference_registry_credentials.py} +2 -2
gcore/types/cloud/inference/{inference_registry_credential_full.py → inference_registry_credentials_create.py} +2 -2
gcore/types/cloud/inference/inference_secret.py +10 -3
gcore/types/cloud/inference/model_list_params.py +2 -4
gcore/types/cloud/{container_probe.py → inference/probe.py} +9 -9
gcore/types/cloud/{container_probe_config.py → inference/probe_config.py} +5 -5
gcore/types/cloud/{container_probe_exec.py → inference/probe_exec.py} +3 -3
gcore/types/cloud/{container_probe_http_get.py → inference/probe_http_get.py} +3 -3
gcore/types/cloud/{container_probe_tcp_socket.py → inference/probe_tcp_socket.py} +3 -3
gcore/types/cloud/inference/secret_create_params.py +10 -4
gcore/types/cloud/inference/secret_replace_params.py +10 -4
gcore/types/cloud/{region_capacity.py → inference_region_capacity.py} +10 -3
gcore/types/cloud/{region_capacity_list.py → inference_region_capacity_list.py} +4 -4
gcore/types/cloud/instance_create_params.py +8 -9
gcore/types/cloud/instance_list_params.py +1 -5
gcore/types/cloud/instances/__init__.py +0 -2
gcore/types/cloud/instances/image_create_from_volume_params.py +2 -4
gcore/types/cloud/instances/image_list_params.py +1 -5
gcore/types/cloud/instances/image_upload_params.py +2 -4
gcore/types/cloud/load_balancer_create_params.py +8 -4
gcore/types/cloud/load_balancer_list_params.py +1 -5
gcore/types/cloud/load_balancer_update_params.py +24 -0
gcore/types/cloud/load_balancers/pool_create_params.py +6 -1
gcore/types/cloud/load_balancers/pool_update_params.py +6 -1
gcore/types/cloud/load_balancers/pools/member_add_params.py +6 -1
gcore/types/cloud/member.py +6 -1
gcore/types/cloud/network_create_params.py +2 -3
gcore/types/cloud/network_list_params.py +4 -5
gcore/types/cloud/network_update_params.py +28 -2
gcore/types/cloud/networks/router_list_params.py +2 -2
gcore/types/cloud/networks/subnet_create_params.py +2 -3
gcore/types/cloud/networks/subnet_list_params.py +1 -5
gcore/types/cloud/networks/subnet_update_params.py +25 -0
gcore/types/cloud/registries/__init__.py +1 -0
gcore/types/cloud/registries/user_refresh_secret_response.py +31 -0
gcore/types/cloud/reserved_fixed_ip_list_params.py +2 -2
gcore/types/cloud/security_group_list_params.py +3 -7
gcore/types/cloud/security_group_update_params.py +25 -0
gcore/types/cloud/tag_update_map_param.py +2 -2
gcore/types/cloud/task_list_params.py +15 -14
gcore/types/cloud/volume_list_params.py +1 -5
gcore/types/cloud/volume_update_params.py +29 -3
gcore/types/fastedge/__init__.py +48 -0
gcore/types/fastedge/app.py +81 -0
gcore/types/fastedge/app_create_params.py +56 -0
gcore/types/fastedge/app_list_params.py +50 -0
gcore/types/fastedge/app_param.py +56 -0
gcore/types/fastedge/app_replace_params.py +17 -0
gcore/types/fastedge/app_short.py +60 -0
gcore/types/fastedge/app_update_params.py +56 -0
gcore/types/fastedge/apps/__init__.py +6 -0
gcore/types/fastedge/apps/log.py +28 -0
gcore/types/fastedge/apps/log_list_params.py +37 -0
gcore/types/fastedge/binary.py +40 -0
gcore/types/fastedge/binary_list_response.py +12 -0
gcore/types/fastedge/binary_short.py +32 -0
gcore/types/fastedge/call_status.py +24 -0
gcore/types/fastedge/client.py +57 -0
gcore/types/fastedge/duration_stats.py +30 -0
gcore/types/fastedge/kv_store.py +33 -0
gcore/types/fastedge/kv_store_create_params.py +23 -0
gcore/types/fastedge/kv_store_get_response.py +10 -0
gcore/types/fastedge/kv_store_list_params.py +12 -0
gcore/types/fastedge/kv_store_list_response.py +15 -0
gcore/types/fastedge/kv_store_replace_params.py +23 -0
gcore/types/fastedge/kv_store_short.py +19 -0
gcore/types/fastedge/kv_store_stats.py +26 -0
gcore/types/fastedge/secret.py +29 -0
gcore/types/fastedge/secret_create_params.py +27 -0
gcore/types/fastedge/secret_create_response.py +12 -0
gcore/types/fastedge/secret_delete_params.py +12 -0
gcore/types/fastedge/secret_list_params.py +15 -0
gcore/types/{cloud → fastedge}/secret_list_response.py +2 -6
gcore/types/fastedge/secret_replace_params.py +27 -0
gcore/types/fastedge/secret_short.py +21 -0
gcore/types/fastedge/secret_update_params.py +27 -0
gcore/types/fastedge/statistic_get_call_series_params.py +28 -0
gcore/types/fastedge/statistic_get_call_series_response.py +12 -0
gcore/types/fastedge/statistic_get_duration_series_params.py +28 -0
gcore/types/fastedge/statistic_get_duration_series_response.py +12 -0
gcore/types/fastedge/template.py +31 -0
gcore/types/fastedge/template_create_params.py +30 -0
gcore/types/fastedge/template_delete_params.py +12 -0
gcore/types/fastedge/template_list_params.py +25 -0
gcore/types/fastedge/template_parameter.py +22 -0
gcore/types/fastedge/template_parameter_param.py +21 -0
gcore/types/fastedge/template_replace_params.py +30 -0
gcore/types/fastedge/template_short.py +27 -0
gcore/types/iam/__init__.py +17 -0
gcore/types/iam/account_overview.py +488 -0
gcore/types/iam/api_token.py +78 -0
gcore/types/iam/api_token_create.py +15 -0
gcore/types/iam/api_token_create_params.py +42 -0
gcore/types/iam/api_token_list.py +81 -0
gcore/types/iam/api_token_list_params.py +41 -0
gcore/types/iam/user.py +86 -0
gcore/types/iam/user_detailed.py +104 -0
gcore/types/iam/user_invite.py +15 -0
gcore/types/iam/user_invite_params.py +37 -0
gcore/types/iam/user_list_params.py +15 -0
gcore/types/iam/user_update.py +104 -0
gcore/types/iam/user_update_params.py +52 -0
gcore/types/waap/__init__.py +0 -1
gcore/types/waap/domains/custom_rule_create_params.py +7 -3
gcore/types/waap/domains/custom_rule_update_params.py +7 -3
gcore/types/waap/waap_custom_rule.py +7 -3
{gcore-0.3.0.dist-info → gcore-0.5.0.dist-info}/METADATA +44 -5
{gcore-0.3.0.dist-info → gcore-0.5.0.dist-info}/RECORD +200 -151
gcore/resources/waap/clients.py +0 -135
gcore/types/cloud/aws_iam_data.py +0 -13
gcore/types/cloud/aws_iam_data_param.py +0 -15
gcore/types/cloud/baremetal/flavor_list_suitable_params.py +0 -22
gcore/types/cloud/capacity.py +0 -13
gcore/types/cloud/container_probe_config_create_param.py +0 -17
gcore/types/cloud/container_probe_create_param.py +0 -38
gcore/types/cloud/container_probe_exec_create_param.py +0 -13
gcore/types/cloud/container_probe_http_get_create_param.py +0 -25
gcore/types/cloud/container_probe_tcp_socket_create_param.py +0 -12
gcore/types/cloud/container_scale.py +0 -25
gcore/types/cloud/container_scale_trigger_rate.py +0 -13
gcore/types/cloud/container_scale_trigger_sqs.py +0 -33
gcore/types/cloud/container_scale_trigger_threshold.py +0 -10
gcore/types/cloud/container_scale_triggers.py +0 -36
gcore/types/cloud/deploy_status.py +0 -13
gcore/types/cloud/inference/container.py +0 -26
gcore/types/cloud/inference/inference.py +0 -95
gcore/types/cloud/inference/mlcatalog_order_by_choices.py +0 -7
gcore/types/cloud/inference_probes.py +0 -19
gcore/types/cloud/ingress_opts_out.py +0 -16
gcore/types/cloud/ingress_opts_param.py +0 -18
gcore/types/cloud/instances/flavor_list_for_resize_params.py +0 -16
gcore/types/cloud/instances/flavor_list_suitable_params.py +0 -59
gcore/types/cloud/secret_create_params.py +0 -66
gcore/types/waap/client_me_response.py +0 -34
{gcore-0.3.0.dist-info → gcore-0.5.0.dist-info}/WHEEL +0 -0
{gcore-0.3.0.dist-info → gcore-0.5.0.dist-info}/licenses/LICENSE +0 -0

gcore/types/cloud/inference/deployment_create_params.py CHANGED Viewed

@@ -6,9 +6,7 @@ from typing import Dict, List, Iterable, Optional
 from typing_extensions import Required, Annotated, TypedDict
 from ...._utils import PropertyInfo
-from ..ingress_opts_param import IngressOptsParam
 from ..laas_index_retention_policy_param import LaasIndexRetentionPolicyParam
-from ..container_probe_config_create_param import ContainerProbeConfigCreateParam
 __all__ = [
     "DeploymentCreateParams",
@@ -21,8 +19,24 @@ __all__ = [
     "ContainerScaleTriggersHTTP",
     "ContainerScaleTriggersMemory",
     "ContainerScaleTriggersSqs",
+    "IngressOpts",
     "Logging",
     "Probes",
+    "ProbesLivenessProbe",
+    "ProbesLivenessProbeProbe",
+    "ProbesLivenessProbeProbeExec",
+    "ProbesLivenessProbeProbeHTTPGet",
+    "ProbesLivenessProbeProbeTcpSocket",
+    "ProbesReadinessProbe",
+    "ProbesReadinessProbeProbe",
+    "ProbesReadinessProbeProbeExec",
+    "ProbesReadinessProbeProbeHTTPGet",
+    "ProbesReadinessProbeProbeTcpSocket",
+    "ProbesStartupProbe",
+    "ProbesStartupProbeProbe",
+    "ProbesStartupProbeProbeExec",
+    "ProbesStartupProbeProbeHTTPGet",
+    "ProbesStartupProbeProbeTcpSocket",
 ]
@@ -50,11 +64,20 @@ class DeploymentCreateParams(TypedDict, total=False):
     name: Required[str]
     """Inference instance name."""
+    api_keys: List[str]
+    """List of API keys for the inference instance.
+    Multiple keys can be attached to one deployment.If `auth_enabled` and `api_keys`
+    are both specified, a ValidationError will be raised.
+    """
     auth_enabled: bool
     """Set to `true` to enable API key authentication for the inference instance.
     `"Authorization": "Bearer ****\\**"` or `"X-Api-Key": "****\\**"` header is required
-    for the requests to the instance if enabled
+    for the requests to the instance if enabled. This field is deprecated and will
+    be removed in the future. Use `api_keys` field instead.If `auth_enabled` and
+    `api_keys` are both specified, a ValidationError will be raised.
     """
     command: Optional[List[str]]
@@ -69,7 +92,7 @@ class DeploymentCreateParams(TypedDict, total=False):
     envs: Dict[str, str]
     """Environment variables for the inference instance."""
-    ingress_opts: Optional[IngressOptsParam]
+    ingress_opts: Optional[IngressOpts]
     """Ingress options for the inference instance"""
     logging: Optional[Logging]
@@ -197,6 +220,17 @@ class Container(TypedDict, total=False):
     """Scale for the container"""
+class IngressOpts(TypedDict, total=False):
+    disable_response_buffering: bool
+    """Disable response buffering if true.
+    A client usually has a much slower connection and can not consume the response
+    data as fast as it is produced by an upstream application. Ingress tries to
+    buffer the whole response in order to release the upstream application as soon
+    as possible.By default, the response buffering is enabled.
+    """
 class Logging(TypedDict, total=False):
     destination_region_id: Optional[int]
     """ID of the region in which the logs will be stored"""
@@ -211,12 +245,195 @@ class Logging(TypedDict, total=False):
     """The topic name to stream logs to"""
+class ProbesLivenessProbeProbeExec(TypedDict, total=False):
+    command: Required[List[str]]
+    """Command to be executed inside the running container."""
+class ProbesLivenessProbeProbeHTTPGet(TypedDict, total=False):
+    port: Required[int]
+    """Port number the probe should connect to."""
+    headers: Dict[str, str]
+    """HTTP headers to be sent with the request."""
+    host: Optional[str]
+    """Host name to send HTTP request to."""
+    path: str
+    """The endpoint to send the HTTP request to."""
+    schema: str
+    """Schema to use for the HTTP request."""
+class ProbesLivenessProbeProbeTcpSocket(TypedDict, total=False):
+    port: Required[int]
+    """Port number to check if it's open."""
+class ProbesLivenessProbeProbe(TypedDict, total=False):
+    exec: Optional[ProbesLivenessProbeProbeExec]
+    """Exec probe configuration"""
+    failure_threshold: int
+    """The number of consecutive probe failures that mark the container as unhealthy."""
+    http_get: Optional[ProbesLivenessProbeProbeHTTPGet]
+    """HTTP GET probe configuration"""
+    initial_delay_seconds: int
+    """The initial delay before starting the first probe."""
+    period_seconds: int
+    """How often (in seconds) to perform the probe."""
+    success_threshold: int
+    """The number of consecutive successful probes that mark the container as healthy."""
+    tcp_socket: Optional[ProbesLivenessProbeProbeTcpSocket]
+    """TCP socket probe configuration"""
+    timeout_seconds: int
+    """The timeout for each probe."""
+class ProbesLivenessProbe(TypedDict, total=False):
+    enabled: Required[bool]
+    """Whether the probe is enabled or not."""
+    probe: ProbesLivenessProbeProbe
+    """Probe configuration (exec, `http_get` or `tcp_socket`)"""
+class ProbesReadinessProbeProbeExec(TypedDict, total=False):
+    command: Required[List[str]]
+    """Command to be executed inside the running container."""
+class ProbesReadinessProbeProbeHTTPGet(TypedDict, total=False):
+    port: Required[int]
+    """Port number the probe should connect to."""
+    headers: Dict[str, str]
+    """HTTP headers to be sent with the request."""
+    host: Optional[str]
+    """Host name to send HTTP request to."""
+    path: str
+    """The endpoint to send the HTTP request to."""
+    schema: str
+    """Schema to use for the HTTP request."""
+class ProbesReadinessProbeProbeTcpSocket(TypedDict, total=False):
+    port: Required[int]
+    """Port number to check if it's open."""
+class ProbesReadinessProbeProbe(TypedDict, total=False):
+    exec: Optional[ProbesReadinessProbeProbeExec]
+    """Exec probe configuration"""
+    failure_threshold: int
+    """The number of consecutive probe failures that mark the container as unhealthy."""
+    http_get: Optional[ProbesReadinessProbeProbeHTTPGet]
+    """HTTP GET probe configuration"""
+    initial_delay_seconds: int
+    """The initial delay before starting the first probe."""
+    period_seconds: int
+    """How often (in seconds) to perform the probe."""
+    success_threshold: int
+    """The number of consecutive successful probes that mark the container as healthy."""
+    tcp_socket: Optional[ProbesReadinessProbeProbeTcpSocket]
+    """TCP socket probe configuration"""
+    timeout_seconds: int
+    """The timeout for each probe."""
+class ProbesReadinessProbe(TypedDict, total=False):
+    enabled: Required[bool]
+    """Whether the probe is enabled or not."""
+    probe: ProbesReadinessProbeProbe
+    """Probe configuration (exec, `http_get` or `tcp_socket`)"""
+class ProbesStartupProbeProbeExec(TypedDict, total=False):
+    command: Required[List[str]]
+    """Command to be executed inside the running container."""
+class ProbesStartupProbeProbeHTTPGet(TypedDict, total=False):
+    port: Required[int]
+    """Port number the probe should connect to."""
+    headers: Dict[str, str]
+    """HTTP headers to be sent with the request."""
+    host: Optional[str]
+    """Host name to send HTTP request to."""
+    path: str
+    """The endpoint to send the HTTP request to."""
+    schema: str
+    """Schema to use for the HTTP request."""
+class ProbesStartupProbeProbeTcpSocket(TypedDict, total=False):
+    port: Required[int]
+    """Port number to check if it's open."""
+class ProbesStartupProbeProbe(TypedDict, total=False):
+    exec: Optional[ProbesStartupProbeProbeExec]
+    """Exec probe configuration"""
+    failure_threshold: int
+    """The number of consecutive probe failures that mark the container as unhealthy."""
+    http_get: Optional[ProbesStartupProbeProbeHTTPGet]
+    """HTTP GET probe configuration"""
+    initial_delay_seconds: int
+    """The initial delay before starting the first probe."""
+    period_seconds: int
+    """How often (in seconds) to perform the probe."""
+    success_threshold: int
+    """The number of consecutive successful probes that mark the container as healthy."""
+    tcp_socket: Optional[ProbesStartupProbeProbeTcpSocket]
+    """TCP socket probe configuration"""
+    timeout_seconds: int
+    """The timeout for each probe."""
+class ProbesStartupProbe(TypedDict, total=False):
+    enabled: Required[bool]
+    """Whether the probe is enabled or not."""
+    probe: ProbesStartupProbeProbe
+    """Probe configuration (exec, `http_get` or `tcp_socket`)"""
 class Probes(TypedDict, total=False):
-    liveness_probe: Optional[ContainerProbeConfigCreateParam]
+    liveness_probe: Optional[ProbesLivenessProbe]
     """Liveness probe configuration"""
-    readiness_probe: Optional[ContainerProbeConfigCreateParam]
+    readiness_probe: Optional[ProbesReadinessProbe]
     """Readiness probe configuration"""
-    startup_probe: Optional[ContainerProbeConfigCreateParam]
+    startup_probe: Optional[ProbesStartupProbe]
     """Startup probe configuration"""

gcore/types/cloud/inference/deployment_update_params.py CHANGED Viewed

@@ -6,7 +6,6 @@ from typing import Dict, List, Iterable, Optional
 from typing_extensions import Required, Annotated, TypedDict
 from ...._utils import PropertyInfo
-from ..ingress_opts_param import IngressOptsParam
 from ..laas_index_retention_policy_param import LaasIndexRetentionPolicyParam
 __all__ = [
@@ -20,6 +19,7 @@ __all__ = [
     "ContainerScaleTriggersHTTP",
     "ContainerScaleTriggersMemory",
     "ContainerScaleTriggersSqs",
+    "IngressOpts",
     "Logging",
     "Probes",
     "ProbesLivenessProbe",
@@ -44,11 +44,21 @@ class DeploymentUpdateParams(TypedDict, total=False):
     project_id: int
     """Project ID"""
+    api_keys: Optional[List[str]]
+    """List of API keys for the inference instance.
+    Multiple keys can be attached to one deployment.If `auth_enabled` and `api_keys`
+    are both specified, a ValidationError will be raised.If `[]` is provided, the
+    API keys will be removed and auth will be disabled on the deployment.
+    """
     auth_enabled: bool
     """Set to `true` to enable API key authentication for the inference instance.
     `"Authorization": "Bearer ****\\**"` or `"X-Api-Key": "****\\**"` header is required
-    for the requests to the instance if enabled
+    for the requests to the instance if enabled. This field is deprecated and will
+    be removed in the future. Use `api_keys` field instead.If `auth_enabled` and
+    `api_keys` are both specified, a ValidationError will be raised.
     """
     command: Optional[List[str]]
@@ -77,7 +87,7 @@ class DeploymentUpdateParams(TypedDict, total=False):
     accessible Docker image URL can be specified.
     """
-    ingress_opts: Optional[IngressOptsParam]
+    ingress_opts: Optional[IngressOpts]
     """Ingress options for the inference instance"""
     listening_port: Optional[int]
@@ -204,6 +214,17 @@ class Container(TypedDict, total=False):
     """Scale for the container"""
+class IngressOpts(TypedDict, total=False):
+    disable_response_buffering: bool
+    """Disable response buffering if true.
+    A client usually has a much slower connection and can not consume the response
+    data as fast as it is produced by an upstream application. Ingress tries to
+    buffer the whole response in order to release the upstream application as soon
+    as possible.By default, the response buffering is enabled.
+    """
 class Logging(TypedDict, total=False):
     destination_region_id: Optional[int]
     """ID of the region in which the logs will be stored"""

gcore/types/cloud/inference/deployments/__init__.py CHANGED Viewed

@@ -3,3 +3,4 @@
 from __future__ import annotations
 from .log_list_params import LogListParams as LogListParams
+from .inference_deployment_log import InferenceDeploymentLog as InferenceDeploymentLog

gcore/types/cloud/inference/{inference_log.py → deployments/inference_deployment_log.py} RENAMED Viewed

@@ -2,12 +2,12 @@
 from datetime import datetime
-from ...._models import BaseModel
+from ....._models import BaseModel
-__all__ = ["InferenceLog"]
+__all__ = ["InferenceDeploymentLog"]
-class InferenceLog(BaseModel):
+class InferenceDeploymentLog(BaseModel):
     message: str
     """Log message."""

gcore/types/cloud/inference/inference_deployment.py ADDED Viewed

@@ -0,0 +1,266 @@
+# File generated from our OpenAPI spec by Stainless. See CONTRIBUTING.md for details.
+from typing import Dict, List, Optional
+from typing_extensions import Literal
+from ..logging import Logging
+from ...._models import BaseModel
+from .probe_config import ProbeConfig
+__all__ = [
+    "InferenceDeployment",
+    "Container",
+    "ContainerDeployStatus",
+    "ContainerScale",
+    "ContainerScaleTriggers",
+    "ContainerScaleTriggersCPU",
+    "ContainerScaleTriggersGPUMemory",
+    "ContainerScaleTriggersGPUUtilization",
+    "ContainerScaleTriggersHTTP",
+    "ContainerScaleTriggersMemory",
+    "ContainerScaleTriggersSqs",
+    "IngressOpts",
+    "ObjectReference",
+    "Probes",
+]
+class ContainerDeployStatus(BaseModel):
+    ready: int
+    """Number of ready instances"""
+    total: int
+    """Total number of instances"""
+class ContainerScaleTriggersCPU(BaseModel):
+    threshold: int
+    """Threshold value for the trigger in percentage"""
+class ContainerScaleTriggersGPUMemory(BaseModel):
+    threshold: int
+    """Threshold value for the trigger in percentage"""
+class ContainerScaleTriggersGPUUtilization(BaseModel):
+    threshold: int
+    """Threshold value for the trigger in percentage"""
+class ContainerScaleTriggersHTTP(BaseModel):
+    rate: int
+    """Request count per 'window' seconds for the http trigger"""
+    window: int
+    """Time window for rate calculation in seconds"""
+class ContainerScaleTriggersMemory(BaseModel):
+    threshold: int
+    """Threshold value for the trigger in percentage"""
+class ContainerScaleTriggersSqs(BaseModel):
+    activation_queue_length: int
+    """Number of messages for activation"""
+    aws_endpoint: Optional[str] = None
+    """Custom AWS endpoint"""
+    aws_region: str
+    """AWS region"""
+    queue_length: int
+    """Number of messages for one replica"""
+    queue_url: str
+    """SQS queue URL"""
+    scale_on_delayed: bool
+    """Scale on delayed messages"""
+    scale_on_flight: bool
+    """Scale on in-flight messages"""
+    secret_name: str
+    """Auth secret name"""
+class ContainerScaleTriggers(BaseModel):
+    cpu: Optional[ContainerScaleTriggersCPU] = None
+    """CPU trigger configuration"""
+    gpu_memory: Optional[ContainerScaleTriggersGPUMemory] = None
+    """GPU memory trigger configuration.
+    Calculated by `DCGM_FI_DEV_MEM_COPY_UTIL` metric
+    """
+    gpu_utilization: Optional[ContainerScaleTriggersGPUUtilization] = None
+    """GPU utilization trigger configuration.
+    Calculated by `DCGM_FI_DEV_GPU_UTIL` metric
+    """
+    http: Optional[ContainerScaleTriggersHTTP] = None
+    """HTTP trigger configuration"""
+    memory: Optional[ContainerScaleTriggersMemory] = None
+    """Memory trigger configuration"""
+    sqs: Optional[ContainerScaleTriggersSqs] = None
+    """SQS trigger configuration"""
+class ContainerScale(BaseModel):
+    cooldown_period: Optional[int] = None
+    """Cooldown period between scaling actions in seconds"""
+    max: int
+    """Maximum scale for the container"""
+    min: int
+    """Minimum scale for the container"""
+    polling_interval: Optional[int] = None
+    """Polling interval for scaling triggers in seconds"""
+    triggers: ContainerScaleTriggers
+    """Triggers for scaling actions"""
+class Container(BaseModel):
+    address: Optional[str] = None
+    """Address of the inference instance"""
+    deploy_status: ContainerDeployStatus
+    """Status of the containers deployment"""
+    error_message: Optional[str] = None
+    """Error message if the container deployment failed"""
+    region_id: int
+    """Region name for the container"""
+    scale: ContainerScale
+    """Scale for the container"""
+class IngressOpts(BaseModel):
+    disable_response_buffering: bool
+    """Disable response buffering if true.
+    A client usually has a much slower connection and can not consume the response
+    data as fast as it is produced by an upstream application. Ingress tries to
+    buffer the whole response in order to release the upstream application as soon
+    as possible.By default, the response buffering is enabled.
+    """
+class ObjectReference(BaseModel):
+    kind: Literal["AppDeployment"]
+    """Kind of the inference object to be referenced"""
+    name: str
+    """Name of the inference object to be referenced"""
+class Probes(BaseModel):
+    liveness_probe: Optional[ProbeConfig] = None
+    """Liveness probe configuration"""
+    readiness_probe: Optional[ProbeConfig] = None
+    """Readiness probe configuration"""
+    startup_probe: Optional[ProbeConfig] = None
+    """Startup probe configuration"""
+class InferenceDeployment(BaseModel):
+    address: Optional[str] = None
+    """Address of the inference instance"""
+    auth_enabled: bool
+    """`true` if instance uses API key authentication.
+    `"Authorization": "Bearer ****\\**"` or `"X-Api-Key": "****\\**"` header is required
+    for the requests to the instance if enabled.
+    """
+    command: Optional[str] = None
+    """Command to be executed when running a container from an image."""
+    containers: List[Container]
+    """List of containers for the inference instance"""
+    created_at: Optional[str] = None
+    """Inference instance creation date in ISO 8601 format."""
+    credentials_name: str
+    """Registry credentials name"""
+    description: str
+    """Inference instance description."""
+    envs: Optional[Dict[str, str]] = None
+    """Environment variables for the inference instance"""
+    flavor_name: str
+    """Flavor name for the inference instance"""
+    image: str
+    """Docker image for the inference instance.
+    This field should contain the image name and tag in the format 'name:tag', e.g.,
+    'nginx:latest'. It defaults to Docker Hub as the image registry, but any
+    accessible Docker image URL can be specified.
+    """
+    ingress_opts: Optional[IngressOpts] = None
+    """Ingress options for the inference instance"""
+    listening_port: int
+    """Listening port for the inference instance."""
+    logging: Optional[Logging] = None
+    """Logging configuration for the inference instance"""
+    name: str
+    """Inference instance name."""
+    object_references: List[ObjectReference]
+    """Indicates to which parent object this inference belongs to."""
+    probes: Optional[Probes] = None
+    """Probes configured for all containers of the inference instance."""
+    project_id: int
+    """Project ID. If not provided, your default project ID will be used."""
+    status: Literal["ACTIVE", "DELETING", "DEPLOYING", "DISABLED", "PARTIALLYDEPLOYED", "PENDING"]
+    """Inference instance status. Value can be one of the following:
+    - `DEPLOYING` - The instance is being deployed. Containers are not yet created.
+    - `PARTIALLYDEPLOYED` - All containers have been created, but some may not be
+      ready yet. Instances stuck in this state typically indicate either image being
+      pulled, or a failure of some kind. In the latter case, the `error_message`
+      field of the respective container object in the `containers` collection
+      explains the failure reason.
+    - `ACTIVE` - The instance is running and ready to accept requests.
+    - `DISABLED` - The instance is disabled and not accepting any requests.
+    - `PENDING` - The instance is running but scaled to zero. It will be
+      automatically scaled up when a request is made.
+    - `DELETING` - The instance is being deleted.
+    """
+    timeout: Optional[int] = None
+    """
+    Specifies the duration in seconds without any requests after which the
+    containers will be downscaled to their minimum scale value as defined by
+    `scale.min`. If set, this helps in optimizing resource usage by reducing the
+    number of container instances during periods of inactivity.
+    """
+    api_keys: Optional[List[str]] = None
+    """List of API keys for the inference instance"""

gcore/types/cloud/inference/{inference_apikey_secret.py → inference_deployment_api_key.py} RENAMED Viewed

@@ -4,10 +4,10 @@ from typing_extensions import Literal
 from ...._models import BaseModel
-__all__ = ["InferenceApikeySecret"]
+__all__ = ["InferenceDeploymentAPIKey"]
-class InferenceApikeySecret(BaseModel):
+class InferenceDeploymentAPIKey(BaseModel):
     secret: str
     """API key secret"""

gcore/types/cloud/inference/{mlcatalog_model_card.py → inference_model.py} RENAMED Viewed

@@ -6,10 +6,10 @@ from pydantic import Field as FieldInfo
 from ...._models import BaseModel
-__all__ = ["MlcatalogModelCard"]
+__all__ = ["InferenceModel"]
-class MlcatalogModelCard(BaseModel):
+class InferenceModel(BaseModel):
     id: str
     """Model ID."""

gcore/types/cloud/inference/{inference_registry_credential.py → inference_registry_credentials.py} RENAMED Viewed

@@ -2,10 +2,10 @@
 from ...._models import BaseModel
-__all__ = ["InferenceRegistryCredential"]
+__all__ = ["InferenceRegistryCredentials"]
-class InferenceRegistryCredential(BaseModel):
+class InferenceRegistryCredentials(BaseModel):
     name: str
     """Registry credential name."""

gcore/types/cloud/inference/{inference_registry_credential_full.py → inference_registry_credentials_create.py} RENAMED Viewed

@@ -2,10 +2,10 @@
 from ...._models import BaseModel
-__all__ = ["InferenceRegistryCredentialFull"]
+__all__ = ["InferenceRegistryCredentialsCreate"]
-class InferenceRegistryCredentialFull(BaseModel):
+class InferenceRegistryCredentialsCreate(BaseModel):
     name: str
     """Registry credential name."""

gcore 0.3.0__py3-none-any.whl → 0.5.0__py3-none-any.whl

Potentially problematic release.

gcore 0.3.0__py3-none-any.whl → 0.5.0__py3-none-any.whl