kumoai 2.14.0.dev202601011731__cp310-cp310-manylinux_2_27_x86_64.manylinux_2_28_x86_64.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of kumoai might be problematic. Click here for more details.
- kumoai/__init__.py +300 -0
- kumoai/_logging.py +29 -0
- kumoai/_singleton.py +25 -0
- kumoai/_version.py +1 -0
- kumoai/artifact_export/__init__.py +9 -0
- kumoai/artifact_export/config.py +209 -0
- kumoai/artifact_export/job.py +108 -0
- kumoai/client/__init__.py +5 -0
- kumoai/client/client.py +223 -0
- kumoai/client/connector.py +110 -0
- kumoai/client/endpoints.py +150 -0
- kumoai/client/graph.py +120 -0
- kumoai/client/jobs.py +471 -0
- kumoai/client/online.py +78 -0
- kumoai/client/pquery.py +207 -0
- kumoai/client/rfm.py +112 -0
- kumoai/client/source_table.py +53 -0
- kumoai/client/table.py +101 -0
- kumoai/client/utils.py +130 -0
- kumoai/codegen/__init__.py +19 -0
- kumoai/codegen/cli.py +100 -0
- kumoai/codegen/context.py +16 -0
- kumoai/codegen/edits.py +473 -0
- kumoai/codegen/exceptions.py +10 -0
- kumoai/codegen/generate.py +222 -0
- kumoai/codegen/handlers/__init__.py +4 -0
- kumoai/codegen/handlers/connector.py +118 -0
- kumoai/codegen/handlers/graph.py +71 -0
- kumoai/codegen/handlers/pquery.py +62 -0
- kumoai/codegen/handlers/table.py +109 -0
- kumoai/codegen/handlers/utils.py +42 -0
- kumoai/codegen/identity.py +114 -0
- kumoai/codegen/loader.py +93 -0
- kumoai/codegen/naming.py +94 -0
- kumoai/codegen/registry.py +121 -0
- kumoai/connector/__init__.py +31 -0
- kumoai/connector/base.py +153 -0
- kumoai/connector/bigquery_connector.py +200 -0
- kumoai/connector/databricks_connector.py +213 -0
- kumoai/connector/file_upload_connector.py +189 -0
- kumoai/connector/glue_connector.py +150 -0
- kumoai/connector/s3_connector.py +278 -0
- kumoai/connector/snowflake_connector.py +252 -0
- kumoai/connector/source_table.py +471 -0
- kumoai/connector/utils.py +1796 -0
- kumoai/databricks.py +14 -0
- kumoai/encoder/__init__.py +4 -0
- kumoai/exceptions.py +26 -0
- kumoai/experimental/__init__.py +0 -0
- kumoai/experimental/rfm/__init__.py +210 -0
- kumoai/experimental/rfm/authenticate.py +432 -0
- kumoai/experimental/rfm/backend/__init__.py +0 -0
- kumoai/experimental/rfm/backend/local/__init__.py +42 -0
- kumoai/experimental/rfm/backend/local/graph_store.py +297 -0
- kumoai/experimental/rfm/backend/local/sampler.py +312 -0
- kumoai/experimental/rfm/backend/local/table.py +113 -0
- kumoai/experimental/rfm/backend/snow/__init__.py +37 -0
- kumoai/experimental/rfm/backend/snow/sampler.py +297 -0
- kumoai/experimental/rfm/backend/snow/table.py +242 -0
- kumoai/experimental/rfm/backend/sqlite/__init__.py +32 -0
- kumoai/experimental/rfm/backend/sqlite/sampler.py +398 -0
- kumoai/experimental/rfm/backend/sqlite/table.py +184 -0
- kumoai/experimental/rfm/base/__init__.py +30 -0
- kumoai/experimental/rfm/base/column.py +152 -0
- kumoai/experimental/rfm/base/expression.py +44 -0
- kumoai/experimental/rfm/base/sampler.py +761 -0
- kumoai/experimental/rfm/base/source.py +19 -0
- kumoai/experimental/rfm/base/sql_sampler.py +143 -0
- kumoai/experimental/rfm/base/table.py +736 -0
- kumoai/experimental/rfm/graph.py +1237 -0
- kumoai/experimental/rfm/infer/__init__.py +19 -0
- kumoai/experimental/rfm/infer/categorical.py +40 -0
- kumoai/experimental/rfm/infer/dtype.py +82 -0
- kumoai/experimental/rfm/infer/id.py +46 -0
- kumoai/experimental/rfm/infer/multicategorical.py +48 -0
- kumoai/experimental/rfm/infer/pkey.py +128 -0
- kumoai/experimental/rfm/infer/stype.py +35 -0
- kumoai/experimental/rfm/infer/time_col.py +61 -0
- kumoai/experimental/rfm/infer/timestamp.py +41 -0
- kumoai/experimental/rfm/pquery/__init__.py +7 -0
- kumoai/experimental/rfm/pquery/executor.py +102 -0
- kumoai/experimental/rfm/pquery/pandas_executor.py +530 -0
- kumoai/experimental/rfm/relbench.py +76 -0
- kumoai/experimental/rfm/rfm.py +1184 -0
- kumoai/experimental/rfm/sagemaker.py +138 -0
- kumoai/experimental/rfm/task_table.py +231 -0
- kumoai/formatting.py +30 -0
- kumoai/futures.py +99 -0
- kumoai/graph/__init__.py +12 -0
- kumoai/graph/column.py +106 -0
- kumoai/graph/graph.py +948 -0
- kumoai/graph/table.py +838 -0
- kumoai/jobs.py +80 -0
- kumoai/kumolib.cpython-310-x86_64-linux-gnu.so +0 -0
- kumoai/mixin.py +28 -0
- kumoai/pquery/__init__.py +25 -0
- kumoai/pquery/prediction_table.py +287 -0
- kumoai/pquery/predictive_query.py +641 -0
- kumoai/pquery/training_table.py +424 -0
- kumoai/spcs.py +121 -0
- kumoai/testing/__init__.py +8 -0
- kumoai/testing/decorators.py +57 -0
- kumoai/testing/snow.py +50 -0
- kumoai/trainer/__init__.py +42 -0
- kumoai/trainer/baseline_trainer.py +93 -0
- kumoai/trainer/config.py +2 -0
- kumoai/trainer/distilled_trainer.py +175 -0
- kumoai/trainer/job.py +1192 -0
- kumoai/trainer/online_serving.py +258 -0
- kumoai/trainer/trainer.py +475 -0
- kumoai/trainer/util.py +103 -0
- kumoai/utils/__init__.py +11 -0
- kumoai/utils/datasets.py +83 -0
- kumoai/utils/display.py +51 -0
- kumoai/utils/forecasting.py +209 -0
- kumoai/utils/progress_logger.py +343 -0
- kumoai/utils/sql.py +3 -0
- kumoai-2.14.0.dev202601011731.dist-info/METADATA +71 -0
- kumoai-2.14.0.dev202601011731.dist-info/RECORD +122 -0
- kumoai-2.14.0.dev202601011731.dist-info/WHEEL +6 -0
- kumoai-2.14.0.dev202601011731.dist-info/licenses/LICENSE +9 -0
- kumoai-2.14.0.dev202601011731.dist-info/top_level.txt +1 -0
kumoai/client/jobs.py
ADDED
|
@@ -0,0 +1,471 @@
|
|
|
1
|
+
from datetime import datetime
|
|
2
|
+
from typing import (
|
|
3
|
+
Any,
|
|
4
|
+
Dict,
|
|
5
|
+
Generic,
|
|
6
|
+
List,
|
|
7
|
+
Mapping,
|
|
8
|
+
Optional,
|
|
9
|
+
Tuple,
|
|
10
|
+
Type,
|
|
11
|
+
TypeVar,
|
|
12
|
+
)
|
|
13
|
+
|
|
14
|
+
from kumoapi.common import ValidationResponse
|
|
15
|
+
from kumoapi.jobs import (
|
|
16
|
+
ArtifactExportRequest,
|
|
17
|
+
ArtifactExportResponse,
|
|
18
|
+
AutoTrainerProgress,
|
|
19
|
+
BaselineJobRequest,
|
|
20
|
+
BaselineJobResource,
|
|
21
|
+
BatchPredictionJobResource,
|
|
22
|
+
BatchPredictionRequest,
|
|
23
|
+
CancelBatchPredictionJobResponse,
|
|
24
|
+
CancelTrainingJobResponse,
|
|
25
|
+
DistillationJobRequest,
|
|
26
|
+
DistillationJobResource,
|
|
27
|
+
ErrorDetails,
|
|
28
|
+
GeneratePredictionTableJobResource,
|
|
29
|
+
GeneratePredictionTableRequest,
|
|
30
|
+
GenerateTrainTableJobResource,
|
|
31
|
+
GenerateTrainTableRequest,
|
|
32
|
+
GetEmbeddingsDfUrlResponse,
|
|
33
|
+
GetPredictionsDfUrlResponse,
|
|
34
|
+
JobRequestBase,
|
|
35
|
+
JobResourceBase,
|
|
36
|
+
JobStatus,
|
|
37
|
+
PredictionProgress,
|
|
38
|
+
TrainingJobRequest,
|
|
39
|
+
TrainingJobResource,
|
|
40
|
+
TrainingTableSpec,
|
|
41
|
+
)
|
|
42
|
+
from kumoapi.json_serde import from_json, to_json_dict
|
|
43
|
+
from kumoapi.source_table import LLMRequest, LLMResponse, SourceTableType
|
|
44
|
+
from kumoapi.train import TrainingStage
|
|
45
|
+
from typing_extensions import override
|
|
46
|
+
|
|
47
|
+
from kumoai.client import KumoClient
|
|
48
|
+
from kumoai.client.utils import (
|
|
49
|
+
Returns,
|
|
50
|
+
parse_patch_response,
|
|
51
|
+
parse_response,
|
|
52
|
+
raise_on_error,
|
|
53
|
+
)
|
|
54
|
+
|
|
55
|
+
# Type aliases for the string identifiers returned by the various job APIs.
# They exist purely for readability in signatures; at runtime each is `str`.
TrainingJobID = str
BatchPredictionJobID = str
GenerateTrainTableJobID = str
GeneratePredictionTableJobID = str
LLMJobId = str
BaselineJobID = str

# Generic parameters for `CommonJobAPI`: the request payload type and the
# resource type returned by the backend, bounded by the kumoapi base classes.
JobRequestType = TypeVar('JobRequestType', bound=JobRequestBase)
JobResourceType = TypeVar('JobResourceType', bound=JobResourceBase)
|
|
64
|
+
|
|
65
|
+
|
|
66
|
+
class CommonJobAPI(Generic[JobRequestType, JobResourceType]):
    r"""Shared REST operations for Kumo job resources.

    Concrete job APIs subclass this with a specific request/resource type
    pair and the REST base endpoint that serves them.
    """
    def __init__(self, client: KumoClient, base_endpoint: str,
                 res_type: Type[JobResourceType]) -> None:
        self._client = client
        self._base_endpoint = base_endpoint
        self._res_type = res_type

    def create(self, request: JobRequestType) -> str:
        r"""Submits a new job and returns its backend-assigned ID."""
        resp = self._client._post(self._base_endpoint,
                                  json=to_json_dict(request))
        raise_on_error(resp)
        payload = parse_response(Dict[str, str], resp)
        return payload['id']

    def get(self, id: str) -> JobResourceType:
        r"""Fetches the job resource with the given ID."""
        resp = self._client._get(f'{self._base_endpoint}/{id}')
        raise_on_error(resp)
        return parse_response(self._res_type, resp)

    def list(
        self,
        *,
        pquery_name: Optional[str] = None,
        pquery_id: Optional[str] = None,
        job_status: Optional[JobStatus] = None,
        limit: Optional[int] = None,
        additional_tags: Mapping[str, str] = {},
    ) -> List[JobResourceType]:
        r"""Lists job resources matching the given filters.

        Args:
            pquery_name: Filter by predictive query name.
            pquery_id: Filter by predictive query ID.
            job_status: Filter by job status.
            limit: Maximum number of resources to return.
            additional_tags: Extra tag filters, merged into the query string.
        """
        params: Dict[str, Any] = {
            'pquery_name': pquery_name,
            'pquery_id': pquery_id,
            'job_status': job_status,
            'limit': limit,
            **additional_tags,
        }
        resp = self._client._get(self._base_endpoint, params=params)
        raise_on_error(resp)
        elements = resp.json()
        assert isinstance(elements, list)
        resources: List[JobResourceType] = []
        for element in elements:
            resources.append(from_json(element, self._res_type))
        return resources

    def delete_tags(self, job_id: str, tags: List[str]) -> bool:
        r"""Removes the tags from the job.

        Args:
            job_id (str): The ID of the job.
            tags (List[str]): The tags to remove.
        """
        # The backend treats the sentinel value 'none' as tag removal.
        removals = dict.fromkeys(tags, 'none')
        return self.update_tags(job_id, removals)

    def update_tags(self, job_id: str,
                    custom_job_tags: Mapping[str, Optional[str]]) -> bool:
        r"""Updates the tags of the job.

        Args:
            job_id (str): The ID of the job.
            custom_job_tags (Mapping[str, Optional[str]]): The tags to update.
                Note that the value 'none' will remove the tag. If the tag is
                not present, it will be added.
        """
        # Tag values travel in the query string, so stringify each one.
        stringified = {key: str(val) for key, val in custom_job_tags.items()}
        resp = self._client._patch(
            f'{self._base_endpoint}/{job_id}/tags',
            data=None,
            params=stringified,
        )
        raise_on_error(resp)
        return parse_patch_response(resp)
|
|
135
|
+
|
|
136
|
+
|
|
137
|
+
class BaselineJobAPI(CommonJobAPI[BaselineJobRequest, BaselineJobResource]):
    r"""Typed API definition for the baseline job resource."""
    def __init__(self, client: KumoClient) -> None:
        super().__init__(client, '/baseline_jobs', BaselineJobResource)

    def get_config(self, job_id: str) -> BaselineJobRequest:
        """Load the configuration for a baseline job by ID."""
        return self.get(job_id).config
|
|
146
|
+
|
|
147
|
+
|
|
148
|
+
class TrainingJobAPI(CommonJobAPI[TrainingJobRequest, TrainingJobResource]):
    r"""Typed API definition for the training job resource."""
    def __init__(self, client: KumoClient) -> None:
        super().__init__(client, '/training_jobs', TrainingJobResource)

    def get_progress(self, id: TrainingJobID) -> AutoTrainerProgress:
        r"""Fetches the trainer progress for a training job."""
        resp = self._client._get(f'{self._base_endpoint}/{id}/progress')
        raise_on_error(resp)
        return parse_response(AutoTrainerProgress, resp)

    def holdout_data_url(self, id: TrainingJobID,
                         presigned: bool = True) -> str:
        r"""Returns a URL pointing at the holdout data of a training job.

        Args:
            id: The training job ID.
            presigned: Whether to request a presigned URL.
        """
        resp = self._client._get(f'{self._base_endpoint}/{id}/holdout',
                                 params={'presigned': presigned})
        raise_on_error(resp)
        # The endpoint returns the URL as a plain-text body.
        return resp.text

    def cancel(self, id: str) -> CancelTrainingJobResponse:
        r"""Cancels a running training job."""
        resp = self._client._post(f'{self._base_endpoint}/{id}/cancel')
        raise_on_error(resp)
        return parse_response(CancelTrainingJobResponse, resp)

    def get_config(self, job_id: str) -> TrainingJobRequest:
        """Load the configuration for a training job by ID."""
        return self.get(job_id).config
|
|
174
|
+
|
|
175
|
+
|
|
176
|
+
class DistillationJobAPI(CommonJobAPI[DistillationJobRequest,
                                      DistillationJobResource]):
    r"""Typed API definition for the distillation job resource."""
    def __init__(self, client: KumoClient) -> None:
        super().__init__(client, '/training_jobs/distilled_training_job',
                         DistillationJobResource)

    def get_config(self, job_id: str) -> DistillationJobRequest:
        # Not yet supported server-side for distillation jobs.
        raise NotImplementedError(
            "Getting the configuration for a distillation job is "
            "not implemented yet.")

    def get_progress(self, id: str) -> AutoTrainerProgress:
        # Not yet supported server-side for distillation jobs.
        raise NotImplementedError(
            "Getting the progress for a distillation job is not "
            "implemented yet.")

    def cancel(self, id: str) -> CancelTrainingJobResponse:
        # Not yet supported server-side for distillation jobs.
        raise NotImplementedError(
            "Cancelling a distillation job is not implemented yet.")
|
|
196
|
+
|
|
197
|
+
|
|
198
|
+
class BatchPredictionJobAPI(CommonJobAPI[BatchPredictionRequest,
                                         BatchPredictionJobResource]):
    r"""Typed API definition for the prediction job resource."""
    def __init__(self, client: KumoClient) -> None:
        super().__init__(client, '/prediction_jobs',
                         BatchPredictionJobResource)

    @override
    def create(self, request: BatchPredictionRequest) -> str:
        # TODO(manan): eventually, all `create` methods should
        # return a validation response:
        raise NotImplementedError

    def maybe_create(
        self, request: BatchPredictionRequest
    ) -> Tuple[Optional[str], ValidationResponse]:
        r"""Submits a prediction job; returns its ID (if created) together
        with the validation outcome."""
        resp = self._client._post(self._base_endpoint,
                                  json=to_json_dict(request))
        raise_on_error(resp)
        return parse_response(
            Returns[Tuple[Optional[str], ValidationResponse]], resp)

    def list(
        self,
        *,
        model_id: Optional[TrainingJobID] = None,
        pquery_name: Optional[str] = None,
        pquery_id: Optional[str] = None,
        job_status: Optional[JobStatus] = None,
        limit: Optional[int] = None,
        additional_tags: Mapping[str, str] = {},
    ) -> List[BatchPredictionJobResource]:
        r"""Lists prediction jobs, optionally filtered by the model
        (training job) that produced them."""
        tags = dict(additional_tags)
        if model_id:
            # The backend models the model filter as a job tag.
            tags['model_id'] = model_id
        return super().list(pquery_name=pquery_name, pquery_id=pquery_id,
                            job_status=job_status, limit=limit,
                            additional_tags=tags)

    def get_progress(self, id: str) -> PredictionProgress:
        r"""Fetches the progress of a batch prediction job."""
        resp = self._client._get(f'{self._base_endpoint}/{id}/progress')
        raise_on_error(resp)
        return parse_response(PredictionProgress, resp)

    def cancel(self, id: str) -> CancelBatchPredictionJobResponse:
        r"""Cancels a running batch prediction job."""
        resp = self._client._post(f'{self._base_endpoint}/{id}/cancel')
        raise_on_error(resp)
        return parse_response(CancelBatchPredictionJobResponse, resp)

    def get_batch_predictions_url(self, id: str) -> List[str]:
        """Returns presigned URLs pointing to the locations where the
        predictions are stored. Depending on the environment where this is run,
        they could be AWS S3 paths, Snowflake stage paths, or Databricks UC
        volume paths.

        Args:
            id (str): ID of the batch prediction job for which predictions are
                requested
        """
        resp = self._client._get(
            f'{self._base_endpoint}/{id}/get_prediction_df_urls')
        raise_on_error(resp)
        parsed = parse_response(GetPredictionsDfUrlResponse, resp)
        return parsed.prediction_partitions

    def get_batch_embeddings_url(self, id: str) -> List[str]:
        """Returns presigned URLs pointing to the locations where the
        embeddings are stored. Depending on the environment where this is run,
        they could be AWS S3 paths, Snowflake stage paths, or Databricks UC
        volume paths.

        Args:
            id (str): ID of the batch prediction job for which embeddings are
                requested
        """
        resp = self._client._get(
            f'{self._base_endpoint}/{id}/get_embedding_df_urls')
        raise_on_error(resp)
        parsed = parse_response(GetEmbeddingsDfUrlResponse, resp)
        return parsed.embedding_partitions

    def get_config(self, job_id: str) -> BatchPredictionRequest:
        """Load the configuration for a batch prediction job by ID."""
        return self.get(job_id).config
|
|
286
|
+
|
|
287
|
+
|
|
288
|
+
class GenerateTrainTableJobAPI(CommonJobAPI[GenerateTrainTableRequest,
                                            GenerateTrainTableJobResource]):
    r"""Typed API definition for training table generation job resource."""
    def __init__(self, client: KumoClient) -> None:
        super().__init__(client, '/gentraintable_jobs',
                         GenerateTrainTableJobResource)

    def get_table_data(self, id: GenerateTrainTableJobID,
                       presigned: bool = True) -> List[str]:
        """Return a list of URLs to access train table parquet data.
        There might be multiple URLs if the table data is partitioned into
        multiple files.
        """
        return self._get_table_data(id, presigned)

    def _get_table_data(self, id: GenerateTrainTableJobID,
                        presigned: bool = True,
                        raw_path: bool = False) -> List[str]:
        """Helper function to get train table data."""
        # Raw path to get local file path instead of SPCS stage path
        params: Dict[str, Any] = {'presigned': presigned, 'raw_path': raw_path}
        resp = self._client._get(f'{self._base_endpoint}/{id}/table_data',
                                 params=params)
        raise_on_error(resp)
        return parse_response(List[str], resp)

    def get_split_masks(
            self, id: GenerateTrainTableJobID) -> Dict[TrainingStage, str]:
        """Return a dictionary of presigned URLs keyed by training stage.
        Each URL points to a torch-serialized (default pickle protocol) file of
        the mask tensor for that training stage.

        Example:
            >>> # code to load a mask tensor:
            >>> import io
            >>> import torch
            >>> import requests
            >>> masks = get_split_masks('some-gen-traintable-job-id')
            >>> data_bytes = requests.get(masks[TrainingStage.TEST]).content
            >>> test_mask_tensor = torch.load(io.BytesIO(data_bytes))
        """
        resp = self._client._get(f'{self._base_endpoint}/{id}/split_masks')
        raise_on_error(resp)
        return parse_response(Dict[TrainingStage, str], resp)

    def get_progress(self, id: str) -> Dict[str, int]:
        """Fetch progress counters for a train-table generation job."""
        response = self._client._get(f'{self._base_endpoint}/{id}/progress')
        raise_on_error(response)
        return parse_response(Dict[str, int], response)

    def cancel(self, id: str) -> None:
        """Cancel a running train-table generation job."""
        response = self._client._post(f'{self._base_endpoint}/{id}/cancel')
        raise_on_error(response)

    def validate_custom_train_table(
        self,
        id: str,
        source_table_type: SourceTableType,
        train_table_mod: TrainingTableSpec,
    ) -> ValidationResponse:
        """Validate a user-provided custom train table for this job.

        Args:
            id (str): ID of the train-table generation job.
            source_table_type (SourceTableType): Definition of the custom
                table to validate.
            train_table_mod (TrainingTableSpec): The training table
                modification spec to validate against.
        """
        response = self._client._post(
            f'{self._base_endpoint}/{id}/validate_custom_train_table',
            json=to_json_dict({
                'custom_table': source_table_type,
                'train_table_mod': train_table_mod,
            }),
        )
        # Bug fix: surface transport/HTTP failures before parsing, like every
        # other method in this module; previously a failed request produced a
        # confusing parse error instead of a proper API exception.
        raise_on_error(response)
        return parse_response(ValidationResponse, response)

    def get_job_error(self, id: str) -> ErrorDetails:
        """Thin API wrapper for fetching errors from the jobs.

        Arguments:
            id (str): Id of the job whose related errors are expected to be
                queried.
        """
        response = self._client._get(f'{self._base_endpoint}/{id}/get_errors')
        raise_on_error(response)
        return parse_response(ErrorDetails, response)

    def get_config(self, job_id: str) -> GenerateTrainTableRequest:
        """Load the configuration for a training table generation job by ID."""
        resource = self.get(job_id)
        return resource.config
|
|
372
|
+
|
|
373
|
+
|
|
374
|
+
class GeneratePredictionTableJobAPI(
        CommonJobAPI[GeneratePredictionTableRequest,
                     GeneratePredictionTableJobResource]):
    r"""Typed API definition for prediction table generation job resource."""
    def __init__(self, client: KumoClient) -> None:
        super().__init__(client, '/genpredtable_jobs',
                         GeneratePredictionTableJobResource)

    def get_anchor_time(self, id: BatchPredictionJobID) -> Optional[datetime]:
        r"""Returns the anchor time of the prediction table, if set."""
        resp = self._client._get(
            f'{self._base_endpoint}/{id}/get_anchor_time')
        raise_on_error(resp)
        return parse_response(Returns[Optional[datetime]], resp)

    def get_table_data(self, id: GeneratePredictionTableJobID,
                       presigned: bool = True) -> List[str]:
        """Return a list of URLs to access prediction table parquet data.
        There might be multiple URLs if the table data is partitioned into
        multiple files.
        """
        query: Dict[str, Any] = {'presigned': presigned}
        resp = self._client._get(f'{self._base_endpoint}/{id}/table_data',
                                 params=query)
        raise_on_error(resp)
        return parse_response(List[str], resp)

    def cancel(self, id: str) -> None:
        r"""Cancels a running prediction table generation job."""
        resp = self._client._post(f'{self._base_endpoint}/{id}/cancel')
        raise_on_error(resp)

    def get_job_error(self, id: str) -> ErrorDetails:
        """Thin API wrapper for fetching errors from the jobs.

        Arguments:
            id (str): Id of the job whose related errors are expected to be
                queried.
        """
        resp = self._client._get(f'{self._base_endpoint}/{id}/get_errors')
        raise_on_error(resp)
        return parse_response(ErrorDetails, resp)

    def get_config(self, job_id: str) -> GeneratePredictionTableRequest:
        """Load the configuration for a
        prediction table generation job by ID.
        """
        return self.get(job_id).config
|
|
421
|
+
|
|
422
|
+
|
|
423
|
+
class LLMJobAPI:
    r"""Typed API definition for LLM job resource."""
    def __init__(self, client: KumoClient) -> None:
        self._client = client
        self._base_endpoint = '/llm_embedding_job'

    def create(self, request: LLMRequest) -> LLMJobId:
        r"""Launches an LLM embedding job and returns its job ID."""
        response = self._client._post(
            self._base_endpoint,
            json=to_json_dict(request),
        )
        raise_on_error(response)
        return parse_response(LLMResponse, response).job_id

    def get(self, id: LLMJobId) -> JobStatus:
        r"""Returns the current status of an LLM embedding job."""
        response = self._client._get(f'{self._base_endpoint}/status/{id}')
        raise_on_error(response)
        return parse_response(JobStatus, response)

    def cancel(self, id: LLMJobId) -> JobStatus:
        r"""Cancels an LLM embedding job and returns the resulting status."""
        response = self._client._delete(f'{self._base_endpoint}/cancel/{id}')
        # Bug fix: the raw HTTP response object was previously returned
        # without any error checking, contradicting the declared JobStatus
        # return type. Validate and parse like the sibling endpoints.
        raise_on_error(response)
        return parse_response(JobStatus, response)
|
|
445
|
+
|
|
446
|
+
|
|
447
|
+
class ArtifactExportJobAPI:
    r"""Typed API definition for artifact export job resource."""
    def __init__(self, client: KumoClient) -> None:
        self._client = client
        self._base_endpoint = '/artifact'

    def create(self, request: ArtifactExportRequest) -> str:
        r"""Starts an artifact export and returns the new job's ID."""
        resp = self._client._post(self._base_endpoint,
                                  json=to_json_dict(request))
        raise_on_error(resp)
        return parse_response(ArtifactExportResponse, resp).job_id

    # TODO Add an API in artifact export to get
    # JobStatusReport and not just JobStatus
    def get(self, id: str) -> JobStatus:
        r"""Returns the status of an artifact export job."""
        resp = self._client._get(f'{self._base_endpoint}/{id}')
        raise_on_error(resp)
        return parse_response(JobStatus, resp)

    def cancel(self, id: str) -> JobStatus:
        r"""Cancels an artifact export job and returns its status."""
        resp = self._client._post(f'{self._base_endpoint}/{id}/cancel')
        raise_on_error(resp)
        return parse_response(JobStatus, resp)
|
kumoai/client/online.py
ADDED
|
@@ -0,0 +1,78 @@
|
|
|
1
|
+
from http import HTTPStatus
|
|
2
|
+
from typing import Any, List, Optional
|
|
3
|
+
|
|
4
|
+
from kumoapi.json_serde import to_json_dict
|
|
5
|
+
from kumoapi.online_serving import (
|
|
6
|
+
OnlineServingEndpointRequest,
|
|
7
|
+
OnlineServingEndpointResource,
|
|
8
|
+
)
|
|
9
|
+
|
|
10
|
+
from kumoai.client import KumoClient
|
|
11
|
+
from kumoai.client.endpoints import OnlineServingEndpoints
|
|
12
|
+
from kumoai.client.utils import (
|
|
13
|
+
parse_id_response,
|
|
14
|
+
parse_patch_response,
|
|
15
|
+
parse_response,
|
|
16
|
+
raise_on_error,
|
|
17
|
+
)
|
|
18
|
+
|
|
19
|
+
# Type alias for the string ID of an online serving endpoint resource.
OnlineServingEndpointID = str
|
|
20
|
+
|
|
21
|
+
|
|
22
|
+
class OnlineServingEndpointAPI:
    # Bug fix: the docstring previously read "Typed API definition for Kumo
    # graph definition" — a copy-paste from another API class.
    r"""Typed API definition for the online serving endpoint resource."""
    def __init__(self, client: KumoClient) -> None:
        self._client = client
        self._base_endpoint = '/online_serving_endpoints'

    # TODO(blaz): document final interface
    def create(
        self,
        req: OnlineServingEndpointRequest,
        **query_params: Any,
    ) -> OnlineServingEndpointID:
        """Creates a new online serving endpoint.

        Args:
            req (OnlineServingEndpointRequest): request body.
            **query_params: Additional query parameters to pass to the API.
                For example, ``use_ge`` (bool): if present, overrides the
                graph backend option to use GRAPHENGINE if true else MEMORY.

        Returns:
            OnlineServingEndpointID: unique endpoint resource id.
        """
        resp = self._client._post(
            self._base_endpoint,
            # Omit the query string entirely when no parameters are given.
            params=query_params if query_params else None,
            json=to_json_dict(req),
        )
        raise_on_error(resp)
        return parse_id_response(resp)

    def get_if_exists(
        self, id: OnlineServingEndpointID
    ) -> Optional[OnlineServingEndpointResource]:
        """Fetches the endpoint resource, or returns None when it does not
        exist (HTTP 404)."""
        resp = self._client._request(OnlineServingEndpoints.get.with_id(id))
        if resp.status_code == HTTPStatus.NOT_FOUND:
            return None

        raise_on_error(resp)
        return parse_response(OnlineServingEndpointResource, resp)

    def list(self) -> List[OnlineServingEndpointResource]:
        """Lists all online serving endpoints."""
        resp = self._client._request(OnlineServingEndpoints.list)
        raise_on_error(resp)
        return parse_response(List[OnlineServingEndpointResource], resp)

    def update(self, id: OnlineServingEndpointID,
               req: OnlineServingEndpointRequest) -> bool:
        """Updates an existing endpoint; returns True on success."""
        resp = self._client._request(OnlineServingEndpoints.update.with_id(id),
                                     data=to_json_dict(req))
        raise_on_error(resp)
        return parse_patch_response(resp)

    def delete(self, id: OnlineServingEndpointID) -> None:
        """This is idempotent and can be called multiple times."""
        resp = self._client._request(OnlineServingEndpoints.delete.with_id(id))
        raise_on_error(resp)
|