PyPI - kumoai - Versions diffs - 2.14.0.dev202601011731__cp310-cp310-manylinux_2_27_x86_64.manylinux_2_28_x86_64.whl - Mend

kumoai 2.14.0.dev202601011731__cp310-cp310-manylinux_2_27_x86_64.manylinux_2_28_x86_64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of kumoai might be problematic. Click here for more details.

Files changed (122) hide show

kumoai/__init__.py +300 -0
kumoai/_logging.py +29 -0
kumoai/_singleton.py +25 -0
kumoai/_version.py +1 -0
kumoai/artifact_export/__init__.py +9 -0
kumoai/artifact_export/config.py +209 -0
kumoai/artifact_export/job.py +108 -0
kumoai/client/__init__.py +5 -0
kumoai/client/client.py +223 -0
kumoai/client/connector.py +110 -0
kumoai/client/endpoints.py +150 -0
kumoai/client/graph.py +120 -0
kumoai/client/jobs.py +471 -0
kumoai/client/online.py +78 -0
kumoai/client/pquery.py +207 -0
kumoai/client/rfm.py +112 -0
kumoai/client/source_table.py +53 -0
kumoai/client/table.py +101 -0
kumoai/client/utils.py +130 -0
kumoai/codegen/__init__.py +19 -0
kumoai/codegen/cli.py +100 -0
kumoai/codegen/context.py +16 -0
kumoai/codegen/edits.py +473 -0
kumoai/codegen/exceptions.py +10 -0
kumoai/codegen/generate.py +222 -0
kumoai/codegen/handlers/__init__.py +4 -0
kumoai/codegen/handlers/connector.py +118 -0
kumoai/codegen/handlers/graph.py +71 -0
kumoai/codegen/handlers/pquery.py +62 -0
kumoai/codegen/handlers/table.py +109 -0
kumoai/codegen/handlers/utils.py +42 -0
kumoai/codegen/identity.py +114 -0
kumoai/codegen/loader.py +93 -0
kumoai/codegen/naming.py +94 -0
kumoai/codegen/registry.py +121 -0
kumoai/connector/__init__.py +31 -0
kumoai/connector/base.py +153 -0
kumoai/connector/bigquery_connector.py +200 -0
kumoai/connector/databricks_connector.py +213 -0
kumoai/connector/file_upload_connector.py +189 -0
kumoai/connector/glue_connector.py +150 -0
kumoai/connector/s3_connector.py +278 -0
kumoai/connector/snowflake_connector.py +252 -0
kumoai/connector/source_table.py +471 -0
kumoai/connector/utils.py +1796 -0
kumoai/databricks.py +14 -0
kumoai/encoder/__init__.py +4 -0
kumoai/exceptions.py +26 -0
kumoai/experimental/__init__.py +0 -0
kumoai/experimental/rfm/__init__.py +210 -0
kumoai/experimental/rfm/authenticate.py +432 -0
kumoai/experimental/rfm/backend/__init__.py +0 -0
kumoai/experimental/rfm/backend/local/__init__.py +42 -0
kumoai/experimental/rfm/backend/local/graph_store.py +297 -0
kumoai/experimental/rfm/backend/local/sampler.py +312 -0
kumoai/experimental/rfm/backend/local/table.py +113 -0
kumoai/experimental/rfm/backend/snow/__init__.py +37 -0
kumoai/experimental/rfm/backend/snow/sampler.py +297 -0
kumoai/experimental/rfm/backend/snow/table.py +242 -0
kumoai/experimental/rfm/backend/sqlite/__init__.py +32 -0
kumoai/experimental/rfm/backend/sqlite/sampler.py +398 -0
kumoai/experimental/rfm/backend/sqlite/table.py +184 -0
kumoai/experimental/rfm/base/__init__.py +30 -0
kumoai/experimental/rfm/base/column.py +152 -0
kumoai/experimental/rfm/base/expression.py +44 -0
kumoai/experimental/rfm/base/sampler.py +761 -0
kumoai/experimental/rfm/base/source.py +19 -0
kumoai/experimental/rfm/base/sql_sampler.py +143 -0
kumoai/experimental/rfm/base/table.py +736 -0
kumoai/experimental/rfm/graph.py +1237 -0
kumoai/experimental/rfm/infer/__init__.py +19 -0
kumoai/experimental/rfm/infer/categorical.py +40 -0
kumoai/experimental/rfm/infer/dtype.py +82 -0
kumoai/experimental/rfm/infer/id.py +46 -0
kumoai/experimental/rfm/infer/multicategorical.py +48 -0
kumoai/experimental/rfm/infer/pkey.py +128 -0
kumoai/experimental/rfm/infer/stype.py +35 -0
kumoai/experimental/rfm/infer/time_col.py +61 -0
kumoai/experimental/rfm/infer/timestamp.py +41 -0
kumoai/experimental/rfm/pquery/__init__.py +7 -0
kumoai/experimental/rfm/pquery/executor.py +102 -0
kumoai/experimental/rfm/pquery/pandas_executor.py +530 -0
kumoai/experimental/rfm/relbench.py +76 -0
kumoai/experimental/rfm/rfm.py +1184 -0
kumoai/experimental/rfm/sagemaker.py +138 -0
kumoai/experimental/rfm/task_table.py +231 -0
kumoai/formatting.py +30 -0
kumoai/futures.py +99 -0
kumoai/graph/__init__.py +12 -0
kumoai/graph/column.py +106 -0
kumoai/graph/graph.py +948 -0
kumoai/graph/table.py +838 -0
kumoai/jobs.py +80 -0
kumoai/kumolib.cpython-310-x86_64-linux-gnu.so +0 -0
kumoai/mixin.py +28 -0
kumoai/pquery/__init__.py +25 -0
kumoai/pquery/prediction_table.py +287 -0
kumoai/pquery/predictive_query.py +641 -0
kumoai/pquery/training_table.py +424 -0
kumoai/spcs.py +121 -0
kumoai/testing/__init__.py +8 -0
kumoai/testing/decorators.py +57 -0
kumoai/testing/snow.py +50 -0
kumoai/trainer/__init__.py +42 -0
kumoai/trainer/baseline_trainer.py +93 -0
kumoai/trainer/config.py +2 -0
kumoai/trainer/distilled_trainer.py +175 -0
kumoai/trainer/job.py +1192 -0
kumoai/trainer/online_serving.py +258 -0
kumoai/trainer/trainer.py +475 -0
kumoai/trainer/util.py +103 -0
kumoai/utils/__init__.py +11 -0
kumoai/utils/datasets.py +83 -0
kumoai/utils/display.py +51 -0
kumoai/utils/forecasting.py +209 -0
kumoai/utils/progress_logger.py +343 -0
kumoai/utils/sql.py +3 -0
kumoai-2.14.0.dev202601011731.dist-info/METADATA +71 -0
kumoai-2.14.0.dev202601011731.dist-info/RECORD +122 -0
kumoai-2.14.0.dev202601011731.dist-info/WHEEL +6 -0
kumoai-2.14.0.dev202601011731.dist-info/licenses/LICENSE +9 -0
kumoai-2.14.0.dev202601011731.dist-info/top_level.txt +1 -0

kumoai/pquery/predictive_query.py ADDED Viewed

@@ -0,0 +1,641 @@
+import logging
+from typing import List, Literal, Mapping, Optional, Tuple, Union, overload
+from kumoapi.jobs import (
+    GeneratePredictionTableRequest,
+    GenerateTrainTableRequest,
+)
+from kumoapi.model_plan import (
+    InferredType,
+    PredictionTableGenerationPlan,
+    RunMode,
+    SuggestModelPlanRequest,
+    TrainingTableGenerationPlan,
+)
+from kumoapi.pquery import PQueryResource
+from kumoapi.task import TaskType
+from kumoapi.train import TrainingTableSpec
+from typing_extensions import Self
+from kumoai import global_state
+from kumoai.client.jobs import (
+    GeneratePredictionTableJobID,
+    GenerateTrainTableJobID,
+    TrainingJobAPI,
+)
+from kumoai.graph import Graph
+from kumoai.pquery.prediction_table import PredictionTable, PredictionTableJob
+from kumoai.pquery.training_table import TrainingTable, TrainingTableJob
+from kumoai.trainer import (
+    BaselineTrainer,
+    ModelPlan,
+    Trainer,
+    TrainingJob,
+    TrainingJobResult,
+)
+from kumoai.trainer.job import BaselineJob, BaselineJobResult
+# Module-level logger, named after this module.
+logger = logging.getLogger(__name__)
+# Alias for the identifier type returned by `PredictiveQuery.save`.
+PredictiveQueryID = str
+class PredictiveQuery:
+    r"""The Kumo predictive query is a declarative syntax for describing a
+    machine learning task. Predictive queries are written using the predictive
+    query language (PQL), a concise SQL-like syntax that allows you to define a
+    model for a new business problem.
+    A predictive query object can be created from a
+    :class:`~kumoai.graph.Graph` and a query string. For information on the
+    construction of a query string, please visit the Kumo
+    `documentation <https://docs.kumo.ai/docs/pquery-structure/>`__.
+    .. code-block:: python
+        import kumoai
+        # See `Graph` documentation for more information:
+        graph = kumoai.Graph(...)
+        # Create a predictive query representing a machine learning problem
+        # over this Graph:
+        pquery = kumoai.PredictiveQuery(
+            graph=graph,
+            query=(
+                "PREDICT MAX(transaction.Quantity, 0, 30) "
+                "FOR EACH customer.CustomerID"
+            ),
+        )
+        # Validate the predictive query configuration, for syntax and
+        # correctness:
+        pquery.validate(verbose=True)
+        # Get the machine learning task type corresponding to this predictive
+        # query (e.g. binary classification, regression, link prediction, etc.)
+        print(pquery.get_task_type())
+        # Suggest a training table generation plan and use it to generate a
+        # training table from this query, to be used in `Trainer.fit`:
+        training_table_plan = pquery.suggest_training_table_plan()
+        training_table = pquery.generate_training_table(training_table_plan)
+        # Suggest a prediction table generation plan and use it to generate a
+        # prediction table from this query, to be used in `Trainer.predict`:
+        pred_table_plan = pquery.suggest_prediction_table_plan()
+        pred_table = pquery.generate_prediction_table(pred_table_plan)
+    Args:
+        graph: The :class:`~kumoai.graph.Graph` object which the predictive
+            query is defined over.
+        query: A string representation of the predictive query.
+    """
+    def __init__(
+        self,
+        graph: Graph,
+        query: str,
+    ) -> None:
+        self.graph = graph
+        self.query = query
+        # The most recently generated training and prediction tables are
+        # cached on the query, so that `fit` can reuse an existing training
+        # table. Each slot holds either the finished table or the launched
+        # job, and stays `None` until the matching `generate_*` method runs.
+        # Users can inspect them through the `train_table` and
+        # `prediction_table` properties, but cannot set them; any advanced
+        # configuration must be done directly via `Trainer`:
+        self._train_table: Optional[Union[TrainingTable,
+                                          TrainingTableJob]] = None
+        self._prediction_table: Optional[Union[PredictionTable,
+                                               PredictionTableJob]] = None
+    # Metadata ################################################################
+    @property
+    def id(self) -> str:
+        r"""Returns the unique ID for this predictive query, determined from
+        its schema and the schema of its associated graph. Two queries that
+        differ either in their syntax or in their graph will have different
+        ids.
+        Note that every access calls :meth:`save`, which validates the query
+        and issues requests to the Kumo backend; a :class:`ValueError` is
+        raised if the query does not validate.
+        """
+        return self.save()
+    @property
+    def train_table(self) -> Union[TrainingTable, TrainingTableJob]:
+        r"""Returns the training table that was last generated by this
+        predictive query. If the predictive query has not yet generated a
+        training table, raises a :class:`ValueError`.
+        Note that the training table may be of type
+        :class:`~kumoai.pquery.TrainingTable` or
+        :class:`~kumoai.pquery.TrainingTableJob`, depending on whether the
+        training table was generated with or without waiting for its
+        completion, respectively.
+        """
+        if not self._train_table:
+            raise ValueError(
+                "This predictive query has not yet generated a training "
+                "table. Please call `generate_training_table` to generate "
+                "a training table before proceeding.")
+        return self._train_table
+    @property
+    def prediction_table(self) -> Union[PredictionTable, PredictionTableJob]:
+        r"""Returns the prediction table that was last generated by this
+        predictive query. If the predictive query has not yet generated a
+        prediction table, raises a :class:`ValueError`.
+        Note that the prediction table may be of type
+        :class:`~kumoai.pquery.PredictionTable` or
+        :class:`~kumoai.pquery.PredictionTableJob`, depending on whether the
+        prediction table was generated with or without waiting for its
+        completion, respectively.
+        """
+        if not self._prediction_table:
+            raise ValueError(
+                "This predictive query has not yet generated a prediction "
+                "table. Please call `generate_prediction_table` to generate a "
+                "prediction table before proceeding.")
+        return self._prediction_table
+    def get_task_type(self) -> TaskType:
+        r"""Returns the task type of this predictive query. The task type of
+        the query corresponds to the machine learning problem that this query
+        translates to in the Kumo platform; for more information about possible
+        task types, please visit the Kumo `documentation
+        <https://docs.kumo.ai/docs/task-types/>`__.
+        """
+        try:
+            self.validate(verbose=False)
+        except ValueError as e:
+            raise ValueError(
+                f"Predictive query {self.query} is improperly configured, so "
+                f"a task type cannot be obtained. Please ensure your query "
+                f"has a valid configuration before proceeding. You can use "
+                f"the `validate` method to verify the validity of your query."
+            ) from e
+        task_type, _ = global_state.client.pquery_api.infer_task_type(
+            pquery_string=self.query, graph_id=self.graph.id)
+        return task_type
+    def validate(self, verbose: bool = True) -> Self:
+        r"""Validates the syntax of this predictive query, ensuring that
+        the query is formulated correctly in Kumo's Predictive Query Language
+        and that the query makes semantic sense (defines a suitable predictive
+        problem) on this :class:`~kumoai.graph.Graph`.
+        Args:
+            verbose: Whether to log non-error output of this validation.
+        Raises:
+            ValueError:
+                if validation fails.
+        Example:
+            >>> import kumoai
+            >>> query = kumoai.PredictiveQuery(...)  # doctest: +SKIP
+            >>> query.validate()  # doctest: +SKIP
+            ValidationResponse(warnings=[], errors=[])
+        """
+        self.graph.save()  # Need a valid graph ID; also validates graph.
+        resp = global_state.client.pquery_api.validate(
+            self._to_api_pquery_resource())
+        if not resp.ok:
+            raise ValueError(resp.error_message())
+        if verbose:
+            if resp.empty():
+                logger.info("Query %s is configured correctly.", self.query)
+            else:
+                logger.warning(resp.message())
+        return self
+    # Persistence #############################################################
+    def _to_api_pquery_resource(
+        self,
+        name: Optional[str] = None,
+    ) -> PQueryResource:
+        r"""Builds the API resource describing this predictive query from its
+        query string and the API definition of its graph, with an empty
+        description.
+        Args:
+            name: Optional name to set on the resource; :meth:`save` passes
+                the template name here.
+        """
+        return PQueryResource(
+            name=name,
+            query_string=self.query,
+            graph=self.graph._to_api_graph_definition(),
+            desc="",
+        )
+    def save(self, name: Optional[str] = None) -> PredictiveQueryID:
+        r"""Saves a predictive query to Kumo, returning a unique ID for this
+        query. If a name is provided, saves it as a named, re-usable template.
+        Args:
+            name: Optional name for the template. If provided, saves the
+                query as a named template. If the name already exists,
+                that template will be overwritten.
+        Example:
+            >>> import kumoai
+            >>> query = kumoai.PredictiveQuery(...)  # doctest: +SKIP
+            >>> query.save()  # doctest: +SKIP
+            pquery-xxx
+            >>> query.save("my_template")  # doctest: +SKIP
+            my_template
+        """
+        try:
+            self.validate(verbose=False)
+        except ValueError as e:
+            raise ValueError(
+                f"Predictive query {self.query} is improperly configured, so "
+                f"it cannot be saved. Please ensure your query "
+                f"has a valid configuration before proceeding. You can use "
+                f"the `validate` method to verify the validity of your query."
+            ) from e
+        if name is not None:
+            template_resource = global_state.client.pquery_api.get_if_exists(
+                name)
+            if template_resource is not None:
+                template_string = template_resource.query_string
+                logger.warning(
+                    ("Predictive query template %s already exists, with "
+                     "query string %s. This template will be overridden with "
+                     "configuration %s."), name, template_string, self.query)
+        self.graph.save()
+        return global_state.client.pquery_api.create(
+            pquery=self._to_api_pquery_resource(name))
+    @classmethod
+    def load(cls, pq_id_or_template: str) -> 'PredictiveQuery':
+        r"""Loads a predictive query from either a predictive query ID or a
+        named template. Returns a :class:`~kumoai.pquery.PredictiveQuery`
+        object that contains the loaded query along with its associated graph,
+        tables, etc.
+        """
+        api = global_state.client.pquery_api
+        res = api.get_if_exists(pq_id_or_template)
+        if not res:
+            raise ValueError(
+                f"Predictive query {pq_id_or_template} was not found.")
+        return cls(
+            graph=Graph._from_api_graph_definition(res.graph),
+            query=res.query_string,
+        )
+    @classmethod
+    def load_from_training_job(cls, training_job_id: str) -> 'PredictiveQuery':
+        r"""Loads a predictive query from a training job, regardless of the
+        training job's status. Returns a
+        :class:`~kumoai.pquery.PredictiveQuery` object that contains the loaded
+        query along with its associated graph, tables, etc.
+        """
+        train_api: TrainingJobAPI = global_state.client.training_job_api
+        job = train_api.get(training_job_id)
+        id_or_name = job.config.pquery_id
+        return PredictiveQuery.load(pq_id_or_template=id_or_name)
+    # Training & Prediction Table Generation ##################################
+    @overload
+    def generate_training_table(
+        self,
+        plan: Optional[TrainingTableGenerationPlan] = None,
+    ) -> TrainingTable:
+        pass
+    @overload
+    def generate_training_table(
+        self,
+        plan: Optional[TrainingTableGenerationPlan] = None,
+        *,
+        non_blocking: Literal[False],
+    ) -> TrainingTable:
+        pass
+    @overload
+    def generate_training_table(
+        self,
+        plan: Optional[TrainingTableGenerationPlan] = None,
+        *,
+        non_blocking: Literal[True],
+    ) -> TrainingTableJob:
+        pass
+    @overload
+    def generate_training_table(
+        self,
+        plan: Optional[TrainingTableGenerationPlan] = None,
+        *,
+        non_blocking: bool,
+    ) -> Union[TrainingTable, TrainingTableJob]:
+        pass
+    def generate_training_table(
+        self,
+        plan: Optional[TrainingTableGenerationPlan] = None,
+        *,
+        non_blocking: bool = False,
+        custom_tags: Mapping[str, str] = {},
+    ) -> Union[TrainingTable, TrainingTableJob]:
+        r"""Generates a training table from the specified :attr:`query`
+        string.
+        Args:
+            plan: A specification of the parameters for training table
+                generation. If not provided, will use an intelligently
+                generated default plan based on the query and graph. This plan
+                is equivalent to the plan inferred with
+                ``suggest_training_table_plan(run_mode=RunMode.NORMAL)``.
+            non_blocking: Whether this operation should return immediately
+                after launching the training table generation job, or await
+                completion of the generated training table.
+            custom_tags: Additional, customer defined k-v tags to be associated
+                with the job to be launched. Job tags are useful for grouping
+                and searching jobs.
+        Returns:
+            Union[TrainingTable, TrainingTableJob]:
+                If ``non_blocking=False``, returns a training table object. If
+                ``non_blocking=True``, returns a training table future object.
+        """
+        pq_id = self.save()
+        # TODO(manan): improve this...
+        if not plan:
+            plan = self.suggest_training_table_plan()
+        train_table_job_api = global_state.client.generate_train_table_job_api
+        job_id: GenerateTrainTableJobID = train_table_job_api.create(
+            GenerateTrainTableRequest(
+                dict(custom_tags),
+                pq_id,
+                plan,
+                None,
+            ))
+        self._train_table = TrainingTableJob(job_id=job_id)
+        if non_blocking:
+            return self._train_table
+        self._train_table = self._train_table.attach()
+        return self._train_table
+    @overload
+    def generate_prediction_table(
+        self,
+        plan: Optional[PredictionTableGenerationPlan] = None,
+    ) -> PredictionTable:
+        pass
+    @overload
+    def generate_prediction_table(
+        self,
+        plan: Optional[PredictionTableGenerationPlan] = None,
+        *,
+        non_blocking: Literal[False],
+    ) -> PredictionTable:
+        pass
+    @overload
+    def generate_prediction_table(
+        self,
+        plan: Optional[PredictionTableGenerationPlan] = None,
+        *,
+        non_blocking: Literal[True],
+    ) -> PredictionTableJob:
+        pass
+    @overload
+    def generate_prediction_table(
+        self,
+        plan: Optional[PredictionTableGenerationPlan] = None,
+        *,
+        non_blocking: bool,
+    ) -> Union[PredictionTable, PredictionTableJob]:
+        pass
+    def generate_prediction_table(
+        self,
+        plan: Optional[PredictionTableGenerationPlan] = None,
+        *,
+        non_blocking: bool = False,
+        custom_tags: Mapping[str, str] = {},
+    ) -> Union[PredictionTable, PredictionTableJob]:
+        r"""Generates a prediction table from the predictive query
+        :attr:`query` string.
+        Args:
+            plan: A specification of the parameters for prediction table
+                generation. If not provided, will use an intelligently
+                generated default plan based on the query and graph. This plan
+                is equivalent to the plan inferred with
+                ``suggest_prediction_table_plan(run_mode=RunMode.NORMAL)``.
+            non_blocking: Whether this operation should return immediately
+                after launching the prediction table generation job, or await
+                completion of the generated prediction table.
+            custom_tags: Additional, customer defined k-v tags to be associated
+                with the job to be launched. Job tags are useful for grouping
+                and searching jobs.
+        Returns:
+            Union[PredictionTable, PredictionTableJob]:
+                If ``non_blocking=False``, returns a prediction table object.
+                If ``non_blocking=True``, returns a prediction table future
+                object.
+        """
+        pq_id = self.save()
+        if not plan:
+            plan = self.suggest_prediction_table_plan()
+        bp_table_api = global_state.client.generate_prediction_table_job_api
+        job_id: GeneratePredictionTableJobID = bp_table_api.create(
+            GeneratePredictionTableRequest(
+                dict(custom_tags),
+                pq_id,
+                plan,
+                None,
+            ))
+        self._prediction_table = PredictionTableJob(job_id=job_id)
+        if non_blocking:
+            return self._prediction_table
+        self._prediction_table = self._prediction_table.result()
+        return self._prediction_table
+    # Training & Prediction ###################################################
+    def suggest_training_table_plan(
+        self,
+        run_mode: RunMode = RunMode.FAST,
+    ) -> TrainingTableGenerationPlan:
+        r"""Suggests a training table generation plan given the predictive
+        query and graph. This training table generation plan can be used to
+        alter the approach Kumo uses to generate the training table for your
+        predictive query.
+        Args:
+            run_mode: A representation of how quickly you would like your
+                predictive query to complete. Faster run modes correspond to
+                lower training times, at the cost of potentially lower
+                performance. Defaults to ``RunMode.FAST``.
+        Returns:
+            The plan suggested by the Kumo backend for this query string,
+            graph and run mode.
+        """
+        # The graph is saved before its ID is sent in the request.
+        self.graph.save()
+        req = SuggestModelPlanRequest(
+            query_string=self.query,
+            graph_id=self.graph.id,
+            run_mode=run_mode,
+        )
+        return global_state.client.pquery_api.suggest_training_table_plan(req)
+    def suggest_prediction_table_plan(self, ) -> PredictionTableGenerationPlan:
+        r"""Suggests a prediction table generation plan given the predictive
+        query and graph. This prediction table generation plan can be used to
+        alter the approach Kumo uses to generate the prediction table for your
+        predictive query.
+        The plan is constructed locally, with its anchor time set to
+        ``InferredType.VALUE``; no request is sent to the Kumo backend.
+        """
+        return PredictionTableGenerationPlan(anchor_time=InferredType.VALUE)
+    def suggest_model_plan(
+        self,
+        run_mode: RunMode = RunMode.FAST,
+        train_table_spec: Optional[TrainingTableSpec] = None,
+    ) -> ModelPlan:
+        r"""Suggests a modeling plan given the predictive query and graph. This
+        model plan can be used to alter the approach Kumo uses to train your
+        machine learning model.
+        Args:
+            run_mode: A representation of how quickly you would like your
+                predictive query to complete. Faster run modes correspond to
+                lower training times, at the cost of potentially lower
+                performance. Defaults to ``RunMode.FAST``.
+            train_table_spec: Needed if the original train table has been
+                modified by adding a weight column.
+        Returns:
+            The model plan suggested by the Kumo backend for this query
+            string, graph, run mode and (optional) training table spec.
+        """
+        # The graph is saved before its ID is sent in the request.
+        self.graph.save()
+        req = SuggestModelPlanRequest(
+            query_string=self.query,
+            graph_id=self.graph.id,
+            run_mode=run_mode,
+            train_table_spec=train_table_spec,
+        )
+        return global_state.client.pquery_api.suggest_model_plan(req)
+    @overload
+    def fit(
+        self,
+        training_table_plan: Optional[TrainingTableGenerationPlan] = None,
+        model_plan: Optional[ModelPlan] = None,
+    ) -> Tuple[Trainer, TrainingJobResult]:
+        pass
+    @overload
+    def fit(
+        self,
+        training_table_plan: Optional[TrainingTableGenerationPlan] = None,
+        model_plan: Optional[ModelPlan] = None,
+        *,
+        non_blocking: Literal[False],
+    ) -> Tuple[Trainer, TrainingJobResult]:
+        pass
+    @overload
+    def fit(
+        self,
+        training_table_plan: Optional[TrainingTableGenerationPlan] = None,
+        model_plan: Optional[ModelPlan] = None,
+        *,
+        non_blocking: Literal[True],
+    ) -> Tuple[Trainer, TrainingJob]:
+        pass
+    @overload
+    def fit(
+        self,
+        training_table_plan: Optional[TrainingTableGenerationPlan] = None,
+        model_plan: Optional[ModelPlan] = None,
+        *,
+        non_blocking: bool,
+    ) -> Tuple[Trainer, Union[TrainingJobResult, TrainingJob]]:
+        pass
+    def fit(
+        self,
+        training_table_plan: Optional[TrainingTableGenerationPlan] = None,
+        model_plan: Optional[ModelPlan] = None,
+        *,
+        non_blocking: bool = False,
+    ) -> Tuple[Trainer, Union[TrainingJobResult, TrainingJob]]:
+        r"""Trains a Kumo model on this predictive query, given optional
+        additional specifications of the training table generation plan and
+        the model plan.
+        Args:
+            training_table_plan: A specification of the parameters for training
+                table generation. If not provided, will use an intelligently
+                generated default plan based on the query and graph. This plan
+                is equivalent to the plan inferred with
+                ``suggest_training_table_plan(run_mode=RunMode.NORMAL)``.
+            model_plan: A specification of the parameters for model training.
+                If not provided, will use an intelligently generated default
+                plan based on the query and graph. This plan
+                is equivalent to the plan inferred with
+                ``suggest_model_plan(run_mode=RunMode.NORMAL)``.
+            non_blocking: Whether this operation should return immediately
+                after launching the training job, or await completion of the
+                training job.
+        Returns:
+            Tuple[Trainer, Union[TrainingJobResult, TrainingJob]]:
+                A tuple with two elements. The first element is the trainer
+                object used to launch the training job. The second element
+                is either a training job object (if ``non_blocking=True``)
+                or a training job future object (if ``non_blocking=False``).
+        """
+        # If we have already generated the training table, use it with Trainer:
+        if self._train_table is None:
+            # Nonblocking generate:
+            self._train_table = self.generate_training_table(
+                training_table_plan, non_blocking=True)
+        # TODO(manan): what if `self._train_table` represents a failed job?
+        model_plan = model_plan or self.suggest_model_plan()
+        trainer = Trainer(model_plan)
+        return (trainer,
+                trainer.fit(self.graph, self.train_table,
+                            non_blocking=non_blocking))
+    def generate_baseline(
+        self,
+        metrics: List[str],
+        train_table: Union[TrainingTable, TrainingTableJob],
+        *,
+        non_blocking: bool = False,
+    ) -> Union[BaselineJob, BaselineJobResult]:
+        r"""Runs a baseline model on this predictive query's graph and the
+        given training table, evaluated on the given metrics.
+        Args:
+            metrics (List[str]): A list of metrics that the baseline model
+                will be evaluated on.
+            train_table (Union[TrainingTable, TrainingTableJob]): The
+                :class:`~kumoai.pquery.TrainingTable`, or in-progress
+                :class:`~kumoai.pquery.TrainingTableJob` that represents
+                the training data produced by a
+                :class:`~kumoai.pquery.PredictiveQuery` on :obj:`graph`.
+            non_blocking (bool): Whether this operation should
+                return immediately after launching the baseline job, or await
+                completion of the baseline job. Defaults to False.
+        Returns:
+            Union[BaselineJob, BaselineJobResult]: the value returned by
+                ``BaselineTrainer.run``; presumably a baseline job future
+                object (if ``non_blocking=True``) or a baseline job result
+                object (if ``non_blocking=False``) -- TODO confirm against
+                ``BaselineTrainer.run``.
+        """ # noqa
+        baseline_trainer = BaselineTrainer(metrics)
+        return baseline_trainer.run(self.graph, train_table,
+                                    non_blocking=non_blocking)