oracle-ads 2.11.6__py3-none-any.whl → 2.11.8__py3-none-any.whl
This diff compares the contents of two publicly available package versions as released to a supported registry. It is provided for informational purposes only and reflects the changes between the versions exactly as they appear in the public registry.
- ads/aqua/__init__.py +24 -14
- ads/aqua/base.py +0 -2
- ads/aqua/cli.py +50 -2
- ads/aqua/decorator.py +8 -0
- ads/aqua/deployment.py +37 -34
- ads/aqua/evaluation.py +106 -49
- ads/aqua/extension/base_handler.py +18 -10
- ads/aqua/extension/common_handler.py +21 -2
- ads/aqua/extension/deployment_handler.py +1 -4
- ads/aqua/extension/evaluation_handler.py +1 -2
- ads/aqua/extension/finetune_handler.py +0 -1
- ads/aqua/extension/ui_handler.py +1 -12
- ads/aqua/extension/utils.py +4 -4
- ads/aqua/finetune.py +24 -11
- ads/aqua/model.py +2 -4
- ads/aqua/utils.py +39 -23
- ads/catalog/model.py +3 -3
- ads/catalog/notebook.py +3 -3
- ads/catalog/project.py +2 -2
- ads/catalog/summary.py +2 -4
- ads/cli.py +21 -2
- ads/common/serializer.py +5 -4
- ads/common/utils.py +6 -2
- ads/config.py +1 -0
- ads/data_labeling/metadata.py +2 -2
- ads/dataset/dataset.py +3 -5
- ads/dataset/factory.py +2 -3
- ads/dataset/label_encoder.py +1 -1
- ads/dataset/sampled_dataset.py +3 -5
- ads/jobs/ads_job.py +26 -2
- ads/jobs/builders/infrastructure/dsc_job.py +20 -7
- ads/llm/serializers/runnable_parallel.py +7 -1
- ads/model/model_artifact_boilerplate/artifact_introspection_test/model_artifact_validate.py +1 -1
- ads/opctl/operator/lowcode/anomaly/README.md +1 -1
- ads/opctl/operator/lowcode/anomaly/environment.yaml +1 -1
- ads/opctl/operator/lowcode/anomaly/model/anomaly_dataset.py +8 -15
- ads/opctl/operator/lowcode/anomaly/model/automlx.py +16 -10
- ads/opctl/operator/lowcode/anomaly/model/autots.py +9 -10
- ads/opctl/operator/lowcode/anomaly/model/base_model.py +36 -39
- ads/opctl/operator/lowcode/anomaly/model/tods.py +4 -4
- ads/opctl/operator/lowcode/anomaly/operator_config.py +18 -1
- ads/opctl/operator/lowcode/anomaly/schema.yaml +16 -4
- ads/opctl/operator/lowcode/common/data.py +16 -2
- ads/opctl/operator/lowcode/common/transformations.py +48 -14
- ads/opctl/operator/lowcode/forecast/README.md +1 -1
- ads/opctl/operator/lowcode/forecast/environment.yaml +5 -4
- ads/opctl/operator/lowcode/forecast/model/arima.py +36 -29
- ads/opctl/operator/lowcode/forecast/model/automlx.py +91 -90
- ads/opctl/operator/lowcode/forecast/model/autots.py +200 -166
- ads/opctl/operator/lowcode/forecast/model/base_model.py +144 -140
- ads/opctl/operator/lowcode/forecast/model/neuralprophet.py +86 -80
- ads/opctl/operator/lowcode/forecast/model/prophet.py +68 -63
- ads/opctl/operator/lowcode/forecast/operator_config.py +18 -2
- ads/opctl/operator/lowcode/forecast/schema.yaml +20 -4
- ads/opctl/operator/lowcode/forecast/utils.py +8 -4
- ads/opctl/operator/lowcode/pii/README.md +1 -1
- ads/opctl/operator/lowcode/pii/environment.yaml +1 -1
- ads/opctl/operator/lowcode/pii/model/report.py +71 -70
- ads/pipeline/ads_pipeline_step.py +11 -12
- {oracle_ads-2.11.6.dist-info → oracle_ads-2.11.8.dist-info}/METADATA +8 -7
- {oracle_ads-2.11.6.dist-info → oracle_ads-2.11.8.dist-info}/RECORD +64 -64
- {oracle_ads-2.11.6.dist-info → oracle_ads-2.11.8.dist-info}/LICENSE.txt +0 -0
- {oracle_ads-2.11.6.dist-info → oracle_ads-2.11.8.dist-info}/WHEEL +0 -0
- {oracle_ads-2.11.6.dist-info → oracle_ads-2.11.8.dist-info}/entry_points.txt +0 -0
ads/opctl/operator/lowcode/forecast/model/automlx.py
@@ -2,7 +2,7 @@
 # -*- coding: utf-8 -*--
 import traceback
 
-# Copyright (c) 2023 Oracle and/or its affiliates.
+# Copyright (c) 2023, 2024 Oracle and/or its affiliates.
 # Licensed under the Universal Permissive License v 1.0 as shown at https://oss.oracle.com/licenses/upl/
 
 import pandas as pd
@@ -22,6 +22,7 @@ from ads.opctl.operator.lowcode.common.utils import (
     seconds_to_datetime,
     datetime_to_seconds,
 )
+from ads.opctl.operator.lowcode.forecast.utils import _label_encode_dataframe
 
 AUTOMLX_N_ALGOS_TUNED = 4
 AUTOMLX_DEFAULT_SCORE_METRIC = "neg_sym_mean_abs_percent_error"
@@ -51,8 +52,12 @@ class AutoMLXOperatorModel(ForecastOperatorBaseModel):
         ] = self.spec.preprocessing or model_kwargs_cleaned.get("preprocessing", True)
         return model_kwargs_cleaned, time_budget
 
-    def preprocess(self, data, series_id=None):
-
+    def preprocess(self, data, series_id=None):  # TODO: re-use self.le for explanations
+        _, df_encoded = _label_encode_dataframe(
+            data,
+            no_encode={self.spec.datetime_column.name, self.original_target_column},
+        )
+        return df_encoded.set_index(self.spec.datetime_column.name)
 
     @runtime_dependency(
         module="automlx",
@@ -70,17 +75,20 @@ class AutoMLXOperatorModel(ForecastOperatorBaseModel):
     )
     def _build_model(self) -> pd.DataFrame:
         from automlx import init
-
+        import logging
+
         try:
-            init(
+            init(
+                engine="ray",
+                engine_opts={"ray_setup": {"_temp_dir": "/tmp/ray-temp"}},
+                loglevel=logging.CRITICAL,
+            )
         except Exception as e:
             logger.info("Ray already initialized")
 
-
         full_data_dict = self.datasets.get_data_by_series()
 
         self.models = dict()
-        date_column = self.spec.datetime_column.name
         horizon = self.spec.horizon
         self.spec.confidence_interval_width = self.spec.confidence_interval_width or 0.8
         self.forecast_output = ForecastOutput(
@@ -107,7 +115,7 @@ class AutoMLXOperatorModel(ForecastOperatorBaseModel):
 
             logger.debug(f"Time Index Monotonic: {data_i.index.is_monotonic}")
 
-            if self.loaded_models is not None:
+            if self.loaded_models is not None and s_id in self.loaded_models:
                 model = self.loaded_models[s_id]
             else:
                 model = automlx.Pipeline(
@@ -163,12 +171,6 @@ class AutoMLXOperatorModel(ForecastOperatorBaseModel):
 
         return self.forecast_output.get_forecast_long()
 
-    @runtime_dependency(
-        module="datapane",
-        err_msg=(
-            "Please run `pip3 install datapane` to install the required dependencies for report generation."
-        ),
-    )
     def _generate_report(self):
         """
         Generate the report for the automlx model.
@@ -179,106 +181,105 @@ class AutoMLXOperatorModel(ForecastOperatorBaseModel):
 
         Returns
         -------
-        - model_description (
-        - other_sections (List[Union[
+        - model_description (report-creator.Text): A Text component containing the description of the automlx model.
+        - other_sections (List[Union[report-creator.Text, report-creator.Block]]): A list of Text and Blocks components representing various sections of the report.
         - forecast_col_name (str): The name of the forecasted column.
         - train_metrics (bool): A boolean value indicating whether to include train metrics in the report.
         - ds_column_series (pd.Series): The pd.Series object representing the datetime column of the dataset.
         - ds_forecast_col (pd.Series): The pd.Series object representing the forecasted column.
         - ci_col_names (List[str]): A list of column names for the confidence interval in the report.
         """
-        import
+        import report_creator as rc
 
         """The method that needs to be implemented on the particular model level."""
-        selected_models_text = dp.Text(
-            f"## Selected Models Overview \n "
-            "The following tables provide information regarding the "
-            "chosen model for each series and the corresponding parameters of the models."
-        )
         selected_models = dict()
         models = self.models
-
-
-
-
-
-
-
-
-
-
-
-
-
+        other_sections = []
+
+        if len(self.models) > 0:
+            for i, (s_id, m) in enumerate(models.items()):
+                selected_models[s_id] = {
+                    "series_id": s_id,
+                    "selected_model": m.selected_model_,
+                    "model_params": m.selected_model_params_,
+                }
+            selected_models_df = pd.DataFrame(
+                selected_models.items(), columns=["series_id", "best_selected_model"]
+            )
+            selected_df = selected_models_df["best_selected_model"].apply(pd.Series)
+            selected_models_section = rc.Block(
+                rc.Heading("Selected Models Overview", level=2),
+                rc.Text(
+                    "The following tables provide information regarding the "
+                    "chosen model for each series and the corresponding parameters of the models."
+                ),
+                rc.DataTable(selected_df, index=True),
+            )
 
-
+            other_sections = [selected_models_section]
 
         if self.spec.generate_explanations:
-
-
-
-
-            # Create a markdown text block for the global explanation section
-            global_explanation_text = dp.Text(
-                f"## Global Explanation of Models \n "
-                "The following tables provide the feature attribution for the global explainability."
-            )
+            try:
+                # If the key is present, call the "explain_model" method
+                self.explain_model()
 
-
-
+                # Convert the global explanation data to a DataFrame
+                global_explanation_df = pd.DataFrame(self.global_explanation)
 
-
-
-
-
-
-
+                self.formatted_global_explanation = (
+                    global_explanation_df / global_explanation_df.sum(axis=0) * 100
+                )
+                self.formatted_global_explanation = (
+                    self.formatted_global_explanation.rename(
+                        {self.spec.datetime_column.name: ForecastOutputColumns.DATE},
+                        axis=1,
+                    )
                 )
-            )
-
-            # Create a markdown section for the global explainability
-            global_explanation_section = dp.Blocks(
-                "### Global Explainability ",
-                dp.DataTable(self.formatted_global_explanation),
-            )
 
-
-
-
-
-
-
+                # Create a markdown section for the global explainability
+                global_explanation_section = rc.Block(
+                    rc.Heading("Global Explanation of Models", level=2),
+                    rc.Text(
+                        "The following tables provide the feature attribution for the global explainability."
+                    ),
+                    rc.DataTable(self.formatted_global_explanation, index=True),
                )
-            self.formatted_local_explanation = aggregate_local_explanations
 
-
-
-
-
-
+                aggregate_local_explanations = pd.DataFrame()
+                for s_id, local_ex_df in self.local_explanation.items():
+                    local_ex_df_copy = local_ex_df.copy()
+                    local_ex_df_copy["Series"] = s_id
+                    aggregate_local_explanations = pd.concat(
+                        [aggregate_local_explanations, local_ex_df_copy], axis=0
+                    )
+                self.formatted_local_explanation = aggregate_local_explanations
+
+                blocks = [
+                    rc.DataTable(
+                        local_ex_df.div(local_ex_df.abs().sum(axis=1), axis=0) * 100,
+                        label=s_id,
+                        index=True,
+                    )
+                    for s_id, local_ex_df in self.local_explanation.items()
+                ]
+                local_explanation_section = rc.Block(
+                    rc.Heading("Local Explanation of Models", level=2),
+                    rc.Select(blocks=blocks),
                )
-                for s_id, local_ex_df in self.local_explanation.items()
-            ]
-            local_explanation_section = (
-                dp.Select(blocks=blocks) if len(blocks) > 1 else blocks[0]
-            )
 
-
-
-
-
-
-
-
-
-
-
-
-        model_description = dp.Text(
+                # Append the global explanation text and section to the "other_sections" list
+                other_sections = other_sections + [
+                    global_explanation_section,
+                    local_explanation_section,
+                ]
+            except Exception as e:
+                logger.warn(f"Failed to generate Explanations with error: {e}.")
+                logger.debug(f"Full Traceback: {traceback.format_exc()}")
+
+        model_description = rc.Text(
             "The AutoMLx model automatically preprocesses, selects and engineers "
             "high-quality features in your dataset, which are then provided for further processing."
         )
-        other_sections = all_sections
 
         return (
            model_description,