oracle-ads 2.11.6__py3-none-any.whl → 2.11.8__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- ads/aqua/__init__.py +24 -14
- ads/aqua/base.py +0 -2
- ads/aqua/cli.py +50 -2
- ads/aqua/decorator.py +8 -0
- ads/aqua/deployment.py +37 -34
- ads/aqua/evaluation.py +106 -49
- ads/aqua/extension/base_handler.py +18 -10
- ads/aqua/extension/common_handler.py +21 -2
- ads/aqua/extension/deployment_handler.py +1 -4
- ads/aqua/extension/evaluation_handler.py +1 -2
- ads/aqua/extension/finetune_handler.py +0 -1
- ads/aqua/extension/ui_handler.py +1 -12
- ads/aqua/extension/utils.py +4 -4
- ads/aqua/finetune.py +24 -11
- ads/aqua/model.py +2 -4
- ads/aqua/utils.py +39 -23
- ads/catalog/model.py +3 -3
- ads/catalog/notebook.py +3 -3
- ads/catalog/project.py +2 -2
- ads/catalog/summary.py +2 -4
- ads/cli.py +21 -2
- ads/common/serializer.py +5 -4
- ads/common/utils.py +6 -2
- ads/config.py +1 -0
- ads/data_labeling/metadata.py +2 -2
- ads/dataset/dataset.py +3 -5
- ads/dataset/factory.py +2 -3
- ads/dataset/label_encoder.py +1 -1
- ads/dataset/sampled_dataset.py +3 -5
- ads/jobs/ads_job.py +26 -2
- ads/jobs/builders/infrastructure/dsc_job.py +20 -7
- ads/llm/serializers/runnable_parallel.py +7 -1
- ads/model/model_artifact_boilerplate/artifact_introspection_test/model_artifact_validate.py +1 -1
- ads/opctl/operator/lowcode/anomaly/README.md +1 -1
- ads/opctl/operator/lowcode/anomaly/environment.yaml +1 -1
- ads/opctl/operator/lowcode/anomaly/model/anomaly_dataset.py +8 -15
- ads/opctl/operator/lowcode/anomaly/model/automlx.py +16 -10
- ads/opctl/operator/lowcode/anomaly/model/autots.py +9 -10
- ads/opctl/operator/lowcode/anomaly/model/base_model.py +36 -39
- ads/opctl/operator/lowcode/anomaly/model/tods.py +4 -4
- ads/opctl/operator/lowcode/anomaly/operator_config.py +18 -1
- ads/opctl/operator/lowcode/anomaly/schema.yaml +16 -4
- ads/opctl/operator/lowcode/common/data.py +16 -2
- ads/opctl/operator/lowcode/common/transformations.py +48 -14
- ads/opctl/operator/lowcode/forecast/README.md +1 -1
- ads/opctl/operator/lowcode/forecast/environment.yaml +5 -4
- ads/opctl/operator/lowcode/forecast/model/arima.py +36 -29
- ads/opctl/operator/lowcode/forecast/model/automlx.py +91 -90
- ads/opctl/operator/lowcode/forecast/model/autots.py +200 -166
- ads/opctl/operator/lowcode/forecast/model/base_model.py +144 -140
- ads/opctl/operator/lowcode/forecast/model/neuralprophet.py +86 -80
- ads/opctl/operator/lowcode/forecast/model/prophet.py +68 -63
- ads/opctl/operator/lowcode/forecast/operator_config.py +18 -2
- ads/opctl/operator/lowcode/forecast/schema.yaml +20 -4
- ads/opctl/operator/lowcode/forecast/utils.py +8 -4
- ads/opctl/operator/lowcode/pii/README.md +1 -1
- ads/opctl/operator/lowcode/pii/environment.yaml +1 -1
- ads/opctl/operator/lowcode/pii/model/report.py +71 -70
- ads/pipeline/ads_pipeline_step.py +11 -12
- {oracle_ads-2.11.6.dist-info → oracle_ads-2.11.8.dist-info}/METADATA +8 -7
- {oracle_ads-2.11.6.dist-info → oracle_ads-2.11.8.dist-info}/RECORD +64 -64
- {oracle_ads-2.11.6.dist-info → oracle_ads-2.11.8.dist-info}/LICENSE.txt +0 -0
- {oracle_ads-2.11.6.dist-info → oracle_ads-2.11.8.dist-info}/WHEEL +0 -0
- {oracle_ads-2.11.6.dist-info → oracle_ads-2.11.8.dist-info}/entry_points.txt +0 -0
ads/opctl/operator/lowcode/forecast/model/autots.py

@@ -1,7 +1,7 @@
 #!/usr/bin/env python
 # -*- coding: utf-8 -*--
 
-# Copyright (c) 2023 Oracle and/or its affiliates.
+# Copyright (c) 2023, 2024 Oracle and/or its affiliates.
 # Licensed under the Universal Permissive License v 1.0 as shown at https://oss.oracle.com/licenses/upl/
 
 import copy
@@ -54,145 +54,161 @@ class AutoTSOperatorModel(ForecastOperatorBaseModel):
             target_column=self.original_target_column,
             dt_column=self.spec.datetime_column.name,
         )
[… 82 removed lines (old 57-138) not captured in the source view …]
-            future_reg = future_regressor[: -self.spec.horizon]
-            regr_fcst = future_regressor[-self.spec.horizon :]
-        else:
-            future_reg = None
-            regr_fcst = None
-
-        if self.loaded_models is None:
-            model = model.fit(
-                df_train,
-                future_regressor=future_reg,
-                date_col=self.spec.datetime_column.name,
-                value_col=self.original_target_column,
-                id_col=ForecastOutputColumns.SERIES,
-            )
-            # Store the trained model and generate forecasts
-            self.models = copy.deepcopy(model)
-        else:
-            self.models = self.loaded_models
-
-        self.outputs = model.predict(future_regressor=regr_fcst)
-        logger.debug("===========Forecast Generated===========")
-
-        hist_df = model.back_forecast().forecast
-
-        params = vars(model).copy()
-        for param in [
-            "ens_copy",
-            "df_wide_numeric",
-            "future_regressor_train",
-            "initial_results",
-            "score_per_series",
-            "validation_results",
-            "validation_train_indexes",
-            "validation_test_indexes",
-            "validation_indexes",
-            "best_model",
-        ]:
-            if param in params:
-                params.pop(param)
-
-        for s_id in self.datasets.list_series_ids():
-            self.forecast_output.init_series_output(
-                series_id=s_id, data_at_series=self.datasets.get_data_at_series(s_id)
-            )
-
-            self.forecast_output.populate_series_output(
-                series_id=s_id,
-                fit_val=hist_df[s_id].values,
-                forecast_val=self.outputs.forecast[s_id].values,
-                upper_bound=self.outputs.upper_forecast[s_id].values,
-                lower_bound=self.outputs.lower_forecast[s_id].values,
+        try:
+            model = self.loaded_models if self.loaded_models is not None else None
+            if model is None:
+                # Initialize the AutoTS model with specified parameters
+                model = AutoTS(
+                    forecast_length=self.spec.horizon,
+                    frequency=self.spec.model_kwargs.get(
+                        "frequency", "infer"
+                    ),  # TODO: Use datasets.get_datetime_frequency ?
+                    prediction_interval=self.spec.confidence_interval_width,
+                    max_generations=self.spec.model_kwargs.get(
+                        "max_generations", AUTOTS_MAX_GENERATION
+                    ),
+                    no_negatives=self.spec.model_kwargs.get("no_negatives", False),
+                    constraint=self.spec.model_kwargs.get("constraint", None),
+                    ensemble=self.spec.model_kwargs.get("ensemble", "auto"),
+                    initial_template=self.spec.model_kwargs.get(
+                        "initial_template", "General+Random"
+                    ),
+                    random_seed=self.spec.model_kwargs.get("random_seed", 2022),
+                    holiday_country=self.spec.model_kwargs.get("holiday_country", "US"),
+                    subset=self.spec.model_kwargs.get("subset", None),
+                    aggfunc=self.spec.model_kwargs.get("aggfunc", "first"),
+                    na_tolerance=self.spec.model_kwargs.get("na_tolerance", 1),
+                    drop_most_recent=self.spec.model_kwargs.get("drop_most_recent", 0),
+                    drop_data_older_than_periods=self.spec.model_kwargs.get(
+                        "drop_data_older_than_periods", None
+                    ),
+                    model_list=self.spec.model_kwargs.get(
+                        "model_list", "fast_parallel"
+                    ),
+                    transformer_list=self.spec.model_kwargs.get(
+                        "transformer_list", "auto"
+                    ),
+                    transformer_max_depth=self.spec.model_kwargs.get(
+                        "transformer_max_depth", 6
+                    ),
+                    models_mode=self.spec.model_kwargs.get("models_mode", "random"),
+                    num_validations=self.spec.model_kwargs.get(
+                        "num_validations", "auto"
+                    ),
+                    models_to_validate=self.spec.model_kwargs.get(
+                        "models_to_validate", AUTOTS_MODELS_TO_VALIDATE
+                    ),
+                    max_per_model_class=self.spec.model_kwargs.get(
+                        "max_per_model_class", None
+                    ),
+                    validation_method=self.spec.model_kwargs.get(
+                        "validation_method", "backwards"
+                    ),
+                    min_allowed_train_percent=self.spec.model_kwargs.get(
+                        "min_allowed_train_percent", 0.5
+                    ),
+                    remove_leading_zeroes=self.spec.model_kwargs.get(
+                        "remove_leading_zeroes", False
+                    ),
+                    prefill_na=self.spec.model_kwargs.get("prefill_na", None),
+                    introduce_na=self.spec.model_kwargs.get("introduce_na", None),
+                    preclean=self.spec.model_kwargs.get("preclean", None),
+                    model_interrupt=self.spec.model_kwargs.get("model_interrupt", True),
+                    generation_timeout=self.spec.model_kwargs.get(
+                        "generation_timeout", None
+                    ),
+                    current_model_file=self.spec.model_kwargs.get(
+                        "current_model_file", None
+                    ),
+                    verbose=-1 if logger.level > 40 else 1,
+                    n_jobs=self.spec.model_kwargs.get("n_jobs", -1),
+                )
+
+            full_data_indexed = self.datasets.get_data_multi_indexed()
+
+            dates = full_data_indexed.index.get_level_values(0).unique().tolist()
+            train_idx = dates[: -self.spec.horizon]
+
+            df_train = full_data_indexed[
+                full_data_indexed.index.get_level_values(0).isin(train_idx)
+            ][[self.original_target_column]].reset_index()
+
+            # Future regressors need to be in wide format - (num_unique_dates x (num_unique_series x num_unique_cols))
+            additional_regressors = list(
+                set(full_data_indexed.columns) - {self.original_target_column}
             )
[… 5 removed lines (old 191-195) not captured in the source view …]
+            if len(additional_regressors) > 1:
+                future_regressor = full_data_indexed.reset_index().pivot(
+                    index=self.spec.datetime_column.name,
+                    columns=ForecastOutputColumns.SERIES,
+                    values=additional_regressors,
+                )
+                future_reg = future_regressor[: -self.spec.horizon]
+                regr_fcst = future_regressor[-self.spec.horizon :]
+            else:
+                future_reg = None
+                regr_fcst = None
+
+            for s_id in self.datasets.list_series_ids():
+                self.forecast_output.init_series_output(
+                    series_id=s_id,
+                    data_at_series=self.datasets.get_data_at_series(s_id),
+                )
+
+            if self.loaded_models is None:
+                model = model.fit(
+                    df_train,
+                    future_regressor=future_reg,
+                    date_col=self.spec.datetime_column.name,
+                    value_col=self.original_target_column,
+                    id_col=ForecastOutputColumns.SERIES,
+                )
+                # Store the trained model and generate forecasts
+                self.models = copy.deepcopy(model)
+            else:
+                self.models = self.loaded_models
+
+            self.outputs = model.predict(future_regressor=regr_fcst)
+            logger.debug("===========Forecast Generated===========")
+
+            hist_df = model.back_forecast().forecast
+
+            params = vars(model).copy()
+            for param in [
+                "ens_copy",
+                "df_wide_numeric",
+                "future_regressor_train",
+                "initial_results",
+                "score_per_series",
+                "validation_results",
+                "validation_train_indexes",
+                "validation_test_indexes",
+                "validation_indexes",
+                "best_model",
+            ]:
+                if param in params:
+                    params.pop(param)
+
+            for s_id in self.datasets.list_series_ids():
+                self.forecast_output.populate_series_output(
+                    series_id=s_id,
+                    fit_val=hist_df[s_id].values,
+                    forecast_val=self.outputs.forecast[s_id].values,
+                    upper_bound=self.outputs.upper_forecast[s_id].values,
+                    lower_bound=self.outputs.lower_forecast[s_id].values,
+                )
+
+                self.model_parameters[s_id] = {
+                    "framework": SupportedModels.AutoTS,
+                    **params,
+                }
+
+        except Exception as e:
+            for s_id in self.datasets.list_series_ids():
+                self.errors_dict[s_id] = {
+                    "model_name": self.spec.model,
+                    "error": str(e),
+                }
 
         logger.debug("===========Done===========")
 
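The substantive change in the hunk above is control flow: the whole AutoTS build/fit/predict sequence now runs inside a single try/except, and any failure is recorded per series in `self.errors_dict` instead of aborting the operator run. A minimal, self-contained sketch of that error-capture pattern follows; the helper name `build_forecasts`, the `fit_and_predict` callable, and the series ids are illustrative stand-ins, not part of oracle-ads.

import logging

logger = logging.getLogger(__name__)


def build_forecasts(series_ids, fit_and_predict, model_name="autots"):
    """Hypothetical helper mirroring the hunk's error-capture pattern."""
    outputs = {}
    errors_dict = {}
    try:
        for s_id in series_ids:
            outputs[s_id] = fit_and_predict(s_id)
    except Exception as e:
        # One failure marks every series, matching the behavior in the hunk above.
        for s_id in series_ids:
            errors_dict[s_id] = {"model_name": model_name, "error": str(e)}
    logger.debug("===========Done===========")
    return outputs, errors_dict


def fake_fit_and_predict(s_id):
    # Stand-in for the real fit/predict call; fails on one series.
    if s_id == "B":
        raise ValueError("bad data")
    return [1.0, 2.0, 3.0]


# Both series end up flagged after the single failure on "B".
outputs, errors = build_forecasts(["A", "B"], fake_fit_and_predict)
print(errors)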
@@ -204,7 +220,7 @@ class AutoTSOperatorModel(ForecastOperatorBaseModel):
 
         Returns:
             tuple: A tuple containing the following elements:
-            - model_description (
+            - model_description (rc.Text): A text object containing the description of the AutoTS model.
             - other_sections (list): A list of sections to be included in the report.
             - forecast_col_name (str): The name of the forecast column.
             - train_metrics (bool): A boolean indicating whether to include train metrics.
@@ -212,36 +228,48 @@ class AutoTSOperatorModel(ForecastOperatorBaseModel):
             - ds_forecast_col (pd.Index): A pandas Index containing the forecast column values.
             - ci_col_names (list): A list of column names for confidence intervals.
         """
-        import
+        import report_creator as rc
 
[… 3 removed lines (old 217-219) not captured in the source view …]
-            "These plots show your forecast in the context of historical data."
-        )
-        sec_1 = _select_plot_list(
-            lambda s_id: self.outputs.plot(self.models.df_wide_numeric, series=s_id),
-            self.datasets.list_series_ids(),
-        )
+        all_sections = []
+        if self.models:
+            # Section 1: Forecast Overview
 
[… 6 removed lines (old 227-232) not captured in the source view …]
+            sec_1_plots = _select_plot_list(
+                lambda s_id: self.outputs.plot(
+                    self.models.df_wide_numeric, series=s_id
+                ),
+                self.datasets.list_series_ids(),
+            )
+            section_1 = rc.Block(
+                rc.Heading("Forecast Overview", level=2),
+                rc.Text(
+                    "These plots show your forecast in the context of historical data."
+                ),
+                sec_1_plots,
             )
 
[… 4 removed lines (old 235-238) not captured in the source view …]
+            # Section 2: AutoTS Model Parameters
+            sec2_text = rc.Heading("AutoTS Model Parameters", level=2)
+            try:
+                sec2 = rc.Yaml(
+                    yaml.dump(list(self.models.best_model.T.to_dict().values())[0]),
+                )
+
+            except KeyError as ke:
+                logger.warn(
+                    f"Issue generating Model Parameters Table Section. Skipping"
+                )
+                sec2 = rc.Text("Error generating model parameters.")
+
+            section_2 = rc.Block(sec2_text, sec2)
+
+            all_sections = [sec_1_plots, section_2]
 
         if self.spec.generate_explanations:
             logger.warn(f"Explanations not yet supported for the AutoTS Module")
 
         # Model Description
-        model_description =
+        model_description = rc.Text(
             "AutoTS is a time series package for Python designed for rapidly deploying high-accuracy forecasts at scale. "
             "In 2023, AutoTS has won in the M6 forecasting competition, "
             "delivering the highest performance investment decisions across 12 months of stock market forecasting."
@@ -266,9 +294,15 @@ class AutoTSOperatorModel(ForecastOperatorBaseModel):
         r2 -4.60E-06
         Explained Variance 0.002177087
         """
[… 5 removed lines (old 269-273) not captured in the source view …]
+        df = pd.DataFrame()
+        try:
+            mapes = pd.DataFrame(self.models.best_model_per_series_mape()).T
+            scores = pd.DataFrame(
+                self.models.best_model_per_series_score(), columns=["AutoTS Score"]
+            ).T
+            df = pd.concat([mapes, scores])
+        except Exception as e:
+            logger.debug(f"Failed to generate training metrics")
+            logger.debug(f"Received Error Statement: {e}")
+
         return df
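The new `_generate_train_metrics` body in the final hunk is deliberately defensive: it starts from an empty DataFrame, tries to assemble per-series MAPE and AutoTS score rows, and logs rather than raises on failure so report generation still completes. Below is a standalone sketch of the same idea, with plain dicts and made-up series names standing in for the package's `best_model_per_series_mape()` / `best_model_per_series_score()` calls.

import logging

import pandas as pd

logger = logging.getLogger(__name__)


def build_train_metrics(mape_by_series, score_by_series):
    """Illustrative only: one column per series, one row per metric."""
    df = pd.DataFrame()
    try:
        mapes = pd.DataFrame(mape_by_series, index=["MAPE"])
        scores = pd.DataFrame(score_by_series, index=["AutoTS Score"])
        df = pd.concat([mapes, scores])
    except Exception as e:
        # Mirror the hunk: swallow the error, log it, and return the empty frame.
        logger.debug("Failed to generate training metrics")
        logger.debug(f"Received Error Statement: {e}")
    return df


print(
    build_train_metrics(
        {"Sales_A": 26.19, "Sales_B": 14.02},
        {"Sales_A": 0.002, "Sales_B": 0.004},
    )
)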