oracle-ads 2.13.9rc0__py3-none-any.whl → 2.13.10__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- ads/aqua/__init__.py +40 -0
- ads/aqua/app.py +507 -0
- ads/aqua/cli.py +96 -0
- ads/aqua/client/__init__.py +3 -0
- ads/aqua/client/client.py +836 -0
- ads/aqua/client/openai_client.py +305 -0
- ads/aqua/common/__init__.py +5 -0
- ads/aqua/common/decorator.py +125 -0
- ads/aqua/common/entities.py +274 -0
- ads/aqua/common/enums.py +134 -0
- ads/aqua/common/errors.py +109 -0
- ads/aqua/common/utils.py +1295 -0
- ads/aqua/config/__init__.py +4 -0
- ads/aqua/config/container_config.py +246 -0
- ads/aqua/config/evaluation/__init__.py +4 -0
- ads/aqua/config/evaluation/evaluation_service_config.py +147 -0
- ads/aqua/config/utils/__init__.py +4 -0
- ads/aqua/config/utils/serializer.py +339 -0
- ads/aqua/constants.py +116 -0
- ads/aqua/data.py +14 -0
- ads/aqua/dummy_data/icon.txt +1 -0
- ads/aqua/dummy_data/oci_model_deployments.json +56 -0
- ads/aqua/dummy_data/oci_models.json +1 -0
- ads/aqua/dummy_data/readme.md +26 -0
- ads/aqua/evaluation/__init__.py +8 -0
- ads/aqua/evaluation/constants.py +53 -0
- ads/aqua/evaluation/entities.py +186 -0
- ads/aqua/evaluation/errors.py +70 -0
- ads/aqua/evaluation/evaluation.py +1814 -0
- ads/aqua/extension/__init__.py +42 -0
- ads/aqua/extension/aqua_ws_msg_handler.py +76 -0
- ads/aqua/extension/base_handler.py +90 -0
- ads/aqua/extension/common_handler.py +121 -0
- ads/aqua/extension/common_ws_msg_handler.py +36 -0
- ads/aqua/extension/deployment_handler.py +381 -0
- ads/aqua/extension/deployment_ws_msg_handler.py +54 -0
- ads/aqua/extension/errors.py +30 -0
- ads/aqua/extension/evaluation_handler.py +129 -0
- ads/aqua/extension/evaluation_ws_msg_handler.py +61 -0
- ads/aqua/extension/finetune_handler.py +96 -0
- ads/aqua/extension/model_handler.py +390 -0
- ads/aqua/extension/models/__init__.py +0 -0
- ads/aqua/extension/models/ws_models.py +145 -0
- ads/aqua/extension/models_ws_msg_handler.py +50 -0
- ads/aqua/extension/ui_handler.py +300 -0
- ads/aqua/extension/ui_websocket_handler.py +130 -0
- ads/aqua/extension/utils.py +133 -0
- ads/aqua/finetuning/__init__.py +7 -0
- ads/aqua/finetuning/constants.py +23 -0
- ads/aqua/finetuning/entities.py +181 -0
- ads/aqua/finetuning/finetuning.py +749 -0
- ads/aqua/model/__init__.py +8 -0
- ads/aqua/model/constants.py +60 -0
- ads/aqua/model/entities.py +385 -0
- ads/aqua/model/enums.py +32 -0
- ads/aqua/model/model.py +2134 -0
- ads/aqua/model/utils.py +52 -0
- ads/aqua/modeldeployment/__init__.py +6 -0
- ads/aqua/modeldeployment/constants.py +10 -0
- ads/aqua/modeldeployment/deployment.py +1315 -0
- ads/aqua/modeldeployment/entities.py +653 -0
- ads/aqua/modeldeployment/utils.py +543 -0
- ads/aqua/resources/gpu_shapes_index.json +94 -0
- ads/aqua/server/__init__.py +4 -0
- ads/aqua/server/__main__.py +24 -0
- ads/aqua/server/app.py +47 -0
- ads/aqua/server/aqua_spec.yml +1291 -0
- ads/aqua/training/__init__.py +4 -0
- ads/aqua/training/exceptions.py +476 -0
- ads/aqua/ui.py +519 -0
- ads/automl/__init__.py +9 -0
- ads/automl/driver.py +330 -0
- ads/automl/provider.py +975 -0
- ads/bds/__init__.py +5 -0
- ads/bds/auth.py +127 -0
- ads/bds/big_data_service.py +255 -0
- ads/catalog/__init__.py +19 -0
- ads/catalog/model.py +1576 -0
- ads/catalog/notebook.py +461 -0
- ads/catalog/project.py +468 -0
- ads/catalog/summary.py +178 -0
- ads/common/__init__.py +11 -0
- ads/common/analyzer.py +65 -0
- ads/common/artifact/.model-ignore +63 -0
- ads/common/artifact/__init__.py +10 -0
- ads/common/auth.py +1122 -0
- ads/common/card_identifier.py +83 -0
- ads/common/config.py +647 -0
- ads/common/data.py +165 -0
- ads/common/decorator/__init__.py +9 -0
- ads/common/decorator/argument_to_case.py +88 -0
- ads/common/decorator/deprecate.py +69 -0
- ads/common/decorator/require_nonempty_arg.py +65 -0
- ads/common/decorator/runtime_dependency.py +178 -0
- ads/common/decorator/threaded.py +97 -0
- ads/common/decorator/utils.py +35 -0
- ads/common/dsc_file_system.py +303 -0
- ads/common/error.py +14 -0
- ads/common/extended_enum.py +81 -0
- ads/common/function/__init__.py +5 -0
- ads/common/function/fn_util.py +142 -0
- ads/common/function/func_conf.yaml +25 -0
- ads/common/ipython.py +76 -0
- ads/common/model.py +679 -0
- ads/common/model_artifact.py +1759 -0
- ads/common/model_artifact_schema.json +107 -0
- ads/common/model_export_util.py +664 -0
- ads/common/model_metadata.py +24 -0
- ads/common/object_storage_details.py +296 -0
- ads/common/oci_client.py +179 -0
- ads/common/oci_datascience.py +46 -0
- ads/common/oci_logging.py +1144 -0
- ads/common/oci_mixin.py +957 -0
- ads/common/oci_resource.py +136 -0
- ads/common/serializer.py +559 -0
- ads/common/utils.py +1852 -0
- ads/common/word_lists.py +1491 -0
- ads/common/work_request.py +189 -0
- ads/config.py +1 -0
- ads/data_labeling/__init__.py +13 -0
- ads/data_labeling/boundingbox.py +253 -0
- ads/data_labeling/constants.py +47 -0
- ads/data_labeling/data_labeling_service.py +244 -0
- ads/data_labeling/interface/__init__.py +5 -0
- ads/data_labeling/interface/loader.py +16 -0
- ads/data_labeling/interface/parser.py +16 -0
- ads/data_labeling/interface/reader.py +23 -0
- ads/data_labeling/loader/__init__.py +5 -0
- ads/data_labeling/loader/file_loader.py +241 -0
- ads/data_labeling/metadata.py +110 -0
- ads/data_labeling/mixin/__init__.py +5 -0
- ads/data_labeling/mixin/data_labeling.py +232 -0
- ads/data_labeling/ner.py +129 -0
- ads/data_labeling/parser/__init__.py +5 -0
- ads/data_labeling/parser/dls_record_parser.py +388 -0
- ads/data_labeling/parser/export_metadata_parser.py +94 -0
- ads/data_labeling/parser/export_record_parser.py +473 -0
- ads/data_labeling/reader/__init__.py +5 -0
- ads/data_labeling/reader/dataset_reader.py +574 -0
- ads/data_labeling/reader/dls_record_reader.py +121 -0
- ads/data_labeling/reader/export_record_reader.py +62 -0
- ads/data_labeling/reader/jsonl_reader.py +75 -0
- ads/data_labeling/reader/metadata_reader.py +203 -0
- ads/data_labeling/reader/record_reader.py +263 -0
- ads/data_labeling/record.py +52 -0
- ads/data_labeling/visualizer/__init__.py +5 -0
- ads/data_labeling/visualizer/image_visualizer.py +525 -0
- ads/data_labeling/visualizer/text_visualizer.py +357 -0
- ads/database/__init__.py +5 -0
- ads/database/connection.py +338 -0
- ads/dataset/__init__.py +10 -0
- ads/dataset/capabilities.md +51 -0
- ads/dataset/classification_dataset.py +339 -0
- ads/dataset/correlation.py +226 -0
- ads/dataset/correlation_plot.py +563 -0
- ads/dataset/dask_series.py +173 -0
- ads/dataset/dataframe_transformer.py +110 -0
- ads/dataset/dataset.py +1979 -0
- ads/dataset/dataset_browser.py +360 -0
- ads/dataset/dataset_with_target.py +995 -0
- ads/dataset/exception.py +25 -0
- ads/dataset/factory.py +987 -0
- ads/dataset/feature_engineering_transformer.py +35 -0
- ads/dataset/feature_selection.py +107 -0
- ads/dataset/forecasting_dataset.py +26 -0
- ads/dataset/helper.py +1450 -0
- ads/dataset/label_encoder.py +99 -0
- ads/dataset/mixin/__init__.py +5 -0
- ads/dataset/mixin/dataset_accessor.py +134 -0
- ads/dataset/pipeline.py +58 -0
- ads/dataset/plot.py +710 -0
- ads/dataset/progress.py +86 -0
- ads/dataset/recommendation.py +297 -0
- ads/dataset/recommendation_transformer.py +502 -0
- ads/dataset/regression_dataset.py +14 -0
- ads/dataset/sampled_dataset.py +1050 -0
- ads/dataset/target.py +98 -0
- ads/dataset/timeseries.py +18 -0
- ads/dbmixin/__init__.py +5 -0
- ads/dbmixin/db_pandas_accessor.py +153 -0
- ads/environment/__init__.py +9 -0
- ads/environment/ml_runtime.py +66 -0
- ads/evaluations/README.md +14 -0
- ads/evaluations/__init__.py +109 -0
- ads/evaluations/evaluation_plot.py +983 -0
- ads/evaluations/evaluator.py +1334 -0
- ads/evaluations/statistical_metrics.py +543 -0
- ads/experiments/__init__.py +9 -0
- ads/experiments/capabilities.md +0 -0
- ads/explanations/__init__.py +21 -0
- ads/explanations/base_explainer.py +142 -0
- ads/explanations/capabilities.md +83 -0
- ads/explanations/explainer.py +190 -0
- ads/explanations/mlx_global_explainer.py +1050 -0
- ads/explanations/mlx_interface.py +386 -0
- ads/explanations/mlx_local_explainer.py +287 -0
- ads/explanations/mlx_whatif_explainer.py +201 -0
- ads/feature_engineering/__init__.py +20 -0
- ads/feature_engineering/accessor/__init__.py +5 -0
- ads/feature_engineering/accessor/dataframe_accessor.py +535 -0
- ads/feature_engineering/accessor/mixin/__init__.py +5 -0
- ads/feature_engineering/accessor/mixin/correlation.py +166 -0
- ads/feature_engineering/accessor/mixin/eda_mixin.py +266 -0
- ads/feature_engineering/accessor/mixin/eda_mixin_series.py +85 -0
- ads/feature_engineering/accessor/mixin/feature_types_mixin.py +211 -0
- ads/feature_engineering/accessor/mixin/utils.py +65 -0
- ads/feature_engineering/accessor/series_accessor.py +431 -0
- ads/feature_engineering/adsimage/__init__.py +5 -0
- ads/feature_engineering/adsimage/image.py +192 -0
- ads/feature_engineering/adsimage/image_reader.py +170 -0
- ads/feature_engineering/adsimage/interface/__init__.py +5 -0
- ads/feature_engineering/adsimage/interface/reader.py +19 -0
- ads/feature_engineering/adsstring/__init__.py +7 -0
- ads/feature_engineering/adsstring/oci_language/__init__.py +8 -0
- ads/feature_engineering/adsstring/string/__init__.py +8 -0
- ads/feature_engineering/data_schema.json +57 -0
- ads/feature_engineering/dataset/__init__.py +5 -0
- ads/feature_engineering/dataset/zip_code_data.py +42062 -0
- ads/feature_engineering/exceptions.py +40 -0
- ads/feature_engineering/feature_type/__init__.py +133 -0
- ads/feature_engineering/feature_type/address.py +184 -0
- ads/feature_engineering/feature_type/adsstring/__init__.py +5 -0
- ads/feature_engineering/feature_type/adsstring/common_regex_mixin.py +164 -0
- ads/feature_engineering/feature_type/adsstring/oci_language.py +93 -0
- ads/feature_engineering/feature_type/adsstring/parsers/__init__.py +5 -0
- ads/feature_engineering/feature_type/adsstring/parsers/base.py +47 -0
- ads/feature_engineering/feature_type/adsstring/parsers/nltk_parser.py +96 -0
- ads/feature_engineering/feature_type/adsstring/parsers/spacy_parser.py +221 -0
- ads/feature_engineering/feature_type/adsstring/string.py +258 -0
- ads/feature_engineering/feature_type/base.py +58 -0
- ads/feature_engineering/feature_type/boolean.py +183 -0
- ads/feature_engineering/feature_type/category.py +146 -0
- ads/feature_engineering/feature_type/constant.py +137 -0
- ads/feature_engineering/feature_type/continuous.py +151 -0
- ads/feature_engineering/feature_type/creditcard.py +314 -0
- ads/feature_engineering/feature_type/datetime.py +190 -0
- ads/feature_engineering/feature_type/discrete.py +134 -0
- ads/feature_engineering/feature_type/document.py +43 -0
- ads/feature_engineering/feature_type/gis.py +251 -0
- ads/feature_engineering/feature_type/handler/__init__.py +5 -0
- ads/feature_engineering/feature_type/handler/feature_validator.py +524 -0
- ads/feature_engineering/feature_type/handler/feature_warning.py +319 -0
- ads/feature_engineering/feature_type/handler/warnings.py +128 -0
- ads/feature_engineering/feature_type/integer.py +142 -0
- ads/feature_engineering/feature_type/ip_address.py +144 -0
- ads/feature_engineering/feature_type/ip_address_v4.py +138 -0
- ads/feature_engineering/feature_type/ip_address_v6.py +138 -0
- ads/feature_engineering/feature_type/lat_long.py +256 -0
- ads/feature_engineering/feature_type/object.py +43 -0
- ads/feature_engineering/feature_type/ordinal.py +132 -0
- ads/feature_engineering/feature_type/phone_number.py +135 -0
- ads/feature_engineering/feature_type/string.py +171 -0
- ads/feature_engineering/feature_type/text.py +93 -0
- ads/feature_engineering/feature_type/unknown.py +43 -0
- ads/feature_engineering/feature_type/zip_code.py +164 -0
- ads/feature_engineering/feature_type_manager.py +406 -0
- ads/feature_engineering/schema.py +795 -0
- ads/feature_engineering/utils.py +245 -0
- ads/feature_store/.readthedocs.yaml +19 -0
- ads/feature_store/README.md +65 -0
- ads/feature_store/__init__.py +9 -0
- ads/feature_store/common/__init__.py +0 -0
- ads/feature_store/common/enums.py +339 -0
- ads/feature_store/common/exceptions.py +18 -0
- ads/feature_store/common/spark_session_singleton.py +125 -0
- ads/feature_store/common/utils/__init__.py +0 -0
- ads/feature_store/common/utils/base64_encoder_decoder.py +72 -0
- ads/feature_store/common/utils/feature_schema_mapper.py +283 -0
- ads/feature_store/common/utils/transformation_utils.py +82 -0
- ads/feature_store/common/utils/utility.py +403 -0
- ads/feature_store/data_validation/__init__.py +0 -0
- ads/feature_store/data_validation/great_expectation.py +129 -0
- ads/feature_store/dataset.py +1230 -0
- ads/feature_store/dataset_job.py +530 -0
- ads/feature_store/docs/Dockerfile +7 -0
- ads/feature_store/docs/Makefile +44 -0
- ads/feature_store/docs/conf.py +28 -0
- ads/feature_store/docs/requirements.txt +14 -0
- ads/feature_store/docs/source/ads.feature_store.query.rst +20 -0
- ads/feature_store/docs/source/cicd.rst +137 -0
- ads/feature_store/docs/source/conf.py +86 -0
- ads/feature_store/docs/source/data_versioning.rst +33 -0
- ads/feature_store/docs/source/dataset.rst +388 -0
- ads/feature_store/docs/source/dataset_job.rst +27 -0
- ads/feature_store/docs/source/demo.rst +70 -0
- ads/feature_store/docs/source/entity.rst +78 -0
- ads/feature_store/docs/source/feature_group.rst +624 -0
- ads/feature_store/docs/source/feature_group_job.rst +29 -0
- ads/feature_store/docs/source/feature_store.rst +122 -0
- ads/feature_store/docs/source/feature_store_class.rst +123 -0
- ads/feature_store/docs/source/feature_validation.rst +66 -0
- ads/feature_store/docs/source/figures/cicd.png +0 -0
- ads/feature_store/docs/source/figures/data_validation.png +0 -0
- ads/feature_store/docs/source/figures/data_versioning.png +0 -0
- ads/feature_store/docs/source/figures/dataset.gif +0 -0
- ads/feature_store/docs/source/figures/dataset.png +0 -0
- ads/feature_store/docs/source/figures/dataset_lineage.png +0 -0
- ads/feature_store/docs/source/figures/dataset_statistics.png +0 -0
- ads/feature_store/docs/source/figures/dataset_statistics_viz.png +0 -0
- ads/feature_store/docs/source/figures/dataset_validation_results.png +0 -0
- ads/feature_store/docs/source/figures/dataset_validation_summary.png +0 -0
- ads/feature_store/docs/source/figures/drift_monitoring.png +0 -0
- ads/feature_store/docs/source/figures/entity.png +0 -0
- ads/feature_store/docs/source/figures/feature_group.png +0 -0
- ads/feature_store/docs/source/figures/feature_group_lineage.png +0 -0
- ads/feature_store/docs/source/figures/feature_group_statistics_viz.png +0 -0
- ads/feature_store/docs/source/figures/feature_store_deployment.png +0 -0
- ads/feature_store/docs/source/figures/feature_store_overview.png +0 -0
- ads/feature_store/docs/source/figures/featuregroup.gif +0 -0
- ads/feature_store/docs/source/figures/lineage_d1.png +0 -0
- ads/feature_store/docs/source/figures/lineage_d2.png +0 -0
- ads/feature_store/docs/source/figures/lineage_fg.png +0 -0
- ads/feature_store/docs/source/figures/logo-dark-mode.png +0 -0
- ads/feature_store/docs/source/figures/logo-light-mode.png +0 -0
- ads/feature_store/docs/source/figures/overview.png +0 -0
- ads/feature_store/docs/source/figures/resource_manager.png +0 -0
- ads/feature_store/docs/source/figures/resource_manager_feature_store_stack.png +0 -0
- ads/feature_store/docs/source/figures/resource_manager_home.png +0 -0
- ads/feature_store/docs/source/figures/stats_1.png +0 -0
- ads/feature_store/docs/source/figures/stats_2.png +0 -0
- ads/feature_store/docs/source/figures/stats_d.png +0 -0
- ads/feature_store/docs/source/figures/stats_fg.png +0 -0
- ads/feature_store/docs/source/figures/transformation.png +0 -0
- ads/feature_store/docs/source/figures/transformations.gif +0 -0
- ads/feature_store/docs/source/figures/validation.png +0 -0
- ads/feature_store/docs/source/figures/validation_fg.png +0 -0
- ads/feature_store/docs/source/figures/validation_results.png +0 -0
- ads/feature_store/docs/source/figures/validation_summary.png +0 -0
- ads/feature_store/docs/source/index.rst +81 -0
- ads/feature_store/docs/source/module.rst +8 -0
- ads/feature_store/docs/source/notebook.rst +94 -0
- ads/feature_store/docs/source/overview.rst +47 -0
- ads/feature_store/docs/source/quickstart.rst +176 -0
- ads/feature_store/docs/source/release_notes.rst +194 -0
- ads/feature_store/docs/source/setup_feature_store.rst +81 -0
- ads/feature_store/docs/source/statistics.rst +58 -0
- ads/feature_store/docs/source/transformation.rst +199 -0
- ads/feature_store/docs/source/ui.rst +65 -0
- ads/feature_store/docs/source/user_guides.setup.feature_store_operator.rst +66 -0
- ads/feature_store/docs/source/user_guides.setup.helm_chart.rst +192 -0
- ads/feature_store/docs/source/user_guides.setup.terraform.rst +338 -0
- ads/feature_store/entity.py +718 -0
- ads/feature_store/execution_strategy/__init__.py +0 -0
- ads/feature_store/execution_strategy/delta_lake/__init__.py +0 -0
- ads/feature_store/execution_strategy/delta_lake/delta_lake_service.py +375 -0
- ads/feature_store/execution_strategy/engine/__init__.py +0 -0
- ads/feature_store/execution_strategy/engine/spark_engine.py +316 -0
- ads/feature_store/execution_strategy/execution_strategy.py +113 -0
- ads/feature_store/execution_strategy/execution_strategy_provider.py +47 -0
- ads/feature_store/execution_strategy/spark/__init__.py +0 -0
- ads/feature_store/execution_strategy/spark/spark_execution.py +618 -0
- ads/feature_store/feature.py +192 -0
- ads/feature_store/feature_group.py +1494 -0
- ads/feature_store/feature_group_expectation.py +346 -0
- ads/feature_store/feature_group_job.py +602 -0
- ads/feature_store/feature_lineage/__init__.py +0 -0
- ads/feature_store/feature_lineage/graphviz_service.py +180 -0
- ads/feature_store/feature_option_details.py +50 -0
- ads/feature_store/feature_statistics/__init__.py +0 -0
- ads/feature_store/feature_statistics/statistics_service.py +99 -0
- ads/feature_store/feature_store.py +699 -0
- ads/feature_store/feature_store_registrar.py +518 -0
- ads/feature_store/input_feature_detail.py +149 -0
- ads/feature_store/mixin/__init__.py +4 -0
- ads/feature_store/mixin/oci_feature_store.py +145 -0
- ads/feature_store/model_details.py +73 -0
- ads/feature_store/query/__init__.py +0 -0
- ads/feature_store/query/filter.py +266 -0
- ads/feature_store/query/generator/__init__.py +0 -0
- ads/feature_store/query/generator/query_generator.py +298 -0
- ads/feature_store/query/join.py +161 -0
- ads/feature_store/query/query.py +403 -0
- ads/feature_store/query/validator/__init__.py +0 -0
- ads/feature_store/query/validator/query_validator.py +57 -0
- ads/feature_store/response/__init__.py +0 -0
- ads/feature_store/response/response_builder.py +68 -0
- ads/feature_store/service/__init__.py +0 -0
- ads/feature_store/service/oci_dataset.py +139 -0
- ads/feature_store/service/oci_dataset_job.py +199 -0
- ads/feature_store/service/oci_entity.py +125 -0
- ads/feature_store/service/oci_feature_group.py +164 -0
- ads/feature_store/service/oci_feature_group_job.py +214 -0
- ads/feature_store/service/oci_feature_store.py +182 -0
- ads/feature_store/service/oci_lineage.py +87 -0
- ads/feature_store/service/oci_transformation.py +104 -0
- ads/feature_store/statistics/__init__.py +0 -0
- ads/feature_store/statistics/abs_feature_value.py +49 -0
- ads/feature_store/statistics/charts/__init__.py +0 -0
- ads/feature_store/statistics/charts/abstract_feature_plot.py +37 -0
- ads/feature_store/statistics/charts/box_plot.py +148 -0
- ads/feature_store/statistics/charts/frequency_distribution.py +65 -0
- ads/feature_store/statistics/charts/probability_distribution.py +68 -0
- ads/feature_store/statistics/charts/top_k_frequent_elements.py +98 -0
- ads/feature_store/statistics/feature_stat.py +126 -0
- ads/feature_store/statistics/generic_feature_value.py +33 -0
- ads/feature_store/statistics/statistics.py +41 -0
- ads/feature_store/statistics_config.py +101 -0
- ads/feature_store/templates/feature_store_template.yaml +45 -0
- ads/feature_store/transformation.py +499 -0
- ads/feature_store/validation_output.py +57 -0
- ads/hpo/__init__.py +9 -0
- ads/hpo/_imports.py +91 -0
- ads/hpo/ads_search_space.py +439 -0
- ads/hpo/distributions.py +325 -0
- ads/hpo/objective.py +280 -0
- ads/hpo/search_cv.py +1657 -0
- ads/hpo/stopping_criterion.py +75 -0
- ads/hpo/tuner_artifact.py +413 -0
- ads/hpo/utils.py +91 -0
- ads/hpo/validation.py +140 -0
- ads/hpo/visualization/__init__.py +5 -0
- ads/hpo/visualization/_contour.py +23 -0
- ads/hpo/visualization/_edf.py +20 -0
- ads/hpo/visualization/_intermediate_values.py +21 -0
- ads/hpo/visualization/_optimization_history.py +25 -0
- ads/hpo/visualization/_parallel_coordinate.py +169 -0
- ads/hpo/visualization/_param_importances.py +26 -0
- ads/jobs/__init__.py +53 -0
- ads/jobs/ads_job.py +663 -0
- ads/jobs/builders/__init__.py +5 -0
- ads/jobs/builders/base.py +156 -0
- ads/jobs/builders/infrastructure/__init__.py +6 -0
- ads/jobs/builders/infrastructure/base.py +165 -0
- ads/jobs/builders/infrastructure/dataflow.py +1252 -0
- ads/jobs/builders/infrastructure/dsc_job.py +1894 -0
- ads/jobs/builders/infrastructure/dsc_job_runtime.py +1233 -0
- ads/jobs/builders/infrastructure/utils.py +65 -0
- ads/jobs/builders/runtimes/__init__.py +5 -0
- ads/jobs/builders/runtimes/artifact.py +338 -0
- ads/jobs/builders/runtimes/base.py +325 -0
- ads/jobs/builders/runtimes/container_runtime.py +242 -0
- ads/jobs/builders/runtimes/python_runtime.py +1016 -0
- ads/jobs/builders/runtimes/pytorch_runtime.py +204 -0
- ads/jobs/cli.py +104 -0
- ads/jobs/env_var_parser.py +131 -0
- ads/jobs/extension.py +160 -0
- ads/jobs/schema/__init__.py +5 -0
- ads/jobs/schema/infrastructure_schema.json +116 -0
- ads/jobs/schema/job_schema.json +42 -0
- ads/jobs/schema/runtime_schema.json +183 -0
- ads/jobs/schema/validator.py +141 -0
- ads/jobs/serializer.py +296 -0
- ads/jobs/templates/__init__.py +5 -0
- ads/jobs/templates/container.py +6 -0
- ads/jobs/templates/driver_notebook.py +177 -0
- ads/jobs/templates/driver_oci.py +500 -0
- ads/jobs/templates/driver_python.py +48 -0
- ads/jobs/templates/driver_pytorch.py +852 -0
- ads/jobs/templates/driver_utils.py +615 -0
- ads/jobs/templates/hostname_from_env.c +55 -0
- ads/jobs/templates/oci_metrics.py +181 -0
- ads/jobs/utils.py +104 -0
- ads/llm/__init__.py +28 -0
- ads/llm/autogen/__init__.py +2 -0
- ads/llm/autogen/constants.py +15 -0
- ads/llm/autogen/reports/__init__.py +2 -0
- ads/llm/autogen/reports/base.py +67 -0
- ads/llm/autogen/reports/data.py +103 -0
- ads/llm/autogen/reports/session.py +526 -0
- ads/llm/autogen/reports/templates/chat_box.html +13 -0
- ads/llm/autogen/reports/templates/chat_box_lt.html +5 -0
- ads/llm/autogen/reports/templates/chat_box_rt.html +6 -0
- ads/llm/autogen/reports/utils.py +56 -0
- ads/llm/autogen/v02/__init__.py +4 -0
- ads/llm/autogen/v02/client.py +295 -0
- ads/llm/autogen/v02/log_handlers/__init__.py +2 -0
- ads/llm/autogen/v02/log_handlers/oci_file_handler.py +83 -0
- ads/llm/autogen/v02/loggers/__init__.py +6 -0
- ads/llm/autogen/v02/loggers/metric_logger.py +320 -0
- ads/llm/autogen/v02/loggers/session_logger.py +580 -0
- ads/llm/autogen/v02/loggers/utils.py +86 -0
- ads/llm/autogen/v02/runtime_logging.py +163 -0
- ads/llm/chain.py +268 -0
- ads/llm/chat_template.py +31 -0
- ads/llm/deploy.py +63 -0
- ads/llm/guardrails/__init__.py +5 -0
- ads/llm/guardrails/base.py +442 -0
- ads/llm/guardrails/huggingface.py +44 -0
- ads/llm/langchain/__init__.py +5 -0
- ads/llm/langchain/plugins/__init__.py +5 -0
- ads/llm/langchain/plugins/chat_models/__init__.py +5 -0
- ads/llm/langchain/plugins/chat_models/oci_data_science.py +1027 -0
- ads/llm/langchain/plugins/embeddings/__init__.py +4 -0
- ads/llm/langchain/plugins/embeddings/oci_data_science_model_deployment_endpoint.py +184 -0
- ads/llm/langchain/plugins/llms/__init__.py +5 -0
- ads/llm/langchain/plugins/llms/oci_data_science_model_deployment_endpoint.py +979 -0
- ads/llm/requirements.txt +3 -0
- ads/llm/serialize.py +219 -0
- ads/llm/serializers/__init__.py +0 -0
- ads/llm/serializers/retrieval_qa.py +153 -0
- ads/llm/serializers/runnable_parallel.py +27 -0
- ads/llm/templates/score_chain.jinja2 +155 -0
- ads/llm/templates/tool_chat_template_hermes.jinja +130 -0
- ads/llm/templates/tool_chat_template_mistral_parallel.jinja +94 -0
- ads/model/__init__.py +52 -0
- ads/model/artifact.py +573 -0
- ads/model/artifact_downloader.py +254 -0
- ads/model/artifact_uploader.py +267 -0
- ads/model/base_properties.py +238 -0
- ads/model/common/.model-ignore +66 -0
- ads/model/common/__init__.py +5 -0
- ads/model/common/utils.py +142 -0
- ads/model/datascience_model.py +2635 -0
- ads/model/deployment/__init__.py +20 -0
- ads/model/deployment/common/__init__.py +5 -0
- ads/model/deployment/common/utils.py +308 -0
- ads/model/deployment/model_deployer.py +466 -0
- ads/model/deployment/model_deployment.py +1846 -0
- ads/model/deployment/model_deployment_infrastructure.py +671 -0
- ads/model/deployment/model_deployment_properties.py +493 -0
- ads/model/deployment/model_deployment_runtime.py +838 -0
- ads/model/extractor/__init__.py +5 -0
- ads/model/extractor/automl_extractor.py +74 -0
- ads/model/extractor/embedding_onnx_extractor.py +80 -0
- ads/model/extractor/huggingface_extractor.py +88 -0
- ads/model/extractor/keras_extractor.py +84 -0
- ads/model/extractor/lightgbm_extractor.py +93 -0
- ads/model/extractor/model_info_extractor.py +114 -0
- ads/model/extractor/model_info_extractor_factory.py +105 -0
- ads/model/extractor/pytorch_extractor.py +87 -0
- ads/model/extractor/sklearn_extractor.py +112 -0
- ads/model/extractor/spark_extractor.py +89 -0
- ads/model/extractor/tensorflow_extractor.py +85 -0
- ads/model/extractor/xgboost_extractor.py +94 -0
- ads/model/framework/__init__.py +5 -0
- ads/model/framework/automl_model.py +178 -0
- ads/model/framework/embedding_onnx_model.py +438 -0
- ads/model/framework/huggingface_model.py +399 -0
- ads/model/framework/lightgbm_model.py +266 -0
- ads/model/framework/pytorch_model.py +266 -0
- ads/model/framework/sklearn_model.py +250 -0
- ads/model/framework/spark_model.py +326 -0
- ads/model/framework/tensorflow_model.py +254 -0
- ads/model/framework/xgboost_model.py +258 -0
- ads/model/generic_model.py +3518 -0
- ads/model/model_artifact_boilerplate/README.md +381 -0
- ads/model/model_artifact_boilerplate/__init__.py +5 -0
- ads/model/model_artifact_boilerplate/artifact_introspection_test/__init__.py +5 -0
- ads/model/model_artifact_boilerplate/artifact_introspection_test/model_artifact_validate.py +427 -0
- ads/model/model_artifact_boilerplate/artifact_introspection_test/requirements.txt +2 -0
- ads/model/model_artifact_boilerplate/runtime.yaml +7 -0
- ads/model/model_artifact_boilerplate/score.py +61 -0
- ads/model/model_file_description_schema.json +68 -0
- ads/model/model_introspect.py +331 -0
- ads/model/model_metadata.py +1810 -0
- ads/model/model_metadata_mixin.py +460 -0
- ads/model/model_properties.py +63 -0
- ads/model/model_version_set.py +739 -0
- ads/model/runtime/__init__.py +5 -0
- ads/model/runtime/env_info.py +306 -0
- ads/model/runtime/model_deployment_details.py +37 -0
- ads/model/runtime/model_provenance_details.py +58 -0
- ads/model/runtime/runtime_info.py +81 -0
- ads/model/runtime/schemas/inference_env_info_schema.yaml +16 -0
- ads/model/runtime/schemas/model_provenance_schema.yaml +36 -0
- ads/model/runtime/schemas/training_env_info_schema.yaml +16 -0
- ads/model/runtime/utils.py +201 -0
- ads/model/serde/__init__.py +5 -0
- ads/model/serde/common.py +40 -0
- ads/model/serde/model_input.py +547 -0
- ads/model/serde/model_serializer.py +1184 -0
- ads/model/service/__init__.py +5 -0
- ads/model/service/oci_datascience_model.py +1076 -0
- ads/model/service/oci_datascience_model_deployment.py +500 -0
- ads/model/service/oci_datascience_model_version_set.py +176 -0
- ads/model/transformer/__init__.py +5 -0
- ads/model/transformer/onnx_transformer.py +324 -0
- ads/mysqldb/__init__.py +5 -0
- ads/mysqldb/mysql_db.py +227 -0
- ads/opctl/__init__.py +18 -0
- ads/opctl/anomaly_detection.py +11 -0
- ads/opctl/backend/__init__.py +5 -0
- ads/opctl/backend/ads_dataflow.py +353 -0
- ads/opctl/backend/ads_ml_job.py +710 -0
- ads/opctl/backend/ads_ml_pipeline.py +164 -0
- ads/opctl/backend/ads_model_deployment.py +209 -0
- ads/opctl/backend/base.py +146 -0
- ads/opctl/backend/local.py +1053 -0
- ads/opctl/backend/marketplace/__init__.py +9 -0
- ads/opctl/backend/marketplace/helm_helper.py +173 -0
- ads/opctl/backend/marketplace/local_marketplace.py +271 -0
- ads/opctl/backend/marketplace/marketplace_backend_runner.py +71 -0
- ads/opctl/backend/marketplace/marketplace_operator_interface.py +44 -0
- ads/opctl/backend/marketplace/marketplace_operator_runner.py +24 -0
- ads/opctl/backend/marketplace/marketplace_utils.py +212 -0
- ads/opctl/backend/marketplace/models/__init__.py +5 -0
- ads/opctl/backend/marketplace/models/bearer_token.py +94 -0
- ads/opctl/backend/marketplace/models/marketplace_type.py +70 -0
- ads/opctl/backend/marketplace/models/ocir_details.py +56 -0
- ads/opctl/backend/marketplace/prerequisite_checker.py +238 -0
- ads/opctl/cli.py +707 -0
- ads/opctl/cmds.py +869 -0
- ads/opctl/conda/__init__.py +5 -0
- ads/opctl/conda/cli.py +193 -0
- ads/opctl/conda/cmds.py +749 -0
- ads/opctl/conda/config.yaml +34 -0
- ads/opctl/conda/manifest_template.yaml +13 -0
- ads/opctl/conda/multipart_uploader.py +188 -0
- ads/opctl/conda/pack.py +89 -0
- ads/opctl/config/__init__.py +5 -0
- ads/opctl/config/base.py +57 -0
- ads/opctl/config/diagnostics/__init__.py +5 -0
- ads/opctl/config/diagnostics/distributed/default_requirements_config.yaml +62 -0
- ads/opctl/config/merger.py +255 -0
- ads/opctl/config/resolver.py +297 -0
- ads/opctl/config/utils.py +79 -0
- ads/opctl/config/validator.py +17 -0
- ads/opctl/config/versioner.py +68 -0
- ads/opctl/config/yaml_parsers/__init__.py +7 -0
- ads/opctl/config/yaml_parsers/base.py +58 -0
- ads/opctl/config/yaml_parsers/distributed/__init__.py +7 -0
- ads/opctl/config/yaml_parsers/distributed/yaml_parser.py +201 -0
- ads/opctl/constants.py +66 -0
- ads/opctl/decorator/__init__.py +5 -0
- ads/opctl/decorator/common.py +129 -0
- ads/opctl/diagnostics/__init__.py +5 -0
- ads/opctl/diagnostics/__main__.py +25 -0
- ads/opctl/diagnostics/check_distributed_job_requirements.py +212 -0
- ads/opctl/diagnostics/check_requirements.py +144 -0
- ads/opctl/diagnostics/requirement_exception.py +9 -0
- ads/opctl/distributed/README.md +109 -0
- ads/opctl/distributed/__init__.py +5 -0
- ads/opctl/distributed/certificates.py +32 -0
- ads/opctl/distributed/cli.py +207 -0
- ads/opctl/distributed/cmds.py +731 -0
- ads/opctl/distributed/common/__init__.py +5 -0
- ads/opctl/distributed/common/abstract_cluster_provider.py +449 -0
- ads/opctl/distributed/common/abstract_framework_spec_builder.py +88 -0
- ads/opctl/distributed/common/cluster_config_helper.py +103 -0
- ads/opctl/distributed/common/cluster_provider_factory.py +21 -0
- ads/opctl/distributed/common/cluster_runner.py +54 -0
- ads/opctl/distributed/common/framework_factory.py +29 -0
- ads/opctl/docker/Dockerfile.job +103 -0
- ads/opctl/docker/Dockerfile.job.arm +107 -0
- ads/opctl/docker/Dockerfile.job.gpu +175 -0
- ads/opctl/docker/base-env.yaml +13 -0
- ads/opctl/docker/cuda.repo +6 -0
- ads/opctl/docker/operator/.dockerignore +0 -0
- ads/opctl/docker/operator/Dockerfile +41 -0
- ads/opctl/docker/operator/Dockerfile.gpu +85 -0
- ads/opctl/docker/operator/cuda.repo +6 -0
- ads/opctl/docker/operator/environment.yaml +8 -0
- ads/opctl/forecast.py +11 -0
- ads/opctl/index.yaml +3 -0
- ads/opctl/model/__init__.py +5 -0
- ads/opctl/model/cli.py +65 -0
- ads/opctl/model/cmds.py +73 -0
- ads/opctl/operator/README.md +4 -0
- ads/opctl/operator/__init__.py +31 -0
- ads/opctl/operator/cli.py +344 -0
- ads/opctl/operator/cmd.py +596 -0
- ads/opctl/operator/common/__init__.py +5 -0
- ads/opctl/operator/common/backend_factory.py +460 -0
- ads/opctl/operator/common/const.py +27 -0
- ads/opctl/operator/common/data/synthetic.csv +16001 -0
- ads/opctl/operator/common/dictionary_merger.py +148 -0
- ads/opctl/operator/common/errors.py +42 -0
- ads/opctl/operator/common/operator_config.py +99 -0
- ads/opctl/operator/common/operator_loader.py +811 -0
- ads/opctl/operator/common/operator_schema.yaml +130 -0
- ads/opctl/operator/common/operator_yaml_generator.py +152 -0
- ads/opctl/operator/common/utils.py +208 -0
- ads/opctl/operator/lowcode/__init__.py +5 -0
- ads/opctl/operator/lowcode/anomaly/MLoperator +16 -0
- ads/opctl/operator/lowcode/anomaly/README.md +207 -0
- ads/opctl/operator/lowcode/anomaly/__init__.py +5 -0
- ads/opctl/operator/lowcode/anomaly/__main__.py +103 -0
- ads/opctl/operator/lowcode/anomaly/cmd.py +35 -0
- ads/opctl/operator/lowcode/anomaly/const.py +167 -0
- ads/opctl/operator/lowcode/anomaly/environment.yaml +10 -0
- ads/opctl/operator/lowcode/anomaly/model/__init__.py +5 -0
- ads/opctl/operator/lowcode/anomaly/model/anomaly_dataset.py +146 -0
- ads/opctl/operator/lowcode/anomaly/model/anomaly_merlion.py +162 -0
- ads/opctl/operator/lowcode/anomaly/model/automlx.py +99 -0
- ads/opctl/operator/lowcode/anomaly/model/autots.py +115 -0
- ads/opctl/operator/lowcode/anomaly/model/base_model.py +404 -0
- ads/opctl/operator/lowcode/anomaly/model/factory.py +110 -0
- ads/opctl/operator/lowcode/anomaly/model/isolationforest.py +78 -0
- ads/opctl/operator/lowcode/anomaly/model/oneclasssvm.py +78 -0
- ads/opctl/operator/lowcode/anomaly/model/randomcutforest.py +120 -0
- ads/opctl/operator/lowcode/anomaly/model/tods.py +119 -0
- ads/opctl/operator/lowcode/anomaly/operator_config.py +127 -0
- ads/opctl/operator/lowcode/anomaly/schema.yaml +401 -0
- ads/opctl/operator/lowcode/anomaly/utils.py +88 -0
- ads/opctl/operator/lowcode/common/__init__.py +5 -0
- ads/opctl/operator/lowcode/common/const.py +10 -0
- ads/opctl/operator/lowcode/common/data.py +116 -0
- ads/opctl/operator/lowcode/common/errors.py +47 -0
- ads/opctl/operator/lowcode/common/transformations.py +296 -0
- ads/opctl/operator/lowcode/common/utils.py +384 -0
- ads/opctl/operator/lowcode/feature_store_marketplace/MLoperator +13 -0
- ads/opctl/operator/lowcode/feature_store_marketplace/README.md +30 -0
- ads/opctl/operator/lowcode/feature_store_marketplace/__init__.py +5 -0
- ads/opctl/operator/lowcode/feature_store_marketplace/__main__.py +116 -0
- ads/opctl/operator/lowcode/feature_store_marketplace/cmd.py +85 -0
- ads/opctl/operator/lowcode/feature_store_marketplace/const.py +15 -0
- ads/opctl/operator/lowcode/feature_store_marketplace/environment.yaml +0 -0
- ads/opctl/operator/lowcode/feature_store_marketplace/models/__init__.py +4 -0
- ads/opctl/operator/lowcode/feature_store_marketplace/models/apigw_config.py +32 -0
- ads/opctl/operator/lowcode/feature_store_marketplace/models/db_config.py +43 -0
- ads/opctl/operator/lowcode/feature_store_marketplace/models/mysql_config.py +120 -0
- ads/opctl/operator/lowcode/feature_store_marketplace/models/serializable_yaml_model.py +34 -0
- ads/opctl/operator/lowcode/feature_store_marketplace/operator_utils.py +386 -0
- ads/opctl/operator/lowcode/feature_store_marketplace/schema.yaml +160 -0
- ads/opctl/operator/lowcode/forecast/MLoperator +25 -0
- ads/opctl/operator/lowcode/forecast/README.md +209 -0
- ads/opctl/operator/lowcode/forecast/__init__.py +5 -0
- ads/opctl/operator/lowcode/forecast/__main__.py +89 -0
- ads/opctl/operator/lowcode/forecast/cmd.py +40 -0
- ads/opctl/operator/lowcode/forecast/const.py +92 -0
- ads/opctl/operator/lowcode/forecast/environment.yaml +20 -0
- ads/opctl/operator/lowcode/forecast/errors.py +26 -0
- ads/opctl/operator/lowcode/forecast/model/__init__.py +5 -0
- ads/opctl/operator/lowcode/forecast/model/arima.py +279 -0
- ads/opctl/operator/lowcode/forecast/model/automlx.py +553 -0
- ads/opctl/operator/lowcode/forecast/model/autots.py +312 -0
- ads/opctl/operator/lowcode/forecast/model/base_model.py +875 -0
- ads/opctl/operator/lowcode/forecast/model/factory.py +106 -0
- ads/opctl/operator/lowcode/forecast/model/forecast_datasets.py +492 -0
- ads/opctl/operator/lowcode/forecast/model/ml_forecast.py +243 -0
- ads/opctl/operator/lowcode/forecast/model/neuralprophet.py +482 -0
- ads/opctl/operator/lowcode/forecast/model/prophet.py +450 -0
- ads/opctl/operator/lowcode/forecast/model_evaluator.py +244 -0
- ads/opctl/operator/lowcode/forecast/operator_config.py +234 -0
- ads/opctl/operator/lowcode/forecast/schema.yaml +506 -0
- ads/opctl/operator/lowcode/forecast/utils.py +397 -0
- ads/opctl/operator/lowcode/forecast/whatifserve/__init__.py +7 -0
- ads/opctl/operator/lowcode/forecast/whatifserve/deployment_manager.py +285 -0
- ads/opctl/operator/lowcode/forecast/whatifserve/score.py +246 -0
- ads/opctl/operator/lowcode/pii/MLoperator +17 -0
- ads/opctl/operator/lowcode/pii/README.md +208 -0
- ads/opctl/operator/lowcode/pii/__init__.py +5 -0
- ads/opctl/operator/lowcode/pii/__main__.py +78 -0
- ads/opctl/operator/lowcode/pii/cmd.py +39 -0
- ads/opctl/operator/lowcode/pii/constant.py +84 -0
- ads/opctl/operator/lowcode/pii/environment.yaml +17 -0
- ads/opctl/operator/lowcode/pii/errors.py +27 -0
- ads/opctl/operator/lowcode/pii/model/__init__.py +5 -0
- ads/opctl/operator/lowcode/pii/model/factory.py +82 -0
- ads/opctl/operator/lowcode/pii/model/guardrails.py +167 -0
- ads/opctl/operator/lowcode/pii/model/pii.py +145 -0
- ads/opctl/operator/lowcode/pii/model/processor/__init__.py +34 -0
- ads/opctl/operator/lowcode/pii/model/processor/email_replacer.py +34 -0
- ads/opctl/operator/lowcode/pii/model/processor/mbi_replacer.py +35 -0
- ads/opctl/operator/lowcode/pii/model/processor/name_replacer.py +225 -0
- ads/opctl/operator/lowcode/pii/model/processor/number_replacer.py +73 -0
- ads/opctl/operator/lowcode/pii/model/processor/remover.py +26 -0
- ads/opctl/operator/lowcode/pii/model/report.py +487 -0
- ads/opctl/operator/lowcode/pii/operator_config.py +95 -0
- ads/opctl/operator/lowcode/pii/schema.yaml +108 -0
- ads/opctl/operator/lowcode/pii/utils.py +43 -0
- ads/opctl/operator/lowcode/recommender/MLoperator +16 -0
- ads/opctl/operator/lowcode/recommender/README.md +206 -0
- ads/opctl/operator/lowcode/recommender/__init__.py +5 -0
- ads/opctl/operator/lowcode/recommender/__main__.py +82 -0
- ads/opctl/operator/lowcode/recommender/cmd.py +33 -0
- ads/opctl/operator/lowcode/recommender/constant.py +30 -0
- ads/opctl/operator/lowcode/recommender/environment.yaml +11 -0
- ads/opctl/operator/lowcode/recommender/model/base_model.py +212 -0
- ads/opctl/operator/lowcode/recommender/model/factory.py +56 -0
- ads/opctl/operator/lowcode/recommender/model/recommender_dataset.py +25 -0
- ads/opctl/operator/lowcode/recommender/model/svd.py +106 -0
- ads/opctl/operator/lowcode/recommender/operator_config.py +81 -0
- ads/opctl/operator/lowcode/recommender/schema.yaml +265 -0
- ads/opctl/operator/lowcode/recommender/utils.py +13 -0
- ads/opctl/operator/runtime/__init__.py +5 -0
- ads/opctl/operator/runtime/const.py +17 -0
- ads/opctl/operator/runtime/container_runtime_schema.yaml +50 -0
- ads/opctl/operator/runtime/marketplace_runtime.py +50 -0
- ads/opctl/operator/runtime/python_marketplace_runtime_schema.yaml +21 -0
- ads/opctl/operator/runtime/python_runtime_schema.yaml +21 -0
- ads/opctl/operator/runtime/runtime.py +115 -0
- ads/opctl/schema.yaml.yml +36 -0
- ads/opctl/script.py +40 -0
- ads/opctl/spark/__init__.py +5 -0
- ads/opctl/spark/cli.py +43 -0
- ads/opctl/spark/cmds.py +147 -0
- ads/opctl/templates/diagnostic_report_template.jinja2 +102 -0
- ads/opctl/utils.py +344 -0
- ads/oracledb/__init__.py +5 -0
- ads/oracledb/oracle_db.py +346 -0
- ads/pipeline/__init__.py +39 -0
- ads/pipeline/ads_pipeline.py +2279 -0
- ads/pipeline/ads_pipeline_run.py +772 -0
- ads/pipeline/ads_pipeline_step.py +605 -0
- ads/pipeline/builders/__init__.py +5 -0
- ads/pipeline/builders/infrastructure/__init__.py +5 -0
- ads/pipeline/builders/infrastructure/custom_script.py +32 -0
- ads/pipeline/cli.py +119 -0
- ads/pipeline/extension.py +291 -0
- ads/pipeline/schema/__init__.py +5 -0
- ads/pipeline/schema/cs_step_schema.json +35 -0
- ads/pipeline/schema/ml_step_schema.json +31 -0
- ads/pipeline/schema/pipeline_schema.json +71 -0
- ads/pipeline/visualizer/__init__.py +5 -0
- ads/pipeline/visualizer/base.py +570 -0
- ads/pipeline/visualizer/graph_renderer.py +272 -0
- ads/pipeline/visualizer/text_renderer.py +84 -0
- ads/secrets/__init__.py +11 -0
- ads/secrets/adb.py +386 -0
- ads/secrets/auth_token.py +86 -0
- ads/secrets/big_data_service.py +365 -0
- ads/secrets/mysqldb.py +149 -0
- ads/secrets/oracledb.py +160 -0
- ads/secrets/secrets.py +407 -0
- ads/telemetry/__init__.py +7 -0
- ads/telemetry/base.py +69 -0
- ads/telemetry/client.py +122 -0
- ads/telemetry/telemetry.py +257 -0
- ads/templates/dataflow_pyspark.jinja2 +13 -0
- ads/templates/dataflow_sparksql.jinja2 +22 -0
- ads/templates/func.jinja2 +20 -0
- ads/templates/schemas/openapi.json +1740 -0
- ads/templates/score-pkl.jinja2 +173 -0
- ads/templates/score.jinja2 +322 -0
- ads/templates/score_embedding_onnx.jinja2 +202 -0
- ads/templates/score_generic.jinja2 +165 -0
- ads/templates/score_huggingface_pipeline.jinja2 +217 -0
- ads/templates/score_lightgbm.jinja2 +185 -0
- ads/templates/score_onnx.jinja2 +407 -0
- ads/templates/score_onnx_new.jinja2 +473 -0
- ads/templates/score_oracle_automl.jinja2 +185 -0
- ads/templates/score_pyspark.jinja2 +154 -0
- ads/templates/score_pytorch.jinja2 +219 -0
- ads/templates/score_scikit-learn.jinja2 +184 -0
- ads/templates/score_tensorflow.jinja2 +184 -0
- ads/templates/score_xgboost.jinja2 +178 -0
- ads/text_dataset/__init__.py +5 -0
- ads/text_dataset/backends.py +211 -0
- ads/text_dataset/dataset.py +445 -0
- ads/text_dataset/extractor.py +207 -0
- ads/text_dataset/options.py +53 -0
- ads/text_dataset/udfs.py +22 -0
- ads/text_dataset/utils.py +49 -0
- ads/type_discovery/__init__.py +9 -0
- ads/type_discovery/abstract_detector.py +21 -0
- ads/type_discovery/constant_detector.py +41 -0
- ads/type_discovery/continuous_detector.py +54 -0
- ads/type_discovery/credit_card_detector.py +99 -0
- ads/type_discovery/datetime_detector.py +92 -0
- ads/type_discovery/discrete_detector.py +118 -0
- ads/type_discovery/document_detector.py +146 -0
- ads/type_discovery/ip_detector.py +68 -0
- ads/type_discovery/latlon_detector.py +90 -0
- ads/type_discovery/phone_number_detector.py +63 -0
- ads/type_discovery/type_discovery_driver.py +87 -0
- ads/type_discovery/typed_feature.py +594 -0
- ads/type_discovery/unknown_detector.py +41 -0
- ads/type_discovery/zipcode_detector.py +48 -0
- ads/vault/__init__.py +7 -0
- ads/vault/vault.py +237 -0
- {oracle_ads-2.13.9rc0.dist-info → oracle_ads-2.13.10.dist-info}/METADATA +150 -149
- oracle_ads-2.13.10.dist-info/RECORD +858 -0
- {oracle_ads-2.13.9rc0.dist-info → oracle_ads-2.13.10.dist-info}/WHEEL +1 -2
- {oracle_ads-2.13.9rc0.dist-info → oracle_ads-2.13.10.dist-info}/entry_points.txt +2 -1
- oracle_ads-2.13.9rc0.dist-info/RECORD +0 -9
- oracle_ads-2.13.9rc0.dist-info/top_level.txt +0 -1
- {oracle_ads-2.13.9rc0.dist-info → oracle_ads-2.13.10.dist-info}/licenses/LICENSE.txt +0 -0
@@ -0,0 +1,450 @@
|
|
1
|
+
#!/usr/bin/env python
|
2
|
+
|
3
|
+
# Copyright (c) 2024, 2025 Oracle and/or its affiliates.
|
4
|
+
# Licensed under the Universal Permissive License v 1.0 as shown at https://oss.oracle.com/licenses/upl/
|
5
|
+
|
6
|
+
import logging
|
7
|
+
import traceback
|
8
|
+
|
9
|
+
import matplotlib as mpl
|
10
|
+
import numpy as np
|
11
|
+
import optuna
|
12
|
+
import pandas as pd
|
13
|
+
from joblib import Parallel, delayed
|
14
|
+
|
15
|
+
from ads.opctl import logger
|
16
|
+
from ads.opctl.operator.lowcode.common.utils import set_log_level
|
17
|
+
from ads.opctl.operator.lowcode.forecast.operator_config import ForecastOperatorConfig
|
18
|
+
from ads.opctl.operator.lowcode.forecast.utils import (
|
19
|
+
_select_plot_list,
|
20
|
+
)
|
21
|
+
|
22
|
+
from ..const import (
|
23
|
+
DEFAULT_TRIALS,
|
24
|
+
PROPHET_INTERNAL_DATE_COL,
|
25
|
+
SupportedModels,
|
26
|
+
)
|
27
|
+
from .base_model import ForecastOperatorBaseModel
|
28
|
+
from .forecast_datasets import ForecastDatasets, ForecastOutput
|
29
|
+
|
30
|
+
try:
    # Best-effort, import-time configuration: align the log levels of the
    # "prophet" and "cmdstanpy" loggers with the operator logger and raise
    # matplotlib's open-figure warning threshold (the report opens many figures).
    set_log_level("prophet", logger.level)
    set_log_level("cmdstanpy", logger.level)
    mpl.rcParams["figure.max_open_warning"] = 100
except Exception as e:
    # This setup is cosmetic, so it must never break the import; still leave a
    # trace instead of swallowing the failure silently.
    logger.debug(f"Could not configure prophet logging/plot defaults: {e}")
|
36
|
+
|
37
|
+
|
38
|
+
def _add_unit(num, unit):
|
39
|
+
return f"{num} {unit}"
|
40
|
+
|
41
|
+
|
42
|
+
def _fit_model(data, params, additional_regressors):
    """Construct a Prophet model from ``params`` and fit it on ``data``.

    Three keys of ``params`` are handled here instead of being forwarded to
    the ``Prophet`` constructor:

    * ``monthly_seasonality`` - when truthy, a "monthly" seasonality
      (period 30.5, fourier order 5) is added to the model.
    * ``min`` / ``max`` - when either is present, growth is switched to
      ``"logistic"``; ``min`` is written to ``data["floor"]`` and ``max`` to
      ``data["cap"]``.

    Both arguments are modified in place: ``data`` gains the ``floor`` / ``cap``
    columns, and ``params`` gains ``growth`` (when bounds are given) while the
    popped keys are put back after the model has been constructed.

    Parameters
    ----------
    data:
        Frame passed to ``Prophet.fit``.
    params: dict
        Keyword arguments for ``Prophet`` plus the special keys above.
    additional_regressors:
        Iterable of names registered through ``add_regressor``.

    Returns
    -------
    The fitted Prophet model.
    """
    from prophet import Prophet

    use_monthly = params.pop("monthly_seasonality", False)

    floor_given = "min" in params
    cap_given = "max" in params
    if floor_given or cap_given:
        params["growth"] = "logistic"
    # Popping an absent key with a default is a no-op, so this is safe either way.
    floor_value = params.pop("min", None)
    cap_value = params.pop("max", None)

    prophet_model = Prophet(**params)
    if use_monthly:
        prophet_model.add_seasonality(name="monthly", period=30.5, fourier_order=5)
        params["monthly_seasonality"] = use_monthly
    for regressor in additional_regressors:
        prophet_model.add_regressor(regressor)

    if floor_given:
        data["floor"] = float(floor_value)
        params["min"] = floor_value
    if cap_given:
        data["cap"] = float(cap_value)
        params["max"] = cap_value

    prophet_model.fit(data)
    return prophet_model
|
70
|
+
|
71
|
+
|
72
|
+
class ProphetOperatorModel(ForecastOperatorBaseModel):
    """Class representing Prophet operator model.

    One Prophet model is trained per series. Forecasts, fitted models, model
    parameters and per-series errors are stored on the instance while training.
    """

    def __init__(self, config: ForecastOperatorConfig, datasets: ForecastDatasets):
        """Initialize the base operator model and empty explanation containers."""
        super().__init__(config=config, datasets=datasets)
        self.global_explanation = {}
        self.local_explanation = {}

    def set_kwargs(self):
        """Return the model kwargs with Prophet's ``interval_width`` filled in.

        The spec's ``model_kwargs`` dict is updated in place and returned.
        """
        # Extract the Confidence Interval Width and convert to prophet's equivalent - interval_width
        if self.spec.confidence_interval_width is None:
            # NOTE(review): a default ``alpha`` of 0.90 yields a width of 0.10,
            # which looks inverted - confirm the intended default.
            self.spec.confidence_interval_width = 1 - self.spec.model_kwargs.get(
                "alpha", 0.90
            )
        model_kwargs = self.spec.model_kwargs
        model_kwargs["interval_width"] = self.spec.confidence_interval_width
        return model_kwargs

    def _train_model(self, i, series_id, df, model_kwargs):
        """Fit (or reuse) the model for one series and record its outputs.

        Any exception is caught, stored in ``self.errors_dict[series_id]`` and
        logged as a warning, so a failing series does not stop the others.

        Parameters
        ----------
        i:
            Position of the series; used only in debug logging.
        series_id:
            Key under which all outputs for this series are stored.
        df:
            Data for this series.
        model_kwargs: dict
            Keyword arguments for the model; may be replaced by tuned values.
        """
        try:
            self.forecast_output.init_series_output(
                series_id=series_id, data_at_series=df
            )

            data = self.preprocess(df, series_id)
            data_i = self.drop_horizon(data)
            if self.loaded_models is not None and series_id in self.loaded_models:
                model = self.loaded_models[series_id]
            else:
                if self.perform_tuning:
                    model_kwargs = self.run_tuning(data_i, model_kwargs)

                # _fit_model may add "floor"/"cap" columns to ``data`` in place;
                # the ``future`` frame below is derived from that same frame.
                model = _fit_model(
                    data=data,
                    params=model_kwargs,
                    additional_regressors=self.additional_regressors,
                )

            # Get future df for prediction
            future = data.drop("y", axis=1)

            # Make Prediction
            forecast = model.predict(future)
            logger.debug(f"-----------------Model {i}----------------------")
            logger.debug(
                forecast[
                    [PROPHET_INTERNAL_DATE_COL, "yhat", "yhat_lower", "yhat_upper"]
                ].tail()
            )

            self.outputs[series_id] = forecast
            self.forecast_output.populate_series_output(
                series_id=series_id,
                fit_val=self.drop_horizon(forecast["yhat"]).values,
                forecast_val=self.get_horizon(forecast["yhat"]).values,
                upper_bound=self.get_horizon(forecast["yhat_upper"]).values,
                lower_bound=self.get_horizon(forecast["yhat_lower"]).values,
            )
            # Get all features that make up the forecast. Exclude CI (upper/lower)
            core_columns = forecast.columns[
                ~forecast.columns.str.endswith("_lower")
                & ~forecast.columns.str.endswith("_upper")
            ]
            core_columns = set(core_columns) - {
                "additive_terms",
                "extra_regressors_additive",
                "multiplicative_terms",
                "extra_regressors_multiplicative",
                "cap",
                "floor",
                "yhat",
            }
            # These components are summed into a single column named after the
            # target and then dropped individually from the explanation frame.
            combine_terms = list(
                core_columns.intersection(
                    {
                        "trend",
                        "daily",
                        "weekly",
                        "yearly",
                        "monthly",
                        "holidays",
                        "zeros",
                    }
                )
            )

            temp_df = (
                forecast[list(core_columns)]
                .rename({"ds": "Date"}, axis=1)
                .set_index("Date")
            )
            temp_df[self.spec.target_column] = temp_df[combine_terms].sum(axis=1)
            self.explanations_info[series_id] = temp_df.drop(combine_terms, axis=1)

            self.models[series_id] = {}
            self.models[series_id]["model"] = model
            self.models[series_id]["le"] = self.le[series_id]

            # Record the model's attributes as parameters, minus the bulky
            # training history and fit objects.
            params = vars(model).copy()
            for param in ["history", "history_dates", "stan_fit"]:
                params.pop(param, None)
            self.model_parameters[series_id] = {
                "framework": SupportedModels.Prophet,
                **params,
            }

            logger.debug("===========Done===========")
        except Exception as e:
            self.errors_dict[series_id] = {
                "model_name": self.spec.model,
                "error": str(e),
                "error_trace": traceback.format_exc(),
            }
            logger.warning(f"Encountered Error: {e}. Skipping.")
            logger.warning(traceback.format_exc())

    def _build_model(self) -> pd.DataFrame:
        """Train every series in parallel and return the long-format forecast."""
        full_data_dict = self.datasets.get_data_by_series()
        self.models = {}
        self.outputs = {}
        self.explanations_info = {}
        self.additional_regressors = self.datasets.get_additional_data_column_names()
        model_kwargs = self.set_kwargs()
        self.forecast_output = ForecastOutput(
            confidence_interval_width=self.spec.confidence_interval_width,
            horizon=self.spec.horizon,
            target_column=self.original_target_column,
            dt_column=self.spec.datetime_column.name,
        )

        # require="sharedmem" keeps the workers in this process's memory, so the
        # per-series results written onto ``self`` are visible here. Each task
        # receives its own copy of the kwargs because training mutates them.
        Parallel(n_jobs=-1, require="sharedmem")(
            delayed(ProphetOperatorModel._train_model)(
                self, i, series_id, df, model_kwargs.copy()
            )
            for i, (series_id, df) in enumerate(full_data_dict.items())
        )

        return self.forecast_output.get_forecast_long()

    def run_tuning(self, data_i, model_kwargs_i):
        """Tune Prophet hyperparameters with Optuna and return the merged kwargs.

        Parameters
        ----------
        data_i:
            Training data for one series.
        model_kwargs_i: dict
            User supplied kwargs; these take precedence over tuned values.

        Returns
        -------
        dict
            The best parameters found, overridden by ``model_kwargs_i``.
        """
        from prophet import Prophet
        from prophet.diagnostics import cross_validation, performance_metrics

        def objective(trial):
            params = {
                "seasonality_mode": trial.suggest_categorical(
                    "seasonality_mode", ["additive", "multiplicative"]
                ),
                "changepoint_prior_scale": trial.suggest_float(
                    "changepoint_prior_scale", 0.001, 0.5, log=True
                ),
                "seasonality_prior_scale": trial.suggest_float(
                    "seasonality_prior_scale", 0.01, 10, log=True
                ),
                "holidays_prior_scale": trial.suggest_float(
                    "holidays_prior_scale", 0.01, 10, log=True
                ),
                "changepoint_range": trial.suggest_float(
                    "changepoint_range", 0.8, 0.95
                ),
            }
            params.update(model_kwargs_i)

            model = _fit_model(
                data=data_i,
                params=params,
                additional_regressors=self.additional_regressors,
            )

            # Manual workaround because pandas 1.x dropped support for M and Y
            # NOTE(review): ``interval`` starts as the horizon and is multiplied
            # by the horizon again below - confirm this is intended.
            interval = self.spec.horizon
            freq = self.datasets.get_datetime_frequency()
            unit = freq.split("-")[0] if freq else None
            if unit == "M":
                unit = "D"
                interval = interval * 30.5
            elif unit == "Y":
                unit = "D"
                interval = interval * 365.25
            horizon = _add_unit(int(self.spec.horizon * interval), unit=unit)
            initial = _add_unit((data_i.shape[0] * interval) // 2, unit=unit)
            period = _add_unit((data_i.shape[0] * interval) // 4, unit=unit)

            logger.debug(
                f"using: horizon: {horizon}. initial:{initial}, period: {period}"
            )

            df_cv = cross_validation(
                model,
                horizon=horizon,
                initial=initial,
                period=period,
                parallel="threads",
            )
            df_p = performance_metrics(df_cv)
            try:
                return np.mean(df_p[self.spec.metric])
            except KeyError:
                logger.warning(
                    f"Could not find the metric {self.spec.metric} within "
                    f"the performance metrics: {df_p.columns}. Defaulting to `rmse`"
                )
                return np.mean(df_p["rmse"])

        study = optuna.create_study(direction="minimize")
        # Seed the search with Prophet's own defaults as the first trial.
        m_temp = Prophet()
        study.enqueue_trial(
            {
                "seasonality_mode": m_temp.seasonality_mode,
                "changepoint_prior_scale": m_temp.changepoint_prior_scale,
                "seasonality_prior_scale": m_temp.seasonality_prior_scale,
                "holidays_prior_scale": m_temp.holidays_prior_scale,
                "changepoint_range": m_temp.changepoint_range,
            }
        )
        study.optimize(
            objective,
            n_trials=self.spec.tuning.n_trials if self.spec.tuning else DEFAULT_TRIALS,
            n_jobs=-1,
        )

        # ``study.best_params`` builds a new dict on every access, so updating it
        # in place and reading it again would discard the user's kwargs. Merge
        # into a local dict instead.
        best_params = dict(study.best_params)
        best_params.update(model_kwargs_i)
        return best_params

    def explain_model(self):
        """Derive local and global explanations from ``self.explanations_info``.

        Local explanations are the horizon rows of each series' frame; global
        explanations are the absolute mean of the non-horizon rows, also
        expressed as a percentage of each series' total.
        """
        self.local_explanation = {}
        global_expl = []

        for s_id, expl_df in self.explanations_info.items():
            # Local Expl
            # Copy so the added column is not written onto a slice of expl_df.
            self.local_explanation[s_id] = self.get_horizon(expl_df).copy()
            self.local_explanation[s_id]["Series"] = s_id
            self.local_explanation[s_id].index.rename(self.dt_column_name, inplace=True)
            # Global Expl
            g_expl = self.drop_horizon(expl_df).mean()
            g_expl.name = s_id
            global_expl.append(np.abs(g_expl))
        self.global_explanation = pd.concat(global_expl, axis=1)
        self.formatted_global_explanation = (
            self.global_explanation / self.global_explanation.sum(axis=0) * 100
        )
        self.formatted_local_explanation = pd.concat(self.local_explanation.values())

    def _generate_report(self):
        """Build the report sections for the trained models.

        Returns
        -------
        tuple
            ``(model_description, other_sections)``: a text block describing
            Prophet and the list of report sections that could be built.
        """
        import report_creator as rc
        from prophet.plot import add_changepoints_to_plot

        logging.getLogger("report_creator").setLevel(logging.WARNING)

        series_ids = self.models.keys()
        all_sections = []
        if len(series_ids) > 0:
            sec1 = _select_plot_list(
                lambda s_id: self.models[s_id]["model"].plot(
                    self.outputs[s_id], include_legend=True
                ),
                series_ids=series_ids,
                target_category_column=self.target_cat_col,
            )
            section_1 = rc.Block(
                rc.Heading("Forecast Overview", level=2),
                rc.Text(
                    "These plots show your forecast in the context of historical data."
                ),
                sec1,
            )

            sec2 = _select_plot_list(
                lambda s_id: self.models[s_id]["model"].plot_components(
                    self.outputs[s_id]
                ),
                series_ids=series_ids,
                target_category_column=self.target_cat_col,
            )
            section_2 = rc.Block(
                rc.Heading("Forecast Broken Down by Trend Component", level=2), sec2
            )

            sec3_figs = {
                s_id: self.models[s_id]["model"].plot(self.outputs[s_id])
                for s_id in series_ids
            }
            for s_id in series_ids:
                add_changepoints_to_plot(
                    sec3_figs[s_id].gca(),
                    self.models[s_id]["model"],
                    self.outputs[s_id],
                )
            sec3 = _select_plot_list(
                lambda s_id: sec3_figs[s_id],
                series_ids=series_ids,
                target_category_column=self.target_cat_col,
            )
            section_3 = rc.Block(rc.Heading("Forecast Changepoints", level=2), sec3)

            all_sections = [section_1, section_2, section_3]

            # Kept inside the guard: pd.concat raises on an empty list, which is
            # what model_states would be when no model was trained.
            sec5_text = rc.Heading("Prophet Model Seasonality Components", level=2)
            model_states = []
            for s_id in series_ids:
                m = self.models[s_id]["model"]
                model_states.append(
                    pd.Series(
                        m.seasonalities,
                        index=pd.Index(m.seasonalities.keys(), dtype="object"),
                        name=s_id
                        if self.target_cat_col
                        else self.original_target_column,
                        dtype="object",
                    )
                )
            all_model_states = pd.concat(model_states, axis=1)
            if not all_model_states.empty:
                sec5 = rc.DataTable(all_model_states, index=True)
                all_sections = all_sections + [sec5_text, sec5]

        if self.spec.generate_explanations:
            try:
                # If the key is present, call the "explain_model" method
                self.explain_model()

                if not self.target_cat_col:
                    self.formatted_global_explanation = (
                        self.formatted_global_explanation.rename(
                            {"Series 1": self.original_target_column},
                            axis=1,
                        )
                    )
                    self.formatted_local_explanation.drop(
                        "Series", axis=1, inplace=True
                    )

                # Create a markdown section for the global explainability
                global_explanation_section = rc.Block(
                    rc.Heading("Global Explainability", level=2),
                    rc.Text(
                        "The following tables provide the feature attribution for the global explainability."
                    ),
                    rc.DataTable(self.formatted_global_explanation, index=True),
                )

                blocks = [
                    rc.DataTable(
                        local_ex_df.drop("Series", axis=1),
                        label=s_id if self.target_cat_col else None,
                        index=True,
                    )
                    for s_id, local_ex_df in self.local_explanation.items()
                ]
                local_explanation_section = rc.Block(
                    rc.Heading("Local Explanation of Models", level=2),
                    rc.Select(blocks=blocks) if len(blocks) > 1 else blocks[0],
                )

                # Append the global explanation text and section to the "all_sections" list
                all_sections = all_sections + [
                    global_explanation_section,
                    local_explanation_section,
                ]
            except Exception as e:
                # Do not fail the whole run due to explanations failure
                logger.warning(f"Failed to generate Explanations with error: {e}.")
                logger.debug(f"Full Traceback: {traceback.format_exc()}")
                self.errors_dict["explainer_error"] = str(e)
                self.errors_dict["explainer_error_error"] = traceback.format_exc()

        model_description = rc.Text(
            """Prophet is a procedure for forecasting time series data based on an additive model where non-linear trends are fit with yearly, weekly, and daily seasonality, plus holiday effects. It works best with time series that have strong seasonal effects and several seasons of historical data. Prophet is robust to missing data and shifts in the trend, and typically handles outliers well."""
        )
        other_sections = all_sections

        return (
            model_description,
            other_sections,
        )
|
@@ -0,0 +1,244 @@
|
|
1
|
+
# Copyright (c) 2023 Oracle and/or its affiliates.
|
2
|
+
# Licensed under the Universal Permissive License v 1.0 as shown at https://oss.oracle.com/licenses/upl/
|
3
|
+
|
4
|
+
|
5
|
+
from pathlib import Path
|
6
|
+
|
7
|
+
import numpy as np
|
8
|
+
import pandas as pd
|
9
|
+
|
10
|
+
from ads.opctl import logger
|
11
|
+
from ads.opctl.operator.lowcode.common.const import DataColumns
|
12
|
+
from ads.opctl.operator.lowcode.common.errors import InsufficientDataError
|
13
|
+
from ads.opctl.operator.lowcode.forecast.const import BACKTEST_REPORT_NAME
|
14
|
+
from ads.opctl.operator.lowcode.forecast.model.factory import SupportedModels
|
15
|
+
|
16
|
+
from .model.forecast_datasets import ForecastDatasets
|
17
|
+
from .operator_config import ForecastOperatorConfig
|
18
|
+
|
19
|
+
|
20
|
+
class ModelEvaluator:
    """
    A class used to evaluate and determine the best model or framework from a given set of candidates.

    This class is responsible for comparing different models or frameworks based on specified evaluation
    metrics and returning the best-performing option.
    """

    def __init__(self, models, k=5, subsample_ratio=0.20):
        """
        Initializes the ModelEvaluator with a list of models, number of backtests and subsample ratio.

        Properties:
        ----------
        models (list): The list of models to be evaluated.
        k (int): The number of times each model is backtested to verify its performance.
        subsample_ratio (float): The proportion of the data used in the evaluation process.
        """
        self.models = models
        self.k = k
        self.subsample_ratio = subsample_ratio
        # Lower bound on the number of series kept when sub-sampling.
        self.minimum_sample_count = 5

    def generate_cutoffs(self, unique_dates, horizon):
        """
        Picks the training cut-off dates for up to ``self.k`` backtests.

        The dates are sorted ascending and cut-offs are taken from the end,
        ``horizon`` positions apart, so that each backtest has ``horizon``
        dates after its cut-off. A backtest is only kept when its training
        window holds at least ``2 * horizon`` dates.

        Parameters
        ----------
        unique_dates: array-like of the dates of a single series.
        horizon (int): Number of periods forecast in each backtest.

        Returns
        -------
        numpy.ndarray: Cut-off dates ordered from most recent to oldest;
        empty when no backtest has a large enough training window.
        """
        sorted_dates = np.sort(unique_dates)
        train_window_size = [
            len(sorted_dates) - (i + 1) * horizon for i in range(self.k)
        ]
        valid_train_window_size = [ws for ws in train_window_size if ws >= horizon * 2]
        if len(valid_train_window_size) < self.k:
            # Report the number of feasible backtests, not the list of window sizes.
            logger.warning(
                f"Only {len(valid_train_window_size)} backtests can be created"
            )
        # Walk backwards from the last date that still leaves `horizon` dates
        # for testing, stepping one horizon at a time, then drop the cut-offs
        # whose training window is too short.
        cut_offs = sorted_dates[-horizon - 1 : -horizon * (self.k + 1) : -horizon][
            : len(valid_train_window_size)
        ]
        return cut_offs

    def generate_k_fold_data(
        self, datasets: "ForecastDatasets", operator_config: "ForecastOperatorConfig"
    ):
        """
        Builds the train / additional / test frames used by each backtest.

        Only a subset of the series is used: the ``sample_count`` series with
        the most rows (``value_counts`` orders by descending count), where
        ``sample_count`` is ``max(minimum_sample_count, n_series * subsample_ratio)``.
        The cut-off dates are derived from the series with the fewest rows.

        Returns
        -------
        tuple: ``(cut_offs, training_datasets, additional_data, test_datasets)``
        where the three lists are aligned with ``cut_offs``.

        Raises
        ------
        InsufficientDataError: When no cut-off can be generated.
        """
        date_col = operator_config.spec.datetime_column.name
        horizon = operator_config.spec.horizon
        historical_data = datasets.historical_data.data.reset_index()
        series_col = DataColumns.Series
        group_counts = historical_data[series_col].value_counts()

        sample_count = max(
            self.minimum_sample_count, int(len(group_counts) * self.subsample_ratio)
        )
        sampled_groups = group_counts.head(sample_count)
        sampled_historical_data = historical_data[
            historical_data[series_col].isin(sampled_groups.index)
        ]

        # The shortest series bounds how many backtests are feasible.
        min_group = group_counts.idxmin()
        min_series_data = historical_data[historical_data[series_col] == min_group]
        unique_dates = min_series_data[date_col].unique()

        cut_offs = self.generate_cutoffs(unique_dates, horizon)
        # `cut_offs` is a numpy array, so test its length rather than its truthiness.
        if len(cut_offs) == 0:
            raise InsufficientDataError(
                "Insufficient data to evaluate multiple models. Please specify a model "
                "instead of using auto-select."
            )

        sampled_dates = sampled_historical_data[date_col]
        training_datasets = [
            sampled_historical_data[sampled_dates <= cut_off_date]
            for cut_off_date in cut_offs
        ]

        # Cut-offs are ordered newest first: the first test window is everything
        # after the newest cut-off, each following one lies between a cut-off
        # and the cut-off that precedes it in the list.
        test_datasets = [sampled_historical_data[sampled_dates > cut_offs[0]]]
        for previous, current in zip(cut_offs, cut_offs[1:]):
            test_datasets.append(
                sampled_historical_data[
                    (current < sampled_dates) & (sampled_dates <= previous)
                ]
            )

        all_additional = datasets.additional_data.data.reset_index()
        sampled_additional_data = all_additional[
            all_additional[series_col].isin(sampled_groups.index)
        ]
        # Additional data for a backtest extends to the end of its test window:
        # the last historical date for the first backtest, the previous cut-off
        # for the others.
        max_historical_date = sampled_dates.max()
        additional_data = [
            sampled_additional_data[
                sampled_additional_data[date_col] <= max_historical_date
            ]
        ]
        for cut_off in cut_offs[:-1]:
            additional_data.append(
                sampled_additional_data[sampled_additional_data[date_col] <= cut_off]
            )
        return cut_offs, training_datasets, additional_data, test_datasets

    def remove_none_values(self, obj):
        """
        Returns a copy of ``obj`` without ``None`` keys or ``None`` values.

        Nested dictionaries are cleaned recursively; any other value
        (including lists) is returned unchanged.
        """
        if not isinstance(obj, dict):
            return obj
        return {
            key: self.remove_none_values(value)
            for key, value in obj.items()
            if key is not None and value is not None
        }

    def create_operator_config(
        self,
        operator_config,
        backtest,
        model,
        historical_data,
        additional_data,
        test_data,
    ):
        """
        Derives the operator config used to run one model on one backtest.

        The config is a copy of ``operator_config`` with the dataset sections
        removed, report and explanation generation disabled, the model set to
        ``model`` and the output redirected to
        ``<output_dir>/back_testing/<model>/<backtest>`` (created if missing).

        Parameters
        ----------
        operator_config: The original operator config.
        backtest: Identifier of the backtest, used in the output path.
        model: The model to run.
        historical_data, additional_data, test_data: Not used by this method;
            kept for interface compatibility.

        Returns
        -------
        ForecastOperatorConfig: The config for the backtest run.
        """
        output_dir = operator_config.spec.output_directory.url
        output_file_path = f"{output_dir}/back_testing/{model}/{backtest}"
        Path(output_file_path).mkdir(parents=True, exist_ok=True)

        backtest_op_config_draft = operator_config.to_dict()
        backtest_spec = backtest_op_config_draft["spec"]
        # Entries set to None are dropped by remove_none_values() below.
        backtest_spec["datetime_column"]["format"] = None
        # The datasets are supplied as data frames by the caller, so the dataset
        # sections are dropped; tolerate specs where a section is absent.
        for dataset_key in ("test_data", "additional_data", "historical_data"):
            backtest_spec.pop(dataset_key, None)
        backtest_spec["generate_report"] = False
        backtest_spec["model"] = model
        backtest_spec["model_kwargs"] = None
        backtest_spec["output_directory"] = {"url": output_file_path}
        backtest_spec["target_category_columns"] = [DataColumns.Series]
        backtest_spec["generate_explanations"] = False
        cleaned_config = self.remove_none_values(backtest_op_config_draft)

        return ForecastOperatorConfig.from_dict(obj_dict=cleaned_config)

    def run_all_models(
        self, datasets: "ForecastDatasets", operator_config: "ForecastOperatorConfig"
    ):
        """
        Runs every candidate model on every backtest and collects the metric.

        For each run the test metrics file written by the model is read, the
        metric values are averaged across series, and the value for
        ``operator_config.spec.metric`` is stored. A failing run is logged and
        skipped, so a model may end up with fewer (or no) entries.

        Returns
        -------
        dict: ``{model: {backtest_index: metric_value}}``.

        Raises
        ------
        InsufficientDataError: Propagated from ``generate_k_fold_data``.
        """
        cut_offs, train_sets, additional_data, test_sets = self.generate_k_fold_data(
            datasets, operator_config
        )
        # Imported inside the method, as the original did; once per call is enough.
        from .model.factory import ForecastOperatorModelFactory

        metrics = {}
        date_col = operator_config.spec.datetime_column.name
        index_cols = [date_col, DataColumns.Series]
        for model in self.models:
            metrics[model] = {}
            for i, (train, additional, test) in enumerate(
                zip(train_sets, additional_data, test_sets)
            ):
                try:
                    backtest_historical_data = train.set_index(index_cols)
                    backtest_additional_data = additional.set_index(index_cols)
                    backtest_test_data = test.set_index(index_cols)
                    backtest_operator_config = self.create_operator_config(
                        operator_config,
                        i,
                        model,
                        backtest_historical_data,
                        backtest_additional_data,
                        backtest_test_data,
                    )
                    # Use a dedicated name so the `datasets` argument is not shadowed.
                    backtest_datasets = ForecastDatasets(
                        backtest_operator_config,
                        backtest_historical_data,
                        backtest_additional_data,
                        backtest_test_data,
                    )
                    ForecastOperatorModelFactory.get_model(
                        backtest_operator_config, backtest_datasets
                    ).generate_report()
                    test_metrics_filename = (
                        backtest_operator_config.spec.test_metrics_filename
                    )
                    metrics_df = pd.read_csv(
                        f"{backtest_operator_config.spec.output_directory.url}/{test_metrics_filename}"
                    )
                    metrics_df["average_across_series"] = metrics_df.drop(
                        "metrics", axis=1
                    ).mean(axis=1)
                    metrics_average_dict = dict(
                        zip(
                            metrics_df["metrics"].str.lower(),
                            metrics_df["average_across_series"],
                        )
                    )
                    metrics[model][i] = metrics_average_dict[
                        operator_config.spec.metric
                    ]
                except Exception as e:
                    # Best effort: one failing backtest must not abort the
                    # comparison. `Exception` (rather than a bare except) lets
                    # KeyboardInterrupt / SystemExit propagate.
                    logger.warning(
                        f"Failed to calculate metrics for {model} and {i} backtest"
                    )
                    logger.debug(f"Backtest failure details: {e!r}")
        return metrics

    def find_best_model(
        self, datasets: "ForecastDatasets", operator_config: "ForecastOperatorConfig"
    ):
        """
        Returns the candidate model with the lowest average backtest metric.

        Falls back to ``SupportedModels.Prophet`` when there is not enough
        data to backtest, or when no backtest produced a metric for any
        model. On success the per-backtest metrics are also written to
        ``<output_dir>/<BACKTEST_REPORT_NAME>``.
        """
        try:
            metrics = self.run_all_models(datasets, operator_config)
        except InsufficientDataError as e:
            model = SupportedModels.Prophet
            logger.error(
                f"Running {model} model as auto-select failed with the following error: {e.message}"
            )
            return model
        nonempty_metrics = {
            model: metric for model, metric in metrics.items() if metric != {}
        }
        avg_backtests_metric = {
            model: sum(value.values()) / len(value.values())
            for model, value in nonempty_metrics.items()
        }
        if not avg_backtests_metric:
            # Every backtest failed for every model: min() would raise a
            # cryptic ValueError, so use the same fallback as above.
            model = SupportedModels.Prophet
            logger.error(
                f"Running {model} model as auto-select failed: no backtest produced "
                f"metrics for any of the models {self.models}."
            )
            return model
        # NOTE(review): min() assumes a lower metric value is better — confirm
        # this holds for every metric accepted by `spec.metric`.
        best_model = min(avg_backtests_metric, key=avg_backtests_metric.get)
        logger.info(
            f"Among models {self.models}, {best_model} model shows better performance during backtesting."
        )
        backtest_stats = pd.DataFrame(nonempty_metrics).rename_axis("backtest")
        backtest_stats["metric"] = operator_config.spec.metric
        backtest_stats.reset_index(inplace=True)
        output_dir = operator_config.spec.output_directory.url
        backtest_stats.to_csv(f"{output_dir}/{BACKTEST_REPORT_NAME}", index=False)
        return best_model
|