PyPI - oracle-ads - Versions diffs - 2.13.9rc0__py3-none-any.whl → 2.13.9rc1__py3-none-any.whl - Mend

oracle-ads 2.13.9rc0__py3-none-any.whl → 2.13.9rc1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (857)

ads/aqua/__init__.py +40 -0
ads/aqua/app.py +506 -0
ads/aqua/cli.py +96 -0
ads/aqua/client/__init__.py +3 -0
ads/aqua/client/client.py +836 -0
ads/aqua/client/openai_client.py +305 -0
ads/aqua/common/__init__.py +5 -0
ads/aqua/common/decorator.py +125 -0
ads/aqua/common/entities.py +269 -0
ads/aqua/common/enums.py +122 -0
ads/aqua/common/errors.py +109 -0
ads/aqua/common/utils.py +1285 -0
ads/aqua/config/__init__.py +4 -0
ads/aqua/config/container_config.py +248 -0
ads/aqua/config/evaluation/__init__.py +4 -0
ads/aqua/config/evaluation/evaluation_service_config.py +147 -0
ads/aqua/config/utils/__init__.py +4 -0
ads/aqua/config/utils/serializer.py +339 -0
ads/aqua/constants.py +116 -0
ads/aqua/data.py +14 -0
ads/aqua/dummy_data/icon.txt +1 -0
ads/aqua/dummy_data/oci_model_deployments.json +56 -0
ads/aqua/dummy_data/oci_models.json +1 -0
ads/aqua/dummy_data/readme.md +26 -0
ads/aqua/evaluation/__init__.py +8 -0
ads/aqua/evaluation/constants.py +53 -0
ads/aqua/evaluation/entities.py +186 -0
ads/aqua/evaluation/errors.py +70 -0
ads/aqua/evaluation/evaluation.py +1814 -0
ads/aqua/extension/__init__.py +42 -0
ads/aqua/extension/aqua_ws_msg_handler.py +76 -0
ads/aqua/extension/base_handler.py +90 -0
ads/aqua/extension/common_handler.py +121 -0
ads/aqua/extension/common_ws_msg_handler.py +36 -0
ads/aqua/extension/deployment_handler.py +298 -0
ads/aqua/extension/deployment_ws_msg_handler.py +54 -0
ads/aqua/extension/errors.py +30 -0
ads/aqua/extension/evaluation_handler.py +129 -0
ads/aqua/extension/evaluation_ws_msg_handler.py +61 -0
ads/aqua/extension/finetune_handler.py +96 -0
ads/aqua/extension/model_handler.py +390 -0
ads/aqua/extension/models/__init__.py +0 -0
ads/aqua/extension/models/ws_models.py +145 -0
ads/aqua/extension/models_ws_msg_handler.py +50 -0
ads/aqua/extension/ui_handler.py +282 -0
ads/aqua/extension/ui_websocket_handler.py +130 -0
ads/aqua/extension/utils.py +133 -0
ads/aqua/finetuning/__init__.py +7 -0
ads/aqua/finetuning/constants.py +23 -0
ads/aqua/finetuning/entities.py +181 -0
ads/aqua/finetuning/finetuning.py +749 -0
ads/aqua/model/__init__.py +8 -0
ads/aqua/model/constants.py +60 -0
ads/aqua/model/entities.py +385 -0
ads/aqua/model/enums.py +32 -0
ads/aqua/model/model.py +2114 -0
ads/aqua/modeldeployment/__init__.py +8 -0
ads/aqua/modeldeployment/constants.py +10 -0
ads/aqua/modeldeployment/deployment.py +1326 -0
ads/aqua/modeldeployment/entities.py +653 -0
ads/aqua/modeldeployment/inference.py +74 -0
ads/aqua/modeldeployment/utils.py +543 -0
ads/aqua/resources/gpu_shapes_index.json +94 -0
ads/aqua/server/__init__.py +4 -0
ads/aqua/server/__main__.py +24 -0
ads/aqua/server/app.py +47 -0
ads/aqua/server/aqua_spec.yml +1291 -0
ads/aqua/training/__init__.py +4 -0
ads/aqua/training/exceptions.py +476 -0
ads/aqua/ui.py +499 -0
ads/automl/__init__.py +9 -0
ads/automl/driver.py +330 -0
ads/automl/provider.py +975 -0
ads/bds/__init__.py +5 -0
ads/bds/auth.py +127 -0
ads/bds/big_data_service.py +255 -0
ads/catalog/__init__.py +19 -0
ads/catalog/model.py +1576 -0
ads/catalog/notebook.py +461 -0
ads/catalog/project.py +468 -0
ads/catalog/summary.py +178 -0
ads/common/__init__.py +11 -0
ads/common/analyzer.py +65 -0
ads/common/artifact/.model-ignore +63 -0
ads/common/artifact/__init__.py +10 -0
ads/common/auth.py +1122 -0
ads/common/card_identifier.py +83 -0
ads/common/config.py +647 -0
ads/common/data.py +165 -0
ads/common/decorator/__init__.py +9 -0
ads/common/decorator/argument_to_case.py +88 -0
ads/common/decorator/deprecate.py +69 -0
ads/common/decorator/require_nonempty_arg.py +65 -0
ads/common/decorator/runtime_dependency.py +178 -0
ads/common/decorator/threaded.py +97 -0
ads/common/decorator/utils.py +35 -0
ads/common/dsc_file_system.py +303 -0
ads/common/error.py +14 -0
ads/common/extended_enum.py +81 -0
ads/common/function/__init__.py +5 -0
ads/common/function/fn_util.py +142 -0
ads/common/function/func_conf.yaml +25 -0
ads/common/ipython.py +76 -0
ads/common/model.py +679 -0
ads/common/model_artifact.py +1759 -0
ads/common/model_artifact_schema.json +107 -0
ads/common/model_export_util.py +664 -0
ads/common/model_metadata.py +24 -0
ads/common/object_storage_details.py +296 -0
ads/common/oci_client.py +175 -0
ads/common/oci_datascience.py +46 -0
ads/common/oci_logging.py +1144 -0
ads/common/oci_mixin.py +957 -0
ads/common/oci_resource.py +136 -0
ads/common/serializer.py +559 -0
ads/common/utils.py +1852 -0
ads/common/word_lists.py +1491 -0
ads/common/work_request.py +189 -0
ads/data_labeling/__init__.py +13 -0
ads/data_labeling/boundingbox.py +253 -0
ads/data_labeling/constants.py +47 -0
ads/data_labeling/data_labeling_service.py +244 -0
ads/data_labeling/interface/__init__.py +5 -0
ads/data_labeling/interface/loader.py +16 -0
ads/data_labeling/interface/parser.py +16 -0
ads/data_labeling/interface/reader.py +23 -0
ads/data_labeling/loader/__init__.py +5 -0
ads/data_labeling/loader/file_loader.py +241 -0
ads/data_labeling/metadata.py +110 -0
ads/data_labeling/mixin/__init__.py +5 -0
ads/data_labeling/mixin/data_labeling.py +232 -0
ads/data_labeling/ner.py +129 -0
ads/data_labeling/parser/__init__.py +5 -0
ads/data_labeling/parser/dls_record_parser.py +388 -0
ads/data_labeling/parser/export_metadata_parser.py +94 -0
ads/data_labeling/parser/export_record_parser.py +473 -0
ads/data_labeling/reader/__init__.py +5 -0
ads/data_labeling/reader/dataset_reader.py +574 -0
ads/data_labeling/reader/dls_record_reader.py +121 -0
ads/data_labeling/reader/export_record_reader.py +62 -0
ads/data_labeling/reader/jsonl_reader.py +75 -0
ads/data_labeling/reader/metadata_reader.py +203 -0
ads/data_labeling/reader/record_reader.py +263 -0
ads/data_labeling/record.py +52 -0
ads/data_labeling/visualizer/__init__.py +5 -0
ads/data_labeling/visualizer/image_visualizer.py +525 -0
ads/data_labeling/visualizer/text_visualizer.py +357 -0
ads/database/__init__.py +5 -0
ads/database/connection.py +338 -0
ads/dataset/__init__.py +10 -0
ads/dataset/capabilities.md +51 -0
ads/dataset/classification_dataset.py +339 -0
ads/dataset/correlation.py +226 -0
ads/dataset/correlation_plot.py +563 -0
ads/dataset/dask_series.py +173 -0
ads/dataset/dataframe_transformer.py +110 -0
ads/dataset/dataset.py +1979 -0
ads/dataset/dataset_browser.py +360 -0
ads/dataset/dataset_with_target.py +995 -0
ads/dataset/exception.py +25 -0
ads/dataset/factory.py +987 -0
ads/dataset/feature_engineering_transformer.py +35 -0
ads/dataset/feature_selection.py +107 -0
ads/dataset/forecasting_dataset.py +26 -0
ads/dataset/helper.py +1450 -0
ads/dataset/label_encoder.py +99 -0
ads/dataset/mixin/__init__.py +5 -0
ads/dataset/mixin/dataset_accessor.py +134 -0
ads/dataset/pipeline.py +58 -0
ads/dataset/plot.py +710 -0
ads/dataset/progress.py +86 -0
ads/dataset/recommendation.py +297 -0
ads/dataset/recommendation_transformer.py +502 -0
ads/dataset/regression_dataset.py +14 -0
ads/dataset/sampled_dataset.py +1050 -0
ads/dataset/target.py +98 -0
ads/dataset/timeseries.py +18 -0
ads/dbmixin/__init__.py +5 -0
ads/dbmixin/db_pandas_accessor.py +153 -0
ads/environment/__init__.py +9 -0
ads/environment/ml_runtime.py +66 -0
ads/evaluations/README.md +14 -0
ads/evaluations/__init__.py +109 -0
ads/evaluations/evaluation_plot.py +983 -0
ads/evaluations/evaluator.py +1334 -0
ads/evaluations/statistical_metrics.py +543 -0
ads/experiments/__init__.py +9 -0
ads/experiments/capabilities.md +0 -0
ads/explanations/__init__.py +21 -0
ads/explanations/base_explainer.py +142 -0
ads/explanations/capabilities.md +83 -0
ads/explanations/explainer.py +190 -0
ads/explanations/mlx_global_explainer.py +1050 -0
ads/explanations/mlx_interface.py +386 -0
ads/explanations/mlx_local_explainer.py +287 -0
ads/explanations/mlx_whatif_explainer.py +201 -0
ads/feature_engineering/__init__.py +20 -0
ads/feature_engineering/accessor/__init__.py +5 -0
ads/feature_engineering/accessor/dataframe_accessor.py +535 -0
ads/feature_engineering/accessor/mixin/__init__.py +5 -0
ads/feature_engineering/accessor/mixin/correlation.py +166 -0
ads/feature_engineering/accessor/mixin/eda_mixin.py +266 -0
ads/feature_engineering/accessor/mixin/eda_mixin_series.py +85 -0
ads/feature_engineering/accessor/mixin/feature_types_mixin.py +211 -0
ads/feature_engineering/accessor/mixin/utils.py +65 -0
ads/feature_engineering/accessor/series_accessor.py +431 -0
ads/feature_engineering/adsimage/__init__.py +5 -0
ads/feature_engineering/adsimage/image.py +192 -0
ads/feature_engineering/adsimage/image_reader.py +170 -0
ads/feature_engineering/adsimage/interface/__init__.py +5 -0
ads/feature_engineering/adsimage/interface/reader.py +19 -0
ads/feature_engineering/adsstring/__init__.py +7 -0
ads/feature_engineering/adsstring/oci_language/__init__.py +8 -0
ads/feature_engineering/adsstring/string/__init__.py +8 -0
ads/feature_engineering/data_schema.json +57 -0
ads/feature_engineering/dataset/__init__.py +5 -0
ads/feature_engineering/dataset/zip_code_data.py +42062 -0
ads/feature_engineering/exceptions.py +40 -0
ads/feature_engineering/feature_type/__init__.py +133 -0
ads/feature_engineering/feature_type/address.py +184 -0
ads/feature_engineering/feature_type/adsstring/__init__.py +5 -0
ads/feature_engineering/feature_type/adsstring/common_regex_mixin.py +164 -0
ads/feature_engineering/feature_type/adsstring/oci_language.py +93 -0
ads/feature_engineering/feature_type/adsstring/parsers/__init__.py +5 -0
ads/feature_engineering/feature_type/adsstring/parsers/base.py +47 -0
ads/feature_engineering/feature_type/adsstring/parsers/nltk_parser.py +96 -0
ads/feature_engineering/feature_type/adsstring/parsers/spacy_parser.py +221 -0
ads/feature_engineering/feature_type/adsstring/string.py +258 -0
ads/feature_engineering/feature_type/base.py +58 -0
ads/feature_engineering/feature_type/boolean.py +183 -0
ads/feature_engineering/feature_type/category.py +146 -0
ads/feature_engineering/feature_type/constant.py +137 -0
ads/feature_engineering/feature_type/continuous.py +151 -0
ads/feature_engineering/feature_type/creditcard.py +314 -0
ads/feature_engineering/feature_type/datetime.py +190 -0
ads/feature_engineering/feature_type/discrete.py +134 -0
ads/feature_engineering/feature_type/document.py +43 -0
ads/feature_engineering/feature_type/gis.py +251 -0
ads/feature_engineering/feature_type/handler/__init__.py +5 -0
ads/feature_engineering/feature_type/handler/feature_validator.py +524 -0
ads/feature_engineering/feature_type/handler/feature_warning.py +319 -0
ads/feature_engineering/feature_type/handler/warnings.py +128 -0
ads/feature_engineering/feature_type/integer.py +142 -0
ads/feature_engineering/feature_type/ip_address.py +144 -0
ads/feature_engineering/feature_type/ip_address_v4.py +138 -0
ads/feature_engineering/feature_type/ip_address_v6.py +138 -0
ads/feature_engineering/feature_type/lat_long.py +256 -0
ads/feature_engineering/feature_type/object.py +43 -0
ads/feature_engineering/feature_type/ordinal.py +132 -0
ads/feature_engineering/feature_type/phone_number.py +135 -0
ads/feature_engineering/feature_type/string.py +171 -0
ads/feature_engineering/feature_type/text.py +93 -0
ads/feature_engineering/feature_type/unknown.py +43 -0
ads/feature_engineering/feature_type/zip_code.py +164 -0
ads/feature_engineering/feature_type_manager.py +406 -0
ads/feature_engineering/schema.py +795 -0
ads/feature_engineering/utils.py +245 -0
ads/feature_store/.readthedocs.yaml +19 -0
ads/feature_store/README.md +65 -0
ads/feature_store/__init__.py +9 -0
ads/feature_store/common/__init__.py +0 -0
ads/feature_store/common/enums.py +339 -0
ads/feature_store/common/exceptions.py +18 -0
ads/feature_store/common/spark_session_singleton.py +125 -0
ads/feature_store/common/utils/__init__.py +0 -0
ads/feature_store/common/utils/base64_encoder_decoder.py +72 -0
ads/feature_store/common/utils/feature_schema_mapper.py +283 -0
ads/feature_store/common/utils/transformation_utils.py +82 -0
ads/feature_store/common/utils/utility.py +403 -0
ads/feature_store/data_validation/__init__.py +0 -0
ads/feature_store/data_validation/great_expectation.py +129 -0
ads/feature_store/dataset.py +1230 -0
ads/feature_store/dataset_job.py +530 -0
ads/feature_store/docs/Dockerfile +7 -0
ads/feature_store/docs/Makefile +44 -0
ads/feature_store/docs/conf.py +28 -0
ads/feature_store/docs/requirements.txt +14 -0
ads/feature_store/docs/source/ads.feature_store.query.rst +20 -0
ads/feature_store/docs/source/cicd.rst +137 -0
ads/feature_store/docs/source/conf.py +86 -0
ads/feature_store/docs/source/data_versioning.rst +33 -0
ads/feature_store/docs/source/dataset.rst +388 -0
ads/feature_store/docs/source/dataset_job.rst +27 -0
ads/feature_store/docs/source/demo.rst +70 -0
ads/feature_store/docs/source/entity.rst +78 -0
ads/feature_store/docs/source/feature_group.rst +624 -0
ads/feature_store/docs/source/feature_group_job.rst +29 -0
ads/feature_store/docs/source/feature_store.rst +122 -0
ads/feature_store/docs/source/feature_store_class.rst +123 -0
ads/feature_store/docs/source/feature_validation.rst +66 -0
ads/feature_store/docs/source/figures/cicd.png +0 -0
ads/feature_store/docs/source/figures/data_validation.png +0 -0
ads/feature_store/docs/source/figures/data_versioning.png +0 -0
ads/feature_store/docs/source/figures/dataset.gif +0 -0
ads/feature_store/docs/source/figures/dataset.png +0 -0
ads/feature_store/docs/source/figures/dataset_lineage.png +0 -0
ads/feature_store/docs/source/figures/dataset_statistics.png +0 -0
ads/feature_store/docs/source/figures/dataset_statistics_viz.png +0 -0
ads/feature_store/docs/source/figures/dataset_validation_results.png +0 -0
ads/feature_store/docs/source/figures/dataset_validation_summary.png +0 -0
ads/feature_store/docs/source/figures/drift_monitoring.png +0 -0
ads/feature_store/docs/source/figures/entity.png +0 -0
ads/feature_store/docs/source/figures/feature_group.png +0 -0
ads/feature_store/docs/source/figures/feature_group_lineage.png +0 -0
ads/feature_store/docs/source/figures/feature_group_statistics_viz.png +0 -0
ads/feature_store/docs/source/figures/feature_store_deployment.png +0 -0
ads/feature_store/docs/source/figures/feature_store_overview.png +0 -0
ads/feature_store/docs/source/figures/featuregroup.gif +0 -0
ads/feature_store/docs/source/figures/lineage_d1.png +0 -0
ads/feature_store/docs/source/figures/lineage_d2.png +0 -0
ads/feature_store/docs/source/figures/lineage_fg.png +0 -0
ads/feature_store/docs/source/figures/logo-dark-mode.png +0 -0
ads/feature_store/docs/source/figures/logo-light-mode.png +0 -0
ads/feature_store/docs/source/figures/overview.png +0 -0
ads/feature_store/docs/source/figures/resource_manager.png +0 -0
ads/feature_store/docs/source/figures/resource_manager_feature_store_stack.png +0 -0
ads/feature_store/docs/source/figures/resource_manager_home.png +0 -0
ads/feature_store/docs/source/figures/stats_1.png +0 -0
ads/feature_store/docs/source/figures/stats_2.png +0 -0
ads/feature_store/docs/source/figures/stats_d.png +0 -0
ads/feature_store/docs/source/figures/stats_fg.png +0 -0
ads/feature_store/docs/source/figures/transformation.png +0 -0
ads/feature_store/docs/source/figures/transformations.gif +0 -0
ads/feature_store/docs/source/figures/validation.png +0 -0
ads/feature_store/docs/source/figures/validation_fg.png +0 -0
ads/feature_store/docs/source/figures/validation_results.png +0 -0
ads/feature_store/docs/source/figures/validation_summary.png +0 -0
ads/feature_store/docs/source/index.rst +81 -0
ads/feature_store/docs/source/module.rst +8 -0
ads/feature_store/docs/source/notebook.rst +94 -0
ads/feature_store/docs/source/overview.rst +47 -0
ads/feature_store/docs/source/quickstart.rst +176 -0
ads/feature_store/docs/source/release_notes.rst +194 -0
ads/feature_store/docs/source/setup_feature_store.rst +81 -0
ads/feature_store/docs/source/statistics.rst +58 -0
ads/feature_store/docs/source/transformation.rst +199 -0
ads/feature_store/docs/source/ui.rst +65 -0
ads/feature_store/docs/source/user_guides.setup.feature_store_operator.rst +66 -0
ads/feature_store/docs/source/user_guides.setup.helm_chart.rst +192 -0
ads/feature_store/docs/source/user_guides.setup.terraform.rst +338 -0
ads/feature_store/entity.py +718 -0
ads/feature_store/execution_strategy/__init__.py +0 -0
ads/feature_store/execution_strategy/delta_lake/__init__.py +0 -0
ads/feature_store/execution_strategy/delta_lake/delta_lake_service.py +375 -0
ads/feature_store/execution_strategy/engine/__init__.py +0 -0
ads/feature_store/execution_strategy/engine/spark_engine.py +316 -0
ads/feature_store/execution_strategy/execution_strategy.py +113 -0
ads/feature_store/execution_strategy/execution_strategy_provider.py +47 -0
ads/feature_store/execution_strategy/spark/__init__.py +0 -0
ads/feature_store/execution_strategy/spark/spark_execution.py +618 -0
ads/feature_store/feature.py +192 -0
ads/feature_store/feature_group.py +1494 -0
ads/feature_store/feature_group_expectation.py +346 -0
ads/feature_store/feature_group_job.py +602 -0
ads/feature_store/feature_lineage/__init__.py +0 -0
ads/feature_store/feature_lineage/graphviz_service.py +180 -0
ads/feature_store/feature_option_details.py +50 -0
ads/feature_store/feature_statistics/__init__.py +0 -0
ads/feature_store/feature_statistics/statistics_service.py +99 -0
ads/feature_store/feature_store.py +699 -0
ads/feature_store/feature_store_registrar.py +518 -0
ads/feature_store/input_feature_detail.py +149 -0
ads/feature_store/mixin/__init__.py +4 -0
ads/feature_store/mixin/oci_feature_store.py +145 -0
ads/feature_store/model_details.py +73 -0
ads/feature_store/query/__init__.py +0 -0
ads/feature_store/query/filter.py +266 -0
ads/feature_store/query/generator/__init__.py +0 -0
ads/feature_store/query/generator/query_generator.py +298 -0
ads/feature_store/query/join.py +161 -0
ads/feature_store/query/query.py +403 -0
ads/feature_store/query/validator/__init__.py +0 -0
ads/feature_store/query/validator/query_validator.py +57 -0
ads/feature_store/response/__init__.py +0 -0
ads/feature_store/response/response_builder.py +68 -0
ads/feature_store/service/__init__.py +0 -0
ads/feature_store/service/oci_dataset.py +139 -0
ads/feature_store/service/oci_dataset_job.py +199 -0
ads/feature_store/service/oci_entity.py +125 -0
ads/feature_store/service/oci_feature_group.py +164 -0
ads/feature_store/service/oci_feature_group_job.py +214 -0
ads/feature_store/service/oci_feature_store.py +182 -0
ads/feature_store/service/oci_lineage.py +87 -0
ads/feature_store/service/oci_transformation.py +104 -0
ads/feature_store/statistics/__init__.py +0 -0
ads/feature_store/statistics/abs_feature_value.py +49 -0
ads/feature_store/statistics/charts/__init__.py +0 -0
ads/feature_store/statistics/charts/abstract_feature_plot.py +37 -0
ads/feature_store/statistics/charts/box_plot.py +148 -0
ads/feature_store/statistics/charts/frequency_distribution.py +65 -0
ads/feature_store/statistics/charts/probability_distribution.py +68 -0
ads/feature_store/statistics/charts/top_k_frequent_elements.py +98 -0
ads/feature_store/statistics/feature_stat.py +126 -0
ads/feature_store/statistics/generic_feature_value.py +33 -0
ads/feature_store/statistics/statistics.py +41 -0
ads/feature_store/statistics_config.py +101 -0
ads/feature_store/templates/feature_store_template.yaml +45 -0
ads/feature_store/transformation.py +499 -0
ads/feature_store/validation_output.py +57 -0
ads/hpo/__init__.py +9 -0
ads/hpo/_imports.py +91 -0
ads/hpo/ads_search_space.py +439 -0
ads/hpo/distributions.py +325 -0
ads/hpo/objective.py +280 -0
ads/hpo/search_cv.py +1657 -0
ads/hpo/stopping_criterion.py +75 -0
ads/hpo/tuner_artifact.py +413 -0
ads/hpo/utils.py +91 -0
ads/hpo/validation.py +140 -0
ads/hpo/visualization/__init__.py +5 -0
ads/hpo/visualization/_contour.py +23 -0
ads/hpo/visualization/_edf.py +20 -0
ads/hpo/visualization/_intermediate_values.py +21 -0
ads/hpo/visualization/_optimization_history.py +25 -0
ads/hpo/visualization/_parallel_coordinate.py +169 -0
ads/hpo/visualization/_param_importances.py +26 -0
ads/jobs/__init__.py +53 -0
ads/jobs/ads_job.py +663 -0
ads/jobs/builders/__init__.py +5 -0
ads/jobs/builders/base.py +156 -0
ads/jobs/builders/infrastructure/__init__.py +6 -0
ads/jobs/builders/infrastructure/base.py +165 -0
ads/jobs/builders/infrastructure/dataflow.py +1252 -0
ads/jobs/builders/infrastructure/dsc_job.py +1894 -0
ads/jobs/builders/infrastructure/dsc_job_runtime.py +1233 -0
ads/jobs/builders/infrastructure/utils.py +65 -0
ads/jobs/builders/runtimes/__init__.py +5 -0
ads/jobs/builders/runtimes/artifact.py +338 -0
ads/jobs/builders/runtimes/base.py +325 -0
ads/jobs/builders/runtimes/container_runtime.py +242 -0
ads/jobs/builders/runtimes/python_runtime.py +1016 -0
ads/jobs/builders/runtimes/pytorch_runtime.py +204 -0
ads/jobs/cli.py +104 -0
ads/jobs/env_var_parser.py +131 -0
ads/jobs/extension.py +160 -0
ads/jobs/schema/__init__.py +5 -0
ads/jobs/schema/infrastructure_schema.json +116 -0
ads/jobs/schema/job_schema.json +42 -0
ads/jobs/schema/runtime_schema.json +183 -0
ads/jobs/schema/validator.py +141 -0
ads/jobs/serializer.py +296 -0
ads/jobs/templates/__init__.py +5 -0
ads/jobs/templates/container.py +6 -0
ads/jobs/templates/driver_notebook.py +177 -0
ads/jobs/templates/driver_oci.py +500 -0
ads/jobs/templates/driver_python.py +48 -0
ads/jobs/templates/driver_pytorch.py +852 -0
ads/jobs/templates/driver_utils.py +615 -0
ads/jobs/templates/hostname_from_env.c +55 -0
ads/jobs/templates/oci_metrics.py +181 -0
ads/jobs/utils.py +104 -0
ads/llm/__init__.py +28 -0
ads/llm/autogen/__init__.py +2 -0
ads/llm/autogen/constants.py +15 -0
ads/llm/autogen/reports/__init__.py +2 -0
ads/llm/autogen/reports/base.py +67 -0
ads/llm/autogen/reports/data.py +103 -0
ads/llm/autogen/reports/session.py +526 -0
ads/llm/autogen/reports/templates/chat_box.html +13 -0
ads/llm/autogen/reports/templates/chat_box_lt.html +5 -0
ads/llm/autogen/reports/templates/chat_box_rt.html +6 -0
ads/llm/autogen/reports/utils.py +56 -0
ads/llm/autogen/v02/__init__.py +4 -0
ads/llm/autogen/v02/client.py +295 -0
ads/llm/autogen/v02/log_handlers/__init__.py +2 -0
ads/llm/autogen/v02/log_handlers/oci_file_handler.py +83 -0
ads/llm/autogen/v02/loggers/__init__.py +6 -0
ads/llm/autogen/v02/loggers/metric_logger.py +320 -0
ads/llm/autogen/v02/loggers/session_logger.py +580 -0
ads/llm/autogen/v02/loggers/utils.py +86 -0
ads/llm/autogen/v02/runtime_logging.py +163 -0
ads/llm/chain.py +268 -0
ads/llm/chat_template.py +31 -0
ads/llm/deploy.py +63 -0
ads/llm/guardrails/__init__.py +5 -0
ads/llm/guardrails/base.py +442 -0
ads/llm/guardrails/huggingface.py +44 -0
ads/llm/langchain/__init__.py +5 -0
ads/llm/langchain/plugins/__init__.py +5 -0
ads/llm/langchain/plugins/chat_models/__init__.py +5 -0
ads/llm/langchain/plugins/chat_models/oci_data_science.py +1027 -0
ads/llm/langchain/plugins/embeddings/__init__.py +4 -0
ads/llm/langchain/plugins/embeddings/oci_data_science_model_deployment_endpoint.py +184 -0
ads/llm/langchain/plugins/llms/__init__.py +5 -0
ads/llm/langchain/plugins/llms/oci_data_science_model_deployment_endpoint.py +979 -0
ads/llm/requirements.txt +3 -0
ads/llm/serialize.py +219 -0
ads/llm/serializers/__init__.py +0 -0
ads/llm/serializers/retrieval_qa.py +153 -0
ads/llm/serializers/runnable_parallel.py +27 -0
ads/llm/templates/score_chain.jinja2 +155 -0
ads/llm/templates/tool_chat_template_hermes.jinja +130 -0
ads/llm/templates/tool_chat_template_mistral_parallel.jinja +94 -0
ads/model/__init__.py +52 -0
ads/model/artifact.py +573 -0
ads/model/artifact_downloader.py +254 -0
ads/model/artifact_uploader.py +267 -0
ads/model/base_properties.py +238 -0
ads/model/common/.model-ignore +66 -0
ads/model/common/__init__.py +5 -0
ads/model/common/utils.py +142 -0
ads/model/datascience_model.py +2635 -0
ads/model/deployment/__init__.py +20 -0
ads/model/deployment/common/__init__.py +5 -0
ads/model/deployment/common/utils.py +308 -0
ads/model/deployment/model_deployer.py +466 -0
ads/model/deployment/model_deployment.py +1846 -0
ads/model/deployment/model_deployment_infrastructure.py +671 -0
ads/model/deployment/model_deployment_properties.py +493 -0
ads/model/deployment/model_deployment_runtime.py +838 -0
ads/model/extractor/__init__.py +5 -0
ads/model/extractor/automl_extractor.py +74 -0
ads/model/extractor/embedding_onnx_extractor.py +80 -0
ads/model/extractor/huggingface_extractor.py +88 -0
ads/model/extractor/keras_extractor.py +84 -0
ads/model/extractor/lightgbm_extractor.py +93 -0
ads/model/extractor/model_info_extractor.py +114 -0
ads/model/extractor/model_info_extractor_factory.py +105 -0
ads/model/extractor/pytorch_extractor.py +87 -0
ads/model/extractor/sklearn_extractor.py +112 -0
ads/model/extractor/spark_extractor.py +89 -0
ads/model/extractor/tensorflow_extractor.py +85 -0
ads/model/extractor/xgboost_extractor.py +94 -0
ads/model/framework/__init__.py +5 -0
ads/model/framework/automl_model.py +178 -0
ads/model/framework/embedding_onnx_model.py +438 -0
ads/model/framework/huggingface_model.py +399 -0
ads/model/framework/lightgbm_model.py +266 -0
ads/model/framework/pytorch_model.py +266 -0
ads/model/framework/sklearn_model.py +250 -0
ads/model/framework/spark_model.py +326 -0
ads/model/framework/tensorflow_model.py +254 -0
ads/model/framework/xgboost_model.py +258 -0
ads/model/generic_model.py +3518 -0
ads/model/model_artifact_boilerplate/README.md +381 -0
ads/model/model_artifact_boilerplate/__init__.py +5 -0
ads/model/model_artifact_boilerplate/artifact_introspection_test/__init__.py +5 -0
ads/model/model_artifact_boilerplate/artifact_introspection_test/model_artifact_validate.py +427 -0
ads/model/model_artifact_boilerplate/artifact_introspection_test/requirements.txt +2 -0
ads/model/model_artifact_boilerplate/runtime.yaml +7 -0
ads/model/model_artifact_boilerplate/score.py +61 -0
ads/model/model_file_description_schema.json +68 -0
ads/model/model_introspect.py +331 -0
ads/model/model_metadata.py +1810 -0
ads/model/model_metadata_mixin.py +460 -0
ads/model/model_properties.py +63 -0
ads/model/model_version_set.py +739 -0
ads/model/runtime/__init__.py +5 -0
ads/model/runtime/env_info.py +306 -0
ads/model/runtime/model_deployment_details.py +37 -0
ads/model/runtime/model_provenance_details.py +58 -0
ads/model/runtime/runtime_info.py +81 -0
ads/model/runtime/schemas/inference_env_info_schema.yaml +16 -0
ads/model/runtime/schemas/model_provenance_schema.yaml +36 -0
ads/model/runtime/schemas/training_env_info_schema.yaml +16 -0
ads/model/runtime/utils.py +201 -0
ads/model/serde/__init__.py +5 -0
ads/model/serde/common.py +40 -0
ads/model/serde/model_input.py +547 -0
ads/model/serde/model_serializer.py +1184 -0
ads/model/service/__init__.py +5 -0
ads/model/service/oci_datascience_model.py +1076 -0
ads/model/service/oci_datascience_model_deployment.py +500 -0
ads/model/service/oci_datascience_model_version_set.py +176 -0
ads/model/transformer/__init__.py +5 -0
ads/model/transformer/onnx_transformer.py +324 -0
ads/mysqldb/__init__.py +5 -0
ads/mysqldb/mysql_db.py +227 -0
ads/opctl/__init__.py +18 -0
ads/opctl/anomaly_detection.py +11 -0
ads/opctl/backend/__init__.py +5 -0
ads/opctl/backend/ads_dataflow.py +353 -0
ads/opctl/backend/ads_ml_job.py +710 -0
ads/opctl/backend/ads_ml_pipeline.py +164 -0
ads/opctl/backend/ads_model_deployment.py +209 -0
ads/opctl/backend/base.py +146 -0
ads/opctl/backend/local.py +1053 -0
ads/opctl/backend/marketplace/__init__.py +9 -0
ads/opctl/backend/marketplace/helm_helper.py +173 -0
ads/opctl/backend/marketplace/local_marketplace.py +271 -0
ads/opctl/backend/marketplace/marketplace_backend_runner.py +71 -0
ads/opctl/backend/marketplace/marketplace_operator_interface.py +44 -0
ads/opctl/backend/marketplace/marketplace_operator_runner.py +24 -0
ads/opctl/backend/marketplace/marketplace_utils.py +212 -0
ads/opctl/backend/marketplace/models/__init__.py +5 -0
ads/opctl/backend/marketplace/models/bearer_token.py +94 -0
ads/opctl/backend/marketplace/models/marketplace_type.py +70 -0
ads/opctl/backend/marketplace/models/ocir_details.py +56 -0
ads/opctl/backend/marketplace/prerequisite_checker.py +238 -0
ads/opctl/cli.py +707 -0
ads/opctl/cmds.py +869 -0
ads/opctl/conda/__init__.py +5 -0
ads/opctl/conda/cli.py +193 -0
ads/opctl/conda/cmds.py +749 -0
ads/opctl/conda/config.yaml +34 -0
ads/opctl/conda/manifest_template.yaml +13 -0
ads/opctl/conda/multipart_uploader.py +188 -0
ads/opctl/conda/pack.py +89 -0
ads/opctl/config/__init__.py +5 -0
ads/opctl/config/base.py +57 -0
ads/opctl/config/diagnostics/__init__.py +5 -0
ads/opctl/config/diagnostics/distributed/default_requirements_config.yaml +62 -0
ads/opctl/config/merger.py +255 -0
ads/opctl/config/resolver.py +297 -0
ads/opctl/config/utils.py +79 -0
ads/opctl/config/validator.py +17 -0
ads/opctl/config/versioner.py +68 -0
ads/opctl/config/yaml_parsers/__init__.py +7 -0
ads/opctl/config/yaml_parsers/base.py +58 -0
ads/opctl/config/yaml_parsers/distributed/__init__.py +7 -0
ads/opctl/config/yaml_parsers/distributed/yaml_parser.py +201 -0
ads/opctl/constants.py +66 -0
ads/opctl/decorator/__init__.py +5 -0
ads/opctl/decorator/common.py +129 -0
ads/opctl/diagnostics/__init__.py +5 -0
ads/opctl/diagnostics/__main__.py +25 -0
ads/opctl/diagnostics/check_distributed_job_requirements.py +212 -0
ads/opctl/diagnostics/check_requirements.py +144 -0
ads/opctl/diagnostics/requirement_exception.py +9 -0
ads/opctl/distributed/README.md +109 -0
ads/opctl/distributed/__init__.py +5 -0
ads/opctl/distributed/certificates.py +32 -0
ads/opctl/distributed/cli.py +207 -0
ads/opctl/distributed/cmds.py +731 -0
ads/opctl/distributed/common/__init__.py +5 -0
ads/opctl/distributed/common/abstract_cluster_provider.py +449 -0
ads/opctl/distributed/common/abstract_framework_spec_builder.py +88 -0
ads/opctl/distributed/common/cluster_config_helper.py +103 -0
ads/opctl/distributed/common/cluster_provider_factory.py +21 -0
ads/opctl/distributed/common/cluster_runner.py +54 -0
ads/opctl/distributed/common/framework_factory.py +29 -0
ads/opctl/docker/Dockerfile.job +103 -0
ads/opctl/docker/Dockerfile.job.arm +107 -0
ads/opctl/docker/Dockerfile.job.gpu +175 -0
ads/opctl/docker/base-env.yaml +13 -0
ads/opctl/docker/cuda.repo +6 -0
ads/opctl/docker/operator/.dockerignore +0 -0
ads/opctl/docker/operator/Dockerfile +41 -0
ads/opctl/docker/operator/Dockerfile.gpu +85 -0
ads/opctl/docker/operator/cuda.repo +6 -0
ads/opctl/docker/operator/environment.yaml +8 -0
ads/opctl/forecast.py +11 -0
ads/opctl/index.yaml +3 -0
ads/opctl/model/__init__.py +5 -0
ads/opctl/model/cli.py +65 -0
ads/opctl/model/cmds.py +73 -0
ads/opctl/operator/README.md +4 -0
ads/opctl/operator/__init__.py +31 -0
ads/opctl/operator/cli.py +344 -0
ads/opctl/operator/cmd.py +596 -0
ads/opctl/operator/common/__init__.py +5 -0
ads/opctl/operator/common/backend_factory.py +460 -0
ads/opctl/operator/common/const.py +27 -0
ads/opctl/operator/common/data/synthetic.csv +16001 -0
ads/opctl/operator/common/dictionary_merger.py +148 -0
ads/opctl/operator/common/errors.py +42 -0
ads/opctl/operator/common/operator_config.py +99 -0
ads/opctl/operator/common/operator_loader.py +811 -0
ads/opctl/operator/common/operator_schema.yaml +130 -0
ads/opctl/operator/common/operator_yaml_generator.py +152 -0
ads/opctl/operator/common/utils.py +208 -0
ads/opctl/operator/lowcode/__init__.py +5 -0
ads/opctl/operator/lowcode/anomaly/MLoperator +16 -0
ads/opctl/operator/lowcode/anomaly/README.md +207 -0
ads/opctl/operator/lowcode/anomaly/__init__.py +5 -0
ads/opctl/operator/lowcode/anomaly/__main__.py +103 -0
ads/opctl/operator/lowcode/anomaly/cmd.py +35 -0
ads/opctl/operator/lowcode/anomaly/const.py +167 -0
ads/opctl/operator/lowcode/anomaly/environment.yaml +10 -0
ads/opctl/operator/lowcode/anomaly/model/__init__.py +5 -0
ads/opctl/operator/lowcode/anomaly/model/anomaly_dataset.py +146 -0
ads/opctl/operator/lowcode/anomaly/model/anomaly_merlion.py +162 -0
ads/opctl/operator/lowcode/anomaly/model/automlx.py +99 -0
ads/opctl/operator/lowcode/anomaly/model/autots.py +115 -0
ads/opctl/operator/lowcode/anomaly/model/base_model.py +404 -0
ads/opctl/operator/lowcode/anomaly/model/factory.py +110 -0
ads/opctl/operator/lowcode/anomaly/model/isolationforest.py +78 -0
ads/opctl/operator/lowcode/anomaly/model/oneclasssvm.py +78 -0
ads/opctl/operator/lowcode/anomaly/model/randomcutforest.py +120 -0
ads/opctl/operator/lowcode/anomaly/model/tods.py +119 -0
ads/opctl/operator/lowcode/anomaly/operator_config.py +127 -0
ads/opctl/operator/lowcode/anomaly/schema.yaml +401 -0
ads/opctl/operator/lowcode/anomaly/utils.py +88 -0
ads/opctl/operator/lowcode/common/__init__.py +5 -0
ads/opctl/operator/lowcode/common/const.py +10 -0
ads/opctl/operator/lowcode/common/data.py +116 -0
ads/opctl/operator/lowcode/common/errors.py +47 -0
ads/opctl/operator/lowcode/common/transformations.py +296 -0
ads/opctl/operator/lowcode/common/utils.py +384 -0
ads/opctl/operator/lowcode/feature_store_marketplace/MLoperator +13 -0
ads/opctl/operator/lowcode/feature_store_marketplace/README.md +30 -0
ads/opctl/operator/lowcode/feature_store_marketplace/__init__.py +5 -0
ads/opctl/operator/lowcode/feature_store_marketplace/__main__.py +116 -0
ads/opctl/operator/lowcode/feature_store_marketplace/cmd.py +85 -0
ads/opctl/operator/lowcode/feature_store_marketplace/const.py +15 -0
ads/opctl/operator/lowcode/feature_store_marketplace/environment.yaml +0 -0
ads/opctl/operator/lowcode/feature_store_marketplace/models/__init__.py +4 -0
ads/opctl/operator/lowcode/feature_store_marketplace/models/apigw_config.py +32 -0
ads/opctl/operator/lowcode/feature_store_marketplace/models/db_config.py +43 -0
ads/opctl/operator/lowcode/feature_store_marketplace/models/mysql_config.py +120 -0
ads/opctl/operator/lowcode/feature_store_marketplace/models/serializable_yaml_model.py +34 -0
ads/opctl/operator/lowcode/feature_store_marketplace/operator_utils.py +386 -0
ads/opctl/operator/lowcode/feature_store_marketplace/schema.yaml +160 -0
ads/opctl/operator/lowcode/forecast/MLoperator +25 -0
ads/opctl/operator/lowcode/forecast/README.md +209 -0
ads/opctl/operator/lowcode/forecast/__init__.py +5 -0
ads/opctl/operator/lowcode/forecast/__main__.py +89 -0
ads/opctl/operator/lowcode/forecast/cmd.py +40 -0
ads/opctl/operator/lowcode/forecast/const.py +92 -0
ads/opctl/operator/lowcode/forecast/environment.yaml +20 -0
ads/opctl/operator/lowcode/forecast/errors.py +26 -0
ads/opctl/operator/lowcode/forecast/model/__init__.py +5 -0
ads/opctl/operator/lowcode/forecast/model/arima.py +279 -0
ads/opctl/operator/lowcode/forecast/model/automlx.py +553 -0
ads/opctl/operator/lowcode/forecast/model/autots.py +312 -0
ads/opctl/operator/lowcode/forecast/model/base_model.py +875 -0
ads/opctl/operator/lowcode/forecast/model/factory.py +106 -0
ads/opctl/operator/lowcode/forecast/model/forecast_datasets.py +492 -0
ads/opctl/operator/lowcode/forecast/model/ml_forecast.py +243 -0
ads/opctl/operator/lowcode/forecast/model/neuralprophet.py +482 -0
ads/opctl/operator/lowcode/forecast/model/prophet.py +445 -0
ads/opctl/operator/lowcode/forecast/model_evaluator.py +244 -0
ads/opctl/operator/lowcode/forecast/operator_config.py +234 -0
ads/opctl/operator/lowcode/forecast/schema.yaml +506 -0
ads/opctl/operator/lowcode/forecast/utils.py +397 -0
ads/opctl/operator/lowcode/forecast/whatifserve/__init__.py +7 -0
ads/opctl/operator/lowcode/forecast/whatifserve/deployment_manager.py +285 -0
ads/opctl/operator/lowcode/forecast/whatifserve/score.py +246 -0
ads/opctl/operator/lowcode/pii/MLoperator +17 -0
ads/opctl/operator/lowcode/pii/README.md +208 -0
ads/opctl/operator/lowcode/pii/__init__.py +5 -0
ads/opctl/operator/lowcode/pii/__main__.py +78 -0
ads/opctl/operator/lowcode/pii/cmd.py +39 -0
ads/opctl/operator/lowcode/pii/constant.py +84 -0
ads/opctl/operator/lowcode/pii/environment.yaml +17 -0
ads/opctl/operator/lowcode/pii/errors.py +27 -0
ads/opctl/operator/lowcode/pii/model/__init__.py +5 -0
ads/opctl/operator/lowcode/pii/model/factory.py +82 -0
ads/opctl/operator/lowcode/pii/model/guardrails.py +167 -0
ads/opctl/operator/lowcode/pii/model/pii.py +145 -0
ads/opctl/operator/lowcode/pii/model/processor/__init__.py +34 -0
ads/opctl/operator/lowcode/pii/model/processor/email_replacer.py +34 -0
ads/opctl/operator/lowcode/pii/model/processor/mbi_replacer.py +35 -0
ads/opctl/operator/lowcode/pii/model/processor/name_replacer.py +225 -0
ads/opctl/operator/lowcode/pii/model/processor/number_replacer.py +73 -0
ads/opctl/operator/lowcode/pii/model/processor/remover.py +26 -0
ads/opctl/operator/lowcode/pii/model/report.py +487 -0
ads/opctl/operator/lowcode/pii/operator_config.py +95 -0
ads/opctl/operator/lowcode/pii/schema.yaml +108 -0
ads/opctl/operator/lowcode/pii/utils.py +43 -0
ads/opctl/operator/lowcode/recommender/MLoperator +16 -0
ads/opctl/operator/lowcode/recommender/README.md +206 -0
ads/opctl/operator/lowcode/recommender/__init__.py +5 -0
ads/opctl/operator/lowcode/recommender/__main__.py +82 -0
ads/opctl/operator/lowcode/recommender/cmd.py +33 -0
ads/opctl/operator/lowcode/recommender/constant.py +30 -0
ads/opctl/operator/lowcode/recommender/environment.yaml +11 -0
ads/opctl/operator/lowcode/recommender/model/base_model.py +212 -0
ads/opctl/operator/lowcode/recommender/model/factory.py +56 -0
ads/opctl/operator/lowcode/recommender/model/recommender_dataset.py +25 -0
ads/opctl/operator/lowcode/recommender/model/svd.py +106 -0
ads/opctl/operator/lowcode/recommender/operator_config.py +81 -0
ads/opctl/operator/lowcode/recommender/schema.yaml +265 -0
ads/opctl/operator/lowcode/recommender/utils.py +13 -0
ads/opctl/operator/runtime/__init__.py +5 -0
ads/opctl/operator/runtime/const.py +17 -0
ads/opctl/operator/runtime/container_runtime_schema.yaml +50 -0
ads/opctl/operator/runtime/marketplace_runtime.py +50 -0
ads/opctl/operator/runtime/python_marketplace_runtime_schema.yaml +21 -0
ads/opctl/operator/runtime/python_runtime_schema.yaml +21 -0
ads/opctl/operator/runtime/runtime.py +115 -0
ads/opctl/schema.yaml.yml +36 -0
ads/opctl/script.py +40 -0
ads/opctl/spark/__init__.py +5 -0
ads/opctl/spark/cli.py +43 -0
ads/opctl/spark/cmds.py +147 -0
ads/opctl/templates/diagnostic_report_template.jinja2 +102 -0
ads/opctl/utils.py +344 -0
ads/oracledb/__init__.py +5 -0
ads/oracledb/oracle_db.py +346 -0
ads/pipeline/__init__.py +39 -0
ads/pipeline/ads_pipeline.py +2279 -0
ads/pipeline/ads_pipeline_run.py +772 -0
ads/pipeline/ads_pipeline_step.py +605 -0
ads/pipeline/builders/__init__.py +5 -0
ads/pipeline/builders/infrastructure/__init__.py +5 -0
ads/pipeline/builders/infrastructure/custom_script.py +32 -0
ads/pipeline/cli.py +119 -0
ads/pipeline/extension.py +291 -0
ads/pipeline/schema/__init__.py +5 -0
ads/pipeline/schema/cs_step_schema.json +35 -0
ads/pipeline/schema/ml_step_schema.json +31 -0
ads/pipeline/schema/pipeline_schema.json +71 -0
ads/pipeline/visualizer/__init__.py +5 -0
ads/pipeline/visualizer/base.py +570 -0
ads/pipeline/visualizer/graph_renderer.py +272 -0
ads/pipeline/visualizer/text_renderer.py +84 -0
ads/secrets/__init__.py +11 -0
ads/secrets/adb.py +386 -0
ads/secrets/auth_token.py +86 -0
ads/secrets/big_data_service.py +365 -0
ads/secrets/mysqldb.py +149 -0
ads/secrets/oracledb.py +160 -0
ads/secrets/secrets.py +407 -0
ads/telemetry/__init__.py +7 -0
ads/telemetry/base.py +69 -0
ads/telemetry/client.py +125 -0
ads/telemetry/telemetry.py +257 -0
ads/templates/dataflow_pyspark.jinja2 +13 -0
ads/templates/dataflow_sparksql.jinja2 +22 -0
ads/templates/func.jinja2 +20 -0
ads/templates/schemas/openapi.json +1740 -0
ads/templates/score-pkl.jinja2 +173 -0
ads/templates/score.jinja2 +322 -0
ads/templates/score_embedding_onnx.jinja2 +202 -0
ads/templates/score_generic.jinja2 +165 -0
ads/templates/score_huggingface_pipeline.jinja2 +217 -0
ads/templates/score_lightgbm.jinja2 +185 -0
ads/templates/score_onnx.jinja2 +407 -0
ads/templates/score_onnx_new.jinja2 +473 -0
ads/templates/score_oracle_automl.jinja2 +185 -0
ads/templates/score_pyspark.jinja2 +154 -0
ads/templates/score_pytorch.jinja2 +219 -0
ads/templates/score_scikit-learn.jinja2 +184 -0
ads/templates/score_tensorflow.jinja2 +184 -0
ads/templates/score_xgboost.jinja2 +178 -0
ads/text_dataset/__init__.py +5 -0
ads/text_dataset/backends.py +211 -0
ads/text_dataset/dataset.py +445 -0
ads/text_dataset/extractor.py +207 -0
ads/text_dataset/options.py +53 -0
ads/text_dataset/udfs.py +22 -0
ads/text_dataset/utils.py +49 -0
ads/type_discovery/__init__.py +9 -0
ads/type_discovery/abstract_detector.py +21 -0
ads/type_discovery/constant_detector.py +41 -0
ads/type_discovery/continuous_detector.py +54 -0
ads/type_discovery/credit_card_detector.py +99 -0
ads/type_discovery/datetime_detector.py +92 -0
ads/type_discovery/discrete_detector.py +118 -0
ads/type_discovery/document_detector.py +146 -0
ads/type_discovery/ip_detector.py +68 -0
ads/type_discovery/latlon_detector.py +90 -0
ads/type_discovery/phone_number_detector.py +63 -0
ads/type_discovery/type_discovery_driver.py +87 -0
ads/type_discovery/typed_feature.py +594 -0
ads/type_discovery/unknown_detector.py +41 -0
ads/type_discovery/zipcode_detector.py +48 -0
ads/vault/__init__.py +7 -0
ads/vault/vault.py +237 -0
{oracle_ads-2.13.9rc0.dist-info → oracle_ads-2.13.9rc1.dist-info}/METADATA +150 -150
oracle_ads-2.13.9rc1.dist-info/RECORD +858 -0
{oracle_ads-2.13.9rc0.dist-info → oracle_ads-2.13.9rc1.dist-info}/WHEEL +1 -2
{oracle_ads-2.13.9rc0.dist-info → oracle_ads-2.13.9rc1.dist-info}/entry_points.txt +2 -1
oracle_ads-2.13.9rc0.dist-info/RECORD +0 -9
oracle_ads-2.13.9rc0.dist-info/top_level.txt +0 -1
{oracle_ads-2.13.9rc0.dist-info → oracle_ads-2.13.9rc1.dist-info}/licenses/LICENSE.txt +0 -0

ads/automl/provider.py ADDED Viewed

@@ -0,0 +1,975 @@
+#!/usr/bin/env python
+# -*- coding: utf-8; -*-
+# Copyright (c) 2020, 2023 Oracle and/or its affiliates.
+# Licensed under the Universal Permissive License v 1.0 as shown at https://oss.oracle.com/licenses/upl/
+import logging
+import time
+import sys
+import warnings
+from abc import ABC, abstractmethod, abstractproperty
+import math
+import pandas as pd
+import numpy as np
+from sklearn import set_config
+from sklearn.dummy import DummyClassifier, DummyRegressor
+import matplotlib.pyplot as plt
+import ads
+from ads.common.utils import (
+    ml_task_types,
+    wrap_lines,
+    is_documentation_mode,
+    is_notebook,
+)
+from ads.common.decorator.runtime_dependency import (
+    runtime_dependency,
+    OptionalDependency,
+)
+from ads.common.decorator.deprecate import deprecated
+from ads.dataset.label_encoder import DataFrameLabelEncoder
+from ads.dataset.helper import is_text_data
+from ads.common import logger, utils
+class AutoMLProvider(ABC):
+    """
+    Abstract Base Class defining the structure of an AutoML solution. The solution needs to
+    implement train() and get_transformer_pipeline().
+    """
+    @deprecated(
+        details="Working with AutoML has moved from within ADS to working directly with the AutoMLx library. AutoMLx are preinstalled in conda pack automlx_p38_cpu_v2 and later, and can now be updated independently of ADS. AutoMLx documentation may be found at https://docs.oracle.com/en-us/iaas/tools/automlx/latest/html/multiversion/v23.1.1/index.html. Notebook examples are in Oracle's samples repository: https://github.com/oracle-samples/oci-data-science-ai-samples/tree/master/notebook_examples and a migration tutorial can be found at https://accelerated-data-science.readthedocs.io/en/latest/user_guide/model_training/automl/quick_start.html .",
+        raise_error=True,
+    )
+    def __init__(self):
+        self.X_train = None
+        self.y_train = None
+        self.X_valid = None
+        self.y_valid = None
+        self.client = None
+        self.ml_task_type = None
+        self.class_names = None
+        self.transformer_pipeline = None
+        self.est = None
+    def setup(
+        self,
+        X_train,
+        y_train,
+        ml_task_type,
+        X_valid=None,
+        y_valid=None,
+        class_names=None,
+        client=None,
+    ):
+        """
+        Setup arguments to the AutoML instance.
+        Parameters
+        ----------
+        X_train : DataFrame
+            Training features
+        y_train : DataFrame
+            Training labels
+        ml_task_type : One of ml_task_type.{REGRESSION,BINARY_CLASSIFICATION,
+            MULTI_CLASS_CLASSIFICATION,BINARY_TEXT_CLASSIFICATION,MULTI_CLASS_TEXT_CLASSIFICATION}
+        X_valid : DataFrame
+            Validation features
+        y_valid : DataFrame
+            Validation labels
+        class_names : list
+            Unique values in y_train
+        client : object
+            Dask client instance for distributed execution
+        """
+        self.X_train = X_train
+        self.y_train = y_train
+        self.X_valid = X_valid
+        self.y_valid = y_valid
+        self.ml_task_type = ml_task_type
+        self.client = client
+        self.class_names = class_names
+    @property
+    def est(self):
+        """
+        Returns the estimator.
+        The estimator can be a standard sklearn estimator or any object that implement methods from
+        (BaseEstimator, RegressorMixin) for regression or (BaseEstimator, ClassifierMixin) for classification.
+        Returns
+        -------
+        est : An instance of estimator
+        """
+        return self.__est
+    @est.setter
+    def est(self, est):
+        self.__est = est
+    @abstractmethod
+    def train(self, **kwargs):
+        """
+        Calls fit on estimator.
+        This method is expected to set the 'est' property.
+        Parameters
+        ----------
+        kwargs: dict, optional
+        kwargs to decide the estimator and arguments for the fit method
+        """
+        pass
+    @abstractmethod
+    def get_transformer_pipeline(self):
+        """
+        Returns a list of transformers representing the transformations done on data before model prediction.
+        This method is optional to implement, and is used only for visualizing transformations on data using
+        ADSModel#visualize_transforms().
+        Returns
+        -------
+        transformers_list : list of transformers implementing fit and transform
+        """
+        pass
+class BaselineModel(object):
+    """
+    A BaselineModel object that supports fit/predict/predict_proba/transform
+    interface. Labels (y) are encoded using DataFrameLabelEncoder.
+    """
+    @deprecated(
+        details="Working with AutoML has moved from within ADS to working directly with the AutoMLx library. AutoMLx are preinstalled in conda pack automlx_p38_cpu_v2 and later, and can now be updated independently of ADS. AutoMLx documentation may be found at https://docs.oracle.com/en-us/iaas/tools/automlx/latest/html/multiversion/v23.1.1/index.html. Notebook examples are in Oracle's samples repository: https://github.com/oracle-samples/oci-data-science-ai-samples/tree/master/notebook_examples and a migration tutorial can be found at https://accelerated-data-science.readthedocs.io/en/latest/user_guide/model_training/automl/quick_start.html .",
+        raise_error=True,
+    )
+    def __init__(self, est):
+        self.est = est
+        self.df_label_encoder = DataFrameLabelEncoder()
+    def predict(self, X):
+        """
+        Runs the Baselines predict function and returns the result.
+        Parameters
+        ----------
+        X: Dataframe or list-like
+          A Dataframe or list-like object holding data to be predicted on
+        Returns
+        -------
+        List: A list of predictions performed on the input data.
+        """
+        X = self.transform(X)
+        return self.est.predict(X)
+    def predict_proba(self, X):
+        """
+        Runs the Baselines predict_proba function and returns the result.
+        Parameters
+        ----------
+        X: Dataframe or list-like
+          A Dataframe or list-like object holding data to be predicted on
+        Returns
+        -------
+        List: A list of probabilities of being part of a class
+        """
+        X = self.transform(X)
+        return self.est.predict_proba(X)
+    def fit(self, X, y):
+        """
+        Fits the baseline estimator.
+        Parameters
+        ----------
+        X: Dataframe or list-like
+          A Dataframe or list-like object holding data to be predicted on
+        Y: Dataframe, Series, or list-like
+          A Dataframe, series, or list-like object holding the labels
+        Returns
+        -------
+        estimator: The fitted estimator
+        """
+        self.est.fit(X, y)
+        return self
+    def transform(self, X):
+        """
+        Runs the Baselines transform function and returns the result.
+        Parameters
+        ---------
+        X: Dataframe or list-like
+          A Dataframe or list-like object holding data to be transformed
+        Returns
+        -------
+        Dataframe or list-like: The transformed Dataframe. Currently, no transformation is performed by the default Baseline Estimator.
+        """
+        return X
+    def __getattr__(self, item):
+        return getattr(self.est, item)
+    def __getstate__(self):
+        return self.__dict__
+    def __setstate__(self, state):
+        self.__dict__ = state
+    def __repr__(self):
+        set_config()
+        return str(self.est)[:-2]
+class BaselineAutoMLProvider(AutoMLProvider):
+    def get_transformer_pipeline(self):
+        """
+        Returns a list of transformers representing the transformations done on data before model prediction.
+        This method is used only for visualizing transformations on data using
+        ADSModel#visualize_transforms().
+        Returns
+        -------
+        transformers_list : list of transformers implementing fit and transform
+        """
+        msg = "Baseline"
+        return [("automl_preprocessing", AutoMLPreprocessingTransformer(msg))]
+    @deprecated(
+        details="Working with AutoML has moved from within ADS to working directly with the AutoMLx library. AutoMLx are preinstalled in conda pack automlx_p38_cpu_v2 and later, and can now be updated independently of ADS. AutoMLx documentation may be found at https://docs.oracle.com/en-us/iaas/tools/automlx/latest/html/multiversion/v23.1.1/index.html. Notebook examples are in Oracle's samples repository: https://github.com/oracle-samples/oci-data-science-ai-samples/tree/master/notebook_examples and a migration tutorial can be found at https://accelerated-data-science.readthedocs.io/en/latest/user_guide/model_training/automl/quick_start.html .",
+        raise_error=True,
+    )
+    def __init__(self, est):
+        """
+        Generates a baseline model using the Zero Rule algorithm by default. For a classification
+        predictive modeling problem where a categorical value is predicted, the Zero
+        Rule algorithm predicts the class value that has the most observations in the training dataset.
+        Parameters
+        ----------
+        est : BaselineModel
+            An estimator that supports the fit/predict/predict_proba interface.
+            By default, DummyClassifier/DummyRegressor are used as estimators
+        """
+        super(BaselineAutoMLProvider, self).__init__()
+        self.est = est
+    def __repr__(self):
+        set_config()
+        return str(self.est)[:-2]
+    def train(self, **kwargs):
+        self.est = self.decide_estimator(**kwargs)
+        if self.est is None:
+            raise ValueError(
+                "Baseline model for (%s) is not supported" % self.ml_task_type
+            )
+        try:
+            self.est.fit(self.X_train, self.y_train)
+        except Exception as e:
+            warning_message = f"The baseline estimator failed to fit the data. It could not evaluate {self.est} and gave the exception {e}."
+            logger.warning(warning_message)
+    def decide_estimator(self, **kwargs):
+        """
+        Decides which type of BaselineModel to generate.
+        Returns
+        -------
+        Modell: BaselineModel
+            A baseline model generated for the particular ML task being performed
+        """
+        if self.est is not None:
+            return self.est
+        else:
+            if self.ml_task_type == ml_task_types.REGRESSION:
+                return BaselineModel(DummyRegressor())
+            elif self.ml_task_type in [
+                ml_task_types.BINARY_CLASSIFICATION,
+                ml_task_types.MULTI_CLASS_CLASSIFICATION,
+                ml_task_types.BINARY_TEXT_CLASSIFICATION,
+                ml_task_types.MULTI_CLASS_TEXT_CLASSIFICATION,
+            ]:
+                return BaselineModel(DummyClassifier())
+# An installation of oracle labs automl is required only for this class
+class OracleAutoMLProvider(AutoMLProvider, ABC):
+    @deprecated(
+        "2.6.7",
+        details="Oracle AutoML is recommended to be directly instantiated by importing automlx package",
+        raise_error=True,
+    )
+    def __init__(
+        self, n_jobs=-1, loglevel=None, logger_override=None, model_n_jobs: int = 1
+    ):
+        """
+        The Oracle AutoML Provider automatically provides a tuned ML pipeline that best models the given a training
+        dataset and a prediction task at hand.
+        Parameters
+        ----------
+        n_jobs : int
+            Specifies the degree of parallelism for Oracle AutoML. -1 (default) means that AutoML will use all
+            available cores.
+        loglevel : int
+            The verbosity of output for Oracle AutoML. Can be specified using the Python logging module
+            (https://docs.python.org/3/library/logging.html#logging-levels).
+        model_n_jobs: (optional, int). Defaults to 1.
+            Specifies the model parallelism used by AutoML.
+            This will be passed to the underlying model it is training.
+        """
+        try:
+            self.automl = __import__("automl")
+            self.cpuinfo = __import__("cpuinfo")
+        except ModuleNotFoundError as e:
+            utils._log_missing_module("automl", "ads[labs]")
+            raise e
+        super(OracleAutoMLProvider, self).__init__()
+        if loglevel is None:
+            loglevel = logging.DEBUG if ads.debug_mode else logging.ERROR
+        self.automl.init(
+            engine="local",
+            engine_opts={"n_jobs": n_jobs, "model_n_jobs": model_n_jobs},
+            logger=logger_override,
+            loglevel=loglevel,
+        )
+    def __repr__(self):
+        super(OracleAutoMLProvider, self).__repr__()
+    def get_transformer_pipeline(self):
+        """
+        Returns a list of transformers representing the transformations done on data before model prediction.
+        This method is used only for visualizing transformations on data using
+        ADSModel#visualize_transforms().
+        Returns
+        -------
+        transformers_list : list of transformers implementing fit and transform
+        """
+        if hasattr(self.est, "text") and not self.est.text:
+            msg1 = wrap_lines(
+                self.est.selected_features_names_, heading="Select features:"
+            )
+            return [("automl_feature_selection", AutoMLFeatureSelection(msg1))]
+        else:
+            msg = "Apply Tfidf Vectorization\n"
+            msg += "Normalize features\n"
+            msg += "Label encode target"
+            return [("automl_preprocessing", AutoMLPreprocessingTransformer(msg))]
+    def selected_model_name(self):
+        """
+        Return the name of the selected model by AutoML.
+        """
+        return self.est.selected_model_
+    @runtime_dependency(module="IPython", install_from=OptionalDependency.NOTEBOOK)
+    def print_summary(
+        self,
+        max_rows=None,
+        sort_column="Mean Validation Score",
+        ranking_table_only=False,
+    ):
+        """
+        Prints a summary of the Oracle AutoML Pipeline in the last train() call.
+        Parameters
+        ----------
+        max_rows : int
+            Number of trials to print. Pass in None to print all trials
+        sort_column: string
+            Column to sort results by. Must be one of ['Algorithm', '#Samples', '#Features', 'Mean Validation Score',
+            'Hyperparameters', 'All Validation Scores', 'CPU Time']
+        ranking_table_only: bool
+            Table to be displayed. Pass in False to display the complete table.
+            Pass in True to display the ranking table only.
+        """
+        if is_notebook():  # pragma: no cover
+            logger.info(
+                f"Training time was ({(time.time() - self.train_start_time):.2f} seconds.)"
+            )
+            if len(self.est.tuning_trials_) == 0 or len(self.est.train_shape_) == 0:
+                logger.error(
+                    "Unfortunately, there were no trials found, so we cannot visualize it."
+                )
+                return
+            info = [
+                ["Training Dataset size", self.X_train.shape],
+                [
+                    "Validation Dataset size",
+                    self.X_valid.shape if self.X_valid is not None else None,
+                ],
+                ["CV", self.est.num_cv_folds_],
+                ["Target variable", self.y_train.name],
+                ["Optimization Metric", self.est.inferred_score_metric],
+                ["Initial number of Features", self.est.train_shape_[1]],
+                ["Selected number of Features", len(self.est.selected_features_names_)],
+                ["Selected Features", self.est.selected_features_names_],
+                ["Selected Algorithm", self.est.selected_model_],
+                [
+                    "End-to-end Elapsed Time (seconds)",
+                    self.train_end_time - self.train_start_time,
+                ],
+                ["Selected Hyperparameters", self.est.selected_model_params_],
+                ["Mean Validation Score", self.est.tuning_trials_[0][3]],
+                ["AutoML n_jobs", self.est.n_jobs_],
+                ["AutoML version", self.automl.__version__],
+                ["Python version", sys.version],
+            ]
+            info_df = pd.DataFrame(info)
+            # Remove the selected model and its params from the trials since it already shows up in the summary table
+            all_trials_ = (
+                self.est.model_selection_trials_
+                + self.est.adaptive_sampling_trials_
+                + self.est.feature_selection_trials_
+                + self.est.tuning_trials_[1:]
+            )
+            col_names = [
+                "Algorithm",
+                "#Samples",
+                "#Features",
+                "Mean Validation Score",
+                "Hyperparameters",
+                "All Validation Scores",
+                "CPU Time",
+                "Memory Usage",
+            ]
+            if ranking_table_only:
+                dropped_cols = [
+                    "#Samples",
+                    "#Features",
+                    "All Validation Scores",
+                    "CPU Time",
+                ]
+            else:
+                dropped_cols = "All Validation Scores"
+            summary_df = pd.DataFrame(all_trials_, columns=col_names).drop(
+                dropped_cols, axis=1
+            )
+            sorted_summary_df = summary_df.sort_values(sort_column, ascending=False)
+            # Add a rank column at the front
+            sorted_summary_df.insert(
+                0, "Rank based on Performance", np.arange(2, len(sorted_summary_df) + 2)
+            )
+            from IPython.core.display import display, HTML
+            with pd.option_context(
+                "display.max_colwidth",
+                1000,
+                "display.width",
+                None,
+                "display.precision",
+                4,
+            ):
+                display(HTML(info_df.to_html(index=False, header=False)))
+                if max_rows is None:
+                    display(HTML(sorted_summary_df.to_html(index=False)))
+                else:
+                    display(
+                        HTML(sorted_summary_df.to_html(index=False, max_rows=max_rows))
+                    )
+    def train(self, **kwargs):
+        """
+        Train the Oracle AutoML Pipeline. This looks at the training data, and
+        identifies the best set of features, the best algorithm and the best
+        set of hyperparameters for this data. A model is then generated, trained
+        on this data and returned.
+        Parameters
+        ----------
+        score_metric : str, callable
+            Score function (or loss function) with signature ``score_func(y, y_pred, **kwargs)`` or string specified as
+            https://scikit-learn.org/stable/modules/model_evaluation.html#common-cases-predefined-values
+        random_state : int
+            Random seed used by AutoML
+        model_list : list of str
+            Models that will be evaluated by the Pipeline. Supported models:
+            - Classification: AdaBoostClassifier, DecisionTreeClassifier,
+            ExtraTreesClassifier, KNeighborsClassifier,
+            LGBMClassifier, LinearSVC, LogisticRegression,
+            RandomForestClassifier, SVC, XGBClassifier
+            - Regression: AdaBoostRegressor, DecisionTreeRegressor,
+            ExtraTreesRegressor, KNeighborsRegressor,
+            LGBMRegressor, LinearSVR, LinearRegression, RandomForestRegressor,
+            SVR, XGBRegressor
+        time_budget : float, optional
+            Time budget in seconds where 0 means no time budget constraint (best effort)
+        min_features : int, float, list, optional (default: 1)
+            Minimum number of features to keep. Acceptable values:
+            - If int, 0 < min_features <= n_features
+            - If float, 0 < min_features <= 1.0
+            - If list, names of features to keep, for example ['a', 'b'] means keep features 'a' and 'b'
+        Returns
+        -------
+        self : object
+        """
+        """Adding this part to give the correct error for situations when dataset > 10000 rows and user tries SVC or KNN"""
+        if len(self.X_train) > 10000:
+            if "model_list" in kwargs:
+                bad_model_list = ["SVC", "KNeighborsClassifier"]
+                for model in kwargs["model_list"]:
+                    for item in bad_model_list:
+                        if item in model:
+                            raise ValueError(
+                                "SVC, KNeighborsClassifier are disabled for datasets with > 10K samples"
+                            )
+        self.train_start_time = time.time()
+        self.time_budget = kwargs.pop("time_budget", 0)  # 0 means unlimited
+        self.col_types = kwargs.pop("col_types", None)
+        self.est = self._decide_estimator(**kwargs)
+        with warnings.catch_warnings():
+            warnings.simplefilter("ignore")
+            self.est.fit(
+                self.X_train,
+                self.y_train,
+                X_valid=self.X_valid,
+                y_valid=self.y_valid,
+                time_budget=self.time_budget,
+                col_types=self.col_types,
+            )
+        self.train_end_time = time.time()
+        self.print_summary(max_rows=10)
+    def print_trials(self, max_rows=None, sort_column="Mean Validation Score"):
+        """
+        Prints all trials executed by the Oracle AutoML Pipeline in the last train() call.
+        Parameters
+        ----------
+        max_rows : int
+            Number of trials to print. Pass in None to print all trials
+        sort_column: string
+            Column to sort results by. Must be one of ['Algorithm', '#Samples', '#Features', 'Mean Validation Score',
+            'Hyperparameters', 'All Validation Scores', 'CPU Time']
+        """
+        self.est.print_trials(max_rows=max_rows, sort_column=sort_column)
+    def _decide_estimator(self, **kwargs):
+        """
+        Decide arguments to the Oracle AutoML pipeline based on user provided
+        arguments
+        """
+        est = None
+        score_metric = None
+        # Explicity define the default AutoML metrics
+        if (
+            self.ml_task_type == ml_task_types.BINARY_CLASSIFICATION
+            or self.ml_task_type == ml_task_types.BINARY_TEXT_CLASSIFICATION
+        ):
+            test_model_list = ["LogisticRegression"]
+        elif (
+            self.ml_task_type == ml_task_types.MULTI_CLASS_CLASSIFICATION
+            or self.ml_task_type == ml_task_types.MULTI_CLASS_TEXT_CLASSIFICATION
+        ):
+            test_model_list = ["LogisticRegression"]
+        elif self.ml_task_type == ml_task_types.REGRESSION:
+            test_model_list = ["LinearRegression"]
+        else:
+            raise ValueError("AutoML for (%s) is not supported" % self.ml_task_type)
+        # Respect the user provided scoring metric if given
+        if "score_metric" in kwargs:
+            score_metric = kwargs.pop("score_metric")
+        #
+        # ***FOR TESTING PURPOSE ONLY***
+        #
+        # Ignore model_list for test mode
+        if ads.test_mode:  # pragma: no cover
+            if "model_list" in kwargs:
+                _ = kwargs.pop("model_list")
+            kwargs["model_list"] = test_model_list
+        if (
+            self.ml_task_type == ml_task_types.BINARY_CLASSIFICATION
+            or self.ml_task_type == ml_task_types.MULTI_CLASS_CLASSIFICATION
+        ):
+            est = self.automl.Pipeline(
+                task="classification", score_metric=score_metric, **kwargs
+            )
+        elif (
+            self.ml_task_type == ml_task_types.BINARY_TEXT_CLASSIFICATION
+            or self.ml_task_type == ml_task_types.MULTI_CLASS_TEXT_CLASSIFICATION
+        ):
+            est = self.automl.Pipeline(
+                task="classification", score_metric=score_metric, **kwargs
+            )
+            if not self.col_types:
+                if len(self.X_train.columns) == 1:
+                    self.col_types = ["text"]
+                elif len(self.X_train.columns) == 2:
+                    self.col_types = ["text", "text"]
+                else:
+                    raise ValueError(
+                        "We detected a text classification problem. Pass "
+                        "in `col_types = [<type of column1>, <type of column2>, ...]`."
+                        " Valid types are: ['categorical', 'numerical', 'text', 'datetime',"
+                        " 'timedelta']."
+                    )
+        elif self.ml_task_type == ml_task_types.REGRESSION:
+            est = self.automl.Pipeline(
+                task="regression", score_metric=score_metric, **kwargs
+            )
+        else:
+            raise ValueError("AutoML for (%s) is not supported" % self.ml_task_type)
+        return est
+    def selected_score_label(self):
+        """
+        Return the name of score_metric used in train.
+        """
+        score_label = self.est.score_metric
+        if score_label is None:
+            score_label = self.est.inferred_score_metric
+        return score_label
+    @runtime_dependency(module="scipy", install_from=OptionalDependency.VIZ)
+    def visualize_algorithm_selection_trials(self, ylabel=None):
+        """
+        Plot the scores predicted by Algorithm Selection for each algorithm. The
+        horizontal line shows the average score across all algorithms. Algorithms
+        below the line are colored turquoise, whereas those with a score higher
+        than the mean are colored teal. The orange bar shows the algorithm with
+        the highest predicted score. The error bar is +/- one standard error.
+        Parameters
+        ----------
+        ylabel : str,
+            Label for the y-axis. Defaults to the scoring metric.
+        """
+        if ylabel is None:
+            ylabel = self.selected_score_label().capitalize()
+        trials = self.est.model_selection_trials_
+        if not len(trials):
+            _log_visualize_no_trials("algorithm selection")
+            return
+        fig, ax = plt.subplots(1, figsize=(6, 3))
+        colors = []
+        y_error = []
+        mean_scores, models, cvscores = [], [], []
+        for (
+            algorithm,
+            samples,
+            features,
+            mean_score,
+            hyperparameters,
+            all_scores,
+            runtime,
+            x,
+        ) in trials:
+            mean_scores.append(mean_score)
+            models.append(algorithm)
+            cvscores.append(all_scores)
+        mean_scores_ser = pd.Series(mean_scores, index=models).sort_values(
+            ascending=False
+        )
+        scores_ser = pd.Series(cvscores, index=models)
+        ax.set_title("Algorithm Selection Trials")
+        ax.set_ylabel(ylabel)
+        ax.set_xlabel("Algorithm")
+        for f in mean_scores_ser.keys():
+            se = scipy.stats.sem(scores_ser[f], ddof=1)
+            y_error.append(se)
+            if f == "{}_AS".format(self.est.selected_model_):
+                colors.append("orange")
+            elif mean_scores_ser[f] >= mean_scores_ser.mean():
+                colors.append("teal")
+            else:
+                colors.append("turquoise")
+        mean_scores_ser.plot.bar(ax=ax, color=colors, edgecolor="black", zorder=1)
+        ax.errorbar(
+            x=mean_scores_ser.index.values,
+            y=mean_scores_ser.values,
+            yerr=y_error,
+            fmt="none",
+            capsize=4,
+            color="black",
+            zorder=0,
+        )
+        ax.axhline(y=mean_scores_ser.mean(), color="black", linewidth=0.5)
+        ax.autoscale_view()
+        plt.show()
+    def visualize_adaptive_sampling_trials(self):
+        """
+        Visualize the trials for Adaptive Sampling.
+        """
+        trials = self.est.adaptive_sampling_trials_
+        if len(trials) == 0:
+            _log_visualize_no_trials("adaptive sampling")
+            return
+        fig, ax = plt.subplots(1, figsize=(6, 3))
+        ax.set_title("Adaptive Sampling ({})".format(trials[0][0]))
+        ax.set_xlabel("Dataset sample size")
+        ax.set_ylabel(r"Predicted model score")
+        scores = [
+            mean_score
+            for (
+                algorithm,
+                samples,
+                features,
+                mean_score,
+                hyperparameters,
+                all_scores,
+                runtime,
+                x,
+            ) in trials
+        ]
+        n_samples = [
+            samples
+            for (
+                algorithm,
+                samples,
+                features,
+                mean_score,
+                hyperparameters,
+                all_scores,
+                runtime,
+                x,
+            ) in trials
+        ]
+        y_margin = 0.10 * (max(scores) - min(scores))
+        ax.grid(color="g", linestyle="-", linewidth=0.1)
+        ax.set_ylim(min(scores) - y_margin, max(scores) + y_margin)
+        ax.plot(n_samples, scores, "k:", marker="s", color="teal", markersize=3)
+        plt.show()
+    def visualize_feature_selection_trials(self, ylabel=None):
+        """
+        Visualize the feature selection trials taken to arrive at optimal set of
+        features. The orange line shows the optimal number of features chosen
+        by Feature Selection.
+        Parameters
+        ----------
+        ylabel : str,
+            Label for the y-axis. Defaults to the scoring metric.
+        """
+        if ylabel is None:
+            ylabel = self.selected_score_label().capitalize()
+        trials = self.est.feature_selection_trials_
+        if len(trials) == 0:
+            _log_visualize_no_trials("feature selection")
+            return
+        fig, ax = plt.subplots(1, figsize=(6, 3))
+        ax.set_title("Feature Selection Trials")
+        ax.set_xlabel("Number of Features")
+        ax.set_ylabel(ylabel)
+        scores = [
+            mean_score
+            for (
+                algorithm,
+                samples,
+                features,
+                mean_score,
+                hyperparameters,
+                all_scores,
+                runtime,
+                x,
+            ) in trials
+        ]
+        n_features = [
+            features
+            for (
+                algorithm,
+                samples,
+                features,
+                mean_score,
+                hyperparameters,
+                all_scores,
+                runtime,
+                x,
+            ) in trials
+        ]
+        y_margin = 0.10 * (max(scores) - min(scores))
+        ax.grid(color="g", linestyle="-", linewidth=0.1)
+        ax.set_ylim(min(scores) - y_margin, max(scores) + y_margin)
+        ax.plot(n_features, scores, "k:", marker="s", color="teal", markersize=3)
+        ax.axvline(
+            x=len(self.est.selected_features_names_), color="orange", linewidth=2.0
+        )
+        plt.show()
+    def visualize_tuning_trials(self, ylabel=None):
+        """
+        Visualize (plot) the hyperparamter tuning trials taken to arrive at the optimal
+        hyper parameters. Each trial in the plot represents a particular
+        hyperparamter combination.
+        Parameters
+        ----------
+        ylabel : str,
+            Label for the y-axis. Defaults to the scoring metric.
+        """
+        if ylabel is None:
+            ylabel = self.selected_score_label().capitalize()
+        # scores in trials are sorted decreasingly.
+        # reversed(trails) : let the scores sort in increasing order from left to right.
+        scores = [
+            mean_score
+            for (
+                algorithm,
+                samples,
+                features,
+                mean_score,
+                hyperparameters,
+                all_scores,
+                runtime,
+                x,
+            ) in reversed(self.est.tuning_trials_)
+            if mean_score and not np.isnan(mean_score)
+        ]
+        if not len(scores) > 1:
+            raise RuntimeError("Insufficient tuning trials.")
+        else:
+            fig, ax = plt.subplots(1, figsize=(6, 3))
+            ax.set_title("Hyperparameter Tuning Trials")
+            ax.set_xlabel("Iteration $n$")
+            ax.set_ylabel(ylabel)
+            y_margin = 0.10 * (max(scores) - min(scores))
+            ax.grid(color="g", linestyle="-", linewidth=0.1)
+            ax.set_ylim(min(scores) - y_margin, max(scores) + y_margin)
+            ax.plot(
+                range(1, len(scores) + 1),
+                scores,
+                "k:",
+                marker="s",
+                color="teal",
+                markersize=3,
+            )
+            plt.show()
+class AutoMLPreprocessingTransformer(object):  # pragma: no cover
+    @deprecated(
+        details="Working with AutoML has moved from within ADS to working directly with the AutoMLx library. AutoMLx are preinstalled in conda pack automlx_p38_cpu_v2 and later, and can now be updated independently of ADS. AutoMLx documentation may be found at https://docs.oracle.com/en-us/iaas/tools/automlx/latest/html/multiversion/v23.1.1/index.html. Notebook examples are in Oracle's samples repository: https://github.com/oracle-samples/oci-data-science-ai-samples/tree/master/notebook_examples and a migration tutorial can be found at https://accelerated-data-science.readthedocs.io/en/latest/user_guide/model_training/automl/quick_start.html .",
+        raise_error=True,
+    )
+    def __init__(self, msg):
+        self.msg = msg
+    def fit(self, X):
+        """
+        Fits the preprocessing Transformer
+        Parameters
+        ----------
+        X: Dataframe or list-like
+          A Dataframe or list-like object holding data to be predicted on
+        Returns
+        -------
+        Self: Estimator
+            The fitted estimator
+        """
+        return self
+    def transform(self, X):
+        """
+        Runs the preprocessing transform function and returns the result
+        Parameters
+        ---------
+        X: Dataframe or list-like
+          A Dataframe or list-like object holding data to be transformed
+        Returns
+        -------
+        X: Dataframe or list-like
+            The transformed Dataframe.
+        """
+        return X
+    def _log_visualize_no_trials(target):
+        logger.error(
+            f"There are no trials. Therefore, the {target} cannot be visualized."
+        )
+    def __repr__(self):
+        return self.msg
+class AutoMLFeatureSelection(object):  # pragma: no cover
+    @deprecated(
+        details="Working with AutoML has moved from within ADS to working directly with the AutoMLx library. AutoMLx are preinstalled in conda pack automlx_p38_cpu_v2 and later, and can now be updated independently of ADS. AutoMLx documentation may be found at https://docs.oracle.com/en-us/iaas/tools/automlx/latest/html/multiversion/v23.1.1/index.html. Notebook examples are in Oracle's samples repository: https://github.com/oracle-samples/oci-data-science-ai-samples/tree/master/notebook_examples and a migration tutorial can be found at https://accelerated-data-science.readthedocs.io/en/latest/user_guide/model_training/automl/quick_start.html .",
+        raise_error=True,
+    )
+    def __init__(self, msg):
+        self.msg = msg
+    def fit(self, X):
+        """
+        Fits the baseline estimator
+        Parameters
+        ----------
+        X: Dataframe or list-like
+          A Dataframe or list-like object holding data to be predicted on
+        Returns
+        -------
+        Self: Estimator
+            The fitted estimator
+        """
+        return self
+    def transform(self, X):
+        """
+        Runs the Baselines transform function and returns the result
+        Parameters
+        ---------
+        X: Dataframe or list-like
+          A Dataframe or list-like object holding data to be transformed
+        Returns
+        -------
+        X: Dataframe or list-like
+            The transformed Dataframe.
+        """
+        return X
+    def __repr__(self):
+        return self.msg

oracle-ads 2.13.9rc0__py3-none-any.whl → 2.13.9rc1__py3-none-any.whl

oracle-ads 2.13.9rc0py3-none-any.whl → 2.13.9rc1py3-none-any.whl