oracle-ads 2.13.8__py3-none-any.whl → 2.13.9rc0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {oracle_ads-2.13.8.dist-info → oracle_ads-2.13.9rc0.dist-info}/METADATA +151 -151
- oracle_ads-2.13.9rc0.dist-info/RECORD +9 -0
- {oracle_ads-2.13.8.dist-info → oracle_ads-2.13.9rc0.dist-info}/WHEEL +2 -1
- {oracle_ads-2.13.8.dist-info → oracle_ads-2.13.9rc0.dist-info}/entry_points.txt +1 -2
- oracle_ads-2.13.9rc0.dist-info/top_level.txt +1 -0
- ads/aqua/__init__.py +0 -40
- ads/aqua/app.py +0 -506
- ads/aqua/cli.py +0 -96
- ads/aqua/client/__init__.py +0 -3
- ads/aqua/client/client.py +0 -836
- ads/aqua/client/openai_client.py +0 -305
- ads/aqua/common/__init__.py +0 -5
- ads/aqua/common/decorator.py +0 -125
- ads/aqua/common/entities.py +0 -266
- ads/aqua/common/enums.py +0 -122
- ads/aqua/common/errors.py +0 -109
- ads/aqua/common/utils.py +0 -1285
- ads/aqua/config/__init__.py +0 -4
- ads/aqua/config/container_config.py +0 -248
- ads/aqua/config/evaluation/__init__.py +0 -4
- ads/aqua/config/evaluation/evaluation_service_config.py +0 -147
- ads/aqua/config/utils/__init__.py +0 -4
- ads/aqua/config/utils/serializer.py +0 -339
- ads/aqua/constants.py +0 -114
- ads/aqua/data.py +0 -14
- ads/aqua/dummy_data/icon.txt +0 -1
- ads/aqua/dummy_data/oci_model_deployments.json +0 -56
- ads/aqua/dummy_data/oci_models.json +0 -1
- ads/aqua/dummy_data/readme.md +0 -26
- ads/aqua/evaluation/__init__.py +0 -8
- ads/aqua/evaluation/constants.py +0 -53
- ads/aqua/evaluation/entities.py +0 -186
- ads/aqua/evaluation/errors.py +0 -70
- ads/aqua/evaluation/evaluation.py +0 -1814
- ads/aqua/extension/__init__.py +0 -42
- ads/aqua/extension/aqua_ws_msg_handler.py +0 -76
- ads/aqua/extension/base_handler.py +0 -90
- ads/aqua/extension/common_handler.py +0 -121
- ads/aqua/extension/common_ws_msg_handler.py +0 -36
- ads/aqua/extension/deployment_handler.py +0 -298
- ads/aqua/extension/deployment_ws_msg_handler.py +0 -54
- ads/aqua/extension/errors.py +0 -30
- ads/aqua/extension/evaluation_handler.py +0 -129
- ads/aqua/extension/evaluation_ws_msg_handler.py +0 -61
- ads/aqua/extension/finetune_handler.py +0 -96
- ads/aqua/extension/model_handler.py +0 -390
- ads/aqua/extension/models/__init__.py +0 -0
- ads/aqua/extension/models/ws_models.py +0 -145
- ads/aqua/extension/models_ws_msg_handler.py +0 -50
- ads/aqua/extension/ui_handler.py +0 -282
- ads/aqua/extension/ui_websocket_handler.py +0 -130
- ads/aqua/extension/utils.py +0 -133
- ads/aqua/finetuning/__init__.py +0 -7
- ads/aqua/finetuning/constants.py +0 -23
- ads/aqua/finetuning/entities.py +0 -181
- ads/aqua/finetuning/finetuning.py +0 -731
- ads/aqua/model/__init__.py +0 -8
- ads/aqua/model/constants.py +0 -60
- ads/aqua/model/entities.py +0 -306
- ads/aqua/model/enums.py +0 -30
- ads/aqua/model/model.py +0 -2080
- ads/aqua/modeldeployment/__init__.py +0 -8
- ads/aqua/modeldeployment/constants.py +0 -10
- ads/aqua/modeldeployment/deployment.py +0 -1324
- ads/aqua/modeldeployment/entities.py +0 -653
- ads/aqua/modeldeployment/inference.py +0 -74
- ads/aqua/modeldeployment/utils.py +0 -543
- ads/aqua/resources/gpu_shapes_index.json +0 -94
- ads/aqua/server/__init__.py +0 -4
- ads/aqua/server/__main__.py +0 -24
- ads/aqua/server/app.py +0 -47
- ads/aqua/server/aqua_spec.yml +0 -1291
- ads/aqua/training/__init__.py +0 -4
- ads/aqua/training/exceptions.py +0 -476
- ads/aqua/ui.py +0 -499
- ads/automl/__init__.py +0 -9
- ads/automl/driver.py +0 -330
- ads/automl/provider.py +0 -975
- ads/bds/__init__.py +0 -5
- ads/bds/auth.py +0 -127
- ads/bds/big_data_service.py +0 -255
- ads/catalog/__init__.py +0 -19
- ads/catalog/model.py +0 -1576
- ads/catalog/notebook.py +0 -461
- ads/catalog/project.py +0 -468
- ads/catalog/summary.py +0 -178
- ads/common/__init__.py +0 -11
- ads/common/analyzer.py +0 -65
- ads/common/artifact/.model-ignore +0 -63
- ads/common/artifact/__init__.py +0 -10
- ads/common/auth.py +0 -1122
- ads/common/card_identifier.py +0 -83
- ads/common/config.py +0 -647
- ads/common/data.py +0 -165
- ads/common/decorator/__init__.py +0 -9
- ads/common/decorator/argument_to_case.py +0 -88
- ads/common/decorator/deprecate.py +0 -69
- ads/common/decorator/require_nonempty_arg.py +0 -65
- ads/common/decorator/runtime_dependency.py +0 -178
- ads/common/decorator/threaded.py +0 -97
- ads/common/decorator/utils.py +0 -35
- ads/common/dsc_file_system.py +0 -303
- ads/common/error.py +0 -14
- ads/common/extended_enum.py +0 -81
- ads/common/function/__init__.py +0 -5
- ads/common/function/fn_util.py +0 -142
- ads/common/function/func_conf.yaml +0 -25
- ads/common/ipython.py +0 -76
- ads/common/model.py +0 -679
- ads/common/model_artifact.py +0 -1759
- ads/common/model_artifact_schema.json +0 -107
- ads/common/model_export_util.py +0 -664
- ads/common/model_metadata.py +0 -24
- ads/common/object_storage_details.py +0 -296
- ads/common/oci_client.py +0 -175
- ads/common/oci_datascience.py +0 -46
- ads/common/oci_logging.py +0 -1144
- ads/common/oci_mixin.py +0 -957
- ads/common/oci_resource.py +0 -136
- ads/common/serializer.py +0 -559
- ads/common/utils.py +0 -1852
- ads/common/word_lists.py +0 -1491
- ads/common/work_request.py +0 -189
- ads/data_labeling/__init__.py +0 -13
- ads/data_labeling/boundingbox.py +0 -253
- ads/data_labeling/constants.py +0 -47
- ads/data_labeling/data_labeling_service.py +0 -244
- ads/data_labeling/interface/__init__.py +0 -5
- ads/data_labeling/interface/loader.py +0 -16
- ads/data_labeling/interface/parser.py +0 -16
- ads/data_labeling/interface/reader.py +0 -23
- ads/data_labeling/loader/__init__.py +0 -5
- ads/data_labeling/loader/file_loader.py +0 -241
- ads/data_labeling/metadata.py +0 -110
- ads/data_labeling/mixin/__init__.py +0 -5
- ads/data_labeling/mixin/data_labeling.py +0 -232
- ads/data_labeling/ner.py +0 -129
- ads/data_labeling/parser/__init__.py +0 -5
- ads/data_labeling/parser/dls_record_parser.py +0 -388
- ads/data_labeling/parser/export_metadata_parser.py +0 -94
- ads/data_labeling/parser/export_record_parser.py +0 -473
- ads/data_labeling/reader/__init__.py +0 -5
- ads/data_labeling/reader/dataset_reader.py +0 -574
- ads/data_labeling/reader/dls_record_reader.py +0 -121
- ads/data_labeling/reader/export_record_reader.py +0 -62
- ads/data_labeling/reader/jsonl_reader.py +0 -75
- ads/data_labeling/reader/metadata_reader.py +0 -203
- ads/data_labeling/reader/record_reader.py +0 -263
- ads/data_labeling/record.py +0 -52
- ads/data_labeling/visualizer/__init__.py +0 -5
- ads/data_labeling/visualizer/image_visualizer.py +0 -525
- ads/data_labeling/visualizer/text_visualizer.py +0 -357
- ads/database/__init__.py +0 -5
- ads/database/connection.py +0 -338
- ads/dataset/__init__.py +0 -10
- ads/dataset/capabilities.md +0 -51
- ads/dataset/classification_dataset.py +0 -339
- ads/dataset/correlation.py +0 -226
- ads/dataset/correlation_plot.py +0 -563
- ads/dataset/dask_series.py +0 -173
- ads/dataset/dataframe_transformer.py +0 -110
- ads/dataset/dataset.py +0 -1979
- ads/dataset/dataset_browser.py +0 -360
- ads/dataset/dataset_with_target.py +0 -995
- ads/dataset/exception.py +0 -25
- ads/dataset/factory.py +0 -987
- ads/dataset/feature_engineering_transformer.py +0 -35
- ads/dataset/feature_selection.py +0 -107
- ads/dataset/forecasting_dataset.py +0 -26
- ads/dataset/helper.py +0 -1450
- ads/dataset/label_encoder.py +0 -99
- ads/dataset/mixin/__init__.py +0 -5
- ads/dataset/mixin/dataset_accessor.py +0 -134
- ads/dataset/pipeline.py +0 -58
- ads/dataset/plot.py +0 -710
- ads/dataset/progress.py +0 -86
- ads/dataset/recommendation.py +0 -297
- ads/dataset/recommendation_transformer.py +0 -502
- ads/dataset/regression_dataset.py +0 -14
- ads/dataset/sampled_dataset.py +0 -1050
- ads/dataset/target.py +0 -98
- ads/dataset/timeseries.py +0 -18
- ads/dbmixin/__init__.py +0 -5
- ads/dbmixin/db_pandas_accessor.py +0 -153
- ads/environment/__init__.py +0 -9
- ads/environment/ml_runtime.py +0 -66
- ads/evaluations/README.md +0 -14
- ads/evaluations/__init__.py +0 -109
- ads/evaluations/evaluation_plot.py +0 -983
- ads/evaluations/evaluator.py +0 -1334
- ads/evaluations/statistical_metrics.py +0 -543
- ads/experiments/__init__.py +0 -9
- ads/experiments/capabilities.md +0 -0
- ads/explanations/__init__.py +0 -21
- ads/explanations/base_explainer.py +0 -142
- ads/explanations/capabilities.md +0 -83
- ads/explanations/explainer.py +0 -190
- ads/explanations/mlx_global_explainer.py +0 -1050
- ads/explanations/mlx_interface.py +0 -386
- ads/explanations/mlx_local_explainer.py +0 -287
- ads/explanations/mlx_whatif_explainer.py +0 -201
- ads/feature_engineering/__init__.py +0 -20
- ads/feature_engineering/accessor/__init__.py +0 -5
- ads/feature_engineering/accessor/dataframe_accessor.py +0 -535
- ads/feature_engineering/accessor/mixin/__init__.py +0 -5
- ads/feature_engineering/accessor/mixin/correlation.py +0 -166
- ads/feature_engineering/accessor/mixin/eda_mixin.py +0 -266
- ads/feature_engineering/accessor/mixin/eda_mixin_series.py +0 -85
- ads/feature_engineering/accessor/mixin/feature_types_mixin.py +0 -211
- ads/feature_engineering/accessor/mixin/utils.py +0 -65
- ads/feature_engineering/accessor/series_accessor.py +0 -431
- ads/feature_engineering/adsimage/__init__.py +0 -5
- ads/feature_engineering/adsimage/image.py +0 -192
- ads/feature_engineering/adsimage/image_reader.py +0 -170
- ads/feature_engineering/adsimage/interface/__init__.py +0 -5
- ads/feature_engineering/adsimage/interface/reader.py +0 -19
- ads/feature_engineering/adsstring/__init__.py +0 -7
- ads/feature_engineering/adsstring/oci_language/__init__.py +0 -8
- ads/feature_engineering/adsstring/string/__init__.py +0 -8
- ads/feature_engineering/data_schema.json +0 -57
- ads/feature_engineering/dataset/__init__.py +0 -5
- ads/feature_engineering/dataset/zip_code_data.py +0 -42062
- ads/feature_engineering/exceptions.py +0 -40
- ads/feature_engineering/feature_type/__init__.py +0 -133
- ads/feature_engineering/feature_type/address.py +0 -184
- ads/feature_engineering/feature_type/adsstring/__init__.py +0 -5
- ads/feature_engineering/feature_type/adsstring/common_regex_mixin.py +0 -164
- ads/feature_engineering/feature_type/adsstring/oci_language.py +0 -93
- ads/feature_engineering/feature_type/adsstring/parsers/__init__.py +0 -5
- ads/feature_engineering/feature_type/adsstring/parsers/base.py +0 -47
- ads/feature_engineering/feature_type/adsstring/parsers/nltk_parser.py +0 -96
- ads/feature_engineering/feature_type/adsstring/parsers/spacy_parser.py +0 -221
- ads/feature_engineering/feature_type/adsstring/string.py +0 -258
- ads/feature_engineering/feature_type/base.py +0 -58
- ads/feature_engineering/feature_type/boolean.py +0 -183
- ads/feature_engineering/feature_type/category.py +0 -146
- ads/feature_engineering/feature_type/constant.py +0 -137
- ads/feature_engineering/feature_type/continuous.py +0 -151
- ads/feature_engineering/feature_type/creditcard.py +0 -314
- ads/feature_engineering/feature_type/datetime.py +0 -190
- ads/feature_engineering/feature_type/discrete.py +0 -134
- ads/feature_engineering/feature_type/document.py +0 -43
- ads/feature_engineering/feature_type/gis.py +0 -251
- ads/feature_engineering/feature_type/handler/__init__.py +0 -5
- ads/feature_engineering/feature_type/handler/feature_validator.py +0 -524
- ads/feature_engineering/feature_type/handler/feature_warning.py +0 -319
- ads/feature_engineering/feature_type/handler/warnings.py +0 -128
- ads/feature_engineering/feature_type/integer.py +0 -142
- ads/feature_engineering/feature_type/ip_address.py +0 -144
- ads/feature_engineering/feature_type/ip_address_v4.py +0 -138
- ads/feature_engineering/feature_type/ip_address_v6.py +0 -138
- ads/feature_engineering/feature_type/lat_long.py +0 -256
- ads/feature_engineering/feature_type/object.py +0 -43
- ads/feature_engineering/feature_type/ordinal.py +0 -132
- ads/feature_engineering/feature_type/phone_number.py +0 -135
- ads/feature_engineering/feature_type/string.py +0 -171
- ads/feature_engineering/feature_type/text.py +0 -93
- ads/feature_engineering/feature_type/unknown.py +0 -43
- ads/feature_engineering/feature_type/zip_code.py +0 -164
- ads/feature_engineering/feature_type_manager.py +0 -406
- ads/feature_engineering/schema.py +0 -795
- ads/feature_engineering/utils.py +0 -245
- ads/feature_store/.readthedocs.yaml +0 -19
- ads/feature_store/README.md +0 -65
- ads/feature_store/__init__.py +0 -9
- ads/feature_store/common/__init__.py +0 -0
- ads/feature_store/common/enums.py +0 -339
- ads/feature_store/common/exceptions.py +0 -18
- ads/feature_store/common/spark_session_singleton.py +0 -125
- ads/feature_store/common/utils/__init__.py +0 -0
- ads/feature_store/common/utils/base64_encoder_decoder.py +0 -72
- ads/feature_store/common/utils/feature_schema_mapper.py +0 -283
- ads/feature_store/common/utils/transformation_utils.py +0 -82
- ads/feature_store/common/utils/utility.py +0 -403
- ads/feature_store/data_validation/__init__.py +0 -0
- ads/feature_store/data_validation/great_expectation.py +0 -129
- ads/feature_store/dataset.py +0 -1230
- ads/feature_store/dataset_job.py +0 -530
- ads/feature_store/docs/Dockerfile +0 -7
- ads/feature_store/docs/Makefile +0 -44
- ads/feature_store/docs/conf.py +0 -28
- ads/feature_store/docs/requirements.txt +0 -14
- ads/feature_store/docs/source/ads.feature_store.query.rst +0 -20
- ads/feature_store/docs/source/cicd.rst +0 -137
- ads/feature_store/docs/source/conf.py +0 -86
- ads/feature_store/docs/source/data_versioning.rst +0 -33
- ads/feature_store/docs/source/dataset.rst +0 -388
- ads/feature_store/docs/source/dataset_job.rst +0 -27
- ads/feature_store/docs/source/demo.rst +0 -70
- ads/feature_store/docs/source/entity.rst +0 -78
- ads/feature_store/docs/source/feature_group.rst +0 -624
- ads/feature_store/docs/source/feature_group_job.rst +0 -29
- ads/feature_store/docs/source/feature_store.rst +0 -122
- ads/feature_store/docs/source/feature_store_class.rst +0 -123
- ads/feature_store/docs/source/feature_validation.rst +0 -66
- ads/feature_store/docs/source/figures/cicd.png +0 -0
- ads/feature_store/docs/source/figures/data_validation.png +0 -0
- ads/feature_store/docs/source/figures/data_versioning.png +0 -0
- ads/feature_store/docs/source/figures/dataset.gif +0 -0
- ads/feature_store/docs/source/figures/dataset.png +0 -0
- ads/feature_store/docs/source/figures/dataset_lineage.png +0 -0
- ads/feature_store/docs/source/figures/dataset_statistics.png +0 -0
- ads/feature_store/docs/source/figures/dataset_statistics_viz.png +0 -0
- ads/feature_store/docs/source/figures/dataset_validation_results.png +0 -0
- ads/feature_store/docs/source/figures/dataset_validation_summary.png +0 -0
- ads/feature_store/docs/source/figures/drift_monitoring.png +0 -0
- ads/feature_store/docs/source/figures/entity.png +0 -0
- ads/feature_store/docs/source/figures/feature_group.png +0 -0
- ads/feature_store/docs/source/figures/feature_group_lineage.png +0 -0
- ads/feature_store/docs/source/figures/feature_group_statistics_viz.png +0 -0
- ads/feature_store/docs/source/figures/feature_store_deployment.png +0 -0
- ads/feature_store/docs/source/figures/feature_store_overview.png +0 -0
- ads/feature_store/docs/source/figures/featuregroup.gif +0 -0
- ads/feature_store/docs/source/figures/lineage_d1.png +0 -0
- ads/feature_store/docs/source/figures/lineage_d2.png +0 -0
- ads/feature_store/docs/source/figures/lineage_fg.png +0 -0
- ads/feature_store/docs/source/figures/logo-dark-mode.png +0 -0
- ads/feature_store/docs/source/figures/logo-light-mode.png +0 -0
- ads/feature_store/docs/source/figures/overview.png +0 -0
- ads/feature_store/docs/source/figures/resource_manager.png +0 -0
- ads/feature_store/docs/source/figures/resource_manager_feature_store_stack.png +0 -0
- ads/feature_store/docs/source/figures/resource_manager_home.png +0 -0
- ads/feature_store/docs/source/figures/stats_1.png +0 -0
- ads/feature_store/docs/source/figures/stats_2.png +0 -0
- ads/feature_store/docs/source/figures/stats_d.png +0 -0
- ads/feature_store/docs/source/figures/stats_fg.png +0 -0
- ads/feature_store/docs/source/figures/transformation.png +0 -0
- ads/feature_store/docs/source/figures/transformations.gif +0 -0
- ads/feature_store/docs/source/figures/validation.png +0 -0
- ads/feature_store/docs/source/figures/validation_fg.png +0 -0
- ads/feature_store/docs/source/figures/validation_results.png +0 -0
- ads/feature_store/docs/source/figures/validation_summary.png +0 -0
- ads/feature_store/docs/source/index.rst +0 -81
- ads/feature_store/docs/source/module.rst +0 -8
- ads/feature_store/docs/source/notebook.rst +0 -94
- ads/feature_store/docs/source/overview.rst +0 -47
- ads/feature_store/docs/source/quickstart.rst +0 -176
- ads/feature_store/docs/source/release_notes.rst +0 -194
- ads/feature_store/docs/source/setup_feature_store.rst +0 -81
- ads/feature_store/docs/source/statistics.rst +0 -58
- ads/feature_store/docs/source/transformation.rst +0 -199
- ads/feature_store/docs/source/ui.rst +0 -65
- ads/feature_store/docs/source/user_guides.setup.feature_store_operator.rst +0 -66
- ads/feature_store/docs/source/user_guides.setup.helm_chart.rst +0 -192
- ads/feature_store/docs/source/user_guides.setup.terraform.rst +0 -338
- ads/feature_store/entity.py +0 -718
- ads/feature_store/execution_strategy/__init__.py +0 -0
- ads/feature_store/execution_strategy/delta_lake/__init__.py +0 -0
- ads/feature_store/execution_strategy/delta_lake/delta_lake_service.py +0 -375
- ads/feature_store/execution_strategy/engine/__init__.py +0 -0
- ads/feature_store/execution_strategy/engine/spark_engine.py +0 -316
- ads/feature_store/execution_strategy/execution_strategy.py +0 -113
- ads/feature_store/execution_strategy/execution_strategy_provider.py +0 -47
- ads/feature_store/execution_strategy/spark/__init__.py +0 -0
- ads/feature_store/execution_strategy/spark/spark_execution.py +0 -618
- ads/feature_store/feature.py +0 -192
- ads/feature_store/feature_group.py +0 -1494
- ads/feature_store/feature_group_expectation.py +0 -346
- ads/feature_store/feature_group_job.py +0 -602
- ads/feature_store/feature_lineage/__init__.py +0 -0
- ads/feature_store/feature_lineage/graphviz_service.py +0 -180
- ads/feature_store/feature_option_details.py +0 -50
- ads/feature_store/feature_statistics/__init__.py +0 -0
- ads/feature_store/feature_statistics/statistics_service.py +0 -99
- ads/feature_store/feature_store.py +0 -699
- ads/feature_store/feature_store_registrar.py +0 -518
- ads/feature_store/input_feature_detail.py +0 -149
- ads/feature_store/mixin/__init__.py +0 -4
- ads/feature_store/mixin/oci_feature_store.py +0 -145
- ads/feature_store/model_details.py +0 -73
- ads/feature_store/query/__init__.py +0 -0
- ads/feature_store/query/filter.py +0 -266
- ads/feature_store/query/generator/__init__.py +0 -0
- ads/feature_store/query/generator/query_generator.py +0 -298
- ads/feature_store/query/join.py +0 -161
- ads/feature_store/query/query.py +0 -403
- ads/feature_store/query/validator/__init__.py +0 -0
- ads/feature_store/query/validator/query_validator.py +0 -57
- ads/feature_store/response/__init__.py +0 -0
- ads/feature_store/response/response_builder.py +0 -68
- ads/feature_store/service/__init__.py +0 -0
- ads/feature_store/service/oci_dataset.py +0 -139
- ads/feature_store/service/oci_dataset_job.py +0 -199
- ads/feature_store/service/oci_entity.py +0 -125
- ads/feature_store/service/oci_feature_group.py +0 -164
- ads/feature_store/service/oci_feature_group_job.py +0 -214
- ads/feature_store/service/oci_feature_store.py +0 -182
- ads/feature_store/service/oci_lineage.py +0 -87
- ads/feature_store/service/oci_transformation.py +0 -104
- ads/feature_store/statistics/__init__.py +0 -0
- ads/feature_store/statistics/abs_feature_value.py +0 -49
- ads/feature_store/statistics/charts/__init__.py +0 -0
- ads/feature_store/statistics/charts/abstract_feature_plot.py +0 -37
- ads/feature_store/statistics/charts/box_plot.py +0 -148
- ads/feature_store/statistics/charts/frequency_distribution.py +0 -65
- ads/feature_store/statistics/charts/probability_distribution.py +0 -68
- ads/feature_store/statistics/charts/top_k_frequent_elements.py +0 -98
- ads/feature_store/statistics/feature_stat.py +0 -126
- ads/feature_store/statistics/generic_feature_value.py +0 -33
- ads/feature_store/statistics/statistics.py +0 -41
- ads/feature_store/statistics_config.py +0 -101
- ads/feature_store/templates/feature_store_template.yaml +0 -45
- ads/feature_store/transformation.py +0 -499
- ads/feature_store/validation_output.py +0 -57
- ads/hpo/__init__.py +0 -9
- ads/hpo/_imports.py +0 -91
- ads/hpo/ads_search_space.py +0 -439
- ads/hpo/distributions.py +0 -325
- ads/hpo/objective.py +0 -280
- ads/hpo/search_cv.py +0 -1657
- ads/hpo/stopping_criterion.py +0 -75
- ads/hpo/tuner_artifact.py +0 -413
- ads/hpo/utils.py +0 -91
- ads/hpo/validation.py +0 -140
- ads/hpo/visualization/__init__.py +0 -5
- ads/hpo/visualization/_contour.py +0 -23
- ads/hpo/visualization/_edf.py +0 -20
- ads/hpo/visualization/_intermediate_values.py +0 -21
- ads/hpo/visualization/_optimization_history.py +0 -25
- ads/hpo/visualization/_parallel_coordinate.py +0 -169
- ads/hpo/visualization/_param_importances.py +0 -26
- ads/jobs/__init__.py +0 -53
- ads/jobs/ads_job.py +0 -663
- ads/jobs/builders/__init__.py +0 -5
- ads/jobs/builders/base.py +0 -156
- ads/jobs/builders/infrastructure/__init__.py +0 -6
- ads/jobs/builders/infrastructure/base.py +0 -165
- ads/jobs/builders/infrastructure/dataflow.py +0 -1252
- ads/jobs/builders/infrastructure/dsc_job.py +0 -1894
- ads/jobs/builders/infrastructure/dsc_job_runtime.py +0 -1233
- ads/jobs/builders/infrastructure/utils.py +0 -65
- ads/jobs/builders/runtimes/__init__.py +0 -5
- ads/jobs/builders/runtimes/artifact.py +0 -338
- ads/jobs/builders/runtimes/base.py +0 -325
- ads/jobs/builders/runtimes/container_runtime.py +0 -242
- ads/jobs/builders/runtimes/python_runtime.py +0 -1016
- ads/jobs/builders/runtimes/pytorch_runtime.py +0 -204
- ads/jobs/cli.py +0 -104
- ads/jobs/env_var_parser.py +0 -131
- ads/jobs/extension.py +0 -160
- ads/jobs/schema/__init__.py +0 -5
- ads/jobs/schema/infrastructure_schema.json +0 -116
- ads/jobs/schema/job_schema.json +0 -42
- ads/jobs/schema/runtime_schema.json +0 -183
- ads/jobs/schema/validator.py +0 -141
- ads/jobs/serializer.py +0 -296
- ads/jobs/templates/__init__.py +0 -5
- ads/jobs/templates/container.py +0 -6
- ads/jobs/templates/driver_notebook.py +0 -177
- ads/jobs/templates/driver_oci.py +0 -500
- ads/jobs/templates/driver_python.py +0 -48
- ads/jobs/templates/driver_pytorch.py +0 -852
- ads/jobs/templates/driver_utils.py +0 -615
- ads/jobs/templates/hostname_from_env.c +0 -55
- ads/jobs/templates/oci_metrics.py +0 -181
- ads/jobs/utils.py +0 -104
- ads/llm/__init__.py +0 -28
- ads/llm/autogen/__init__.py +0 -2
- ads/llm/autogen/constants.py +0 -15
- ads/llm/autogen/reports/__init__.py +0 -2
- ads/llm/autogen/reports/base.py +0 -67
- ads/llm/autogen/reports/data.py +0 -103
- ads/llm/autogen/reports/session.py +0 -526
- ads/llm/autogen/reports/templates/chat_box.html +0 -13
- ads/llm/autogen/reports/templates/chat_box_lt.html +0 -5
- ads/llm/autogen/reports/templates/chat_box_rt.html +0 -6
- ads/llm/autogen/reports/utils.py +0 -56
- ads/llm/autogen/v02/__init__.py +0 -4
- ads/llm/autogen/v02/client.py +0 -295
- ads/llm/autogen/v02/log_handlers/__init__.py +0 -2
- ads/llm/autogen/v02/log_handlers/oci_file_handler.py +0 -83
- ads/llm/autogen/v02/loggers/__init__.py +0 -6
- ads/llm/autogen/v02/loggers/metric_logger.py +0 -320
- ads/llm/autogen/v02/loggers/session_logger.py +0 -580
- ads/llm/autogen/v02/loggers/utils.py +0 -86
- ads/llm/autogen/v02/runtime_logging.py +0 -163
- ads/llm/chain.py +0 -268
- ads/llm/chat_template.py +0 -31
- ads/llm/deploy.py +0 -63
- ads/llm/guardrails/__init__.py +0 -5
- ads/llm/guardrails/base.py +0 -442
- ads/llm/guardrails/huggingface.py +0 -44
- ads/llm/langchain/__init__.py +0 -5
- ads/llm/langchain/plugins/__init__.py +0 -5
- ads/llm/langchain/plugins/chat_models/__init__.py +0 -5
- ads/llm/langchain/plugins/chat_models/oci_data_science.py +0 -1027
- ads/llm/langchain/plugins/embeddings/__init__.py +0 -4
- ads/llm/langchain/plugins/embeddings/oci_data_science_model_deployment_endpoint.py +0 -184
- ads/llm/langchain/plugins/llms/__init__.py +0 -5
- ads/llm/langchain/plugins/llms/oci_data_science_model_deployment_endpoint.py +0 -979
- ads/llm/requirements.txt +0 -3
- ads/llm/serialize.py +0 -219
- ads/llm/serializers/__init__.py +0 -0
- ads/llm/serializers/retrieval_qa.py +0 -153
- ads/llm/serializers/runnable_parallel.py +0 -27
- ads/llm/templates/score_chain.jinja2 +0 -155
- ads/llm/templates/tool_chat_template_hermes.jinja +0 -130
- ads/llm/templates/tool_chat_template_mistral_parallel.jinja +0 -94
- ads/model/__init__.py +0 -52
- ads/model/artifact.py +0 -573
- ads/model/artifact_downloader.py +0 -254
- ads/model/artifact_uploader.py +0 -267
- ads/model/base_properties.py +0 -238
- ads/model/common/.model-ignore +0 -66
- ads/model/common/__init__.py +0 -5
- ads/model/common/utils.py +0 -142
- ads/model/datascience_model.py +0 -2635
- ads/model/deployment/__init__.py +0 -20
- ads/model/deployment/common/__init__.py +0 -5
- ads/model/deployment/common/utils.py +0 -308
- ads/model/deployment/model_deployer.py +0 -466
- ads/model/deployment/model_deployment.py +0 -1846
- ads/model/deployment/model_deployment_infrastructure.py +0 -671
- ads/model/deployment/model_deployment_properties.py +0 -493
- ads/model/deployment/model_deployment_runtime.py +0 -838
- ads/model/extractor/__init__.py +0 -5
- ads/model/extractor/automl_extractor.py +0 -74
- ads/model/extractor/embedding_onnx_extractor.py +0 -80
- ads/model/extractor/huggingface_extractor.py +0 -88
- ads/model/extractor/keras_extractor.py +0 -84
- ads/model/extractor/lightgbm_extractor.py +0 -93
- ads/model/extractor/model_info_extractor.py +0 -114
- ads/model/extractor/model_info_extractor_factory.py +0 -105
- ads/model/extractor/pytorch_extractor.py +0 -87
- ads/model/extractor/sklearn_extractor.py +0 -112
- ads/model/extractor/spark_extractor.py +0 -89
- ads/model/extractor/tensorflow_extractor.py +0 -85
- ads/model/extractor/xgboost_extractor.py +0 -94
- ads/model/framework/__init__.py +0 -5
- ads/model/framework/automl_model.py +0 -178
- ads/model/framework/embedding_onnx_model.py +0 -438
- ads/model/framework/huggingface_model.py +0 -399
- ads/model/framework/lightgbm_model.py +0 -266
- ads/model/framework/pytorch_model.py +0 -266
- ads/model/framework/sklearn_model.py +0 -250
- ads/model/framework/spark_model.py +0 -326
- ads/model/framework/tensorflow_model.py +0 -254
- ads/model/framework/xgboost_model.py +0 -258
- ads/model/generic_model.py +0 -3518
- ads/model/model_artifact_boilerplate/README.md +0 -381
- ads/model/model_artifact_boilerplate/__init__.py +0 -5
- ads/model/model_artifact_boilerplate/artifact_introspection_test/__init__.py +0 -5
- ads/model/model_artifact_boilerplate/artifact_introspection_test/model_artifact_validate.py +0 -427
- ads/model/model_artifact_boilerplate/artifact_introspection_test/requirements.txt +0 -2
- ads/model/model_artifact_boilerplate/runtime.yaml +0 -7
- ads/model/model_artifact_boilerplate/score.py +0 -61
- ads/model/model_file_description_schema.json +0 -68
- ads/model/model_introspect.py +0 -331
- ads/model/model_metadata.py +0 -1810
- ads/model/model_metadata_mixin.py +0 -460
- ads/model/model_properties.py +0 -63
- ads/model/model_version_set.py +0 -739
- ads/model/runtime/__init__.py +0 -5
- ads/model/runtime/env_info.py +0 -306
- ads/model/runtime/model_deployment_details.py +0 -37
- ads/model/runtime/model_provenance_details.py +0 -58
- ads/model/runtime/runtime_info.py +0 -81
- ads/model/runtime/schemas/inference_env_info_schema.yaml +0 -16
- ads/model/runtime/schemas/model_provenance_schema.yaml +0 -36
- ads/model/runtime/schemas/training_env_info_schema.yaml +0 -16
- ads/model/runtime/utils.py +0 -201
- ads/model/serde/__init__.py +0 -5
- ads/model/serde/common.py +0 -40
- ads/model/serde/model_input.py +0 -547
- ads/model/serde/model_serializer.py +0 -1184
- ads/model/service/__init__.py +0 -5
- ads/model/service/oci_datascience_model.py +0 -1076
- ads/model/service/oci_datascience_model_deployment.py +0 -500
- ads/model/service/oci_datascience_model_version_set.py +0 -176
- ads/model/transformer/__init__.py +0 -5
- ads/model/transformer/onnx_transformer.py +0 -324
- ads/mysqldb/__init__.py +0 -5
- ads/mysqldb/mysql_db.py +0 -227
- ads/opctl/__init__.py +0 -18
- ads/opctl/anomaly_detection.py +0 -11
- ads/opctl/backend/__init__.py +0 -5
- ads/opctl/backend/ads_dataflow.py +0 -353
- ads/opctl/backend/ads_ml_job.py +0 -710
- ads/opctl/backend/ads_ml_pipeline.py +0 -164
- ads/opctl/backend/ads_model_deployment.py +0 -209
- ads/opctl/backend/base.py +0 -146
- ads/opctl/backend/local.py +0 -1053
- ads/opctl/backend/marketplace/__init__.py +0 -9
- ads/opctl/backend/marketplace/helm_helper.py +0 -173
- ads/opctl/backend/marketplace/local_marketplace.py +0 -271
- ads/opctl/backend/marketplace/marketplace_backend_runner.py +0 -71
- ads/opctl/backend/marketplace/marketplace_operator_interface.py +0 -44
- ads/opctl/backend/marketplace/marketplace_operator_runner.py +0 -24
- ads/opctl/backend/marketplace/marketplace_utils.py +0 -212
- ads/opctl/backend/marketplace/models/__init__.py +0 -5
- ads/opctl/backend/marketplace/models/bearer_token.py +0 -94
- ads/opctl/backend/marketplace/models/marketplace_type.py +0 -70
- ads/opctl/backend/marketplace/models/ocir_details.py +0 -56
- ads/opctl/backend/marketplace/prerequisite_checker.py +0 -238
- ads/opctl/cli.py +0 -707
- ads/opctl/cmds.py +0 -869
- ads/opctl/conda/__init__.py +0 -5
- ads/opctl/conda/cli.py +0 -193
- ads/opctl/conda/cmds.py +0 -749
- ads/opctl/conda/config.yaml +0 -34
- ads/opctl/conda/manifest_template.yaml +0 -13
- ads/opctl/conda/multipart_uploader.py +0 -188
- ads/opctl/conda/pack.py +0 -89
- ads/opctl/config/__init__.py +0 -5
- ads/opctl/config/base.py +0 -57
- ads/opctl/config/diagnostics/__init__.py +0 -5
- ads/opctl/config/diagnostics/distributed/default_requirements_config.yaml +0 -62
- ads/opctl/config/merger.py +0 -255
- ads/opctl/config/resolver.py +0 -297
- ads/opctl/config/utils.py +0 -79
- ads/opctl/config/validator.py +0 -17
- ads/opctl/config/versioner.py +0 -68
- ads/opctl/config/yaml_parsers/__init__.py +0 -7
- ads/opctl/config/yaml_parsers/base.py +0 -58
- ads/opctl/config/yaml_parsers/distributed/__init__.py +0 -7
- ads/opctl/config/yaml_parsers/distributed/yaml_parser.py +0 -201
- ads/opctl/constants.py +0 -66
- ads/opctl/decorator/__init__.py +0 -5
- ads/opctl/decorator/common.py +0 -129
- ads/opctl/diagnostics/__init__.py +0 -5
- ads/opctl/diagnostics/__main__.py +0 -25
- ads/opctl/diagnostics/check_distributed_job_requirements.py +0 -212
- ads/opctl/diagnostics/check_requirements.py +0 -144
- ads/opctl/diagnostics/requirement_exception.py +0 -9
- ads/opctl/distributed/README.md +0 -109
- ads/opctl/distributed/__init__.py +0 -5
- ads/opctl/distributed/certificates.py +0 -32
- ads/opctl/distributed/cli.py +0 -207
- ads/opctl/distributed/cmds.py +0 -731
- ads/opctl/distributed/common/__init__.py +0 -5
- ads/opctl/distributed/common/abstract_cluster_provider.py +0 -449
- ads/opctl/distributed/common/abstract_framework_spec_builder.py +0 -88
- ads/opctl/distributed/common/cluster_config_helper.py +0 -103
- ads/opctl/distributed/common/cluster_provider_factory.py +0 -21
- ads/opctl/distributed/common/cluster_runner.py +0 -54
- ads/opctl/distributed/common/framework_factory.py +0 -29
- ads/opctl/docker/Dockerfile.job +0 -103
- ads/opctl/docker/Dockerfile.job.arm +0 -107
- ads/opctl/docker/Dockerfile.job.gpu +0 -175
- ads/opctl/docker/base-env.yaml +0 -13
- ads/opctl/docker/cuda.repo +0 -6
- ads/opctl/docker/operator/.dockerignore +0 -0
- ads/opctl/docker/operator/Dockerfile +0 -41
- ads/opctl/docker/operator/Dockerfile.gpu +0 -85
- ads/opctl/docker/operator/cuda.repo +0 -6
- ads/opctl/docker/operator/environment.yaml +0 -8
- ads/opctl/forecast.py +0 -11
- ads/opctl/index.yaml +0 -3
- ads/opctl/model/__init__.py +0 -5
- ads/opctl/model/cli.py +0 -65
- ads/opctl/model/cmds.py +0 -73
- ads/opctl/operator/README.md +0 -4
- ads/opctl/operator/__init__.py +0 -31
- ads/opctl/operator/cli.py +0 -344
- ads/opctl/operator/cmd.py +0 -596
- ads/opctl/operator/common/__init__.py +0 -5
- ads/opctl/operator/common/backend_factory.py +0 -460
- ads/opctl/operator/common/const.py +0 -27
- ads/opctl/operator/common/data/synthetic.csv +0 -16001
- ads/opctl/operator/common/dictionary_merger.py +0 -148
- ads/opctl/operator/common/errors.py +0 -42
- ads/opctl/operator/common/operator_config.py +0 -99
- ads/opctl/operator/common/operator_loader.py +0 -811
- ads/opctl/operator/common/operator_schema.yaml +0 -130
- ads/opctl/operator/common/operator_yaml_generator.py +0 -152
- ads/opctl/operator/common/utils.py +0 -208
- ads/opctl/operator/lowcode/__init__.py +0 -5
- ads/opctl/operator/lowcode/anomaly/MLoperator +0 -16
- ads/opctl/operator/lowcode/anomaly/README.md +0 -207
- ads/opctl/operator/lowcode/anomaly/__init__.py +0 -5
- ads/opctl/operator/lowcode/anomaly/__main__.py +0 -103
- ads/opctl/operator/lowcode/anomaly/cmd.py +0 -35
- ads/opctl/operator/lowcode/anomaly/const.py +0 -167
- ads/opctl/operator/lowcode/anomaly/environment.yaml +0 -10
- ads/opctl/operator/lowcode/anomaly/model/__init__.py +0 -5
- ads/opctl/operator/lowcode/anomaly/model/anomaly_dataset.py +0 -146
- ads/opctl/operator/lowcode/anomaly/model/anomaly_merlion.py +0 -162
- ads/opctl/operator/lowcode/anomaly/model/automlx.py +0 -99
- ads/opctl/operator/lowcode/anomaly/model/autots.py +0 -115
- ads/opctl/operator/lowcode/anomaly/model/base_model.py +0 -404
- ads/opctl/operator/lowcode/anomaly/model/factory.py +0 -110
- ads/opctl/operator/lowcode/anomaly/model/isolationforest.py +0 -78
- ads/opctl/operator/lowcode/anomaly/model/oneclasssvm.py +0 -78
- ads/opctl/operator/lowcode/anomaly/model/randomcutforest.py +0 -120
- ads/opctl/operator/lowcode/anomaly/model/tods.py +0 -119
- ads/opctl/operator/lowcode/anomaly/operator_config.py +0 -127
- ads/opctl/operator/lowcode/anomaly/schema.yaml +0 -401
- ads/opctl/operator/lowcode/anomaly/utils.py +0 -88
- ads/opctl/operator/lowcode/common/__init__.py +0 -5
- ads/opctl/operator/lowcode/common/const.py +0 -10
- ads/opctl/operator/lowcode/common/data.py +0 -116
- ads/opctl/operator/lowcode/common/errors.py +0 -47
- ads/opctl/operator/lowcode/common/transformations.py +0 -296
- ads/opctl/operator/lowcode/common/utils.py +0 -293
- ads/opctl/operator/lowcode/feature_store_marketplace/MLoperator +0 -13
- ads/opctl/operator/lowcode/feature_store_marketplace/README.md +0 -30
- ads/opctl/operator/lowcode/feature_store_marketplace/__init__.py +0 -5
- ads/opctl/operator/lowcode/feature_store_marketplace/__main__.py +0 -116
- ads/opctl/operator/lowcode/feature_store_marketplace/cmd.py +0 -85
- ads/opctl/operator/lowcode/feature_store_marketplace/const.py +0 -15
- ads/opctl/operator/lowcode/feature_store_marketplace/environment.yaml +0 -0
- ads/opctl/operator/lowcode/feature_store_marketplace/models/__init__.py +0 -4
- ads/opctl/operator/lowcode/feature_store_marketplace/models/apigw_config.py +0 -32
- ads/opctl/operator/lowcode/feature_store_marketplace/models/db_config.py +0 -43
- ads/opctl/operator/lowcode/feature_store_marketplace/models/mysql_config.py +0 -120
- ads/opctl/operator/lowcode/feature_store_marketplace/models/serializable_yaml_model.py +0 -34
- ads/opctl/operator/lowcode/feature_store_marketplace/operator_utils.py +0 -386
- ads/opctl/operator/lowcode/feature_store_marketplace/schema.yaml +0 -160
- ads/opctl/operator/lowcode/forecast/MLoperator +0 -25
- ads/opctl/operator/lowcode/forecast/README.md +0 -209
- ads/opctl/operator/lowcode/forecast/__init__.py +0 -5
- ads/opctl/operator/lowcode/forecast/__main__.py +0 -89
- ads/opctl/operator/lowcode/forecast/cmd.py +0 -40
- ads/opctl/operator/lowcode/forecast/const.py +0 -92
- ads/opctl/operator/lowcode/forecast/environment.yaml +0 -20
- ads/opctl/operator/lowcode/forecast/errors.py +0 -26
- ads/opctl/operator/lowcode/forecast/model/__init__.py +0 -5
- ads/opctl/operator/lowcode/forecast/model/arima.py +0 -279
- ads/opctl/operator/lowcode/forecast/model/automlx.py +0 -542
- ads/opctl/operator/lowcode/forecast/model/autots.py +0 -312
- ads/opctl/operator/lowcode/forecast/model/base_model.py +0 -863
- ads/opctl/operator/lowcode/forecast/model/factory.py +0 -106
- ads/opctl/operator/lowcode/forecast/model/forecast_datasets.py +0 -492
- ads/opctl/operator/lowcode/forecast/model/ml_forecast.py +0 -243
- ads/opctl/operator/lowcode/forecast/model/neuralprophet.py +0 -486
- ads/opctl/operator/lowcode/forecast/model/prophet.py +0 -445
- ads/opctl/operator/lowcode/forecast/model_evaluator.py +0 -244
- ads/opctl/operator/lowcode/forecast/operator_config.py +0 -234
- ads/opctl/operator/lowcode/forecast/schema.yaml +0 -506
- ads/opctl/operator/lowcode/forecast/utils.py +0 -413
- ads/opctl/operator/lowcode/forecast/whatifserve/__init__.py +0 -7
- ads/opctl/operator/lowcode/forecast/whatifserve/deployment_manager.py +0 -285
- ads/opctl/operator/lowcode/forecast/whatifserve/score.py +0 -246
- ads/opctl/operator/lowcode/pii/MLoperator +0 -17
- ads/opctl/operator/lowcode/pii/README.md +0 -208
- ads/opctl/operator/lowcode/pii/__init__.py +0 -5
- ads/opctl/operator/lowcode/pii/__main__.py +0 -78
- ads/opctl/operator/lowcode/pii/cmd.py +0 -39
- ads/opctl/operator/lowcode/pii/constant.py +0 -84
- ads/opctl/operator/lowcode/pii/environment.yaml +0 -17
- ads/opctl/operator/lowcode/pii/errors.py +0 -27
- ads/opctl/operator/lowcode/pii/model/__init__.py +0 -5
- ads/opctl/operator/lowcode/pii/model/factory.py +0 -82
- ads/opctl/operator/lowcode/pii/model/guardrails.py +0 -167
- ads/opctl/operator/lowcode/pii/model/pii.py +0 -145
- ads/opctl/operator/lowcode/pii/model/processor/__init__.py +0 -34
- ads/opctl/operator/lowcode/pii/model/processor/email_replacer.py +0 -34
- ads/opctl/operator/lowcode/pii/model/processor/mbi_replacer.py +0 -35
- ads/opctl/operator/lowcode/pii/model/processor/name_replacer.py +0 -225
- ads/opctl/operator/lowcode/pii/model/processor/number_replacer.py +0 -73
- ads/opctl/operator/lowcode/pii/model/processor/remover.py +0 -26
- ads/opctl/operator/lowcode/pii/model/report.py +0 -487
- ads/opctl/operator/lowcode/pii/operator_config.py +0 -95
- ads/opctl/operator/lowcode/pii/schema.yaml +0 -108
- ads/opctl/operator/lowcode/pii/utils.py +0 -43
- ads/opctl/operator/lowcode/recommender/MLoperator +0 -16
- ads/opctl/operator/lowcode/recommender/README.md +0 -206
- ads/opctl/operator/lowcode/recommender/__init__.py +0 -5
- ads/opctl/operator/lowcode/recommender/__main__.py +0 -82
- ads/opctl/operator/lowcode/recommender/cmd.py +0 -33
- ads/opctl/operator/lowcode/recommender/constant.py +0 -30
- ads/opctl/operator/lowcode/recommender/environment.yaml +0 -11
- ads/opctl/operator/lowcode/recommender/model/base_model.py +0 -212
- ads/opctl/operator/lowcode/recommender/model/factory.py +0 -56
- ads/opctl/operator/lowcode/recommender/model/recommender_dataset.py +0 -25
- ads/opctl/operator/lowcode/recommender/model/svd.py +0 -106
- ads/opctl/operator/lowcode/recommender/operator_config.py +0 -81
- ads/opctl/operator/lowcode/recommender/schema.yaml +0 -265
- ads/opctl/operator/lowcode/recommender/utils.py +0 -13
- ads/opctl/operator/runtime/__init__.py +0 -5
- ads/opctl/operator/runtime/const.py +0 -17
- ads/opctl/operator/runtime/container_runtime_schema.yaml +0 -50
- ads/opctl/operator/runtime/marketplace_runtime.py +0 -50
- ads/opctl/operator/runtime/python_marketplace_runtime_schema.yaml +0 -21
- ads/opctl/operator/runtime/python_runtime_schema.yaml +0 -21
- ads/opctl/operator/runtime/runtime.py +0 -115
- ads/opctl/schema.yaml.yml +0 -36
- ads/opctl/script.py +0 -40
- ads/opctl/spark/__init__.py +0 -5
- ads/opctl/spark/cli.py +0 -43
- ads/opctl/spark/cmds.py +0 -147
- ads/opctl/templates/diagnostic_report_template.jinja2 +0 -102
- ads/opctl/utils.py +0 -344
- ads/oracledb/__init__.py +0 -5
- ads/oracledb/oracle_db.py +0 -346
- ads/pipeline/__init__.py +0 -39
- ads/pipeline/ads_pipeline.py +0 -2279
- ads/pipeline/ads_pipeline_run.py +0 -772
- ads/pipeline/ads_pipeline_step.py +0 -605
- ads/pipeline/builders/__init__.py +0 -5
- ads/pipeline/builders/infrastructure/__init__.py +0 -5
- ads/pipeline/builders/infrastructure/custom_script.py +0 -32
- ads/pipeline/cli.py +0 -119
- ads/pipeline/extension.py +0 -291
- ads/pipeline/schema/__init__.py +0 -5
- ads/pipeline/schema/cs_step_schema.json +0 -35
- ads/pipeline/schema/ml_step_schema.json +0 -31
- ads/pipeline/schema/pipeline_schema.json +0 -71
- ads/pipeline/visualizer/__init__.py +0 -5
- ads/pipeline/visualizer/base.py +0 -570
- ads/pipeline/visualizer/graph_renderer.py +0 -272
- ads/pipeline/visualizer/text_renderer.py +0 -84
- ads/secrets/__init__.py +0 -11
- ads/secrets/adb.py +0 -386
- ads/secrets/auth_token.py +0 -86
- ads/secrets/big_data_service.py +0 -365
- ads/secrets/mysqldb.py +0 -149
- ads/secrets/oracledb.py +0 -160
- ads/secrets/secrets.py +0 -407
- ads/telemetry/__init__.py +0 -7
- ads/telemetry/base.py +0 -69
- ads/telemetry/client.py +0 -125
- ads/telemetry/telemetry.py +0 -257
- ads/templates/dataflow_pyspark.jinja2 +0 -13
- ads/templates/dataflow_sparksql.jinja2 +0 -22
- ads/templates/func.jinja2 +0 -20
- ads/templates/schemas/openapi.json +0 -1740
- ads/templates/score-pkl.jinja2 +0 -173
- ads/templates/score.jinja2 +0 -322
- ads/templates/score_embedding_onnx.jinja2 +0 -202
- ads/templates/score_generic.jinja2 +0 -165
- ads/templates/score_huggingface_pipeline.jinja2 +0 -217
- ads/templates/score_lightgbm.jinja2 +0 -185
- ads/templates/score_onnx.jinja2 +0 -407
- ads/templates/score_onnx_new.jinja2 +0 -473
- ads/templates/score_oracle_automl.jinja2 +0 -185
- ads/templates/score_pyspark.jinja2 +0 -154
- ads/templates/score_pytorch.jinja2 +0 -219
- ads/templates/score_scikit-learn.jinja2 +0 -184
- ads/templates/score_tensorflow.jinja2 +0 -184
- ads/templates/score_xgboost.jinja2 +0 -178
- ads/text_dataset/__init__.py +0 -5
- ads/text_dataset/backends.py +0 -211
- ads/text_dataset/dataset.py +0 -445
- ads/text_dataset/extractor.py +0 -207
- ads/text_dataset/options.py +0 -53
- ads/text_dataset/udfs.py +0 -22
- ads/text_dataset/utils.py +0 -49
- ads/type_discovery/__init__.py +0 -9
- ads/type_discovery/abstract_detector.py +0 -21
- ads/type_discovery/constant_detector.py +0 -41
- ads/type_discovery/continuous_detector.py +0 -54
- ads/type_discovery/credit_card_detector.py +0 -99
- ads/type_discovery/datetime_detector.py +0 -92
- ads/type_discovery/discrete_detector.py +0 -118
- ads/type_discovery/document_detector.py +0 -146
- ads/type_discovery/ip_detector.py +0 -68
- ads/type_discovery/latlon_detector.py +0 -90
- ads/type_discovery/phone_number_detector.py +0 -63
- ads/type_discovery/type_discovery_driver.py +0 -87
- ads/type_discovery/typed_feature.py +0 -594
- ads/type_discovery/unknown_detector.py +0 -41
- ads/type_discovery/zipcode_detector.py +0 -48
- ads/vault/__init__.py +0 -7
- ads/vault/vault.py +0 -237
- oracle_ads-2.13.8.dist-info/RECORD +0 -858
- {oracle_ads-2.13.8.dist-info → oracle_ads-2.13.9rc0.dist-info}/licenses/LICENSE.txt +0 -0
@@ -1,18 +0,0 @@
|
|
1
|
-
#!/usr/bin/env python
|
2
|
-
# -*- coding: utf-8; -*-
|
3
|
-
|
4
|
-
# Copyright (c) 2023 Oracle and/or its affiliates.
|
5
|
-
# Licensed under the Universal Permissive License v 1.0 as shown at https://oss.oracle.com/licenses/upl/
|
6
|
-
|
7
|
-
|
8
|
-
class NotMaterializedError(ValueError):
|
9
|
-
"""
|
10
|
-
Exception raised when a resource is not materialized.
|
11
|
-
|
12
|
-
Attributes:
|
13
|
-
resource_name (str): The name of the resource that is not materialized.
|
14
|
-
"""
|
15
|
-
|
16
|
-
def __init__(self, resource_type: str, resource_name: str):
|
17
|
-
self.resource_name = resource_name
|
18
|
-
super().__init__(f"{resource_type} {resource_name} is not materialized.")
|
@@ -1,125 +0,0 @@
|
|
1
|
-
#!/usr/bin/env python
|
2
|
-
# -*- coding: utf-8; -*-
|
3
|
-
import copy
|
4
|
-
|
5
|
-
import ads
|
6
|
-
|
7
|
-
# Copyright (c) 2023 Oracle and/or its affiliates.
|
8
|
-
# Licensed under the Universal Permissive License v 1.0 as shown at https://oss.oracle.com/licenses/upl/
|
9
|
-
|
10
|
-
from ads.common.decorator.runtime_dependency import OptionalDependency
|
11
|
-
import os
|
12
|
-
from ads.common.oci_client import OCIClientFactory
|
13
|
-
|
14
|
-
try:
|
15
|
-
from delta import configure_spark_with_delta_pip
|
16
|
-
except ModuleNotFoundError:
|
17
|
-
raise ModuleNotFoundError(
|
18
|
-
f"The `pyspark` module was not found. Please run `pip install "
|
19
|
-
f"{OptionalDependency.SPARK}`."
|
20
|
-
)
|
21
|
-
except Exception as e:
|
22
|
-
raise
|
23
|
-
try:
|
24
|
-
from pyspark.sql import SparkSession
|
25
|
-
except ModuleNotFoundError:
|
26
|
-
raise ModuleNotFoundError(
|
27
|
-
f"The `pyspark` module was not found. Please run `pip install "
|
28
|
-
f"{OptionalDependency.SPARK}`."
|
29
|
-
)
|
30
|
-
except Exception as e:
|
31
|
-
raise
|
32
|
-
|
33
|
-
|
34
|
-
def get_env_bool(env_var: str, default: bool = False) -> bool:
|
35
|
-
"""
|
36
|
-
:param env_var: Environment variable name
|
37
|
-
:param default: Default environment variable value
|
38
|
-
:return: Value of the boolean env variable
|
39
|
-
"""
|
40
|
-
env_val = os.getenv(env_var)
|
41
|
-
if env_val is None:
|
42
|
-
env_val = default
|
43
|
-
else:
|
44
|
-
env_val = env_val.lower()
|
45
|
-
if env_val == "true":
|
46
|
-
env_val = True
|
47
|
-
elif env_val == "false":
|
48
|
-
env_val = False
|
49
|
-
else:
|
50
|
-
raise ValueError(
|
51
|
-
"For environment variable: {0} only string values T/true or F/false are allowed but: \
|
52
|
-
{1} was provided.".format(
|
53
|
-
env_var, env_val
|
54
|
-
)
|
55
|
-
)
|
56
|
-
return env_val
|
57
|
-
|
58
|
-
|
59
|
-
def developer_enabled():
|
60
|
-
return get_env_bool("DEVELOPER_MODE", False)
|
61
|
-
|
62
|
-
|
63
|
-
class SingletonMeta(type):
|
64
|
-
_instances = {}
|
65
|
-
|
66
|
-
def __call__(cls, *args, **kwargs):
|
67
|
-
if cls not in cls._instances:
|
68
|
-
cls._instances[cls] = super().__call__(*args, **kwargs)
|
69
|
-
return cls._instances[cls]
|
70
|
-
|
71
|
-
|
72
|
-
class SparkSessionSingleton(metaclass=SingletonMeta):
|
73
|
-
"""Class provides the spark session."""
|
74
|
-
|
75
|
-
def __init__(self, metastore_id: str = None):
|
76
|
-
"""Virtually private constructor."""
|
77
|
-
|
78
|
-
spark_builder = (
|
79
|
-
SparkSession.builder.appName("FeatureStore")
|
80
|
-
.config("spark.sql.extensions", "io.delta.sql.DeltaSparkSessionExtension")
|
81
|
-
.config(
|
82
|
-
"spark.sql.catalog.spark_catalog",
|
83
|
-
"org.apache.spark.sql.delta.catalog.DeltaCatalog",
|
84
|
-
)
|
85
|
-
.enableHiveSupport()
|
86
|
-
)
|
87
|
-
_managed_table_location = None
|
88
|
-
|
89
|
-
if not developer_enabled() and metastore_id:
|
90
|
-
# Get the authentication credentials for the OCI data catalog service
|
91
|
-
auth = copy.copy(ads.auth.default_signer())
|
92
|
-
|
93
|
-
# Remove the "client_kwargs" key from the authentication credentials (if present)
|
94
|
-
auth.pop("client_kwargs", None)
|
95
|
-
|
96
|
-
data_catalog_client = OCIClientFactory(**auth).data_catalog
|
97
|
-
metastore = data_catalog_client.get_metastore(metastore_id).data
|
98
|
-
_managed_table_location = metastore.default_managed_table_location
|
99
|
-
# Configure the Spark session builder object to use the specified metastore
|
100
|
-
spark_builder.config(
|
101
|
-
"spark.hadoop.oracle.dcat.metastore.id", metastore_id
|
102
|
-
).config("spark.sql.warehouse.dir", _managed_table_location).config(
|
103
|
-
"spark.driver.memory", "16G"
|
104
|
-
)
|
105
|
-
|
106
|
-
if developer_enabled():
|
107
|
-
# Configure spark session with delta jars only in developer mode. In other cases,
|
108
|
-
# jars should be part of the conda pack
|
109
|
-
self.spark_session = configure_spark_with_delta_pip(
|
110
|
-
spark_builder
|
111
|
-
).getOrCreate()
|
112
|
-
else:
|
113
|
-
self.spark_session = spark_builder.getOrCreate()
|
114
|
-
|
115
|
-
self.spark_session.conf.set("spark.sql.execution.arrow.pyspark.enabled", "true")
|
116
|
-
self.spark_session.sparkContext.setLogLevel("OFF")
|
117
|
-
self.managed_table_location = _managed_table_location
|
118
|
-
|
119
|
-
def get_spark_session(self):
|
120
|
-
"""Access method to get the spark session."""
|
121
|
-
return self.spark_session
|
122
|
-
|
123
|
-
def get_managed_table_location(self):
|
124
|
-
"""Returns the managed table location for the spark"""
|
125
|
-
return self.managed_table_location
|
File without changes
|
@@ -1,72 +0,0 @@
|
|
1
|
-
#!/usr/bin/env python
|
2
|
-
# -*- coding: utf-8; -*-
|
3
|
-
|
4
|
-
# Copyright (c) 2023 Oracle and/or its affiliates.
|
5
|
-
# Licensed under the Universal Permissive License v 1.0 as shown at https://oss.oracle.com/licenses/upl/
|
6
|
-
|
7
|
-
import base64
|
8
|
-
|
9
|
-
|
10
|
-
class Base64EncoderDecoder:
|
11
|
-
"""
|
12
|
-
A utility class for encoding and decoding data in Base64 format.
|
13
|
-
|
14
|
-
Usage:
|
15
|
-
To encode a string:
|
16
|
-
```
|
17
|
-
encoded_data = Base64EncoderDecoder.encode("Hello, World!")
|
18
|
-
```
|
19
|
-
|
20
|
-
To decode an encoded string:
|
21
|
-
```
|
22
|
-
decoded_data = Base64EncoderDecoder.decode(encoded_data)
|
23
|
-
```
|
24
|
-
|
25
|
-
Attributes:
|
26
|
-
-----------
|
27
|
-
None
|
28
|
-
|
29
|
-
Methods:
|
30
|
-
--------
|
31
|
-
encode(raw_data: str) -> str:
|
32
|
-
Encodes the provided raw data into Base64 format and returns the encoded data as a string.
|
33
|
-
|
34
|
-
decode(encoded_data: str) -> str:
|
35
|
-
Decodes the provided Base64 data into its original format and returns the decoded data as a string.
|
36
|
-
"""
|
37
|
-
|
38
|
-
@classmethod
|
39
|
-
def encode(cls, raw_data: str) -> str:
|
40
|
-
"""Encodes raw data into Base64 format.
|
41
|
-
|
42
|
-
Parameters:
|
43
|
-
----------
|
44
|
-
raw_data: str
|
45
|
-
The raw data that needs to be encoded.
|
46
|
-
|
47
|
-
Returns:
|
48
|
-
-------
|
49
|
-
str:
|
50
|
-
Base64-encoded data as a string.
|
51
|
-
"""
|
52
|
-
byte_code = raw_data.encode("ascii")
|
53
|
-
base64_bytes = base64.b64encode(byte_code)
|
54
|
-
return base64_bytes.decode("ascii")
|
55
|
-
|
56
|
-
@classmethod
|
57
|
-
def decode(cls, encoded_data: str) -> str:
|
58
|
-
"""Decodes Base64 data into its original format.
|
59
|
-
|
60
|
-
Parameters:
|
61
|
-
----------
|
62
|
-
encoded_data: str
|
63
|
-
The Base64-encoded data that needs to be decoded.
|
64
|
-
|
65
|
-
Returns:
|
66
|
-
-------
|
67
|
-
str:
|
68
|
-
Decoded data as a string.
|
69
|
-
"""
|
70
|
-
base64_bytes = encoded_data.encode("ascii")
|
71
|
-
message_bytes = base64.b64decode(base64_bytes)
|
72
|
-
return message_bytes.decode("ascii")
|
@@ -1,283 +0,0 @@
|
|
1
|
-
#!/usr/bin/env python
|
2
|
-
# -*- coding: utf-8; -*-
|
3
|
-
|
4
|
-
# Copyright (c) 2023 Oracle and/or its affiliates.
|
5
|
-
# Licensed under the Universal Permissive License v 1.0 as shown at https://oss.oracle.com/licenses/upl/
|
6
|
-
|
7
|
-
import logging
|
8
|
-
from typing import List
|
9
|
-
|
10
|
-
import numpy as np
|
11
|
-
import pandas as pd
|
12
|
-
|
13
|
-
from ads.common.decorator.runtime_dependency import OptionalDependency
|
14
|
-
from mlm_insights.constants import types
|
15
|
-
|
16
|
-
from ads.feature_store.common.enums import FeatureType
|
17
|
-
|
18
|
-
try:
|
19
|
-
from pyspark.sql.types import *
|
20
|
-
except ModuleNotFoundError:
|
21
|
-
raise ModuleNotFoundError(
|
22
|
-
f"The `pyspark` module was not found. Please run `pip install "
|
23
|
-
f"{OptionalDependency.SPARK}`."
|
24
|
-
)
|
25
|
-
except Exception as e:
|
26
|
-
raise
|
27
|
-
|
28
|
-
logger = logging.getLogger(__name__)
|
29
|
-
|
30
|
-
|
31
|
-
def map_spark_type_to_feature_type(spark_type):
|
32
|
-
"""Returns the feature type corresponding to SparkType
|
33
|
-
:param spark_type:
|
34
|
-
:return:
|
35
|
-
"""
|
36
|
-
spark_type_to_feature_type = {
|
37
|
-
StringType(): FeatureType.STRING,
|
38
|
-
IntegerType(): FeatureType.INTEGER,
|
39
|
-
ShortType(): FeatureType.SHORT,
|
40
|
-
LongType(): FeatureType.LONG,
|
41
|
-
FloatType(): FeatureType.FLOAT,
|
42
|
-
DoubleType(): FeatureType.DOUBLE,
|
43
|
-
BooleanType(): FeatureType.BOOLEAN,
|
44
|
-
DateType(): FeatureType.DATE,
|
45
|
-
TimestampType(): FeatureType.TIMESTAMP,
|
46
|
-
BinaryType(): FeatureType.BINARY,
|
47
|
-
ByteType(): FeatureType.BYTE,
|
48
|
-
ArrayType(StringType()): FeatureType.STRING_ARRAY,
|
49
|
-
ArrayType(IntegerType()): FeatureType.INTEGER_ARRAY,
|
50
|
-
ArrayType(LongType()): FeatureType.LONG_ARRAY,
|
51
|
-
ArrayType(FloatType()): FeatureType.FLOAT_ARRAY,
|
52
|
-
ArrayType(DoubleType()): FeatureType.DOUBLE_ARRAY,
|
53
|
-
ArrayType(BinaryType()): FeatureType.BINARY_ARRAY,
|
54
|
-
ArrayType(DateType()): FeatureType.DATE_ARRAY,
|
55
|
-
ArrayType(TimestampType()): FeatureType.TIMESTAMP_ARRAY,
|
56
|
-
ArrayType(ByteType()): FeatureType.BYTE_ARRAY,
|
57
|
-
ArrayType(BooleanType()): FeatureType.BOOLEAN_ARRAY,
|
58
|
-
ArrayType(ShortType()): FeatureType.SHORT_ARRAY,
|
59
|
-
MapType(StringType(), StringType()): FeatureType.STRING_STRING_MAP,
|
60
|
-
MapType(StringType(), IntegerType()): FeatureType.STRING_INTEGER_MAP,
|
61
|
-
MapType(StringType(), ShortType()): FeatureType.STRING_SHORT_MAP,
|
62
|
-
MapType(StringType(), LongType()): FeatureType.STRING_LONG_MAP,
|
63
|
-
MapType(StringType(), FloatType()): FeatureType.STRING_FLOAT_MAP,
|
64
|
-
MapType(StringType(), DoubleType()): FeatureType.STRING_DOUBLE_MAP,
|
65
|
-
MapType(StringType(), TimestampType()): FeatureType.STRING_TIMESTAMP_MAP,
|
66
|
-
MapType(StringType(), DateType()): FeatureType.STRING_DATE_MAP,
|
67
|
-
MapType(StringType(), BinaryType()): FeatureType.STRING_BINARY_MAP,
|
68
|
-
MapType(StringType(), ByteType()): FeatureType.STRING_BYTE_MAP,
|
69
|
-
MapType(StringType(), BooleanType()): FeatureType.STRING_BOOLEAN_MAP,
|
70
|
-
}
|
71
|
-
if spark_type in spark_type_to_feature_type:
|
72
|
-
return spark_type_to_feature_type.get(spark_type)
|
73
|
-
else:
|
74
|
-
return FeatureType.COMPLEX
|
75
|
-
|
76
|
-
|
77
|
-
def map_pandas_type_to_feature_type(feature_name, values):
|
78
|
-
pandas_type = str(values.dtype)
|
79
|
-
inferred_dtype = FeatureType.UNKNOWN
|
80
|
-
if pandas_type is "object":
|
81
|
-
for row in values:
|
82
|
-
if isinstance(row, (list, np.ndarray)):
|
83
|
-
raise TypeError(f"object of type {type(row)} not supported")
|
84
|
-
pandas_basic_type = type(row).__name__
|
85
|
-
current_dtype = map_pandas_basic_type_to_feature_type(pandas_basic_type)
|
86
|
-
if inferred_dtype is FeatureType.UNKNOWN:
|
87
|
-
inferred_dtype = current_dtype
|
88
|
-
else:
|
89
|
-
if (
|
90
|
-
current_dtype != inferred_dtype
|
91
|
-
and current_dtype is not FeatureType.UNKNOWN
|
92
|
-
):
|
93
|
-
raise TypeError(
|
94
|
-
f"Input feature '{feature_name}' has mixed types, {current_dtype} and {inferred_dtype}. "
|
95
|
-
f"That is not allowed. "
|
96
|
-
)
|
97
|
-
else:
|
98
|
-
inferred_dtype = map_pandas_basic_type_to_feature_type(pandas_type)
|
99
|
-
if inferred_dtype is FeatureType.UNKNOWN:
|
100
|
-
raise TypeError(
|
101
|
-
f"Input feature '{feature_name}' has type {str(pandas_type)} which is not supported"
|
102
|
-
)
|
103
|
-
else:
|
104
|
-
return inferred_dtype
|
105
|
-
|
106
|
-
|
107
|
-
def map_pandas_basic_type_to_feature_type(pandas_type):
|
108
|
-
"""Returns the feature type corresponding to pandas_type
|
109
|
-
:param pandas_type:
|
110
|
-
:return:
|
111
|
-
"""
|
112
|
-
# TODO uint64 with bigger number cant be mapped to LongType
|
113
|
-
pandas_type_to_feature_type = {
|
114
|
-
"str": FeatureType.STRING,
|
115
|
-
"string": FeatureType.STRING,
|
116
|
-
"int": FeatureType.INTEGER,
|
117
|
-
"int8": FeatureType.INTEGER,
|
118
|
-
"int16": FeatureType.INTEGER,
|
119
|
-
"int32": FeatureType.LONG,
|
120
|
-
"int64": FeatureType.LONG,
|
121
|
-
"uint8": FeatureType.INTEGER,
|
122
|
-
"uint16": FeatureType.INTEGER,
|
123
|
-
"uint32": FeatureType.LONG,
|
124
|
-
"uint64": FeatureType.LONG,
|
125
|
-
"float": FeatureType.FLOAT,
|
126
|
-
"float16": FeatureType.FLOAT,
|
127
|
-
"float32": FeatureType.DOUBLE,
|
128
|
-
"float64": FeatureType.DOUBLE,
|
129
|
-
"datetime64[ns]": FeatureType.TIMESTAMP,
|
130
|
-
"datetime64[ns, UTC]": FeatureType.TIMESTAMP,
|
131
|
-
"timedelta64[ns]": FeatureType.LONG,
|
132
|
-
"bool": FeatureType.BOOLEAN,
|
133
|
-
"Decimal": FeatureType.DECIMAL,
|
134
|
-
"date": FeatureType.DATE,
|
135
|
-
}
|
136
|
-
if pandas_type in pandas_type_to_feature_type:
|
137
|
-
return pandas_type_to_feature_type.get(pandas_type)
|
138
|
-
return FeatureType.UNKNOWN
|
139
|
-
|
140
|
-
|
141
|
-
def map_feature_type_to_spark_type(feature_type):
|
142
|
-
"""Returns the Spark Type for a particular feature type.
|
143
|
-
:param feature_type:
|
144
|
-
:return: Spark Type
|
145
|
-
"""
|
146
|
-
feature_type_in = FeatureType(feature_type)
|
147
|
-
spark_types = {
|
148
|
-
FeatureType.STRING: StringType(),
|
149
|
-
FeatureType.SHORT: ShortType(),
|
150
|
-
FeatureType.INTEGER: IntegerType(),
|
151
|
-
FeatureType.LONG: LongType(),
|
152
|
-
FeatureType.FLOAT: FloatType(),
|
153
|
-
FeatureType.DOUBLE: DoubleType(),
|
154
|
-
FeatureType.BOOLEAN: BooleanType(),
|
155
|
-
FeatureType.DATE: DateType(),
|
156
|
-
FeatureType.TIMESTAMP: TimestampType(),
|
157
|
-
FeatureType.DECIMAL: DecimalType(),
|
158
|
-
FeatureType.BINARY: BinaryType(),
|
159
|
-
FeatureType.STRING_ARRAY: ArrayType(StringType()),
|
160
|
-
FeatureType.INTEGER_ARRAY: ArrayType(IntegerType()),
|
161
|
-
FeatureType.SHORT_ARRAY: ArrayType(ShortType()),
|
162
|
-
FeatureType.LONG_ARRAY: ArrayType(LongType()),
|
163
|
-
FeatureType.FLOAT_ARRAY: ArrayType(FloatType()),
|
164
|
-
FeatureType.DOUBLE_ARRAY: ArrayType(DoubleType()),
|
165
|
-
FeatureType.BINARY_ARRAY: ArrayType(BinaryType()),
|
166
|
-
FeatureType.DATE_ARRAY: ArrayType(DateType()),
|
167
|
-
FeatureType.BOOLEAN_ARRAY: ArrayType(BooleanType()),
|
168
|
-
FeatureType.TIMESTAMP_ARRAY: ArrayType(TimestampType()),
|
169
|
-
FeatureType.STRING_STRING_MAP: MapType(StringType(), StringType()),
|
170
|
-
FeatureType.STRING_INTEGER_MAP: MapType(StringType(), IntegerType()),
|
171
|
-
FeatureType.STRING_SHORT_MAP: MapType(StringType(), ShortType()),
|
172
|
-
FeatureType.STRING_LONG_MAP: MapType(StringType(), LongType()),
|
173
|
-
FeatureType.STRING_FLOAT_MAP: MapType(StringType(), FloatType()),
|
174
|
-
FeatureType.STRING_DOUBLE_MAP: MapType(StringType(), DoubleType()),
|
175
|
-
FeatureType.STRING_DATE_MAP: MapType(StringType(), DateType()),
|
176
|
-
FeatureType.STRING_TIMESTAMP_MAP: MapType(StringType(), TimestampType()),
|
177
|
-
FeatureType.STRING_BOOLEAN_MAP: MapType(StringType(), BooleanType()),
|
178
|
-
FeatureType.BYTE: ByteType(),
|
179
|
-
}
|
180
|
-
if feature_type_in in spark_types:
|
181
|
-
return spark_types.get(feature_type_in)
|
182
|
-
else:
|
183
|
-
return "COMPLEX"
|
184
|
-
|
185
|
-
|
186
|
-
def get_raw_data_source_schema(raw_feature_details: List[dict]):
|
187
|
-
"""Converts input feature details to Spark schema.
|
188
|
-
|
189
|
-
Args:
|
190
|
-
raw_feature_details(List[dict]): List of input feature details.
|
191
|
-
|
192
|
-
Returns:
|
193
|
-
StructType: Spark schema.
|
194
|
-
:param raw_feature_details:
|
195
|
-
"""
|
196
|
-
# Initialize the schema
|
197
|
-
features_schema = StructType()
|
198
|
-
|
199
|
-
for feature_details in raw_feature_details:
|
200
|
-
# Get the name, feature_type and is_nullable
|
201
|
-
feature_name = feature_details.get("name")
|
202
|
-
feature_type = map_feature_type_to_spark_type(
|
203
|
-
feature_details.get("featureType")
|
204
|
-
)
|
205
|
-
is_nullable = (
|
206
|
-
True
|
207
|
-
if feature_details.get("isNullable") is None
|
208
|
-
else feature_details.get("isNullable")
|
209
|
-
)
|
210
|
-
|
211
|
-
features_schema.add(feature_name, feature_type, is_nullable)
|
212
|
-
|
213
|
-
return features_schema
|
214
|
-
|
215
|
-
|
216
|
-
def map_feature_type_to_pandas(feature_type):
|
217
|
-
feature_type_in = FeatureType(feature_type)
|
218
|
-
supported_feature_type = {
|
219
|
-
FeatureType.STRING: str,
|
220
|
-
FeatureType.LONG: "int64",
|
221
|
-
FeatureType.DOUBLE: "float64",
|
222
|
-
FeatureType.TIMESTAMP: "datetime64[ns]",
|
223
|
-
FeatureType.BOOLEAN: "bool",
|
224
|
-
FeatureType.FLOAT: "float32",
|
225
|
-
FeatureType.INTEGER: "int32",
|
226
|
-
FeatureType.DECIMAL: "object",
|
227
|
-
FeatureType.DATE: "object",
|
228
|
-
FeatureType.STRING_ARRAY: "object",
|
229
|
-
FeatureType.INTEGER_ARRAY: "object",
|
230
|
-
FeatureType.LONG_ARRAY: "object",
|
231
|
-
FeatureType.FLOAT_ARRAY: "object",
|
232
|
-
FeatureType.DOUBLE_ARRAY: "object",
|
233
|
-
FeatureType.TIMESTAMP_ARRAY: "object",
|
234
|
-
FeatureType.BOOLEAN_ARRAY: "object",
|
235
|
-
# FeatureType.DECIMAL_ARRAY: "object",
|
236
|
-
FeatureType.DATE_ARRAY: "object",
|
237
|
-
}
|
238
|
-
if feature_type_in in supported_feature_type:
|
239
|
-
return supported_feature_type.get(feature_type_in)
|
240
|
-
else:
|
241
|
-
raise TypeError(f"Feature Type {feature_type} is not supported for pandas")
|
242
|
-
|
243
|
-
|
244
|
-
def map_spark_type_to_stats_data_type(spark_type):
|
245
|
-
"""Maps the spark data types to MLM library data types
|
246
|
-
args:
|
247
|
-
param spark_type: Spark data type input from the feature dataframe on which we need stats
|
248
|
-
:return:
|
249
|
-
Returns the MLM data type corresponding to SparkType
|
250
|
-
"""
|
251
|
-
spark_type_to_mlm_data_type = {
|
252
|
-
StringType(): types.DataType.STRING,
|
253
|
-
IntegerType(): types.DataType.INTEGER,
|
254
|
-
FloatType(): types.DataType.FLOAT,
|
255
|
-
DoubleType(): types.DataType.FLOAT,
|
256
|
-
BooleanType(): types.DataType.BOOLEAN,
|
257
|
-
DecimalType(): types.DataType.FLOAT,
|
258
|
-
ShortType(): types.DataType.INTEGER,
|
259
|
-
LongType(): types.DataType.INTEGER,
|
260
|
-
}
|
261
|
-
|
262
|
-
return spark_type_to_mlm_data_type.get(spark_type)
|
263
|
-
|
264
|
-
|
265
|
-
def map_spark_type_to_stats_variable_type(spark_type):
|
266
|
-
"""Maps the spark data types to MLM library variable types
|
267
|
-
args:
|
268
|
-
param spark_type: Spark data type input from the feature dataframe on which we need stats
|
269
|
-
:return:
|
270
|
-
Returns the MLM variable type corresponding to SparkType
|
271
|
-
"""
|
272
|
-
spark_type_to_feature_type = {
|
273
|
-
StringType(): types.VariableType.NOMINAL,
|
274
|
-
IntegerType(): types.VariableType.CONTINUOUS,
|
275
|
-
FloatType(): types.VariableType.CONTINUOUS,
|
276
|
-
DoubleType(): types.VariableType.CONTINUOUS,
|
277
|
-
BooleanType(): types.VariableType.BINARY,
|
278
|
-
DecimalType(): types.VariableType.CONTINUOUS,
|
279
|
-
ShortType(): types.VariableType.CONTINUOUS,
|
280
|
-
LongType(): types.VariableType.CONTINUOUS,
|
281
|
-
}
|
282
|
-
|
283
|
-
return spark_type_to_feature_type.get(spark_type)
|
@@ -1,82 +0,0 @@
|
|
1
|
-
#!/usr/bin/env python
|
2
|
-
# -*- coding: utf-8; -*-
|
3
|
-
|
4
|
-
# Copyright (c) 2024 Oracle and/or its affiliates.
|
5
|
-
# Licensed under the Universal Permissive License v 1.0 as shown at https://oss.oracle.com/licenses/upl/
|
6
|
-
|
7
|
-
import json
|
8
|
-
|
9
|
-
# Copyright (c) 2023 Oracle and/or its affiliates.
|
10
|
-
# Licensed under the Universal Permissive License v 1.0 as shown at https://oss.oracle.com/licenses/upl/
|
11
|
-
|
12
|
-
from typing import Union
|
13
|
-
|
14
|
-
from ads.common.decorator.runtime_dependency import OptionalDependency
|
15
|
-
from ads.feature_store.common.utils.base64_encoder_decoder import Base64EncoderDecoder
|
16
|
-
from ads.feature_store.transformation import Transformation, TransformationMode
|
17
|
-
import pandas as pd
|
18
|
-
|
19
|
-
try:
|
20
|
-
from pyspark.sql import SparkSession, DataFrame
|
21
|
-
except ModuleNotFoundError:
|
22
|
-
raise ModuleNotFoundError(
|
23
|
-
f"The `pyspark` module was not found. Please run `pip install "
|
24
|
-
f"{OptionalDependency.SPARK}`."
|
25
|
-
)
|
26
|
-
except Exception as e:
|
27
|
-
raise
|
28
|
-
|
29
|
-
|
30
|
-
class TransformationUtils:
|
31
|
-
@staticmethod
|
32
|
-
def apply_transformation(
|
33
|
-
spark: SparkSession,
|
34
|
-
dataframe: Union[DataFrame, pd.DataFrame],
|
35
|
-
transformation: Transformation,
|
36
|
-
transformation_kwargs: str,
|
37
|
-
):
|
38
|
-
"""
|
39
|
-
Perform data transformation using either SQL or Pandas, depending on the specified transformation mode.
|
40
|
-
|
41
|
-
Args:
|
42
|
-
spark: A SparkSession object.
|
43
|
-
transformation (Transformation): A transformation object containing details of transformation to be performed.
|
44
|
-
dataframe (DataFrame): The input dataframe to be transformed.
|
45
|
-
transformation_kwargs(str): The transformation parameters as json string.
|
46
|
-
|
47
|
-
Returns:
|
48
|
-
DataFrame: The resulting transformed data.
|
49
|
-
"""
|
50
|
-
|
51
|
-
# Fetch the transformation function
|
52
|
-
transformation_function = Base64EncoderDecoder.decode(
|
53
|
-
transformation.source_code_function
|
54
|
-
)
|
55
|
-
|
56
|
-
# Execute the function under namespace
|
57
|
-
execution_namespace = {}
|
58
|
-
exec(transformation_function, execution_namespace)
|
59
|
-
transformation_function_caller = execution_namespace.get(transformation.name)
|
60
|
-
transformed_data = None
|
61
|
-
|
62
|
-
transformation_kwargs_dict = json.loads(transformation_kwargs)
|
63
|
-
|
64
|
-
if transformation.transformation_mode == TransformationMode.SQL.value:
|
65
|
-
# Register the temporary table
|
66
|
-
temporary_table_view = "df_view"
|
67
|
-
dataframe.createOrReplaceTempView(temporary_table_view)
|
68
|
-
|
69
|
-
transformed_data = spark.sql(
|
70
|
-
transformation_function_caller(
|
71
|
-
temporary_table_view, **transformation_kwargs_dict
|
72
|
-
)
|
73
|
-
)
|
74
|
-
elif transformation.transformation_mode in [
|
75
|
-
TransformationMode.PANDAS.value,
|
76
|
-
TransformationMode.SPARK.value,
|
77
|
-
]:
|
78
|
-
transformed_data = transformation_function_caller(
|
79
|
-
dataframe, **transformation_kwargs_dict
|
80
|
-
)
|
81
|
-
|
82
|
-
return transformed_data
|