oracle-ads 2.13.8__py3-none-any.whl → 2.13.9rc0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {oracle_ads-2.13.8.dist-info → oracle_ads-2.13.9rc0.dist-info}/METADATA +151 -151
- oracle_ads-2.13.9rc0.dist-info/RECORD +9 -0
- {oracle_ads-2.13.8.dist-info → oracle_ads-2.13.9rc0.dist-info}/WHEEL +2 -1
- {oracle_ads-2.13.8.dist-info → oracle_ads-2.13.9rc0.dist-info}/entry_points.txt +1 -2
- oracle_ads-2.13.9rc0.dist-info/top_level.txt +1 -0
- ads/aqua/__init__.py +0 -40
- ads/aqua/app.py +0 -506
- ads/aqua/cli.py +0 -96
- ads/aqua/client/__init__.py +0 -3
- ads/aqua/client/client.py +0 -836
- ads/aqua/client/openai_client.py +0 -305
- ads/aqua/common/__init__.py +0 -5
- ads/aqua/common/decorator.py +0 -125
- ads/aqua/common/entities.py +0 -266
- ads/aqua/common/enums.py +0 -122
- ads/aqua/common/errors.py +0 -109
- ads/aqua/common/utils.py +0 -1285
- ads/aqua/config/__init__.py +0 -4
- ads/aqua/config/container_config.py +0 -248
- ads/aqua/config/evaluation/__init__.py +0 -4
- ads/aqua/config/evaluation/evaluation_service_config.py +0 -147
- ads/aqua/config/utils/__init__.py +0 -4
- ads/aqua/config/utils/serializer.py +0 -339
- ads/aqua/constants.py +0 -114
- ads/aqua/data.py +0 -14
- ads/aqua/dummy_data/icon.txt +0 -1
- ads/aqua/dummy_data/oci_model_deployments.json +0 -56
- ads/aqua/dummy_data/oci_models.json +0 -1
- ads/aqua/dummy_data/readme.md +0 -26
- ads/aqua/evaluation/__init__.py +0 -8
- ads/aqua/evaluation/constants.py +0 -53
- ads/aqua/evaluation/entities.py +0 -186
- ads/aqua/evaluation/errors.py +0 -70
- ads/aqua/evaluation/evaluation.py +0 -1814
- ads/aqua/extension/__init__.py +0 -42
- ads/aqua/extension/aqua_ws_msg_handler.py +0 -76
- ads/aqua/extension/base_handler.py +0 -90
- ads/aqua/extension/common_handler.py +0 -121
- ads/aqua/extension/common_ws_msg_handler.py +0 -36
- ads/aqua/extension/deployment_handler.py +0 -298
- ads/aqua/extension/deployment_ws_msg_handler.py +0 -54
- ads/aqua/extension/errors.py +0 -30
- ads/aqua/extension/evaluation_handler.py +0 -129
- ads/aqua/extension/evaluation_ws_msg_handler.py +0 -61
- ads/aqua/extension/finetune_handler.py +0 -96
- ads/aqua/extension/model_handler.py +0 -390
- ads/aqua/extension/models/__init__.py +0 -0
- ads/aqua/extension/models/ws_models.py +0 -145
- ads/aqua/extension/models_ws_msg_handler.py +0 -50
- ads/aqua/extension/ui_handler.py +0 -282
- ads/aqua/extension/ui_websocket_handler.py +0 -130
- ads/aqua/extension/utils.py +0 -133
- ads/aqua/finetuning/__init__.py +0 -7
- ads/aqua/finetuning/constants.py +0 -23
- ads/aqua/finetuning/entities.py +0 -181
- ads/aqua/finetuning/finetuning.py +0 -731
- ads/aqua/model/__init__.py +0 -8
- ads/aqua/model/constants.py +0 -60
- ads/aqua/model/entities.py +0 -306
- ads/aqua/model/enums.py +0 -30
- ads/aqua/model/model.py +0 -2080
- ads/aqua/modeldeployment/__init__.py +0 -8
- ads/aqua/modeldeployment/constants.py +0 -10
- ads/aqua/modeldeployment/deployment.py +0 -1324
- ads/aqua/modeldeployment/entities.py +0 -653
- ads/aqua/modeldeployment/inference.py +0 -74
- ads/aqua/modeldeployment/utils.py +0 -543
- ads/aqua/resources/gpu_shapes_index.json +0 -94
- ads/aqua/server/__init__.py +0 -4
- ads/aqua/server/__main__.py +0 -24
- ads/aqua/server/app.py +0 -47
- ads/aqua/server/aqua_spec.yml +0 -1291
- ads/aqua/training/__init__.py +0 -4
- ads/aqua/training/exceptions.py +0 -476
- ads/aqua/ui.py +0 -499
- ads/automl/__init__.py +0 -9
- ads/automl/driver.py +0 -330
- ads/automl/provider.py +0 -975
- ads/bds/__init__.py +0 -5
- ads/bds/auth.py +0 -127
- ads/bds/big_data_service.py +0 -255
- ads/catalog/__init__.py +0 -19
- ads/catalog/model.py +0 -1576
- ads/catalog/notebook.py +0 -461
- ads/catalog/project.py +0 -468
- ads/catalog/summary.py +0 -178
- ads/common/__init__.py +0 -11
- ads/common/analyzer.py +0 -65
- ads/common/artifact/.model-ignore +0 -63
- ads/common/artifact/__init__.py +0 -10
- ads/common/auth.py +0 -1122
- ads/common/card_identifier.py +0 -83
- ads/common/config.py +0 -647
- ads/common/data.py +0 -165
- ads/common/decorator/__init__.py +0 -9
- ads/common/decorator/argument_to_case.py +0 -88
- ads/common/decorator/deprecate.py +0 -69
- ads/common/decorator/require_nonempty_arg.py +0 -65
- ads/common/decorator/runtime_dependency.py +0 -178
- ads/common/decorator/threaded.py +0 -97
- ads/common/decorator/utils.py +0 -35
- ads/common/dsc_file_system.py +0 -303
- ads/common/error.py +0 -14
- ads/common/extended_enum.py +0 -81
- ads/common/function/__init__.py +0 -5
- ads/common/function/fn_util.py +0 -142
- ads/common/function/func_conf.yaml +0 -25
- ads/common/ipython.py +0 -76
- ads/common/model.py +0 -679
- ads/common/model_artifact.py +0 -1759
- ads/common/model_artifact_schema.json +0 -107
- ads/common/model_export_util.py +0 -664
- ads/common/model_metadata.py +0 -24
- ads/common/object_storage_details.py +0 -296
- ads/common/oci_client.py +0 -175
- ads/common/oci_datascience.py +0 -46
- ads/common/oci_logging.py +0 -1144
- ads/common/oci_mixin.py +0 -957
- ads/common/oci_resource.py +0 -136
- ads/common/serializer.py +0 -559
- ads/common/utils.py +0 -1852
- ads/common/word_lists.py +0 -1491
- ads/common/work_request.py +0 -189
- ads/data_labeling/__init__.py +0 -13
- ads/data_labeling/boundingbox.py +0 -253
- ads/data_labeling/constants.py +0 -47
- ads/data_labeling/data_labeling_service.py +0 -244
- ads/data_labeling/interface/__init__.py +0 -5
- ads/data_labeling/interface/loader.py +0 -16
- ads/data_labeling/interface/parser.py +0 -16
- ads/data_labeling/interface/reader.py +0 -23
- ads/data_labeling/loader/__init__.py +0 -5
- ads/data_labeling/loader/file_loader.py +0 -241
- ads/data_labeling/metadata.py +0 -110
- ads/data_labeling/mixin/__init__.py +0 -5
- ads/data_labeling/mixin/data_labeling.py +0 -232
- ads/data_labeling/ner.py +0 -129
- ads/data_labeling/parser/__init__.py +0 -5
- ads/data_labeling/parser/dls_record_parser.py +0 -388
- ads/data_labeling/parser/export_metadata_parser.py +0 -94
- ads/data_labeling/parser/export_record_parser.py +0 -473
- ads/data_labeling/reader/__init__.py +0 -5
- ads/data_labeling/reader/dataset_reader.py +0 -574
- ads/data_labeling/reader/dls_record_reader.py +0 -121
- ads/data_labeling/reader/export_record_reader.py +0 -62
- ads/data_labeling/reader/jsonl_reader.py +0 -75
- ads/data_labeling/reader/metadata_reader.py +0 -203
- ads/data_labeling/reader/record_reader.py +0 -263
- ads/data_labeling/record.py +0 -52
- ads/data_labeling/visualizer/__init__.py +0 -5
- ads/data_labeling/visualizer/image_visualizer.py +0 -525
- ads/data_labeling/visualizer/text_visualizer.py +0 -357
- ads/database/__init__.py +0 -5
- ads/database/connection.py +0 -338
- ads/dataset/__init__.py +0 -10
- ads/dataset/capabilities.md +0 -51
- ads/dataset/classification_dataset.py +0 -339
- ads/dataset/correlation.py +0 -226
- ads/dataset/correlation_plot.py +0 -563
- ads/dataset/dask_series.py +0 -173
- ads/dataset/dataframe_transformer.py +0 -110
- ads/dataset/dataset.py +0 -1979
- ads/dataset/dataset_browser.py +0 -360
- ads/dataset/dataset_with_target.py +0 -995
- ads/dataset/exception.py +0 -25
- ads/dataset/factory.py +0 -987
- ads/dataset/feature_engineering_transformer.py +0 -35
- ads/dataset/feature_selection.py +0 -107
- ads/dataset/forecasting_dataset.py +0 -26
- ads/dataset/helper.py +0 -1450
- ads/dataset/label_encoder.py +0 -99
- ads/dataset/mixin/__init__.py +0 -5
- ads/dataset/mixin/dataset_accessor.py +0 -134
- ads/dataset/pipeline.py +0 -58
- ads/dataset/plot.py +0 -710
- ads/dataset/progress.py +0 -86
- ads/dataset/recommendation.py +0 -297
- ads/dataset/recommendation_transformer.py +0 -502
- ads/dataset/regression_dataset.py +0 -14
- ads/dataset/sampled_dataset.py +0 -1050
- ads/dataset/target.py +0 -98
- ads/dataset/timeseries.py +0 -18
- ads/dbmixin/__init__.py +0 -5
- ads/dbmixin/db_pandas_accessor.py +0 -153
- ads/environment/__init__.py +0 -9
- ads/environment/ml_runtime.py +0 -66
- ads/evaluations/README.md +0 -14
- ads/evaluations/__init__.py +0 -109
- ads/evaluations/evaluation_plot.py +0 -983
- ads/evaluations/evaluator.py +0 -1334
- ads/evaluations/statistical_metrics.py +0 -543
- ads/experiments/__init__.py +0 -9
- ads/experiments/capabilities.md +0 -0
- ads/explanations/__init__.py +0 -21
- ads/explanations/base_explainer.py +0 -142
- ads/explanations/capabilities.md +0 -83
- ads/explanations/explainer.py +0 -190
- ads/explanations/mlx_global_explainer.py +0 -1050
- ads/explanations/mlx_interface.py +0 -386
- ads/explanations/mlx_local_explainer.py +0 -287
- ads/explanations/mlx_whatif_explainer.py +0 -201
- ads/feature_engineering/__init__.py +0 -20
- ads/feature_engineering/accessor/__init__.py +0 -5
- ads/feature_engineering/accessor/dataframe_accessor.py +0 -535
- ads/feature_engineering/accessor/mixin/__init__.py +0 -5
- ads/feature_engineering/accessor/mixin/correlation.py +0 -166
- ads/feature_engineering/accessor/mixin/eda_mixin.py +0 -266
- ads/feature_engineering/accessor/mixin/eda_mixin_series.py +0 -85
- ads/feature_engineering/accessor/mixin/feature_types_mixin.py +0 -211
- ads/feature_engineering/accessor/mixin/utils.py +0 -65
- ads/feature_engineering/accessor/series_accessor.py +0 -431
- ads/feature_engineering/adsimage/__init__.py +0 -5
- ads/feature_engineering/adsimage/image.py +0 -192
- ads/feature_engineering/adsimage/image_reader.py +0 -170
- ads/feature_engineering/adsimage/interface/__init__.py +0 -5
- ads/feature_engineering/adsimage/interface/reader.py +0 -19
- ads/feature_engineering/adsstring/__init__.py +0 -7
- ads/feature_engineering/adsstring/oci_language/__init__.py +0 -8
- ads/feature_engineering/adsstring/string/__init__.py +0 -8
- ads/feature_engineering/data_schema.json +0 -57
- ads/feature_engineering/dataset/__init__.py +0 -5
- ads/feature_engineering/dataset/zip_code_data.py +0 -42062
- ads/feature_engineering/exceptions.py +0 -40
- ads/feature_engineering/feature_type/__init__.py +0 -133
- ads/feature_engineering/feature_type/address.py +0 -184
- ads/feature_engineering/feature_type/adsstring/__init__.py +0 -5
- ads/feature_engineering/feature_type/adsstring/common_regex_mixin.py +0 -164
- ads/feature_engineering/feature_type/adsstring/oci_language.py +0 -93
- ads/feature_engineering/feature_type/adsstring/parsers/__init__.py +0 -5
- ads/feature_engineering/feature_type/adsstring/parsers/base.py +0 -47
- ads/feature_engineering/feature_type/adsstring/parsers/nltk_parser.py +0 -96
- ads/feature_engineering/feature_type/adsstring/parsers/spacy_parser.py +0 -221
- ads/feature_engineering/feature_type/adsstring/string.py +0 -258
- ads/feature_engineering/feature_type/base.py +0 -58
- ads/feature_engineering/feature_type/boolean.py +0 -183
- ads/feature_engineering/feature_type/category.py +0 -146
- ads/feature_engineering/feature_type/constant.py +0 -137
- ads/feature_engineering/feature_type/continuous.py +0 -151
- ads/feature_engineering/feature_type/creditcard.py +0 -314
- ads/feature_engineering/feature_type/datetime.py +0 -190
- ads/feature_engineering/feature_type/discrete.py +0 -134
- ads/feature_engineering/feature_type/document.py +0 -43
- ads/feature_engineering/feature_type/gis.py +0 -251
- ads/feature_engineering/feature_type/handler/__init__.py +0 -5
- ads/feature_engineering/feature_type/handler/feature_validator.py +0 -524
- ads/feature_engineering/feature_type/handler/feature_warning.py +0 -319
- ads/feature_engineering/feature_type/handler/warnings.py +0 -128
- ads/feature_engineering/feature_type/integer.py +0 -142
- ads/feature_engineering/feature_type/ip_address.py +0 -144
- ads/feature_engineering/feature_type/ip_address_v4.py +0 -138
- ads/feature_engineering/feature_type/ip_address_v6.py +0 -138
- ads/feature_engineering/feature_type/lat_long.py +0 -256
- ads/feature_engineering/feature_type/object.py +0 -43
- ads/feature_engineering/feature_type/ordinal.py +0 -132
- ads/feature_engineering/feature_type/phone_number.py +0 -135
- ads/feature_engineering/feature_type/string.py +0 -171
- ads/feature_engineering/feature_type/text.py +0 -93
- ads/feature_engineering/feature_type/unknown.py +0 -43
- ads/feature_engineering/feature_type/zip_code.py +0 -164
- ads/feature_engineering/feature_type_manager.py +0 -406
- ads/feature_engineering/schema.py +0 -795
- ads/feature_engineering/utils.py +0 -245
- ads/feature_store/.readthedocs.yaml +0 -19
- ads/feature_store/README.md +0 -65
- ads/feature_store/__init__.py +0 -9
- ads/feature_store/common/__init__.py +0 -0
- ads/feature_store/common/enums.py +0 -339
- ads/feature_store/common/exceptions.py +0 -18
- ads/feature_store/common/spark_session_singleton.py +0 -125
- ads/feature_store/common/utils/__init__.py +0 -0
- ads/feature_store/common/utils/base64_encoder_decoder.py +0 -72
- ads/feature_store/common/utils/feature_schema_mapper.py +0 -283
- ads/feature_store/common/utils/transformation_utils.py +0 -82
- ads/feature_store/common/utils/utility.py +0 -403
- ads/feature_store/data_validation/__init__.py +0 -0
- ads/feature_store/data_validation/great_expectation.py +0 -129
- ads/feature_store/dataset.py +0 -1230
- ads/feature_store/dataset_job.py +0 -530
- ads/feature_store/docs/Dockerfile +0 -7
- ads/feature_store/docs/Makefile +0 -44
- ads/feature_store/docs/conf.py +0 -28
- ads/feature_store/docs/requirements.txt +0 -14
- ads/feature_store/docs/source/ads.feature_store.query.rst +0 -20
- ads/feature_store/docs/source/cicd.rst +0 -137
- ads/feature_store/docs/source/conf.py +0 -86
- ads/feature_store/docs/source/data_versioning.rst +0 -33
- ads/feature_store/docs/source/dataset.rst +0 -388
- ads/feature_store/docs/source/dataset_job.rst +0 -27
- ads/feature_store/docs/source/demo.rst +0 -70
- ads/feature_store/docs/source/entity.rst +0 -78
- ads/feature_store/docs/source/feature_group.rst +0 -624
- ads/feature_store/docs/source/feature_group_job.rst +0 -29
- ads/feature_store/docs/source/feature_store.rst +0 -122
- ads/feature_store/docs/source/feature_store_class.rst +0 -123
- ads/feature_store/docs/source/feature_validation.rst +0 -66
- ads/feature_store/docs/source/figures/cicd.png +0 -0
- ads/feature_store/docs/source/figures/data_validation.png +0 -0
- ads/feature_store/docs/source/figures/data_versioning.png +0 -0
- ads/feature_store/docs/source/figures/dataset.gif +0 -0
- ads/feature_store/docs/source/figures/dataset.png +0 -0
- ads/feature_store/docs/source/figures/dataset_lineage.png +0 -0
- ads/feature_store/docs/source/figures/dataset_statistics.png +0 -0
- ads/feature_store/docs/source/figures/dataset_statistics_viz.png +0 -0
- ads/feature_store/docs/source/figures/dataset_validation_results.png +0 -0
- ads/feature_store/docs/source/figures/dataset_validation_summary.png +0 -0
- ads/feature_store/docs/source/figures/drift_monitoring.png +0 -0
- ads/feature_store/docs/source/figures/entity.png +0 -0
- ads/feature_store/docs/source/figures/feature_group.png +0 -0
- ads/feature_store/docs/source/figures/feature_group_lineage.png +0 -0
- ads/feature_store/docs/source/figures/feature_group_statistics_viz.png +0 -0
- ads/feature_store/docs/source/figures/feature_store_deployment.png +0 -0
- ads/feature_store/docs/source/figures/feature_store_overview.png +0 -0
- ads/feature_store/docs/source/figures/featuregroup.gif +0 -0
- ads/feature_store/docs/source/figures/lineage_d1.png +0 -0
- ads/feature_store/docs/source/figures/lineage_d2.png +0 -0
- ads/feature_store/docs/source/figures/lineage_fg.png +0 -0
- ads/feature_store/docs/source/figures/logo-dark-mode.png +0 -0
- ads/feature_store/docs/source/figures/logo-light-mode.png +0 -0
- ads/feature_store/docs/source/figures/overview.png +0 -0
- ads/feature_store/docs/source/figures/resource_manager.png +0 -0
- ads/feature_store/docs/source/figures/resource_manager_feature_store_stack.png +0 -0
- ads/feature_store/docs/source/figures/resource_manager_home.png +0 -0
- ads/feature_store/docs/source/figures/stats_1.png +0 -0
- ads/feature_store/docs/source/figures/stats_2.png +0 -0
- ads/feature_store/docs/source/figures/stats_d.png +0 -0
- ads/feature_store/docs/source/figures/stats_fg.png +0 -0
- ads/feature_store/docs/source/figures/transformation.png +0 -0
- ads/feature_store/docs/source/figures/transformations.gif +0 -0
- ads/feature_store/docs/source/figures/validation.png +0 -0
- ads/feature_store/docs/source/figures/validation_fg.png +0 -0
- ads/feature_store/docs/source/figures/validation_results.png +0 -0
- ads/feature_store/docs/source/figures/validation_summary.png +0 -0
- ads/feature_store/docs/source/index.rst +0 -81
- ads/feature_store/docs/source/module.rst +0 -8
- ads/feature_store/docs/source/notebook.rst +0 -94
- ads/feature_store/docs/source/overview.rst +0 -47
- ads/feature_store/docs/source/quickstart.rst +0 -176
- ads/feature_store/docs/source/release_notes.rst +0 -194
- ads/feature_store/docs/source/setup_feature_store.rst +0 -81
- ads/feature_store/docs/source/statistics.rst +0 -58
- ads/feature_store/docs/source/transformation.rst +0 -199
- ads/feature_store/docs/source/ui.rst +0 -65
- ads/feature_store/docs/source/user_guides.setup.feature_store_operator.rst +0 -66
- ads/feature_store/docs/source/user_guides.setup.helm_chart.rst +0 -192
- ads/feature_store/docs/source/user_guides.setup.terraform.rst +0 -338
- ads/feature_store/entity.py +0 -718
- ads/feature_store/execution_strategy/__init__.py +0 -0
- ads/feature_store/execution_strategy/delta_lake/__init__.py +0 -0
- ads/feature_store/execution_strategy/delta_lake/delta_lake_service.py +0 -375
- ads/feature_store/execution_strategy/engine/__init__.py +0 -0
- ads/feature_store/execution_strategy/engine/spark_engine.py +0 -316
- ads/feature_store/execution_strategy/execution_strategy.py +0 -113
- ads/feature_store/execution_strategy/execution_strategy_provider.py +0 -47
- ads/feature_store/execution_strategy/spark/__init__.py +0 -0
- ads/feature_store/execution_strategy/spark/spark_execution.py +0 -618
- ads/feature_store/feature.py +0 -192
- ads/feature_store/feature_group.py +0 -1494
- ads/feature_store/feature_group_expectation.py +0 -346
- ads/feature_store/feature_group_job.py +0 -602
- ads/feature_store/feature_lineage/__init__.py +0 -0
- ads/feature_store/feature_lineage/graphviz_service.py +0 -180
- ads/feature_store/feature_option_details.py +0 -50
- ads/feature_store/feature_statistics/__init__.py +0 -0
- ads/feature_store/feature_statistics/statistics_service.py +0 -99
- ads/feature_store/feature_store.py +0 -699
- ads/feature_store/feature_store_registrar.py +0 -518
- ads/feature_store/input_feature_detail.py +0 -149
- ads/feature_store/mixin/__init__.py +0 -4
- ads/feature_store/mixin/oci_feature_store.py +0 -145
- ads/feature_store/model_details.py +0 -73
- ads/feature_store/query/__init__.py +0 -0
- ads/feature_store/query/filter.py +0 -266
- ads/feature_store/query/generator/__init__.py +0 -0
- ads/feature_store/query/generator/query_generator.py +0 -298
- ads/feature_store/query/join.py +0 -161
- ads/feature_store/query/query.py +0 -403
- ads/feature_store/query/validator/__init__.py +0 -0
- ads/feature_store/query/validator/query_validator.py +0 -57
- ads/feature_store/response/__init__.py +0 -0
- ads/feature_store/response/response_builder.py +0 -68
- ads/feature_store/service/__init__.py +0 -0
- ads/feature_store/service/oci_dataset.py +0 -139
- ads/feature_store/service/oci_dataset_job.py +0 -199
- ads/feature_store/service/oci_entity.py +0 -125
- ads/feature_store/service/oci_feature_group.py +0 -164
- ads/feature_store/service/oci_feature_group_job.py +0 -214
- ads/feature_store/service/oci_feature_store.py +0 -182
- ads/feature_store/service/oci_lineage.py +0 -87
- ads/feature_store/service/oci_transformation.py +0 -104
- ads/feature_store/statistics/__init__.py +0 -0
- ads/feature_store/statistics/abs_feature_value.py +0 -49
- ads/feature_store/statistics/charts/__init__.py +0 -0
- ads/feature_store/statistics/charts/abstract_feature_plot.py +0 -37
- ads/feature_store/statistics/charts/box_plot.py +0 -148
- ads/feature_store/statistics/charts/frequency_distribution.py +0 -65
- ads/feature_store/statistics/charts/probability_distribution.py +0 -68
- ads/feature_store/statistics/charts/top_k_frequent_elements.py +0 -98
- ads/feature_store/statistics/feature_stat.py +0 -126
- ads/feature_store/statistics/generic_feature_value.py +0 -33
- ads/feature_store/statistics/statistics.py +0 -41
- ads/feature_store/statistics_config.py +0 -101
- ads/feature_store/templates/feature_store_template.yaml +0 -45
- ads/feature_store/transformation.py +0 -499
- ads/feature_store/validation_output.py +0 -57
- ads/hpo/__init__.py +0 -9
- ads/hpo/_imports.py +0 -91
- ads/hpo/ads_search_space.py +0 -439
- ads/hpo/distributions.py +0 -325
- ads/hpo/objective.py +0 -280
- ads/hpo/search_cv.py +0 -1657
- ads/hpo/stopping_criterion.py +0 -75
- ads/hpo/tuner_artifact.py +0 -413
- ads/hpo/utils.py +0 -91
- ads/hpo/validation.py +0 -140
- ads/hpo/visualization/__init__.py +0 -5
- ads/hpo/visualization/_contour.py +0 -23
- ads/hpo/visualization/_edf.py +0 -20
- ads/hpo/visualization/_intermediate_values.py +0 -21
- ads/hpo/visualization/_optimization_history.py +0 -25
- ads/hpo/visualization/_parallel_coordinate.py +0 -169
- ads/hpo/visualization/_param_importances.py +0 -26
- ads/jobs/__init__.py +0 -53
- ads/jobs/ads_job.py +0 -663
- ads/jobs/builders/__init__.py +0 -5
- ads/jobs/builders/base.py +0 -156
- ads/jobs/builders/infrastructure/__init__.py +0 -6
- ads/jobs/builders/infrastructure/base.py +0 -165
- ads/jobs/builders/infrastructure/dataflow.py +0 -1252
- ads/jobs/builders/infrastructure/dsc_job.py +0 -1894
- ads/jobs/builders/infrastructure/dsc_job_runtime.py +0 -1233
- ads/jobs/builders/infrastructure/utils.py +0 -65
- ads/jobs/builders/runtimes/__init__.py +0 -5
- ads/jobs/builders/runtimes/artifact.py +0 -338
- ads/jobs/builders/runtimes/base.py +0 -325
- ads/jobs/builders/runtimes/container_runtime.py +0 -242
- ads/jobs/builders/runtimes/python_runtime.py +0 -1016
- ads/jobs/builders/runtimes/pytorch_runtime.py +0 -204
- ads/jobs/cli.py +0 -104
- ads/jobs/env_var_parser.py +0 -131
- ads/jobs/extension.py +0 -160
- ads/jobs/schema/__init__.py +0 -5
- ads/jobs/schema/infrastructure_schema.json +0 -116
- ads/jobs/schema/job_schema.json +0 -42
- ads/jobs/schema/runtime_schema.json +0 -183
- ads/jobs/schema/validator.py +0 -141
- ads/jobs/serializer.py +0 -296
- ads/jobs/templates/__init__.py +0 -5
- ads/jobs/templates/container.py +0 -6
- ads/jobs/templates/driver_notebook.py +0 -177
- ads/jobs/templates/driver_oci.py +0 -500
- ads/jobs/templates/driver_python.py +0 -48
- ads/jobs/templates/driver_pytorch.py +0 -852
- ads/jobs/templates/driver_utils.py +0 -615
- ads/jobs/templates/hostname_from_env.c +0 -55
- ads/jobs/templates/oci_metrics.py +0 -181
- ads/jobs/utils.py +0 -104
- ads/llm/__init__.py +0 -28
- ads/llm/autogen/__init__.py +0 -2
- ads/llm/autogen/constants.py +0 -15
- ads/llm/autogen/reports/__init__.py +0 -2
- ads/llm/autogen/reports/base.py +0 -67
- ads/llm/autogen/reports/data.py +0 -103
- ads/llm/autogen/reports/session.py +0 -526
- ads/llm/autogen/reports/templates/chat_box.html +0 -13
- ads/llm/autogen/reports/templates/chat_box_lt.html +0 -5
- ads/llm/autogen/reports/templates/chat_box_rt.html +0 -6
- ads/llm/autogen/reports/utils.py +0 -56
- ads/llm/autogen/v02/__init__.py +0 -4
- ads/llm/autogen/v02/client.py +0 -295
- ads/llm/autogen/v02/log_handlers/__init__.py +0 -2
- ads/llm/autogen/v02/log_handlers/oci_file_handler.py +0 -83
- ads/llm/autogen/v02/loggers/__init__.py +0 -6
- ads/llm/autogen/v02/loggers/metric_logger.py +0 -320
- ads/llm/autogen/v02/loggers/session_logger.py +0 -580
- ads/llm/autogen/v02/loggers/utils.py +0 -86
- ads/llm/autogen/v02/runtime_logging.py +0 -163
- ads/llm/chain.py +0 -268
- ads/llm/chat_template.py +0 -31
- ads/llm/deploy.py +0 -63
- ads/llm/guardrails/__init__.py +0 -5
- ads/llm/guardrails/base.py +0 -442
- ads/llm/guardrails/huggingface.py +0 -44
- ads/llm/langchain/__init__.py +0 -5
- ads/llm/langchain/plugins/__init__.py +0 -5
- ads/llm/langchain/plugins/chat_models/__init__.py +0 -5
- ads/llm/langchain/plugins/chat_models/oci_data_science.py +0 -1027
- ads/llm/langchain/plugins/embeddings/__init__.py +0 -4
- ads/llm/langchain/plugins/embeddings/oci_data_science_model_deployment_endpoint.py +0 -184
- ads/llm/langchain/plugins/llms/__init__.py +0 -5
- ads/llm/langchain/plugins/llms/oci_data_science_model_deployment_endpoint.py +0 -979
- ads/llm/requirements.txt +0 -3
- ads/llm/serialize.py +0 -219
- ads/llm/serializers/__init__.py +0 -0
- ads/llm/serializers/retrieval_qa.py +0 -153
- ads/llm/serializers/runnable_parallel.py +0 -27
- ads/llm/templates/score_chain.jinja2 +0 -155
- ads/llm/templates/tool_chat_template_hermes.jinja +0 -130
- ads/llm/templates/tool_chat_template_mistral_parallel.jinja +0 -94
- ads/model/__init__.py +0 -52
- ads/model/artifact.py +0 -573
- ads/model/artifact_downloader.py +0 -254
- ads/model/artifact_uploader.py +0 -267
- ads/model/base_properties.py +0 -238
- ads/model/common/.model-ignore +0 -66
- ads/model/common/__init__.py +0 -5
- ads/model/common/utils.py +0 -142
- ads/model/datascience_model.py +0 -2635
- ads/model/deployment/__init__.py +0 -20
- ads/model/deployment/common/__init__.py +0 -5
- ads/model/deployment/common/utils.py +0 -308
- ads/model/deployment/model_deployer.py +0 -466
- ads/model/deployment/model_deployment.py +0 -1846
- ads/model/deployment/model_deployment_infrastructure.py +0 -671
- ads/model/deployment/model_deployment_properties.py +0 -493
- ads/model/deployment/model_deployment_runtime.py +0 -838
- ads/model/extractor/__init__.py +0 -5
- ads/model/extractor/automl_extractor.py +0 -74
- ads/model/extractor/embedding_onnx_extractor.py +0 -80
- ads/model/extractor/huggingface_extractor.py +0 -88
- ads/model/extractor/keras_extractor.py +0 -84
- ads/model/extractor/lightgbm_extractor.py +0 -93
- ads/model/extractor/model_info_extractor.py +0 -114
- ads/model/extractor/model_info_extractor_factory.py +0 -105
- ads/model/extractor/pytorch_extractor.py +0 -87
- ads/model/extractor/sklearn_extractor.py +0 -112
- ads/model/extractor/spark_extractor.py +0 -89
- ads/model/extractor/tensorflow_extractor.py +0 -85
- ads/model/extractor/xgboost_extractor.py +0 -94
- ads/model/framework/__init__.py +0 -5
- ads/model/framework/automl_model.py +0 -178
- ads/model/framework/embedding_onnx_model.py +0 -438
- ads/model/framework/huggingface_model.py +0 -399
- ads/model/framework/lightgbm_model.py +0 -266
- ads/model/framework/pytorch_model.py +0 -266
- ads/model/framework/sklearn_model.py +0 -250
- ads/model/framework/spark_model.py +0 -326
- ads/model/framework/tensorflow_model.py +0 -254
- ads/model/framework/xgboost_model.py +0 -258
- ads/model/generic_model.py +0 -3518
- ads/model/model_artifact_boilerplate/README.md +0 -381
- ads/model/model_artifact_boilerplate/__init__.py +0 -5
- ads/model/model_artifact_boilerplate/artifact_introspection_test/__init__.py +0 -5
- ads/model/model_artifact_boilerplate/artifact_introspection_test/model_artifact_validate.py +0 -427
- ads/model/model_artifact_boilerplate/artifact_introspection_test/requirements.txt +0 -2
- ads/model/model_artifact_boilerplate/runtime.yaml +0 -7
- ads/model/model_artifact_boilerplate/score.py +0 -61
- ads/model/model_file_description_schema.json +0 -68
- ads/model/model_introspect.py +0 -331
- ads/model/model_metadata.py +0 -1810
- ads/model/model_metadata_mixin.py +0 -460
- ads/model/model_properties.py +0 -63
- ads/model/model_version_set.py +0 -739
- ads/model/runtime/__init__.py +0 -5
- ads/model/runtime/env_info.py +0 -306
- ads/model/runtime/model_deployment_details.py +0 -37
- ads/model/runtime/model_provenance_details.py +0 -58
- ads/model/runtime/runtime_info.py +0 -81
- ads/model/runtime/schemas/inference_env_info_schema.yaml +0 -16
- ads/model/runtime/schemas/model_provenance_schema.yaml +0 -36
- ads/model/runtime/schemas/training_env_info_schema.yaml +0 -16
- ads/model/runtime/utils.py +0 -201
- ads/model/serde/__init__.py +0 -5
- ads/model/serde/common.py +0 -40
- ads/model/serde/model_input.py +0 -547
- ads/model/serde/model_serializer.py +0 -1184
- ads/model/service/__init__.py +0 -5
- ads/model/service/oci_datascience_model.py +0 -1076
- ads/model/service/oci_datascience_model_deployment.py +0 -500
- ads/model/service/oci_datascience_model_version_set.py +0 -176
- ads/model/transformer/__init__.py +0 -5
- ads/model/transformer/onnx_transformer.py +0 -324
- ads/mysqldb/__init__.py +0 -5
- ads/mysqldb/mysql_db.py +0 -227
- ads/opctl/__init__.py +0 -18
- ads/opctl/anomaly_detection.py +0 -11
- ads/opctl/backend/__init__.py +0 -5
- ads/opctl/backend/ads_dataflow.py +0 -353
- ads/opctl/backend/ads_ml_job.py +0 -710
- ads/opctl/backend/ads_ml_pipeline.py +0 -164
- ads/opctl/backend/ads_model_deployment.py +0 -209
- ads/opctl/backend/base.py +0 -146
- ads/opctl/backend/local.py +0 -1053
- ads/opctl/backend/marketplace/__init__.py +0 -9
- ads/opctl/backend/marketplace/helm_helper.py +0 -173
- ads/opctl/backend/marketplace/local_marketplace.py +0 -271
- ads/opctl/backend/marketplace/marketplace_backend_runner.py +0 -71
- ads/opctl/backend/marketplace/marketplace_operator_interface.py +0 -44
- ads/opctl/backend/marketplace/marketplace_operator_runner.py +0 -24
- ads/opctl/backend/marketplace/marketplace_utils.py +0 -212
- ads/opctl/backend/marketplace/models/__init__.py +0 -5
- ads/opctl/backend/marketplace/models/bearer_token.py +0 -94
- ads/opctl/backend/marketplace/models/marketplace_type.py +0 -70
- ads/opctl/backend/marketplace/models/ocir_details.py +0 -56
- ads/opctl/backend/marketplace/prerequisite_checker.py +0 -238
- ads/opctl/cli.py +0 -707
- ads/opctl/cmds.py +0 -869
- ads/opctl/conda/__init__.py +0 -5
- ads/opctl/conda/cli.py +0 -193
- ads/opctl/conda/cmds.py +0 -749
- ads/opctl/conda/config.yaml +0 -34
- ads/opctl/conda/manifest_template.yaml +0 -13
- ads/opctl/conda/multipart_uploader.py +0 -188
- ads/opctl/conda/pack.py +0 -89
- ads/opctl/config/__init__.py +0 -5
- ads/opctl/config/base.py +0 -57
- ads/opctl/config/diagnostics/__init__.py +0 -5
- ads/opctl/config/diagnostics/distributed/default_requirements_config.yaml +0 -62
- ads/opctl/config/merger.py +0 -255
- ads/opctl/config/resolver.py +0 -297
- ads/opctl/config/utils.py +0 -79
- ads/opctl/config/validator.py +0 -17
- ads/opctl/config/versioner.py +0 -68
- ads/opctl/config/yaml_parsers/__init__.py +0 -7
- ads/opctl/config/yaml_parsers/base.py +0 -58
- ads/opctl/config/yaml_parsers/distributed/__init__.py +0 -7
- ads/opctl/config/yaml_parsers/distributed/yaml_parser.py +0 -201
- ads/opctl/constants.py +0 -66
- ads/opctl/decorator/__init__.py +0 -5
- ads/opctl/decorator/common.py +0 -129
- ads/opctl/diagnostics/__init__.py +0 -5
- ads/opctl/diagnostics/__main__.py +0 -25
- ads/opctl/diagnostics/check_distributed_job_requirements.py +0 -212
- ads/opctl/diagnostics/check_requirements.py +0 -144
- ads/opctl/diagnostics/requirement_exception.py +0 -9
- ads/opctl/distributed/README.md +0 -109
- ads/opctl/distributed/__init__.py +0 -5
- ads/opctl/distributed/certificates.py +0 -32
- ads/opctl/distributed/cli.py +0 -207
- ads/opctl/distributed/cmds.py +0 -731
- ads/opctl/distributed/common/__init__.py +0 -5
- ads/opctl/distributed/common/abstract_cluster_provider.py +0 -449
- ads/opctl/distributed/common/abstract_framework_spec_builder.py +0 -88
- ads/opctl/distributed/common/cluster_config_helper.py +0 -103
- ads/opctl/distributed/common/cluster_provider_factory.py +0 -21
- ads/opctl/distributed/common/cluster_runner.py +0 -54
- ads/opctl/distributed/common/framework_factory.py +0 -29
- ads/opctl/docker/Dockerfile.job +0 -103
- ads/opctl/docker/Dockerfile.job.arm +0 -107
- ads/opctl/docker/Dockerfile.job.gpu +0 -175
- ads/opctl/docker/base-env.yaml +0 -13
- ads/opctl/docker/cuda.repo +0 -6
- ads/opctl/docker/operator/.dockerignore +0 -0
- ads/opctl/docker/operator/Dockerfile +0 -41
- ads/opctl/docker/operator/Dockerfile.gpu +0 -85
- ads/opctl/docker/operator/cuda.repo +0 -6
- ads/opctl/docker/operator/environment.yaml +0 -8
- ads/opctl/forecast.py +0 -11
- ads/opctl/index.yaml +0 -3
- ads/opctl/model/__init__.py +0 -5
- ads/opctl/model/cli.py +0 -65
- ads/opctl/model/cmds.py +0 -73
- ads/opctl/operator/README.md +0 -4
- ads/opctl/operator/__init__.py +0 -31
- ads/opctl/operator/cli.py +0 -344
- ads/opctl/operator/cmd.py +0 -596
- ads/opctl/operator/common/__init__.py +0 -5
- ads/opctl/operator/common/backend_factory.py +0 -460
- ads/opctl/operator/common/const.py +0 -27
- ads/opctl/operator/common/data/synthetic.csv +0 -16001
- ads/opctl/operator/common/dictionary_merger.py +0 -148
- ads/opctl/operator/common/errors.py +0 -42
- ads/opctl/operator/common/operator_config.py +0 -99
- ads/opctl/operator/common/operator_loader.py +0 -811
- ads/opctl/operator/common/operator_schema.yaml +0 -130
- ads/opctl/operator/common/operator_yaml_generator.py +0 -152
- ads/opctl/operator/common/utils.py +0 -208
- ads/opctl/operator/lowcode/__init__.py +0 -5
- ads/opctl/operator/lowcode/anomaly/MLoperator +0 -16
- ads/opctl/operator/lowcode/anomaly/README.md +0 -207
- ads/opctl/operator/lowcode/anomaly/__init__.py +0 -5
- ads/opctl/operator/lowcode/anomaly/__main__.py +0 -103
- ads/opctl/operator/lowcode/anomaly/cmd.py +0 -35
- ads/opctl/operator/lowcode/anomaly/const.py +0 -167
- ads/opctl/operator/lowcode/anomaly/environment.yaml +0 -10
- ads/opctl/operator/lowcode/anomaly/model/__init__.py +0 -5
- ads/opctl/operator/lowcode/anomaly/model/anomaly_dataset.py +0 -146
- ads/opctl/operator/lowcode/anomaly/model/anomaly_merlion.py +0 -162
- ads/opctl/operator/lowcode/anomaly/model/automlx.py +0 -99
- ads/opctl/operator/lowcode/anomaly/model/autots.py +0 -115
- ads/opctl/operator/lowcode/anomaly/model/base_model.py +0 -404
- ads/opctl/operator/lowcode/anomaly/model/factory.py +0 -110
- ads/opctl/operator/lowcode/anomaly/model/isolationforest.py +0 -78
- ads/opctl/operator/lowcode/anomaly/model/oneclasssvm.py +0 -78
- ads/opctl/operator/lowcode/anomaly/model/randomcutforest.py +0 -120
- ads/opctl/operator/lowcode/anomaly/model/tods.py +0 -119
- ads/opctl/operator/lowcode/anomaly/operator_config.py +0 -127
- ads/opctl/operator/lowcode/anomaly/schema.yaml +0 -401
- ads/opctl/operator/lowcode/anomaly/utils.py +0 -88
- ads/opctl/operator/lowcode/common/__init__.py +0 -5
- ads/opctl/operator/lowcode/common/const.py +0 -10
- ads/opctl/operator/lowcode/common/data.py +0 -116
- ads/opctl/operator/lowcode/common/errors.py +0 -47
- ads/opctl/operator/lowcode/common/transformations.py +0 -296
- ads/opctl/operator/lowcode/common/utils.py +0 -293
- ads/opctl/operator/lowcode/feature_store_marketplace/MLoperator +0 -13
- ads/opctl/operator/lowcode/feature_store_marketplace/README.md +0 -30
- ads/opctl/operator/lowcode/feature_store_marketplace/__init__.py +0 -5
- ads/opctl/operator/lowcode/feature_store_marketplace/__main__.py +0 -116
- ads/opctl/operator/lowcode/feature_store_marketplace/cmd.py +0 -85
- ads/opctl/operator/lowcode/feature_store_marketplace/const.py +0 -15
- ads/opctl/operator/lowcode/feature_store_marketplace/environment.yaml +0 -0
- ads/opctl/operator/lowcode/feature_store_marketplace/models/__init__.py +0 -4
- ads/opctl/operator/lowcode/feature_store_marketplace/models/apigw_config.py +0 -32
- ads/opctl/operator/lowcode/feature_store_marketplace/models/db_config.py +0 -43
- ads/opctl/operator/lowcode/feature_store_marketplace/models/mysql_config.py +0 -120
- ads/opctl/operator/lowcode/feature_store_marketplace/models/serializable_yaml_model.py +0 -34
- ads/opctl/operator/lowcode/feature_store_marketplace/operator_utils.py +0 -386
- ads/opctl/operator/lowcode/feature_store_marketplace/schema.yaml +0 -160
- ads/opctl/operator/lowcode/forecast/MLoperator +0 -25
- ads/opctl/operator/lowcode/forecast/README.md +0 -209
- ads/opctl/operator/lowcode/forecast/__init__.py +0 -5
- ads/opctl/operator/lowcode/forecast/__main__.py +0 -89
- ads/opctl/operator/lowcode/forecast/cmd.py +0 -40
- ads/opctl/operator/lowcode/forecast/const.py +0 -92
- ads/opctl/operator/lowcode/forecast/environment.yaml +0 -20
- ads/opctl/operator/lowcode/forecast/errors.py +0 -26
- ads/opctl/operator/lowcode/forecast/model/__init__.py +0 -5
- ads/opctl/operator/lowcode/forecast/model/arima.py +0 -279
- ads/opctl/operator/lowcode/forecast/model/automlx.py +0 -542
- ads/opctl/operator/lowcode/forecast/model/autots.py +0 -312
- ads/opctl/operator/lowcode/forecast/model/base_model.py +0 -863
- ads/opctl/operator/lowcode/forecast/model/factory.py +0 -106
- ads/opctl/operator/lowcode/forecast/model/forecast_datasets.py +0 -492
- ads/opctl/operator/lowcode/forecast/model/ml_forecast.py +0 -243
- ads/opctl/operator/lowcode/forecast/model/neuralprophet.py +0 -486
- ads/opctl/operator/lowcode/forecast/model/prophet.py +0 -445
- ads/opctl/operator/lowcode/forecast/model_evaluator.py +0 -244
- ads/opctl/operator/lowcode/forecast/operator_config.py +0 -234
- ads/opctl/operator/lowcode/forecast/schema.yaml +0 -506
- ads/opctl/operator/lowcode/forecast/utils.py +0 -413
- ads/opctl/operator/lowcode/forecast/whatifserve/__init__.py +0 -7
- ads/opctl/operator/lowcode/forecast/whatifserve/deployment_manager.py +0 -285
- ads/opctl/operator/lowcode/forecast/whatifserve/score.py +0 -246
- ads/opctl/operator/lowcode/pii/MLoperator +0 -17
- ads/opctl/operator/lowcode/pii/README.md +0 -208
- ads/opctl/operator/lowcode/pii/__init__.py +0 -5
- ads/opctl/operator/lowcode/pii/__main__.py +0 -78
- ads/opctl/operator/lowcode/pii/cmd.py +0 -39
- ads/opctl/operator/lowcode/pii/constant.py +0 -84
- ads/opctl/operator/lowcode/pii/environment.yaml +0 -17
- ads/opctl/operator/lowcode/pii/errors.py +0 -27
- ads/opctl/operator/lowcode/pii/model/__init__.py +0 -5
- ads/opctl/operator/lowcode/pii/model/factory.py +0 -82
- ads/opctl/operator/lowcode/pii/model/guardrails.py +0 -167
- ads/opctl/operator/lowcode/pii/model/pii.py +0 -145
- ads/opctl/operator/lowcode/pii/model/processor/__init__.py +0 -34
- ads/opctl/operator/lowcode/pii/model/processor/email_replacer.py +0 -34
- ads/opctl/operator/lowcode/pii/model/processor/mbi_replacer.py +0 -35
- ads/opctl/operator/lowcode/pii/model/processor/name_replacer.py +0 -225
- ads/opctl/operator/lowcode/pii/model/processor/number_replacer.py +0 -73
- ads/opctl/operator/lowcode/pii/model/processor/remover.py +0 -26
- ads/opctl/operator/lowcode/pii/model/report.py +0 -487
- ads/opctl/operator/lowcode/pii/operator_config.py +0 -95
- ads/opctl/operator/lowcode/pii/schema.yaml +0 -108
- ads/opctl/operator/lowcode/pii/utils.py +0 -43
- ads/opctl/operator/lowcode/recommender/MLoperator +0 -16
- ads/opctl/operator/lowcode/recommender/README.md +0 -206
- ads/opctl/operator/lowcode/recommender/__init__.py +0 -5
- ads/opctl/operator/lowcode/recommender/__main__.py +0 -82
- ads/opctl/operator/lowcode/recommender/cmd.py +0 -33
- ads/opctl/operator/lowcode/recommender/constant.py +0 -30
- ads/opctl/operator/lowcode/recommender/environment.yaml +0 -11
- ads/opctl/operator/lowcode/recommender/model/base_model.py +0 -212
- ads/opctl/operator/lowcode/recommender/model/factory.py +0 -56
- ads/opctl/operator/lowcode/recommender/model/recommender_dataset.py +0 -25
- ads/opctl/operator/lowcode/recommender/model/svd.py +0 -106
- ads/opctl/operator/lowcode/recommender/operator_config.py +0 -81
- ads/opctl/operator/lowcode/recommender/schema.yaml +0 -265
- ads/opctl/operator/lowcode/recommender/utils.py +0 -13
- ads/opctl/operator/runtime/__init__.py +0 -5
- ads/opctl/operator/runtime/const.py +0 -17
- ads/opctl/operator/runtime/container_runtime_schema.yaml +0 -50
- ads/opctl/operator/runtime/marketplace_runtime.py +0 -50
- ads/opctl/operator/runtime/python_marketplace_runtime_schema.yaml +0 -21
- ads/opctl/operator/runtime/python_runtime_schema.yaml +0 -21
- ads/opctl/operator/runtime/runtime.py +0 -115
- ads/opctl/schema.yaml.yml +0 -36
- ads/opctl/script.py +0 -40
- ads/opctl/spark/__init__.py +0 -5
- ads/opctl/spark/cli.py +0 -43
- ads/opctl/spark/cmds.py +0 -147
- ads/opctl/templates/diagnostic_report_template.jinja2 +0 -102
- ads/opctl/utils.py +0 -344
- ads/oracledb/__init__.py +0 -5
- ads/oracledb/oracle_db.py +0 -346
- ads/pipeline/__init__.py +0 -39
- ads/pipeline/ads_pipeline.py +0 -2279
- ads/pipeline/ads_pipeline_run.py +0 -772
- ads/pipeline/ads_pipeline_step.py +0 -605
- ads/pipeline/builders/__init__.py +0 -5
- ads/pipeline/builders/infrastructure/__init__.py +0 -5
- ads/pipeline/builders/infrastructure/custom_script.py +0 -32
- ads/pipeline/cli.py +0 -119
- ads/pipeline/extension.py +0 -291
- ads/pipeline/schema/__init__.py +0 -5
- ads/pipeline/schema/cs_step_schema.json +0 -35
- ads/pipeline/schema/ml_step_schema.json +0 -31
- ads/pipeline/schema/pipeline_schema.json +0 -71
- ads/pipeline/visualizer/__init__.py +0 -5
- ads/pipeline/visualizer/base.py +0 -570
- ads/pipeline/visualizer/graph_renderer.py +0 -272
- ads/pipeline/visualizer/text_renderer.py +0 -84
- ads/secrets/__init__.py +0 -11
- ads/secrets/adb.py +0 -386
- ads/secrets/auth_token.py +0 -86
- ads/secrets/big_data_service.py +0 -365
- ads/secrets/mysqldb.py +0 -149
- ads/secrets/oracledb.py +0 -160
- ads/secrets/secrets.py +0 -407
- ads/telemetry/__init__.py +0 -7
- ads/telemetry/base.py +0 -69
- ads/telemetry/client.py +0 -125
- ads/telemetry/telemetry.py +0 -257
- ads/templates/dataflow_pyspark.jinja2 +0 -13
- ads/templates/dataflow_sparksql.jinja2 +0 -22
- ads/templates/func.jinja2 +0 -20
- ads/templates/schemas/openapi.json +0 -1740
- ads/templates/score-pkl.jinja2 +0 -173
- ads/templates/score.jinja2 +0 -322
- ads/templates/score_embedding_onnx.jinja2 +0 -202
- ads/templates/score_generic.jinja2 +0 -165
- ads/templates/score_huggingface_pipeline.jinja2 +0 -217
- ads/templates/score_lightgbm.jinja2 +0 -185
- ads/templates/score_onnx.jinja2 +0 -407
- ads/templates/score_onnx_new.jinja2 +0 -473
- ads/templates/score_oracle_automl.jinja2 +0 -185
- ads/templates/score_pyspark.jinja2 +0 -154
- ads/templates/score_pytorch.jinja2 +0 -219
- ads/templates/score_scikit-learn.jinja2 +0 -184
- ads/templates/score_tensorflow.jinja2 +0 -184
- ads/templates/score_xgboost.jinja2 +0 -178
- ads/text_dataset/__init__.py +0 -5
- ads/text_dataset/backends.py +0 -211
- ads/text_dataset/dataset.py +0 -445
- ads/text_dataset/extractor.py +0 -207
- ads/text_dataset/options.py +0 -53
- ads/text_dataset/udfs.py +0 -22
- ads/text_dataset/utils.py +0 -49
- ads/type_discovery/__init__.py +0 -9
- ads/type_discovery/abstract_detector.py +0 -21
- ads/type_discovery/constant_detector.py +0 -41
- ads/type_discovery/continuous_detector.py +0 -54
- ads/type_discovery/credit_card_detector.py +0 -99
- ads/type_discovery/datetime_detector.py +0 -92
- ads/type_discovery/discrete_detector.py +0 -118
- ads/type_discovery/document_detector.py +0 -146
- ads/type_discovery/ip_detector.py +0 -68
- ads/type_discovery/latlon_detector.py +0 -90
- ads/type_discovery/phone_number_detector.py +0 -63
- ads/type_discovery/type_discovery_driver.py +0 -87
- ads/type_discovery/typed_feature.py +0 -594
- ads/type_discovery/unknown_detector.py +0 -41
- ads/type_discovery/zipcode_detector.py +0 -48
- ads/vault/__init__.py +0 -7
- ads/vault/vault.py +0 -237
- oracle_ads-2.13.8.dist-info/RECORD +0 -858
- {oracle_ads-2.13.8.dist-info → oracle_ads-2.13.9rc0.dist-info}/licenses/LICENSE.txt +0 -0
@@ -1,795 +0,0 @@
|
|
1
|
-
#!/usr/bin/env python
|
2
|
-
# -*- coding: utf-8 -*--
|
3
|
-
|
4
|
-
# Copyright (c) 2021, 2022 Oracle and/or its affiliates.
|
5
|
-
# Licensed under the Universal Permissive License v 1.0 as shown at https://oss.oracle.com/licenses/upl/
|
6
|
-
|
7
|
-
import asteval
|
8
|
-
import fsspec
|
9
|
-
import json
|
10
|
-
import os
|
11
|
-
import sys
|
12
|
-
import yaml
|
13
|
-
from abc import ABC, abstractmethod
|
14
|
-
from cerberus import Validator
|
15
|
-
from copy import deepcopy
|
16
|
-
from dataclasses import dataclass, field
|
17
|
-
from typing import Dict, List, Optional
|
18
|
-
from string import Template
|
19
|
-
from os import path
|
20
|
-
from ads.common.serializer import DataClassSerializable
|
21
|
-
from ads.common.object_storage_details import ObjectStorageDetails
|
22
|
-
|
23
|
-
try:
|
24
|
-
from yaml import CDumper as dumper
|
25
|
-
from yaml import CLoader as loader
|
26
|
-
except:
|
27
|
-
from yaml import Dumper as dumper
|
28
|
-
from yaml import Loader as loader
|
29
|
-
|
30
|
-
# File name of the JSON validator definition stored next to this module.
SCHEMA_VALIDATOR_NAME = "data_schema.json"
# Maximum allowable schema size in bytes (reported by SchemaSizeTooLarge).
# NOTE: "SCHENA" is a misspelling of "SCHEMA"; the name is kept unchanged
# because it is part of the module's public surface.
INPUT_OUTPUT_SCHENA_SIZE_LIMIT = 32000
# Version given to newly created Schema objects.
SCHEMA_VERSION = "1.1"
# Version assumed for a loaded schema that does not declare one.
DEFAULT_SCHEMA_VERSION = "1.0"
# Top-level keys of the (lower-cased) schema dictionary.
SCHEMA_KEY = "schema"
SCHEMA_VERSION_KEY = "version"
DEFAULT_STORAGE_OPTIONS = None
|
37
|
-
|
38
|
-
|
39
|
-
class SchemaSizeTooLarge(ValueError):
    """Error describing a schema whose size exceeds the allowed limit.

    Parameters
    ----------
    size: int
        Size of the offending schema in bytes; it is echoed in the message
        together with `INPUT_OUTPUT_SCHENA_SIZE_LIMIT`.
    """

    def __init__(self, size: int):
        super().__init__(
            f"The schema is `{size}` bytes and "
            f"the maximum allowable schema size is `{INPUT_OUTPUT_SCHENA_SIZE_LIMIT}` bytes. "
            "Reduce the size of the schema."
        )
|
46
|
-
|
47
|
-
|
48
|
-
class DataSizeTooWide(ValueError):
    """Error describing data that has more columns than allowed.

    Parameters
    ----------
    data_col_num: int
        Number of columns found in the data.
    max_col_num: int
        Maximum number of columns that is allowed.
    """

    def __init__(self, data_col_num: int, max_col_num: int):
        super().__init__(
            f"The data has `{data_col_num}` columns and "
            f"the maximum allowable number of columns is `{max_col_num}`. "
            "Increase allowable number of columns by setting a larger max_col_num. It will take longer time to prepare."
        )
|
55
|
-
|
56
|
-
|
57
|
-
@dataclass(repr=False)
class Expression(DataClassSerializable):
    """
    Expression allows specifying string representation of an expression which can be evaluated by the language corresponding to the value provided in `language` attribute

    Default value for language is python

    Parameters
    ----------
    expression: Must use string.Template format for specifying the expression
        type: str
    language: default value is python. It could be any language. `evaluate` method expects the expression to be of type python

    Examples
    --------
    >>> exp = Expression("($x > 10 and $x <100) or ($x < -1 and $x > -500)")
    >>> exp.evaluate(x=500)
    False
    >>> exp.evaluate(x=20)
    True
    >>> exp.evaluate(x=9)
    False
    >>> exp.evaluate(x=-9)
    True
    """

    expression: str
    language: str = "python"

    def evaluate(self, **kwargs):
        """Substitute `kwargs` into the expression and evaluate the result.

        Parameters
        ----------
        kwargs:
            Values for the `$name` placeholders used in the expression.

        Returns
        -------
        The value produced by the asteval interpreter for the substituted
        expression.

        Raises
        ------
        Exception
            If the language is not python, or if the placeholders cannot be
            substituted with the given values.
        """
        if self.language.lower() != "python":
            raise Exception(
                f"Evaluation not supported for language {self.language}. Supported language: python"
            )

        try:
            final_expression = Template(self.expression).substitute(kwargs)
        except Exception as err:
            # Keep the original failure attached so the offending placeholder
            # remains visible in the traceback.
            raise Exception(
                "Error substituting the value into the expression. Check if the variable in the expression matches the parameter names passed to evaluate method"
            ) from err
        aeval = asteval.Interpreter()
        return aeval(final_expression)

    def __post_init__(self):
        """Reject an empty expression or an empty language."""
        if not self.expression or not self.language:
            raise ValueError(
                "An Expression object requires values for both expression and language"
            )
|
108
|
-
|
109
|
-
|
110
|
-
@dataclass(repr=False)
class Domain(DataClassSerializable):
    """Domain describes the data. It holds following information -
    * stats - Statistics of the data.
    * constraints - List of Expression which defines the constraint for the data.
    * Domain values.

    Examples
    --------

    >>> Domain(values='Rational Numbers', stats={"mean":50, "median":51, "min": 5, "max":100}, constraints=[Expression('$x > 5')])
    constraints:
    - expression: $x > 5
      language: python
    stats:
      max: 100
      mean: 50
      median: 51
      min: 5
    values: Rational Numbers
    """

    # Textual description of the domain values.
    values: str = ""
    # Statistics of the data; a fresh dict per instance.
    stats: Dict = field(default_factory=dict)
    # Constraints on the data; a fresh list per instance.
    constraints: List[Expression] = field(default_factory=list)
|
135
|
-
|
136
|
-
|
137
|
-
@dataclass(repr=False, order=True)
class Attribute(DataClassSerializable):
    """
    Attribute describes the column/feature/element. It holds following information -
    * dtype - Type of data - float, int64, etc. Matches with Pandas dtypes
    * feature_type - Feature type of data - Integer, String, etc. Matches with ads feature types.
    * name - Name of the feature
    * domain - Represented by the Domain class
    * required - Boolean - True or False
    * description - Description about the column/feature
    * order - order of the column/feature in the data

    Examples
    --------

    >>> attr_fruits = Attribute(
    ...     dtype = "category",
    ...     feature_type = "category",
    ...     name = "fruits",
    ...     domain = Domain(values="Apple, Orange, Grapes", stats={"mode": "Orange"}, constraints=[Expression("in ['Apple', 'Orange', 'Grapes']")]),
    ...     required = True,
    ...     description = "Names of fruits",
    ...     order = 0
    ... )
    >>> attr_fruits
    description: Names of fruits
    domain:
      constraints:
      - expression: in ['Apple', 'Orange', 'Grapes']
        language: python
      stats:
        mode: Orange
      values: Apple, Orange, Grapes
    dtype: category
    feature_type: category
    name: fruits
    order: 0
    required: true
    >>> attr_fruits.key
    'fruits'
    """

    # Declared first so the comparisons generated by `order=True` look at it
    # before any other field; filled in by __post_init__.
    sort_index: int = field(init=False, repr=False)
    dtype: str
    feature_type: str
    name: str
    domain: Domain
    required: bool
    description: str
    order: Optional[int] = None

    @property
    def key(self):
        """The identifying key of the attribute, which is its name."""
        return self.name

    def to_dict(self, **kwargs) -> dict:
        """Serialize the attribute into a dictionary without `sort_index`."""
        data = super().to_dict(**kwargs)
        # sort_index is an internal ordering helper, not part of the schema.
        data.pop("sort_index", None)
        return data

    def __hash__(self):
        """Hash only on the attribute key."""
        return hash(self.key)

    def __post_init__(self):
        """Derive `sort_index` from `order`, using 0 when no order is set."""
        object.__setattr__(self, "sort_index", self.order or 0)
|
202
|
-
|
203
|
-
|
204
|
-
class BaseSchemaLoader(ABC):
    """
    Base Schema Loader which loads and validates schema.

    Methods
    -------
    load_schema(self, schema_path)
        Load and validate schema from a file and return the normalized schema.
    """

    def __init__(self):
        self._schema = None

    def load_schema(self, schema_path):
        """Load and validate schema from a file and return the normalized schema."""
        self._load_schema(schema_path)
        self._normalize()
        return self._validate()

    def _normalize(self):
        """Lower-case the top-level keys of the loaded schema."""
        self._schema = {key.lower(): value for key, value in self._schema.items()}

    @abstractmethod
    def _load_schema(self, schema_path):
        """Read the raw schema from `schema_path` into `self._schema`."""

    def _validate(self):
        """Validate the schema.

        Every item under the `schema` key is checked against the validator
        definition and replaced by its normalized form.

        Returns
        -------
        dict
            Dictionary holding the normalized items and the schema version
            (the default version when the schema declares none).

        Raises
        ------
        ValueError
            If an item fails validation; the message is a JSON report with
            the column name and the validation errors.
        """
        validator = Validator(self._load_schema_validator())
        normalized_items = []
        for item in self._schema[SCHEMA_KEY]:
            if not validator.validate(item):
                # Use .get(): a missing "name" may be exactly what failed
                # validation, and a KeyError here would hide the real report.
                report = {"column": item.get("name"), "error": validator.errors}
                raise ValueError(json.dumps(report, indent=2))
            normalized_items.append(validator.normalized(item))
        schema_version = self._schema.get(SCHEMA_VERSION_KEY) or DEFAULT_SCHEMA_VERSION
        self._schema = {
            SCHEMA_KEY: normalized_items,
            SCHEMA_VERSION_KEY: schema_version,
        }
        return self._schema

    @staticmethod
    def _load_schema_validator():
        """load the schema validator to validate the schema."""
        validator_path = os.path.join(
            os.path.dirname(os.path.abspath(__file__)), SCHEMA_VALIDATOR_NAME
        )
        with open(validator_path) as schema_file:
            return json.load(schema_file)
|
258
|
-
|
259
|
-
|
260
|
-
class JsonSchemaLoader(BaseSchemaLoader):
    """
    Json Schema which load and validate schema from json file.

    Methods
    -------
    load_schema(self, schema_path)
        Load and validate schema from json file and return the normalized schema.

    Examples
    --------
    The returned dictionary has lower-case `schema` and `version` keys; the
    output below is illustrative.

    >>> schema_loader = JsonSchemaLoader()
    >>> schema_dict = schema_loader.load_schema('schema.json')
    >>> schema_dict
    {'schema': [{'dtype': 'object',
        'feature_type': 'String',
        'name': 'Attrition',
        'domain': {'values': 'String',
            'stats': {'count': 1470, 'unique': 2},
            'constraints': []},
        'required': True,
        'description': 'Attrition'},
        {'dtype': 'int64',
        'feature_type': 'Integer',
        'name': 'Age',
        'domain': {'values': 'Integer',
            'stats': {'count': 1470.0,
            'mean': 37.923809523809524,
            'std': 9.135373489136732,
            'min': 19.0,
            '25%': 31.0,
            '50%': 37.0,
            '75%': 44.0,
            'max': 61.0},
            'constraints': []},
        'required': True,
        'description': 'Age'}],
     'version': '1.0'}
    """

    def _load_schema(self, schema_path):
        """Loads schema from a json file into `self._schema`.

        Raises
        ------
        AssertionError
            If `schema_path` does not have a `.json` extension.
        FileNotFoundError
            If `schema_path` does not exist.
        """
        extension = os.path.splitext(schema_path)[-1].lower()
        if extension != ".json":
            # Raised explicitly rather than via `assert`, so the check still
            # runs under `python -O`; the exception type is unchanged.
            raise AssertionError("Expecting a json format file.")
        if not path.exists(schema_path):
            raise FileNotFoundError(f"{schema_path} does not exist")
        with fsspec.open(schema_path, mode="r", encoding="utf8") as f:
            self._schema = json.load(f)
|
308
|
-
|
309
|
-
|
310
|
-
class YamlSchemaLoader(BaseSchemaLoader):
    """
    Yaml Schema which loads and validates schema from a yaml file.

    Methods
    -------
    load_schema(self, schema_path)
        Loads and validates schema from a yaml file and returns the normalized schema.

    Examples
    --------
    The returned dictionary has lower-case `schema` and `version` keys; the
    output below is illustrative.

    >>> schema_loader = YamlSchemaLoader()
    >>> schema_dict = schema_loader.load_schema('schema.yaml')
    >>> schema_dict
    {'schema': [{'description': 'Attrition',
        'domain': {'constraints': [],
            'stats': {'count': 1470, 'unique': 2},
            'values': 'String'},
        'dtype': 'object',
        'feature_type': 'String',
        'name': 'Attrition',
        'required': True},
        {'description': 'Age',
        'domain': {'constraints': [],
            'stats': {'25%': 31.0,
            '50%': 37.0,
            '75%': 44.0,
            'count': 1470.0,
            'max': 61.0,
            'mean': 37.923809523809524,
            'min': 19.0,
            'std': 9.135373489136732},
            'values': 'Integer'},
        'dtype': 'int64',
        'feature_type': 'Integer',
        'name': 'Age',
        'required': True}],
     'version': '1.0'}
    """

    def _load_schema(self, schema_path):
        """Load schema from yaml file into `self._schema`.

        Raises
        ------
        AssertionError
            If `schema_path` does not have a `.yaml` or `.yml` extension.
        FileNotFoundError
            If `schema_path` does not exist.
        yaml.YAMLError
            If the content cannot be parsed.
        """
        extension = os.path.splitext(schema_path)[-1].lower()
        if extension not in (".yaml", ".yml"):
            # Raised explicitly rather than via `assert`, so the check still
            # runs under `python -O`; the exception type is unchanged.
            raise AssertionError("Expecting yaml format file.")
        if not path.exists(schema_path):
            raise FileNotFoundError(f"{schema_path} does not exist")
        with open(schema_path, "r") as stream:
            # NOTE(review): the content is parsed twice - the result of
            # safe_load is fed to yaml.load again. Presumably the file stores
            # a YAML string that itself contains the schema document; verify
            # against the code that writes these files before simplifying.
            # SECURITY: yaml.load with the full (C)Loader can construct
            # arbitrary Python objects; only load files from trusted sources.
            # YAML errors propagate to the caller unchanged.
            self._schema = yaml.load(yaml.safe_load(stream), Loader=loader)
|
362
|
-
|
363
|
-
|
364
|
-
class SchemaFactory:
    """
    Schema Factory.

    Methods
    -------
    register_format(self, file_format, creator)
        Register a new type of schema class.
    get_schema(self, file_format)
        Get the YamlSchema or JsonSchema based on the format.
    default_schema(cls)
        Construct a SchemaFactory instance and register yaml and json loader.

    Examples
    --------
    >>> factory = SchemaFactory.default_schema()
    >>> schema_loader = factory.get_schema('.json')
    >>> schema_dict = schema_loader.load_schema('schema.json')
    >>> schema = Schema.from_dict(schema_dict)
    >>> schema
    Schema:
    - description: Attrition
      domain:
        constraints: []
        stats:
          count: 1470
          unique: 2
        values: String
      dtype: object
      feature_type: String
      name: Attrition
      required: true
    - description: Age
      domain:
        constraints: []
        stats:
          25%: 31.0
          50%: 37.0
          75%: 44.0
          count: 1470.0
          max: 61.0
          mean: 37.923809523809524
          min: 19.0
          std: 9.135373489136732
        values: Integer
      dtype: int64
      feature_type: Integer
      name: Age
      required: true
    """

    def __init__(self):
        # Maps a file format (e.g. ".json") to the callable creating its loader.
        self._creators = {}

    def register_format(self, file_format, creator):
        """Register a new type of schema class.

        Parameters
        ----------
        file_format:
            Key under which the creator is stored, e.g. a file extension.
        creator:
            Callable invoked without arguments to build the loader.
        """
        self._creators[file_format] = creator

    def get_schema(self, file_format):
        """Get the YamlSchema or JsonSchema based on the format.

        An exact match is tried first. If there is none and `file_format` is
        a string, its lower-cased form is tried as well, so that an extension
        such as ".JSON" resolves like ".json".

        Raises
        ------
        ValueError
            If no creator is registered for the format.
        """
        creator = self._creators.get(file_format)
        if not creator and isinstance(file_format, str):
            creator = self._creators.get(file_format.lower())
        if not creator:
            raise ValueError(
                f"This {file_format} format is not supported. Pass Json or Yaml Files."
            )
        return creator()

    @classmethod
    def default_schema(cls):
        """Construct a factory with the json and yaml loaders registered."""
        factory = cls()
        factory.register_format(".json", JsonSchemaLoader)
        factory.register_format(".yaml", YamlSchemaLoader)
        factory.register_format(".yml", YamlSchemaLoader)
        return factory
|
438
|
-
|
439
|
-
|
440
|
-
@dataclass(repr=False)
|
441
|
-
class Schema:
|
442
|
-
"""
|
443
|
-
Schema describes the structure of the data.
|
444
|
-
|
445
|
-
Methods
|
446
|
-
-------
|
447
|
-
add(self, item: Attribute, replace: bool = False)
|
448
|
-
Adds a new attribute item. Replaces existing one if replace flag is True.
|
449
|
-
from_dict(self)
|
450
|
-
Constructs an instance of Schema from a dictionary.
|
451
|
-
from_file(cls, file_path):
|
452
|
-
Loads the data schema from a file.
|
453
|
-
to_dict(self)
|
454
|
-
Serializes the data schema into a dictionary.
|
455
|
-
to_yaml(self)
|
456
|
-
Serializes the data schema into a YAML.
|
457
|
-
to_json(self)
|
458
|
-
Serializes the data schema into a json string.
|
459
|
-
to_json_file(self)
|
460
|
-
Saves the data schema into a json file.
|
461
|
-
to_yaml_file(self)
|
462
|
-
Save to a yaml file.
|
463
|
-
add(self, item: Attribute, replace=False) -> None
|
464
|
-
Adds a new attribute item. Replaces existing one if replace flag is True.
|
465
|
-
|
466
|
-
Examples
|
467
|
-
--------
|
468
|
-
|
469
|
-
>>> attr_fruits = Attribute(
|
470
|
-
... dtype = "category",
|
471
|
-
... feature_type = "category",
|
472
|
-
... name = "fruits",
|
473
|
-
... domain = Domain(values="Apple, Orange, Grapes", stats={"mode": "Orange"}, constraints=[Expression("in ['Apple', 'Orange', 'Grapes']")]),
|
474
|
-
... required = True,
|
475
|
-
... description = "Names of fruits",
|
476
|
-
... order = 0,
|
477
|
-
... )
|
478
|
-
>>> attr_animals = Attribute(
|
479
|
-
... dtype = "category",
|
480
|
-
... feature_type = "category",
|
481
|
-
... name = "animals",
|
482
|
-
... domain = Domain(values="Dog, Cat, Python", stats={"mode": "Dog"}, constraints=[Expression("in ['Dog', 'Cat', 'Python']")]),
|
483
|
-
... required = True,
|
484
|
-
... description = "Names of animals",
|
485
|
-
... order = 1,
|
486
|
-
... )
|
487
|
-
>>> schema = Schema()
|
488
|
-
>>> schema.add(attr_fruits)
|
489
|
-
>>> schema.add(attr_animals)
|
490
|
-
>>> schema
|
491
|
-
schema:
|
492
|
-
- description: Names of fruits
|
493
|
-
domain:
|
494
|
-
constraints:
|
495
|
-
- expression: in ['Apple', 'Orange', 'Grapes']
|
496
|
-
language: python
|
497
|
-
stats:
|
498
|
-
mode: Orange
|
499
|
-
values: Apple, Orange, Grapes
|
500
|
-
dtype: category
|
501
|
-
feature_type: category
|
502
|
-
name: fruits
|
503
|
-
order: 0
|
504
|
-
required: true
|
505
|
-
- description: Names of animals
|
506
|
-
domain:
|
507
|
-
constraints:
|
508
|
-
- expression: in ['Dog', 'Cat', 'Python']
|
509
|
-
language: python
|
510
|
-
stats:
|
511
|
-
mode: Dog
|
512
|
-
values: Dog, Cat, Python
|
513
|
-
dtype: category
|
514
|
-
feature_type: category
|
515
|
-
name: animals
|
516
|
-
order: 1
|
517
|
-
required: true
|
518
|
-
>>> schema.to_dict()
|
519
|
-
{'schema': [{'dtype': 'category',
|
520
|
-
'feature_type': 'category',
|
521
|
-
'name': 'fruits',
|
522
|
-
'domain': {'values': 'Apple, Orange, Grapes',
|
523
|
-
'stats': {'mode': 'Orange'},
|
524
|
-
'constraints': [{'expression': "in ['Apple', 'Orange', 'Grapes']",
|
525
|
-
'language': 'python'}]},
|
526
|
-
'required': True,
|
527
|
-
'description': 'Names of fruits',
|
528
|
-
'order': 0},
|
529
|
-
{'dtype': 'category',
|
530
|
-
'feature_type': 'category',
|
531
|
-
'name': 'animals',
|
532
|
-
'domain': {'values': 'Dog, Cat, Python',
|
533
|
-
'stats': {'mode': 'Dog'},
|
534
|
-
'constraints': [{'expression': "in ['Dog', 'Cat', 'Python']",
|
535
|
-
'language': 'python'}]},
|
536
|
-
'required': True,
|
537
|
-
'description': 'Names of animals',
|
538
|
-
'order': 1}]}
|
539
|
-
|
540
|
-
"""
|
541
|
-
|
542
|
-
_schema: set = field(default_factory=set, init=False)
|
543
|
-
_version: str = SCHEMA_VERSION
|
544
|
-
|
545
|
-
def add(self, item: Attribute, replace: bool = False):
|
546
|
-
"""Adds a new attribute item. Replaces existing one if replace flag is True.
|
547
|
-
|
548
|
-
Overrides the existing one if replace flag is True.
|
549
|
-
|
550
|
-
Parameters
|
551
|
-
----------
|
552
|
-
item : Attribute
|
553
|
-
The attribute instance of a column/feature/element.
|
554
|
-
replace : bool
|
555
|
-
Overrides the existing attribute item if replace flag is True.
|
556
|
-
|
557
|
-
Returns
|
558
|
-
-------
|
559
|
-
None
|
560
|
-
Nothing.
|
561
|
-
|
562
|
-
Raises
|
563
|
-
------
|
564
|
-
ValueError
|
565
|
-
If item is already registered and replace flag is False.
|
566
|
-
TypeError
|
567
|
-
If input data has a wrong format.
|
568
|
-
"""
|
569
|
-
if not isinstance(item, Attribute):
|
570
|
-
raise TypeError("Argument must be an instance of the class Attribute.")
|
571
|
-
if not replace and item.key in self.keys:
|
572
|
-
raise ValueError(
|
573
|
-
f"The key {item.key} already exists. Use `replace=True` to overwrite."
|
574
|
-
)
|
575
|
-
self._schema.discard(item)
|
576
|
-
self._schema.add(item)
|
577
|
-
|
578
|
-
@property
|
579
|
-
def keys(self) -> list:
|
580
|
-
"""Returns all registered Attribute keys.
|
581
|
-
|
582
|
-
Returns
|
583
|
-
-------
|
584
|
-
Tuple[str]
|
585
|
-
The list of Attribute keys.
|
586
|
-
"""
|
587
|
-
return tuple(item.key for item in self)
|
588
|
-
|
589
|
-
@classmethod
def from_dict(cls, schema: dict):
    """Constructs an instance of Schema from a dictionary.

    Parameters
    ----------
    schema : dict
        Data schema in dictionary format. Top-level keys are matched
        case-insensitively (they are lower-cased before lookup).

    Returns
    -------
    Schema
        An instance of Schema. An empty dictionary yields an empty schema.

    Raises
    ------
    TypeError
        If ``schema`` is not a dictionary.
    KeyError
        If the schema section or an item's ``domain`` entry is missing.
    """
    sc = cls()

    if schema == {}:
        return sc
    if not isinstance(schema, dict):
        raise TypeError("schema has to be of dictionary type.")

    # Work on a deep copy: items are mutated below (their "domain" entry is
    # replaced by a Domain object) and the caller's dictionary must stay intact.
    schema = {key.lower(): value for key, value in deepcopy(schema).items()}
    for item in schema[SCHEMA_KEY]:
        domain_spec = item["domain"]
        domain = Domain(**domain_spec)
        # A missing or null "constraints" entry is treated as "no constraints"
        # instead of failing with KeyError/TypeError.
        domain.constraints = [
            Expression(**constraint)
            for constraint in (domain_spec.get("constraints") or ())
        ]
        item["domain"] = domain
        sc.add(Attribute(**item))
    return sc
|
619
|
-
|
620
|
-
@classmethod
def from_json(cls, schema: str):
    """Constructs an instance of Schema from a Json.

    Parameters
    ----------
    schema : str
        Data schema in Json format.

    Returns
    -------
    Schema
        An instance of the class this method is called on.
    """
    # Dispatch through `cls` (not the hard-coded base class) so subclasses
    # get an instance of their own type, as `from_file` already does.
    return cls.from_dict(json.loads(schema))
|
635
|
-
|
636
|
-
@classmethod
def from_file(cls, file_path: str):
    """Builds a Schema from a schema file.

    The loader is selected from the file extension of ``file_path``.

    Parameters
    ----------
    file_path : str
        File Path to load the data schema.

    Returns
    -------
    Schema
        An instance of Schema.
    """
    _, extension = os.path.splitext(file_path)
    loader = SchemaFactory.default_schema().get_schema(extension)
    raw_schema = loader.load_schema(file_path)
    return cls.from_dict(raw_schema)
|
653
|
-
|
654
|
-
def to_dict(self):
    """Converts the data schema into a dictionary.

    Returns
    -------
    dict
        The dictionary representation of data schema: the serialized
        attributes plus the schema version.
    """
    serialized = {}
    serialized[SCHEMA_KEY] = [attribute.to_dict() for attribute in self]
    serialized[SCHEMA_VERSION_KEY] = self._version
    return serialized
|
666
|
-
|
667
|
-
def to_yaml(self):
    """Converts the data schema into a YAML document.

    Returns
    -------
    str
        The yaml representation of data schema.
    """
    payload = self.to_dict()
    return yaml.dump(payload, Dumper=dumper)
|
675
|
-
|
676
|
-
def to_json(self):
    """Serializes the data schema into a json string.

    NaN float values are emitted as ``null`` so the result is valid JSON.

    Returns
    -------
    str
        The json representation of data schema.
    """

    def _nan_to_none(value):
        # NaN is the only float that does not compare equal to itself.
        if isinstance(value, float) and value != value:
            return None
        if isinstance(value, dict):
            return {key: _nan_to_none(val) for key, val in value.items()}
        if isinstance(value, (list, tuple)):
            return [_nan_to_none(val) for val in value]
        return value

    # Convert NaN values before dumping instead of replacing the text "NaN"
    # in the serialized output, which also rewrote string values (names,
    # descriptions, ...) that merely contain those characters.
    return json.dumps(_nan_to_none(self.to_dict()))
|
684
|
-
|
685
|
-
def to_json_file(self, file_path, storage_options: dict = None):
    """Saves the data schema into a json file.

    Parameters
    ----------
    file_path : str
        File Path to store the schema in json format.
    storage_options: dict. Default None
        Parameters passed on to the backend filesystem class.
        Defaults to `storage_options` set using `DatasetFactory.set_default_storage()`.

    Returns
    -------
    None
        Nothing.

    Raises
    ------
    AssertionError
        If ``file_path`` does not have the extension .json.
    Exception
        If the target directory cannot be created.
    """
    directory = os.path.expanduser(os.path.dirname(file_path))
    basename = os.path.expanduser(os.path.basename(file_path))
    if os.path.splitext(file_path)[-1].lower() != ".json":
        # Raised explicitly instead of via `assert` so the check is not
        # stripped under `python -O`; the exception type is unchanged.
        raise AssertionError(
            f"The file `{basename}` is not a valid JSON file. The `{file_path}` must have the extension .json."
        )
    if directory and not os.path.exists(directory):
        # Only local paths get a directory created here.
        if not ObjectStorageDetails.is_oci_path(directory):
            try:
                # makedirs also creates missing parent directories.
                os.makedirs(directory, exist_ok=True)
            except OSError as err:
                raise Exception("Error creating the directory.") from err
    if not storage_options:
        storage_options = DEFAULT_STORAGE_OPTIONS or {"config": {}}
    with fsspec.open(
        os.path.join(directory, basename),
        mode="w",
        **storage_options,
    ) as f:
        # NOTE(review): unlike `to_json`, NaN values are written as bare `NaN`
        # tokens here, which strict JSON parsers reject - confirm whether the
        # file should go through the same NaN handling.
        f.write(json.dumps(self.to_dict()))
|
720
|
-
|
721
|
-
def to_yaml_file(self, file_path):
    """Saves the data schema into a yaml file.

    Parameters
    ----------
    file_path : str
        File Path to store the schema in yaml format.

    Returns
    -------
    None
        Nothing.

    Raises
    ------
    AssertionError
        If ``file_path`` does not have the extension .yaml or .yml.
    Exception
        If the target directory cannot be created.
    """
    if os.path.splitext(file_path)[-1] not in (".yaml", ".yml"):
        # Raised explicitly instead of via `assert` so the check is not
        # stripped under `python -O`; the exception type is unchanged.
        raise AssertionError("The `file_path` must have the extension .yaml or .yml.")
    directory = os.path.expanduser(os.path.dirname(file_path))
    basename = os.path.expanduser(os.path.basename(file_path))
    if directory and not os.path.exists(directory):
        try:
            # makedirs also creates missing parent directories.
            os.makedirs(directory, exist_ok=True)
        except OSError as err:
            raise Exception("Error creating the directory.") from err
    with open(os.path.join(directory, basename), "w") as yaml_file:
        # NOTE(review): `self.to_yaml()` is already a YAML string, so dumping it
        # again stores the schema as one quoted YAML scalar rather than a
        # mapping - confirm that readers of this file expect that.
        yaml.dump(self.to_yaml(), yaml_file, default_flow_style=True)
|
746
|
-
|
747
|
-
def validate_size(self) -> bool:
    """Validates schema size.

    Validates the size of schema. Throws an error if the size of the schema
    exceeds expected value. The size is measured with ``sys.getsizeof`` on
    the YAML representation of the schema.

    Returns
    -------
    bool
        True if schema does not exceed the size limit.

    Raises
    ------
    SchemaSizeTooLarge
        If the size of the schema exceeds expected value.
    """
    # Serialize once and reuse the measurement for both the check and the error.
    schema_size = sys.getsizeof(self.to_yaml())
    if schema_size > INPUT_OUTPUT_SCHENA_SIZE_LIMIT:
        raise SchemaSizeTooLarge(schema_size)
    return True
|
766
|
-
|
767
|
-
def validate_schema(self):
    """Checks every serialized attribute against the schema validator.

    Returns
    -------
    bool
        True when all attributes pass validation.

    Raises
    ------
    ValueError
        For the first attribute that fails validation; the message is a
        JSON document with the column name and the validator errors.
    """
    validator = Validator(BaseSchemaLoader._load_schema_validator())
    for attribute in self.to_dict()[SCHEMA_KEY]:
        if validator.validate(attribute):
            continue
        report = {"column": attribute["name"], "error": validator.errors}
        raise ValueError(json.dumps(report, indent=2))
    return True
|
777
|
-
|
778
|
-
def __getitem__(self, key: str):
    """Returns the registered attribute with the given key.

    Parameters
    ----------
    key : str
        The key of the attribute to look up.

    Returns
    -------
    The stored item whose ``key`` equals ``key``.

    Raises
    ------
    ValueError
        If ``key`` is None or empty, or no attribute has that key.
    TypeError
        If ``key`` is not a string.
    """
    if key is None or key == "":
        raise ValueError(f"The key `{key}` must not be empty.")
    if not isinstance(key, str):
        # The exception used to be constructed but never raised.
        raise TypeError(f"The key `{key}` must be a string.")
    for item in self._schema:
        if item.key == key:
            return item
    raise ValueError(f"The key {key} is not found.")
|
787
|
-
|
788
|
-
def __repr__(self):
    """Uses the YAML form of the schema as its representation."""
    yaml_text = self.to_yaml()
    return yaml_text
|
790
|
-
|
791
|
-
def __iter__(self):
    """Iterates over the registered items in sorted order."""
    ordered = sorted(self._schema)
    return iter(ordered)
|
793
|
-
|
794
|
-
def __len__(self):
    """Returns the number of registered items."""
    count = len(self._schema)
    return count
|