oracle-ads 2.13.9rc0__py3-none-any.whl → 2.13.10__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (858) hide show
  1. ads/aqua/__init__.py +40 -0
  2. ads/aqua/app.py +507 -0
  3. ads/aqua/cli.py +96 -0
  4. ads/aqua/client/__init__.py +3 -0
  5. ads/aqua/client/client.py +836 -0
  6. ads/aqua/client/openai_client.py +305 -0
  7. ads/aqua/common/__init__.py +5 -0
  8. ads/aqua/common/decorator.py +125 -0
  9. ads/aqua/common/entities.py +274 -0
  10. ads/aqua/common/enums.py +134 -0
  11. ads/aqua/common/errors.py +109 -0
  12. ads/aqua/common/utils.py +1295 -0
  13. ads/aqua/config/__init__.py +4 -0
  14. ads/aqua/config/container_config.py +246 -0
  15. ads/aqua/config/evaluation/__init__.py +4 -0
  16. ads/aqua/config/evaluation/evaluation_service_config.py +147 -0
  17. ads/aqua/config/utils/__init__.py +4 -0
  18. ads/aqua/config/utils/serializer.py +339 -0
  19. ads/aqua/constants.py +116 -0
  20. ads/aqua/data.py +14 -0
  21. ads/aqua/dummy_data/icon.txt +1 -0
  22. ads/aqua/dummy_data/oci_model_deployments.json +56 -0
  23. ads/aqua/dummy_data/oci_models.json +1 -0
  24. ads/aqua/dummy_data/readme.md +26 -0
  25. ads/aqua/evaluation/__init__.py +8 -0
  26. ads/aqua/evaluation/constants.py +53 -0
  27. ads/aqua/evaluation/entities.py +186 -0
  28. ads/aqua/evaluation/errors.py +70 -0
  29. ads/aqua/evaluation/evaluation.py +1814 -0
  30. ads/aqua/extension/__init__.py +42 -0
  31. ads/aqua/extension/aqua_ws_msg_handler.py +76 -0
  32. ads/aqua/extension/base_handler.py +90 -0
  33. ads/aqua/extension/common_handler.py +121 -0
  34. ads/aqua/extension/common_ws_msg_handler.py +36 -0
  35. ads/aqua/extension/deployment_handler.py +381 -0
  36. ads/aqua/extension/deployment_ws_msg_handler.py +54 -0
  37. ads/aqua/extension/errors.py +30 -0
  38. ads/aqua/extension/evaluation_handler.py +129 -0
  39. ads/aqua/extension/evaluation_ws_msg_handler.py +61 -0
  40. ads/aqua/extension/finetune_handler.py +96 -0
  41. ads/aqua/extension/model_handler.py +390 -0
  42. ads/aqua/extension/models/__init__.py +0 -0
  43. ads/aqua/extension/models/ws_models.py +145 -0
  44. ads/aqua/extension/models_ws_msg_handler.py +50 -0
  45. ads/aqua/extension/ui_handler.py +300 -0
  46. ads/aqua/extension/ui_websocket_handler.py +130 -0
  47. ads/aqua/extension/utils.py +133 -0
  48. ads/aqua/finetuning/__init__.py +7 -0
  49. ads/aqua/finetuning/constants.py +23 -0
  50. ads/aqua/finetuning/entities.py +181 -0
  51. ads/aqua/finetuning/finetuning.py +749 -0
  52. ads/aqua/model/__init__.py +8 -0
  53. ads/aqua/model/constants.py +60 -0
  54. ads/aqua/model/entities.py +385 -0
  55. ads/aqua/model/enums.py +32 -0
  56. ads/aqua/model/model.py +2134 -0
  57. ads/aqua/model/utils.py +52 -0
  58. ads/aqua/modeldeployment/__init__.py +6 -0
  59. ads/aqua/modeldeployment/constants.py +10 -0
  60. ads/aqua/modeldeployment/deployment.py +1315 -0
  61. ads/aqua/modeldeployment/entities.py +653 -0
  62. ads/aqua/modeldeployment/utils.py +543 -0
  63. ads/aqua/resources/gpu_shapes_index.json +94 -0
  64. ads/aqua/server/__init__.py +4 -0
  65. ads/aqua/server/__main__.py +24 -0
  66. ads/aqua/server/app.py +47 -0
  67. ads/aqua/server/aqua_spec.yml +1291 -0
  68. ads/aqua/training/__init__.py +4 -0
  69. ads/aqua/training/exceptions.py +476 -0
  70. ads/aqua/ui.py +519 -0
  71. ads/automl/__init__.py +9 -0
  72. ads/automl/driver.py +330 -0
  73. ads/automl/provider.py +975 -0
  74. ads/bds/__init__.py +5 -0
  75. ads/bds/auth.py +127 -0
  76. ads/bds/big_data_service.py +255 -0
  77. ads/catalog/__init__.py +19 -0
  78. ads/catalog/model.py +1576 -0
  79. ads/catalog/notebook.py +461 -0
  80. ads/catalog/project.py +468 -0
  81. ads/catalog/summary.py +178 -0
  82. ads/common/__init__.py +11 -0
  83. ads/common/analyzer.py +65 -0
  84. ads/common/artifact/.model-ignore +63 -0
  85. ads/common/artifact/__init__.py +10 -0
  86. ads/common/auth.py +1122 -0
  87. ads/common/card_identifier.py +83 -0
  88. ads/common/config.py +647 -0
  89. ads/common/data.py +165 -0
  90. ads/common/decorator/__init__.py +9 -0
  91. ads/common/decorator/argument_to_case.py +88 -0
  92. ads/common/decorator/deprecate.py +69 -0
  93. ads/common/decorator/require_nonempty_arg.py +65 -0
  94. ads/common/decorator/runtime_dependency.py +178 -0
  95. ads/common/decorator/threaded.py +97 -0
  96. ads/common/decorator/utils.py +35 -0
  97. ads/common/dsc_file_system.py +303 -0
  98. ads/common/error.py +14 -0
  99. ads/common/extended_enum.py +81 -0
  100. ads/common/function/__init__.py +5 -0
  101. ads/common/function/fn_util.py +142 -0
  102. ads/common/function/func_conf.yaml +25 -0
  103. ads/common/ipython.py +76 -0
  104. ads/common/model.py +679 -0
  105. ads/common/model_artifact.py +1759 -0
  106. ads/common/model_artifact_schema.json +107 -0
  107. ads/common/model_export_util.py +664 -0
  108. ads/common/model_metadata.py +24 -0
  109. ads/common/object_storage_details.py +296 -0
  110. ads/common/oci_client.py +179 -0
  111. ads/common/oci_datascience.py +46 -0
  112. ads/common/oci_logging.py +1144 -0
  113. ads/common/oci_mixin.py +957 -0
  114. ads/common/oci_resource.py +136 -0
  115. ads/common/serializer.py +559 -0
  116. ads/common/utils.py +1852 -0
  117. ads/common/word_lists.py +1491 -0
  118. ads/common/work_request.py +189 -0
  119. ads/config.py +1 -0
  120. ads/data_labeling/__init__.py +13 -0
  121. ads/data_labeling/boundingbox.py +253 -0
  122. ads/data_labeling/constants.py +47 -0
  123. ads/data_labeling/data_labeling_service.py +244 -0
  124. ads/data_labeling/interface/__init__.py +5 -0
  125. ads/data_labeling/interface/loader.py +16 -0
  126. ads/data_labeling/interface/parser.py +16 -0
  127. ads/data_labeling/interface/reader.py +23 -0
  128. ads/data_labeling/loader/__init__.py +5 -0
  129. ads/data_labeling/loader/file_loader.py +241 -0
  130. ads/data_labeling/metadata.py +110 -0
  131. ads/data_labeling/mixin/__init__.py +5 -0
  132. ads/data_labeling/mixin/data_labeling.py +232 -0
  133. ads/data_labeling/ner.py +129 -0
  134. ads/data_labeling/parser/__init__.py +5 -0
  135. ads/data_labeling/parser/dls_record_parser.py +388 -0
  136. ads/data_labeling/parser/export_metadata_parser.py +94 -0
  137. ads/data_labeling/parser/export_record_parser.py +473 -0
  138. ads/data_labeling/reader/__init__.py +5 -0
  139. ads/data_labeling/reader/dataset_reader.py +574 -0
  140. ads/data_labeling/reader/dls_record_reader.py +121 -0
  141. ads/data_labeling/reader/export_record_reader.py +62 -0
  142. ads/data_labeling/reader/jsonl_reader.py +75 -0
  143. ads/data_labeling/reader/metadata_reader.py +203 -0
  144. ads/data_labeling/reader/record_reader.py +263 -0
  145. ads/data_labeling/record.py +52 -0
  146. ads/data_labeling/visualizer/__init__.py +5 -0
  147. ads/data_labeling/visualizer/image_visualizer.py +525 -0
  148. ads/data_labeling/visualizer/text_visualizer.py +357 -0
  149. ads/database/__init__.py +5 -0
  150. ads/database/connection.py +338 -0
  151. ads/dataset/__init__.py +10 -0
  152. ads/dataset/capabilities.md +51 -0
  153. ads/dataset/classification_dataset.py +339 -0
  154. ads/dataset/correlation.py +226 -0
  155. ads/dataset/correlation_plot.py +563 -0
  156. ads/dataset/dask_series.py +173 -0
  157. ads/dataset/dataframe_transformer.py +110 -0
  158. ads/dataset/dataset.py +1979 -0
  159. ads/dataset/dataset_browser.py +360 -0
  160. ads/dataset/dataset_with_target.py +995 -0
  161. ads/dataset/exception.py +25 -0
  162. ads/dataset/factory.py +987 -0
  163. ads/dataset/feature_engineering_transformer.py +35 -0
  164. ads/dataset/feature_selection.py +107 -0
  165. ads/dataset/forecasting_dataset.py +26 -0
  166. ads/dataset/helper.py +1450 -0
  167. ads/dataset/label_encoder.py +99 -0
  168. ads/dataset/mixin/__init__.py +5 -0
  169. ads/dataset/mixin/dataset_accessor.py +134 -0
  170. ads/dataset/pipeline.py +58 -0
  171. ads/dataset/plot.py +710 -0
  172. ads/dataset/progress.py +86 -0
  173. ads/dataset/recommendation.py +297 -0
  174. ads/dataset/recommendation_transformer.py +502 -0
  175. ads/dataset/regression_dataset.py +14 -0
  176. ads/dataset/sampled_dataset.py +1050 -0
  177. ads/dataset/target.py +98 -0
  178. ads/dataset/timeseries.py +18 -0
  179. ads/dbmixin/__init__.py +5 -0
  180. ads/dbmixin/db_pandas_accessor.py +153 -0
  181. ads/environment/__init__.py +9 -0
  182. ads/environment/ml_runtime.py +66 -0
  183. ads/evaluations/README.md +14 -0
  184. ads/evaluations/__init__.py +109 -0
  185. ads/evaluations/evaluation_plot.py +983 -0
  186. ads/evaluations/evaluator.py +1334 -0
  187. ads/evaluations/statistical_metrics.py +543 -0
  188. ads/experiments/__init__.py +9 -0
  189. ads/experiments/capabilities.md +0 -0
  190. ads/explanations/__init__.py +21 -0
  191. ads/explanations/base_explainer.py +142 -0
  192. ads/explanations/capabilities.md +83 -0
  193. ads/explanations/explainer.py +190 -0
  194. ads/explanations/mlx_global_explainer.py +1050 -0
  195. ads/explanations/mlx_interface.py +386 -0
  196. ads/explanations/mlx_local_explainer.py +287 -0
  197. ads/explanations/mlx_whatif_explainer.py +201 -0
  198. ads/feature_engineering/__init__.py +20 -0
  199. ads/feature_engineering/accessor/__init__.py +5 -0
  200. ads/feature_engineering/accessor/dataframe_accessor.py +535 -0
  201. ads/feature_engineering/accessor/mixin/__init__.py +5 -0
  202. ads/feature_engineering/accessor/mixin/correlation.py +166 -0
  203. ads/feature_engineering/accessor/mixin/eda_mixin.py +266 -0
  204. ads/feature_engineering/accessor/mixin/eda_mixin_series.py +85 -0
  205. ads/feature_engineering/accessor/mixin/feature_types_mixin.py +211 -0
  206. ads/feature_engineering/accessor/mixin/utils.py +65 -0
  207. ads/feature_engineering/accessor/series_accessor.py +431 -0
  208. ads/feature_engineering/adsimage/__init__.py +5 -0
  209. ads/feature_engineering/adsimage/image.py +192 -0
  210. ads/feature_engineering/adsimage/image_reader.py +170 -0
  211. ads/feature_engineering/adsimage/interface/__init__.py +5 -0
  212. ads/feature_engineering/adsimage/interface/reader.py +19 -0
  213. ads/feature_engineering/adsstring/__init__.py +7 -0
  214. ads/feature_engineering/adsstring/oci_language/__init__.py +8 -0
  215. ads/feature_engineering/adsstring/string/__init__.py +8 -0
  216. ads/feature_engineering/data_schema.json +57 -0
  217. ads/feature_engineering/dataset/__init__.py +5 -0
  218. ads/feature_engineering/dataset/zip_code_data.py +42062 -0
  219. ads/feature_engineering/exceptions.py +40 -0
  220. ads/feature_engineering/feature_type/__init__.py +133 -0
  221. ads/feature_engineering/feature_type/address.py +184 -0
  222. ads/feature_engineering/feature_type/adsstring/__init__.py +5 -0
  223. ads/feature_engineering/feature_type/adsstring/common_regex_mixin.py +164 -0
  224. ads/feature_engineering/feature_type/adsstring/oci_language.py +93 -0
  225. ads/feature_engineering/feature_type/adsstring/parsers/__init__.py +5 -0
  226. ads/feature_engineering/feature_type/adsstring/parsers/base.py +47 -0
  227. ads/feature_engineering/feature_type/adsstring/parsers/nltk_parser.py +96 -0
  228. ads/feature_engineering/feature_type/adsstring/parsers/spacy_parser.py +221 -0
  229. ads/feature_engineering/feature_type/adsstring/string.py +258 -0
  230. ads/feature_engineering/feature_type/base.py +58 -0
  231. ads/feature_engineering/feature_type/boolean.py +183 -0
  232. ads/feature_engineering/feature_type/category.py +146 -0
  233. ads/feature_engineering/feature_type/constant.py +137 -0
  234. ads/feature_engineering/feature_type/continuous.py +151 -0
  235. ads/feature_engineering/feature_type/creditcard.py +314 -0
  236. ads/feature_engineering/feature_type/datetime.py +190 -0
  237. ads/feature_engineering/feature_type/discrete.py +134 -0
  238. ads/feature_engineering/feature_type/document.py +43 -0
  239. ads/feature_engineering/feature_type/gis.py +251 -0
  240. ads/feature_engineering/feature_type/handler/__init__.py +5 -0
  241. ads/feature_engineering/feature_type/handler/feature_validator.py +524 -0
  242. ads/feature_engineering/feature_type/handler/feature_warning.py +319 -0
  243. ads/feature_engineering/feature_type/handler/warnings.py +128 -0
  244. ads/feature_engineering/feature_type/integer.py +142 -0
  245. ads/feature_engineering/feature_type/ip_address.py +144 -0
  246. ads/feature_engineering/feature_type/ip_address_v4.py +138 -0
  247. ads/feature_engineering/feature_type/ip_address_v6.py +138 -0
  248. ads/feature_engineering/feature_type/lat_long.py +256 -0
  249. ads/feature_engineering/feature_type/object.py +43 -0
  250. ads/feature_engineering/feature_type/ordinal.py +132 -0
  251. ads/feature_engineering/feature_type/phone_number.py +135 -0
  252. ads/feature_engineering/feature_type/string.py +171 -0
  253. ads/feature_engineering/feature_type/text.py +93 -0
  254. ads/feature_engineering/feature_type/unknown.py +43 -0
  255. ads/feature_engineering/feature_type/zip_code.py +164 -0
  256. ads/feature_engineering/feature_type_manager.py +406 -0
  257. ads/feature_engineering/schema.py +795 -0
  258. ads/feature_engineering/utils.py +245 -0
  259. ads/feature_store/.readthedocs.yaml +19 -0
  260. ads/feature_store/README.md +65 -0
  261. ads/feature_store/__init__.py +9 -0
  262. ads/feature_store/common/__init__.py +0 -0
  263. ads/feature_store/common/enums.py +339 -0
  264. ads/feature_store/common/exceptions.py +18 -0
  265. ads/feature_store/common/spark_session_singleton.py +125 -0
  266. ads/feature_store/common/utils/__init__.py +0 -0
  267. ads/feature_store/common/utils/base64_encoder_decoder.py +72 -0
  268. ads/feature_store/common/utils/feature_schema_mapper.py +283 -0
  269. ads/feature_store/common/utils/transformation_utils.py +82 -0
  270. ads/feature_store/common/utils/utility.py +403 -0
  271. ads/feature_store/data_validation/__init__.py +0 -0
  272. ads/feature_store/data_validation/great_expectation.py +129 -0
  273. ads/feature_store/dataset.py +1230 -0
  274. ads/feature_store/dataset_job.py +530 -0
  275. ads/feature_store/docs/Dockerfile +7 -0
  276. ads/feature_store/docs/Makefile +44 -0
  277. ads/feature_store/docs/conf.py +28 -0
  278. ads/feature_store/docs/requirements.txt +14 -0
  279. ads/feature_store/docs/source/ads.feature_store.query.rst +20 -0
  280. ads/feature_store/docs/source/cicd.rst +137 -0
  281. ads/feature_store/docs/source/conf.py +86 -0
  282. ads/feature_store/docs/source/data_versioning.rst +33 -0
  283. ads/feature_store/docs/source/dataset.rst +388 -0
  284. ads/feature_store/docs/source/dataset_job.rst +27 -0
  285. ads/feature_store/docs/source/demo.rst +70 -0
  286. ads/feature_store/docs/source/entity.rst +78 -0
  287. ads/feature_store/docs/source/feature_group.rst +624 -0
  288. ads/feature_store/docs/source/feature_group_job.rst +29 -0
  289. ads/feature_store/docs/source/feature_store.rst +122 -0
  290. ads/feature_store/docs/source/feature_store_class.rst +123 -0
  291. ads/feature_store/docs/source/feature_validation.rst +66 -0
  292. ads/feature_store/docs/source/figures/cicd.png +0 -0
  293. ads/feature_store/docs/source/figures/data_validation.png +0 -0
  294. ads/feature_store/docs/source/figures/data_versioning.png +0 -0
  295. ads/feature_store/docs/source/figures/dataset.gif +0 -0
  296. ads/feature_store/docs/source/figures/dataset.png +0 -0
  297. ads/feature_store/docs/source/figures/dataset_lineage.png +0 -0
  298. ads/feature_store/docs/source/figures/dataset_statistics.png +0 -0
  299. ads/feature_store/docs/source/figures/dataset_statistics_viz.png +0 -0
  300. ads/feature_store/docs/source/figures/dataset_validation_results.png +0 -0
  301. ads/feature_store/docs/source/figures/dataset_validation_summary.png +0 -0
  302. ads/feature_store/docs/source/figures/drift_monitoring.png +0 -0
  303. ads/feature_store/docs/source/figures/entity.png +0 -0
  304. ads/feature_store/docs/source/figures/feature_group.png +0 -0
  305. ads/feature_store/docs/source/figures/feature_group_lineage.png +0 -0
  306. ads/feature_store/docs/source/figures/feature_group_statistics_viz.png +0 -0
  307. ads/feature_store/docs/source/figures/feature_store_deployment.png +0 -0
  308. ads/feature_store/docs/source/figures/feature_store_overview.png +0 -0
  309. ads/feature_store/docs/source/figures/featuregroup.gif +0 -0
  310. ads/feature_store/docs/source/figures/lineage_d1.png +0 -0
  311. ads/feature_store/docs/source/figures/lineage_d2.png +0 -0
  312. ads/feature_store/docs/source/figures/lineage_fg.png +0 -0
  313. ads/feature_store/docs/source/figures/logo-dark-mode.png +0 -0
  314. ads/feature_store/docs/source/figures/logo-light-mode.png +0 -0
  315. ads/feature_store/docs/source/figures/overview.png +0 -0
  316. ads/feature_store/docs/source/figures/resource_manager.png +0 -0
  317. ads/feature_store/docs/source/figures/resource_manager_feature_store_stack.png +0 -0
  318. ads/feature_store/docs/source/figures/resource_manager_home.png +0 -0
  319. ads/feature_store/docs/source/figures/stats_1.png +0 -0
  320. ads/feature_store/docs/source/figures/stats_2.png +0 -0
  321. ads/feature_store/docs/source/figures/stats_d.png +0 -0
  322. ads/feature_store/docs/source/figures/stats_fg.png +0 -0
  323. ads/feature_store/docs/source/figures/transformation.png +0 -0
  324. ads/feature_store/docs/source/figures/transformations.gif +0 -0
  325. ads/feature_store/docs/source/figures/validation.png +0 -0
  326. ads/feature_store/docs/source/figures/validation_fg.png +0 -0
  327. ads/feature_store/docs/source/figures/validation_results.png +0 -0
  328. ads/feature_store/docs/source/figures/validation_summary.png +0 -0
  329. ads/feature_store/docs/source/index.rst +81 -0
  330. ads/feature_store/docs/source/module.rst +8 -0
  331. ads/feature_store/docs/source/notebook.rst +94 -0
  332. ads/feature_store/docs/source/overview.rst +47 -0
  333. ads/feature_store/docs/source/quickstart.rst +176 -0
  334. ads/feature_store/docs/source/release_notes.rst +194 -0
  335. ads/feature_store/docs/source/setup_feature_store.rst +81 -0
  336. ads/feature_store/docs/source/statistics.rst +58 -0
  337. ads/feature_store/docs/source/transformation.rst +199 -0
  338. ads/feature_store/docs/source/ui.rst +65 -0
  339. ads/feature_store/docs/source/user_guides.setup.feature_store_operator.rst +66 -0
  340. ads/feature_store/docs/source/user_guides.setup.helm_chart.rst +192 -0
  341. ads/feature_store/docs/source/user_guides.setup.terraform.rst +338 -0
  342. ads/feature_store/entity.py +718 -0
  343. ads/feature_store/execution_strategy/__init__.py +0 -0
  344. ads/feature_store/execution_strategy/delta_lake/__init__.py +0 -0
  345. ads/feature_store/execution_strategy/delta_lake/delta_lake_service.py +375 -0
  346. ads/feature_store/execution_strategy/engine/__init__.py +0 -0
  347. ads/feature_store/execution_strategy/engine/spark_engine.py +316 -0
  348. ads/feature_store/execution_strategy/execution_strategy.py +113 -0
  349. ads/feature_store/execution_strategy/execution_strategy_provider.py +47 -0
  350. ads/feature_store/execution_strategy/spark/__init__.py +0 -0
  351. ads/feature_store/execution_strategy/spark/spark_execution.py +618 -0
  352. ads/feature_store/feature.py +192 -0
  353. ads/feature_store/feature_group.py +1494 -0
  354. ads/feature_store/feature_group_expectation.py +346 -0
  355. ads/feature_store/feature_group_job.py +602 -0
  356. ads/feature_store/feature_lineage/__init__.py +0 -0
  357. ads/feature_store/feature_lineage/graphviz_service.py +180 -0
  358. ads/feature_store/feature_option_details.py +50 -0
  359. ads/feature_store/feature_statistics/__init__.py +0 -0
  360. ads/feature_store/feature_statistics/statistics_service.py +99 -0
  361. ads/feature_store/feature_store.py +699 -0
  362. ads/feature_store/feature_store_registrar.py +518 -0
  363. ads/feature_store/input_feature_detail.py +149 -0
  364. ads/feature_store/mixin/__init__.py +4 -0
  365. ads/feature_store/mixin/oci_feature_store.py +145 -0
  366. ads/feature_store/model_details.py +73 -0
  367. ads/feature_store/query/__init__.py +0 -0
  368. ads/feature_store/query/filter.py +266 -0
  369. ads/feature_store/query/generator/__init__.py +0 -0
  370. ads/feature_store/query/generator/query_generator.py +298 -0
  371. ads/feature_store/query/join.py +161 -0
  372. ads/feature_store/query/query.py +403 -0
  373. ads/feature_store/query/validator/__init__.py +0 -0
  374. ads/feature_store/query/validator/query_validator.py +57 -0
  375. ads/feature_store/response/__init__.py +0 -0
  376. ads/feature_store/response/response_builder.py +68 -0
  377. ads/feature_store/service/__init__.py +0 -0
  378. ads/feature_store/service/oci_dataset.py +139 -0
  379. ads/feature_store/service/oci_dataset_job.py +199 -0
  380. ads/feature_store/service/oci_entity.py +125 -0
  381. ads/feature_store/service/oci_feature_group.py +164 -0
  382. ads/feature_store/service/oci_feature_group_job.py +214 -0
  383. ads/feature_store/service/oci_feature_store.py +182 -0
  384. ads/feature_store/service/oci_lineage.py +87 -0
  385. ads/feature_store/service/oci_transformation.py +104 -0
  386. ads/feature_store/statistics/__init__.py +0 -0
  387. ads/feature_store/statistics/abs_feature_value.py +49 -0
  388. ads/feature_store/statistics/charts/__init__.py +0 -0
  389. ads/feature_store/statistics/charts/abstract_feature_plot.py +37 -0
  390. ads/feature_store/statistics/charts/box_plot.py +148 -0
  391. ads/feature_store/statistics/charts/frequency_distribution.py +65 -0
  392. ads/feature_store/statistics/charts/probability_distribution.py +68 -0
  393. ads/feature_store/statistics/charts/top_k_frequent_elements.py +98 -0
  394. ads/feature_store/statistics/feature_stat.py +126 -0
  395. ads/feature_store/statistics/generic_feature_value.py +33 -0
  396. ads/feature_store/statistics/statistics.py +41 -0
  397. ads/feature_store/statistics_config.py +101 -0
  398. ads/feature_store/templates/feature_store_template.yaml +45 -0
  399. ads/feature_store/transformation.py +499 -0
  400. ads/feature_store/validation_output.py +57 -0
  401. ads/hpo/__init__.py +9 -0
  402. ads/hpo/_imports.py +91 -0
  403. ads/hpo/ads_search_space.py +439 -0
  404. ads/hpo/distributions.py +325 -0
  405. ads/hpo/objective.py +280 -0
  406. ads/hpo/search_cv.py +1657 -0
  407. ads/hpo/stopping_criterion.py +75 -0
  408. ads/hpo/tuner_artifact.py +413 -0
  409. ads/hpo/utils.py +91 -0
  410. ads/hpo/validation.py +140 -0
  411. ads/hpo/visualization/__init__.py +5 -0
  412. ads/hpo/visualization/_contour.py +23 -0
  413. ads/hpo/visualization/_edf.py +20 -0
  414. ads/hpo/visualization/_intermediate_values.py +21 -0
  415. ads/hpo/visualization/_optimization_history.py +25 -0
  416. ads/hpo/visualization/_parallel_coordinate.py +169 -0
  417. ads/hpo/visualization/_param_importances.py +26 -0
  418. ads/jobs/__init__.py +53 -0
  419. ads/jobs/ads_job.py +663 -0
  420. ads/jobs/builders/__init__.py +5 -0
  421. ads/jobs/builders/base.py +156 -0
  422. ads/jobs/builders/infrastructure/__init__.py +6 -0
  423. ads/jobs/builders/infrastructure/base.py +165 -0
  424. ads/jobs/builders/infrastructure/dataflow.py +1252 -0
  425. ads/jobs/builders/infrastructure/dsc_job.py +1894 -0
  426. ads/jobs/builders/infrastructure/dsc_job_runtime.py +1233 -0
  427. ads/jobs/builders/infrastructure/utils.py +65 -0
  428. ads/jobs/builders/runtimes/__init__.py +5 -0
  429. ads/jobs/builders/runtimes/artifact.py +338 -0
  430. ads/jobs/builders/runtimes/base.py +325 -0
  431. ads/jobs/builders/runtimes/container_runtime.py +242 -0
  432. ads/jobs/builders/runtimes/python_runtime.py +1016 -0
  433. ads/jobs/builders/runtimes/pytorch_runtime.py +204 -0
  434. ads/jobs/cli.py +104 -0
  435. ads/jobs/env_var_parser.py +131 -0
  436. ads/jobs/extension.py +160 -0
  437. ads/jobs/schema/__init__.py +5 -0
  438. ads/jobs/schema/infrastructure_schema.json +116 -0
  439. ads/jobs/schema/job_schema.json +42 -0
  440. ads/jobs/schema/runtime_schema.json +183 -0
  441. ads/jobs/schema/validator.py +141 -0
  442. ads/jobs/serializer.py +296 -0
  443. ads/jobs/templates/__init__.py +5 -0
  444. ads/jobs/templates/container.py +6 -0
  445. ads/jobs/templates/driver_notebook.py +177 -0
  446. ads/jobs/templates/driver_oci.py +500 -0
  447. ads/jobs/templates/driver_python.py +48 -0
  448. ads/jobs/templates/driver_pytorch.py +852 -0
  449. ads/jobs/templates/driver_utils.py +615 -0
  450. ads/jobs/templates/hostname_from_env.c +55 -0
  451. ads/jobs/templates/oci_metrics.py +181 -0
  452. ads/jobs/utils.py +104 -0
  453. ads/llm/__init__.py +28 -0
  454. ads/llm/autogen/__init__.py +2 -0
  455. ads/llm/autogen/constants.py +15 -0
  456. ads/llm/autogen/reports/__init__.py +2 -0
  457. ads/llm/autogen/reports/base.py +67 -0
  458. ads/llm/autogen/reports/data.py +103 -0
  459. ads/llm/autogen/reports/session.py +526 -0
  460. ads/llm/autogen/reports/templates/chat_box.html +13 -0
  461. ads/llm/autogen/reports/templates/chat_box_lt.html +5 -0
  462. ads/llm/autogen/reports/templates/chat_box_rt.html +6 -0
  463. ads/llm/autogen/reports/utils.py +56 -0
  464. ads/llm/autogen/v02/__init__.py +4 -0
  465. ads/llm/autogen/v02/client.py +295 -0
  466. ads/llm/autogen/v02/log_handlers/__init__.py +2 -0
  467. ads/llm/autogen/v02/log_handlers/oci_file_handler.py +83 -0
  468. ads/llm/autogen/v02/loggers/__init__.py +6 -0
  469. ads/llm/autogen/v02/loggers/metric_logger.py +320 -0
  470. ads/llm/autogen/v02/loggers/session_logger.py +580 -0
  471. ads/llm/autogen/v02/loggers/utils.py +86 -0
  472. ads/llm/autogen/v02/runtime_logging.py +163 -0
  473. ads/llm/chain.py +268 -0
  474. ads/llm/chat_template.py +31 -0
  475. ads/llm/deploy.py +63 -0
  476. ads/llm/guardrails/__init__.py +5 -0
  477. ads/llm/guardrails/base.py +442 -0
  478. ads/llm/guardrails/huggingface.py +44 -0
  479. ads/llm/langchain/__init__.py +5 -0
  480. ads/llm/langchain/plugins/__init__.py +5 -0
  481. ads/llm/langchain/plugins/chat_models/__init__.py +5 -0
  482. ads/llm/langchain/plugins/chat_models/oci_data_science.py +1027 -0
  483. ads/llm/langchain/plugins/embeddings/__init__.py +4 -0
  484. ads/llm/langchain/plugins/embeddings/oci_data_science_model_deployment_endpoint.py +184 -0
  485. ads/llm/langchain/plugins/llms/__init__.py +5 -0
  486. ads/llm/langchain/plugins/llms/oci_data_science_model_deployment_endpoint.py +979 -0
  487. ads/llm/requirements.txt +3 -0
  488. ads/llm/serialize.py +219 -0
  489. ads/llm/serializers/__init__.py +0 -0
  490. ads/llm/serializers/retrieval_qa.py +153 -0
  491. ads/llm/serializers/runnable_parallel.py +27 -0
  492. ads/llm/templates/score_chain.jinja2 +155 -0
  493. ads/llm/templates/tool_chat_template_hermes.jinja +130 -0
  494. ads/llm/templates/tool_chat_template_mistral_parallel.jinja +94 -0
  495. ads/model/__init__.py +52 -0
  496. ads/model/artifact.py +573 -0
  497. ads/model/artifact_downloader.py +254 -0
  498. ads/model/artifact_uploader.py +267 -0
  499. ads/model/base_properties.py +238 -0
  500. ads/model/common/.model-ignore +66 -0
  501. ads/model/common/__init__.py +5 -0
  502. ads/model/common/utils.py +142 -0
  503. ads/model/datascience_model.py +2635 -0
  504. ads/model/deployment/__init__.py +20 -0
  505. ads/model/deployment/common/__init__.py +5 -0
  506. ads/model/deployment/common/utils.py +308 -0
  507. ads/model/deployment/model_deployer.py +466 -0
  508. ads/model/deployment/model_deployment.py +1846 -0
  509. ads/model/deployment/model_deployment_infrastructure.py +671 -0
  510. ads/model/deployment/model_deployment_properties.py +493 -0
  511. ads/model/deployment/model_deployment_runtime.py +838 -0
  512. ads/model/extractor/__init__.py +5 -0
  513. ads/model/extractor/automl_extractor.py +74 -0
  514. ads/model/extractor/embedding_onnx_extractor.py +80 -0
  515. ads/model/extractor/huggingface_extractor.py +88 -0
  516. ads/model/extractor/keras_extractor.py +84 -0
  517. ads/model/extractor/lightgbm_extractor.py +93 -0
  518. ads/model/extractor/model_info_extractor.py +114 -0
  519. ads/model/extractor/model_info_extractor_factory.py +105 -0
  520. ads/model/extractor/pytorch_extractor.py +87 -0
  521. ads/model/extractor/sklearn_extractor.py +112 -0
  522. ads/model/extractor/spark_extractor.py +89 -0
  523. ads/model/extractor/tensorflow_extractor.py +85 -0
  524. ads/model/extractor/xgboost_extractor.py +94 -0
  525. ads/model/framework/__init__.py +5 -0
  526. ads/model/framework/automl_model.py +178 -0
  527. ads/model/framework/embedding_onnx_model.py +438 -0
  528. ads/model/framework/huggingface_model.py +399 -0
  529. ads/model/framework/lightgbm_model.py +266 -0
  530. ads/model/framework/pytorch_model.py +266 -0
  531. ads/model/framework/sklearn_model.py +250 -0
  532. ads/model/framework/spark_model.py +326 -0
  533. ads/model/framework/tensorflow_model.py +254 -0
  534. ads/model/framework/xgboost_model.py +258 -0
  535. ads/model/generic_model.py +3518 -0
  536. ads/model/model_artifact_boilerplate/README.md +381 -0
  537. ads/model/model_artifact_boilerplate/__init__.py +5 -0
  538. ads/model/model_artifact_boilerplate/artifact_introspection_test/__init__.py +5 -0
  539. ads/model/model_artifact_boilerplate/artifact_introspection_test/model_artifact_validate.py +427 -0
  540. ads/model/model_artifact_boilerplate/artifact_introspection_test/requirements.txt +2 -0
  541. ads/model/model_artifact_boilerplate/runtime.yaml +7 -0
  542. ads/model/model_artifact_boilerplate/score.py +61 -0
  543. ads/model/model_file_description_schema.json +68 -0
  544. ads/model/model_introspect.py +331 -0
  545. ads/model/model_metadata.py +1810 -0
  546. ads/model/model_metadata_mixin.py +460 -0
  547. ads/model/model_properties.py +63 -0
  548. ads/model/model_version_set.py +739 -0
  549. ads/model/runtime/__init__.py +5 -0
  550. ads/model/runtime/env_info.py +306 -0
  551. ads/model/runtime/model_deployment_details.py +37 -0
  552. ads/model/runtime/model_provenance_details.py +58 -0
  553. ads/model/runtime/runtime_info.py +81 -0
  554. ads/model/runtime/schemas/inference_env_info_schema.yaml +16 -0
  555. ads/model/runtime/schemas/model_provenance_schema.yaml +36 -0
  556. ads/model/runtime/schemas/training_env_info_schema.yaml +16 -0
  557. ads/model/runtime/utils.py +201 -0
  558. ads/model/serde/__init__.py +5 -0
  559. ads/model/serde/common.py +40 -0
  560. ads/model/serde/model_input.py +547 -0
  561. ads/model/serde/model_serializer.py +1184 -0
  562. ads/model/service/__init__.py +5 -0
  563. ads/model/service/oci_datascience_model.py +1076 -0
  564. ads/model/service/oci_datascience_model_deployment.py +500 -0
  565. ads/model/service/oci_datascience_model_version_set.py +176 -0
  566. ads/model/transformer/__init__.py +5 -0
  567. ads/model/transformer/onnx_transformer.py +324 -0
  568. ads/mysqldb/__init__.py +5 -0
  569. ads/mysqldb/mysql_db.py +227 -0
  570. ads/opctl/__init__.py +18 -0
  571. ads/opctl/anomaly_detection.py +11 -0
  572. ads/opctl/backend/__init__.py +5 -0
  573. ads/opctl/backend/ads_dataflow.py +353 -0
  574. ads/opctl/backend/ads_ml_job.py +710 -0
  575. ads/opctl/backend/ads_ml_pipeline.py +164 -0
  576. ads/opctl/backend/ads_model_deployment.py +209 -0
  577. ads/opctl/backend/base.py +146 -0
  578. ads/opctl/backend/local.py +1053 -0
  579. ads/opctl/backend/marketplace/__init__.py +9 -0
  580. ads/opctl/backend/marketplace/helm_helper.py +173 -0
  581. ads/opctl/backend/marketplace/local_marketplace.py +271 -0
  582. ads/opctl/backend/marketplace/marketplace_backend_runner.py +71 -0
  583. ads/opctl/backend/marketplace/marketplace_operator_interface.py +44 -0
  584. ads/opctl/backend/marketplace/marketplace_operator_runner.py +24 -0
  585. ads/opctl/backend/marketplace/marketplace_utils.py +212 -0
  586. ads/opctl/backend/marketplace/models/__init__.py +5 -0
  587. ads/opctl/backend/marketplace/models/bearer_token.py +94 -0
  588. ads/opctl/backend/marketplace/models/marketplace_type.py +70 -0
  589. ads/opctl/backend/marketplace/models/ocir_details.py +56 -0
  590. ads/opctl/backend/marketplace/prerequisite_checker.py +238 -0
  591. ads/opctl/cli.py +707 -0
  592. ads/opctl/cmds.py +869 -0
  593. ads/opctl/conda/__init__.py +5 -0
  594. ads/opctl/conda/cli.py +193 -0
  595. ads/opctl/conda/cmds.py +749 -0
  596. ads/opctl/conda/config.yaml +34 -0
  597. ads/opctl/conda/manifest_template.yaml +13 -0
  598. ads/opctl/conda/multipart_uploader.py +188 -0
  599. ads/opctl/conda/pack.py +89 -0
  600. ads/opctl/config/__init__.py +5 -0
  601. ads/opctl/config/base.py +57 -0
  602. ads/opctl/config/diagnostics/__init__.py +5 -0
  603. ads/opctl/config/diagnostics/distributed/default_requirements_config.yaml +62 -0
  604. ads/opctl/config/merger.py +255 -0
  605. ads/opctl/config/resolver.py +297 -0
  606. ads/opctl/config/utils.py +79 -0
  607. ads/opctl/config/validator.py +17 -0
  608. ads/opctl/config/versioner.py +68 -0
  609. ads/opctl/config/yaml_parsers/__init__.py +7 -0
  610. ads/opctl/config/yaml_parsers/base.py +58 -0
  611. ads/opctl/config/yaml_parsers/distributed/__init__.py +7 -0
  612. ads/opctl/config/yaml_parsers/distributed/yaml_parser.py +201 -0
  613. ads/opctl/constants.py +66 -0
  614. ads/opctl/decorator/__init__.py +5 -0
  615. ads/opctl/decorator/common.py +129 -0
  616. ads/opctl/diagnostics/__init__.py +5 -0
  617. ads/opctl/diagnostics/__main__.py +25 -0
  618. ads/opctl/diagnostics/check_distributed_job_requirements.py +212 -0
  619. ads/opctl/diagnostics/check_requirements.py +144 -0
  620. ads/opctl/diagnostics/requirement_exception.py +9 -0
  621. ads/opctl/distributed/README.md +109 -0
  622. ads/opctl/distributed/__init__.py +5 -0
  623. ads/opctl/distributed/certificates.py +32 -0
  624. ads/opctl/distributed/cli.py +207 -0
  625. ads/opctl/distributed/cmds.py +731 -0
  626. ads/opctl/distributed/common/__init__.py +5 -0
  627. ads/opctl/distributed/common/abstract_cluster_provider.py +449 -0
  628. ads/opctl/distributed/common/abstract_framework_spec_builder.py +88 -0
  629. ads/opctl/distributed/common/cluster_config_helper.py +103 -0
  630. ads/opctl/distributed/common/cluster_provider_factory.py +21 -0
  631. ads/opctl/distributed/common/cluster_runner.py +54 -0
  632. ads/opctl/distributed/common/framework_factory.py +29 -0
  633. ads/opctl/docker/Dockerfile.job +103 -0
  634. ads/opctl/docker/Dockerfile.job.arm +107 -0
  635. ads/opctl/docker/Dockerfile.job.gpu +175 -0
  636. ads/opctl/docker/base-env.yaml +13 -0
  637. ads/opctl/docker/cuda.repo +6 -0
  638. ads/opctl/docker/operator/.dockerignore +0 -0
  639. ads/opctl/docker/operator/Dockerfile +41 -0
  640. ads/opctl/docker/operator/Dockerfile.gpu +85 -0
  641. ads/opctl/docker/operator/cuda.repo +6 -0
  642. ads/opctl/docker/operator/environment.yaml +8 -0
  643. ads/opctl/forecast.py +11 -0
  644. ads/opctl/index.yaml +3 -0
  645. ads/opctl/model/__init__.py +5 -0
  646. ads/opctl/model/cli.py +65 -0
  647. ads/opctl/model/cmds.py +73 -0
  648. ads/opctl/operator/README.md +4 -0
  649. ads/opctl/operator/__init__.py +31 -0
  650. ads/opctl/operator/cli.py +344 -0
  651. ads/opctl/operator/cmd.py +596 -0
  652. ads/opctl/operator/common/__init__.py +5 -0
  653. ads/opctl/operator/common/backend_factory.py +460 -0
  654. ads/opctl/operator/common/const.py +27 -0
  655. ads/opctl/operator/common/data/synthetic.csv +16001 -0
  656. ads/opctl/operator/common/dictionary_merger.py +148 -0
  657. ads/opctl/operator/common/errors.py +42 -0
  658. ads/opctl/operator/common/operator_config.py +99 -0
  659. ads/opctl/operator/common/operator_loader.py +811 -0
  660. ads/opctl/operator/common/operator_schema.yaml +130 -0
  661. ads/opctl/operator/common/operator_yaml_generator.py +152 -0
  662. ads/opctl/operator/common/utils.py +208 -0
  663. ads/opctl/operator/lowcode/__init__.py +5 -0
  664. ads/opctl/operator/lowcode/anomaly/MLoperator +16 -0
  665. ads/opctl/operator/lowcode/anomaly/README.md +207 -0
  666. ads/opctl/operator/lowcode/anomaly/__init__.py +5 -0
  667. ads/opctl/operator/lowcode/anomaly/__main__.py +103 -0
  668. ads/opctl/operator/lowcode/anomaly/cmd.py +35 -0
  669. ads/opctl/operator/lowcode/anomaly/const.py +167 -0
  670. ads/opctl/operator/lowcode/anomaly/environment.yaml +10 -0
  671. ads/opctl/operator/lowcode/anomaly/model/__init__.py +5 -0
  672. ads/opctl/operator/lowcode/anomaly/model/anomaly_dataset.py +146 -0
  673. ads/opctl/operator/lowcode/anomaly/model/anomaly_merlion.py +162 -0
  674. ads/opctl/operator/lowcode/anomaly/model/automlx.py +99 -0
  675. ads/opctl/operator/lowcode/anomaly/model/autots.py +115 -0
  676. ads/opctl/operator/lowcode/anomaly/model/base_model.py +404 -0
  677. ads/opctl/operator/lowcode/anomaly/model/factory.py +110 -0
  678. ads/opctl/operator/lowcode/anomaly/model/isolationforest.py +78 -0
  679. ads/opctl/operator/lowcode/anomaly/model/oneclasssvm.py +78 -0
  680. ads/opctl/operator/lowcode/anomaly/model/randomcutforest.py +120 -0
  681. ads/opctl/operator/lowcode/anomaly/model/tods.py +119 -0
  682. ads/opctl/operator/lowcode/anomaly/operator_config.py +127 -0
  683. ads/opctl/operator/lowcode/anomaly/schema.yaml +401 -0
  684. ads/opctl/operator/lowcode/anomaly/utils.py +88 -0
  685. ads/opctl/operator/lowcode/common/__init__.py +5 -0
  686. ads/opctl/operator/lowcode/common/const.py +10 -0
  687. ads/opctl/operator/lowcode/common/data.py +116 -0
  688. ads/opctl/operator/lowcode/common/errors.py +47 -0
  689. ads/opctl/operator/lowcode/common/transformations.py +296 -0
  690. ads/opctl/operator/lowcode/common/utils.py +384 -0
  691. ads/opctl/operator/lowcode/feature_store_marketplace/MLoperator +13 -0
  692. ads/opctl/operator/lowcode/feature_store_marketplace/README.md +30 -0
  693. ads/opctl/operator/lowcode/feature_store_marketplace/__init__.py +5 -0
  694. ads/opctl/operator/lowcode/feature_store_marketplace/__main__.py +116 -0
  695. ads/opctl/operator/lowcode/feature_store_marketplace/cmd.py +85 -0
  696. ads/opctl/operator/lowcode/feature_store_marketplace/const.py +15 -0
  697. ads/opctl/operator/lowcode/feature_store_marketplace/environment.yaml +0 -0
  698. ads/opctl/operator/lowcode/feature_store_marketplace/models/__init__.py +4 -0
  699. ads/opctl/operator/lowcode/feature_store_marketplace/models/apigw_config.py +32 -0
  700. ads/opctl/operator/lowcode/feature_store_marketplace/models/db_config.py +43 -0
  701. ads/opctl/operator/lowcode/feature_store_marketplace/models/mysql_config.py +120 -0
  702. ads/opctl/operator/lowcode/feature_store_marketplace/models/serializable_yaml_model.py +34 -0
  703. ads/opctl/operator/lowcode/feature_store_marketplace/operator_utils.py +386 -0
  704. ads/opctl/operator/lowcode/feature_store_marketplace/schema.yaml +160 -0
  705. ads/opctl/operator/lowcode/forecast/MLoperator +25 -0
  706. ads/opctl/operator/lowcode/forecast/README.md +209 -0
  707. ads/opctl/operator/lowcode/forecast/__init__.py +5 -0
  708. ads/opctl/operator/lowcode/forecast/__main__.py +89 -0
  709. ads/opctl/operator/lowcode/forecast/cmd.py +40 -0
  710. ads/opctl/operator/lowcode/forecast/const.py +92 -0
  711. ads/opctl/operator/lowcode/forecast/environment.yaml +20 -0
  712. ads/opctl/operator/lowcode/forecast/errors.py +26 -0
  713. ads/opctl/operator/lowcode/forecast/model/__init__.py +5 -0
  714. ads/opctl/operator/lowcode/forecast/model/arima.py +279 -0
  715. ads/opctl/operator/lowcode/forecast/model/automlx.py +553 -0
  716. ads/opctl/operator/lowcode/forecast/model/autots.py +312 -0
  717. ads/opctl/operator/lowcode/forecast/model/base_model.py +875 -0
  718. ads/opctl/operator/lowcode/forecast/model/factory.py +106 -0
  719. ads/opctl/operator/lowcode/forecast/model/forecast_datasets.py +492 -0
  720. ads/opctl/operator/lowcode/forecast/model/ml_forecast.py +243 -0
  721. ads/opctl/operator/lowcode/forecast/model/neuralprophet.py +482 -0
  722. ads/opctl/operator/lowcode/forecast/model/prophet.py +450 -0
  723. ads/opctl/operator/lowcode/forecast/model_evaluator.py +244 -0
  724. ads/opctl/operator/lowcode/forecast/operator_config.py +234 -0
  725. ads/opctl/operator/lowcode/forecast/schema.yaml +506 -0
  726. ads/opctl/operator/lowcode/forecast/utils.py +397 -0
  727. ads/opctl/operator/lowcode/forecast/whatifserve/__init__.py +7 -0
  728. ads/opctl/operator/lowcode/forecast/whatifserve/deployment_manager.py +285 -0
  729. ads/opctl/operator/lowcode/forecast/whatifserve/score.py +246 -0
  730. ads/opctl/operator/lowcode/pii/MLoperator +17 -0
  731. ads/opctl/operator/lowcode/pii/README.md +208 -0
  732. ads/opctl/operator/lowcode/pii/__init__.py +5 -0
  733. ads/opctl/operator/lowcode/pii/__main__.py +78 -0
  734. ads/opctl/operator/lowcode/pii/cmd.py +39 -0
  735. ads/opctl/operator/lowcode/pii/constant.py +84 -0
  736. ads/opctl/operator/lowcode/pii/environment.yaml +17 -0
  737. ads/opctl/operator/lowcode/pii/errors.py +27 -0
  738. ads/opctl/operator/lowcode/pii/model/__init__.py +5 -0
  739. ads/opctl/operator/lowcode/pii/model/factory.py +82 -0
  740. ads/opctl/operator/lowcode/pii/model/guardrails.py +167 -0
  741. ads/opctl/operator/lowcode/pii/model/pii.py +145 -0
  742. ads/opctl/operator/lowcode/pii/model/processor/__init__.py +34 -0
  743. ads/opctl/operator/lowcode/pii/model/processor/email_replacer.py +34 -0
  744. ads/opctl/operator/lowcode/pii/model/processor/mbi_replacer.py +35 -0
  745. ads/opctl/operator/lowcode/pii/model/processor/name_replacer.py +225 -0
  746. ads/opctl/operator/lowcode/pii/model/processor/number_replacer.py +73 -0
  747. ads/opctl/operator/lowcode/pii/model/processor/remover.py +26 -0
  748. ads/opctl/operator/lowcode/pii/model/report.py +487 -0
  749. ads/opctl/operator/lowcode/pii/operator_config.py +95 -0
  750. ads/opctl/operator/lowcode/pii/schema.yaml +108 -0
  751. ads/opctl/operator/lowcode/pii/utils.py +43 -0
  752. ads/opctl/operator/lowcode/recommender/MLoperator +16 -0
  753. ads/opctl/operator/lowcode/recommender/README.md +206 -0
  754. ads/opctl/operator/lowcode/recommender/__init__.py +5 -0
  755. ads/opctl/operator/lowcode/recommender/__main__.py +82 -0
  756. ads/opctl/operator/lowcode/recommender/cmd.py +33 -0
  757. ads/opctl/operator/lowcode/recommender/constant.py +30 -0
  758. ads/opctl/operator/lowcode/recommender/environment.yaml +11 -0
  759. ads/opctl/operator/lowcode/recommender/model/base_model.py +212 -0
  760. ads/opctl/operator/lowcode/recommender/model/factory.py +56 -0
  761. ads/opctl/operator/lowcode/recommender/model/recommender_dataset.py +25 -0
  762. ads/opctl/operator/lowcode/recommender/model/svd.py +106 -0
  763. ads/opctl/operator/lowcode/recommender/operator_config.py +81 -0
  764. ads/opctl/operator/lowcode/recommender/schema.yaml +265 -0
  765. ads/opctl/operator/lowcode/recommender/utils.py +13 -0
  766. ads/opctl/operator/runtime/__init__.py +5 -0
  767. ads/opctl/operator/runtime/const.py +17 -0
  768. ads/opctl/operator/runtime/container_runtime_schema.yaml +50 -0
  769. ads/opctl/operator/runtime/marketplace_runtime.py +50 -0
  770. ads/opctl/operator/runtime/python_marketplace_runtime_schema.yaml +21 -0
  771. ads/opctl/operator/runtime/python_runtime_schema.yaml +21 -0
  772. ads/opctl/operator/runtime/runtime.py +115 -0
  773. ads/opctl/schema.yaml.yml +36 -0
  774. ads/opctl/script.py +40 -0
  775. ads/opctl/spark/__init__.py +5 -0
  776. ads/opctl/spark/cli.py +43 -0
  777. ads/opctl/spark/cmds.py +147 -0
  778. ads/opctl/templates/diagnostic_report_template.jinja2 +102 -0
  779. ads/opctl/utils.py +344 -0
  780. ads/oracledb/__init__.py +5 -0
  781. ads/oracledb/oracle_db.py +346 -0
  782. ads/pipeline/__init__.py +39 -0
  783. ads/pipeline/ads_pipeline.py +2279 -0
  784. ads/pipeline/ads_pipeline_run.py +772 -0
  785. ads/pipeline/ads_pipeline_step.py +605 -0
  786. ads/pipeline/builders/__init__.py +5 -0
  787. ads/pipeline/builders/infrastructure/__init__.py +5 -0
  788. ads/pipeline/builders/infrastructure/custom_script.py +32 -0
  789. ads/pipeline/cli.py +119 -0
  790. ads/pipeline/extension.py +291 -0
  791. ads/pipeline/schema/__init__.py +5 -0
  792. ads/pipeline/schema/cs_step_schema.json +35 -0
  793. ads/pipeline/schema/ml_step_schema.json +31 -0
  794. ads/pipeline/schema/pipeline_schema.json +71 -0
  795. ads/pipeline/visualizer/__init__.py +5 -0
  796. ads/pipeline/visualizer/base.py +570 -0
  797. ads/pipeline/visualizer/graph_renderer.py +272 -0
  798. ads/pipeline/visualizer/text_renderer.py +84 -0
  799. ads/secrets/__init__.py +11 -0
  800. ads/secrets/adb.py +386 -0
  801. ads/secrets/auth_token.py +86 -0
  802. ads/secrets/big_data_service.py +365 -0
  803. ads/secrets/mysqldb.py +149 -0
  804. ads/secrets/oracledb.py +160 -0
  805. ads/secrets/secrets.py +407 -0
  806. ads/telemetry/__init__.py +7 -0
  807. ads/telemetry/base.py +69 -0
  808. ads/telemetry/client.py +122 -0
  809. ads/telemetry/telemetry.py +257 -0
  810. ads/templates/dataflow_pyspark.jinja2 +13 -0
  811. ads/templates/dataflow_sparksql.jinja2 +22 -0
  812. ads/templates/func.jinja2 +20 -0
  813. ads/templates/schemas/openapi.json +1740 -0
  814. ads/templates/score-pkl.jinja2 +173 -0
  815. ads/templates/score.jinja2 +322 -0
  816. ads/templates/score_embedding_onnx.jinja2 +202 -0
  817. ads/templates/score_generic.jinja2 +165 -0
  818. ads/templates/score_huggingface_pipeline.jinja2 +217 -0
  819. ads/templates/score_lightgbm.jinja2 +185 -0
  820. ads/templates/score_onnx.jinja2 +407 -0
  821. ads/templates/score_onnx_new.jinja2 +473 -0
  822. ads/templates/score_oracle_automl.jinja2 +185 -0
  823. ads/templates/score_pyspark.jinja2 +154 -0
  824. ads/templates/score_pytorch.jinja2 +219 -0
  825. ads/templates/score_scikit-learn.jinja2 +184 -0
  826. ads/templates/score_tensorflow.jinja2 +184 -0
  827. ads/templates/score_xgboost.jinja2 +178 -0
  828. ads/text_dataset/__init__.py +5 -0
  829. ads/text_dataset/backends.py +211 -0
  830. ads/text_dataset/dataset.py +445 -0
  831. ads/text_dataset/extractor.py +207 -0
  832. ads/text_dataset/options.py +53 -0
  833. ads/text_dataset/udfs.py +22 -0
  834. ads/text_dataset/utils.py +49 -0
  835. ads/type_discovery/__init__.py +9 -0
  836. ads/type_discovery/abstract_detector.py +21 -0
  837. ads/type_discovery/constant_detector.py +41 -0
  838. ads/type_discovery/continuous_detector.py +54 -0
  839. ads/type_discovery/credit_card_detector.py +99 -0
  840. ads/type_discovery/datetime_detector.py +92 -0
  841. ads/type_discovery/discrete_detector.py +118 -0
  842. ads/type_discovery/document_detector.py +146 -0
  843. ads/type_discovery/ip_detector.py +68 -0
  844. ads/type_discovery/latlon_detector.py +90 -0
  845. ads/type_discovery/phone_number_detector.py +63 -0
  846. ads/type_discovery/type_discovery_driver.py +87 -0
  847. ads/type_discovery/typed_feature.py +594 -0
  848. ads/type_discovery/unknown_detector.py +41 -0
  849. ads/type_discovery/zipcode_detector.py +48 -0
  850. ads/vault/__init__.py +7 -0
  851. ads/vault/vault.py +237 -0
  852. {oracle_ads-2.13.9rc0.dist-info → oracle_ads-2.13.10.dist-info}/METADATA +150 -149
  853. oracle_ads-2.13.10.dist-info/RECORD +858 -0
  854. {oracle_ads-2.13.9rc0.dist-info → oracle_ads-2.13.10.dist-info}/WHEEL +1 -2
  855. {oracle_ads-2.13.9rc0.dist-info → oracle_ads-2.13.10.dist-info}/entry_points.txt +2 -1
  856. oracle_ads-2.13.9rc0.dist-info/RECORD +0 -9
  857. oracle_ads-2.13.9rc0.dist-info/top_level.txt +0 -1
  858. {oracle_ads-2.13.9rc0.dist-info → oracle_ads-2.13.10.dist-info}/licenses/LICENSE.txt +0 -0
@@ -0,0 +1,795 @@
1
+ #!/usr/bin/env python
2
+ # -*- coding: utf-8 -*--
3
+
4
+ # Copyright (c) 2021, 2022 Oracle and/or its affiliates.
5
+ # Licensed under the Universal Permissive License v 1.0 as shown at https://oss.oracle.com/licenses/upl/
6
+
7
+ import asteval
8
+ import fsspec
9
+ import json
10
+ import os
11
+ import sys
12
+ import yaml
13
+ from abc import ABC, abstractmethod
14
+ from cerberus import Validator
15
+ from copy import deepcopy
16
+ from dataclasses import dataclass, field
17
+ from typing import Dict, List, Optional
18
+ from string import Template
19
+ from os import path
20
+ from ads.common.serializer import DataClassSerializable
21
+ from ads.common.object_storage_details import ObjectStorageDetails
22
+
23
+ try:
24
+ from yaml import CDumper as dumper
25
+ from yaml import CLoader as loader
26
+ except:
27
+ from yaml import Dumper as dumper
28
+ from yaml import Loader as loader
29
+
30
# File name of the JSON validation rules; BaseSchemaLoader resolves it relative
# to the directory that contains this module.
SCHEMA_VALIDATOR_NAME = "data_schema.json"
# Maximum schema size in bytes, as reported in the SchemaSizeTooLarge message.
INPUT_OUTPUT_SCHENA_SIZE_LIMIT = 32000
# Version assigned by default to a newly created Schema.
SCHEMA_VERSION = "1.1"
# Version assumed when a loaded schema document carries no version entry.
DEFAULT_SCHEMA_VERSION = "1.0"
# Top-level key under which the list of attribute definitions is stored.
SCHEMA_KEY = "schema"
# Top-level key under which the schema version is stored.
SCHEMA_VERSION_KEY = "version"
# NOTE(review): not referenced in the visible part of this file; presumably the
# default storage options used when reading/writing schema files - confirm.
DEFAULT_STORAGE_OPTIONS = None
37
+
38
+
39
class SchemaSizeTooLarge(ValueError):
    """Raised when a schema is larger than the permitted size.

    Parameters
    ----------
    size: int
        Size of the offending schema in bytes. The limit quoted in the
        message is `INPUT_OUTPUT_SCHENA_SIZE_LIMIT`.
    """

    def __init__(self, size: int):
        message = (
            f"The schema `{size}` bytes and "
            f"the maximum allowable schema size is `{INPUT_OUTPUT_SCHENA_SIZE_LIMIT}` bytes. "
            "Reduce the size of the schema."
        )
        super().__init__(message)
46
+
47
+
48
class DataSizeTooWide(ValueError):
    """Raised when the data has more columns than the configured maximum.

    Parameters
    ----------
    data_col_num: int
        Number of columns found in the data.
    max_col_num: int
        Maximum number of columns that is currently allowed.
    """

    def __init__(self, data_col_num: int, max_col_num: int):
        message = (
            f"The data has `{data_col_num}` columns and "
            f"the maximum allowable number of columns is `{max_col_num}`. "
            "Increase allowable number of columns by setting a larger max_col_num. It will take longer time to prepare."
        )
        super().__init__(message)
55
+
56
+
57
@dataclass(repr=False)
class Expression(DataClassSerializable):
    """
    Expression holds the string representation of an expression together with
    the language it is written in (the `language` attribute).

    Default value for language is python.

    Parameters
    ----------
    expression: str
        The expression text. Must use string.Template format (``$name``
        placeholders) for the values that are substituted by `evaluate`.
    language: str
        Default value is python. It could be any language, but the `evaluate`
        method only supports expressions written in python.

    Examples
    --------
    >>> exp = Expression("($x > 10 and $x <100) or ($x < -1 and $x > -500)")
    >>> exp.evaluate(x=500)
    False
    >>> exp.evaluate(x=20)
    True
    >>> exp.evaluate(x=9)
    False
    >>> exp.evaluate(x=-9)
    True
    """

    expression: str
    language: str = "python"

    def evaluate(self, **kwargs):
        """Substitutes the given values into the expression and evaluates it.

        Parameters
        ----------
        kwargs
            Values for the ``$name`` placeholders used in the expression.

        Returns
        -------
        The value produced by the asteval interpreter for the substituted
        expression.

        Raises
        ------
        Exception
            If the language is not python, or if the placeholders cannot be
            substituted with the provided values.
        """
        if self.language.lower() != "python":
            # Plain `{...}` placeholder: the former `${...}` leaked a literal
            # dollar sign into the message.
            raise Exception(
                f"Evaluation not supported for language {self.language}. Supported language: python"
            )

        try:
            final_expression = Template(self.expression).substitute(kwargs)
        except Exception as ex:
            # Catch `Exception` rather than everything so that interpreter
            # exits and keyboard interrupts propagate; keep the cause chained.
            raise Exception(
                "Error substituting the value into the expression. Check if the variable in the expression matches the parameter names passed to evaluate method"
            ) from ex

        aeval = asteval.Interpreter()
        return aeval(final_expression)

    def __post_init__(self):
        # Both fields are mandatory; empty strings are rejected as well.
        if not self.expression or not self.language:
            raise ValueError(
                "An Expression object requires values for both expression and language"
            )
108
+
109
+
110
@dataclass(repr=False)
class Domain(DataClassSerializable):
    """Describes the data held by a column/feature.

    Attributes
    ----------
    values: str
        Description of the domain values. Defaults to an empty string.
    stats: Dict
        Statistics of the data. Defaults to an empty dictionary.
    constraints: List[Expression]
        Expressions which define the constraints for the data. Defaults to an
        empty list.

    Examples
    --------

    >>> Domain(values='Rational Numbers', stats={"mean":50, "median":51, "min": 5, "max":100}, constraints=[Expression('$x > 5')])
    constraints:
    - expression: $x > 5
      language: python
    stats:
      max: 100
      mean: 50
      median: 51
      min: 5
    values: Rational Numbers
    """

    values: str = ""
    # Each instance gets its own container, hence the factories.
    stats: Dict = field(default_factory=dict)
    constraints: List[Expression] = field(default_factory=list)
135
+
136
+
137
@dataclass(repr=False, order=True)
class Attribute(DataClassSerializable):
    """
    Describes a single column/feature/element of the data.

    Attributes
    ----------
    dtype: str
        Type of data - float, int64, etc. Matches with Pandas dtypes.
    feature_type: str
        Feature type of data - Integer, String, etc. Matches with ads feature types.
    name: str
        Name of the feature. Also exposed through the `key` property.
    domain: Domain
        Represented by the Domain class.
    required: bool
        True or False.
    description: str
        Description about the column/feature.
    order: Optional[int]
        Order of the column/feature in the data.

    Examples
    --------

    >>> attr_fruits = Attribute(
    ...     dtype = "category",
    ...     feature_type = "category",
    ...     name = "fruits",
    ...     domain = Domain(values="Apple, Orange, Grapes", stats={"mode": "Orange"}, constraints=[Expression("in ['Apple', 'Orange', 'Grapes']")]),
    ...     required = True,
    ...     description = "Names of fruits",
    ...     order = 0
    ... )
    >>> attr_fruits
    description: Names of fruits
    domain:
      constraints:
      - expression: in ['Apple', 'Orange', 'Grapes']
        language: python
      stats:
        mode: Orange
      values: Apple, Orange, Grapes
    dtype: category
    feature_type: category
    name: fruits
    order: 0
    required: true
    >>> attr_fruits.key
    'fruits'
    """

    # Declared first so that the generated ordering methods compare it first;
    # it is filled in by __post_init__ and never passed to the constructor.
    sort_index: int = field(init=False, repr=False)
    dtype: str
    feature_type: str
    name: str
    domain: Domain
    required: bool
    description: str
    order: Optional[int] = None

    @property
    def key(self):
        """The identifier of the attribute, which is its name."""
        return self.name

    def to_dict(self, **kwargs) -> dict:
        """Serializes the attribute into a dictionary without the helper `sort_index` entry."""
        serialized = super().to_dict(**kwargs)
        # `sort_index` exists only for ordering and is not part of the schema.
        serialized.pop("sort_index", None)
        return serialized

    def __hash__(self):
        # Hash by key only.
        return hash(self.key)

    def __post_init__(self):
        # A missing (None) order is treated as position 0.
        position = self.order or 0
        object.__setattr__(self, "sort_index", position)
202
+
203
+
204
class BaseSchemaLoader(ABC):
    """
    Base Schema Loader which loads and validates a schema.

    Subclasses implement `_load_schema` to read the raw schema document into
    `self._schema`.

    Methods
    -------
    load_schema(self, schema_path)
        Load and validate schema from a file and return the normalized schema.
    """

    def __init__(self):
        self._schema = None

    def load_schema(self, schema_path):
        """Load and validate schema from a file and return the normalized schema.

        Parameters
        ----------
        schema_path
            Location of the schema file, handed to `_load_schema`.

        Returns
        -------
        dict
            Dictionary with the validated attribute definitions under
            `SCHEMA_KEY` and the schema version under `SCHEMA_VERSION_KEY`.

        Raises
        ------
        ValueError
            If one of the attribute definitions does not pass validation.
        """
        self._load_schema(schema_path)
        self._normalize()
        return self._validate()

    def _normalize(self):
        """Lower-cases the top-level keys of the loaded schema."""
        self._schema = {key.lower(): value for key, value in self._schema.items()}

    @abstractmethod
    def _load_schema(self, schema_path):
        """Reads the schema document at `schema_path` into `self._schema`."""
        pass

    def _validate(self):
        """Validate the schema.

        Every item stored under `SCHEMA_KEY` is checked against the validation
        rules; the normalized items replace the loaded schema.

        Raises
        ------
        ValueError
            With a JSON report (column name and errors) for the first item
            that does not pass validation.
        """
        v = Validator(self._load_schema_validator())
        normalized_items = []
        for item in self._schema[SCHEMA_KEY]:
            if not v.validate(item):
                # `name` may itself be the missing field; `.get` keeps the
                # validation report from being replaced by a KeyError.
                new_dict = {"column": item.get("name"), "error": v.errors}
                raise ValueError(json.dumps(new_dict, indent=2))
            normalized_items.append(v.normalized(item))
        # Documents without a (non-empty) version fall back to the default.
        schema_version = self._schema.get(SCHEMA_VERSION_KEY) or DEFAULT_SCHEMA_VERSION
        self._schema = {
            SCHEMA_KEY: normalized_items,
            SCHEMA_VERSION_KEY: schema_version,
        }
        return self._schema

    @staticmethod
    def _load_schema_validator():
        """Loads the validation rules from the JSON file located next to this module."""
        validator_path = os.path.join(
            os.path.dirname(os.path.abspath(__file__)), SCHEMA_VALIDATOR_NAME
        )
        # Explicit encoding so the result does not depend on the platform default.
        with open(validator_path, encoding="utf-8") as schema_file:
            return json.load(schema_file)
258
+
259
+
260
class JsonSchemaLoader(BaseSchemaLoader):
    """
    Schema loader which reads the schema from a json file.

    Methods
    -------
    load_schema(self, schema_path)
        Load and validate schema from json file and return the normalized schema.

    Examples
    --------
    >>> schema_loader = JsonSchemaLoader()
    >>> schema_dict = schema_loader.load_schema('schema.json')
    >>> sorted(schema_dict)
    ['schema', 'version']
    """

    def _load_schema(self, schema_path):
        """Reads the json document at `schema_path` into `self._schema`.

        Raises
        ------
        AssertionError
            If the file extension is not `.json`.
        FileNotFoundError
            If `schema_path` does not exist.
        """
        extension = os.path.splitext(schema_path)[-1].lower()
        assert extension in [".json"], "Expecting a json format file."
        if not path.exists(schema_path):
            raise FileNotFoundError(f"{schema_path} does not exist")
        with fsspec.open(schema_path, mode="r", encoding="utf8") as schema_file:
            self._schema = json.load(schema_file)
308
+
309
+
310
class YamlSchemaLoader(BaseSchemaLoader):
    """
    Schema loader which reads the schema from a yaml file.

    Methods
    -------
    load_schema(self, schema_path)
        Loads and validates schema from a yaml file and returns the normalized schema.

    Examples
    --------
    >>> schema_loader = YamlSchemaLoader()
    >>> schema_dict = schema_loader.load_schema('schema.yaml')
    >>> sorted(schema_dict)
    ['schema', 'version']
    """

    def _load_schema(self, schema_path):
        """Reads the yaml document at `schema_path` into `self._schema`.

        Two layouts are accepted: a file whose content is a YAML string that
        itself contains the schema document, and a file that holds the schema
        mapping directly.

        Raises
        ------
        AssertionError
            If the file extension is neither `.yaml` nor `.yml`.
        FileNotFoundError
            If `schema_path` does not exist.
        yaml.YAMLError
            If the content is not valid yaml.
        """
        assert os.path.splitext(schema_path)[-1].lower() in [
            ".yaml",
            ".yml",
        ], "Expecting yaml format file."
        if not path.exists(schema_path):
            raise FileNotFoundError(f"{schema_path} does not exist")
        with open(schema_path, "r") as stream:
            document = yaml.safe_load(stream)
        if isinstance(document, str):
            # The file stored the schema as a YAML-encoded string: decode the
            # inner document as before.
            # NOTE(review): `yaml.load` with the full loader can construct
            # arbitrary objects; consider `yaml.safe_load` if schema files may
            # come from untrusted sources.
            document = yaml.load(document, Loader=loader)
        # Otherwise the file already contained the schema mapping; feeding the
        # parsed object back into `yaml.load` would fail.
        self._schema = document
362
+
363
+
364
class SchemaFactory:
    """
    Registry which maps a file format to the schema loader handling it.

    Methods
    -------
    register_format(self, file_format, creator)
        Register a new type of schema class.
    get_schema(self, file_format)
        Get the YamlSchema or JsonSchema based on the format.
    default_schema(cls)
        Construct a SchemaFactory instance and register yaml and json loader.

    Examples
    --------
    >>> factory = SchemaFactory.default_schema()
    >>> schema_loader = factory.get_schema('.json')
    >>> schema_dict = schema_loader.load_schema('schema.json')
    >>> schema = Schema.from_dict(schema_dict)
    """

    def __init__(self):
        # Maps a file format (e.g. ".json") to the callable creating its loader.
        self._creators = {}

    def register_format(self, file_format, creator):
        """Register a new type of schema class.

        An existing registration for the same format is overwritten.
        """
        self._creators[file_format] = creator

    def get_schema(self, file_format):
        """Get the YamlSchema or JsonSchema based on the format.

        Raises
        ------
        ValueError
            If no loader is registered for `file_format`.
        """
        creator = self._creators.get(file_format)
        if creator:
            return creator()
        raise ValueError(
            f"This {file_format} format is not supported. Pass Json or Yaml Files."
        )

    @classmethod
    def default_schema(cls):
        """Construct a SchemaFactory instance and register yaml and json loader."""
        factory = cls()
        defaults = (
            (".json", JsonSchemaLoader),
            (".yaml", YamlSchemaLoader),
            (".yml", YamlSchemaLoader),
        )
        for file_format, creator in defaults:
            factory.register_format(file_format, creator)
        return factory
438
+
439
+
440
+ @dataclass(repr=False)
441
+ class Schema:
442
+ """
443
+ Schema describes the structure of the data.
444
+
445
+ Methods
446
+ -------
447
+ add(self, item: Attribute, replace: bool = False)
448
+ Adds a new attribute item. Replaces existing one if replace flag is True.
449
+ from_dict(self)
450
+ Constructs an instance of Schema from a dictionary.
451
+ from_file(cls, file_path):
452
+ Loads the data schema from a file.
453
+ to_dict(self)
454
+ Serializes the data schema into a dictionary.
455
+ to_yaml(self)
456
+ Serializes the data schema into a YAML.
457
+ to_json(self)
458
+ Serializes the data schema into a json string.
459
+ to_json_file(self)
460
+ Saves the data schema into a json file.
461
+ to_yaml_file(self)
462
+ Save to a yaml file.
463
+ add(self, item: Attribute, replace=False) -> None
464
+ Adds a new attribute item. Replaces existing one if replace flag is True.
465
+
466
+ Examples
467
+ --------
468
+
469
+ >>> attr_fruits = Attribute(
470
+ ... dtype = "category",
471
+ ... feature_type = "category",
472
+ ... name = "fruits",
473
+ ... domain = Domain(values="Apple, Orange, Grapes", stats={"mode": "Orange"}, constraints=[Expression("in ['Apple', 'Orange', 'Grapes']")]),
474
+ ... required = True,
475
+ ... description = "Names of fruits",
476
+ ... order = 0,
477
+ ... )
478
+ >>> attr_animals = Attribute(
479
+ ... dtype = "category",
480
+ ... feature_type = "category",
481
+ ... name = "animals",
482
+ ... domain = Domain(values="Dog, Cat, Python", stats={"mode": "Dog"}, constraints=[Expression("in ['Dog', 'Cat', 'Python']")]),
483
+ ... required = True,
484
+ ... description = "Names of animals",
485
+ ... order = 1,
486
+ ... )
487
+ >>> schema = Schema()
488
+ >>> schema.add(attr_fruits)
489
+ >>> schema.add(attr_animals)
490
+ >>> schema
491
+ schema:
492
+ - description: Names of fruits
493
+ domain:
494
+ constraints:
495
+ - expression: in ['Apple', 'Orange', 'Grapes']
496
+ language: python
497
+ stats:
498
+ mode: Orange
499
+ values: Apple, Orange, Grapes
500
+ dtype: category
501
+ feature_type: category
502
+ name: fruits
503
+ order: 0
504
+ required: true
505
+ - description: Names of animals
506
+ domain:
507
+ constraints:
508
+ - expression: in ['Dog', 'Cat', 'Python']
509
+ language: python
510
+ stats:
511
+ mode: Dog
512
+ values: Dog, Cat, Python
513
+ dtype: category
514
+ feature_type: category
515
+ name: animals
516
+ order: 1
517
+ required: true
518
+ >>> schema.to_dict()
519
+ {'schema': [{'dtype': 'category',
520
+ 'feature_type': 'category',
521
+ 'name': 'fruits',
522
+ 'domain': {'values': 'Apple, Orange, Grapes',
523
+ 'stats': {'mode': 'Orange'},
524
+ 'constraints': [{'expression': "in ['Apple', 'Orange', 'Grapes']",
525
+ 'language': 'python'}]},
526
+ 'required': True,
527
+ 'description': 'Names of fruits',
528
+ 'order': 0},
529
+ {'dtype': 'category',
530
+ 'feature_type': 'category',
531
+ 'name': 'animals',
532
+ 'domain': {'values': 'Dog, Cat, Python',
533
+ 'stats': {'mode': 'Dog'},
534
+ 'constraints': [{'expression': "in ['Dog', 'Cat', 'Python']",
535
+ 'language': 'python'}]},
536
+ 'required': True,
537
+ 'description': 'Names of animals',
538
+ 'order': 1}]}
539
+
540
+ """
541
+
542
+ _schema: set = field(default_factory=set, init=False)
543
+ _version: str = SCHEMA_VERSION
544
+
545
def add(self, item: Attribute, replace: bool = False):
    """Registers an attribute item in the schema.

    Parameters
    ----------
    item : Attribute
        The attribute instance of a column/feature/element.
    replace : bool
        When True, an attribute already registered under the same key is
        overwritten instead of triggering an error.

    Returns
    -------
    None
        Nothing.

    Raises
    ------
    TypeError
        If `item` is not an instance of Attribute.
    ValueError
        If the key of `item` is already registered and `replace` is False.
    """
    if not isinstance(item, Attribute):
        raise TypeError("Argument must be an instance of the class Attribute.")
    if not replace:
        # The duplicate lookup is only needed when overwriting is not allowed.
        if item.key in self.keys:
            raise ValueError(
                f"The key {item.key} already exists. Use `replace=True` to overwrite."
            )
    # Remove any element that compares equal to `item` first, so the set ends
    # up holding the instance that was just passed in.
    registry = self._schema
    registry.discard(item)
    registry.add(item)
577
+
578
@property
def keys(self) -> tuple:
    """Returns all registered Attribute keys.

    Returns
    -------
    Tuple[str]
        The keys of the registered attributes, in the order produced by
        iterating over the schema.
    """
    return tuple(item.key for item in self)
588
+
589
@classmethod
def from_dict(cls, schema: dict):
    """Constructs an instance of Schema from a dictionary.

    Parameters
    ----------
    schema : dict
        Data schema in dictionary format. Top-level keys are matched
        case-insensitively. An empty dictionary yields an empty schema.

    Returns
    -------
    Schema
        An instance of Schema.

    Raises
    ------
    TypeError
        If `schema` is not a dictionary.
    KeyError
        If the schema key is missing at the top level, or an item has no
        "domain" entry.
    """
    sc = cls()

    if schema == {}:
        return sc
    if not isinstance(schema, dict):
        raise TypeError("schema has to be of dictionary type.")

    # Work on a deep copy with lower-cased top-level keys, so the caller's
    # dictionary is never mutated by the `item["domain"]` assignment below.
    schema = {key.lower(): value for key, value in deepcopy(schema).items()}
    for item in schema[SCHEMA_KEY]:
        raw_domain = item["domain"]
        domain = Domain(**raw_domain)
        # Rebuild the constraints as Expression objects. A missing or null
        # "constraints" entry is treated as "no constraints" rather than
        # failing with KeyError/TypeError.
        domain.constraints = [
            Expression(**constraint)
            for constraint in raw_domain.get("constraints") or ()
        ]
        item["domain"] = domain
        sc.add(Attribute(**item))
    return sc
619
+
620
@classmethod
def from_json(cls, schema: str):
    """Constructs an instance of Schema from a Json.

    Parameters
    ----------
    schema : str
        Data schema in Json format.

    Returns
    -------
    Schema
        An instance of the class the method is called on.
    """
    # Dispatch through `cls` (not the hard-coded base class) so that a
    # subclass gets an instance of itself, like the other constructors.
    return cls.from_dict(json.loads(schema))
635
+
636
@classmethod
def from_file(cls, file_path: str):
    """Loads the data schema from a file.

    The loader is selected from the file extension of `file_path`.

    Parameters
    ----------
    file_path : str
        File Path to load the data schema.

    Returns
    -------
    Schema
        An instance of Schema.
    """
    _, extension = os.path.splitext(file_path)
    loader = SchemaFactory.default_schema().get_schema(extension)
    raw_schema = loader.load_schema(file_path)
    return cls.from_dict(raw_schema)
653
+
654
def to_dict(self):
    """Serializes data schema into a dictionary.

    Returns
    -------
    dict
        The dictionary representation of data schema: the serialized
        attributes under the schema key, plus the schema version.
    """
    attributes = [attribute.to_dict() for attribute in self]
    return {SCHEMA_KEY: attributes, SCHEMA_VERSION_KEY: self._version}
666
+
667
def to_yaml(self):
    """Serializes the data schema into a YAML.

    Returns
    -------
    str
        The yaml representation of data schema.
    """
    as_dict = self.to_dict()
    return yaml.dump(as_dict, Dumper=dumper)
675
+
676
def to_json(self):
    """Serializes the data schema into a json string.

    NaN float values are emitted as ``null``. The conversion is applied to
    the values before dumping, so string values that merely contain the
    text "NaN" are left untouched.

    Returns
    -------
    str
        The json representation of data schema.
    """

    def _nan_to_none(value):
        # NaN is the only float value that is not equal to itself.
        if isinstance(value, float) and value != value:
            return None
        if isinstance(value, dict):
            return {key: _nan_to_none(item) for key, item in value.items()}
        if isinstance(value, (list, tuple)):
            return [_nan_to_none(item) for item in value]
        return value

    return json.dumps(_nan_to_none(self.to_dict()))
684
+
685
def to_json_file(self, file_path, storage_options: dict = None):
    """Saves the data schema into a json file.

    Parameters
    ----------
    file_path : str
        File Path to store the schema in json format.
    storage_options: dict. Default None
        Parameters passed on to the backend filesystem class.
        Defaults to `storage_options` set using `DatasetFactory.set_default_storage()`.

    Returns
    -------
    None
        Nothing.

    Raises
    ------
    AssertionError
        If `file_path` does not have the extension .json.
    Exception
        If the target directory is missing and cannot be created.
    """
    directory = os.path.expanduser(os.path.dirname(file_path))
    basename = os.path.expanduser(os.path.basename(file_path))
    # NOTE: kept as an assert so callers still see AssertionError; be aware
    # that the check is skipped when Python runs with -O.
    assert os.path.splitext(file_path)[-1].lower() in [
        ".json"
    ], f"The file `{basename}` is not a valid JSON file. The `{file_path}` must have the extension .json."
    # A missing directory is only created when the path is not an OCI path.
    if (
        directory
        and not os.path.exists(directory)
        and not ObjectStorageDetails.is_oci_path(directory)
    ):
        try:
            # makedirs also creates missing intermediate directories.
            os.makedirs(directory, exist_ok=True)
        except Exception as err:
            # Same exception type and message as before, with the original
            # cause attached for debugging.
            raise Exception("Error creating the directory.") from err
    if not storage_options:
        storage_options = DEFAULT_STORAGE_OPTIONS or {"config": {}}
    with fsspec.open(
        os.path.join(directory, basename),
        mode="w",
        **(storage_options),
    ) as f:
        f.write(json.dumps(self.to_dict()))
720
+
721
def to_yaml_file(self, file_path):
    """Saves the data schema into a yaml file.

    Parameters
    ----------
    file_path : str
        File Path to store the schema in yaml format.

    Returns
    -------
    None
        Nothing.

    Raises
    ------
    AssertionError
        If `file_path` does not have the extension .yaml or .yml.
    Exception
        If the target directory is missing and cannot be created.
    """
    # NOTE: kept as an assert so callers still see AssertionError; be aware
    # that the check is skipped when Python runs with -O.
    assert os.path.splitext(file_path)[-1] in [
        ".yaml",
        ".yml",
    ], "The `file_path` must have the extension .yaml or .yml."
    directory = os.path.expanduser(os.path.dirname(file_path))
    basename = os.path.expanduser(os.path.basename(file_path))
    if directory and not os.path.exists(directory):
        try:
            # makedirs also creates missing intermediate directories.
            os.makedirs(directory, exist_ok=True)
        except Exception as err:
            # Same exception type and message as before, with the original
            # cause attached for debugging.
            raise Exception("Error creating the directory.") from err
    with open(os.path.join(directory, basename), "w") as yaml_file:
        # NOTE(review): this dumps the YAML *string* returned by to_yaml(),
        # so the file holds a YAML-encoded string rather than a mapping.
        # Left unchanged because the matching loader is not visible here -
        # confirm before altering the on-disk format.
        yaml.dump(self.to_yaml(), yaml_file, default_flow_style=True)
746
+
747
def validate_size(self) -> bool:
    """Validates schema size.

    Measures the YAML representation of the schema with `sys.getsizeof`
    (the size of the string object, not its encoded length) and compares
    it with the configured limit.

    Returns
    -------
    bool
        True if schema does not exceed the size limit.

    Raises
    ------
    SchemaSizeTooLarge
        If the size of the schema exceeds expected value.
    """
    # Serialize once and reuse the measurement for both the check and the error.
    schema_size = sys.getsizeof(self.to_yaml())
    if schema_size > INPUT_OUTPUT_SCHENA_SIZE_LIMIT:
        raise SchemaSizeTooLarge(schema_size)
    return True
766
+
767
def validate_schema(self):
    """Validate the schema.

    Each serialized attribute is checked against the validator definition
    returned by `BaseSchemaLoader._load_schema_validator()`.

    Returns
    -------
    bool
        True if every attribute passes validation.

    Raises
    ------
    ValueError
        On the first attribute that fails validation. The message is a JSON
        document with the attribute name and the validator errors.
    """
    validator = Validator(BaseSchemaLoader._load_schema_validator())
    for attribute in self.to_dict()[SCHEMA_KEY]:
        if validator.validate(attribute):
            continue
        report = {"column": attribute["name"], "error": validator.errors}
        raise ValueError(json.dumps(report, indent=2))
    return True
777
+
778
def __getitem__(self, key: str):
    """Returns the registered attribute that has the given key.

    Parameters
    ----------
    key : str
        The key of the attribute to look up.

    Returns
    -------
    Attribute
        The registered item whose `key` equals `key`.

    Raises
    ------
    ValueError
        If `key` is None or an empty string, or no attribute has that key.
    TypeError
        If `key` is not a string.
    """
    if key is None or key == "":
        raise ValueError(f"The key `{key}` must not be empty.")
    if not isinstance(key, str):
        # The exception used to be constructed without being raised, which
        # silently let non-string keys fall through to the lookup.
        raise TypeError(f"The key `{key}` must be a string.")
    for item in self._schema:
        if item.key == key:
            return item
    raise ValueError(f"The key {key} is not found.")
787
+
788
def __repr__(self):
    """Returns the YAML representation of the schema."""
    yaml_text = self.to_yaml()
    return yaml_text
790
+
791
def __iter__(self):
    """Iterates over the registered attributes in sorted order."""
    ordered = sorted(self._schema)
    return iter(ordered)
793
+
794
def __len__(self):
    """Returns the number of registered attributes."""
    registered = self._schema
    return len(registered)