oracle-ads 2.13.9rc0__py3-none-any.whl → 2.13.9rc1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (857)
  1. ads/aqua/__init__.py +40 -0
  2. ads/aqua/app.py +506 -0
  3. ads/aqua/cli.py +96 -0
  4. ads/aqua/client/__init__.py +3 -0
  5. ads/aqua/client/client.py +836 -0
  6. ads/aqua/client/openai_client.py +305 -0
  7. ads/aqua/common/__init__.py +5 -0
  8. ads/aqua/common/decorator.py +125 -0
  9. ads/aqua/common/entities.py +269 -0
  10. ads/aqua/common/enums.py +122 -0
  11. ads/aqua/common/errors.py +109 -0
  12. ads/aqua/common/utils.py +1285 -0
  13. ads/aqua/config/__init__.py +4 -0
  14. ads/aqua/config/container_config.py +248 -0
  15. ads/aqua/config/evaluation/__init__.py +4 -0
  16. ads/aqua/config/evaluation/evaluation_service_config.py +147 -0
  17. ads/aqua/config/utils/__init__.py +4 -0
  18. ads/aqua/config/utils/serializer.py +339 -0
  19. ads/aqua/constants.py +116 -0
  20. ads/aqua/data.py +14 -0
  21. ads/aqua/dummy_data/icon.txt +1 -0
  22. ads/aqua/dummy_data/oci_model_deployments.json +56 -0
  23. ads/aqua/dummy_data/oci_models.json +1 -0
  24. ads/aqua/dummy_data/readme.md +26 -0
  25. ads/aqua/evaluation/__init__.py +8 -0
  26. ads/aqua/evaluation/constants.py +53 -0
  27. ads/aqua/evaluation/entities.py +186 -0
  28. ads/aqua/evaluation/errors.py +70 -0
  29. ads/aqua/evaluation/evaluation.py +1814 -0
  30. ads/aqua/extension/__init__.py +42 -0
  31. ads/aqua/extension/aqua_ws_msg_handler.py +76 -0
  32. ads/aqua/extension/base_handler.py +90 -0
  33. ads/aqua/extension/common_handler.py +121 -0
  34. ads/aqua/extension/common_ws_msg_handler.py +36 -0
  35. ads/aqua/extension/deployment_handler.py +298 -0
  36. ads/aqua/extension/deployment_ws_msg_handler.py +54 -0
  37. ads/aqua/extension/errors.py +30 -0
  38. ads/aqua/extension/evaluation_handler.py +129 -0
  39. ads/aqua/extension/evaluation_ws_msg_handler.py +61 -0
  40. ads/aqua/extension/finetune_handler.py +96 -0
  41. ads/aqua/extension/model_handler.py +390 -0
  42. ads/aqua/extension/models/__init__.py +0 -0
  43. ads/aqua/extension/models/ws_models.py +145 -0
  44. ads/aqua/extension/models_ws_msg_handler.py +50 -0
  45. ads/aqua/extension/ui_handler.py +282 -0
  46. ads/aqua/extension/ui_websocket_handler.py +130 -0
  47. ads/aqua/extension/utils.py +133 -0
  48. ads/aqua/finetuning/__init__.py +7 -0
  49. ads/aqua/finetuning/constants.py +23 -0
  50. ads/aqua/finetuning/entities.py +181 -0
  51. ads/aqua/finetuning/finetuning.py +749 -0
  52. ads/aqua/model/__init__.py +8 -0
  53. ads/aqua/model/constants.py +60 -0
  54. ads/aqua/model/entities.py +385 -0
  55. ads/aqua/model/enums.py +32 -0
  56. ads/aqua/model/model.py +2114 -0
  57. ads/aqua/modeldeployment/__init__.py +8 -0
  58. ads/aqua/modeldeployment/constants.py +10 -0
  59. ads/aqua/modeldeployment/deployment.py +1326 -0
  60. ads/aqua/modeldeployment/entities.py +653 -0
  61. ads/aqua/modeldeployment/inference.py +74 -0
  62. ads/aqua/modeldeployment/utils.py +543 -0
  63. ads/aqua/resources/gpu_shapes_index.json +94 -0
  64. ads/aqua/server/__init__.py +4 -0
  65. ads/aqua/server/__main__.py +24 -0
  66. ads/aqua/server/app.py +47 -0
  67. ads/aqua/server/aqua_spec.yml +1291 -0
  68. ads/aqua/training/__init__.py +4 -0
  69. ads/aqua/training/exceptions.py +476 -0
  70. ads/aqua/ui.py +499 -0
  71. ads/automl/__init__.py +9 -0
  72. ads/automl/driver.py +330 -0
  73. ads/automl/provider.py +975 -0
  74. ads/bds/__init__.py +5 -0
  75. ads/bds/auth.py +127 -0
  76. ads/bds/big_data_service.py +255 -0
  77. ads/catalog/__init__.py +19 -0
  78. ads/catalog/model.py +1576 -0
  79. ads/catalog/notebook.py +461 -0
  80. ads/catalog/project.py +468 -0
  81. ads/catalog/summary.py +178 -0
  82. ads/common/__init__.py +11 -0
  83. ads/common/analyzer.py +65 -0
  84. ads/common/artifact/.model-ignore +63 -0
  85. ads/common/artifact/__init__.py +10 -0
  86. ads/common/auth.py +1122 -0
  87. ads/common/card_identifier.py +83 -0
  88. ads/common/config.py +647 -0
  89. ads/common/data.py +165 -0
  90. ads/common/decorator/__init__.py +9 -0
  91. ads/common/decorator/argument_to_case.py +88 -0
  92. ads/common/decorator/deprecate.py +69 -0
  93. ads/common/decorator/require_nonempty_arg.py +65 -0
  94. ads/common/decorator/runtime_dependency.py +178 -0
  95. ads/common/decorator/threaded.py +97 -0
  96. ads/common/decorator/utils.py +35 -0
  97. ads/common/dsc_file_system.py +303 -0
  98. ads/common/error.py +14 -0
  99. ads/common/extended_enum.py +81 -0
  100. ads/common/function/__init__.py +5 -0
  101. ads/common/function/fn_util.py +142 -0
  102. ads/common/function/func_conf.yaml +25 -0
  103. ads/common/ipython.py +76 -0
  104. ads/common/model.py +679 -0
  105. ads/common/model_artifact.py +1759 -0
  106. ads/common/model_artifact_schema.json +107 -0
  107. ads/common/model_export_util.py +664 -0
  108. ads/common/model_metadata.py +24 -0
  109. ads/common/object_storage_details.py +296 -0
  110. ads/common/oci_client.py +175 -0
  111. ads/common/oci_datascience.py +46 -0
  112. ads/common/oci_logging.py +1144 -0
  113. ads/common/oci_mixin.py +957 -0
  114. ads/common/oci_resource.py +136 -0
  115. ads/common/serializer.py +559 -0
  116. ads/common/utils.py +1852 -0
  117. ads/common/word_lists.py +1491 -0
  118. ads/common/work_request.py +189 -0
  119. ads/data_labeling/__init__.py +13 -0
  120. ads/data_labeling/boundingbox.py +253 -0
  121. ads/data_labeling/constants.py +47 -0
  122. ads/data_labeling/data_labeling_service.py +244 -0
  123. ads/data_labeling/interface/__init__.py +5 -0
  124. ads/data_labeling/interface/loader.py +16 -0
  125. ads/data_labeling/interface/parser.py +16 -0
  126. ads/data_labeling/interface/reader.py +23 -0
  127. ads/data_labeling/loader/__init__.py +5 -0
  128. ads/data_labeling/loader/file_loader.py +241 -0
  129. ads/data_labeling/metadata.py +110 -0
  130. ads/data_labeling/mixin/__init__.py +5 -0
  131. ads/data_labeling/mixin/data_labeling.py +232 -0
  132. ads/data_labeling/ner.py +129 -0
  133. ads/data_labeling/parser/__init__.py +5 -0
  134. ads/data_labeling/parser/dls_record_parser.py +388 -0
  135. ads/data_labeling/parser/export_metadata_parser.py +94 -0
  136. ads/data_labeling/parser/export_record_parser.py +473 -0
  137. ads/data_labeling/reader/__init__.py +5 -0
  138. ads/data_labeling/reader/dataset_reader.py +574 -0
  139. ads/data_labeling/reader/dls_record_reader.py +121 -0
  140. ads/data_labeling/reader/export_record_reader.py +62 -0
  141. ads/data_labeling/reader/jsonl_reader.py +75 -0
  142. ads/data_labeling/reader/metadata_reader.py +203 -0
  143. ads/data_labeling/reader/record_reader.py +263 -0
  144. ads/data_labeling/record.py +52 -0
  145. ads/data_labeling/visualizer/__init__.py +5 -0
  146. ads/data_labeling/visualizer/image_visualizer.py +525 -0
  147. ads/data_labeling/visualizer/text_visualizer.py +357 -0
  148. ads/database/__init__.py +5 -0
  149. ads/database/connection.py +338 -0
  150. ads/dataset/__init__.py +10 -0
  151. ads/dataset/capabilities.md +51 -0
  152. ads/dataset/classification_dataset.py +339 -0
  153. ads/dataset/correlation.py +226 -0
  154. ads/dataset/correlation_plot.py +563 -0
  155. ads/dataset/dask_series.py +173 -0
  156. ads/dataset/dataframe_transformer.py +110 -0
  157. ads/dataset/dataset.py +1979 -0
  158. ads/dataset/dataset_browser.py +360 -0
  159. ads/dataset/dataset_with_target.py +995 -0
  160. ads/dataset/exception.py +25 -0
  161. ads/dataset/factory.py +987 -0
  162. ads/dataset/feature_engineering_transformer.py +35 -0
  163. ads/dataset/feature_selection.py +107 -0
  164. ads/dataset/forecasting_dataset.py +26 -0
  165. ads/dataset/helper.py +1450 -0
  166. ads/dataset/label_encoder.py +99 -0
  167. ads/dataset/mixin/__init__.py +5 -0
  168. ads/dataset/mixin/dataset_accessor.py +134 -0
  169. ads/dataset/pipeline.py +58 -0
  170. ads/dataset/plot.py +710 -0
  171. ads/dataset/progress.py +86 -0
  172. ads/dataset/recommendation.py +297 -0
  173. ads/dataset/recommendation_transformer.py +502 -0
  174. ads/dataset/regression_dataset.py +14 -0
  175. ads/dataset/sampled_dataset.py +1050 -0
  176. ads/dataset/target.py +98 -0
  177. ads/dataset/timeseries.py +18 -0
  178. ads/dbmixin/__init__.py +5 -0
  179. ads/dbmixin/db_pandas_accessor.py +153 -0
  180. ads/environment/__init__.py +9 -0
  181. ads/environment/ml_runtime.py +66 -0
  182. ads/evaluations/README.md +14 -0
  183. ads/evaluations/__init__.py +109 -0
  184. ads/evaluations/evaluation_plot.py +983 -0
  185. ads/evaluations/evaluator.py +1334 -0
  186. ads/evaluations/statistical_metrics.py +543 -0
  187. ads/experiments/__init__.py +9 -0
  188. ads/experiments/capabilities.md +0 -0
  189. ads/explanations/__init__.py +21 -0
  190. ads/explanations/base_explainer.py +142 -0
  191. ads/explanations/capabilities.md +83 -0
  192. ads/explanations/explainer.py +190 -0
  193. ads/explanations/mlx_global_explainer.py +1050 -0
  194. ads/explanations/mlx_interface.py +386 -0
  195. ads/explanations/mlx_local_explainer.py +287 -0
  196. ads/explanations/mlx_whatif_explainer.py +201 -0
  197. ads/feature_engineering/__init__.py +20 -0
  198. ads/feature_engineering/accessor/__init__.py +5 -0
  199. ads/feature_engineering/accessor/dataframe_accessor.py +535 -0
  200. ads/feature_engineering/accessor/mixin/__init__.py +5 -0
  201. ads/feature_engineering/accessor/mixin/correlation.py +166 -0
  202. ads/feature_engineering/accessor/mixin/eda_mixin.py +266 -0
  203. ads/feature_engineering/accessor/mixin/eda_mixin_series.py +85 -0
  204. ads/feature_engineering/accessor/mixin/feature_types_mixin.py +211 -0
  205. ads/feature_engineering/accessor/mixin/utils.py +65 -0
  206. ads/feature_engineering/accessor/series_accessor.py +431 -0
  207. ads/feature_engineering/adsimage/__init__.py +5 -0
  208. ads/feature_engineering/adsimage/image.py +192 -0
  209. ads/feature_engineering/adsimage/image_reader.py +170 -0
  210. ads/feature_engineering/adsimage/interface/__init__.py +5 -0
  211. ads/feature_engineering/adsimage/interface/reader.py +19 -0
  212. ads/feature_engineering/adsstring/__init__.py +7 -0
  213. ads/feature_engineering/adsstring/oci_language/__init__.py +8 -0
  214. ads/feature_engineering/adsstring/string/__init__.py +8 -0
  215. ads/feature_engineering/data_schema.json +57 -0
  216. ads/feature_engineering/dataset/__init__.py +5 -0
  217. ads/feature_engineering/dataset/zip_code_data.py +42062 -0
  218. ads/feature_engineering/exceptions.py +40 -0
  219. ads/feature_engineering/feature_type/__init__.py +133 -0
  220. ads/feature_engineering/feature_type/address.py +184 -0
  221. ads/feature_engineering/feature_type/adsstring/__init__.py +5 -0
  222. ads/feature_engineering/feature_type/adsstring/common_regex_mixin.py +164 -0
  223. ads/feature_engineering/feature_type/adsstring/oci_language.py +93 -0
  224. ads/feature_engineering/feature_type/adsstring/parsers/__init__.py +5 -0
  225. ads/feature_engineering/feature_type/adsstring/parsers/base.py +47 -0
  226. ads/feature_engineering/feature_type/adsstring/parsers/nltk_parser.py +96 -0
  227. ads/feature_engineering/feature_type/adsstring/parsers/spacy_parser.py +221 -0
  228. ads/feature_engineering/feature_type/adsstring/string.py +258 -0
  229. ads/feature_engineering/feature_type/base.py +58 -0
  230. ads/feature_engineering/feature_type/boolean.py +183 -0
  231. ads/feature_engineering/feature_type/category.py +146 -0
  232. ads/feature_engineering/feature_type/constant.py +137 -0
  233. ads/feature_engineering/feature_type/continuous.py +151 -0
  234. ads/feature_engineering/feature_type/creditcard.py +314 -0
  235. ads/feature_engineering/feature_type/datetime.py +190 -0
  236. ads/feature_engineering/feature_type/discrete.py +134 -0
  237. ads/feature_engineering/feature_type/document.py +43 -0
  238. ads/feature_engineering/feature_type/gis.py +251 -0
  239. ads/feature_engineering/feature_type/handler/__init__.py +5 -0
  240. ads/feature_engineering/feature_type/handler/feature_validator.py +524 -0
  241. ads/feature_engineering/feature_type/handler/feature_warning.py +319 -0
  242. ads/feature_engineering/feature_type/handler/warnings.py +128 -0
  243. ads/feature_engineering/feature_type/integer.py +142 -0
  244. ads/feature_engineering/feature_type/ip_address.py +144 -0
  245. ads/feature_engineering/feature_type/ip_address_v4.py +138 -0
  246. ads/feature_engineering/feature_type/ip_address_v6.py +138 -0
  247. ads/feature_engineering/feature_type/lat_long.py +256 -0
  248. ads/feature_engineering/feature_type/object.py +43 -0
  249. ads/feature_engineering/feature_type/ordinal.py +132 -0
  250. ads/feature_engineering/feature_type/phone_number.py +135 -0
  251. ads/feature_engineering/feature_type/string.py +171 -0
  252. ads/feature_engineering/feature_type/text.py +93 -0
  253. ads/feature_engineering/feature_type/unknown.py +43 -0
  254. ads/feature_engineering/feature_type/zip_code.py +164 -0
  255. ads/feature_engineering/feature_type_manager.py +406 -0
  256. ads/feature_engineering/schema.py +795 -0
  257. ads/feature_engineering/utils.py +245 -0
  258. ads/feature_store/.readthedocs.yaml +19 -0
  259. ads/feature_store/README.md +65 -0
  260. ads/feature_store/__init__.py +9 -0
  261. ads/feature_store/common/__init__.py +0 -0
  262. ads/feature_store/common/enums.py +339 -0
  263. ads/feature_store/common/exceptions.py +18 -0
  264. ads/feature_store/common/spark_session_singleton.py +125 -0
  265. ads/feature_store/common/utils/__init__.py +0 -0
  266. ads/feature_store/common/utils/base64_encoder_decoder.py +72 -0
  267. ads/feature_store/common/utils/feature_schema_mapper.py +283 -0
  268. ads/feature_store/common/utils/transformation_utils.py +82 -0
  269. ads/feature_store/common/utils/utility.py +403 -0
  270. ads/feature_store/data_validation/__init__.py +0 -0
  271. ads/feature_store/data_validation/great_expectation.py +129 -0
  272. ads/feature_store/dataset.py +1230 -0
  273. ads/feature_store/dataset_job.py +530 -0
  274. ads/feature_store/docs/Dockerfile +7 -0
  275. ads/feature_store/docs/Makefile +44 -0
  276. ads/feature_store/docs/conf.py +28 -0
  277. ads/feature_store/docs/requirements.txt +14 -0
  278. ads/feature_store/docs/source/ads.feature_store.query.rst +20 -0
  279. ads/feature_store/docs/source/cicd.rst +137 -0
  280. ads/feature_store/docs/source/conf.py +86 -0
  281. ads/feature_store/docs/source/data_versioning.rst +33 -0
  282. ads/feature_store/docs/source/dataset.rst +388 -0
  283. ads/feature_store/docs/source/dataset_job.rst +27 -0
  284. ads/feature_store/docs/source/demo.rst +70 -0
  285. ads/feature_store/docs/source/entity.rst +78 -0
  286. ads/feature_store/docs/source/feature_group.rst +624 -0
  287. ads/feature_store/docs/source/feature_group_job.rst +29 -0
  288. ads/feature_store/docs/source/feature_store.rst +122 -0
  289. ads/feature_store/docs/source/feature_store_class.rst +123 -0
  290. ads/feature_store/docs/source/feature_validation.rst +66 -0
  291. ads/feature_store/docs/source/figures/cicd.png +0 -0
  292. ads/feature_store/docs/source/figures/data_validation.png +0 -0
  293. ads/feature_store/docs/source/figures/data_versioning.png +0 -0
  294. ads/feature_store/docs/source/figures/dataset.gif +0 -0
  295. ads/feature_store/docs/source/figures/dataset.png +0 -0
  296. ads/feature_store/docs/source/figures/dataset_lineage.png +0 -0
  297. ads/feature_store/docs/source/figures/dataset_statistics.png +0 -0
  298. ads/feature_store/docs/source/figures/dataset_statistics_viz.png +0 -0
  299. ads/feature_store/docs/source/figures/dataset_validation_results.png +0 -0
  300. ads/feature_store/docs/source/figures/dataset_validation_summary.png +0 -0
  301. ads/feature_store/docs/source/figures/drift_monitoring.png +0 -0
  302. ads/feature_store/docs/source/figures/entity.png +0 -0
  303. ads/feature_store/docs/source/figures/feature_group.png +0 -0
  304. ads/feature_store/docs/source/figures/feature_group_lineage.png +0 -0
  305. ads/feature_store/docs/source/figures/feature_group_statistics_viz.png +0 -0
  306. ads/feature_store/docs/source/figures/feature_store_deployment.png +0 -0
  307. ads/feature_store/docs/source/figures/feature_store_overview.png +0 -0
  308. ads/feature_store/docs/source/figures/featuregroup.gif +0 -0
  309. ads/feature_store/docs/source/figures/lineage_d1.png +0 -0
  310. ads/feature_store/docs/source/figures/lineage_d2.png +0 -0
  311. ads/feature_store/docs/source/figures/lineage_fg.png +0 -0
  312. ads/feature_store/docs/source/figures/logo-dark-mode.png +0 -0
  313. ads/feature_store/docs/source/figures/logo-light-mode.png +0 -0
  314. ads/feature_store/docs/source/figures/overview.png +0 -0
  315. ads/feature_store/docs/source/figures/resource_manager.png +0 -0
  316. ads/feature_store/docs/source/figures/resource_manager_feature_store_stack.png +0 -0
  317. ads/feature_store/docs/source/figures/resource_manager_home.png +0 -0
  318. ads/feature_store/docs/source/figures/stats_1.png +0 -0
  319. ads/feature_store/docs/source/figures/stats_2.png +0 -0
  320. ads/feature_store/docs/source/figures/stats_d.png +0 -0
  321. ads/feature_store/docs/source/figures/stats_fg.png +0 -0
  322. ads/feature_store/docs/source/figures/transformation.png +0 -0
  323. ads/feature_store/docs/source/figures/transformations.gif +0 -0
  324. ads/feature_store/docs/source/figures/validation.png +0 -0
  325. ads/feature_store/docs/source/figures/validation_fg.png +0 -0
  326. ads/feature_store/docs/source/figures/validation_results.png +0 -0
  327. ads/feature_store/docs/source/figures/validation_summary.png +0 -0
  328. ads/feature_store/docs/source/index.rst +81 -0
  329. ads/feature_store/docs/source/module.rst +8 -0
  330. ads/feature_store/docs/source/notebook.rst +94 -0
  331. ads/feature_store/docs/source/overview.rst +47 -0
  332. ads/feature_store/docs/source/quickstart.rst +176 -0
  333. ads/feature_store/docs/source/release_notes.rst +194 -0
  334. ads/feature_store/docs/source/setup_feature_store.rst +81 -0
  335. ads/feature_store/docs/source/statistics.rst +58 -0
  336. ads/feature_store/docs/source/transformation.rst +199 -0
  337. ads/feature_store/docs/source/ui.rst +65 -0
  338. ads/feature_store/docs/source/user_guides.setup.feature_store_operator.rst +66 -0
  339. ads/feature_store/docs/source/user_guides.setup.helm_chart.rst +192 -0
  340. ads/feature_store/docs/source/user_guides.setup.terraform.rst +338 -0
  341. ads/feature_store/entity.py +718 -0
  342. ads/feature_store/execution_strategy/__init__.py +0 -0
  343. ads/feature_store/execution_strategy/delta_lake/__init__.py +0 -0
  344. ads/feature_store/execution_strategy/delta_lake/delta_lake_service.py +375 -0
  345. ads/feature_store/execution_strategy/engine/__init__.py +0 -0
  346. ads/feature_store/execution_strategy/engine/spark_engine.py +316 -0
  347. ads/feature_store/execution_strategy/execution_strategy.py +113 -0
  348. ads/feature_store/execution_strategy/execution_strategy_provider.py +47 -0
  349. ads/feature_store/execution_strategy/spark/__init__.py +0 -0
  350. ads/feature_store/execution_strategy/spark/spark_execution.py +618 -0
  351. ads/feature_store/feature.py +192 -0
  352. ads/feature_store/feature_group.py +1494 -0
  353. ads/feature_store/feature_group_expectation.py +346 -0
  354. ads/feature_store/feature_group_job.py +602 -0
  355. ads/feature_store/feature_lineage/__init__.py +0 -0
  356. ads/feature_store/feature_lineage/graphviz_service.py +180 -0
  357. ads/feature_store/feature_option_details.py +50 -0
  358. ads/feature_store/feature_statistics/__init__.py +0 -0
  359. ads/feature_store/feature_statistics/statistics_service.py +99 -0
  360. ads/feature_store/feature_store.py +699 -0
  361. ads/feature_store/feature_store_registrar.py +518 -0
  362. ads/feature_store/input_feature_detail.py +149 -0
  363. ads/feature_store/mixin/__init__.py +4 -0
  364. ads/feature_store/mixin/oci_feature_store.py +145 -0
  365. ads/feature_store/model_details.py +73 -0
  366. ads/feature_store/query/__init__.py +0 -0
  367. ads/feature_store/query/filter.py +266 -0
  368. ads/feature_store/query/generator/__init__.py +0 -0
  369. ads/feature_store/query/generator/query_generator.py +298 -0
  370. ads/feature_store/query/join.py +161 -0
  371. ads/feature_store/query/query.py +403 -0
  372. ads/feature_store/query/validator/__init__.py +0 -0
  373. ads/feature_store/query/validator/query_validator.py +57 -0
  374. ads/feature_store/response/__init__.py +0 -0
  375. ads/feature_store/response/response_builder.py +68 -0
  376. ads/feature_store/service/__init__.py +0 -0
  377. ads/feature_store/service/oci_dataset.py +139 -0
  378. ads/feature_store/service/oci_dataset_job.py +199 -0
  379. ads/feature_store/service/oci_entity.py +125 -0
  380. ads/feature_store/service/oci_feature_group.py +164 -0
  381. ads/feature_store/service/oci_feature_group_job.py +214 -0
  382. ads/feature_store/service/oci_feature_store.py +182 -0
  383. ads/feature_store/service/oci_lineage.py +87 -0
  384. ads/feature_store/service/oci_transformation.py +104 -0
  385. ads/feature_store/statistics/__init__.py +0 -0
  386. ads/feature_store/statistics/abs_feature_value.py +49 -0
  387. ads/feature_store/statistics/charts/__init__.py +0 -0
  388. ads/feature_store/statistics/charts/abstract_feature_plot.py +37 -0
  389. ads/feature_store/statistics/charts/box_plot.py +148 -0
  390. ads/feature_store/statistics/charts/frequency_distribution.py +65 -0
  391. ads/feature_store/statistics/charts/probability_distribution.py +68 -0
  392. ads/feature_store/statistics/charts/top_k_frequent_elements.py +98 -0
  393. ads/feature_store/statistics/feature_stat.py +126 -0
  394. ads/feature_store/statistics/generic_feature_value.py +33 -0
  395. ads/feature_store/statistics/statistics.py +41 -0
  396. ads/feature_store/statistics_config.py +101 -0
  397. ads/feature_store/templates/feature_store_template.yaml +45 -0
  398. ads/feature_store/transformation.py +499 -0
  399. ads/feature_store/validation_output.py +57 -0
  400. ads/hpo/__init__.py +9 -0
  401. ads/hpo/_imports.py +91 -0
  402. ads/hpo/ads_search_space.py +439 -0
  403. ads/hpo/distributions.py +325 -0
  404. ads/hpo/objective.py +280 -0
  405. ads/hpo/search_cv.py +1657 -0
  406. ads/hpo/stopping_criterion.py +75 -0
  407. ads/hpo/tuner_artifact.py +413 -0
  408. ads/hpo/utils.py +91 -0
  409. ads/hpo/validation.py +140 -0
  410. ads/hpo/visualization/__init__.py +5 -0
  411. ads/hpo/visualization/_contour.py +23 -0
  412. ads/hpo/visualization/_edf.py +20 -0
  413. ads/hpo/visualization/_intermediate_values.py +21 -0
  414. ads/hpo/visualization/_optimization_history.py +25 -0
  415. ads/hpo/visualization/_parallel_coordinate.py +169 -0
  416. ads/hpo/visualization/_param_importances.py +26 -0
  417. ads/jobs/__init__.py +53 -0
  418. ads/jobs/ads_job.py +663 -0
  419. ads/jobs/builders/__init__.py +5 -0
  420. ads/jobs/builders/base.py +156 -0
  421. ads/jobs/builders/infrastructure/__init__.py +6 -0
  422. ads/jobs/builders/infrastructure/base.py +165 -0
  423. ads/jobs/builders/infrastructure/dataflow.py +1252 -0
  424. ads/jobs/builders/infrastructure/dsc_job.py +1894 -0
  425. ads/jobs/builders/infrastructure/dsc_job_runtime.py +1233 -0
  426. ads/jobs/builders/infrastructure/utils.py +65 -0
  427. ads/jobs/builders/runtimes/__init__.py +5 -0
  428. ads/jobs/builders/runtimes/artifact.py +338 -0
  429. ads/jobs/builders/runtimes/base.py +325 -0
  430. ads/jobs/builders/runtimes/container_runtime.py +242 -0
  431. ads/jobs/builders/runtimes/python_runtime.py +1016 -0
  432. ads/jobs/builders/runtimes/pytorch_runtime.py +204 -0
  433. ads/jobs/cli.py +104 -0
  434. ads/jobs/env_var_parser.py +131 -0
  435. ads/jobs/extension.py +160 -0
  436. ads/jobs/schema/__init__.py +5 -0
  437. ads/jobs/schema/infrastructure_schema.json +116 -0
  438. ads/jobs/schema/job_schema.json +42 -0
  439. ads/jobs/schema/runtime_schema.json +183 -0
  440. ads/jobs/schema/validator.py +141 -0
  441. ads/jobs/serializer.py +296 -0
  442. ads/jobs/templates/__init__.py +5 -0
  443. ads/jobs/templates/container.py +6 -0
  444. ads/jobs/templates/driver_notebook.py +177 -0
  445. ads/jobs/templates/driver_oci.py +500 -0
  446. ads/jobs/templates/driver_python.py +48 -0
  447. ads/jobs/templates/driver_pytorch.py +852 -0
  448. ads/jobs/templates/driver_utils.py +615 -0
  449. ads/jobs/templates/hostname_from_env.c +55 -0
  450. ads/jobs/templates/oci_metrics.py +181 -0
  451. ads/jobs/utils.py +104 -0
  452. ads/llm/__init__.py +28 -0
  453. ads/llm/autogen/__init__.py +2 -0
  454. ads/llm/autogen/constants.py +15 -0
  455. ads/llm/autogen/reports/__init__.py +2 -0
  456. ads/llm/autogen/reports/base.py +67 -0
  457. ads/llm/autogen/reports/data.py +103 -0
  458. ads/llm/autogen/reports/session.py +526 -0
  459. ads/llm/autogen/reports/templates/chat_box.html +13 -0
  460. ads/llm/autogen/reports/templates/chat_box_lt.html +5 -0
  461. ads/llm/autogen/reports/templates/chat_box_rt.html +6 -0
  462. ads/llm/autogen/reports/utils.py +56 -0
  463. ads/llm/autogen/v02/__init__.py +4 -0
  464. ads/llm/autogen/v02/client.py +295 -0
  465. ads/llm/autogen/v02/log_handlers/__init__.py +2 -0
  466. ads/llm/autogen/v02/log_handlers/oci_file_handler.py +83 -0
  467. ads/llm/autogen/v02/loggers/__init__.py +6 -0
  468. ads/llm/autogen/v02/loggers/metric_logger.py +320 -0
  469. ads/llm/autogen/v02/loggers/session_logger.py +580 -0
  470. ads/llm/autogen/v02/loggers/utils.py +86 -0
  471. ads/llm/autogen/v02/runtime_logging.py +163 -0
  472. ads/llm/chain.py +268 -0
  473. ads/llm/chat_template.py +31 -0
  474. ads/llm/deploy.py +63 -0
  475. ads/llm/guardrails/__init__.py +5 -0
  476. ads/llm/guardrails/base.py +442 -0
  477. ads/llm/guardrails/huggingface.py +44 -0
  478. ads/llm/langchain/__init__.py +5 -0
  479. ads/llm/langchain/plugins/__init__.py +5 -0
  480. ads/llm/langchain/plugins/chat_models/__init__.py +5 -0
  481. ads/llm/langchain/plugins/chat_models/oci_data_science.py +1027 -0
  482. ads/llm/langchain/plugins/embeddings/__init__.py +4 -0
  483. ads/llm/langchain/plugins/embeddings/oci_data_science_model_deployment_endpoint.py +184 -0
  484. ads/llm/langchain/plugins/llms/__init__.py +5 -0
  485. ads/llm/langchain/plugins/llms/oci_data_science_model_deployment_endpoint.py +979 -0
  486. ads/llm/requirements.txt +3 -0
  487. ads/llm/serialize.py +219 -0
  488. ads/llm/serializers/__init__.py +0 -0
  489. ads/llm/serializers/retrieval_qa.py +153 -0
  490. ads/llm/serializers/runnable_parallel.py +27 -0
  491. ads/llm/templates/score_chain.jinja2 +155 -0
  492. ads/llm/templates/tool_chat_template_hermes.jinja +130 -0
  493. ads/llm/templates/tool_chat_template_mistral_parallel.jinja +94 -0
  494. ads/model/__init__.py +52 -0
  495. ads/model/artifact.py +573 -0
  496. ads/model/artifact_downloader.py +254 -0
  497. ads/model/artifact_uploader.py +267 -0
  498. ads/model/base_properties.py +238 -0
  499. ads/model/common/.model-ignore +66 -0
  500. ads/model/common/__init__.py +5 -0
  501. ads/model/common/utils.py +142 -0
  502. ads/model/datascience_model.py +2635 -0
  503. ads/model/deployment/__init__.py +20 -0
  504. ads/model/deployment/common/__init__.py +5 -0
  505. ads/model/deployment/common/utils.py +308 -0
  506. ads/model/deployment/model_deployer.py +466 -0
  507. ads/model/deployment/model_deployment.py +1846 -0
  508. ads/model/deployment/model_deployment_infrastructure.py +671 -0
  509. ads/model/deployment/model_deployment_properties.py +493 -0
  510. ads/model/deployment/model_deployment_runtime.py +838 -0
  511. ads/model/extractor/__init__.py +5 -0
  512. ads/model/extractor/automl_extractor.py +74 -0
  513. ads/model/extractor/embedding_onnx_extractor.py +80 -0
  514. ads/model/extractor/huggingface_extractor.py +88 -0
  515. ads/model/extractor/keras_extractor.py +84 -0
  516. ads/model/extractor/lightgbm_extractor.py +93 -0
  517. ads/model/extractor/model_info_extractor.py +114 -0
  518. ads/model/extractor/model_info_extractor_factory.py +105 -0
  519. ads/model/extractor/pytorch_extractor.py +87 -0
  520. ads/model/extractor/sklearn_extractor.py +112 -0
  521. ads/model/extractor/spark_extractor.py +89 -0
  522. ads/model/extractor/tensorflow_extractor.py +85 -0
  523. ads/model/extractor/xgboost_extractor.py +94 -0
  524. ads/model/framework/__init__.py +5 -0
  525. ads/model/framework/automl_model.py +178 -0
  526. ads/model/framework/embedding_onnx_model.py +438 -0
  527. ads/model/framework/huggingface_model.py +399 -0
  528. ads/model/framework/lightgbm_model.py +266 -0
  529. ads/model/framework/pytorch_model.py +266 -0
  530. ads/model/framework/sklearn_model.py +250 -0
  531. ads/model/framework/spark_model.py +326 -0
  532. ads/model/framework/tensorflow_model.py +254 -0
  533. ads/model/framework/xgboost_model.py +258 -0
  534. ads/model/generic_model.py +3518 -0
  535. ads/model/model_artifact_boilerplate/README.md +381 -0
  536. ads/model/model_artifact_boilerplate/__init__.py +5 -0
  537. ads/model/model_artifact_boilerplate/artifact_introspection_test/__init__.py +5 -0
  538. ads/model/model_artifact_boilerplate/artifact_introspection_test/model_artifact_validate.py +427 -0
  539. ads/model/model_artifact_boilerplate/artifact_introspection_test/requirements.txt +2 -0
  540. ads/model/model_artifact_boilerplate/runtime.yaml +7 -0
  541. ads/model/model_artifact_boilerplate/score.py +61 -0
  542. ads/model/model_file_description_schema.json +68 -0
  543. ads/model/model_introspect.py +331 -0
  544. ads/model/model_metadata.py +1810 -0
  545. ads/model/model_metadata_mixin.py +460 -0
  546. ads/model/model_properties.py +63 -0
  547. ads/model/model_version_set.py +739 -0
  548. ads/model/runtime/__init__.py +5 -0
  549. ads/model/runtime/env_info.py +306 -0
  550. ads/model/runtime/model_deployment_details.py +37 -0
  551. ads/model/runtime/model_provenance_details.py +58 -0
  552. ads/model/runtime/runtime_info.py +81 -0
  553. ads/model/runtime/schemas/inference_env_info_schema.yaml +16 -0
  554. ads/model/runtime/schemas/model_provenance_schema.yaml +36 -0
  555. ads/model/runtime/schemas/training_env_info_schema.yaml +16 -0
  556. ads/model/runtime/utils.py +201 -0
  557. ads/model/serde/__init__.py +5 -0
  558. ads/model/serde/common.py +40 -0
  559. ads/model/serde/model_input.py +547 -0
  560. ads/model/serde/model_serializer.py +1184 -0
  561. ads/model/service/__init__.py +5 -0
  562. ads/model/service/oci_datascience_model.py +1076 -0
  563. ads/model/service/oci_datascience_model_deployment.py +500 -0
  564. ads/model/service/oci_datascience_model_version_set.py +176 -0
  565. ads/model/transformer/__init__.py +5 -0
  566. ads/model/transformer/onnx_transformer.py +324 -0
  567. ads/mysqldb/__init__.py +5 -0
  568. ads/mysqldb/mysql_db.py +227 -0
  569. ads/opctl/__init__.py +18 -0
  570. ads/opctl/anomaly_detection.py +11 -0
  571. ads/opctl/backend/__init__.py +5 -0
  572. ads/opctl/backend/ads_dataflow.py +353 -0
  573. ads/opctl/backend/ads_ml_job.py +710 -0
  574. ads/opctl/backend/ads_ml_pipeline.py +164 -0
  575. ads/opctl/backend/ads_model_deployment.py +209 -0
  576. ads/opctl/backend/base.py +146 -0
  577. ads/opctl/backend/local.py +1053 -0
  578. ads/opctl/backend/marketplace/__init__.py +9 -0
  579. ads/opctl/backend/marketplace/helm_helper.py +173 -0
  580. ads/opctl/backend/marketplace/local_marketplace.py +271 -0
  581. ads/opctl/backend/marketplace/marketplace_backend_runner.py +71 -0
  582. ads/opctl/backend/marketplace/marketplace_operator_interface.py +44 -0
  583. ads/opctl/backend/marketplace/marketplace_operator_runner.py +24 -0
  584. ads/opctl/backend/marketplace/marketplace_utils.py +212 -0
  585. ads/opctl/backend/marketplace/models/__init__.py +5 -0
  586. ads/opctl/backend/marketplace/models/bearer_token.py +94 -0
  587. ads/opctl/backend/marketplace/models/marketplace_type.py +70 -0
  588. ads/opctl/backend/marketplace/models/ocir_details.py +56 -0
  589. ads/opctl/backend/marketplace/prerequisite_checker.py +238 -0
  590. ads/opctl/cli.py +707 -0
  591. ads/opctl/cmds.py +869 -0
  592. ads/opctl/conda/__init__.py +5 -0
  593. ads/opctl/conda/cli.py +193 -0
  594. ads/opctl/conda/cmds.py +749 -0
  595. ads/opctl/conda/config.yaml +34 -0
  596. ads/opctl/conda/manifest_template.yaml +13 -0
  597. ads/opctl/conda/multipart_uploader.py +188 -0
  598. ads/opctl/conda/pack.py +89 -0
  599. ads/opctl/config/__init__.py +5 -0
  600. ads/opctl/config/base.py +57 -0
  601. ads/opctl/config/diagnostics/__init__.py +5 -0
  602. ads/opctl/config/diagnostics/distributed/default_requirements_config.yaml +62 -0
  603. ads/opctl/config/merger.py +255 -0
  604. ads/opctl/config/resolver.py +297 -0
  605. ads/opctl/config/utils.py +79 -0
  606. ads/opctl/config/validator.py +17 -0
  607. ads/opctl/config/versioner.py +68 -0
  608. ads/opctl/config/yaml_parsers/__init__.py +7 -0
  609. ads/opctl/config/yaml_parsers/base.py +58 -0
  610. ads/opctl/config/yaml_parsers/distributed/__init__.py +7 -0
  611. ads/opctl/config/yaml_parsers/distributed/yaml_parser.py +201 -0
  612. ads/opctl/constants.py +66 -0
  613. ads/opctl/decorator/__init__.py +5 -0
  614. ads/opctl/decorator/common.py +129 -0
  615. ads/opctl/diagnostics/__init__.py +5 -0
  616. ads/opctl/diagnostics/__main__.py +25 -0
  617. ads/opctl/diagnostics/check_distributed_job_requirements.py +212 -0
  618. ads/opctl/diagnostics/check_requirements.py +144 -0
  619. ads/opctl/diagnostics/requirement_exception.py +9 -0
  620. ads/opctl/distributed/README.md +109 -0
  621. ads/opctl/distributed/__init__.py +5 -0
  622. ads/opctl/distributed/certificates.py +32 -0
  623. ads/opctl/distributed/cli.py +207 -0
  624. ads/opctl/distributed/cmds.py +731 -0
  625. ads/opctl/distributed/common/__init__.py +5 -0
  626. ads/opctl/distributed/common/abstract_cluster_provider.py +449 -0
  627. ads/opctl/distributed/common/abstract_framework_spec_builder.py +88 -0
  628. ads/opctl/distributed/common/cluster_config_helper.py +103 -0
  629. ads/opctl/distributed/common/cluster_provider_factory.py +21 -0
  630. ads/opctl/distributed/common/cluster_runner.py +54 -0
  631. ads/opctl/distributed/common/framework_factory.py +29 -0
  632. ads/opctl/docker/Dockerfile.job +103 -0
  633. ads/opctl/docker/Dockerfile.job.arm +107 -0
  634. ads/opctl/docker/Dockerfile.job.gpu +175 -0
  635. ads/opctl/docker/base-env.yaml +13 -0
  636. ads/opctl/docker/cuda.repo +6 -0
  637. ads/opctl/docker/operator/.dockerignore +0 -0
  638. ads/opctl/docker/operator/Dockerfile +41 -0
  639. ads/opctl/docker/operator/Dockerfile.gpu +85 -0
  640. ads/opctl/docker/operator/cuda.repo +6 -0
  641. ads/opctl/docker/operator/environment.yaml +8 -0
  642. ads/opctl/forecast.py +11 -0
  643. ads/opctl/index.yaml +3 -0
  644. ads/opctl/model/__init__.py +5 -0
  645. ads/opctl/model/cli.py +65 -0
  646. ads/opctl/model/cmds.py +73 -0
  647. ads/opctl/operator/README.md +4 -0
  648. ads/opctl/operator/__init__.py +31 -0
  649. ads/opctl/operator/cli.py +344 -0
  650. ads/opctl/operator/cmd.py +596 -0
  651. ads/opctl/operator/common/__init__.py +5 -0
  652. ads/opctl/operator/common/backend_factory.py +460 -0
  653. ads/opctl/operator/common/const.py +27 -0
  654. ads/opctl/operator/common/data/synthetic.csv +16001 -0
  655. ads/opctl/operator/common/dictionary_merger.py +148 -0
  656. ads/opctl/operator/common/errors.py +42 -0
  657. ads/opctl/operator/common/operator_config.py +99 -0
  658. ads/opctl/operator/common/operator_loader.py +811 -0
  659. ads/opctl/operator/common/operator_schema.yaml +130 -0
  660. ads/opctl/operator/common/operator_yaml_generator.py +152 -0
  661. ads/opctl/operator/common/utils.py +208 -0
  662. ads/opctl/operator/lowcode/__init__.py +5 -0
  663. ads/opctl/operator/lowcode/anomaly/MLoperator +16 -0
  664. ads/opctl/operator/lowcode/anomaly/README.md +207 -0
  665. ads/opctl/operator/lowcode/anomaly/__init__.py +5 -0
  666. ads/opctl/operator/lowcode/anomaly/__main__.py +103 -0
  667. ads/opctl/operator/lowcode/anomaly/cmd.py +35 -0
  668. ads/opctl/operator/lowcode/anomaly/const.py +167 -0
  669. ads/opctl/operator/lowcode/anomaly/environment.yaml +10 -0
  670. ads/opctl/operator/lowcode/anomaly/model/__init__.py +5 -0
  671. ads/opctl/operator/lowcode/anomaly/model/anomaly_dataset.py +146 -0
  672. ads/opctl/operator/lowcode/anomaly/model/anomaly_merlion.py +162 -0
  673. ads/opctl/operator/lowcode/anomaly/model/automlx.py +99 -0
  674. ads/opctl/operator/lowcode/anomaly/model/autots.py +115 -0
  675. ads/opctl/operator/lowcode/anomaly/model/base_model.py +404 -0
  676. ads/opctl/operator/lowcode/anomaly/model/factory.py +110 -0
  677. ads/opctl/operator/lowcode/anomaly/model/isolationforest.py +78 -0
  678. ads/opctl/operator/lowcode/anomaly/model/oneclasssvm.py +78 -0
  679. ads/opctl/operator/lowcode/anomaly/model/randomcutforest.py +120 -0
  680. ads/opctl/operator/lowcode/anomaly/model/tods.py +119 -0
  681. ads/opctl/operator/lowcode/anomaly/operator_config.py +127 -0
  682. ads/opctl/operator/lowcode/anomaly/schema.yaml +401 -0
  683. ads/opctl/operator/lowcode/anomaly/utils.py +88 -0
  684. ads/opctl/operator/lowcode/common/__init__.py +5 -0
  685. ads/opctl/operator/lowcode/common/const.py +10 -0
  686. ads/opctl/operator/lowcode/common/data.py +116 -0
  687. ads/opctl/operator/lowcode/common/errors.py +47 -0
  688. ads/opctl/operator/lowcode/common/transformations.py +296 -0
  689. ads/opctl/operator/lowcode/common/utils.py +384 -0
  690. ads/opctl/operator/lowcode/feature_store_marketplace/MLoperator +13 -0
  691. ads/opctl/operator/lowcode/feature_store_marketplace/README.md +30 -0
  692. ads/opctl/operator/lowcode/feature_store_marketplace/__init__.py +5 -0
  693. ads/opctl/operator/lowcode/feature_store_marketplace/__main__.py +116 -0
  694. ads/opctl/operator/lowcode/feature_store_marketplace/cmd.py +85 -0
  695. ads/opctl/operator/lowcode/feature_store_marketplace/const.py +15 -0
  696. ads/opctl/operator/lowcode/feature_store_marketplace/environment.yaml +0 -0
  697. ads/opctl/operator/lowcode/feature_store_marketplace/models/__init__.py +4 -0
  698. ads/opctl/operator/lowcode/feature_store_marketplace/models/apigw_config.py +32 -0
  699. ads/opctl/operator/lowcode/feature_store_marketplace/models/db_config.py +43 -0
  700. ads/opctl/operator/lowcode/feature_store_marketplace/models/mysql_config.py +120 -0
  701. ads/opctl/operator/lowcode/feature_store_marketplace/models/serializable_yaml_model.py +34 -0
  702. ads/opctl/operator/lowcode/feature_store_marketplace/operator_utils.py +386 -0
  703. ads/opctl/operator/lowcode/feature_store_marketplace/schema.yaml +160 -0
  704. ads/opctl/operator/lowcode/forecast/MLoperator +25 -0
  705. ads/opctl/operator/lowcode/forecast/README.md +209 -0
  706. ads/opctl/operator/lowcode/forecast/__init__.py +5 -0
  707. ads/opctl/operator/lowcode/forecast/__main__.py +89 -0
  708. ads/opctl/operator/lowcode/forecast/cmd.py +40 -0
  709. ads/opctl/operator/lowcode/forecast/const.py +92 -0
  710. ads/opctl/operator/lowcode/forecast/environment.yaml +20 -0
  711. ads/opctl/operator/lowcode/forecast/errors.py +26 -0
  712. ads/opctl/operator/lowcode/forecast/model/__init__.py +5 -0
  713. ads/opctl/operator/lowcode/forecast/model/arima.py +279 -0
  714. ads/opctl/operator/lowcode/forecast/model/automlx.py +553 -0
  715. ads/opctl/operator/lowcode/forecast/model/autots.py +312 -0
  716. ads/opctl/operator/lowcode/forecast/model/base_model.py +875 -0
  717. ads/opctl/operator/lowcode/forecast/model/factory.py +106 -0
  718. ads/opctl/operator/lowcode/forecast/model/forecast_datasets.py +492 -0
  719. ads/opctl/operator/lowcode/forecast/model/ml_forecast.py +243 -0
  720. ads/opctl/operator/lowcode/forecast/model/neuralprophet.py +482 -0
  721. ads/opctl/operator/lowcode/forecast/model/prophet.py +445 -0
  722. ads/opctl/operator/lowcode/forecast/model_evaluator.py +244 -0
  723. ads/opctl/operator/lowcode/forecast/operator_config.py +234 -0
  724. ads/opctl/operator/lowcode/forecast/schema.yaml +506 -0
  725. ads/opctl/operator/lowcode/forecast/utils.py +397 -0
  726. ads/opctl/operator/lowcode/forecast/whatifserve/__init__.py +7 -0
  727. ads/opctl/operator/lowcode/forecast/whatifserve/deployment_manager.py +285 -0
  728. ads/opctl/operator/lowcode/forecast/whatifserve/score.py +246 -0
  729. ads/opctl/operator/lowcode/pii/MLoperator +17 -0
  730. ads/opctl/operator/lowcode/pii/README.md +208 -0
  731. ads/opctl/operator/lowcode/pii/__init__.py +5 -0
  732. ads/opctl/operator/lowcode/pii/__main__.py +78 -0
  733. ads/opctl/operator/lowcode/pii/cmd.py +39 -0
  734. ads/opctl/operator/lowcode/pii/constant.py +84 -0
  735. ads/opctl/operator/lowcode/pii/environment.yaml +17 -0
  736. ads/opctl/operator/lowcode/pii/errors.py +27 -0
  737. ads/opctl/operator/lowcode/pii/model/__init__.py +5 -0
  738. ads/opctl/operator/lowcode/pii/model/factory.py +82 -0
  739. ads/opctl/operator/lowcode/pii/model/guardrails.py +167 -0
  740. ads/opctl/operator/lowcode/pii/model/pii.py +145 -0
  741. ads/opctl/operator/lowcode/pii/model/processor/__init__.py +34 -0
  742. ads/opctl/operator/lowcode/pii/model/processor/email_replacer.py +34 -0
  743. ads/opctl/operator/lowcode/pii/model/processor/mbi_replacer.py +35 -0
  744. ads/opctl/operator/lowcode/pii/model/processor/name_replacer.py +225 -0
  745. ads/opctl/operator/lowcode/pii/model/processor/number_replacer.py +73 -0
  746. ads/opctl/operator/lowcode/pii/model/processor/remover.py +26 -0
  747. ads/opctl/operator/lowcode/pii/model/report.py +487 -0
  748. ads/opctl/operator/lowcode/pii/operator_config.py +95 -0
  749. ads/opctl/operator/lowcode/pii/schema.yaml +108 -0
  750. ads/opctl/operator/lowcode/pii/utils.py +43 -0
  751. ads/opctl/operator/lowcode/recommender/MLoperator +16 -0
  752. ads/opctl/operator/lowcode/recommender/README.md +206 -0
  753. ads/opctl/operator/lowcode/recommender/__init__.py +5 -0
  754. ads/opctl/operator/lowcode/recommender/__main__.py +82 -0
  755. ads/opctl/operator/lowcode/recommender/cmd.py +33 -0
  756. ads/opctl/operator/lowcode/recommender/constant.py +30 -0
  757. ads/opctl/operator/lowcode/recommender/environment.yaml +11 -0
  758. ads/opctl/operator/lowcode/recommender/model/base_model.py +212 -0
  759. ads/opctl/operator/lowcode/recommender/model/factory.py +56 -0
  760. ads/opctl/operator/lowcode/recommender/model/recommender_dataset.py +25 -0
  761. ads/opctl/operator/lowcode/recommender/model/svd.py +106 -0
  762. ads/opctl/operator/lowcode/recommender/operator_config.py +81 -0
  763. ads/opctl/operator/lowcode/recommender/schema.yaml +265 -0
  764. ads/opctl/operator/lowcode/recommender/utils.py +13 -0
  765. ads/opctl/operator/runtime/__init__.py +5 -0
  766. ads/opctl/operator/runtime/const.py +17 -0
  767. ads/opctl/operator/runtime/container_runtime_schema.yaml +50 -0
  768. ads/opctl/operator/runtime/marketplace_runtime.py +50 -0
  769. ads/opctl/operator/runtime/python_marketplace_runtime_schema.yaml +21 -0
  770. ads/opctl/operator/runtime/python_runtime_schema.yaml +21 -0
  771. ads/opctl/operator/runtime/runtime.py +115 -0
  772. ads/opctl/schema.yaml.yml +36 -0
  773. ads/opctl/script.py +40 -0
  774. ads/opctl/spark/__init__.py +5 -0
  775. ads/opctl/spark/cli.py +43 -0
  776. ads/opctl/spark/cmds.py +147 -0
  777. ads/opctl/templates/diagnostic_report_template.jinja2 +102 -0
  778. ads/opctl/utils.py +344 -0
  779. ads/oracledb/__init__.py +5 -0
  780. ads/oracledb/oracle_db.py +346 -0
  781. ads/pipeline/__init__.py +39 -0
  782. ads/pipeline/ads_pipeline.py +2279 -0
  783. ads/pipeline/ads_pipeline_run.py +772 -0
  784. ads/pipeline/ads_pipeline_step.py +605 -0
  785. ads/pipeline/builders/__init__.py +5 -0
  786. ads/pipeline/builders/infrastructure/__init__.py +5 -0
  787. ads/pipeline/builders/infrastructure/custom_script.py +32 -0
  788. ads/pipeline/cli.py +119 -0
  789. ads/pipeline/extension.py +291 -0
  790. ads/pipeline/schema/__init__.py +5 -0
  791. ads/pipeline/schema/cs_step_schema.json +35 -0
  792. ads/pipeline/schema/ml_step_schema.json +31 -0
  793. ads/pipeline/schema/pipeline_schema.json +71 -0
  794. ads/pipeline/visualizer/__init__.py +5 -0
  795. ads/pipeline/visualizer/base.py +570 -0
  796. ads/pipeline/visualizer/graph_renderer.py +272 -0
  797. ads/pipeline/visualizer/text_renderer.py +84 -0
  798. ads/secrets/__init__.py +11 -0
  799. ads/secrets/adb.py +386 -0
  800. ads/secrets/auth_token.py +86 -0
  801. ads/secrets/big_data_service.py +365 -0
  802. ads/secrets/mysqldb.py +149 -0
  803. ads/secrets/oracledb.py +160 -0
  804. ads/secrets/secrets.py +407 -0
  805. ads/telemetry/__init__.py +7 -0
  806. ads/telemetry/base.py +69 -0
  807. ads/telemetry/client.py +125 -0
  808. ads/telemetry/telemetry.py +257 -0
  809. ads/templates/dataflow_pyspark.jinja2 +13 -0
  810. ads/templates/dataflow_sparksql.jinja2 +22 -0
  811. ads/templates/func.jinja2 +20 -0
  812. ads/templates/schemas/openapi.json +1740 -0
  813. ads/templates/score-pkl.jinja2 +173 -0
  814. ads/templates/score.jinja2 +322 -0
  815. ads/templates/score_embedding_onnx.jinja2 +202 -0
  816. ads/templates/score_generic.jinja2 +165 -0
  817. ads/templates/score_huggingface_pipeline.jinja2 +217 -0
  818. ads/templates/score_lightgbm.jinja2 +185 -0
  819. ads/templates/score_onnx.jinja2 +407 -0
  820. ads/templates/score_onnx_new.jinja2 +473 -0
  821. ads/templates/score_oracle_automl.jinja2 +185 -0
  822. ads/templates/score_pyspark.jinja2 +154 -0
  823. ads/templates/score_pytorch.jinja2 +219 -0
  824. ads/templates/score_scikit-learn.jinja2 +184 -0
  825. ads/templates/score_tensorflow.jinja2 +184 -0
  826. ads/templates/score_xgboost.jinja2 +178 -0
  827. ads/text_dataset/__init__.py +5 -0
  828. ads/text_dataset/backends.py +211 -0
  829. ads/text_dataset/dataset.py +445 -0
  830. ads/text_dataset/extractor.py +207 -0
  831. ads/text_dataset/options.py +53 -0
  832. ads/text_dataset/udfs.py +22 -0
  833. ads/text_dataset/utils.py +49 -0
  834. ads/type_discovery/__init__.py +9 -0
  835. ads/type_discovery/abstract_detector.py +21 -0
  836. ads/type_discovery/constant_detector.py +41 -0
  837. ads/type_discovery/continuous_detector.py +54 -0
  838. ads/type_discovery/credit_card_detector.py +99 -0
  839. ads/type_discovery/datetime_detector.py +92 -0
  840. ads/type_discovery/discrete_detector.py +118 -0
  841. ads/type_discovery/document_detector.py +146 -0
  842. ads/type_discovery/ip_detector.py +68 -0
  843. ads/type_discovery/latlon_detector.py +90 -0
  844. ads/type_discovery/phone_number_detector.py +63 -0
  845. ads/type_discovery/type_discovery_driver.py +87 -0
  846. ads/type_discovery/typed_feature.py +594 -0
  847. ads/type_discovery/unknown_detector.py +41 -0
  848. ads/type_discovery/zipcode_detector.py +48 -0
  849. ads/vault/__init__.py +7 -0
  850. ads/vault/vault.py +237 -0
  851. {oracle_ads-2.13.9rc0.dist-info → oracle_ads-2.13.9rc1.dist-info}/METADATA +150 -150
  852. oracle_ads-2.13.9rc1.dist-info/RECORD +858 -0
  853. {oracle_ads-2.13.9rc0.dist-info → oracle_ads-2.13.9rc1.dist-info}/WHEEL +1 -2
  854. {oracle_ads-2.13.9rc0.dist-info → oracle_ads-2.13.9rc1.dist-info}/entry_points.txt +2 -1
  855. oracle_ads-2.13.9rc0.dist-info/RECORD +0 -9
  856. oracle_ads-2.13.9rc0.dist-info/top_level.txt +0 -1
  857. {oracle_ads-2.13.9rc0.dist-info → oracle_ads-2.13.9rc1.dist-info}/licenses/LICENSE.txt +0 -0
@@ -0,0 +1,875 @@
1
+ #!/usr/bin/env python
2
+
3
+ # Copyright (c) 2023, 2025 Oracle and/or its affiliates.
4
+ # Licensed under the Universal Permissive License v 1.0 as shown at https://oss.oracle.com/licenses/upl/
5
+
6
+ import logging
7
+ import os
8
+ import tempfile
9
+ import time
10
+ import traceback
11
+ from abc import ABC, abstractmethod
12
+ from typing import Tuple
13
+
14
+ import numpy as np
15
+ import pandas as pd
16
+ import report_creator as rc
17
+
18
+ from ads.common.decorator.runtime_dependency import runtime_dependency
19
+ from ads.common.object_storage_details import ObjectStorageDetails
20
+ from ads.opctl import logger
21
+ from ads.opctl.operator.lowcode.common.const import DataColumns
22
+ from ads.opctl.operator.lowcode.common.utils import (
23
+ datetime_to_seconds,
24
+ disable_print,
25
+ enable_print,
26
+ human_time_friendly,
27
+ load_pkl,
28
+ merged_category_column_name,
29
+ seconds_to_datetime,
30
+ write_data,
31
+ write_file,
32
+ write_json,
33
+ write_pkl,
34
+ )
35
+ from ads.opctl.operator.lowcode.forecast.utils import (
36
+ _build_metrics_df,
37
+ _build_metrics_per_horizon,
38
+ _label_encode_dataframe,
39
+ default_signer,
40
+ evaluate_train_metrics,
41
+ get_auto_select_plot,
42
+ get_forecast_plots,
43
+ )
44
+
45
+ from ..const import (
46
+ AUTO_SELECT,
47
+ BACKTEST_REPORT_NAME,
48
+ SUMMARY_METRICS_HORIZON_LIMIT,
49
+ ForecastOutputColumns,
50
+ SpeedAccuracyMode,
51
+ SupportedMetrics,
52
+ SupportedModels,
53
+ )
54
+ from ..operator_config import ForecastOperatorConfig, ForecastOperatorSpec
55
+ from .forecast_datasets import ForecastDatasets, ForecastResults
56
+
57
+ logging.getLogger("report_creator").setLevel(logging.WARNING)
58
+
59
+
60
+ class ForecastOperatorBaseModel(ABC):
61
+ """The base class for the forecast operator models."""
62
+
63
def __init__(self, config: ForecastOperatorConfig, datasets: ForecastDatasets):
    """Set up the state shared by all forecast operator models.

    Parameters
    ----------
    config: ForecastOperatorConfig
        The forecast operator configuration. Its ``spec`` is kept on the
        instance as ``self.spec``.
    datasets: ForecastDatasets
        The datasets container. The per-series data is fetched from it once,
        via ``get_data_by_series()``, and kept as ``self.full_data_dict``.
    """
    spec = config.spec

    # Objects handed in by the caller.
    self.config: ForecastOperatorConfig = config
    self.spec: ForecastOperatorSpec = spec
    self.datasets: ForecastDatasets = datasets

    # Values looked up once from the spec / datasets.
    self.target_cat_col = spec.target_category_columns
    self.full_data_dict = datasets.get_data_by_series()
    self.test_eval_metrics = None
    self.original_target_column = spec.target_column
    self.dt_column_name = spec.datetime_column.name

    self.model_parameters = {}
    self.loaded_models = None

    # Populated later, in the _build_model() method.
    self.models = None

    # "outputs" is a list of outputs generated by the models. These should
    # only be generated when the framework requires the original output for
    # plotting.
    self.outputs = None
    self.forecast_output = None
    self.errors_dict = {}
    self.le = {}

    self.formatted_global_explanation = None
    self.formatted_local_explanation = None

    self.forecast_col_name = "yhat"

    # Tuning is performed only when a tuning section with n_trials is given.
    tuning = spec.tuning
    self.perform_tuning = tuning is not None and tuning.n_trials is not None
100
+
101
def generate_report(self):
    """Build the models, compute metrics, assemble the report and save the outputs.

    Steps, in order:

    1. If ``spec.previous_output_dir`` is set, call ``_load_model()``.
    2. Call ``_build_model()`` and time it.
    3. If a report or metrics are requested, compute the training metrics
       and, when test data is available, the test metrics. Test metric
       failures are logged and do not abort the run.
    4. If ``spec.generate_report`` is set, assemble the report sections.
    5. Hand everything to ``_save_report()``.

    FutureWarning, UserWarning, RuntimeWarning and sklearn's
    ConvergenceWarning are silenced for the duration of the call.

    Returns
    -------
    Whatever ``_save_report()`` returns.
    """
    import warnings

    from sklearn.exceptions import ConvergenceWarning

    with warnings.catch_warnings():
        for noisy_category in (
            FutureWarning,
            UserWarning,
            RuntimeWarning,
            ConvergenceWarning,
        ):
            warnings.simplefilter(action="ignore", category=noisy_category)

        # load models if given
        if self.spec.previous_output_dir is not None:
            self._load_model()

        start_time = time.time()
        result_df = self._build_model()
        elapsed_time = time.time() - start_time
        logger.info("Building the models completed in %s seconds", elapsed_time)

        # Generate metrics
        summary_metrics = None
        test_data = self.datasets.test_data
        self.eval_metrics = None

        if self.spec.generate_report or self.spec.generate_metrics:
            self.eval_metrics = self.generate_train_metrics()
            # Guard against missing training metrics: the code below (and
            # the metrics_df argument of _save_report) already treats None
            # as a valid "not available" value.
            if self.eval_metrics is not None and not self.target_cat_col:
                self.eval_metrics.rename(
                    {"Series 1": self.original_target_column},
                    axis=1,
                    inplace=True,
                )

            if test_data is not None:
                try:
                    (
                        self.test_eval_metrics,
                        summary_metrics,
                    ) = self._test_evaluate_metrics(elapsed_time=elapsed_time)
                    if not self.target_cat_col:
                        self.test_eval_metrics.rename(
                            {"Series 1": self.original_target_column},
                            axis=1,
                            inplace=True,
                        )
                except Exception:
                    # Best effort: test metrics are optional for the report.
                    logger.warning("Unable to generate Test Metrics.")
                    logger.debug("Full Traceback: %s", traceback.format_exc())

        report_sections = []

        if self.spec.generate_report:
            # build the report
            model_description, other_sections = self._generate_report()

            header_section = rc.Block(
                rc.Heading(self.spec.report_title, level=1),
                rc.Text(
                    f"You selected the {self.spec.model} model.\nBased on your dataset, you could have also selected any of the models: {SupportedModels.keys()}."
                ),
                model_description,
                rc.Group(
                    rc.Metric(
                        heading="Analysis was completed in ",
                        value=human_time_friendly(elapsed_time),
                    ),
                    rc.Metric(
                        heading="Starting time index",
                        value=self.datasets.get_earliest_timestamp().strftime(
                            "%B %d, %Y"
                        ),
                    ),
                    rc.Metric(
                        heading="Ending time index",
                        value=self.datasets.get_latest_timestamp().strftime(
                            "%B %d, %Y"
                        ),
                    ),
                    rc.Metric(
                        heading="Num series",
                        value=len(self.datasets.list_series_ids()),
                    ),
                ),
            )

            def _per_series_tables(view):
                # One table per series; labelled only when the data is
                # split by target category columns.
                return [
                    rc.DataTable(
                        view(df),
                        label=s_id if self.target_cat_col else None,
                        index=True,
                    )
                    for s_id, df in self.full_data_dict.items()
                ]

            def _series_selector(blocks):
                # A drop-down across series, or the single table when there
                # are no target category columns.
                return rc.Select(blocks=blocks) if self.target_cat_col else blocks[0]

            first_5_rows_blocks = _per_series_tables(lambda df: df.head(5))
            last_5_rows_blocks = _per_series_tables(lambda df: df.tail(5))
            data_summary_blocks = _per_series_tables(lambda df: df.describe())

            first_5_title = rc.Heading("First 5 Rows of Data", level=3)
            last_5_title = rc.Heading("Last 5 Rows of Data", level=3)
            summary_title = rc.Heading("Data Summary Statistics", level=3)

            data_summary_sec = rc.Block(
                rc.Block(first_5_title, _series_selector(first_5_rows_blocks)),
                rc.Block(last_5_title, _series_selector(last_5_rows_blocks)),
                rc.Block(summary_title, _series_selector(data_summary_blocks)),
                rc.Separator(),
            )

            summary = rc.Block(
                header_section,
                data_summary_sec,
            )

            test_metrics_sections = []
            if (
                self.test_eval_metrics is not None
                and not self.test_eval_metrics.empty
            ):
                test_metrics_sections.extend(
                    [
                        rc.Heading("Test Data Evaluation Metrics", level=2),
                        rc.DataTable(self.test_eval_metrics, index=True),
                    ]
                )

            if summary_metrics is not None and not summary_metrics.empty:
                test_metrics_sections.extend(
                    [
                        rc.Heading("Test Data Summary Metrics", level=2),
                        rc.DataTable(summary_metrics, index=True),
                    ]
                )

            train_metrics_sections = []
            if self.eval_metrics is not None and not self.eval_metrics.empty:
                train_metrics_sections = [
                    rc.Heading("Training Data Metrics", level=2),
                    rc.DataTable(self.eval_metrics, index=True),
                ]

            backtest_sections = []
            output_dir = self.spec.output_directory.url
            file_path = f"{output_dir}/{BACKTEST_REPORT_NAME}"
            if self.spec.model == AUTO_SELECT:
                backtest_sections.append(
                    rc.Heading(
                        "Auto-Select Backtesting and Performance Metrics", level=2
                    )
                )
                # NOTE(review): os.path.exists only sees the local file
                # system - confirm the backtest report is never written to
                # a remote output directory.
                if not os.path.exists(file_path):
                    backtest_sections.append(
                        rc.Text(
                            "auto-select could not be executed. Please check the "
                            "logs for more details."
                        )
                    )
                else:
                    backtest_stats = pd.read_csv(file_path)
                    model_metric_map = backtest_stats.drop(
                        columns=["metric", "backtest"]
                    )
                    average_dict = {
                        k: round(v, 4)
                        for k, v in model_metric_map.mean().to_dict().items()
                    }
                    # The lowest average score is reported as the best model
                    # (assumes spec.metric is lower-is-better - TODO confirm).
                    best_model = min(average_dict, key=average_dict.get)
                    summary_text = rc.Text(
                        f"Overall, the average {self.spec.metric} scores for the models are {average_dict}, with"
                        f" {best_model} being identified as the top-performing model during backtesting."
                    )
                    backtest_table = rc.DataTable(backtest_stats, index=True)
                    liner_plot = get_auto_select_plot(backtest_stats)
                    backtest_sections.extend(
                        [backtest_table, summary_text, liner_plot]
                    )

            forecast_plots = []
            if len(self.forecast_output.list_series_ids()) > 0:
                forecast_text = rc.Heading(
                    "Forecasted Data Overlaying Historical", level=2
                )
                forecast_sec = get_forecast_plots(
                    self.forecast_output,
                    horizon=self.spec.horizon,
                    test_data=test_data,
                    ci_interval_width=self.spec.confidence_interval_width,
                    target_category_column=self.target_cat_col,
                )
                forecast_plots = [forecast_text, forecast_sec]

            yaml_appendix_title = rc.Heading("Reference: YAML File", level=2)
            config_dict = self.config.to_dict()
            spec_dict = config_dict["spec"]
            # Pop the raw data in case it isn't JSON serializable. A default
            # is passed so that a config without a "data" entry is accepted.
            spec_dict["historical_data"].pop("data", None)
            for optional_input in ("additional_data", "test_data"):
                if spec_dict.get(optional_input):
                    spec_dict[optional_input].pop("data", None)
            yaml_appendix = rc.Yaml(config_dict)

            report_sections = (
                [summary]
                + backtest_sections
                + forecast_plots
                + other_sections
                + test_metrics_sections
                + train_metrics_sections
                + [yaml_appendix_title, yaml_appendix]
            )

        # save the report and result CSV
        return self._save_report(
            report_sections=report_sections,
            result_df=result_df,
            metrics_df=self.eval_metrics,
            test_metrics_df=self.test_eval_metrics,
            test_data=test_data,
        )
358
+
359
def _test_evaluate_metrics(self, elapsed_time=0):
    """Score the forecast against the test data, per series and in aggregate.

    For every series in ``self.forecast_output`` the last ``spec.horizon``
    test values are compared with the last ``spec.horizon`` forecast values.
    Positions where either side is NaN are dropped. A series is skipped
    when it is missing from the test data or has no valid positions left.

    Parameters
    ----------
    elapsed_time: float, optional
        Value stored under ``SupportedMetrics.ELAPSED_TIME`` in the summary.

    Returns
    -------
    Tuple[pd.DataFrame, pd.DataFrame]
        ``(total_metrics, summary_metrics)``. ``total_metrics`` is the
        column-wise concatenation of the ``_build_metrics_df`` result of
        each evaluated series. ``summary_metrics`` holds the mean / median
        of selected metrics across series in a row labelled "All Targets",
        plus the per-horizon rows when ``spec.horizon`` does not exceed
        ``SUMMARY_METRICS_HORIZON_LIMIT``. Both frames are empty when no
        series could be evaluated.
    """
    data = self.datasets.test_data
    horizon = self.spec.horizon
    per_series_metrics = []

    # Generate y_pred and y_true for each series
    for s_id in self.forecast_output.list_series_ids():
        try:
            y_true = data.get_data_for_series(s_id)[data.target_name].values[
                -horizon:
            ]
        except KeyError as ke:
            logger.warning(
                f"Error Generating Metrics: Unable to find {s_id} in the test data. Error: {ke.args}"
            )
            # No ground truth for this series: skip it, otherwise y_true
            # would be undefined or left over from the previous series.
            continue
        y_pred = self.forecast_output.get_forecast(s_id)["forecast_value"].values[
            -horizon:
        ]

        drop_na_mask = ~np.isnan(y_true) & ~np.isnan(y_pred)
        if not drop_na_mask.all():  # There is a missing value
            if not drop_na_mask.any():  # All values are missing
                logger.debug(
                    f"No values in the test data for series: {s_id}. This will affect the test metrics."
                )
                continue
            logger.debug(
                f"Missing values in the test data for series: {s_id}. This will affect the test metrics."
            )
            y_true = y_true[drop_na_mask]
            y_pred = y_pred[drop_na_mask]

        per_series_metrics.append(
            _build_metrics_df(
                y_true=y_true,
                y_pred=y_pred,
                series_id=s_id,
            )
        )

    if not per_series_metrics:
        return pd.DataFrame(), pd.DataFrame()

    total_metrics = pd.concat(per_series_metrics, axis=1)
    if total_metrics.empty:
        return total_metrics, pd.DataFrame()

    # (mean column, median column, source metric row), in output order.
    aggregate_spec = (
        (
            SupportedMetrics.MEAN_SMAPE,
            SupportedMetrics.MEDIAN_SMAPE,
            SupportedMetrics.SMAPE,
        ),
        (
            SupportedMetrics.MEAN_MAPE,
            SupportedMetrics.MEDIAN_MAPE,
            SupportedMetrics.MAPE,
        ),
        (
            SupportedMetrics.MEAN_RMSE,
            SupportedMetrics.MEDIAN_RMSE,
            SupportedMetrics.RMSE,
        ),
        (
            SupportedMetrics.MEAN_R2,
            SupportedMetrics.MEDIAN_R2,
            SupportedMetrics.R2,
        ),
        (
            SupportedMetrics.MEAN_EXPLAINED_VARIANCE,
            SupportedMetrics.MEDIAN_EXPLAINED_VARIANCE,
            SupportedMetrics.EXPLAINED_VARIANCE,
        ),
    )
    aggregates = {}
    for mean_key, median_key, metric in aggregate_spec:
        across_series = total_metrics.loc[metric]
        aggregates[mean_key] = np.mean(across_series)
        aggregates[median_key] = np.median(across_series)
    aggregates[SupportedMetrics.ELAPSED_TIME] = elapsed_time

    summary_metrics = pd.DataFrame(aggregates, index=["All Targets"])

    # Calculates Mean sMAPE, Median sMAPE, Mean MAPE, Median MAPE, Mean wMAPE,
    # Median wMAPE values for each horizon if the horizon is within the limit.
    if horizon <= SUMMARY_METRICS_HORIZON_LIMIT:
        metrics_per_horizon = _build_metrics_per_horizon(
            test_data=data,
            output=self.forecast_output,
        )
        if not metrics_per_horizon.empty:
            summary_metrics = pd.concat([summary_metrics, metrics_per_horizon])

            # The wMAPE columns are not part of the "All Targets" row built
            # above, so the reorder is only applied once the per-horizon
            # rows have been appended.
            new_column_order = [
                SupportedMetrics.MEAN_SMAPE,
                SupportedMetrics.MEDIAN_SMAPE,
                SupportedMetrics.MEAN_MAPE,
                SupportedMetrics.MEDIAN_MAPE,
                SupportedMetrics.MEAN_WMAPE,
                SupportedMetrics.MEDIAN_WMAPE,
                SupportedMetrics.MEAN_RMSE,
                SupportedMetrics.MEDIAN_RMSE,
                SupportedMetrics.MEAN_R2,
                SupportedMetrics.MEDIAN_R2,
                SupportedMetrics.MEAN_EXPLAINED_VARIANCE,
                SupportedMetrics.MEDIAN_EXPLAINED_VARIANCE,
                SupportedMetrics.ELAPSED_TIME,
            ]
            summary_metrics = summary_metrics[new_column_order]

    return total_metrics, summary_metrics
466
+
467
def _save_report(
    self,
    report_sections: Tuple,
    result_df: pd.DataFrame,
    metrics_df: pd.DataFrame,
    test_metrics_df: pd.DataFrame,
    test_data: pd.DataFrame,
):
    """Write the enabled output artifacts to the output directory and collect them.

    Depending on the ``generate_*`` flags of ``self.spec`` this saves the HTML
    report, the forecast CSV, the training/test metrics CSVs, the global/local
    explanation CSVs, the model parameters JSON, the pickled models and the
    errors JSON under ``self.spec.output_directory.url``.

    Parameters
    ----------
    report_sections: Tuple
        Sections unpacked into ``rc.Block`` when rendering the HTML report.
    result_df: pd.DataFrame
        Forecast results. The ``DataColumns.Series`` column is dropped when
        ``self.target_cat_col`` is falsy.
    metrics_df: pd.DataFrame
        Training metrics. When ``None`` a warning is logged instead.
    test_metrics_df: pd.DataFrame
        Test metrics. Only considered when ``self.datasets.test_data`` is set;
        when ``None`` a warning is logged instead.
    test_data: pd.DataFrame
        Currently unused (see the TODO in the forecast section).

    Returns
    -------
    ForecastResults
        Container populated with every artifact that was produced.
    """

    def _round_numeric_columns(frame):
        # Round numeric columns to 4 decimal places; other dtypes pass through.
        return frame.copy().apply(
            lambda col: np.round(col, 4)
            if np.issubdtype(col.dtype, np.number)
            else col
        )

    unique_output_dir = self.spec.output_directory.url
    results = ForecastResults()

    # A signer is only requested when the destination is an OCI path.
    storage_options = (
        default_signer()
        if ObjectStorageDetails.is_oci_path(unique_output_dir)
        else {}
    )

    # report-creator html report
    if self.spec.generate_report:
        with tempfile.TemporaryDirectory() as temp_dir:
            report_local_path = os.path.join(temp_dir, "___report.html")
            disable_print()
            try:
                with rc.ReportCreator("My Report") as report:
                    report.save(rc.Block(*report_sections), report_local_path)
            finally:
                # Always restore printing, even if rendering the report fails.
                enable_print()

            # Upload while the temporary directory still exists.
            report_path = os.path.join(unique_output_dir, self.spec.report_filename)
            write_file(
                local_filename=report_local_path,
                remote_filename=report_path,
                storage_options=storage_options,
            )

    # forecast csv report
    # TODO: add test data into forecast.csv (``test_data`` is not used yet)
    result_df = (
        result_df
        if self.target_cat_col
        else result_df.drop(DataColumns.Series, axis=1)
    )
    if self.spec.generate_forecast_file:
        write_data(
            data=result_df,
            filename=os.path.join(unique_output_dir, self.spec.forecast_filename),
            format="csv",
            storage_options=storage_options,
        )
    results.set_forecast(result_df)

    # metrics csv report
    if self.spec.generate_metrics:
        metrics_col_name = (
            self.original_target_column
            if self.datasets.has_artificial_series()
            else "Series 1"
        )
        if metrics_df is not None:
            metrics_df_formatted = metrics_df.reset_index().rename(
                {"index": "metrics", "Series 1": metrics_col_name}, axis=1
            )
            if self.spec.generate_metrics_file:
                write_data(
                    data=metrics_df_formatted,
                    filename=os.path.join(
                        unique_output_dir, self.spec.metrics_filename
                    ),
                    format="csv",
                    storage_options=storage_options,
                    index=False,
                )
            results.set_metrics(metrics_df_formatted)
        else:
            logger.warning(
                f"Attempted to generate the {self.spec.metrics_filename} file with the training metrics, however the training metrics could not be properly generated."
            )

        # test_metrics csv report
        # Kept under ``generate_metrics`` because it reuses ``metrics_col_name``.
        if self.datasets.test_data is not None:
            if test_metrics_df is not None:
                test_metrics_df_formatted = test_metrics_df.reset_index().rename(
                    {"index": "metrics", "Series 1": metrics_col_name}, axis=1
                )
                if self.spec.generate_metrics_file:
                    write_data(
                        data=test_metrics_df_formatted,
                        filename=os.path.join(
                            unique_output_dir, self.spec.test_metrics_filename
                        ),
                        format="csv",
                        storage_options=storage_options,
                        index=False,
                    )
                results.set_test_metrics(test_metrics_df_formatted)
            else:
                logger.warning(
                    f"Attempted to generate the {self.spec.test_metrics_filename} file with the test metrics, however the test metrics could not be properly generated."
                )

    # explanations csv reports
    if self.spec.generate_explanations:
        try:
            if not self.formatted_global_explanation.empty:
                # Round to 4 decimal places before writing
                global_expl_rounded = _round_numeric_columns(
                    self.formatted_global_explanation
                )
                if self.spec.generate_explanation_files:
                    write_data(
                        data=global_expl_rounded,
                        filename=os.path.join(
                            unique_output_dir, self.spec.global_explanation_filename
                        ),
                        format="csv",
                        storage_options=storage_options,
                        index=True,
                    )
                results.set_global_explanations(global_expl_rounded)
            else:
                logger.warning(
                    f"Attempted to generate global explanations for the {self.spec.global_explanation_filename} file, but an issue occured in formatting the explanations."
                )

            if not self.formatted_local_explanation.empty:
                # Round to 4 decimal places before writing
                local_expl_rounded = _round_numeric_columns(
                    self.formatted_local_explanation
                )
                if self.spec.generate_explanation_files:
                    write_data(
                        data=local_expl_rounded,
                        filename=os.path.join(
                            unique_output_dir, self.spec.local_explanation_filename
                        ),
                        format="csv",
                        storage_options=storage_options,
                        index=True,
                    )
                results.set_local_explanations(local_expl_rounded)
            else:
                logger.warning(
                    f"Attempted to generate local explanations for the {self.spec.local_explanation_filename} file, but an issue occured in formatting the explanations."
                )
        except AttributeError as e:
            # Raised when the formatted explanations are not available on this model.
            logger.warning(
                "Unable to generate explanations for this model type or for this dataset."
            )
            logger.debug(f"Got error: {e.args}")

    if self.spec.generate_model_parameters:
        # model params
        write_data(
            data=pd.DataFrame.from_dict(self.model_parameters),
            filename=os.path.join(unique_output_dir, "model_params.json"),
            format="json",
            storage_options=storage_options,
            index=True,
            indent=4,
        )
        results.set_model_parameters(self.model_parameters)

    # model pickle
    if self.spec.generate_model_pickle:
        self._save_model(unique_output_dir, storage_options)
        results.set_models(self.models)

    logger.info(
        f"The outputs have been successfully "
        f"generated and placed into the directory: {unique_output_dir}."
    )
    print(
        f"The outputs have been successfully generated and placed into the directory: {unique_output_dir}."
    )
    if self.errors_dict:
        write_json(
            json_dict=self.errors_dict,
            filename=os.path.join(
                unique_output_dir, self.spec.errors_dict_filename
            ),
            storage_options=storage_options,
        )
        results.set_errors_dict(self.errors_dict)
    else:
        logger.info("All modeling completed successfully.")
    return results
662
+
663
def preprocess(self, df, series_id):
    """Rename the datetime/target columns to ``ds``/``y`` and label-encode the rest.

    The encoder(s) returned by ``_label_encode_dataframe`` are stored in
    ``self.le[series_id]``; the encoded frame is returned.
    """
    column_aliases = {self.dt_column_name: "ds", self.original_target_column: "y"}
    renamed_df = df.rename(column_aliases, axis=1)
    # "ds" and "y" are excluded from label encoding.
    encoders, df_encoded = _label_encode_dataframe(renamed_df, no_encode={"ds", "y"})
    self.le[series_id] = encoders
    return df_encoded
672
+
673
+ @abstractmethod
674
+ def _generate_report(self):
675
+ """
676
+ Generates the report for the particular model.
677
+ The method that needs to be implemented on the particular model level.
678
+ """
679
+
680
+ @abstractmethod
681
+ def _build_model(self) -> pd.DataFrame:
682
+ """
683
+ Build the model.
684
+ The method that needs to be implemented on the particular model level.
685
+ """
686
+
687
def drop_horizon(self, df: pd.DataFrame) -> pd.DataFrame:
    """Return ``df`` without its trailing ``self.spec.horizon`` rows.

    Assumes a non-negative horizon. A horizon of 0 returns every row, and a
    horizon larger than ``len(df)`` returns an empty frame.
    """
    # ``df.iloc[:-horizon]`` would return an empty frame for horizon == 0
    # because ``-0 == 0``; slicing by an explicit row count avoids that.
    rows_to_keep = max(len(df) - self.spec.horizon, 0)
    return df.iloc[:rows_to_keep]
689
+
690
def get_horizon(self, df: pd.DataFrame) -> pd.DataFrame:
    """Return the trailing ``self.spec.horizon`` rows of ``df``.

    Assumes a non-negative horizon. A horizon of 0 returns an empty frame,
    and a horizon larger than ``len(df)`` returns every row.
    """
    # ``df.iloc[-horizon:]`` would return the whole frame for horizon == 0
    # because ``-0 == 0``; slicing from an explicit start row avoids that.
    first_horizon_row = max(len(df) - self.spec.horizon, 0)
    return df.iloc[first_horizon_row:]
692
+
693
def generate_train_metrics(self) -> pd.DataFrame:
    """Generate training metrics when fitted data is not available.

    Delegates to ``evaluate_train_metrics`` with ``self.forecast_output``.
    """
    forecast_output = self.forecast_output
    return evaluate_train_metrics(forecast_output)
699
+
700
def _load_model(self):
    """Load ``model.pkl`` from ``self.spec.previous_output_dir`` into ``self.loaded_models``.

    Best effort: any failure is logged at INFO level and swallowed, in which
    case ``self.loaded_models`` is not assigned by this method.
    """
    # NOTE(review): load_pkl presumably unpickles the file - make sure
    # previous_output_dir points to a trusted location.
    try:
        pickle_path = self.spec.previous_output_dir + "/model.pkl"
        self.loaded_models = load_pkl(pickle_path)
    except Exception as err:
        logger.info(f"model.pkl is not present. Error: {err}")
705
+
706
def _save_model(self, output_dir, storage_options):
    """Persist ``self.models`` as ``model.pkl`` in ``output_dir`` via ``write_pkl``."""
    pickle_kwargs = {
        "obj": self.models,
        "filename": "model.pkl",
        "output_dir": output_dir,
        "storage_options": storage_options,
    }
    write_pkl(**pickle_kwargs)
713
+
714
def _validate_automlx_explanation_mode(self):
    """Reject the AUTOMLX explanation accuracy mode for non-AutoMLX models.

    Raises
    ------
    ValueError
        If ``self.spec.model`` is not ``SupportedModels.AutoMLX`` while
        ``self.spec.explanations_accuracy_mode`` is ``SpeedAccuracyMode.AUTOMLX``.
    """
    if self.spec.model != SupportedModels.AutoMLX:
        # The mode is only inspected for non-AutoMLX models.
        requested_mode = self.spec.explanations_accuracy_mode
        if requested_mode == SpeedAccuracyMode.AUTOMLX:
            raise ValueError(
                "AUTOMLX explanation accuracy mode is only supported for AutoMLX models. "
                "Please select mode other than AUTOMLX from the available explanations_accuracy_mode options"
            )
723
+
724
@runtime_dependency(
    module="shap",
    err_msg=(
        "Please run `python3 -m pip install shap` to install the required dependencies for model explanation."
    ),
)
def explain_model(self):
    """
    Generates explanations for the models by using the SHAP (Shapley Additive exPlanations) library.

    For every series that has a model, a ``PermutationExplainer`` is built on the
    trailing part of the series data. The mean absolute SHAP value of every column
    after the first one is stored in ``self.global_explanation[series_id]``, and
    ``self.local_explainer`` is called to produce the local explanations.
    Failures for a single series are recorded in ``self.errors_dict`` and do not
    stop the remaining series.

    Returns
    -------
    None
        Results are stored on the instance; nothing is returned.
    """
    from shap import PermutationExplainer

    datetime_col_name = self.datasets._datetime_column_name

    global_ex_time = 0
    local_ex_time = 0
    logger.info(
        f"Calculating explanations using {self.spec.explanations_accuracy_mode} mode"
    )
    ratio = SpeedAccuracyMode.ratio[self.spec.explanations_accuracy_mode]

    # validate the automlx mode is use for automlx model
    self._validate_automlx_explanation_mode()

    for s_id, data_i in self.datasets.get_data_by_series(
        include_horizon=False
    ).items():
        if s_id in self.models:
            # Restart the clock for every series. Measuring from a single start
            # taken before the loop would re-add the time already spent on all
            # previous series (global and local) to the global total.
            exp_start_time = time.time()
            try:
                explain_predict_fn = self.get_explain_predict_fn(series_id=s_id)
                # Keep the last ``ratio`` share of the rows, but at least 5.
                data_trimmed = data_i.tail(
                    max(int(len(data_i) * ratio), 5)
                ).reset_index(drop=True)
                data_trimmed[datetime_col_name] = data_trimmed[
                    datetime_col_name
                ].apply(lambda x: x.timestamp())

                # Explainer fails when boolean columns are passed
                _, data_trimmed_encoded = _label_encode_dataframe(
                    data_trimmed,
                    no_encode={datetime_col_name, self.original_target_column},
                )

                kernel_explnr = PermutationExplainer(
                    model=explain_predict_fn, masker=data_trimmed_encoded
                )
                kernel_explnr_vals = kernel_explnr.shap_values(data_trimmed_encoded)
                exp_end_time = time.time()
                global_ex_time = global_ex_time + exp_end_time - exp_start_time
                self.local_explainer(
                    kernel_explnr,
                    series_id=s_id,
                    datetime_col_name=datetime_col_name,
                )
                local_ex_time = local_ex_time + time.time() - exp_end_time

                if not len(kernel_explnr_vals):
                    logger.warning(
                        "No explanations generated. Ensure that additional data has been provided."
                    )
                else:
                    # The first column is skipped on both sides
                    # (presumably the datetime column - TODO confirm).
                    self.global_explanation[s_id] = dict(
                        zip(
                            data_trimmed.columns[1:],
                            np.average(
                                np.absolute(kernel_explnr_vals[:, 1:]), axis=0
                            ),
                        )
                    )
            except Exception as e:
                # Record the failure for this series and carry on with the others.
                series_errors = self.errors_dict.setdefault(
                    s_id, {"model_name": self.spec.model}
                )
                series_errors["explainer_error"] = str(e)
                series_errors["explainer_error_trace"] = traceback.format_exc()
        else:
            logger.warning(
                f"Skipping explanations for {s_id}, as forecast was not generated."
            )

    logger.info(
        "Global explanations generation completed in %s seconds", global_ex_time
    )
    logger.info(
        "Local explanations generation completed in %s seconds", local_ex_time
    )
824
+
825
def local_explainer(self, kernel_explainer, series_id, datetime_col_name) -> None:
    """
    Generate local explanations for the horizon rows of one series.

    The resulting frame of SHAP values, with an added
    ``ForecastOutputColumns.DATE`` column, is stored in
    ``self.local_explanation[series_id]``.

    Parameters
    ----------
    kernel_explainer: The explainer object whose ``shap_values`` is used.
    series_id: Identifier of the series to explain.
    datetime_col_name: Name of the datetime column converted to seconds.
    """
    horizon_df = self.datasets.get_horizon_at_series(s_id=series_id)
    # The explainer is fed numeric timestamps instead of datetimes.
    horizon_df[datetime_col_name] = datetime_to_seconds(horizon_df[datetime_col_name])
    horizon_df = horizon_df.reset_index(drop=True)

    # Explainer fails when boolean columns are passed
    _, encoded_df = _label_encode_dataframe(
        horizon_df, no_encode={datetime_col_name, self.original_target_column}
    )

    # Local SHAP values, one row per horizon row and one column per feature
    shap_matrix = kernel_explainer.shap_values(encoded_df)
    explanation_df = pd.DataFrame(shap_matrix, columns=encoded_df.columns)

    # The horizon is fetched a second time to read the date column for the output.
    horizon_dates = self.datasets.get_horizon_at_series(s_id=series_id)[
        self.spec.datetime_column.name
    ].reset_index(drop=True)
    explanation_df[ForecastOutputColumns.DATE] = horizon_dates

    self.local_explanation[series_id] = explanation_df
857
+
858
def get_explain_predict_fn(self, series_id, fcst_col_name="yhat"):
    """Build the prediction callable handed to the explainer for one series.

    The model and the datetime column name are bound as default arguments
    when this method is called. The returned function reads
    ``fcst_col_name`` from the model's prediction output.
    """

    def _custom_predict(
        data,
        model=self.models[series_id]["model"],
        dt_column_name=self.datasets._datetime_column_name,
    ):
        """
        data: presumably shaped like ForecastDatasets.get_data_at_series(s_id),
        with the datetime column given in seconds. Note that ``data`` is
        modified in place (its datetime column is overwritten).
        """
        data[dt_column_name] = seconds_to_datetime(
            data[dt_column_name], dt_format=self.spec.datetime_column.format
        )
        prepared = self.preprocess(df=data, series_id=series_id)
        prepared[self.original_target_column] = None
        return model.predict(prepared)[fcst_col_name]

    return _custom_predict