oracle-ads 2.13.9rc0__py3-none-any.whl → 2.13.10rc0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (858)
  1. ads/aqua/__init__.py +40 -0
  2. ads/aqua/app.py +507 -0
  3. ads/aqua/cli.py +96 -0
  4. ads/aqua/client/__init__.py +3 -0
  5. ads/aqua/client/client.py +836 -0
  6. ads/aqua/client/openai_client.py +305 -0
  7. ads/aqua/common/__init__.py +5 -0
  8. ads/aqua/common/decorator.py +125 -0
  9. ads/aqua/common/entities.py +274 -0
  10. ads/aqua/common/enums.py +134 -0
  11. ads/aqua/common/errors.py +109 -0
  12. ads/aqua/common/utils.py +1295 -0
  13. ads/aqua/config/__init__.py +4 -0
  14. ads/aqua/config/container_config.py +247 -0
  15. ads/aqua/config/evaluation/__init__.py +4 -0
  16. ads/aqua/config/evaluation/evaluation_service_config.py +147 -0
  17. ads/aqua/config/utils/__init__.py +4 -0
  18. ads/aqua/config/utils/serializer.py +339 -0
  19. ads/aqua/constants.py +116 -0
  20. ads/aqua/data.py +14 -0
  21. ads/aqua/dummy_data/icon.txt +1 -0
  22. ads/aqua/dummy_data/oci_model_deployments.json +56 -0
  23. ads/aqua/dummy_data/oci_models.json +1 -0
  24. ads/aqua/dummy_data/readme.md +26 -0
  25. ads/aqua/evaluation/__init__.py +8 -0
  26. ads/aqua/evaluation/constants.py +53 -0
  27. ads/aqua/evaluation/entities.py +186 -0
  28. ads/aqua/evaluation/errors.py +70 -0
  29. ads/aqua/evaluation/evaluation.py +1814 -0
  30. ads/aqua/extension/__init__.py +42 -0
  31. ads/aqua/extension/aqua_ws_msg_handler.py +76 -0
  32. ads/aqua/extension/base_handler.py +90 -0
  33. ads/aqua/extension/common_handler.py +121 -0
  34. ads/aqua/extension/common_ws_msg_handler.py +36 -0
  35. ads/aqua/extension/deployment_handler.py +381 -0
  36. ads/aqua/extension/deployment_ws_msg_handler.py +54 -0
  37. ads/aqua/extension/errors.py +30 -0
  38. ads/aqua/extension/evaluation_handler.py +129 -0
  39. ads/aqua/extension/evaluation_ws_msg_handler.py +61 -0
  40. ads/aqua/extension/finetune_handler.py +96 -0
  41. ads/aqua/extension/model_handler.py +390 -0
  42. ads/aqua/extension/models/__init__.py +0 -0
  43. ads/aqua/extension/models/ws_models.py +145 -0
  44. ads/aqua/extension/models_ws_msg_handler.py +50 -0
  45. ads/aqua/extension/ui_handler.py +300 -0
  46. ads/aqua/extension/ui_websocket_handler.py +130 -0
  47. ads/aqua/extension/utils.py +133 -0
  48. ads/aqua/finetuning/__init__.py +7 -0
  49. ads/aqua/finetuning/constants.py +23 -0
  50. ads/aqua/finetuning/entities.py +181 -0
  51. ads/aqua/finetuning/finetuning.py +749 -0
  52. ads/aqua/model/__init__.py +8 -0
  53. ads/aqua/model/constants.py +60 -0
  54. ads/aqua/model/entities.py +385 -0
  55. ads/aqua/model/enums.py +32 -0
  56. ads/aqua/model/model.py +2134 -0
  57. ads/aqua/model/utils.py +52 -0
  58. ads/aqua/modeldeployment/__init__.py +6 -0
  59. ads/aqua/modeldeployment/constants.py +10 -0
  60. ads/aqua/modeldeployment/deployment.py +1315 -0
  61. ads/aqua/modeldeployment/entities.py +653 -0
  62. ads/aqua/modeldeployment/utils.py +543 -0
  63. ads/aqua/resources/gpu_shapes_index.json +94 -0
  64. ads/aqua/server/__init__.py +4 -0
  65. ads/aqua/server/__main__.py +24 -0
  66. ads/aqua/server/app.py +47 -0
  67. ads/aqua/server/aqua_spec.yml +1291 -0
  68. ads/aqua/training/__init__.py +4 -0
  69. ads/aqua/training/exceptions.py +476 -0
  70. ads/aqua/ui.py +519 -0
  71. ads/automl/__init__.py +9 -0
  72. ads/automl/driver.py +330 -0
  73. ads/automl/provider.py +975 -0
  74. ads/bds/__init__.py +5 -0
  75. ads/bds/auth.py +127 -0
  76. ads/bds/big_data_service.py +255 -0
  77. ads/catalog/__init__.py +19 -0
  78. ads/catalog/model.py +1576 -0
  79. ads/catalog/notebook.py +461 -0
  80. ads/catalog/project.py +468 -0
  81. ads/catalog/summary.py +178 -0
  82. ads/common/__init__.py +11 -0
  83. ads/common/analyzer.py +65 -0
  84. ads/common/artifact/.model-ignore +63 -0
  85. ads/common/artifact/__init__.py +10 -0
  86. ads/common/auth.py +1122 -0
  87. ads/common/card_identifier.py +83 -0
  88. ads/common/config.py +647 -0
  89. ads/common/data.py +165 -0
  90. ads/common/decorator/__init__.py +9 -0
  91. ads/common/decorator/argument_to_case.py +88 -0
  92. ads/common/decorator/deprecate.py +69 -0
  93. ads/common/decorator/require_nonempty_arg.py +65 -0
  94. ads/common/decorator/runtime_dependency.py +178 -0
  95. ads/common/decorator/threaded.py +97 -0
  96. ads/common/decorator/utils.py +35 -0
  97. ads/common/dsc_file_system.py +303 -0
  98. ads/common/error.py +14 -0
  99. ads/common/extended_enum.py +81 -0
  100. ads/common/function/__init__.py +5 -0
  101. ads/common/function/fn_util.py +142 -0
  102. ads/common/function/func_conf.yaml +25 -0
  103. ads/common/ipython.py +76 -0
  104. ads/common/model.py +679 -0
  105. ads/common/model_artifact.py +1759 -0
  106. ads/common/model_artifact_schema.json +107 -0
  107. ads/common/model_export_util.py +664 -0
  108. ads/common/model_metadata.py +24 -0
  109. ads/common/object_storage_details.py +296 -0
  110. ads/common/oci_client.py +179 -0
  111. ads/common/oci_datascience.py +46 -0
  112. ads/common/oci_logging.py +1144 -0
  113. ads/common/oci_mixin.py +957 -0
  114. ads/common/oci_resource.py +136 -0
  115. ads/common/serializer.py +559 -0
  116. ads/common/utils.py +1852 -0
  117. ads/common/word_lists.py +1491 -0
  118. ads/common/work_request.py +189 -0
  119. ads/config.py +1 -0
  120. ads/data_labeling/__init__.py +13 -0
  121. ads/data_labeling/boundingbox.py +253 -0
  122. ads/data_labeling/constants.py +47 -0
  123. ads/data_labeling/data_labeling_service.py +244 -0
  124. ads/data_labeling/interface/__init__.py +5 -0
  125. ads/data_labeling/interface/loader.py +16 -0
  126. ads/data_labeling/interface/parser.py +16 -0
  127. ads/data_labeling/interface/reader.py +23 -0
  128. ads/data_labeling/loader/__init__.py +5 -0
  129. ads/data_labeling/loader/file_loader.py +241 -0
  130. ads/data_labeling/metadata.py +110 -0
  131. ads/data_labeling/mixin/__init__.py +5 -0
  132. ads/data_labeling/mixin/data_labeling.py +232 -0
  133. ads/data_labeling/ner.py +129 -0
  134. ads/data_labeling/parser/__init__.py +5 -0
  135. ads/data_labeling/parser/dls_record_parser.py +388 -0
  136. ads/data_labeling/parser/export_metadata_parser.py +94 -0
  137. ads/data_labeling/parser/export_record_parser.py +473 -0
  138. ads/data_labeling/reader/__init__.py +5 -0
  139. ads/data_labeling/reader/dataset_reader.py +574 -0
  140. ads/data_labeling/reader/dls_record_reader.py +121 -0
  141. ads/data_labeling/reader/export_record_reader.py +62 -0
  142. ads/data_labeling/reader/jsonl_reader.py +75 -0
  143. ads/data_labeling/reader/metadata_reader.py +203 -0
  144. ads/data_labeling/reader/record_reader.py +263 -0
  145. ads/data_labeling/record.py +52 -0
  146. ads/data_labeling/visualizer/__init__.py +5 -0
  147. ads/data_labeling/visualizer/image_visualizer.py +525 -0
  148. ads/data_labeling/visualizer/text_visualizer.py +357 -0
  149. ads/database/__init__.py +5 -0
  150. ads/database/connection.py +338 -0
  151. ads/dataset/__init__.py +10 -0
  152. ads/dataset/capabilities.md +51 -0
  153. ads/dataset/classification_dataset.py +339 -0
  154. ads/dataset/correlation.py +226 -0
  155. ads/dataset/correlation_plot.py +563 -0
  156. ads/dataset/dask_series.py +173 -0
  157. ads/dataset/dataframe_transformer.py +110 -0
  158. ads/dataset/dataset.py +1979 -0
  159. ads/dataset/dataset_browser.py +360 -0
  160. ads/dataset/dataset_with_target.py +995 -0
  161. ads/dataset/exception.py +25 -0
  162. ads/dataset/factory.py +987 -0
  163. ads/dataset/feature_engineering_transformer.py +35 -0
  164. ads/dataset/feature_selection.py +107 -0
  165. ads/dataset/forecasting_dataset.py +26 -0
  166. ads/dataset/helper.py +1450 -0
  167. ads/dataset/label_encoder.py +99 -0
  168. ads/dataset/mixin/__init__.py +5 -0
  169. ads/dataset/mixin/dataset_accessor.py +134 -0
  170. ads/dataset/pipeline.py +58 -0
  171. ads/dataset/plot.py +710 -0
  172. ads/dataset/progress.py +86 -0
  173. ads/dataset/recommendation.py +297 -0
  174. ads/dataset/recommendation_transformer.py +502 -0
  175. ads/dataset/regression_dataset.py +14 -0
  176. ads/dataset/sampled_dataset.py +1050 -0
  177. ads/dataset/target.py +98 -0
  178. ads/dataset/timeseries.py +18 -0
  179. ads/dbmixin/__init__.py +5 -0
  180. ads/dbmixin/db_pandas_accessor.py +153 -0
  181. ads/environment/__init__.py +9 -0
  182. ads/environment/ml_runtime.py +66 -0
  183. ads/evaluations/README.md +14 -0
  184. ads/evaluations/__init__.py +109 -0
  185. ads/evaluations/evaluation_plot.py +983 -0
  186. ads/evaluations/evaluator.py +1334 -0
  187. ads/evaluations/statistical_metrics.py +543 -0
  188. ads/experiments/__init__.py +9 -0
  189. ads/experiments/capabilities.md +0 -0
  190. ads/explanations/__init__.py +21 -0
  191. ads/explanations/base_explainer.py +142 -0
  192. ads/explanations/capabilities.md +83 -0
  193. ads/explanations/explainer.py +190 -0
  194. ads/explanations/mlx_global_explainer.py +1050 -0
  195. ads/explanations/mlx_interface.py +386 -0
  196. ads/explanations/mlx_local_explainer.py +287 -0
  197. ads/explanations/mlx_whatif_explainer.py +201 -0
  198. ads/feature_engineering/__init__.py +20 -0
  199. ads/feature_engineering/accessor/__init__.py +5 -0
  200. ads/feature_engineering/accessor/dataframe_accessor.py +535 -0
  201. ads/feature_engineering/accessor/mixin/__init__.py +5 -0
  202. ads/feature_engineering/accessor/mixin/correlation.py +166 -0
  203. ads/feature_engineering/accessor/mixin/eda_mixin.py +266 -0
  204. ads/feature_engineering/accessor/mixin/eda_mixin_series.py +85 -0
  205. ads/feature_engineering/accessor/mixin/feature_types_mixin.py +211 -0
  206. ads/feature_engineering/accessor/mixin/utils.py +65 -0
  207. ads/feature_engineering/accessor/series_accessor.py +431 -0
  208. ads/feature_engineering/adsimage/__init__.py +5 -0
  209. ads/feature_engineering/adsimage/image.py +192 -0
  210. ads/feature_engineering/adsimage/image_reader.py +170 -0
  211. ads/feature_engineering/adsimage/interface/__init__.py +5 -0
  212. ads/feature_engineering/adsimage/interface/reader.py +19 -0
  213. ads/feature_engineering/adsstring/__init__.py +7 -0
  214. ads/feature_engineering/adsstring/oci_language/__init__.py +8 -0
  215. ads/feature_engineering/adsstring/string/__init__.py +8 -0
  216. ads/feature_engineering/data_schema.json +57 -0
  217. ads/feature_engineering/dataset/__init__.py +5 -0
  218. ads/feature_engineering/dataset/zip_code_data.py +42062 -0
  219. ads/feature_engineering/exceptions.py +40 -0
  220. ads/feature_engineering/feature_type/__init__.py +133 -0
  221. ads/feature_engineering/feature_type/address.py +184 -0
  222. ads/feature_engineering/feature_type/adsstring/__init__.py +5 -0
  223. ads/feature_engineering/feature_type/adsstring/common_regex_mixin.py +164 -0
  224. ads/feature_engineering/feature_type/adsstring/oci_language.py +93 -0
  225. ads/feature_engineering/feature_type/adsstring/parsers/__init__.py +5 -0
  226. ads/feature_engineering/feature_type/adsstring/parsers/base.py +47 -0
  227. ads/feature_engineering/feature_type/adsstring/parsers/nltk_parser.py +96 -0
  228. ads/feature_engineering/feature_type/adsstring/parsers/spacy_parser.py +221 -0
  229. ads/feature_engineering/feature_type/adsstring/string.py +258 -0
  230. ads/feature_engineering/feature_type/base.py +58 -0
  231. ads/feature_engineering/feature_type/boolean.py +183 -0
  232. ads/feature_engineering/feature_type/category.py +146 -0
  233. ads/feature_engineering/feature_type/constant.py +137 -0
  234. ads/feature_engineering/feature_type/continuous.py +151 -0
  235. ads/feature_engineering/feature_type/creditcard.py +314 -0
  236. ads/feature_engineering/feature_type/datetime.py +190 -0
  237. ads/feature_engineering/feature_type/discrete.py +134 -0
  238. ads/feature_engineering/feature_type/document.py +43 -0
  239. ads/feature_engineering/feature_type/gis.py +251 -0
  240. ads/feature_engineering/feature_type/handler/__init__.py +5 -0
  241. ads/feature_engineering/feature_type/handler/feature_validator.py +524 -0
  242. ads/feature_engineering/feature_type/handler/feature_warning.py +319 -0
  243. ads/feature_engineering/feature_type/handler/warnings.py +128 -0
  244. ads/feature_engineering/feature_type/integer.py +142 -0
  245. ads/feature_engineering/feature_type/ip_address.py +144 -0
  246. ads/feature_engineering/feature_type/ip_address_v4.py +138 -0
  247. ads/feature_engineering/feature_type/ip_address_v6.py +138 -0
  248. ads/feature_engineering/feature_type/lat_long.py +256 -0
  249. ads/feature_engineering/feature_type/object.py +43 -0
  250. ads/feature_engineering/feature_type/ordinal.py +132 -0
  251. ads/feature_engineering/feature_type/phone_number.py +135 -0
  252. ads/feature_engineering/feature_type/string.py +171 -0
  253. ads/feature_engineering/feature_type/text.py +93 -0
  254. ads/feature_engineering/feature_type/unknown.py +43 -0
  255. ads/feature_engineering/feature_type/zip_code.py +164 -0
  256. ads/feature_engineering/feature_type_manager.py +406 -0
  257. ads/feature_engineering/schema.py +795 -0
  258. ads/feature_engineering/utils.py +245 -0
  259. ads/feature_store/.readthedocs.yaml +19 -0
  260. ads/feature_store/README.md +65 -0
  261. ads/feature_store/__init__.py +9 -0
  262. ads/feature_store/common/__init__.py +0 -0
  263. ads/feature_store/common/enums.py +339 -0
  264. ads/feature_store/common/exceptions.py +18 -0
  265. ads/feature_store/common/spark_session_singleton.py +125 -0
  266. ads/feature_store/common/utils/__init__.py +0 -0
  267. ads/feature_store/common/utils/base64_encoder_decoder.py +72 -0
  268. ads/feature_store/common/utils/feature_schema_mapper.py +283 -0
  269. ads/feature_store/common/utils/transformation_utils.py +82 -0
  270. ads/feature_store/common/utils/utility.py +403 -0
  271. ads/feature_store/data_validation/__init__.py +0 -0
  272. ads/feature_store/data_validation/great_expectation.py +129 -0
  273. ads/feature_store/dataset.py +1230 -0
  274. ads/feature_store/dataset_job.py +530 -0
  275. ads/feature_store/docs/Dockerfile +7 -0
  276. ads/feature_store/docs/Makefile +44 -0
  277. ads/feature_store/docs/conf.py +28 -0
  278. ads/feature_store/docs/requirements.txt +14 -0
  279. ads/feature_store/docs/source/ads.feature_store.query.rst +20 -0
  280. ads/feature_store/docs/source/cicd.rst +137 -0
  281. ads/feature_store/docs/source/conf.py +86 -0
  282. ads/feature_store/docs/source/data_versioning.rst +33 -0
  283. ads/feature_store/docs/source/dataset.rst +388 -0
  284. ads/feature_store/docs/source/dataset_job.rst +27 -0
  285. ads/feature_store/docs/source/demo.rst +70 -0
  286. ads/feature_store/docs/source/entity.rst +78 -0
  287. ads/feature_store/docs/source/feature_group.rst +624 -0
  288. ads/feature_store/docs/source/feature_group_job.rst +29 -0
  289. ads/feature_store/docs/source/feature_store.rst +122 -0
  290. ads/feature_store/docs/source/feature_store_class.rst +123 -0
  291. ads/feature_store/docs/source/feature_validation.rst +66 -0
  292. ads/feature_store/docs/source/figures/cicd.png +0 -0
  293. ads/feature_store/docs/source/figures/data_validation.png +0 -0
  294. ads/feature_store/docs/source/figures/data_versioning.png +0 -0
  295. ads/feature_store/docs/source/figures/dataset.gif +0 -0
  296. ads/feature_store/docs/source/figures/dataset.png +0 -0
  297. ads/feature_store/docs/source/figures/dataset_lineage.png +0 -0
  298. ads/feature_store/docs/source/figures/dataset_statistics.png +0 -0
  299. ads/feature_store/docs/source/figures/dataset_statistics_viz.png +0 -0
  300. ads/feature_store/docs/source/figures/dataset_validation_results.png +0 -0
  301. ads/feature_store/docs/source/figures/dataset_validation_summary.png +0 -0
  302. ads/feature_store/docs/source/figures/drift_monitoring.png +0 -0
  303. ads/feature_store/docs/source/figures/entity.png +0 -0
  304. ads/feature_store/docs/source/figures/feature_group.png +0 -0
  305. ads/feature_store/docs/source/figures/feature_group_lineage.png +0 -0
  306. ads/feature_store/docs/source/figures/feature_group_statistics_viz.png +0 -0
  307. ads/feature_store/docs/source/figures/feature_store_deployment.png +0 -0
  308. ads/feature_store/docs/source/figures/feature_store_overview.png +0 -0
  309. ads/feature_store/docs/source/figures/featuregroup.gif +0 -0
  310. ads/feature_store/docs/source/figures/lineage_d1.png +0 -0
  311. ads/feature_store/docs/source/figures/lineage_d2.png +0 -0
  312. ads/feature_store/docs/source/figures/lineage_fg.png +0 -0
  313. ads/feature_store/docs/source/figures/logo-dark-mode.png +0 -0
  314. ads/feature_store/docs/source/figures/logo-light-mode.png +0 -0
  315. ads/feature_store/docs/source/figures/overview.png +0 -0
  316. ads/feature_store/docs/source/figures/resource_manager.png +0 -0
  317. ads/feature_store/docs/source/figures/resource_manager_feature_store_stack.png +0 -0
  318. ads/feature_store/docs/source/figures/resource_manager_home.png +0 -0
  319. ads/feature_store/docs/source/figures/stats_1.png +0 -0
  320. ads/feature_store/docs/source/figures/stats_2.png +0 -0
  321. ads/feature_store/docs/source/figures/stats_d.png +0 -0
  322. ads/feature_store/docs/source/figures/stats_fg.png +0 -0
  323. ads/feature_store/docs/source/figures/transformation.png +0 -0
  324. ads/feature_store/docs/source/figures/transformations.gif +0 -0
  325. ads/feature_store/docs/source/figures/validation.png +0 -0
  326. ads/feature_store/docs/source/figures/validation_fg.png +0 -0
  327. ads/feature_store/docs/source/figures/validation_results.png +0 -0
  328. ads/feature_store/docs/source/figures/validation_summary.png +0 -0
  329. ads/feature_store/docs/source/index.rst +81 -0
  330. ads/feature_store/docs/source/module.rst +8 -0
  331. ads/feature_store/docs/source/notebook.rst +94 -0
  332. ads/feature_store/docs/source/overview.rst +47 -0
  333. ads/feature_store/docs/source/quickstart.rst +176 -0
  334. ads/feature_store/docs/source/release_notes.rst +194 -0
  335. ads/feature_store/docs/source/setup_feature_store.rst +81 -0
  336. ads/feature_store/docs/source/statistics.rst +58 -0
  337. ads/feature_store/docs/source/transformation.rst +199 -0
  338. ads/feature_store/docs/source/ui.rst +65 -0
  339. ads/feature_store/docs/source/user_guides.setup.feature_store_operator.rst +66 -0
  340. ads/feature_store/docs/source/user_guides.setup.helm_chart.rst +192 -0
  341. ads/feature_store/docs/source/user_guides.setup.terraform.rst +338 -0
  342. ads/feature_store/entity.py +718 -0
  343. ads/feature_store/execution_strategy/__init__.py +0 -0
  344. ads/feature_store/execution_strategy/delta_lake/__init__.py +0 -0
  345. ads/feature_store/execution_strategy/delta_lake/delta_lake_service.py +375 -0
  346. ads/feature_store/execution_strategy/engine/__init__.py +0 -0
  347. ads/feature_store/execution_strategy/engine/spark_engine.py +316 -0
  348. ads/feature_store/execution_strategy/execution_strategy.py +113 -0
  349. ads/feature_store/execution_strategy/execution_strategy_provider.py +47 -0
  350. ads/feature_store/execution_strategy/spark/__init__.py +0 -0
  351. ads/feature_store/execution_strategy/spark/spark_execution.py +618 -0
  352. ads/feature_store/feature.py +192 -0
  353. ads/feature_store/feature_group.py +1494 -0
  354. ads/feature_store/feature_group_expectation.py +346 -0
  355. ads/feature_store/feature_group_job.py +602 -0
  356. ads/feature_store/feature_lineage/__init__.py +0 -0
  357. ads/feature_store/feature_lineage/graphviz_service.py +180 -0
  358. ads/feature_store/feature_option_details.py +50 -0
  359. ads/feature_store/feature_statistics/__init__.py +0 -0
  360. ads/feature_store/feature_statistics/statistics_service.py +99 -0
  361. ads/feature_store/feature_store.py +699 -0
  362. ads/feature_store/feature_store_registrar.py +518 -0
  363. ads/feature_store/input_feature_detail.py +149 -0
  364. ads/feature_store/mixin/__init__.py +4 -0
  365. ads/feature_store/mixin/oci_feature_store.py +145 -0
  366. ads/feature_store/model_details.py +73 -0
  367. ads/feature_store/query/__init__.py +0 -0
  368. ads/feature_store/query/filter.py +266 -0
  369. ads/feature_store/query/generator/__init__.py +0 -0
  370. ads/feature_store/query/generator/query_generator.py +298 -0
  371. ads/feature_store/query/join.py +161 -0
  372. ads/feature_store/query/query.py +403 -0
  373. ads/feature_store/query/validator/__init__.py +0 -0
  374. ads/feature_store/query/validator/query_validator.py +57 -0
  375. ads/feature_store/response/__init__.py +0 -0
  376. ads/feature_store/response/response_builder.py +68 -0
  377. ads/feature_store/service/__init__.py +0 -0
  378. ads/feature_store/service/oci_dataset.py +139 -0
  379. ads/feature_store/service/oci_dataset_job.py +199 -0
  380. ads/feature_store/service/oci_entity.py +125 -0
  381. ads/feature_store/service/oci_feature_group.py +164 -0
  382. ads/feature_store/service/oci_feature_group_job.py +214 -0
  383. ads/feature_store/service/oci_feature_store.py +182 -0
  384. ads/feature_store/service/oci_lineage.py +87 -0
  385. ads/feature_store/service/oci_transformation.py +104 -0
  386. ads/feature_store/statistics/__init__.py +0 -0
  387. ads/feature_store/statistics/abs_feature_value.py +49 -0
  388. ads/feature_store/statistics/charts/__init__.py +0 -0
  389. ads/feature_store/statistics/charts/abstract_feature_plot.py +37 -0
  390. ads/feature_store/statistics/charts/box_plot.py +148 -0
  391. ads/feature_store/statistics/charts/frequency_distribution.py +65 -0
  392. ads/feature_store/statistics/charts/probability_distribution.py +68 -0
  393. ads/feature_store/statistics/charts/top_k_frequent_elements.py +98 -0
  394. ads/feature_store/statistics/feature_stat.py +126 -0
  395. ads/feature_store/statistics/generic_feature_value.py +33 -0
  396. ads/feature_store/statistics/statistics.py +41 -0
  397. ads/feature_store/statistics_config.py +101 -0
  398. ads/feature_store/templates/feature_store_template.yaml +45 -0
  399. ads/feature_store/transformation.py +499 -0
  400. ads/feature_store/validation_output.py +57 -0
  401. ads/hpo/__init__.py +9 -0
  402. ads/hpo/_imports.py +91 -0
  403. ads/hpo/ads_search_space.py +439 -0
  404. ads/hpo/distributions.py +325 -0
  405. ads/hpo/objective.py +280 -0
  406. ads/hpo/search_cv.py +1657 -0
  407. ads/hpo/stopping_criterion.py +75 -0
  408. ads/hpo/tuner_artifact.py +413 -0
  409. ads/hpo/utils.py +91 -0
  410. ads/hpo/validation.py +140 -0
  411. ads/hpo/visualization/__init__.py +5 -0
  412. ads/hpo/visualization/_contour.py +23 -0
  413. ads/hpo/visualization/_edf.py +20 -0
  414. ads/hpo/visualization/_intermediate_values.py +21 -0
  415. ads/hpo/visualization/_optimization_history.py +25 -0
  416. ads/hpo/visualization/_parallel_coordinate.py +169 -0
  417. ads/hpo/visualization/_param_importances.py +26 -0
  418. ads/jobs/__init__.py +53 -0
  419. ads/jobs/ads_job.py +663 -0
  420. ads/jobs/builders/__init__.py +5 -0
  421. ads/jobs/builders/base.py +156 -0
  422. ads/jobs/builders/infrastructure/__init__.py +6 -0
  423. ads/jobs/builders/infrastructure/base.py +165 -0
  424. ads/jobs/builders/infrastructure/dataflow.py +1252 -0
  425. ads/jobs/builders/infrastructure/dsc_job.py +1894 -0
  426. ads/jobs/builders/infrastructure/dsc_job_runtime.py +1233 -0
  427. ads/jobs/builders/infrastructure/utils.py +65 -0
  428. ads/jobs/builders/runtimes/__init__.py +5 -0
  429. ads/jobs/builders/runtimes/artifact.py +338 -0
  430. ads/jobs/builders/runtimes/base.py +325 -0
  431. ads/jobs/builders/runtimes/container_runtime.py +242 -0
  432. ads/jobs/builders/runtimes/python_runtime.py +1016 -0
  433. ads/jobs/builders/runtimes/pytorch_runtime.py +204 -0
  434. ads/jobs/cli.py +104 -0
  435. ads/jobs/env_var_parser.py +131 -0
  436. ads/jobs/extension.py +160 -0
  437. ads/jobs/schema/__init__.py +5 -0
  438. ads/jobs/schema/infrastructure_schema.json +116 -0
  439. ads/jobs/schema/job_schema.json +42 -0
  440. ads/jobs/schema/runtime_schema.json +183 -0
  441. ads/jobs/schema/validator.py +141 -0
  442. ads/jobs/serializer.py +296 -0
  443. ads/jobs/templates/__init__.py +5 -0
  444. ads/jobs/templates/container.py +6 -0
  445. ads/jobs/templates/driver_notebook.py +177 -0
  446. ads/jobs/templates/driver_oci.py +500 -0
  447. ads/jobs/templates/driver_python.py +48 -0
  448. ads/jobs/templates/driver_pytorch.py +852 -0
  449. ads/jobs/templates/driver_utils.py +615 -0
  450. ads/jobs/templates/hostname_from_env.c +55 -0
  451. ads/jobs/templates/oci_metrics.py +181 -0
  452. ads/jobs/utils.py +104 -0
  453. ads/llm/__init__.py +28 -0
  454. ads/llm/autogen/__init__.py +2 -0
  455. ads/llm/autogen/constants.py +15 -0
  456. ads/llm/autogen/reports/__init__.py +2 -0
  457. ads/llm/autogen/reports/base.py +67 -0
  458. ads/llm/autogen/reports/data.py +103 -0
  459. ads/llm/autogen/reports/session.py +526 -0
  460. ads/llm/autogen/reports/templates/chat_box.html +13 -0
  461. ads/llm/autogen/reports/templates/chat_box_lt.html +5 -0
  462. ads/llm/autogen/reports/templates/chat_box_rt.html +6 -0
  463. ads/llm/autogen/reports/utils.py +56 -0
  464. ads/llm/autogen/v02/__init__.py +4 -0
  465. ads/llm/autogen/v02/client.py +295 -0
  466. ads/llm/autogen/v02/log_handlers/__init__.py +2 -0
  467. ads/llm/autogen/v02/log_handlers/oci_file_handler.py +83 -0
  468. ads/llm/autogen/v02/loggers/__init__.py +6 -0
  469. ads/llm/autogen/v02/loggers/metric_logger.py +320 -0
  470. ads/llm/autogen/v02/loggers/session_logger.py +580 -0
  471. ads/llm/autogen/v02/loggers/utils.py +86 -0
  472. ads/llm/autogen/v02/runtime_logging.py +163 -0
  473. ads/llm/chain.py +268 -0
  474. ads/llm/chat_template.py +31 -0
  475. ads/llm/deploy.py +63 -0
  476. ads/llm/guardrails/__init__.py +5 -0
  477. ads/llm/guardrails/base.py +442 -0
  478. ads/llm/guardrails/huggingface.py +44 -0
  479. ads/llm/langchain/__init__.py +5 -0
  480. ads/llm/langchain/plugins/__init__.py +5 -0
  481. ads/llm/langchain/plugins/chat_models/__init__.py +5 -0
  482. ads/llm/langchain/plugins/chat_models/oci_data_science.py +1027 -0
  483. ads/llm/langchain/plugins/embeddings/__init__.py +4 -0
  484. ads/llm/langchain/plugins/embeddings/oci_data_science_model_deployment_endpoint.py +184 -0
  485. ads/llm/langchain/plugins/llms/__init__.py +5 -0
  486. ads/llm/langchain/plugins/llms/oci_data_science_model_deployment_endpoint.py +979 -0
  487. ads/llm/requirements.txt +3 -0
  488. ads/llm/serialize.py +219 -0
  489. ads/llm/serializers/__init__.py +0 -0
  490. ads/llm/serializers/retrieval_qa.py +153 -0
  491. ads/llm/serializers/runnable_parallel.py +27 -0
  492. ads/llm/templates/score_chain.jinja2 +155 -0
  493. ads/llm/templates/tool_chat_template_hermes.jinja +130 -0
  494. ads/llm/templates/tool_chat_template_mistral_parallel.jinja +94 -0
  495. ads/model/__init__.py +52 -0
  496. ads/model/artifact.py +573 -0
  497. ads/model/artifact_downloader.py +254 -0
  498. ads/model/artifact_uploader.py +267 -0
  499. ads/model/base_properties.py +238 -0
  500. ads/model/common/.model-ignore +66 -0
  501. ads/model/common/__init__.py +5 -0
  502. ads/model/common/utils.py +142 -0
  503. ads/model/datascience_model.py +2635 -0
  504. ads/model/deployment/__init__.py +20 -0
  505. ads/model/deployment/common/__init__.py +5 -0
  506. ads/model/deployment/common/utils.py +308 -0
  507. ads/model/deployment/model_deployer.py +466 -0
  508. ads/model/deployment/model_deployment.py +1846 -0
  509. ads/model/deployment/model_deployment_infrastructure.py +671 -0
  510. ads/model/deployment/model_deployment_properties.py +493 -0
  511. ads/model/deployment/model_deployment_runtime.py +838 -0
  512. ads/model/extractor/__init__.py +5 -0
  513. ads/model/extractor/automl_extractor.py +74 -0
  514. ads/model/extractor/embedding_onnx_extractor.py +80 -0
  515. ads/model/extractor/huggingface_extractor.py +88 -0
  516. ads/model/extractor/keras_extractor.py +84 -0
  517. ads/model/extractor/lightgbm_extractor.py +93 -0
  518. ads/model/extractor/model_info_extractor.py +114 -0
  519. ads/model/extractor/model_info_extractor_factory.py +105 -0
  520. ads/model/extractor/pytorch_extractor.py +87 -0
  521. ads/model/extractor/sklearn_extractor.py +112 -0
  522. ads/model/extractor/spark_extractor.py +89 -0
  523. ads/model/extractor/tensorflow_extractor.py +85 -0
  524. ads/model/extractor/xgboost_extractor.py +94 -0
  525. ads/model/framework/__init__.py +5 -0
  526. ads/model/framework/automl_model.py +178 -0
  527. ads/model/framework/embedding_onnx_model.py +438 -0
  528. ads/model/framework/huggingface_model.py +399 -0
  529. ads/model/framework/lightgbm_model.py +266 -0
  530. ads/model/framework/pytorch_model.py +266 -0
  531. ads/model/framework/sklearn_model.py +250 -0
  532. ads/model/framework/spark_model.py +326 -0
  533. ads/model/framework/tensorflow_model.py +254 -0
  534. ads/model/framework/xgboost_model.py +258 -0
  535. ads/model/generic_model.py +3518 -0
  536. ads/model/model_artifact_boilerplate/README.md +381 -0
  537. ads/model/model_artifact_boilerplate/__init__.py +5 -0
  538. ads/model/model_artifact_boilerplate/artifact_introspection_test/__init__.py +5 -0
  539. ads/model/model_artifact_boilerplate/artifact_introspection_test/model_artifact_validate.py +427 -0
  540. ads/model/model_artifact_boilerplate/artifact_introspection_test/requirements.txt +2 -0
  541. ads/model/model_artifact_boilerplate/runtime.yaml +7 -0
  542. ads/model/model_artifact_boilerplate/score.py +61 -0
  543. ads/model/model_file_description_schema.json +68 -0
  544. ads/model/model_introspect.py +331 -0
  545. ads/model/model_metadata.py +1810 -0
  546. ads/model/model_metadata_mixin.py +460 -0
  547. ads/model/model_properties.py +63 -0
  548. ads/model/model_version_set.py +739 -0
  549. ads/model/runtime/__init__.py +5 -0
  550. ads/model/runtime/env_info.py +306 -0
  551. ads/model/runtime/model_deployment_details.py +37 -0
  552. ads/model/runtime/model_provenance_details.py +58 -0
  553. ads/model/runtime/runtime_info.py +81 -0
  554. ads/model/runtime/schemas/inference_env_info_schema.yaml +16 -0
  555. ads/model/runtime/schemas/model_provenance_schema.yaml +36 -0
  556. ads/model/runtime/schemas/training_env_info_schema.yaml +16 -0
  557. ads/model/runtime/utils.py +201 -0
  558. ads/model/serde/__init__.py +5 -0
  559. ads/model/serde/common.py +40 -0
  560. ads/model/serde/model_input.py +547 -0
  561. ads/model/serde/model_serializer.py +1184 -0
  562. ads/model/service/__init__.py +5 -0
  563. ads/model/service/oci_datascience_model.py +1076 -0
  564. ads/model/service/oci_datascience_model_deployment.py +500 -0
  565. ads/model/service/oci_datascience_model_version_set.py +176 -0
  566. ads/model/transformer/__init__.py +5 -0
  567. ads/model/transformer/onnx_transformer.py +324 -0
  568. ads/mysqldb/__init__.py +5 -0
  569. ads/mysqldb/mysql_db.py +227 -0
  570. ads/opctl/__init__.py +18 -0
  571. ads/opctl/anomaly_detection.py +11 -0
  572. ads/opctl/backend/__init__.py +5 -0
  573. ads/opctl/backend/ads_dataflow.py +353 -0
  574. ads/opctl/backend/ads_ml_job.py +710 -0
  575. ads/opctl/backend/ads_ml_pipeline.py +164 -0
  576. ads/opctl/backend/ads_model_deployment.py +209 -0
  577. ads/opctl/backend/base.py +146 -0
  578. ads/opctl/backend/local.py +1053 -0
  579. ads/opctl/backend/marketplace/__init__.py +9 -0
  580. ads/opctl/backend/marketplace/helm_helper.py +173 -0
  581. ads/opctl/backend/marketplace/local_marketplace.py +271 -0
  582. ads/opctl/backend/marketplace/marketplace_backend_runner.py +71 -0
  583. ads/opctl/backend/marketplace/marketplace_operator_interface.py +44 -0
  584. ads/opctl/backend/marketplace/marketplace_operator_runner.py +24 -0
  585. ads/opctl/backend/marketplace/marketplace_utils.py +212 -0
  586. ads/opctl/backend/marketplace/models/__init__.py +5 -0
  587. ads/opctl/backend/marketplace/models/bearer_token.py +94 -0
  588. ads/opctl/backend/marketplace/models/marketplace_type.py +70 -0
  589. ads/opctl/backend/marketplace/models/ocir_details.py +56 -0
  590. ads/opctl/backend/marketplace/prerequisite_checker.py +238 -0
  591. ads/opctl/cli.py +707 -0
  592. ads/opctl/cmds.py +869 -0
  593. ads/opctl/conda/__init__.py +5 -0
  594. ads/opctl/conda/cli.py +193 -0
  595. ads/opctl/conda/cmds.py +749 -0
  596. ads/opctl/conda/config.yaml +34 -0
  597. ads/opctl/conda/manifest_template.yaml +13 -0
  598. ads/opctl/conda/multipart_uploader.py +188 -0
  599. ads/opctl/conda/pack.py +89 -0
  600. ads/opctl/config/__init__.py +5 -0
  601. ads/opctl/config/base.py +57 -0
  602. ads/opctl/config/diagnostics/__init__.py +5 -0
  603. ads/opctl/config/diagnostics/distributed/default_requirements_config.yaml +62 -0
  604. ads/opctl/config/merger.py +255 -0
  605. ads/opctl/config/resolver.py +297 -0
  606. ads/opctl/config/utils.py +79 -0
  607. ads/opctl/config/validator.py +17 -0
  608. ads/opctl/config/versioner.py +68 -0
  609. ads/opctl/config/yaml_parsers/__init__.py +7 -0
  610. ads/opctl/config/yaml_parsers/base.py +58 -0
  611. ads/opctl/config/yaml_parsers/distributed/__init__.py +7 -0
  612. ads/opctl/config/yaml_parsers/distributed/yaml_parser.py +201 -0
  613. ads/opctl/constants.py +66 -0
  614. ads/opctl/decorator/__init__.py +5 -0
  615. ads/opctl/decorator/common.py +129 -0
  616. ads/opctl/diagnostics/__init__.py +5 -0
  617. ads/opctl/diagnostics/__main__.py +25 -0
  618. ads/opctl/diagnostics/check_distributed_job_requirements.py +212 -0
  619. ads/opctl/diagnostics/check_requirements.py +144 -0
  620. ads/opctl/diagnostics/requirement_exception.py +9 -0
  621. ads/opctl/distributed/README.md +109 -0
  622. ads/opctl/distributed/__init__.py +5 -0
  623. ads/opctl/distributed/certificates.py +32 -0
  624. ads/opctl/distributed/cli.py +207 -0
  625. ads/opctl/distributed/cmds.py +731 -0
  626. ads/opctl/distributed/common/__init__.py +5 -0
  627. ads/opctl/distributed/common/abstract_cluster_provider.py +449 -0
  628. ads/opctl/distributed/common/abstract_framework_spec_builder.py +88 -0
  629. ads/opctl/distributed/common/cluster_config_helper.py +103 -0
  630. ads/opctl/distributed/common/cluster_provider_factory.py +21 -0
  631. ads/opctl/distributed/common/cluster_runner.py +54 -0
  632. ads/opctl/distributed/common/framework_factory.py +29 -0
  633. ads/opctl/docker/Dockerfile.job +103 -0
  634. ads/opctl/docker/Dockerfile.job.arm +107 -0
  635. ads/opctl/docker/Dockerfile.job.gpu +175 -0
  636. ads/opctl/docker/base-env.yaml +13 -0
  637. ads/opctl/docker/cuda.repo +6 -0
  638. ads/opctl/docker/operator/.dockerignore +0 -0
  639. ads/opctl/docker/operator/Dockerfile +41 -0
  640. ads/opctl/docker/operator/Dockerfile.gpu +85 -0
  641. ads/opctl/docker/operator/cuda.repo +6 -0
  642. ads/opctl/docker/operator/environment.yaml +8 -0
  643. ads/opctl/forecast.py +11 -0
  644. ads/opctl/index.yaml +3 -0
  645. ads/opctl/model/__init__.py +5 -0
  646. ads/opctl/model/cli.py +65 -0
  647. ads/opctl/model/cmds.py +73 -0
  648. ads/opctl/operator/README.md +4 -0
  649. ads/opctl/operator/__init__.py +31 -0
  650. ads/opctl/operator/cli.py +344 -0
  651. ads/opctl/operator/cmd.py +596 -0
  652. ads/opctl/operator/common/__init__.py +5 -0
  653. ads/opctl/operator/common/backend_factory.py +460 -0
  654. ads/opctl/operator/common/const.py +27 -0
  655. ads/opctl/operator/common/data/synthetic.csv +16001 -0
  656. ads/opctl/operator/common/dictionary_merger.py +148 -0
  657. ads/opctl/operator/common/errors.py +42 -0
  658. ads/opctl/operator/common/operator_config.py +99 -0
  659. ads/opctl/operator/common/operator_loader.py +811 -0
  660. ads/opctl/operator/common/operator_schema.yaml +130 -0
  661. ads/opctl/operator/common/operator_yaml_generator.py +152 -0
  662. ads/opctl/operator/common/utils.py +208 -0
  663. ads/opctl/operator/lowcode/__init__.py +5 -0
  664. ads/opctl/operator/lowcode/anomaly/MLoperator +16 -0
  665. ads/opctl/operator/lowcode/anomaly/README.md +207 -0
  666. ads/opctl/operator/lowcode/anomaly/__init__.py +5 -0
  667. ads/opctl/operator/lowcode/anomaly/__main__.py +103 -0
  668. ads/opctl/operator/lowcode/anomaly/cmd.py +35 -0
  669. ads/opctl/operator/lowcode/anomaly/const.py +167 -0
  670. ads/opctl/operator/lowcode/anomaly/environment.yaml +10 -0
  671. ads/opctl/operator/lowcode/anomaly/model/__init__.py +5 -0
  672. ads/opctl/operator/lowcode/anomaly/model/anomaly_dataset.py +146 -0
  673. ads/opctl/operator/lowcode/anomaly/model/anomaly_merlion.py +162 -0
  674. ads/opctl/operator/lowcode/anomaly/model/automlx.py +99 -0
  675. ads/opctl/operator/lowcode/anomaly/model/autots.py +115 -0
  676. ads/opctl/operator/lowcode/anomaly/model/base_model.py +404 -0
  677. ads/opctl/operator/lowcode/anomaly/model/factory.py +110 -0
  678. ads/opctl/operator/lowcode/anomaly/model/isolationforest.py +78 -0
  679. ads/opctl/operator/lowcode/anomaly/model/oneclasssvm.py +78 -0
  680. ads/opctl/operator/lowcode/anomaly/model/randomcutforest.py +120 -0
  681. ads/opctl/operator/lowcode/anomaly/model/tods.py +119 -0
  682. ads/opctl/operator/lowcode/anomaly/operator_config.py +127 -0
  683. ads/opctl/operator/lowcode/anomaly/schema.yaml +401 -0
  684. ads/opctl/operator/lowcode/anomaly/utils.py +88 -0
  685. ads/opctl/operator/lowcode/common/__init__.py +5 -0
  686. ads/opctl/operator/lowcode/common/const.py +10 -0
  687. ads/opctl/operator/lowcode/common/data.py +116 -0
  688. ads/opctl/operator/lowcode/common/errors.py +47 -0
  689. ads/opctl/operator/lowcode/common/transformations.py +296 -0
  690. ads/opctl/operator/lowcode/common/utils.py +384 -0
  691. ads/opctl/operator/lowcode/feature_store_marketplace/MLoperator +13 -0
  692. ads/opctl/operator/lowcode/feature_store_marketplace/README.md +30 -0
  693. ads/opctl/operator/lowcode/feature_store_marketplace/__init__.py +5 -0
  694. ads/opctl/operator/lowcode/feature_store_marketplace/__main__.py +116 -0
  695. ads/opctl/operator/lowcode/feature_store_marketplace/cmd.py +85 -0
  696. ads/opctl/operator/lowcode/feature_store_marketplace/const.py +15 -0
  697. ads/opctl/operator/lowcode/feature_store_marketplace/environment.yaml +0 -0
  698. ads/opctl/operator/lowcode/feature_store_marketplace/models/__init__.py +4 -0
  699. ads/opctl/operator/lowcode/feature_store_marketplace/models/apigw_config.py +32 -0
  700. ads/opctl/operator/lowcode/feature_store_marketplace/models/db_config.py +43 -0
  701. ads/opctl/operator/lowcode/feature_store_marketplace/models/mysql_config.py +120 -0
  702. ads/opctl/operator/lowcode/feature_store_marketplace/models/serializable_yaml_model.py +34 -0
  703. ads/opctl/operator/lowcode/feature_store_marketplace/operator_utils.py +386 -0
  704. ads/opctl/operator/lowcode/feature_store_marketplace/schema.yaml +160 -0
  705. ads/opctl/operator/lowcode/forecast/MLoperator +25 -0
  706. ads/opctl/operator/lowcode/forecast/README.md +209 -0
  707. ads/opctl/operator/lowcode/forecast/__init__.py +5 -0
  708. ads/opctl/operator/lowcode/forecast/__main__.py +89 -0
  709. ads/opctl/operator/lowcode/forecast/cmd.py +40 -0
  710. ads/opctl/operator/lowcode/forecast/const.py +92 -0
  711. ads/opctl/operator/lowcode/forecast/environment.yaml +20 -0
  712. ads/opctl/operator/lowcode/forecast/errors.py +26 -0
  713. ads/opctl/operator/lowcode/forecast/model/__init__.py +5 -0
  714. ads/opctl/operator/lowcode/forecast/model/arima.py +279 -0
  715. ads/opctl/operator/lowcode/forecast/model/automlx.py +553 -0
  716. ads/opctl/operator/lowcode/forecast/model/autots.py +312 -0
  717. ads/opctl/operator/lowcode/forecast/model/base_model.py +875 -0
  718. ads/opctl/operator/lowcode/forecast/model/factory.py +106 -0
  719. ads/opctl/operator/lowcode/forecast/model/forecast_datasets.py +492 -0
  720. ads/opctl/operator/lowcode/forecast/model/ml_forecast.py +243 -0
  721. ads/opctl/operator/lowcode/forecast/model/neuralprophet.py +482 -0
  722. ads/opctl/operator/lowcode/forecast/model/prophet.py +450 -0
  723. ads/opctl/operator/lowcode/forecast/model_evaluator.py +244 -0
  724. ads/opctl/operator/lowcode/forecast/operator_config.py +234 -0
  725. ads/opctl/operator/lowcode/forecast/schema.yaml +506 -0
  726. ads/opctl/operator/lowcode/forecast/utils.py +397 -0
  727. ads/opctl/operator/lowcode/forecast/whatifserve/__init__.py +7 -0
  728. ads/opctl/operator/lowcode/forecast/whatifserve/deployment_manager.py +285 -0
  729. ads/opctl/operator/lowcode/forecast/whatifserve/score.py +246 -0
  730. ads/opctl/operator/lowcode/pii/MLoperator +17 -0
  731. ads/opctl/operator/lowcode/pii/README.md +208 -0
  732. ads/opctl/operator/lowcode/pii/__init__.py +5 -0
  733. ads/opctl/operator/lowcode/pii/__main__.py +78 -0
  734. ads/opctl/operator/lowcode/pii/cmd.py +39 -0
  735. ads/opctl/operator/lowcode/pii/constant.py +84 -0
  736. ads/opctl/operator/lowcode/pii/environment.yaml +17 -0
  737. ads/opctl/operator/lowcode/pii/errors.py +27 -0
  738. ads/opctl/operator/lowcode/pii/model/__init__.py +5 -0
  739. ads/opctl/operator/lowcode/pii/model/factory.py +82 -0
  740. ads/opctl/operator/lowcode/pii/model/guardrails.py +167 -0
  741. ads/opctl/operator/lowcode/pii/model/pii.py +145 -0
  742. ads/opctl/operator/lowcode/pii/model/processor/__init__.py +34 -0
  743. ads/opctl/operator/lowcode/pii/model/processor/email_replacer.py +34 -0
  744. ads/opctl/operator/lowcode/pii/model/processor/mbi_replacer.py +35 -0
  745. ads/opctl/operator/lowcode/pii/model/processor/name_replacer.py +225 -0
  746. ads/opctl/operator/lowcode/pii/model/processor/number_replacer.py +73 -0
  747. ads/opctl/operator/lowcode/pii/model/processor/remover.py +26 -0
  748. ads/opctl/operator/lowcode/pii/model/report.py +487 -0
  749. ads/opctl/operator/lowcode/pii/operator_config.py +95 -0
  750. ads/opctl/operator/lowcode/pii/schema.yaml +108 -0
  751. ads/opctl/operator/lowcode/pii/utils.py +43 -0
  752. ads/opctl/operator/lowcode/recommender/MLoperator +16 -0
  753. ads/opctl/operator/lowcode/recommender/README.md +206 -0
  754. ads/opctl/operator/lowcode/recommender/__init__.py +5 -0
  755. ads/opctl/operator/lowcode/recommender/__main__.py +82 -0
  756. ads/opctl/operator/lowcode/recommender/cmd.py +33 -0
  757. ads/opctl/operator/lowcode/recommender/constant.py +30 -0
  758. ads/opctl/operator/lowcode/recommender/environment.yaml +11 -0
  759. ads/opctl/operator/lowcode/recommender/model/base_model.py +212 -0
  760. ads/opctl/operator/lowcode/recommender/model/factory.py +56 -0
  761. ads/opctl/operator/lowcode/recommender/model/recommender_dataset.py +25 -0
  762. ads/opctl/operator/lowcode/recommender/model/svd.py +106 -0
  763. ads/opctl/operator/lowcode/recommender/operator_config.py +81 -0
  764. ads/opctl/operator/lowcode/recommender/schema.yaml +265 -0
  765. ads/opctl/operator/lowcode/recommender/utils.py +13 -0
  766. ads/opctl/operator/runtime/__init__.py +5 -0
  767. ads/opctl/operator/runtime/const.py +17 -0
  768. ads/opctl/operator/runtime/container_runtime_schema.yaml +50 -0
  769. ads/opctl/operator/runtime/marketplace_runtime.py +50 -0
  770. ads/opctl/operator/runtime/python_marketplace_runtime_schema.yaml +21 -0
  771. ads/opctl/operator/runtime/python_runtime_schema.yaml +21 -0
  772. ads/opctl/operator/runtime/runtime.py +115 -0
  773. ads/opctl/schema.yaml.yml +36 -0
  774. ads/opctl/script.py +40 -0
  775. ads/opctl/spark/__init__.py +5 -0
  776. ads/opctl/spark/cli.py +43 -0
  777. ads/opctl/spark/cmds.py +147 -0
  778. ads/opctl/templates/diagnostic_report_template.jinja2 +102 -0
  779. ads/opctl/utils.py +344 -0
  780. ads/oracledb/__init__.py +5 -0
  781. ads/oracledb/oracle_db.py +346 -0
  782. ads/pipeline/__init__.py +39 -0
  783. ads/pipeline/ads_pipeline.py +2279 -0
  784. ads/pipeline/ads_pipeline_run.py +772 -0
  785. ads/pipeline/ads_pipeline_step.py +605 -0
  786. ads/pipeline/builders/__init__.py +5 -0
  787. ads/pipeline/builders/infrastructure/__init__.py +5 -0
  788. ads/pipeline/builders/infrastructure/custom_script.py +32 -0
  789. ads/pipeline/cli.py +119 -0
  790. ads/pipeline/extension.py +291 -0
  791. ads/pipeline/schema/__init__.py +5 -0
  792. ads/pipeline/schema/cs_step_schema.json +35 -0
  793. ads/pipeline/schema/ml_step_schema.json +31 -0
  794. ads/pipeline/schema/pipeline_schema.json +71 -0
  795. ads/pipeline/visualizer/__init__.py +5 -0
  796. ads/pipeline/visualizer/base.py +570 -0
  797. ads/pipeline/visualizer/graph_renderer.py +272 -0
  798. ads/pipeline/visualizer/text_renderer.py +84 -0
  799. ads/secrets/__init__.py +11 -0
  800. ads/secrets/adb.py +386 -0
  801. ads/secrets/auth_token.py +86 -0
  802. ads/secrets/big_data_service.py +365 -0
  803. ads/secrets/mysqldb.py +149 -0
  804. ads/secrets/oracledb.py +160 -0
  805. ads/secrets/secrets.py +407 -0
  806. ads/telemetry/__init__.py +7 -0
  807. ads/telemetry/base.py +69 -0
  808. ads/telemetry/client.py +122 -0
  809. ads/telemetry/telemetry.py +257 -0
  810. ads/templates/dataflow_pyspark.jinja2 +13 -0
  811. ads/templates/dataflow_sparksql.jinja2 +22 -0
  812. ads/templates/func.jinja2 +20 -0
  813. ads/templates/schemas/openapi.json +1740 -0
  814. ads/templates/score-pkl.jinja2 +173 -0
  815. ads/templates/score.jinja2 +322 -0
  816. ads/templates/score_embedding_onnx.jinja2 +202 -0
  817. ads/templates/score_generic.jinja2 +165 -0
  818. ads/templates/score_huggingface_pipeline.jinja2 +217 -0
  819. ads/templates/score_lightgbm.jinja2 +185 -0
  820. ads/templates/score_onnx.jinja2 +407 -0
  821. ads/templates/score_onnx_new.jinja2 +473 -0
  822. ads/templates/score_oracle_automl.jinja2 +185 -0
  823. ads/templates/score_pyspark.jinja2 +154 -0
  824. ads/templates/score_pytorch.jinja2 +219 -0
  825. ads/templates/score_scikit-learn.jinja2 +184 -0
  826. ads/templates/score_tensorflow.jinja2 +184 -0
  827. ads/templates/score_xgboost.jinja2 +178 -0
  828. ads/text_dataset/__init__.py +5 -0
  829. ads/text_dataset/backends.py +211 -0
  830. ads/text_dataset/dataset.py +445 -0
  831. ads/text_dataset/extractor.py +207 -0
  832. ads/text_dataset/options.py +53 -0
  833. ads/text_dataset/udfs.py +22 -0
  834. ads/text_dataset/utils.py +49 -0
  835. ads/type_discovery/__init__.py +9 -0
  836. ads/type_discovery/abstract_detector.py +21 -0
  837. ads/type_discovery/constant_detector.py +41 -0
  838. ads/type_discovery/continuous_detector.py +54 -0
  839. ads/type_discovery/credit_card_detector.py +99 -0
  840. ads/type_discovery/datetime_detector.py +92 -0
  841. ads/type_discovery/discrete_detector.py +118 -0
  842. ads/type_discovery/document_detector.py +146 -0
  843. ads/type_discovery/ip_detector.py +68 -0
  844. ads/type_discovery/latlon_detector.py +90 -0
  845. ads/type_discovery/phone_number_detector.py +63 -0
  846. ads/type_discovery/type_discovery_driver.py +87 -0
  847. ads/type_discovery/typed_feature.py +594 -0
  848. ads/type_discovery/unknown_detector.py +41 -0
  849. ads/type_discovery/zipcode_detector.py +48 -0
  850. ads/vault/__init__.py +7 -0
  851. ads/vault/vault.py +237 -0
  852. {oracle_ads-2.13.9rc0.dist-info → oracle_ads-2.13.10rc0.dist-info}/METADATA +150 -149
  853. oracle_ads-2.13.10rc0.dist-info/RECORD +858 -0
  854. {oracle_ads-2.13.9rc0.dist-info → oracle_ads-2.13.10rc0.dist-info}/WHEEL +1 -2
  855. {oracle_ads-2.13.9rc0.dist-info → oracle_ads-2.13.10rc0.dist-info}/entry_points.txt +2 -1
  856. oracle_ads-2.13.9rc0.dist-info/RECORD +0 -9
  857. oracle_ads-2.13.9rc0.dist-info/top_level.txt +0 -1
  858. {oracle_ads-2.13.9rc0.dist-info → oracle_ads-2.13.10rc0.dist-info}/licenses/LICENSE.txt +0 -0
@@ -0,0 +1,1233 @@
1
+ #!/usr/bin/env python
2
+ # -*- coding: utf-8; -*-
3
+
4
+ # Copyright (c) 2021, 2024 Oracle and/or its affiliates.
5
+ # Licensed under the Universal Permissive License v 1.0 as shown at https://oss.oracle.com/licenses/upl/
6
+ """Contains classes for conversion between ADS runtime and OCI Data Science Job implementation.
7
+ This module is for ADS developers only.
8
+ In this module, a payload is defined as a dictionary for initializing a DSCJob object.
9
+ The DSCJob can be initialized with the same arguments for initializing oci.data_science.models.Job,
10
+ plus an "artifact" argument for job artifact.
11
+ The payload also contains infrastructure information.
12
+ The conversion from a runtime to a payload is called translate in this module.
13
+ The conversion from a DSCJob to a runtime is called extract in this module.
14
+ """
15
+ from __future__ import annotations
16
+
17
+ import json
18
+ import os
19
+ import shlex
20
+ from typing import Optional
21
+ from urllib import parse
22
+ from ads.common.utils import extract_region
23
+ from ads.jobs.builders.runtimes.base import Runtime
24
+ from ads.jobs.builders.runtimes.python_runtime import (
25
+ CondaRuntime,
26
+ ScriptRuntime,
27
+ PythonRuntime,
28
+ NotebookRuntime,
29
+ GitPythonRuntime,
30
+ )
31
+ from ads.jobs.builders.runtimes.container_runtime import ContainerRuntime
32
+ from ads.jobs.builders.runtimes.pytorch_runtime import (
33
+ PyTorchDistributedRuntime,
34
+ PyTorchDistributedArtifact,
35
+ )
36
+ from ads.jobs.builders.runtimes.artifact import (
37
+ ScriptArtifact,
38
+ NotebookArtifact,
39
+ PythonArtifact,
40
+ GitPythonArtifact,
41
+ )
42
+ from ads.opctl.distributed.common import cluster_config_helper
43
+ from ads.jobs.builders.infrastructure.utils import get_value
44
+ from ads.jobs.templates import driver_utils
45
+
46
+
47
class IncompatibleRuntime(Exception):  # pragma: no cover
    """Raised when a job configuration cannot be converted to a given runtime.

    An OCI data science job does not record which ADS runtime type created it,
    so each runtime handler has to decide for itself whether the job
    configuration can be converted to the runtime it handles.
    A handler raises this exception from ``extract()`` when the conversion is
    not possible; the RuntimeManager relies on it to tell whether a conversion
    succeeded.
    """
55
+
56
+
57
+ class RuntimeHandler:
58
+ """Base class for Runtime Handler.
59
+
60
+ Each runtime handler should define the RUNTIME_CLASS to be the runtime it can handle.
61
+
62
+ Each runtime handler is initialized with a DataScienceJob instance.
63
+ This instance is a reference and the modification will be exposed to the users.
64
+
65
+ Each runtime handler exposes two methods: translate() and extract().
66
+ In this class, translate or extract signals the direction of conversion.
67
+ All methods starting with "translate" handle the conversion from ADS runtime to OCI API payload.
68
+ All methods starting with "extract" handle the conversion from OCI data science Job to ADS runtime.
69
+ This base class defines the default handling for translate() and extract().
70
+ Each sub-class can override the two methods to provide additional handling.
71
+ Alternatively, a sub-class can also override a sub-method, which is called by the translate() or extract() method.
72
+ For example, _translate_env() handles the conversion of environment variables from ADS runtime to OCI API payload.
73
+
74
+ See the individual methods for more details.
75
+ """
76
+
77
+ # Defines the class of the runtime to be handled.
78
+ RUNTIME_CLASS = Runtime
79
+
80
def __init__(self, data_science_job) -> None:
    """Bind the handler to a data science job.

    Parameters
    ----------
    data_science_job : DataScienceJob
        The DataScienceJob instance to be created or extracted from.
        The handler stores a reference to it, not a copy.
    """
    self.data_science_job = data_science_job
89
+
90
def translate(self, runtime: Runtime) -> dict:
    """Build the OCI API payload for a runtime.

    The payload is assembled from the following sub-methods:
    * _translate_artifact()
    * _translate_config(), which in turn calls _translate_env()
    A sub-class can override one or more of these methods.
    Freeform and defined tags are copied to the payload only when they are
    set on the runtime. The runtime is also stored on the data science job
    held by this handler.

    Parameters
    ----------
    runtime : Runtime
        An instance of the runtime to be converted to a JSON payload.

    Returns
    -------
    dict
        JSON payload for defining a Data Science Job with OCI API
    """
    payload = {
        "artifact": self._translate_artifact(runtime),
        "job_configuration_details": self._translate_config(runtime),
    }
    # Tags are optional: leave the key out entirely when nothing is set.
    for tag_key in ("freeform_tags", "defined_tags"):
        tag_value = getattr(runtime, tag_key)
        if tag_value:
            payload[tag_key] = tag_value
    self.data_science_job.runtime = runtime
    return payload
117
+
118
def _translate_artifact(self, runtime: Runtime):
    """Translate the runtime artifact.

    OCI data science requires an artifact file to be uploaded before the job
    is created:
    * For Python runtime, the artifact is the script for running the job.
    * For container runtime, the artifact is not actually used.
    * For notebook runtime, ADS needs to convert the artifact to a Python
      script before uploading.

    This base implementation provides no artifact and always returns None.

    Parameters
    ----------
    runtime : Runtime
        An instance of the runtime

    Returns
    -------
    str or Artifact
        The artifact that is ready to be used by DSCJob.
        This can either be a string storing the path to the artifact file,
        or an instance of Artifact class, which contains logic for additional
        processing.
    """
    return None
138
+
139
def _translate_env(self, runtime: Runtime) -> dict:
    """Translate runtime settings into job environment variables.

    OCI Data Science job uses environment variables for various settings,
    which are properties in ADS runtime. This method is the hook for
    converting those properties to environment variables.
    The base implementation performs no conversion and returns the
    runtime's ``envs`` as is; sub-classes override it to add conversion logic.

    Parameters
    ----------
    runtime : Runtime
        An instance of the runtime

    Returns
    -------
    dict
        A dictionary storing the environment variable for OCI data science job.
    """
    return runtime.envs
159
+
160
def _translate_config(self, runtime: Runtime) -> dict:
    """Prepare the job configuration from runtime specifications.

    Parameters
    ----------
    runtime : Runtime
        An instance of the runtime

    Returns
    -------
    dict
        A dictionary for OCI data science job configuration with the keys:
        "jobType" (always),
        "environment_variables" (always, from _translate_env()),
        "maximum_runtime_in_minutes" (only when set on the runtime),
        "command_line_arguments" (only when the runtime has arguments).
        The configurations will be used to initialize the DSCJob instance.
        The DSCJob class can handle keys in either camel or snake format.
    """
    config = {"jobType": self.data_science_job.job_type}

    max_minutes = runtime.maximum_runtime_in_minutes
    if max_minutes:
        config["maximum_runtime_in_minutes"] = max_minutes

    config["environment_variables"] = self._translate_env(runtime)

    if runtime.args:
        # shlex.join() is not available until python 3.8,
        # so each argument is quoted individually and joined by hand.
        quoted_args = [
            shlex.quote(str(arg)) for arg in runtime.get_spec(runtime.CONST_ARGS)
        ]
        config["command_line_arguments"] = " ".join(quoted_args)
    return config
196
+
197
@staticmethod
def _translate_specs(
    runtime: Runtime, spec_mappings: dict, delimiter: Optional[str] = None
) -> dict:
    """Converts runtime properties to OCI data science job environment variables based on a mapping.

    Parameters
    ----------
    runtime : Runtime
        The runtime containing the properties to be converted.
    spec_mappings : dict
        Mapping from runtime properties to environment variables.
        Each key is a specification key (property name) of a runtime
        Each value is the corresponding name of the environment variable in OCI data science job.
    delimiter : str, Optional
        Environment variables must be strings.
        For list or tuple, specify the delimiter for joining the values into a string.
        When the delimiter is None or empty, list and tuple values are
        passed through unchanged.

    Returns
    -------
    dict
        A dictionary containing environment variables for OCI data science job.
        Properties with a falsy value (None, empty string, empty list, ...)
        are left out.
    """
    envs = {}
    for spec_key, dsc_key in spec_mappings.items():
        val = runtime.get_spec(spec_key)
        if not val:
            continue
        # Join only when a delimiter was actually provided. The previous
        # condition `delimiter and isinstance(val, list) or isinstance(val, tuple)`
        # was parsed as `(delimiter and list) or tuple`, so a tuple value with
        # no delimiter ended up calling None.join() and raised AttributeError.
        if delimiter and isinstance(val, (list, tuple)):
            val = delimiter.join(val)
        envs[dsc_key] = val
    return envs
228
+
229
@staticmethod
def _extract_specs(envs: dict, spec_mappings: dict) -> dict:
    """Convert job environment variables back to runtime properties.

    Every environment variable named in the mapping is removed (popped)
    from ``envs``, so ``envs`` is modified in place. Only variables with a
    truthy value are copied to the result.

    This method does not convert strings into list or tuple as there is no
    way to identify them.

    Parameters
    ----------
    envs : dict
        A dictionary containing environment variables from OCI data science job.
    spec_mappings : dict
        Mapping from runtime properties to environment variables.
        This mapping is the same as the one in _translate_specs().

    Returns
    -------
    dict
        A dictionary for specifying the runtime.
    """
    extracted = {}
    for property_name, env_name in spec_mappings.items():
        env_value = envs.pop(env_name, None)
        if not env_value:
            continue
        extracted[property_name] = env_value
    return extracted
254
+
255
@staticmethod
def _format_env_var(runtime_spec: dict) -> dict:
    """Re-shape the environment variables of a runtime specification from dict to list.

    The list uses the same format as environment variables in Kubernetes:
    one ``{"name": ..., "value": ...}`` entry per variable.
    The specification is modified in place. The environment variable entry
    is removed from it first and put back only when it is a non-empty dict,
    so an empty or non-dict entry is dropped.

    Parameters
    ----------
    runtime_spec : dict
        Runtime specification in a dictionary.
        This is the dictionary that can be used to initialize a runtime instance.
        Except that environment variables are stored in a dict instead of list.

    Returns
    -------
    dict
        Runtime specification with environment variables stored in a list.
    """
    env_key = Runtime.CONST_ENV_VAR
    env_var = runtime_spec.pop(env_key, None)
    if not (env_var and isinstance(env_var, dict)):
        return runtime_spec
    runtime_spec[env_key] = [
        {"name": name, "value": value} for name, value in env_var.items()
    ]
    return runtime_spec
278
+
279
def extract(self, dsc_job):
    """Build a runtime from an OCI data science job object.

    The following sub-methods are called in order:
    * _extract_tags()
    * _extract_args()
    * _extract_envs()
    * _extract_artifact()
    * _extract_runtime_minutes()
    * _extract_properties()
    Each of them returns a dict for specifying the runtime.
    The dictionaries are merged (later ones override earlier ones on key
    collisions) and passed through _format_env_var() before initializing
    the runtime.
    A sub-class can override one or more of these methods.

    Parameters
    ----------
    dsc_job : DSCJob or oci.datascience.models.Job
        The data science job containing runtime information.

    Returns
    -------
    Runtime:
        The runtime extracted from the data science job.
    """
    extractors = (
        self._extract_tags,
        self._extract_args,
        self._extract_envs,
        self._extract_artifact,
        self._extract_runtime_minutes,
        self._extract_properties,
    )
    runtime_spec = {}
    for extractor in extractors:
        partial_spec = extractor(dsc_job)
        runtime_spec.update(partial_spec)
    formatted_spec = self._format_env_var(runtime_spec)
    return self.RUNTIME_CLASS(formatted_spec)
313
+
314
def _extract_properties(self, dsc_job) -> dict:
    """Extract the job runtime properties from data science job.

    The base implementation extracts nothing and returns an empty dict.
    Sub-classes should implement the extraction if needed.

    Parameters
    ----------
    dsc_job : DSCJob or oci.datascience.models.Job
        The data science job containing runtime information.

    Returns
    -------
    dict
        A runtime specification dictionary for initializing a runtime.
    """
    return {}
331
+
332
def _extract_args(self, dsc_job) -> dict:
    """Extract the command line arguments from data science job.

    The argument string stored in the job configuration is split into a
    list with shell-like syntax (``shlex.split``).

    Parameters
    ----------
    dsc_job : DSCJob or oci.datascience.models.Job
        The data science job containing runtime information.

    Returns
    -------
    dict
        A runtime specification dictionary for initializing a runtime.
        Empty when the job has no command line arguments.
    """
    args_string = get_value(
        dsc_job, "job_configuration_details.command_line_arguments"
    )
    if not args_string:
        return {}
    return {Runtime.CONST_ARGS: shlex.split(args_string)}
351
+
352
def _extract_envs(self, dsc_job):
    """Extract the environment variables from data science job.

    Parameters
    ----------
    dsc_job : DSCJob or oci.datascience.models.Job
        The data science job containing runtime information.

    Returns
    -------
    dict
        A runtime specification dictionary for initializing a runtime.
        Empty when the job defines no environment variables.
    """
    env_vars = get_value(dsc_job, "job_configuration_details.environment_variables")
    if not env_vars:
        return {}
    return {Runtime.CONST_ENV_VAR: env_vars}
369
+
370
def _extract_tags(self, dsc_job):
    """Extract the freeform tags and defined tags from data science job.

    Parameters
    ----------
    dsc_job : DSCJob or oci.datascience.models.Job
        The data science job containing runtime information.

    Returns
    -------
    dict
        A runtime specification dictionary for initializing a runtime.
        Only the kinds of tags that are set on the job are included.
    """
    tag_sources = (
        (Runtime.CONST_FREEFORM_TAGS, "freeform_tags"),
        (Runtime.CONST_DEFINED_TAGS, "defined_tags"),
    )
    tags = {}
    for spec_key, job_attr in tag_sources:
        tag_value = get_value(dsc_job, job_attr)
        if tag_value:
            tags[spec_key] = tag_value
    return tags
391
+
392
def _extract_artifact(self, dsc_job):
    """Extract the job artifact from data science job.

    The base implementation extracts nothing and returns an empty dict.
    Sub-classes should implement the extraction if needed.

    Parameters
    ----------
    dsc_job : DSCJob or oci.datascience.models.Job
        The data science job containing runtime information.

    Returns
    -------
    dict
        A runtime specification dictionary for initializing a runtime.
    """
    return {}
409
+
410
def _extract_runtime_minutes(self, dsc_job):
    """Extract the maximum runtime in minutes from data science job.

    Parameters
    ----------
    dsc_job : DSCJob or oci.datascience.models.Job
        The data science job containing runtime information.

    Returns
    -------
    dict
        A runtime specification dictionary for initializing a runtime.
        Empty when the job does not set a maximum runtime.
    """
    max_minutes = get_value(
        dsc_job, "job_configuration_details.maximum_runtime_in_minutes"
    )
    if not max_minutes:
        return {}
    return {Runtime.CONST_MAXIMUM_RUNTIME_IN_MINUTES: max_minutes}
431
+
432
+
433
class CondaRuntimeHandler(RuntimeHandler):
    """Runtime Handler for CondaRuntime.

    Translates the conda pack settings of a ``CondaRuntime`` into the
    ``CONDA_ENV_*`` environment variables of a data science job, and
    rebuilds the conda specification from those variables on extraction.
    """

    RUNTIME_CLASS = CondaRuntime
    # Names of the job environment variables describing the conda pack.
    CONST_CONDA_TYPE = "CONDA_ENV_TYPE"
    CONST_CONDA_SLUG = "CONDA_ENV_SLUG"
    CONST_CONDA_OBJ_NAME = "CONDA_ENV_OBJECT_NAME"
    CONST_CONDA_REGION = "CONDA_ENV_REGION"
    CONST_CONDA_NAMESPACE = "CONDA_ENV_NAMESPACE"
    CONST_CONDA_BUCKET = "CONDA_ENV_BUCKET"

    def __get_auth_region(self) -> str:
        """Return the region obtained by ``extract_region`` from the auth of the underlying job."""
        return extract_region(self.data_science_job.dsc_job.auth)

    def _translate_env(self, runtime: CondaRuntime) -> dict:
        """Translate the environment variable.

        Parameters
        ----------
        runtime : CondaRuntime
            An instance of CondaRuntime

        Returns
        -------
        dict
            A dictionary containing environment variables for OCI data science job.

        Raises
        ------
        ValueError
            If the URI of a custom conda pack does not contain
            a bucket, a namespace and an object name.
        AttributeError
            If the region of a custom conda pack is neither specified
            in the runtime nor available from the auth.
        """
        envs = super()._translate_env(runtime)
        if runtime.conda:
            conda_type = runtime.conda.get(CondaRuntime.CONST_CONDA_TYPE)
            envs[self.CONST_CONDA_TYPE] = conda_type
            if conda_type == CondaRuntime.CONST_CONDA_TYPE_SERVICE:
                # Service conda packs are identified by slug only.
                envs.update(
                    {
                        self.CONST_CONDA_SLUG: runtime.conda.get(
                            CondaRuntime.CONST_CONDA_SLUG
                        ),
                    }
                )
            elif conda_type == CondaRuntime.CONST_CONDA_TYPE_CUSTOM:
                uri = runtime.conda.get(CondaRuntime.CONST_CONDA_URI)
                # For oci://bucket@namespace/object_name, urlparse exposes
                # the bucket as username and the namespace as hostname.
                p = parse.urlparse(uri)
                if not (p.username and p.hostname and p.path):
                    raise ValueError(
                        f"Invalid URI for custom conda pack: {uri}. "
                        "A valid URI should have the format: oci://your_bucket@namespace/object_name"
                    )
                region = runtime.conda.get(CondaRuntime.CONST_CONDA_REGION)
                if not region:
                    # Fall back to the region of the auth used by the job.
                    region = self.__get_auth_region()
                    if not region:
                        raise AttributeError(
                            "Unable to determine the region for the custom conda pack. "
                            "Specify the region using with_custom_conda(uri, region)."
                        )
                envs.update(
                    {
                        self.CONST_CONDA_NAMESPACE: p.hostname,
                        self.CONST_CONDA_BUCKET: p.username,
                        self.CONST_CONDA_OBJ_NAME: p.path.lstrip("/"),
                        self.CONST_CONDA_REGION: region,
                    }
                )
        return envs

    def _extract_envs(self, dsc_job) -> dict:
        """Extract the environment variables from data science job.
        CondaRuntime contains environment variables for specifying conda environment.

        Parameters
        ----------
        dsc_job : DSCJob or oci.datascience.models.Job
            The data science job containing runtime information.

        Returns
        -------
        dict
            A runtime specification dictionary for initializing a runtime.
        """
        spec = super()._extract_envs(dsc_job)
        envs = spec.pop(CondaRuntime.CONST_ENV_VAR, {})
        # The conda variables are removed from envs as they are extracted.
        conda_spec = self.__extract_conda_env(envs)
        if conda_spec:
            spec[CondaRuntime.CONST_CONDA] = conda_spec
        if envs:
            spec[CondaRuntime.CONST_ENV_VAR] = envs
        return spec

    @staticmethod
    def __extract_conda_env(envs: dict) -> Optional[dict]:
        """Extracts conda pack specification from environment variables

        The variables that are used to build the specification are removed
        from ``envs``. When no complete specification is found,
        ``envs`` is left untouched.

        Parameters
        ----------
        envs : dict
            Environment variables.

        Returns
        -------
        Optional[dict]
            Conda pack runtime specification.
            None if the variables do not describe a conda pack.
        """
        if not envs:
            return None
        if (
            CondaRuntimeHandler.CONST_CONDA_TYPE in envs
            and CondaRuntimeHandler.CONST_CONDA_SLUG in envs
        ):
            return {
                CondaRuntime.CONST_CONDA_TYPE: envs.pop(
                    CondaRuntimeHandler.CONST_CONDA_TYPE
                ),
                CondaRuntime.CONST_CONDA_SLUG: envs.pop(
                    CondaRuntimeHandler.CONST_CONDA_SLUG
                ),
            }
        # All of bucket, namespace and object name are needed to rebuild
        # the URI. Checking every key up front avoids a KeyError (and a
        # partially consumed envs) when one of them is missing.
        if (
            envs.get(CondaRuntimeHandler.CONST_CONDA_TYPE)
            == CondaRuntime.CONST_CONDA_TYPE_CUSTOM
            and CondaRuntimeHandler.CONST_CONDA_BUCKET in envs
            and CondaRuntimeHandler.CONST_CONDA_NAMESPACE in envs
            and CondaRuntimeHandler.CONST_CONDA_OBJ_NAME in envs
        ):
            bucket = envs.pop(CondaRuntimeHandler.CONST_CONDA_BUCKET)
            namespace = envs.pop(CondaRuntimeHandler.CONST_CONDA_NAMESPACE)
            name = envs.pop(CondaRuntimeHandler.CONST_CONDA_OBJ_NAME)
            conda_spec = {
                CondaRuntime.CONST_CONDA_TYPE: envs.pop(
                    CondaRuntimeHandler.CONST_CONDA_TYPE
                ),
                CondaRuntime.CONST_CONDA_URI: f"oci://{bucket}@{namespace}/{name}",
            }
            # Region is optional in the extracted specification.
            if CondaRuntimeHandler.CONST_CONDA_REGION in envs:
                conda_spec[CondaRuntime.CONST_CONDA_REGION] = envs.pop(
                    CondaRuntimeHandler.CONST_CONDA_REGION
                )
            return conda_spec
        return None
578
+
579
+
580
class ScriptRuntimeHandler(CondaRuntimeHandler):
    """Runtime Handler for ScriptRuntime"""

    RUNTIME_CLASS = ScriptRuntime
    # Job environment variable storing the entrypoint of the script.
    CONST_ENTRYPOINT = "JOB_RUN_ENTRYPOINT"

    def _translate_env(self, runtime: ScriptRuntime) -> dict:
        """Convert the runtime into job environment variables.

        The entrypoint, when specified, is added on top of
        the variables produced by the parent handler.

        Parameters
        ----------
        runtime : ScriptRuntime
            An instance of ScriptRuntime

        Returns
        -------
        dict
            A dictionary containing environment variables for OCI data science job.
        """
        env_vars = super()._translate_env(runtime)
        if not runtime.entrypoint:
            return env_vars
        env_vars[self.CONST_ENTRYPOINT] = runtime.entrypoint
        return env_vars

    def _translate_artifact(self, runtime: ScriptRuntime):
        """Wrap the source URI of the runtime in a ScriptArtifact."""
        return ScriptArtifact(runtime.source_uri, runtime)

    def _extract_envs(self, dsc_job) -> dict:
        """Build the runtime specification from the job environment variables.
        In addition to the variables handled by the parent handler,
        ScriptRuntime may store the entrypoint as an environment variable.

        Parameters
        ----------
        dsc_job : DSCJob or oci.datascience.models.Job
            The data science job containing runtime information.

        Returns
        -------
        dict
            A runtime specification dictionary for initializing a runtime.
        """
        runtime_spec = super()._extract_envs(dsc_job)
        remaining = runtime_spec.pop(ScriptRuntime.CONST_ENV_VAR, {})
        # The entrypoint is part of the specification, not a user variable.
        entrypoint = remaining.pop(ScriptRuntimeHandler.CONST_ENTRYPOINT, None)
        if entrypoint:
            runtime_spec[ScriptRuntime.CONST_ENTRYPOINT] = entrypoint
        if remaining:
            runtime_spec[ScriptRuntime.CONST_ENV_VAR] = remaining
        return runtime_spec

    def _extract_artifact(self, dsc_job):
        """Record the job artifact, converted to a string, as the script path.

        Parameters
        ----------
        dsc_job : DSCJob or oci.datascience.models.Job
            The data science job containing runtime information.

        Returns
        -------
        dict
            A runtime specification dictionary for initializing a runtime.
        """
        runtime_spec = super()._extract_artifact(dsc_job)
        runtime_spec[ScriptRuntime.CONST_SCRIPT_PATH] = str(dsc_job.artifact)
        return runtime_spec
646
+
647
+
648
class PythonRuntimeHandler(CondaRuntimeHandler):
    """Runtime Handler for PythonRuntime"""

    RUNTIME_CLASS = PythonRuntime
    # Delimiter joining multiple python paths in one environment variable.
    PATH_DELIMITER = ":"
    CONST_JOB_ENTRYPOINT = "JOB_RUN_ENTRYPOINT"
    CONST_CODE_ENTRYPOINT = "CODE_ENTRYPOINT"
    CONST_ENTRY_FUNCTION = "ENTRY_FUNCTION"
    CONST_PYTHON_PATH = "PYTHON_PATH"
    CONST_OUTPUT_DIR = "OUTPUT_DIR"
    CONST_OUTPUT_URI = "OUTPUT_URI"
    CONST_WORKING_DIR = "WORKING_DIR"

    # Runtime specification key -> job environment variable name.
    SPEC_MAPPINGS = {
        PythonRuntime.CONST_ENTRYPOINT: CONST_CODE_ENTRYPOINT,
        PythonRuntime.CONST_ENTRY_FUNCTION: CONST_ENTRY_FUNCTION,
        PythonRuntime.CONST_PYTHON_PATH: CONST_PYTHON_PATH,
        PythonRuntime.CONST_OUTPUT_DIR: CONST_OUTPUT_DIR,
        PythonRuntime.CONST_OUTPUT_URI: CONST_OUTPUT_URI,
        PythonRuntime.CONST_WORKING_DIR: CONST_WORKING_DIR,
    }

    def _translate_artifact(self, runtime: PythonRuntime):
        """Wrap the script URI of the runtime in a PythonArtifact."""
        return PythonArtifact(runtime.script_uri, runtime)

    def _translate_env(self, runtime: PythonRuntime) -> dict:
        """Convert the runtime into job environment variables.

        Parameters
        ----------
        runtime : PythonRuntime
            An instance of PythonRuntime

        Returns
        -------
        dict
            A dictionary containing environment variables for OCI data science job.
        """
        env_vars = super()._translate_env(runtime)
        mapped = self._translate_specs(
            runtime, self.SPEC_MAPPINGS, self.PATH_DELIMITER
        )
        env_vars.update(mapped)

        # The code entrypoint defaults to the file name of the script URI.
        if runtime.entrypoint:
            env_vars[self.CONST_CODE_ENTRYPOINT] = runtime.entrypoint
        elif runtime.script_uri:
            env_vars[self.CONST_CODE_ENTRYPOINT] = os.path.basename(
                runtime.script_uri
            )

        # The job itself always starts from the driver script.
        env_vars[self.CONST_JOB_ENTRYPOINT] = PythonArtifact.CONST_DRIVER_SCRIPT
        return env_vars

    def _extract_envs(self, dsc_job) -> dict:
        """Build the runtime specification from the job environment variables.

        Parameters
        ----------
        dsc_job : DSCJob or oci.datascience.models.Job
            The data science job containing runtime information.

        Returns
        -------
        dict
            A runtime specification dictionary for initializing a runtime.

        Raises
        ------
        IncompatibleRuntime
            If this handler is exactly PythonRuntimeHandler and
            the code entrypoint variable is not defined in the job.
        """
        runtime_spec = super()._extract_envs(dsc_job)
        remaining = runtime_spec.pop(PythonRuntime.CONST_ENV_VAR, {})
        # Sub-classes are exempt from this check:
        # PyTorchDistributedRuntime does not require entrypoint.
        missing_entrypoint = self.CONST_CODE_ENTRYPOINT not in remaining
        if self.__class__ == PythonRuntimeHandler and missing_entrypoint:
            raise IncompatibleRuntime()
        remaining.pop(PythonRuntimeHandler.CONST_JOB_ENTRYPOINT, None)
        runtime_spec.update(self._extract_specs(remaining, self.SPEC_MAPPINGS))
        path_key = PythonRuntime.CONST_PYTHON_PATH
        if path_key in runtime_spec:
            # Python paths are stored as a single delimited string.
            runtime_spec[path_key] = runtime_spec[path_key].split(
                self.PATH_DELIMITER
            )
        if remaining:
            runtime_spec[PythonRuntime.CONST_ENV_VAR] = remaining
        return runtime_spec

    def _extract_artifact(self, dsc_job):
        """Record the name of the job artifact as the script path.

        Parameters
        ----------
        dsc_job : DSCJob or oci.datascience.models.Job
            The data science job containing runtime information.

        Returns
        -------
        dict
            A runtime specification dictionary for initializing a runtime.
        """
        runtime_spec = super()._extract_artifact(dsc_job)
        # The job does not store the actual script path,
        # so only the artifact name without the extension is extracted.
        artifact_name, _extension = os.path.splitext(str(dsc_job.artifact))
        runtime_spec[PythonRuntime.CONST_SCRIPT_PATH] = artifact_name
        return runtime_spec
743
+
744
+
745
class NotebookRuntimeHandler(CondaRuntimeHandler):
    """Runtime Handler for NotebookRuntime"""

    RUNTIME_CLASS = NotebookRuntime
    CONST_NOTEBOOK_NAME = "JOB_RUN_NOTEBOOK"
    CONST_ENTRYPOINT = "JOB_RUN_ENTRYPOINT"
    CONST_OUTPUT_URI = "OUTPUT_URI"
    CONST_EXCLUDE_TAGS = "NOTEBOOK_EXCLUDE_TAGS"
    CONST_NOTEBOOK_ENCODING = "NOTEBOOK_ENCODING"

    # Runtime specification key -> job environment variable name.
    SPEC_MAPPINGS = {
        NotebookRuntime.CONST_OUTPUT_URI: CONST_OUTPUT_URI,
        NotebookRuntime.CONST_EXCLUDE_TAG: CONST_EXCLUDE_TAGS,
        NotebookRuntime.CONST_NOTEBOOK_ENCODING: CONST_NOTEBOOK_ENCODING,
    }

    def _translate_artifact(self, runtime: NotebookRuntime):
        """Create the notebook artifact from the source, or the notebook URI when no source is set."""
        return NotebookArtifact(runtime.source or runtime.notebook_uri, runtime)

    def _translate_env(self, runtime: NotebookRuntime) -> dict:
        """Convert the runtime into job environment variables.

        Parameters
        ----------
        runtime : NotebookRuntime
            An instance of NotebookRuntime

        Returns
        -------
        dict
            A dictionary containing environment variables for OCI data science job.

        Raises
        ------
        ValueError
            If neither the notebook nor the notebook URI is specified.
        """
        env_vars = super()._translate_env(runtime)

        if runtime.notebook:
            # runtime.notebook is a path relative to the root of the source.
            # NotebookArtifact zips the user files under a top level folder
            # named after the basename of runtime.source, which is also
            # the name of the artifact zip file.
            source_name = os.path.basename(runtime.source)
            env_vars[self.CONST_NOTEBOOK_NAME] = os.path.join(
                source_name, runtime.notebook
            )
        elif runtime.notebook_uri:
            # Single notebook: only the file name is needed.
            env_vars[self.CONST_NOTEBOOK_NAME] = os.path.basename(
                runtime.notebook_uri
            )
        else:
            raise ValueError(
                "Notebook not specified. "
                "Please specify the notebook using with_notebook_uri() or with_source() method."
            )

        env_vars[self.CONST_ENTRYPOINT] = NotebookArtifact.CONST_DRIVER_SCRIPT
        if runtime.notebook_encoding:
            env_vars[self.CONST_NOTEBOOK_ENCODING] = runtime.notebook_encoding
        if runtime.exclude_tag:
            # Tags are stored as a JSON serialized string.
            env_vars[self.CONST_EXCLUDE_TAGS] = json.dumps(runtime.exclude_tag)
        if runtime.output_uri:
            env_vars[self.CONST_OUTPUT_URI] = runtime.output_uri
        return env_vars

    def _extract_envs(self, dsc_job) -> dict:
        """Build the runtime specification from the job environment variables.

        Parameters
        ----------
        dsc_job : DSCJob or oci.datascience.models.Job
            The data science job containing runtime information.

        Returns
        -------
        dict
            A runtime specification dictionary for initializing a runtime.

        Raises
        ------
        IncompatibleRuntime
            If the notebook name or the job entrypoint
            is not defined in the environment variables.
        """
        runtime_spec = super()._extract_envs(dsc_job)
        remaining = runtime_spec.pop(NotebookRuntime.CONST_ENV_VAR, {})
        if (
            self.CONST_NOTEBOOK_NAME not in remaining
            or self.CONST_ENTRYPOINT not in remaining
        ):
            raise IncompatibleRuntime()
        # The job run entrypoint is always the same for notebook runtime,
        # so it is not kept in the specification.
        remaining.pop(self.CONST_ENTRYPOINT)

        tags = remaining.pop(self.CONST_EXCLUDE_TAGS, None)
        if tags:
            try:
                # Tags are expected to be a JSON serialized string.
                tags = json.loads(tags)
            except ValueError:
                # Keep the raw value when it cannot be de-serialized.
                pass
            runtime_spec[NotebookRuntime.CONST_EXCLUDE_TAG] = tags

        notebook_name = remaining.pop(self.CONST_NOTEBOOK_NAME)
        if "/" in notebook_name:
            # The notebook was uploaded as part of a folder/zip,
            # the name has the format of folder/path/to/notebook.ipynb
            folder, _, relative_path = str(notebook_name).partition("/")
            runtime_spec[NotebookRuntime.CONST_SOURCE] = folder
            runtime_spec[NotebookRuntime.CONST_ENTRYPOINT] = relative_path
        else:
            # The source is a single notebook and the name is the filename only,
            # e.g. notebook.ipynb
            runtime_spec[NotebookRuntime.CONST_NOTEBOOK_PATH] = notebook_name

        runtime_spec.update(self._extract_specs(remaining, self.SPEC_MAPPINGS))
        # Unlike sibling handlers, the env var entry is set even when empty.
        runtime_spec[NotebookRuntime.CONST_ENV_VAR] = remaining
        return runtime_spec
843
+
844
+
845
class GitPythonRuntimeHandler(CondaRuntimeHandler):
    """Runtime Handler for GitPythonRuntime"""

    RUNTIME_CLASS = GitPythonRuntime

    # Delimiter joining multiple python paths in one environment variable.
    PATH_DELIMITER = ":"
    CONST_GIT_URL = "GIT_URL"
    CONST_GIT_BRANCH = "GIT_BRANCH"
    CONST_GIT_COMMIT = "GIT_COMMIT"
    CONST_GIT_CODE_DIR = "CODE_DIR"
    CONST_GIT_SSH_SECRET_ID = "GIT_SECRET_OCID"
    CONST_SKIP_METADATA = "SKIP_METADATA_UPDATE"

    CONST_ENTRYPOINT = "GIT_ENTRYPOINT"
    CONST_ENTRY_FUNCTION = "ENTRY_FUNCTION"
    CONST_PYTHON_PATH = "PYTHON_PATH"
    CONST_OUTPUT_DIR = "OUTPUT_DIR"
    CONST_OUTPUT_URI = "OUTPUT_URI"
    CONST_WORKING_DIR = "WORKING_DIR"

    CONST_JOB_ENTRYPOINT = "JOB_RUN_ENTRYPOINT"

    # Runtime specification key -> job environment variable name.
    SPEC_MAPPINGS = {
        GitPythonRuntime.CONST_GIT_URL: CONST_GIT_URL,
        GitPythonRuntime.CONST_BRANCH: CONST_GIT_BRANCH,
        GitPythonRuntime.CONST_COMMIT: CONST_GIT_COMMIT,
        GitPythonRuntime.CONST_ENTRYPOINT: CONST_ENTRYPOINT,
        GitPythonRuntime.CONST_ENTRY_FUNCTION: CONST_ENTRY_FUNCTION,
        GitPythonRuntime.CONST_PYTHON_PATH: CONST_PYTHON_PATH,
        GitPythonRuntime.CONST_GIT_SSH_SECRET_ID: CONST_GIT_SSH_SECRET_ID,
        GitPythonRuntime.CONST_OUTPUT_DIR: CONST_OUTPUT_DIR,
        GitPythonRuntime.CONST_OUTPUT_URI: CONST_OUTPUT_URI,
        GitPythonRuntime.CONST_WORKING_DIR: CONST_WORKING_DIR,
    }

    def _translate_artifact(self, runtime: Runtime):
        """Use the git driver as the job artifact.

        Parameters
        ----------
        runtime : Runtime
            This is not used.

        Returns
        -------
        GitPythonArtifact
            A new artifact object created without any argument.
        """
        return GitPythonArtifact()

    def _translate_env(self, runtime: GitPythonRuntime) -> dict:
        """Convert the runtime into job environment variables.

        Parameters
        ----------
        runtime : GitPythonRuntime
            An instance of GitPythonRuntime

        Returns
        -------
        dict
            A dictionary containing environment variables for OCI data science job.

        Raises
        ------
        ValueError
            If no conda pack is specified in the runtime.
        """
        if not runtime.conda:
            raise ValueError(
                f"A conda pack is required for using the {runtime.__class__.__name__}. "
                "You can specify a service conda pack using with_service_conda()."
            )
        env_vars = super()._translate_env(runtime)
        mapped = self._translate_specs(
            runtime, self.SPEC_MAPPINGS, self.PATH_DELIMITER
        )
        env_vars.update(mapped)
        if runtime.skip_metadata_update:
            env_vars[self.CONST_SKIP_METADATA] = "1"
        # The ADS driver is packed in a zip file,
        # so the entrypoint needs to be stated explicitly.
        env_vars[self.CONST_JOB_ENTRYPOINT] = GitPythonArtifact.CONST_DRIVER_SCRIPT
        return env_vars

    def _extract_envs(self, dsc_job) -> dict:
        """Build the runtime specification from the job environment variables.

        Parameters
        ----------
        dsc_job : DSCJob or oci.datascience.models.Job
            The data science job containing runtime information.

        Returns
        -------
        dict
            A runtime specification dictionary for initializing a runtime.

        Raises
        ------
        IncompatibleRuntime
            If the git URL or the git entrypoint
            is not defined in the environment variables.
        """
        runtime_spec = super()._extract_envs(dsc_job)
        remaining = runtime_spec.pop(CondaRuntime.CONST_ENV_VAR, {})

        if not (
            self.CONST_GIT_URL in remaining and self.CONST_ENTRYPOINT in remaining
        ):
            raise IncompatibleRuntime()
        # The job entrypoint is added by ADS and is not a user setting.
        remaining.pop(self.CONST_JOB_ENTRYPOINT, None)
        runtime_spec.update(self._extract_specs(remaining, self.SPEC_MAPPINGS))
        path_key = GitPythonRuntime.CONST_PYTHON_PATH
        if path_key in runtime_spec:
            # Python paths are stored as a single delimited string.
            runtime_spec[path_key] = runtime_spec[path_key].split(
                self.PATH_DELIMITER
            )
        if self.CONST_SKIP_METADATA in remaining:
            # The presence of the variable is enough to enable the flag.
            del remaining[self.CONST_SKIP_METADATA]
            runtime_spec[GitPythonRuntime.CONST_SKIP_METADATA] = True
        if remaining:
            runtime_spec[ScriptRuntime.CONST_ENV_VAR] = remaining
        return runtime_spec

    def _extract_artifact(self, dsc_job):
        """Return an empty specification: the artifact of a git runtime is the driver script, which is not extracted."""
        return {}
959
+
960
+
961
class ContainerRuntimeHandler(RuntimeHandler):
    """Runtime Handler for ContainerRuntime"""

    RUNTIME_CLASS = ContainerRuntime
    # Delimiter separating the arguments of cmd/entrypoint given as a string.
    CMD_DELIMITER = ","

    def translate(self, runtime: Runtime) -> dict:
        """Translate the runtime into a payload, including the job environment configuration details."""
        payload = super().translate(runtime)
        payload["job_environment_configuration_details"] = (
            self._translate_env_config(runtime)
        )
        return payload

    def _translate_artifact(self, runtime: ContainerRuntime):
        """Additional artifact for the container.

        Returns a ScriptArtifact when the runtime has an artifact URI,
        otherwise None.
        """
        if not runtime.artifact_uri:
            return None
        return ScriptArtifact(runtime.artifact_uri, runtime)

    def _translate_env_config(self, runtime: Runtime) -> dict:
        """Converts runtime properties to ``OcirContainerJobEnvironmentConfigurationDetails`` payload required by OCI Data Science job.

        Parameters
        ----------
        runtime : Runtime
            The runtime containing the properties to be converted.

        Returns
        -------
        dict
            A dictionary storing the ``OcirContainerJobEnvironmentConfigurationDetails`` payload for OCI data science job.
        """
        env_config = {"job_environment_type": runtime.job_env_type}
        list_valued_keys = (
            ContainerRuntime.CONST_CMD,
            ContainerRuntime.CONST_ENTRYPOINT,
        )

        for spec_key, payload_key in ContainerRuntime.attribute_map.items():
            spec_value = runtime.get_spec(spec_key, None)
            # cmd and entrypoint given as a string are converted to a list.
            if isinstance(spec_value, str) and spec_key in list_valued_keys:
                spec_value = self.split_args(spec_value)
            if spec_value is not None:
                env_config[payload_key] = spec_value

        return env_config

    @staticmethod
    def split_args(args: str) -> list:
        """Splits the cmd or entrypoint arguments for BYOC job into a list.
        BYOC jobs uses environment variables to store the values of cmd and entrypoint.
        In the values, comma(,) is used to separate cmd or entrypoint arguments.
        In YAML, the arguments are formatted into a list (Exec form).
        Leading and trailing whitespaces of each argument are removed.

        >>> ContainerRuntimeHandler.split_args("/bin/bash")
        ['/bin/bash']
        >>> ContainerRuntimeHandler.split_args("-c,echo Hello World")
        ['-c', 'echo Hello World']

        Parameters
        ----------
        args : str
            Arguments in a comma separated string.

        Returns
        -------
        list
            Arguments in a list.
            An empty list if ``args`` is empty or None.
        """
        if not args:
            return []
        pieces = args.split(ContainerRuntimeHandler.CMD_DELIMITER)
        return [piece.strip() for piece in pieces]

    def _extract_envs(self, dsc_job):
        """Build the runtime specification from the job environment variables.

        Parameters
        ----------
        dsc_job : DSCJob or oci.datascience.models.Job
            The data science job containing runtime information.

        Returns
        -------
        dict
            A runtime specification dictionary for initializing a runtime.
        """
        runtime_spec = super()._extract_envs(dsc_job)
        env_vars = runtime_spec.pop(ContainerRuntime.CONST_ENV_VAR, {})

        # Only keep the env var entry when there is at least one variable.
        if env_vars:
            runtime_spec[ContainerRuntime.CONST_ENV_VAR] = env_vars

        return runtime_spec

    def _extract_properties(self, dsc_job) -> dict:
        """Build the runtime specification from the job environment configuration details.

        Parameters
        ----------
        dsc_job : DSCJob or oci.datascience.models.Job
            The data science job containing runtime information.

        Returns
        -------
        dict
            A runtime specification dictionary for initializing a runtime.

        Raises
        ------
        IncompatibleRuntime
            If the job has no environment configuration details
            or the environment type is not ``OCIR_CONTAINER``.
        """
        # NOTE(review): this starts from the parent's _extract_envs() rather
        # than a parent _extract_properties() - confirm this is intended.
        runtime_spec = super()._extract_envs(dsc_job)

        env_config = getattr(dsc_job, "job_environment_configuration_details", None)
        env_type = getattr(env_config, "job_environment_type", None)

        if not env_config or env_type != "OCIR_CONTAINER":
            raise IncompatibleRuntime()

        for spec_key, attribute in ContainerRuntime.attribute_map.items():
            attribute_value = getattr(env_config, attribute, None)
            if attribute_value is not None:
                runtime_spec[spec_key] = attribute_value
        return runtime_spec
1080
+
1081
+
1082
class PyTorchDistributedRuntimeHandler(PythonRuntimeHandler):
    """Runtime Handler for PyTorchDistributedRuntime"""

    RUNTIME_CLASS = PyTorchDistributedRuntime
    CONST_WORKER_COUNT = "OCI__WORKER_COUNT"
    CONST_COMMAND = "OCI__LAUNCH_CMD"
    CONST_DEEPSPEED = "OCI__DEEPSPEED"

    # Job environment variable name -> key in the git specification.
    GIT_SPEC_MAPPINGS = {
        cluster_config_helper.OCI__RUNTIME_URI: GitPythonRuntime.CONST_GIT_URL,
        cluster_config_helper.OCI__RUNTIME_GIT_BRANCH: GitPythonRuntime.CONST_BRANCH,
        cluster_config_helper.OCI__RUNTIME_GIT_COMMIT: GitPythonRuntime.CONST_COMMIT,
        cluster_config_helper.OCI__RUNTIME_GIT_SECRET_ID: GitPythonRuntime.CONST_GIT_SSH_SECRET_ID,
    }

    # Build a new dictionary instead of updating the parent's in place,
    # so that the launch command mapping does not leak into
    # PythonRuntimeHandler.SPEC_MAPPINGS.
    SPEC_MAPPINGS = {
        **PythonRuntimeHandler.SPEC_MAPPINGS,
        PyTorchDistributedRuntime.CONST_COMMAND: CONST_COMMAND,
    }

    def _translate_artifact(self, runtime: PyTorchDistributedRuntime):
        """Wrap the source URI of the runtime in a PyTorchDistributedArtifact."""
        return PyTorchDistributedArtifact(runtime.source_uri, runtime)

    def _translate_env(self, runtime: PyTorchDistributedRuntime) -> dict:
        """Translate the environment variable.

        Parameters
        ----------
        runtime : PyTorchDistributedRuntime
            An instance of PyTorchDistributedRuntime

        Returns
        -------
        dict
            A dictionary containing environment variables for OCI data science job.
        """
        envs = super()._translate_env(runtime)
        replica = runtime.replica if runtime.replica else 1
        # WORKER_COUNT = REPLICA - 1 so that it will be same as distributed training
        envs[self.CONST_WORKER_COUNT] = str(replica - 1)
        # Replaces the job entrypoint set by the parent handler.
        envs[self.CONST_JOB_ENTRYPOINT] = PyTorchDistributedArtifact.CONST_DRIVER_SCRIPT
        if runtime.inputs:
            # Input mappings are stored as a JSON serialized string.
            envs[driver_utils.CONST_ENV_INPUT_MAPPINGS] = json.dumps(runtime.inputs)
        if runtime.git:
            for env_key, spec_key in self.GIT_SPEC_MAPPINGS.items():
                # Skip the git settings that are missing or empty.
                if not runtime.git.get(spec_key):
                    continue
                envs[env_key] = runtime.git[spec_key]
        if runtime.dependencies:
            if PyTorchDistributedRuntime.CONST_PIP_PKG in runtime.dependencies:
                envs[driver_utils.CONST_ENV_PIP_PKG] = runtime.dependencies[
                    PyTorchDistributedRuntime.CONST_PIP_PKG
                ]
            if PyTorchDistributedRuntime.CONST_PIP_REQ in runtime.dependencies:
                envs[driver_utils.CONST_ENV_PIP_REQ] = runtime.dependencies[
                    PyTorchDistributedRuntime.CONST_PIP_REQ
                ]
        if runtime.use_deepspeed:
            envs[self.CONST_DEEPSPEED] = "1"
        return envs

    def _extract_envs(self, dsc_job) -> dict:
        """Extract the runtime specification from environment variables.

        Parameters
        ----------
        dsc_job : DSCJob or oci.datascience.models.Job
            The data science job containing runtime information.

        Returns
        -------
        dict
            A runtime specification dictionary for initializing a runtime.

        Raises
        ------
        IncompatibleRuntime
            If the worker count is not defined in the environment variables.
        """
        spec = super()._extract_envs(dsc_job)
        envs = spec.pop(PythonRuntime.CONST_ENV_VAR, {})
        if self.CONST_WORKER_COUNT not in envs:
            raise IncompatibleRuntime()
        # Replicas: reverse of the WORKER_COUNT = REPLICA - 1 translation.
        spec[PyTorchDistributedRuntime.CONST_REPLICA] = (
            int(envs.pop(self.CONST_WORKER_COUNT)) + 1
        )
        # Git: only extracted when the git URL is defined.
        if cluster_config_helper.OCI__RUNTIME_URI in envs:
            git_spec = {}
            for env_key, spec_key in self.GIT_SPEC_MAPPINGS.items():
                if env_key in envs:
                    git_spec[spec_key] = envs.pop(env_key)
            spec[PyTorchDistributedRuntime.CONST_GIT] = git_spec
        # Inputs
        input_mappings = envs.pop(driver_utils.CONST_ENV_INPUT_MAPPINGS, None)
        if input_mappings:
            try:
                spec[PyTorchDistributedRuntime.CONST_INPUT] = json.loads(input_mappings)
            except ValueError:
                # Keep the raw value when it is not valid JSON.
                spec[PyTorchDistributedRuntime.CONST_INPUT] = input_mappings
        # Dependencies
        dep = {}
        if driver_utils.CONST_ENV_PIP_PKG in envs:
            dep[PyTorchDistributedRuntime.CONST_PIP_PKG] = envs.pop(
                driver_utils.CONST_ENV_PIP_PKG
            )
        if driver_utils.CONST_ENV_PIP_REQ in envs:
            dep[PyTorchDistributedRuntime.CONST_PIP_REQ] = envs.pop(
                driver_utils.CONST_ENV_PIP_REQ
            )
        if dep:
            spec[PyTorchDistributedRuntime.CONST_DEP] = dep
        # DeepSpeed: any non-empty value enables the flag.
        if envs.pop(self.CONST_DEEPSPEED, None):
            spec[PyTorchDistributedRuntime.CONST_DEEPSPEED] = True
        # Envs
        if envs:
            spec[PythonRuntime.CONST_ENV_VAR] = envs
        return spec
1172
+
1173
+
1174
class DataScienceJobRuntimeManager(RuntimeHandler):
    """Dispatches the runtime conversion of the DataScienceJob infrastructure to the matching handler.

    translate() selects the handler whose RUNTIME_CLASS is the class of the runtime.
    extract() tries the handlers one by one, in the order of runtime_handlers,
    until one of them is able to extract a runtime.
    Handlers listed first have higher priority.
    If a runtime is a special case of another runtime,
    its handler should be placed before the handler of the more general runtime.
    """

    runtime_handlers = [
        ContainerRuntimeHandler,
        PyTorchDistributedRuntimeHandler,
        GitPythonRuntimeHandler,
        NotebookRuntimeHandler,
        PythonRuntimeHandler,
        ScriptRuntimeHandler,
    ]

    def translate(self, runtime) -> dict:
        """Convert the runtime into a JSON payload for OCI API,
        using the handler whose RUNTIME_CLASS equals the class of the runtime.

        Parameters
        ----------
        runtime : Runtime
            An instance of the runtime to be converted to a JSON payload.

        Returns
        -------
        dict
            JSON payload for defining a Data Science Job with OCI API

        Raises
        ------
        NotImplementedError
            If none of the handlers supports the class of the runtime.
        """
        runtime_class = runtime.__class__
        # Exact class match: handlers of parent classes are not used.
        handler_class = next(
            (
                candidate
                for candidate in self.runtime_handlers
                if candidate.RUNTIME_CLASS == runtime_class
            ),
            None,
        )
        if handler_class is None:
            raise NotImplementedError(
                f"{runtime.__class__.__name__} is not supported as the runtime of DataScienceJob."
            )
        return handler_class(self.data_science_job).translate(runtime)

    def extract(self, dsc_job):
        """Build the runtime from an OCI data science job object.

        The handlers are tried in order and the first one which
        does not raise IncompatibleRuntime provides the result.

        Parameters
        ----------
        dsc_job : DSCJob or oci.datascience.models.Job
            The data science job containing runtime information.

        Returns
        -------
        Runtime:
            The runtime extracted from the data science job.

        Raises
        ------
        NotImplementedError
            If none of the handlers is able to extract the runtime.
        """
        for handler_class in self.runtime_handlers:
            handler = handler_class(self.data_science_job)
            try:
                return handler.extract(dsc_job)
            except IncompatibleRuntime:
                # Not the runtime of this handler, try the next one.
                continue
        raise NotImplementedError("Unable to extract runtime.")