acryl-datahub 1.1.1rc4__py3-none-any.whl → 1.3.0.1rc9__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of acryl-datahub might be problematic. Click here for more details.

Files changed (414) hide show
  1. {acryl_datahub-1.1.1rc4.dist-info → acryl_datahub-1.3.0.1rc9.dist-info}/METADATA +2615 -2547
  2. {acryl_datahub-1.1.1rc4.dist-info → acryl_datahub-1.3.0.1rc9.dist-info}/RECORD +412 -338
  3. {acryl_datahub-1.1.1rc4.dist-info → acryl_datahub-1.3.0.1rc9.dist-info}/entry_points.txt +5 -0
  4. datahub/_version.py +1 -1
  5. datahub/api/entities/assertion/assertion.py +1 -1
  6. datahub/api/entities/common/serialized_value.py +1 -1
  7. datahub/api/entities/corpgroup/corpgroup.py +1 -1
  8. datahub/api/entities/dataproduct/dataproduct.py +32 -3
  9. datahub/api/entities/dataset/dataset.py +26 -23
  10. datahub/api/entities/external/__init__.py +0 -0
  11. datahub/api/entities/external/external_entities.py +724 -0
  12. datahub/api/entities/external/external_tag.py +147 -0
  13. datahub/api/entities/external/lake_formation_external_entites.py +162 -0
  14. datahub/api/entities/external/restricted_text.py +172 -0
  15. datahub/api/entities/external/unity_catalog_external_entites.py +172 -0
  16. datahub/api/entities/forms/forms.py +3 -3
  17. datahub/api/entities/structuredproperties/structuredproperties.py +4 -4
  18. datahub/api/graphql/operation.py +10 -6
  19. datahub/cli/check_cli.py +88 -7
  20. datahub/cli/cli_utils.py +63 -0
  21. datahub/cli/config_utils.py +18 -10
  22. datahub/cli/container_cli.py +5 -0
  23. datahub/cli/delete_cli.py +125 -27
  24. datahub/cli/docker_check.py +110 -14
  25. datahub/cli/docker_cli.py +153 -229
  26. datahub/cli/exists_cli.py +0 -2
  27. datahub/cli/get_cli.py +0 -2
  28. datahub/cli/graphql_cli.py +1422 -0
  29. datahub/cli/iceberg_cli.py +5 -0
  30. datahub/cli/ingest_cli.py +3 -15
  31. datahub/cli/migrate.py +2 -0
  32. datahub/cli/put_cli.py +1 -4
  33. datahub/cli/quickstart_versioning.py +53 -10
  34. datahub/cli/specific/assertions_cli.py +37 -6
  35. datahub/cli/specific/datacontract_cli.py +54 -7
  36. datahub/cli/specific/dataproduct_cli.py +2 -15
  37. datahub/cli/specific/dataset_cli.py +1 -8
  38. datahub/cli/specific/forms_cli.py +0 -4
  39. datahub/cli/specific/group_cli.py +0 -2
  40. datahub/cli/specific/structuredproperties_cli.py +1 -4
  41. datahub/cli/specific/user_cli.py +172 -3
  42. datahub/cli/state_cli.py +0 -2
  43. datahub/cli/timeline_cli.py +0 -2
  44. datahub/configuration/common.py +40 -1
  45. datahub/configuration/connection_resolver.py +5 -2
  46. datahub/configuration/env_vars.py +331 -0
  47. datahub/configuration/import_resolver.py +7 -4
  48. datahub/configuration/kafka.py +21 -1
  49. datahub/configuration/pydantic_migration_helpers.py +6 -13
  50. datahub/configuration/source_common.py +3 -2
  51. datahub/configuration/validate_field_deprecation.py +5 -2
  52. datahub/configuration/validate_field_removal.py +8 -2
  53. datahub/configuration/validate_field_rename.py +6 -5
  54. datahub/configuration/validate_multiline_string.py +5 -2
  55. datahub/emitter/mce_builder.py +8 -4
  56. datahub/emitter/rest_emitter.py +103 -30
  57. datahub/entrypoints.py +6 -3
  58. datahub/ingestion/api/auto_work_units/auto_ensure_aspect_size.py +297 -1
  59. datahub/ingestion/api/auto_work_units/auto_validate_input_fields.py +87 -0
  60. datahub/ingestion/api/decorators.py +15 -3
  61. datahub/ingestion/api/report.py +381 -3
  62. datahub/ingestion/api/sink.py +27 -2
  63. datahub/ingestion/api/source.py +165 -58
  64. datahub/ingestion/api/source_protocols.py +23 -0
  65. datahub/ingestion/autogenerated/__init__.py +0 -0
  66. datahub/ingestion/autogenerated/capability_summary.json +3652 -0
  67. datahub/ingestion/autogenerated/lineage.json +402 -0
  68. datahub/ingestion/autogenerated/lineage_helper.py +177 -0
  69. datahub/ingestion/extractor/schema_util.py +13 -4
  70. datahub/ingestion/glossary/classification_mixin.py +5 -0
  71. datahub/ingestion/graph/client.py +330 -25
  72. datahub/ingestion/graph/config.py +3 -2
  73. datahub/ingestion/graph/filters.py +30 -11
  74. datahub/ingestion/reporting/datahub_ingestion_run_summary_provider.py +21 -11
  75. datahub/ingestion/run/pipeline.py +81 -11
  76. datahub/ingestion/run/pipeline_config.py +2 -2
  77. datahub/ingestion/sink/datahub_kafka.py +1 -0
  78. datahub/ingestion/sink/datahub_rest.py +13 -5
  79. datahub/ingestion/sink/file.py +1 -0
  80. datahub/ingestion/source/abs/config.py +1 -1
  81. datahub/ingestion/source/abs/datalake_profiler_config.py +1 -1
  82. datahub/ingestion/source/abs/source.py +15 -30
  83. datahub/ingestion/source/aws/aws_common.py +185 -13
  84. datahub/ingestion/source/aws/glue.py +517 -244
  85. datahub/ingestion/source/aws/platform_resource_repository.py +30 -0
  86. datahub/ingestion/source/aws/s3_boto_utils.py +100 -5
  87. datahub/ingestion/source/aws/tag_entities.py +270 -0
  88. datahub/ingestion/source/azure/azure_common.py +3 -3
  89. datahub/ingestion/source/bigquery_v2/bigquery.py +67 -24
  90. datahub/ingestion/source/bigquery_v2/bigquery_config.py +47 -19
  91. datahub/ingestion/source/bigquery_v2/bigquery_connection.py +12 -1
  92. datahub/ingestion/source/bigquery_v2/bigquery_queries.py +3 -0
  93. datahub/ingestion/source/bigquery_v2/bigquery_report.py +0 -2
  94. datahub/ingestion/source/bigquery_v2/bigquery_schema.py +23 -16
  95. datahub/ingestion/source/bigquery_v2/bigquery_schema_gen.py +20 -5
  96. datahub/ingestion/source/bigquery_v2/common.py +1 -1
  97. datahub/ingestion/source/bigquery_v2/profiler.py +4 -2
  98. datahub/ingestion/source/bigquery_v2/queries.py +3 -3
  99. datahub/ingestion/source/bigquery_v2/queries_extractor.py +45 -9
  100. datahub/ingestion/source/cassandra/cassandra.py +6 -8
  101. datahub/ingestion/source/cassandra/cassandra_api.py +17 -1
  102. datahub/ingestion/source/cassandra/cassandra_config.py +5 -0
  103. datahub/ingestion/source/cassandra/cassandra_profiling.py +7 -6
  104. datahub/ingestion/source/cassandra/cassandra_utils.py +1 -2
  105. datahub/ingestion/source/common/gcp_credentials_config.py +3 -1
  106. datahub/ingestion/source/common/subtypes.py +53 -0
  107. datahub/ingestion/source/data_lake_common/data_lake_utils.py +37 -0
  108. datahub/ingestion/source/data_lake_common/object_store.py +115 -27
  109. datahub/ingestion/source/data_lake_common/path_spec.py +72 -43
  110. datahub/ingestion/source/datahub/config.py +12 -9
  111. datahub/ingestion/source/datahub/datahub_database_reader.py +26 -11
  112. datahub/ingestion/source/datahub/datahub_source.py +10 -0
  113. datahub/ingestion/source/dbt/dbt_cloud.py +16 -5
  114. datahub/ingestion/source/dbt/dbt_common.py +224 -9
  115. datahub/ingestion/source/dbt/dbt_core.py +3 -0
  116. datahub/ingestion/source/debug/__init__.py +0 -0
  117. datahub/ingestion/source/debug/datahub_debug.py +300 -0
  118. datahub/ingestion/source/delta_lake/config.py +9 -5
  119. datahub/ingestion/source/delta_lake/source.py +8 -0
  120. datahub/ingestion/source/dremio/dremio_api.py +114 -73
  121. datahub/ingestion/source/dremio/dremio_aspects.py +3 -2
  122. datahub/ingestion/source/dremio/dremio_config.py +5 -4
  123. datahub/ingestion/source/dremio/dremio_reporting.py +22 -3
  124. datahub/ingestion/source/dremio/dremio_source.py +132 -98
  125. datahub/ingestion/source/dremio/dremio_sql_queries.py +82 -21
  126. datahub/ingestion/source/dynamodb/dynamodb.py +11 -8
  127. datahub/ingestion/source/excel/__init__.py +0 -0
  128. datahub/ingestion/source/excel/config.py +92 -0
  129. datahub/ingestion/source/excel/excel_file.py +539 -0
  130. datahub/ingestion/source/excel/profiling.py +308 -0
  131. datahub/ingestion/source/excel/report.py +49 -0
  132. datahub/ingestion/source/excel/source.py +662 -0
  133. datahub/ingestion/source/excel/util.py +18 -0
  134. datahub/ingestion/source/feast.py +8 -10
  135. datahub/ingestion/source/file.py +3 -0
  136. datahub/ingestion/source/fivetran/config.py +66 -7
  137. datahub/ingestion/source/fivetran/fivetran.py +227 -43
  138. datahub/ingestion/source/fivetran/fivetran_log_api.py +37 -8
  139. datahub/ingestion/source/fivetran/fivetran_query.py +51 -29
  140. datahub/ingestion/source/fivetran/fivetran_rest_api.py +65 -0
  141. datahub/ingestion/source/fivetran/response_models.py +97 -0
  142. datahub/ingestion/source/gc/datahub_gc.py +0 -2
  143. datahub/ingestion/source/gcs/gcs_source.py +32 -4
  144. datahub/ingestion/source/ge_data_profiler.py +108 -31
  145. datahub/ingestion/source/ge_profiling_config.py +26 -11
  146. datahub/ingestion/source/grafana/entity_mcp_builder.py +272 -0
  147. datahub/ingestion/source/grafana/field_utils.py +307 -0
  148. datahub/ingestion/source/grafana/grafana_api.py +142 -0
  149. datahub/ingestion/source/grafana/grafana_config.py +104 -0
  150. datahub/ingestion/source/grafana/grafana_source.py +522 -84
  151. datahub/ingestion/source/grafana/lineage.py +202 -0
  152. datahub/ingestion/source/grafana/models.py +137 -0
  153. datahub/ingestion/source/grafana/report.py +90 -0
  154. datahub/ingestion/source/grafana/types.py +16 -0
  155. datahub/ingestion/source/hex/api.py +28 -1
  156. datahub/ingestion/source/hex/hex.py +16 -5
  157. datahub/ingestion/source/hex/mapper.py +16 -2
  158. datahub/ingestion/source/hex/model.py +2 -0
  159. datahub/ingestion/source/hex/query_fetcher.py +1 -1
  160. datahub/ingestion/source/iceberg/iceberg.py +123 -59
  161. datahub/ingestion/source/iceberg/iceberg_profiler.py +4 -2
  162. datahub/ingestion/source/identity/azure_ad.py +1 -1
  163. datahub/ingestion/source/identity/okta.py +1 -14
  164. datahub/ingestion/source/kafka/kafka.py +16 -0
  165. datahub/ingestion/source/kafka_connect/common.py +2 -2
  166. datahub/ingestion/source/kafka_connect/sink_connectors.py +156 -47
  167. datahub/ingestion/source/kafka_connect/source_connectors.py +62 -4
  168. datahub/ingestion/source/looker/looker_common.py +148 -79
  169. datahub/ingestion/source/looker/looker_config.py +15 -4
  170. datahub/ingestion/source/looker/looker_constant.py +4 -0
  171. datahub/ingestion/source/looker/looker_lib_wrapper.py +36 -3
  172. datahub/ingestion/source/looker/looker_liquid_tag.py +56 -5
  173. datahub/ingestion/source/looker/looker_source.py +503 -547
  174. datahub/ingestion/source/looker/looker_view_id_cache.py +1 -1
  175. datahub/ingestion/source/looker/lookml_concept_context.py +1 -1
  176. datahub/ingestion/source/looker/lookml_config.py +31 -3
  177. datahub/ingestion/source/looker/lookml_refinement.py +1 -1
  178. datahub/ingestion/source/looker/lookml_source.py +96 -117
  179. datahub/ingestion/source/looker/view_upstream.py +494 -1
  180. datahub/ingestion/source/metabase.py +32 -6
  181. datahub/ingestion/source/metadata/business_glossary.py +7 -7
  182. datahub/ingestion/source/metadata/lineage.py +9 -9
  183. datahub/ingestion/source/mlflow.py +12 -2
  184. datahub/ingestion/source/mock_data/__init__.py +0 -0
  185. datahub/ingestion/source/mock_data/datahub_mock_data.py +533 -0
  186. datahub/ingestion/source/mock_data/datahub_mock_data_report.py +12 -0
  187. datahub/ingestion/source/mock_data/table_naming_helper.py +97 -0
  188. datahub/ingestion/source/mode.py +26 -5
  189. datahub/ingestion/source/mongodb.py +11 -1
  190. datahub/ingestion/source/neo4j/neo4j_source.py +83 -144
  191. datahub/ingestion/source/nifi.py +2 -2
  192. datahub/ingestion/source/openapi.py +1 -1
  193. datahub/ingestion/source/powerbi/config.py +47 -21
  194. datahub/ingestion/source/powerbi/m_query/data_classes.py +1 -0
  195. datahub/ingestion/source/powerbi/m_query/parser.py +2 -2
  196. datahub/ingestion/source/powerbi/m_query/pattern_handler.py +100 -10
  197. datahub/ingestion/source/powerbi/powerbi.py +10 -6
  198. datahub/ingestion/source/powerbi/rest_api_wrapper/powerbi_api.py +0 -1
  199. datahub/ingestion/source/powerbi_report_server/report_server.py +0 -23
  200. datahub/ingestion/source/powerbi_report_server/report_server_domain.py +2 -4
  201. datahub/ingestion/source/preset.py +3 -3
  202. datahub/ingestion/source/qlik_sense/data_classes.py +28 -8
  203. datahub/ingestion/source/qlik_sense/qlik_sense.py +2 -1
  204. datahub/ingestion/source/redash.py +1 -1
  205. datahub/ingestion/source/redshift/config.py +15 -9
  206. datahub/ingestion/source/redshift/datashares.py +1 -1
  207. datahub/ingestion/source/redshift/lineage.py +386 -687
  208. datahub/ingestion/source/redshift/query.py +23 -19
  209. datahub/ingestion/source/redshift/redshift.py +52 -111
  210. datahub/ingestion/source/redshift/redshift_schema.py +17 -12
  211. datahub/ingestion/source/redshift/report.py +0 -2
  212. datahub/ingestion/source/redshift/usage.py +6 -5
  213. datahub/ingestion/source/s3/report.py +4 -2
  214. datahub/ingestion/source/s3/source.py +449 -248
  215. datahub/ingestion/source/sac/sac.py +3 -1
  216. datahub/ingestion/source/salesforce.py +28 -13
  217. datahub/ingestion/source/schema/json_schema.py +14 -14
  218. datahub/ingestion/source/schema_inference/object.py +22 -6
  219. datahub/ingestion/source/sigma/data_classes.py +3 -0
  220. datahub/ingestion/source/sigma/sigma.py +7 -1
  221. datahub/ingestion/source/slack/slack.py +10 -16
  222. datahub/ingestion/source/snaplogic/__init__.py +0 -0
  223. datahub/ingestion/source/snaplogic/snaplogic.py +355 -0
  224. datahub/ingestion/source/snaplogic/snaplogic_config.py +37 -0
  225. datahub/ingestion/source/snaplogic/snaplogic_lineage_extractor.py +107 -0
  226. datahub/ingestion/source/snaplogic/snaplogic_parser.py +168 -0
  227. datahub/ingestion/source/snaplogic/snaplogic_utils.py +31 -0
  228. datahub/ingestion/source/snowflake/constants.py +3 -0
  229. datahub/ingestion/source/snowflake/snowflake_config.py +76 -23
  230. datahub/ingestion/source/snowflake/snowflake_connection.py +24 -8
  231. datahub/ingestion/source/snowflake/snowflake_lineage_v2.py +19 -6
  232. datahub/ingestion/source/snowflake/snowflake_queries.py +464 -97
  233. datahub/ingestion/source/snowflake/snowflake_query.py +77 -5
  234. datahub/ingestion/source/snowflake/snowflake_report.py +1 -2
  235. datahub/ingestion/source/snowflake/snowflake_schema.py +352 -16
  236. datahub/ingestion/source/snowflake/snowflake_schema_gen.py +51 -10
  237. datahub/ingestion/source/snowflake/snowflake_summary.py +7 -1
  238. datahub/ingestion/source/snowflake/snowflake_usage_v2.py +8 -2
  239. datahub/ingestion/source/snowflake/snowflake_utils.py +36 -15
  240. datahub/ingestion/source/snowflake/snowflake_v2.py +39 -4
  241. datahub/ingestion/source/snowflake/stored_proc_lineage.py +143 -0
  242. datahub/ingestion/source/sql/athena.py +217 -25
  243. datahub/ingestion/source/sql/athena_properties_extractor.py +795 -0
  244. datahub/ingestion/source/sql/clickhouse.py +24 -8
  245. datahub/ingestion/source/sql/cockroachdb.py +5 -4
  246. datahub/ingestion/source/sql/druid.py +2 -2
  247. datahub/ingestion/source/sql/hana.py +3 -1
  248. datahub/ingestion/source/sql/hive.py +4 -3
  249. datahub/ingestion/source/sql/hive_metastore.py +19 -20
  250. datahub/ingestion/source/sql/mariadb.py +0 -1
  251. datahub/ingestion/source/sql/mssql/job_models.py +3 -1
  252. datahub/ingestion/source/sql/mssql/source.py +336 -57
  253. datahub/ingestion/source/sql/mysql.py +154 -4
  254. datahub/ingestion/source/sql/oracle.py +5 -5
  255. datahub/ingestion/source/sql/postgres.py +142 -6
  256. datahub/ingestion/source/sql/presto.py +2 -1
  257. datahub/ingestion/source/sql/sql_common.py +281 -49
  258. datahub/ingestion/source/sql/sql_generic_profiler.py +2 -1
  259. datahub/ingestion/source/sql/sql_types.py +22 -0
  260. datahub/ingestion/source/sql/sqlalchemy_uri.py +39 -7
  261. datahub/ingestion/source/sql/teradata.py +1028 -245
  262. datahub/ingestion/source/sql/trino.py +11 -1
  263. datahub/ingestion/source/sql/two_tier_sql_source.py +2 -3
  264. datahub/ingestion/source/sql/vertica.py +14 -7
  265. datahub/ingestion/source/sql_queries.py +219 -121
  266. datahub/ingestion/source/state/checkpoint.py +8 -29
  267. datahub/ingestion/source/state/entity_removal_state.py +5 -2
  268. datahub/ingestion/source/state/redundant_run_skip_handler.py +21 -0
  269. datahub/ingestion/source/state/stateful_ingestion_base.py +36 -11
  270. datahub/ingestion/source/superset.py +314 -67
  271. datahub/ingestion/source/tableau/tableau.py +135 -59
  272. datahub/ingestion/source/tableau/tableau_common.py +9 -2
  273. datahub/ingestion/source/tableau/tableau_constant.py +1 -4
  274. datahub/ingestion/source/tableau/tableau_server_wrapper.py +3 -0
  275. datahub/ingestion/source/unity/config.py +160 -40
  276. datahub/ingestion/source/unity/connection.py +61 -0
  277. datahub/ingestion/source/unity/connection_test.py +1 -0
  278. datahub/ingestion/source/unity/platform_resource_repository.py +19 -0
  279. datahub/ingestion/source/unity/proxy.py +794 -51
  280. datahub/ingestion/source/unity/proxy_patch.py +321 -0
  281. datahub/ingestion/source/unity/proxy_types.py +36 -2
  282. datahub/ingestion/source/unity/report.py +15 -3
  283. datahub/ingestion/source/unity/source.py +465 -131
  284. datahub/ingestion/source/unity/tag_entities.py +197 -0
  285. datahub/ingestion/source/unity/usage.py +46 -4
  286. datahub/ingestion/source/usage/clickhouse_usage.py +4 -1
  287. datahub/ingestion/source/usage/starburst_trino_usage.py +5 -2
  288. datahub/ingestion/source/usage/usage_common.py +4 -3
  289. datahub/ingestion/source/vertexai/vertexai.py +1 -1
  290. datahub/ingestion/source_config/pulsar.py +3 -1
  291. datahub/ingestion/source_report/ingestion_stage.py +50 -11
  292. datahub/ingestion/transformer/add_dataset_ownership.py +18 -2
  293. datahub/ingestion/transformer/base_transformer.py +8 -5
  294. datahub/ingestion/transformer/set_browse_path.py +112 -0
  295. datahub/integrations/assertion/snowflake/compiler.py +4 -3
  296. datahub/metadata/_internal_schema_classes.py +6806 -4871
  297. datahub/metadata/_urns/urn_defs.py +1767 -1539
  298. datahub/metadata/com/linkedin/pegasus2avro/application/__init__.py +19 -0
  299. datahub/metadata/com/linkedin/pegasus2avro/common/__init__.py +2 -0
  300. datahub/metadata/com/linkedin/pegasus2avro/file/__init__.py +19 -0
  301. datahub/metadata/com/linkedin/pegasus2avro/identity/__init__.py +2 -0
  302. datahub/metadata/com/linkedin/pegasus2avro/logical/__init__.py +15 -0
  303. datahub/metadata/com/linkedin/pegasus2avro/metadata/key/__init__.py +6 -0
  304. datahub/metadata/com/linkedin/pegasus2avro/module/__init__.py +31 -0
  305. datahub/metadata/com/linkedin/pegasus2avro/platform/event/v1/__init__.py +4 -0
  306. datahub/metadata/com/linkedin/pegasus2avro/role/__init__.py +2 -0
  307. datahub/metadata/com/linkedin/pegasus2avro/settings/asset/__init__.py +19 -0
  308. datahub/metadata/com/linkedin/pegasus2avro/settings/global/__init__.py +8 -0
  309. datahub/metadata/com/linkedin/pegasus2avro/template/__init__.py +31 -0
  310. datahub/metadata/schema.avsc +18395 -16979
  311. datahub/metadata/schemas/Actors.avsc +38 -1
  312. datahub/metadata/schemas/ApplicationKey.avsc +31 -0
  313. datahub/metadata/schemas/ApplicationProperties.avsc +72 -0
  314. datahub/metadata/schemas/Applications.avsc +38 -0
  315. datahub/metadata/schemas/AssetSettings.avsc +63 -0
  316. datahub/metadata/schemas/ChartInfo.avsc +2 -1
  317. datahub/metadata/schemas/ChartKey.avsc +1 -0
  318. datahub/metadata/schemas/ContainerKey.avsc +1 -0
  319. datahub/metadata/schemas/ContainerProperties.avsc +8 -0
  320. datahub/metadata/schemas/CorpUserEditableInfo.avsc +1 -1
  321. datahub/metadata/schemas/CorpUserSettings.avsc +50 -0
  322. datahub/metadata/schemas/DashboardKey.avsc +1 -0
  323. datahub/metadata/schemas/DataFlowInfo.avsc +8 -0
  324. datahub/metadata/schemas/DataFlowKey.avsc +1 -0
  325. datahub/metadata/schemas/DataHubFileInfo.avsc +230 -0
  326. datahub/metadata/schemas/DataHubFileKey.avsc +21 -0
  327. datahub/metadata/schemas/DataHubPageModuleKey.avsc +21 -0
  328. datahub/metadata/schemas/DataHubPageModuleProperties.avsc +298 -0
  329. datahub/metadata/schemas/DataHubPageTemplateKey.avsc +21 -0
  330. datahub/metadata/schemas/DataHubPageTemplateProperties.avsc +251 -0
  331. datahub/metadata/schemas/DataHubPolicyInfo.avsc +12 -1
  332. datahub/metadata/schemas/DataJobInfo.avsc +8 -0
  333. datahub/metadata/schemas/DataJobInputOutput.avsc +8 -0
  334. datahub/metadata/schemas/DataJobKey.avsc +1 -0
  335. datahub/metadata/schemas/DataProcessKey.avsc +8 -0
  336. datahub/metadata/schemas/DataProductKey.avsc +3 -1
  337. datahub/metadata/schemas/DataProductProperties.avsc +1 -1
  338. datahub/metadata/schemas/DatasetKey.avsc +11 -1
  339. datahub/metadata/schemas/DatasetUsageStatistics.avsc +8 -0
  340. datahub/metadata/schemas/DomainKey.avsc +2 -1
  341. datahub/metadata/schemas/GlobalSettingsInfo.avsc +134 -0
  342. datahub/metadata/schemas/GlossaryNodeKey.avsc +2 -1
  343. datahub/metadata/schemas/GlossaryTermKey.avsc +3 -1
  344. datahub/metadata/schemas/IcebergWarehouseInfo.avsc +8 -0
  345. datahub/metadata/schemas/IncidentInfo.avsc +3 -3
  346. datahub/metadata/schemas/InstitutionalMemory.avsc +31 -0
  347. datahub/metadata/schemas/LogicalParent.avsc +145 -0
  348. datahub/metadata/schemas/MLFeatureKey.avsc +1 -0
  349. datahub/metadata/schemas/MLFeatureTableKey.avsc +1 -0
  350. datahub/metadata/schemas/MLModelDeploymentKey.avsc +8 -0
  351. datahub/metadata/schemas/MLModelGroupKey.avsc +11 -1
  352. datahub/metadata/schemas/MLModelKey.avsc +9 -0
  353. datahub/metadata/schemas/MLPrimaryKeyKey.avsc +1 -0
  354. datahub/metadata/schemas/MetadataChangeEvent.avsc +151 -47
  355. datahub/metadata/schemas/MetadataChangeLog.avsc +62 -44
  356. datahub/metadata/schemas/MetadataChangeProposal.avsc +61 -0
  357. datahub/metadata/schemas/NotebookKey.avsc +1 -0
  358. datahub/metadata/schemas/Operation.avsc +4 -2
  359. datahub/metadata/schemas/Ownership.avsc +69 -0
  360. datahub/metadata/schemas/QuerySubjects.avsc +1 -12
  361. datahub/metadata/schemas/RelationshipChangeEvent.avsc +215 -0
  362. datahub/metadata/schemas/SchemaFieldKey.avsc +4 -1
  363. datahub/metadata/schemas/StructuredProperties.avsc +69 -0
  364. datahub/metadata/schemas/StructuredPropertySettings.avsc +9 -0
  365. datahub/metadata/schemas/SystemMetadata.avsc +61 -0
  366. datahub/metadata/schemas/UpstreamLineage.avsc +9 -0
  367. datahub/sdk/__init__.py +2 -0
  368. datahub/sdk/_all_entities.py +7 -0
  369. datahub/sdk/_shared.py +249 -5
  370. datahub/sdk/chart.py +386 -0
  371. datahub/sdk/container.py +7 -0
  372. datahub/sdk/dashboard.py +453 -0
  373. datahub/sdk/dataflow.py +7 -0
  374. datahub/sdk/datajob.py +45 -13
  375. datahub/sdk/dataset.py +56 -2
  376. datahub/sdk/entity_client.py +111 -9
  377. datahub/sdk/lineage_client.py +663 -82
  378. datahub/sdk/main_client.py +50 -16
  379. datahub/sdk/mlmodel.py +120 -38
  380. datahub/sdk/mlmodelgroup.py +7 -0
  381. datahub/sdk/search_client.py +7 -3
  382. datahub/sdk/search_filters.py +304 -36
  383. datahub/secret/datahub_secret_store.py +3 -0
  384. datahub/secret/environment_secret_store.py +29 -0
  385. datahub/secret/file_secret_store.py +49 -0
  386. datahub/specific/aspect_helpers/fine_grained_lineage.py +76 -0
  387. datahub/specific/aspect_helpers/siblings.py +73 -0
  388. datahub/specific/aspect_helpers/structured_properties.py +27 -0
  389. datahub/specific/chart.py +1 -1
  390. datahub/specific/datajob.py +15 -1
  391. datahub/specific/dataproduct.py +4 -0
  392. datahub/specific/dataset.py +39 -59
  393. datahub/sql_parsing/split_statements.py +13 -0
  394. datahub/sql_parsing/sql_parsing_aggregator.py +70 -26
  395. datahub/sql_parsing/sqlglot_lineage.py +196 -42
  396. datahub/sql_parsing/sqlglot_utils.py +12 -4
  397. datahub/sql_parsing/tool_meta_extractor.py +1 -3
  398. datahub/telemetry/telemetry.py +28 -14
  399. datahub/testing/sdk_v2_helpers.py +7 -1
  400. datahub/upgrade/upgrade.py +73 -17
  401. datahub/utilities/file_backed_collections.py +8 -9
  402. datahub/utilities/is_pytest.py +3 -2
  403. datahub/utilities/logging_manager.py +22 -6
  404. datahub/utilities/mapping.py +29 -2
  405. datahub/utilities/sample_data.py +5 -4
  406. datahub/utilities/server_config_util.py +10 -1
  407. datahub/utilities/sqlalchemy_query_combiner.py +5 -2
  408. datahub/utilities/stats_collections.py +4 -0
  409. datahub/utilities/urns/urn.py +41 -2
  410. datahub/emitter/sql_parsing_builder.py +0 -306
  411. datahub/ingestion/source/redshift/lineage_v2.py +0 -466
  412. {acryl_datahub-1.1.1rc4.dist-info → acryl_datahub-1.3.0.1rc9.dist-info}/WHEEL +0 -0
  413. {acryl_datahub-1.1.1rc4.dist-info → acryl_datahub-1.3.0.1rc9.dist-info}/licenses/LICENSE +0 -0
  414. {acryl_datahub-1.1.1rc4.dist-info → acryl_datahub-1.3.0.1rc9.dist-info}/top_level.txt +0 -0
@@ -42,7 +42,44 @@
42
42
  "name": "users",
43
43
  "default": null,
44
44
  "doc": "List of provisioned users of a role"
45
+ },
46
+ {
47
+ "type": [
48
+ "null",
49
+ {
50
+ "type": "array",
51
+ "items": {
52
+ "type": "record",
53
+ "name": "RoleGroup",
54
+ "namespace": "com.linkedin.pegasus2avro.role",
55
+ "fields": [
56
+ {
57
+ "Relationship": {
58
+ "entityTypes": [
59
+ "corpGroup"
60
+ ],
61
+ "name": "Has"
62
+ },
63
+ "java": {
64
+ "class": "com.linkedin.pegasus2avro.common.urn.Urn"
65
+ },
66
+ "type": "string",
67
+ "name": "group",
68
+ "doc": "Link provisioned corp group for a role",
69
+ "Urn": "Urn",
70
+ "entityTypes": [
71
+ "corpGroup"
72
+ ]
73
+ }
74
+ ],
75
+ "doc": "Provisioned groups of a role"
76
+ }
77
+ }
78
+ ],
79
+ "name": "groups",
80
+ "default": null,
81
+ "doc": "List of provisioned groups of a role"
45
82
  }
46
83
  ],
47
- "doc": "Provisioned users of a role"
84
+ "doc": "Provisioned users and groups of a role"
48
85
  }
@@ -0,0 +1,31 @@
1
+ {
2
+ "type": "record",
3
+ "Aspect": {
4
+ "name": "applicationKey",
5
+ "keyForEntity": "application",
6
+ "entityCategory": "core",
7
+ "entityAspects": [
8
+ "applicationProperties",
9
+ "ownership",
10
+ "glossaryTerms",
11
+ "globalTags",
12
+ "domains",
13
+ "institutionalMemory",
14
+ "status",
15
+ "structuredProperties",
16
+ "forms",
17
+ "testResults",
18
+ "subTypes"
19
+ ]
20
+ },
21
+ "name": "ApplicationKey",
22
+ "namespace": "com.linkedin.pegasus2avro.application",
23
+ "fields": [
24
+ {
25
+ "type": "string",
26
+ "name": "id",
27
+ "doc": "A unique id for the Application."
28
+ }
29
+ ],
30
+ "doc": "Key for a Query"
31
+ }
@@ -0,0 +1,72 @@
1
+ {
2
+ "type": "record",
3
+ "Aspect": {
4
+ "name": "applicationProperties"
5
+ },
6
+ "name": "ApplicationProperties",
7
+ "namespace": "com.linkedin.pegasus2avro.application",
8
+ "fields": [
9
+ {
10
+ "Searchable": {
11
+ "/*": {
12
+ "fieldType": "TEXT",
13
+ "queryByDefault": true
14
+ }
15
+ },
16
+ "type": {
17
+ "type": "map",
18
+ "values": "string"
19
+ },
20
+ "name": "customProperties",
21
+ "default": {},
22
+ "doc": "Custom property bag."
23
+ },
24
+ {
25
+ "Searchable": {
26
+ "fieldType": "KEYWORD"
27
+ },
28
+ "java": {
29
+ "class": "com.linkedin.pegasus2avro.common.url.Url",
30
+ "coercerClass": "com.linkedin.pegasus2avro.common.url.UrlCoercer"
31
+ },
32
+ "type": [
33
+ "null",
34
+ "string"
35
+ ],
36
+ "name": "externalUrl",
37
+ "default": null,
38
+ "doc": "URL where the reference exist"
39
+ },
40
+ {
41
+ "Searchable": {
42
+ "boostScore": 10.0,
43
+ "enableAutocomplete": true,
44
+ "fieldNameAliases": [
45
+ "_entityName"
46
+ ],
47
+ "fieldType": "WORD_GRAM"
48
+ },
49
+ "type": [
50
+ "null",
51
+ "string"
52
+ ],
53
+ "name": "name",
54
+ "default": null,
55
+ "doc": "Display name of the Application"
56
+ },
57
+ {
58
+ "Searchable": {
59
+ "fieldType": "TEXT",
60
+ "hasValuesFieldName": "hasDescription"
61
+ },
62
+ "type": [
63
+ "null",
64
+ "string"
65
+ ],
66
+ "name": "description",
67
+ "default": null,
68
+ "doc": "Documentation of the application"
69
+ }
70
+ ],
71
+ "doc": "The main properties of an Application"
72
+ }
@@ -0,0 +1,38 @@
1
+ {
2
+ "type": "record",
3
+ "Aspect": {
4
+ "name": "applications"
5
+ },
6
+ "name": "Applications",
7
+ "namespace": "com.linkedin.pegasus2avro.application",
8
+ "fields": [
9
+ {
10
+ "Relationship": {
11
+ "/*": {
12
+ "entityTypes": [
13
+ "application"
14
+ ],
15
+ "name": "AssociatedWith"
16
+ }
17
+ },
18
+ "Searchable": {
19
+ "/*": {
20
+ "addToFilters": true,
21
+ "fieldName": "applications",
22
+ "fieldType": "URN",
23
+ "filterNameOverride": "Application",
24
+ "hasValuesFieldName": "hasApplication"
25
+ }
26
+ },
27
+ "type": {
28
+ "type": "array",
29
+ "items": "string"
30
+ },
31
+ "name": "applications",
32
+ "doc": "The Applications attached to an Asset",
33
+ "Urn": "Urn",
34
+ "urn_is_array": true
35
+ }
36
+ ],
37
+ "doc": "Links from an Asset to its Applications"
38
+ }
@@ -0,0 +1,63 @@
1
+ {
2
+ "type": "record",
3
+ "Aspect": {
4
+ "name": "assetSettings"
5
+ },
6
+ "name": "AssetSettings",
7
+ "namespace": "com.linkedin.pegasus2avro.settings.asset",
8
+ "fields": [
9
+ {
10
+ "type": [
11
+ "null",
12
+ {
13
+ "type": "record",
14
+ "name": "AssetSummarySettings",
15
+ "namespace": "com.linkedin.pegasus2avro.settings.asset",
16
+ "fields": [
17
+ {
18
+ "Relationship": {
19
+ "/*/template": {
20
+ "entityTypes": [
21
+ "dataHubPageTemplate"
22
+ ],
23
+ "name": "HasSummaryTemplate"
24
+ }
25
+ },
26
+ "type": [
27
+ {
28
+ "type": "array",
29
+ "items": {
30
+ "type": "record",
31
+ "name": "AssetSummarySettingsTemplate",
32
+ "namespace": "com.linkedin.pegasus2avro.settings.asset",
33
+ "fields": [
34
+ {
35
+ "java": {
36
+ "class": "com.linkedin.pegasus2avro.common.urn.Urn"
37
+ },
38
+ "type": "string",
39
+ "name": "template",
40
+ "doc": "The urn of the template",
41
+ "Urn": "Urn"
42
+ }
43
+ ],
44
+ "doc": "Object containing the template and any additional info for asset summary settings"
45
+ }
46
+ },
47
+ "null"
48
+ ],
49
+ "name": "templates",
50
+ "default": [],
51
+ "doc": "The list of templates applied to this asset in order. Right now we only expect one."
52
+ }
53
+ ],
54
+ "doc": "Information related to the asset summary for this asset"
55
+ }
56
+ ],
57
+ "name": "assetSummary",
58
+ "default": null,
59
+ "doc": "Information related to the asset summary for this asset"
60
+ }
61
+ ],
62
+ "doc": "Settings associated with this asset"
63
+ }
@@ -188,7 +188,8 @@
188
188
  "createdActor": "inputEdges/*/created/actor",
189
189
  "createdOn": "inputEdges/*/created/time",
190
190
  "entityTypes": [
191
- "dataset"
191
+ "dataset",
192
+ "chart"
192
193
  ],
193
194
  "isLineage": true,
194
195
  "name": "Consumes",
@@ -13,6 +13,7 @@
13
13
  "embed",
14
14
  "browsePaths",
15
15
  "domains",
16
+ "applications",
16
17
  "container",
17
18
  "deprecation",
18
19
  "ownership",
@@ -18,6 +18,7 @@
18
18
  "browsePaths",
19
19
  "status",
20
20
  "domains",
21
+ "applications",
21
22
  "browsePathsV2",
22
23
  "structuredProperties",
23
24
  "forms",
@@ -93,13 +93,17 @@
93
93
  "DEV": "Designates development fabrics",
94
94
  "EI": "Designates early-integration fabrics",
95
95
  "NON_PROD": "Designates non-production fabrics",
96
+ "PRD": "Alternative Prod spelling",
96
97
  "PRE": "Designates pre-production fabrics",
97
98
  "PROD": "Designates production fabrics",
98
99
  "QA": "Designates quality assurance fabrics",
99
100
  "RVW": "Designates review fabrics",
100
101
  "SANDBOX": "Designates sandbox fabrics",
102
+ "SBX": "Alternative spelling for sandbox",
103
+ "SIT": "System Integration Testing",
101
104
  "STG": "Designates staging fabrics",
102
105
  "TEST": "Designates testing fabrics",
106
+ "TST": "Alternative Test spelling",
103
107
  "UAT": "Designates user acceptance testing fabrics"
104
108
  },
105
109
  "name": "FabricType",
@@ -116,6 +120,10 @@
116
120
  "PROD",
117
121
  "CORP",
118
122
  "RVW",
123
+ "PRD",
124
+ "TST",
125
+ "SIT",
126
+ "SBX",
119
127
  "SANDBOX"
120
128
  ],
121
129
  "doc": "Fabric group type"
@@ -53,7 +53,7 @@
53
53
  },
54
54
  "type": "string",
55
55
  "name": "pictureLink",
56
- "default": "https://raw.githubusercontent.com/datahub-project/datahub/master/datahub-web-react/src/images/default_avatar.png",
56
+ "default": "assets/platforms/default_avatar.png",
57
57
  "doc": "A URL which points to a picture which user wants to set as a profile photo"
58
58
  },
59
59
  {
@@ -159,6 +159,56 @@
159
159
  "name": "notificationSettings",
160
160
  "default": null,
161
161
  "doc": "Notification settings for a user"
162
+ },
163
+ {
164
+ "type": [
165
+ "null",
166
+ {
167
+ "type": "record",
168
+ "name": "CorpUserHomePageSettings",
169
+ "namespace": "com.linkedin.pegasus2avro.identity",
170
+ "fields": [
171
+ {
172
+ "Relationship": {
173
+ "entityTypes": [
174
+ "dataHubPageTemplate"
175
+ ],
176
+ "name": "HasPersonalPageTemplate"
177
+ },
178
+ "java": {
179
+ "class": "com.linkedin.pegasus2avro.common.urn.Urn"
180
+ },
181
+ "type": [
182
+ "null",
183
+ "string"
184
+ ],
185
+ "name": "pageTemplate",
186
+ "default": null,
187
+ "doc": "The page template that will be rendered in the UI by default for this user",
188
+ "Urn": "Urn",
189
+ "entityTypes": [
190
+ "dataHubPageTemplate"
191
+ ]
192
+ },
193
+ {
194
+ "type": [
195
+ "null",
196
+ {
197
+ "type": "array",
198
+ "items": "string"
199
+ }
200
+ ],
201
+ "name": "dismissedAnnouncements",
202
+ "default": null,
203
+ "doc": "The list of announcement urns that have been dismissed by the user"
204
+ }
205
+ ],
206
+ "doc": "Settings related to the home page for a user"
207
+ }
208
+ ],
209
+ "name": "homePage",
210
+ "default": null,
211
+ "doc": "Settings related to the home page for a user"
162
212
  }
163
213
  ],
164
214
  "doc": "Settings that a user can customize through the datahub ui"
@@ -6,6 +6,7 @@
6
6
  "entityCategory": "_unset_",
7
7
  "entityAspects": [
8
8
  "domains",
9
+ "applications",
9
10
  "container",
10
11
  "deprecation",
11
12
  "dashboardUsageStatistics",
@@ -147,13 +147,17 @@
147
147
  "DEV": "Designates development fabrics",
148
148
  "EI": "Designates early-integration fabrics",
149
149
  "NON_PROD": "Designates non-production fabrics",
150
+ "PRD": "Alternative Prod spelling",
150
151
  "PRE": "Designates pre-production fabrics",
151
152
  "PROD": "Designates production fabrics",
152
153
  "QA": "Designates quality assurance fabrics",
153
154
  "RVW": "Designates review fabrics",
154
155
  "SANDBOX": "Designates sandbox fabrics",
156
+ "SBX": "Alternative spelling for sandbox",
157
+ "SIT": "System Integration Testing",
155
158
  "STG": "Designates staging fabrics",
156
159
  "TEST": "Designates testing fabrics",
160
+ "TST": "Alternative Test spelling",
157
161
  "UAT": "Designates user acceptance testing fabrics"
158
162
  },
159
163
  "name": "FabricType",
@@ -170,6 +174,10 @@
170
174
  "PROD",
171
175
  "CORP",
172
176
  "RVW",
177
+ "PRD",
178
+ "TST",
179
+ "SIT",
180
+ "SBX",
173
181
  "SANDBOX"
174
182
  ],
175
183
  "doc": "Fabric group type"
@@ -6,6 +6,7 @@
6
6
  "entityCategory": "core",
7
7
  "entityAspects": [
8
8
  "domains",
9
+ "applications",
9
10
  "deprecation",
10
11
  "versionInfo",
11
12
  "dataFlowInfo",
@@ -0,0 +1,230 @@
1
+ {
2
+ "type": "record",
3
+ "Aspect": {
4
+ "name": "dataHubFileInfo"
5
+ },
6
+ "name": "DataHubFileInfo",
7
+ "namespace": "com.linkedin.pegasus2avro.file",
8
+ "fields": [
9
+ {
10
+ "type": {
11
+ "type": "record",
12
+ "name": "BucketStorageLocation",
13
+ "namespace": "com.linkedin.pegasus2avro.file",
14
+ "fields": [
15
+ {
16
+ "Searchable": {
17
+ "fieldType": "KEYWORD"
18
+ },
19
+ "type": "string",
20
+ "name": "storageBucket",
21
+ "doc": "The storage bucket this file is stored in"
22
+ },
23
+ {
24
+ "Searchable": {
25
+ "fieldType": "KEYWORD"
26
+ },
27
+ "type": "string",
28
+ "name": "storageKey",
29
+ "doc": "The key for where this file is stored inside of the given bucket"
30
+ }
31
+ ],
32
+ "doc": "Information where a file is stored"
33
+ },
34
+ "name": "bucketStorageLocation",
35
+ "doc": "Info about where a file is stored"
36
+ },
37
+ {
38
+ "Searchable": {
39
+ "fieldType": "TEXT_PARTIAL"
40
+ },
41
+ "type": "string",
42
+ "name": "originalFileName",
43
+ "doc": "The original filename as uploaded by the user"
44
+ },
45
+ {
46
+ "Searchable": {
47
+ "fieldType": "KEYWORD"
48
+ },
49
+ "type": "string",
50
+ "name": "mimeType",
51
+ "doc": "MIME type of the file (e.g., image/png, application/pdf)"
52
+ },
53
+ {
54
+ "type": "long",
55
+ "name": "sizeInBytes",
56
+ "doc": "Size of the file in bytes"
57
+ },
58
+ {
59
+ "Searchable": {
60
+ "fieldType": "KEYWORD"
61
+ },
62
+ "type": {
63
+ "type": "enum",
64
+ "symbolDocs": {
65
+ "ASSET_DOCUMENTATION": "File uploaded for entity documentation"
66
+ },
67
+ "name": "FileUploadScenario",
68
+ "namespace": "com.linkedin.pegasus2avro.file",
69
+ "symbols": [
70
+ "ASSET_DOCUMENTATION"
71
+ ]
72
+ },
73
+ "name": "scenario",
74
+ "doc": "The scenario/context in which this file was uploaded"
75
+ },
76
+ {
77
+ "Relationship": {
78
+ "entityTypes": [
79
+ "dataset",
80
+ "chart",
81
+ "container",
82
+ "dashboard",
83
+ "dataFlow",
84
+ "dataJob",
85
+ "glossaryTerm",
86
+ "glossaryNode",
87
+ "mlModel",
88
+ "mlFeature",
89
+ "notebook",
90
+ "mlFeatureTable",
91
+ "mlPrimaryKey",
92
+ "mlModelGroup",
93
+ "domain",
94
+ "dataProduct",
95
+ "businessAttribute"
96
+ ],
97
+ "name": "ReferencedBy"
98
+ },
99
+ "Searchable": {
100
+ "fieldType": "URN"
101
+ },
102
+ "java": {
103
+ "class": "com.linkedin.pegasus2avro.common.urn.Urn"
104
+ },
105
+ "type": [
106
+ "null",
107
+ "string"
108
+ ],
109
+ "name": "referencedByAsset",
110
+ "default": null,
111
+ "doc": "Optional URN of the entity this file is associated with (e.g., the dataset whose docs contain this file)",
112
+ "Urn": "Urn",
113
+ "entityTypes": [
114
+ "dataset",
115
+ "chart",
116
+ "container",
117
+ "dashboard",
118
+ "dataFlow",
119
+ "dataJob",
120
+ "glossaryTerm",
121
+ "glossaryNode",
122
+ "mlModel",
123
+ "mlFeature",
124
+ "notebook",
125
+ "mlFeatureTable",
126
+ "mlPrimaryKey",
127
+ "mlModelGroup",
128
+ "domain",
129
+ "dataProduct",
130
+ "businessAttribute"
131
+ ]
132
+ },
133
+ {
134
+ "Relationship": {
135
+ "entityTypes": [
136
+ "schemaField"
137
+ ],
138
+ "name": "ReferencedBy"
139
+ },
140
+ "Searchable": {
141
+ "fieldType": "URN"
142
+ },
143
+ "java": {
144
+ "class": "com.linkedin.pegasus2avro.common.urn.Urn"
145
+ },
146
+ "type": [
147
+ "null",
148
+ "string"
149
+ ],
150
+ "name": "schemaField",
151
+ "default": null,
152
+ "doc": "The dataset schema field urn this file is referenced by",
153
+ "Urn": "Urn",
154
+ "entityTypes": [
155
+ "schemaField"
156
+ ]
157
+ },
158
+ {
159
+ "Searchable": {
160
+ "/actor": {
161
+ "fieldName": "createdBy",
162
+ "fieldType": "URN"
163
+ },
164
+ "/time": {
165
+ "fieldName": "createdAt",
166
+ "fieldType": "DATETIME"
167
+ }
168
+ },
169
+ "type": {
170
+ "type": "record",
171
+ "name": "AuditStamp",
172
+ "namespace": "com.linkedin.pegasus2avro.common",
173
+ "fields": [
174
+ {
175
+ "type": "long",
176
+ "name": "time",
177
+ "doc": "When did the resource/association/sub-resource move into the specific lifecycle stage represented by this AuditEvent."
178
+ },
179
+ {
180
+ "java": {
181
+ "class": "com.linkedin.pegasus2avro.common.urn.Urn"
182
+ },
183
+ "type": "string",
184
+ "name": "actor",
185
+ "doc": "The entity (e.g. a member URN) which will be credited for moving the resource/association/sub-resource into the specific lifecycle stage. It is also the one used to authorize the change.",
186
+ "Urn": "Urn"
187
+ },
188
+ {
189
+ "java": {
190
+ "class": "com.linkedin.pegasus2avro.common.urn.Urn"
191
+ },
192
+ "type": [
193
+ "null",
194
+ "string"
195
+ ],
196
+ "name": "impersonator",
197
+ "default": null,
198
+ "doc": "The entity (e.g. a service URN) which performs the change on behalf of the Actor and must be authorized to act as the Actor.",
199
+ "Urn": "Urn"
200
+ },
201
+ {
202
+ "type": [
203
+ "null",
204
+ "string"
205
+ ],
206
+ "name": "message",
207
+ "default": null,
208
+ "doc": "Additional context around how DataHub was informed of the particular change. For example: was the change created by an automated process, or manually."
209
+ }
210
+ ],
211
+ "doc": "Data captured on a resource/association/sub-resource level giving insight into when that resource/association/sub-resource moved into a particular lifecycle stage, and who acted to move it into that specific lifecycle stage."
212
+ },
213
+ "name": "created",
214
+ "doc": "Timestamp when this file was created and by whom"
215
+ },
216
+ {
217
+ "Searchable": {
218
+ "fieldType": "KEYWORD"
219
+ },
220
+ "type": [
221
+ "null",
222
+ "string"
223
+ ],
224
+ "name": "contentHash",
225
+ "default": null,
226
+ "doc": "SHA-256 hash of file contents"
227
+ }
228
+ ],
229
+ "doc": "Information about a DataHub file - a file stored in S3 for use within DataHub platform features like documentation, home pages, and announcements."
230
+ }
@@ -0,0 +1,21 @@
1
+ {
2
+ "type": "record",
3
+ "Aspect": {
4
+ "name": "dataHubFileKey",
5
+ "keyForEntity": "dataHubFile",
6
+ "entityCategory": "core",
7
+ "entityAspects": [
8
+ "dataHubFileInfo"
9
+ ]
10
+ },
11
+ "name": "DataHubFileKey",
12
+ "namespace": "com.linkedin.pegasus2avro.metadata.key",
13
+ "fields": [
14
+ {
15
+ "type": "string",
16
+ "name": "id",
17
+ "doc": "Unique id for the file."
18
+ }
19
+ ],
20
+ "doc": "Key for a DataHubFile"
21
+ }