acryl-datahub 0.15.0.6rc3__py3-none-any.whl → 1.0.0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of acryl-datahub might be problematic. Click here for more details.
- {acryl_datahub-0.15.0.6rc3.dist-info → acryl_datahub-1.0.0.dist-info}/METADATA +2552 -2523
- {acryl_datahub-0.15.0.6rc3.dist-info → acryl_datahub-1.0.0.dist-info}/RECORD +204 -191
- {acryl_datahub-0.15.0.6rc3.dist-info → acryl_datahub-1.0.0.dist-info}/WHEEL +1 -1
- {acryl_datahub-0.15.0.6rc3.dist-info → acryl_datahub-1.0.0.dist-info}/entry_points.txt +1 -0
- datahub/_version.py +1 -1
- datahub/api/entities/common/serialized_value.py +4 -3
- datahub/api/entities/dataset/dataset.py +731 -42
- datahub/api/entities/structuredproperties/structuredproperties.py +2 -2
- datahub/cli/check_cli.py +72 -19
- datahub/cli/docker_cli.py +3 -3
- datahub/cli/iceberg_cli.py +1 -1
- datahub/cli/ingest_cli.py +30 -93
- datahub/cli/lite_cli.py +4 -2
- datahub/cli/specific/dataproduct_cli.py +1 -1
- datahub/cli/specific/dataset_cli.py +128 -14
- datahub/configuration/common.py +10 -2
- datahub/configuration/git.py +1 -3
- datahub/configuration/kafka.py +1 -1
- datahub/emitter/mce_builder.py +28 -13
- datahub/emitter/mcp_builder.py +4 -1
- datahub/emitter/response_helper.py +145 -0
- datahub/emitter/rest_emitter.py +323 -10
- datahub/ingestion/api/decorators.py +1 -1
- datahub/ingestion/api/source_helpers.py +4 -0
- datahub/ingestion/fs/s3_fs.py +2 -2
- datahub/ingestion/glossary/classification_mixin.py +1 -5
- datahub/ingestion/graph/client.py +41 -22
- datahub/ingestion/graph/entity_versioning.py +3 -3
- datahub/ingestion/graph/filters.py +64 -37
- datahub/ingestion/reporting/datahub_ingestion_run_summary_provider.py +1 -6
- datahub/ingestion/run/pipeline.py +112 -148
- datahub/ingestion/run/sink_callback.py +77 -0
- datahub/ingestion/sink/datahub_rest.py +8 -0
- datahub/ingestion/source/abs/config.py +2 -4
- datahub/ingestion/source/bigquery_v2/bigquery_audit.py +1 -1
- datahub/ingestion/source/bigquery_v2/bigquery_config.py +2 -46
- datahub/ingestion/source/bigquery_v2/bigquery_schema.py +6 -1
- datahub/ingestion/source/bigquery_v2/bigquery_schema_gen.py +7 -4
- datahub/ingestion/source/cassandra/cassandra.py +152 -233
- datahub/ingestion/source/cassandra/cassandra_api.py +13 -5
- datahub/ingestion/source/common/gcp_credentials_config.py +53 -0
- datahub/ingestion/source/common/subtypes.py +12 -0
- datahub/ingestion/source/csv_enricher.py +3 -3
- datahub/ingestion/source/data_lake_common/path_spec.py +1 -3
- datahub/ingestion/source/dbt/dbt_common.py +3 -5
- datahub/ingestion/source/dbt/dbt_tests.py +4 -8
- datahub/ingestion/source/delta_lake/config.py +8 -1
- datahub/ingestion/source/delta_lake/report.py +4 -2
- datahub/ingestion/source/delta_lake/source.py +20 -5
- datahub/ingestion/source/dremio/dremio_api.py +4 -8
- datahub/ingestion/source/dremio/dremio_aspects.py +3 -5
- datahub/ingestion/source/dynamodb/dynamodb.py +1 -0
- datahub/ingestion/source/elastic_search.py +26 -6
- datahub/ingestion/source/feast.py +27 -8
- datahub/ingestion/source/file.py +6 -3
- datahub/ingestion/source/gc/dataprocess_cleanup.py +1 -1
- datahub/ingestion/source/gc/execution_request_cleanup.py +2 -1
- datahub/ingestion/source/ge_data_profiler.py +12 -15
- datahub/ingestion/source/iceberg/iceberg.py +46 -12
- datahub/ingestion/source/iceberg/iceberg_common.py +71 -21
- datahub/ingestion/source/identity/okta.py +37 -7
- datahub/ingestion/source/kafka/kafka.py +1 -1
- datahub/ingestion/source/kafka_connect/common.py +2 -7
- datahub/ingestion/source/kafka_connect/kafka_connect.py +97 -4
- datahub/ingestion/source/kafka_connect/sink_connectors.py +2 -2
- datahub/ingestion/source/kafka_connect/source_connectors.py +6 -9
- datahub/ingestion/source/looker/looker_common.py +3 -3
- datahub/ingestion/source/looker/looker_file_loader.py +2 -2
- datahub/ingestion/source/looker/looker_lib_wrapper.py +2 -1
- datahub/ingestion/source/looker/looker_source.py +1 -1
- datahub/ingestion/source/looker/looker_template_language.py +4 -2
- datahub/ingestion/source/looker/lookml_source.py +3 -2
- datahub/ingestion/source/metabase.py +57 -35
- datahub/ingestion/source/metadata/business_glossary.py +45 -3
- datahub/ingestion/source/metadata/lineage.py +2 -2
- datahub/ingestion/source/mlflow.py +365 -35
- datahub/ingestion/source/mode.py +18 -8
- datahub/ingestion/source/neo4j/neo4j_source.py +27 -7
- datahub/ingestion/source/nifi.py +37 -11
- datahub/ingestion/source/openapi.py +1 -1
- datahub/ingestion/source/openapi_parser.py +49 -17
- datahub/ingestion/source/powerbi/m_query/parser.py +3 -2
- datahub/ingestion/source/powerbi/m_query/tree_function.py +2 -1
- datahub/ingestion/source/powerbi/powerbi.py +1 -3
- datahub/ingestion/source/powerbi/rest_api_wrapper/data_resolver.py +2 -1
- datahub/ingestion/source/powerbi_report_server/report_server.py +26 -7
- datahub/ingestion/source/powerbi_report_server/report_server_domain.py +1 -1
- datahub/ingestion/source/preset.py +7 -4
- datahub/ingestion/source/pulsar.py +3 -2
- datahub/ingestion/source/qlik_sense/websocket_connection.py +4 -2
- datahub/ingestion/source/redash.py +31 -7
- datahub/ingestion/source/redshift/config.py +4 -0
- datahub/ingestion/source/redshift/datashares.py +236 -0
- datahub/ingestion/source/redshift/lineage.py +6 -2
- datahub/ingestion/source/redshift/lineage_v2.py +24 -9
- datahub/ingestion/source/redshift/profile.py +1 -1
- datahub/ingestion/source/redshift/query.py +133 -33
- datahub/ingestion/source/redshift/redshift.py +46 -73
- datahub/ingestion/source/redshift/redshift_schema.py +186 -6
- datahub/ingestion/source/redshift/report.py +3 -0
- datahub/ingestion/source/s3/config.py +5 -5
- datahub/ingestion/source/s3/source.py +20 -41
- datahub/ingestion/source/salesforce.py +550 -275
- datahub/ingestion/source/schema_inference/object.py +1 -1
- datahub/ingestion/source/sigma/sigma.py +1 -1
- datahub/ingestion/source/slack/slack.py +31 -10
- datahub/ingestion/source/snowflake/snowflake_connection.py +2 -2
- datahub/ingestion/source/snowflake/snowflake_queries.py +19 -13
- datahub/ingestion/source/snowflake/snowflake_query.py +6 -4
- datahub/ingestion/source/snowflake/snowflake_schema.py +3 -4
- datahub/ingestion/source/snowflake/snowflake_v2.py +1 -1
- datahub/ingestion/source/sql/athena.py +10 -16
- datahub/ingestion/source/sql/druid.py +1 -5
- datahub/ingestion/source/sql/hive.py +15 -6
- datahub/ingestion/source/sql/hive_metastore.py +3 -2
- datahub/ingestion/source/sql/mssql/job_models.py +29 -0
- datahub/ingestion/source/sql/mssql/source.py +11 -5
- datahub/ingestion/source/sql/oracle.py +127 -63
- datahub/ingestion/source/sql/sql_common.py +6 -12
- datahub/ingestion/source/sql/sql_types.py +2 -2
- datahub/ingestion/source/sql/teradata.py +7 -5
- datahub/ingestion/source/sql/trino.py +2 -2
- datahub/ingestion/source/state/stale_entity_removal_handler.py +4 -8
- datahub/ingestion/source/superset.py +222 -62
- datahub/ingestion/source/tableau/tableau.py +22 -6
- datahub/ingestion/source/tableau/tableau_common.py +3 -2
- datahub/ingestion/source/unity/ge_profiler.py +2 -1
- datahub/ingestion/source/unity/source.py +11 -1
- datahub/ingestion/source/vertexai.py +697 -0
- datahub/ingestion/source_config/pulsar.py +3 -1
- datahub/ingestion/transformer/pattern_cleanup_ownership.py +25 -7
- datahub/lite/duckdb_lite.py +3 -10
- datahub/lite/lite_local.py +1 -1
- datahub/lite/lite_util.py +4 -3
- datahub/metadata/_schema_classes.py +714 -417
- datahub/metadata/_urns/urn_defs.py +1673 -1649
- datahub/metadata/com/linkedin/pegasus2avro/incident/__init__.py +4 -0
- datahub/metadata/schema.avsc +16438 -16603
- datahub/metadata/schemas/AssertionInfo.avsc +3 -1
- datahub/metadata/schemas/BusinessAttributeInfo.avsc +6 -2
- datahub/metadata/schemas/BusinessAttributes.avsc +6 -0
- datahub/metadata/schemas/ChartInfo.avsc +1 -0
- datahub/metadata/schemas/CorpGroupKey.avsc +2 -1
- datahub/metadata/schemas/CorpUserInfo.avsc +13 -0
- datahub/metadata/schemas/CorpUserKey.avsc +2 -1
- datahub/metadata/schemas/DataHubIngestionSourceInfo.avsc +8 -3
- datahub/metadata/schemas/DataProcessInstanceInput.avsc +129 -1
- datahub/metadata/schemas/DataProcessInstanceOutput.avsc +131 -3
- datahub/metadata/schemas/DataProcessKey.avsc +2 -1
- datahub/metadata/schemas/DataProductKey.avsc +2 -1
- datahub/metadata/schemas/DomainKey.avsc +2 -1
- datahub/metadata/schemas/EditableSchemaMetadata.avsc +6 -2
- datahub/metadata/schemas/GlossaryNodeKey.avsc +3 -1
- datahub/metadata/schemas/GlossaryTermKey.avsc +2 -1
- datahub/metadata/schemas/GlossaryTerms.avsc +3 -1
- datahub/metadata/schemas/IncidentInfo.avsc +130 -46
- datahub/metadata/schemas/InputFields.avsc +3 -1
- datahub/metadata/schemas/MLFeatureKey.avsc +2 -1
- datahub/metadata/schemas/MLFeatureTableKey.avsc +2 -1
- datahub/metadata/schemas/MLModelDeploymentKey.avsc +2 -1
- datahub/metadata/schemas/MLModelGroupKey.avsc +3 -1
- datahub/metadata/schemas/MLModelKey.avsc +3 -1
- datahub/metadata/schemas/MLPrimaryKeyKey.avsc +2 -1
- datahub/metadata/schemas/MetadataChangeEvent.avsc +20 -2
- datahub/metadata/schemas/PostKey.avsc +2 -1
- datahub/metadata/schemas/SchemaFieldKey.avsc +2 -1
- datahub/metadata/schemas/SchemaMetadata.avsc +3 -1
- datahub/metadata/schemas/StructuredPropertyDefinition.avsc +14 -0
- datahub/metadata/schemas/VersionProperties.avsc +18 -0
- datahub/metadata/schemas/VersionSetProperties.avsc +5 -0
- datahub/pydantic/__init__.py +0 -0
- datahub/pydantic/compat.py +58 -0
- datahub/sdk/__init__.py +30 -12
- datahub/sdk/_all_entities.py +1 -1
- datahub/sdk/_attribution.py +4 -0
- datahub/sdk/_shared.py +251 -16
- datahub/sdk/_utils.py +35 -0
- datahub/sdk/container.py +29 -5
- datahub/sdk/dataset.py +118 -20
- datahub/sdk/{_entity.py → entity.py} +24 -1
- datahub/sdk/entity_client.py +1 -1
- datahub/sdk/main_client.py +23 -0
- datahub/sdk/resolver_client.py +17 -29
- datahub/sdk/search_client.py +50 -0
- datahub/sdk/search_filters.py +374 -0
- datahub/specific/dataset.py +3 -4
- datahub/sql_parsing/_sqlglot_patch.py +2 -10
- datahub/sql_parsing/schema_resolver.py +1 -1
- datahub/sql_parsing/split_statements.py +20 -13
- datahub/sql_parsing/sql_parsing_common.py +7 -0
- datahub/sql_parsing/sqlglot_lineage.py +1 -1
- datahub/sql_parsing/sqlglot_utils.py +1 -4
- datahub/testing/check_sql_parser_result.py +5 -6
- datahub/testing/compare_metadata_json.py +7 -6
- datahub/testing/pytest_hooks.py +56 -0
- datahub/upgrade/upgrade.py +2 -2
- datahub/utilities/file_backed_collections.py +3 -14
- datahub/utilities/ingest_utils.py +106 -0
- datahub/utilities/mapping.py +1 -1
- datahub/utilities/memory_footprint.py +3 -2
- datahub/utilities/sentinels.py +22 -0
- datahub/utilities/unified_diff.py +5 -1
- {acryl_datahub-0.15.0.6rc3.dist-info → acryl_datahub-1.0.0.dist-info}/LICENSE +0 -0
- {acryl_datahub-0.15.0.6rc3.dist-info → acryl_datahub-1.0.0.dist-info}/top_level.txt +0 -0
|
@@ -2010,7 +2010,9 @@
|
|
|
2010
2010
|
"fieldName": "glossaryTerms",
|
|
2011
2011
|
"fieldType": "URN",
|
|
2012
2012
|
"filterNameOverride": "Glossary Term",
|
|
2013
|
-
"hasValuesFieldName": "hasGlossaryTerms"
|
|
2013
|
+
"hasValuesFieldName": "hasGlossaryTerms",
|
|
2014
|
+
"includeSystemModifiedAt": true,
|
|
2015
|
+
"systemModifiedAtFieldName": "termsModifiedAt"
|
|
2014
2016
|
},
|
|
2015
2017
|
"java": {
|
|
2016
2018
|
"class": "com.linkedin.pegasus2avro.common.urn.GlossaryTermUrn"
|
|
@@ -221,7 +221,9 @@
|
|
|
221
221
|
"/terms/*/urn": {
|
|
222
222
|
"boostScore": 0.5,
|
|
223
223
|
"fieldName": "editedFieldGlossaryTerms",
|
|
224
|
-
"fieldType": "URN"
|
|
224
|
+
"fieldType": "URN",
|
|
225
|
+
"includeSystemModifiedAt": true,
|
|
226
|
+
"systemModifiedAtFieldName": "schemaFieldTermsModifiedAt"
|
|
225
227
|
}
|
|
226
228
|
},
|
|
227
229
|
"type": [
|
|
@@ -254,7 +256,9 @@
|
|
|
254
256
|
"fieldName": "glossaryTerms",
|
|
255
257
|
"fieldType": "URN",
|
|
256
258
|
"filterNameOverride": "Glossary Term",
|
|
257
|
-
"hasValuesFieldName": "hasGlossaryTerms"
|
|
259
|
+
"hasValuesFieldName": "hasGlossaryTerms",
|
|
260
|
+
"includeSystemModifiedAt": true,
|
|
261
|
+
"systemModifiedAtFieldName": "termsModifiedAt"
|
|
258
262
|
},
|
|
259
263
|
"java": {
|
|
260
264
|
"class": "com.linkedin.pegasus2avro.common.urn.GlossaryTermUrn"
|
|
@@ -31,6 +31,12 @@
|
|
|
31
31
|
"namespace": "com.linkedin.pegasus2avro.businessattribute",
|
|
32
32
|
"fields": [
|
|
33
33
|
{
|
|
34
|
+
"Searchable": {
|
|
35
|
+
"fieldName": "schemaFieldBusinessAttribute",
|
|
36
|
+
"includeSystemModifiedAt": true,
|
|
37
|
+
"queryByDefault": false,
|
|
38
|
+
"systemModifiedAtFieldName": "schemaFieldBusinessAttributeModifiedAt"
|
|
39
|
+
},
|
|
34
40
|
"java": {
|
|
35
41
|
"class": "com.linkedin.pegasus2avro.common.urn.BusinessAttributeUrn"
|
|
36
42
|
},
|
|
@@ -165,6 +165,19 @@
|
|
|
165
165
|
"name": "countryCode",
|
|
166
166
|
"default": null,
|
|
167
167
|
"doc": "two uppercase letters country code. e.g. US"
|
|
168
|
+
},
|
|
169
|
+
{
|
|
170
|
+
"Searchable": {
|
|
171
|
+
"fieldType": "BOOLEAN",
|
|
172
|
+
"queryByDefault": false
|
|
173
|
+
},
|
|
174
|
+
"type": [
|
|
175
|
+
"boolean",
|
|
176
|
+
"null"
|
|
177
|
+
],
|
|
178
|
+
"name": "system",
|
|
179
|
+
"default": false,
|
|
180
|
+
"doc": "Whether the corpUser is a system user."
|
|
168
181
|
}
|
|
169
182
|
],
|
|
170
183
|
"doc": "Linkedin corp user information"
|
|
@@ -16,7 +16,8 @@
|
|
|
16
16
|
},
|
|
17
17
|
{
|
|
18
18
|
"Searchable": {
|
|
19
|
-
"fieldType": "
|
|
19
|
+
"fieldType": "KEYWORD",
|
|
20
|
+
"queryByDefault": false
|
|
20
21
|
},
|
|
21
22
|
"type": "string",
|
|
22
23
|
"name": "type",
|
|
@@ -83,7 +84,9 @@
|
|
|
83
84
|
},
|
|
84
85
|
{
|
|
85
86
|
"Searchable": {
|
|
86
|
-
"fieldName": "sourceExecutorId"
|
|
87
|
+
"fieldName": "sourceExecutorId",
|
|
88
|
+
"fieldType": "KEYWORD",
|
|
89
|
+
"queryByDefault": false
|
|
87
90
|
},
|
|
88
91
|
"type": [
|
|
89
92
|
"null",
|
|
@@ -129,7 +132,9 @@
|
|
|
129
132
|
"fields": [
|
|
130
133
|
{
|
|
131
134
|
"Searchable": {
|
|
132
|
-
"fieldName": "sourceType"
|
|
135
|
+
"fieldName": "sourceType",
|
|
136
|
+
"fieldType": "KEYWORD",
|
|
137
|
+
"queryByDefault": false
|
|
133
138
|
},
|
|
134
139
|
"type": {
|
|
135
140
|
"type": "enum",
|
|
@@ -13,7 +13,6 @@
|
|
|
13
13
|
"dataset",
|
|
14
14
|
"mlModel"
|
|
15
15
|
],
|
|
16
|
-
"isLineage": true,
|
|
17
16
|
"name": "Consumes"
|
|
18
17
|
}
|
|
19
18
|
},
|
|
@@ -34,6 +33,135 @@
|
|
|
34
33
|
"doc": "Input assets consumed",
|
|
35
34
|
"Urn": "Urn",
|
|
36
35
|
"urn_is_array": true
|
|
36
|
+
},
|
|
37
|
+
{
|
|
38
|
+
"Relationship": {
|
|
39
|
+
"/*/destinationUrn": {
|
|
40
|
+
"createdActor": "inputEdges/*/created/actor",
|
|
41
|
+
"createdOn": "inputEdges/*/created/time",
|
|
42
|
+
"entityTypes": [
|
|
43
|
+
"dataset",
|
|
44
|
+
"mlModel"
|
|
45
|
+
],
|
|
46
|
+
"isLineage": true,
|
|
47
|
+
"name": "DataProcessInstanceConsumes",
|
|
48
|
+
"properties": "inputEdges/*/properties",
|
|
49
|
+
"updatedActor": "inputEdges/*/lastModified/actor",
|
|
50
|
+
"updatedOn": "inputEdges/*/lastModified/time"
|
|
51
|
+
}
|
|
52
|
+
},
|
|
53
|
+
"type": [
|
|
54
|
+
"null",
|
|
55
|
+
{
|
|
56
|
+
"type": "array",
|
|
57
|
+
"items": {
|
|
58
|
+
"type": "record",
|
|
59
|
+
"name": "Edge",
|
|
60
|
+
"namespace": "com.linkedin.pegasus2avro.common",
|
|
61
|
+
"fields": [
|
|
62
|
+
{
|
|
63
|
+
"java": {
|
|
64
|
+
"class": "com.linkedin.pegasus2avro.common.urn.Urn"
|
|
65
|
+
},
|
|
66
|
+
"type": [
|
|
67
|
+
"null",
|
|
68
|
+
"string"
|
|
69
|
+
],
|
|
70
|
+
"name": "sourceUrn",
|
|
71
|
+
"default": null,
|
|
72
|
+
"doc": "Urn of the source of this relationship edge.\nIf not specified, assumed to be the entity that this aspect belongs to.",
|
|
73
|
+
"Urn": "Urn"
|
|
74
|
+
},
|
|
75
|
+
{
|
|
76
|
+
"java": {
|
|
77
|
+
"class": "com.linkedin.pegasus2avro.common.urn.Urn"
|
|
78
|
+
},
|
|
79
|
+
"type": "string",
|
|
80
|
+
"name": "destinationUrn",
|
|
81
|
+
"doc": "Urn of the destination of this relationship edge.",
|
|
82
|
+
"Urn": "Urn"
|
|
83
|
+
},
|
|
84
|
+
{
|
|
85
|
+
"type": [
|
|
86
|
+
"null",
|
|
87
|
+
{
|
|
88
|
+
"type": "record",
|
|
89
|
+
"name": "AuditStamp",
|
|
90
|
+
"namespace": "com.linkedin.pegasus2avro.common",
|
|
91
|
+
"fields": [
|
|
92
|
+
{
|
|
93
|
+
"type": "long",
|
|
94
|
+
"name": "time",
|
|
95
|
+
"doc": "When did the resource/association/sub-resource move into the specific lifecycle stage represented by this AuditEvent."
|
|
96
|
+
},
|
|
97
|
+
{
|
|
98
|
+
"java": {
|
|
99
|
+
"class": "com.linkedin.pegasus2avro.common.urn.Urn"
|
|
100
|
+
},
|
|
101
|
+
"type": "string",
|
|
102
|
+
"name": "actor",
|
|
103
|
+
"doc": "The entity (e.g. a member URN) which will be credited for moving the resource/association/sub-resource into the specific lifecycle stage. It is also the one used to authorize the change.",
|
|
104
|
+
"Urn": "Urn"
|
|
105
|
+
},
|
|
106
|
+
{
|
|
107
|
+
"java": {
|
|
108
|
+
"class": "com.linkedin.pegasus2avro.common.urn.Urn"
|
|
109
|
+
},
|
|
110
|
+
"type": [
|
|
111
|
+
"null",
|
|
112
|
+
"string"
|
|
113
|
+
],
|
|
114
|
+
"name": "impersonator",
|
|
115
|
+
"default": null,
|
|
116
|
+
"doc": "The entity (e.g. a service URN) which performs the change on behalf of the Actor and must be authorized to act as the Actor.",
|
|
117
|
+
"Urn": "Urn"
|
|
118
|
+
},
|
|
119
|
+
{
|
|
120
|
+
"type": [
|
|
121
|
+
"null",
|
|
122
|
+
"string"
|
|
123
|
+
],
|
|
124
|
+
"name": "message",
|
|
125
|
+
"default": null,
|
|
126
|
+
"doc": "Additional context around how DataHub was informed of the particular change. For example: was the change created by an automated process, or manually."
|
|
127
|
+
}
|
|
128
|
+
],
|
|
129
|
+
"doc": "Data captured on a resource/association/sub-resource level giving insight into when that resource/association/sub-resource moved into a particular lifecycle stage, and who acted to move it into that specific lifecycle stage."
|
|
130
|
+
}
|
|
131
|
+
],
|
|
132
|
+
"name": "created",
|
|
133
|
+
"default": null,
|
|
134
|
+
"doc": "Audit stamp containing who created this relationship edge and when"
|
|
135
|
+
},
|
|
136
|
+
{
|
|
137
|
+
"type": [
|
|
138
|
+
"null",
|
|
139
|
+
"com.linkedin.pegasus2avro.common.AuditStamp"
|
|
140
|
+
],
|
|
141
|
+
"name": "lastModified",
|
|
142
|
+
"default": null,
|
|
143
|
+
"doc": "Audit stamp containing who last modified this relationship edge and when"
|
|
144
|
+
},
|
|
145
|
+
{
|
|
146
|
+
"type": [
|
|
147
|
+
"null",
|
|
148
|
+
{
|
|
149
|
+
"type": "map",
|
|
150
|
+
"values": "string"
|
|
151
|
+
}
|
|
152
|
+
],
|
|
153
|
+
"name": "properties",
|
|
154
|
+
"default": null,
|
|
155
|
+
"doc": "A generic properties bag that allows us to store specific information on this graph edge."
|
|
156
|
+
}
|
|
157
|
+
],
|
|
158
|
+
"doc": "A common structure to represent all edges to entities when used inside aspects as collections\nThis ensures that all edges have common structure around audit-stamps and will support PATCH, time-travel automatically."
|
|
159
|
+
}
|
|
160
|
+
}
|
|
161
|
+
],
|
|
162
|
+
"name": "inputEdges",
|
|
163
|
+
"default": null,
|
|
164
|
+
"doc": "Input assets consumed by the data process instance, with additional metadata.\nCounts as lineage.\nWill eventually deprecate the inputs field."
|
|
37
165
|
}
|
|
38
166
|
],
|
|
39
167
|
"doc": "Information about the inputs datasets of a Data process"
|
|
@@ -13,8 +13,6 @@
|
|
|
13
13
|
"dataset",
|
|
14
14
|
"mlModel"
|
|
15
15
|
],
|
|
16
|
-
"isLineage": true,
|
|
17
|
-
"isUpstream": false,
|
|
18
16
|
"name": "Produces"
|
|
19
17
|
}
|
|
20
18
|
},
|
|
@@ -32,9 +30,139 @@
|
|
|
32
30
|
"items": "string"
|
|
33
31
|
},
|
|
34
32
|
"name": "outputs",
|
|
35
|
-
"doc": "Output
|
|
33
|
+
"doc": "Output assets produced",
|
|
36
34
|
"Urn": "Urn",
|
|
37
35
|
"urn_is_array": true
|
|
36
|
+
},
|
|
37
|
+
{
|
|
38
|
+
"Relationship": {
|
|
39
|
+
"/*/destinationUrn": {
|
|
40
|
+
"createdActor": "outputEdges/*/created/actor",
|
|
41
|
+
"createdOn": "outputEdges/*/created/time",
|
|
42
|
+
"entityTypes": [
|
|
43
|
+
"dataset",
|
|
44
|
+
"mlModel"
|
|
45
|
+
],
|
|
46
|
+
"isLineage": true,
|
|
47
|
+
"isUpstream": false,
|
|
48
|
+
"name": "DataProcessInstanceProduces",
|
|
49
|
+
"properties": "outputEdges/*/properties",
|
|
50
|
+
"updatedActor": "outputEdges/*/lastModified/actor",
|
|
51
|
+
"updatedOn": "outputEdges/*/lastModified/time"
|
|
52
|
+
}
|
|
53
|
+
},
|
|
54
|
+
"type": [
|
|
55
|
+
"null",
|
|
56
|
+
{
|
|
57
|
+
"type": "array",
|
|
58
|
+
"items": {
|
|
59
|
+
"type": "record",
|
|
60
|
+
"name": "Edge",
|
|
61
|
+
"namespace": "com.linkedin.pegasus2avro.common",
|
|
62
|
+
"fields": [
|
|
63
|
+
{
|
|
64
|
+
"java": {
|
|
65
|
+
"class": "com.linkedin.pegasus2avro.common.urn.Urn"
|
|
66
|
+
},
|
|
67
|
+
"type": [
|
|
68
|
+
"null",
|
|
69
|
+
"string"
|
|
70
|
+
],
|
|
71
|
+
"name": "sourceUrn",
|
|
72
|
+
"default": null,
|
|
73
|
+
"doc": "Urn of the source of this relationship edge.\nIf not specified, assumed to be the entity that this aspect belongs to.",
|
|
74
|
+
"Urn": "Urn"
|
|
75
|
+
},
|
|
76
|
+
{
|
|
77
|
+
"java": {
|
|
78
|
+
"class": "com.linkedin.pegasus2avro.common.urn.Urn"
|
|
79
|
+
},
|
|
80
|
+
"type": "string",
|
|
81
|
+
"name": "destinationUrn",
|
|
82
|
+
"doc": "Urn of the destination of this relationship edge.",
|
|
83
|
+
"Urn": "Urn"
|
|
84
|
+
},
|
|
85
|
+
{
|
|
86
|
+
"type": [
|
|
87
|
+
"null",
|
|
88
|
+
{
|
|
89
|
+
"type": "record",
|
|
90
|
+
"name": "AuditStamp",
|
|
91
|
+
"namespace": "com.linkedin.pegasus2avro.common",
|
|
92
|
+
"fields": [
|
|
93
|
+
{
|
|
94
|
+
"type": "long",
|
|
95
|
+
"name": "time",
|
|
96
|
+
"doc": "When did the resource/association/sub-resource move into the specific lifecycle stage represented by this AuditEvent."
|
|
97
|
+
},
|
|
98
|
+
{
|
|
99
|
+
"java": {
|
|
100
|
+
"class": "com.linkedin.pegasus2avro.common.urn.Urn"
|
|
101
|
+
},
|
|
102
|
+
"type": "string",
|
|
103
|
+
"name": "actor",
|
|
104
|
+
"doc": "The entity (e.g. a member URN) which will be credited for moving the resource/association/sub-resource into the specific lifecycle stage. It is also the one used to authorize the change.",
|
|
105
|
+
"Urn": "Urn"
|
|
106
|
+
},
|
|
107
|
+
{
|
|
108
|
+
"java": {
|
|
109
|
+
"class": "com.linkedin.pegasus2avro.common.urn.Urn"
|
|
110
|
+
},
|
|
111
|
+
"type": [
|
|
112
|
+
"null",
|
|
113
|
+
"string"
|
|
114
|
+
],
|
|
115
|
+
"name": "impersonator",
|
|
116
|
+
"default": null,
|
|
117
|
+
"doc": "The entity (e.g. a service URN) which performs the change on behalf of the Actor and must be authorized to act as the Actor.",
|
|
118
|
+
"Urn": "Urn"
|
|
119
|
+
},
|
|
120
|
+
{
|
|
121
|
+
"type": [
|
|
122
|
+
"null",
|
|
123
|
+
"string"
|
|
124
|
+
],
|
|
125
|
+
"name": "message",
|
|
126
|
+
"default": null,
|
|
127
|
+
"doc": "Additional context around how DataHub was informed of the particular change. For example: was the change created by an automated process, or manually."
|
|
128
|
+
}
|
|
129
|
+
],
|
|
130
|
+
"doc": "Data captured on a resource/association/sub-resource level giving insight into when that resource/association/sub-resource moved into a particular lifecycle stage, and who acted to move it into that specific lifecycle stage."
|
|
131
|
+
}
|
|
132
|
+
],
|
|
133
|
+
"name": "created",
|
|
134
|
+
"default": null,
|
|
135
|
+
"doc": "Audit stamp containing who created this relationship edge and when"
|
|
136
|
+
},
|
|
137
|
+
{
|
|
138
|
+
"type": [
|
|
139
|
+
"null",
|
|
140
|
+
"com.linkedin.pegasus2avro.common.AuditStamp"
|
|
141
|
+
],
|
|
142
|
+
"name": "lastModified",
|
|
143
|
+
"default": null,
|
|
144
|
+
"doc": "Audit stamp containing who last modified this relationship edge and when"
|
|
145
|
+
},
|
|
146
|
+
{
|
|
147
|
+
"type": [
|
|
148
|
+
"null",
|
|
149
|
+
{
|
|
150
|
+
"type": "map",
|
|
151
|
+
"values": "string"
|
|
152
|
+
}
|
|
153
|
+
],
|
|
154
|
+
"name": "properties",
|
|
155
|
+
"default": null,
|
|
156
|
+
"doc": "A generic properties bag that allows us to store specific information on this graph edge."
|
|
157
|
+
}
|
|
158
|
+
],
|
|
159
|
+
"doc": "A common structure to represent all edges to entities when used inside aspects as collections\nThis ensures that all edges have common structure around audit-stamps and will support PATCH, time-travel automatically."
|
|
160
|
+
}
|
|
161
|
+
}
|
|
162
|
+
],
|
|
163
|
+
"name": "outputEdges",
|
|
164
|
+
"default": null,
|
|
165
|
+
"doc": "Output assets produced by the data process instance during processing, with additional metadata.\nCounts as lineage.\nWill eventually deprecate the outputs field."
|
|
38
166
|
}
|
|
39
167
|
],
|
|
40
168
|
"doc": "Information about the outputs of a Data process"
|
|
@@ -303,7 +303,9 @@
|
|
|
303
303
|
"/terms/*/urn": {
|
|
304
304
|
"boostScore": 0.5,
|
|
305
305
|
"fieldName": "editedFieldGlossaryTerms",
|
|
306
|
-
"fieldType": "URN"
|
|
306
|
+
"fieldType": "URN",
|
|
307
|
+
"includeSystemModifiedAt": true,
|
|
308
|
+
"systemModifiedAtFieldName": "schemaFieldTermsModifiedAt"
|
|
307
309
|
}
|
|
308
310
|
},
|
|
309
311
|
"type": [
|
|
@@ -336,7 +338,9 @@
|
|
|
336
338
|
"fieldName": "glossaryTerms",
|
|
337
339
|
"fieldType": "URN",
|
|
338
340
|
"filterNameOverride": "Glossary Term",
|
|
339
|
-
"hasValuesFieldName": "hasGlossaryTerms"
|
|
341
|
+
"hasValuesFieldName": "hasGlossaryTerms",
|
|
342
|
+
"includeSystemModifiedAt": true,
|
|
343
|
+
"systemModifiedAtFieldName": "termsModifiedAt"
|
|
340
344
|
},
|
|
341
345
|
"java": {
|
|
342
346
|
"class": "com.linkedin.pegasus2avro.common.urn.GlossaryTermUrn"
|
|
@@ -26,7 +26,9 @@
|
|
|
26
26
|
"fieldName": "glossaryTerms",
|
|
27
27
|
"fieldType": "URN",
|
|
28
28
|
"filterNameOverride": "Glossary Term",
|
|
29
|
-
"hasValuesFieldName": "hasGlossaryTerms"
|
|
29
|
+
"hasValuesFieldName": "hasGlossaryTerms",
|
|
30
|
+
"includeSystemModifiedAt": true,
|
|
31
|
+
"systemModifiedAtFieldName": "termsModifiedAt"
|
|
30
32
|
},
|
|
31
33
|
"java": {
|
|
32
34
|
"class": "com.linkedin.pegasus2avro.common.urn.GlossaryTermUrn"
|