acryl-datahub 0.15.0.1rc17__py3-none-any.whl → 0.15.0.2__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of acryl-datahub might be problematic. Click here for more details.
- {acryl_datahub-0.15.0.1rc17.dist-info → acryl_datahub-0.15.0.2.dist-info}/METADATA +2440 -2438
- {acryl_datahub-0.15.0.1rc17.dist-info → acryl_datahub-0.15.0.2.dist-info}/RECORD +211 -207
- {acryl_datahub-0.15.0.1rc17.dist-info → acryl_datahub-0.15.0.2.dist-info}/WHEEL +1 -1
- datahub/__init__.py +1 -1
- datahub/api/entities/assertion/assertion_operator.py +3 -5
- datahub/api/entities/corpgroup/corpgroup.py +1 -1
- datahub/api/entities/datacontract/assertion_operator.py +3 -5
- datahub/api/entities/dataproduct/dataproduct.py +4 -4
- datahub/api/entities/dataset/dataset.py +2 -1
- datahub/api/entities/structuredproperties/structuredproperties.py +18 -7
- datahub/cli/cli_utils.py +13 -2
- datahub/cli/delete_cli.py +3 -3
- datahub/cli/docker_cli.py +6 -6
- datahub/cli/ingest_cli.py +25 -15
- datahub/cli/lite_cli.py +2 -2
- datahub/cli/migrate.py +5 -5
- datahub/cli/specific/assertions_cli.py +3 -3
- datahub/cli/specific/structuredproperties_cli.py +84 -0
- datahub/cli/timeline_cli.py +1 -1
- datahub/configuration/common.py +1 -2
- datahub/configuration/config_loader.py +73 -50
- datahub/configuration/git.py +2 -2
- datahub/configuration/time_window_config.py +10 -5
- datahub/emitter/mce_builder.py +4 -8
- datahub/emitter/mcp_builder.py +27 -0
- datahub/emitter/mcp_patch_builder.py +1 -2
- datahub/emitter/rest_emitter.py +126 -85
- datahub/entrypoints.py +6 -0
- datahub/ingestion/api/incremental_lineage_helper.py +2 -8
- datahub/ingestion/api/report.py +1 -2
- datahub/ingestion/api/source.py +4 -2
- datahub/ingestion/api/source_helpers.py +1 -1
- datahub/ingestion/extractor/json_schema_util.py +3 -3
- datahub/ingestion/extractor/schema_util.py +3 -5
- datahub/ingestion/fs/s3_fs.py +3 -3
- datahub/ingestion/glossary/datahub_classifier.py +6 -4
- datahub/ingestion/graph/client.py +22 -19
- datahub/ingestion/graph/config.py +1 -1
- datahub/ingestion/run/pipeline.py +8 -7
- datahub/ingestion/run/pipeline_config.py +3 -3
- datahub/ingestion/source/abs/datalake_profiler_config.py +3 -3
- datahub/ingestion/source/abs/source.py +19 -8
- datahub/ingestion/source/aws/glue.py +77 -47
- datahub/ingestion/source/aws/s3_boto_utils.py +3 -3
- datahub/ingestion/source/aws/s3_util.py +24 -1
- datahub/ingestion/source/aws/sagemaker_processors/feature_groups.py +1 -1
- datahub/ingestion/source/aws/sagemaker_processors/models.py +2 -2
- datahub/ingestion/source/bigquery_v2/bigquery.py +34 -34
- datahub/ingestion/source/bigquery_v2/bigquery_audit.py +3 -3
- datahub/ingestion/source/bigquery_v2/bigquery_config.py +14 -6
- datahub/ingestion/source/bigquery_v2/bigquery_platform_resource_helper.py +8 -4
- datahub/ingestion/source/bigquery_v2/bigquery_report.py +0 -3
- datahub/ingestion/source/bigquery_v2/bigquery_schema_gen.py +22 -16
- datahub/ingestion/source/bigquery_v2/lineage.py +16 -16
- datahub/ingestion/source/bigquery_v2/queries.py +1 -3
- datahub/ingestion/source/bigquery_v2/queries_extractor.py +3 -3
- datahub/ingestion/source/bigquery_v2/usage.py +60 -60
- datahub/ingestion/source/cassandra/cassandra.py +0 -1
- datahub/ingestion/source/cassandra/cassandra_profiling.py +24 -24
- datahub/ingestion/source/cassandra/cassandra_utils.py +4 -7
- datahub/ingestion/source/confluent_schema_registry.py +6 -6
- datahub/ingestion/source/csv_enricher.py +29 -29
- datahub/ingestion/source/datahub/config.py +10 -0
- datahub/ingestion/source/datahub/datahub_database_reader.py +4 -2
- datahub/ingestion/source/datahub/datahub_source.py +12 -2
- datahub/ingestion/source/dbt/dbt_cloud.py +13 -13
- datahub/ingestion/source/dbt/dbt_common.py +9 -7
- datahub/ingestion/source/delta_lake/source.py +0 -5
- datahub/ingestion/source/demo_data.py +1 -1
- datahub/ingestion/source/dremio/dremio_api.py +4 -4
- datahub/ingestion/source/dremio/dremio_datahub_source_mapping.py +3 -3
- datahub/ingestion/source/dremio/dremio_reporting.py +0 -3
- datahub/ingestion/source/dremio/dremio_source.py +2 -2
- datahub/ingestion/source/elastic_search.py +4 -4
- datahub/ingestion/source/fivetran/fivetran.py +1 -6
- datahub/ingestion/source/gc/datahub_gc.py +11 -14
- datahub/ingestion/source/gc/execution_request_cleanup.py +31 -6
- datahub/ingestion/source/gc/soft_deleted_entity_cleanup.py +48 -15
- datahub/ingestion/source/gcs/gcs_source.py +3 -2
- datahub/ingestion/source/ge_data_profiler.py +2 -5
- datahub/ingestion/source/ge_profiling_config.py +3 -3
- datahub/ingestion/source/iceberg/iceberg.py +13 -6
- datahub/ingestion/source/iceberg/iceberg_common.py +49 -9
- datahub/ingestion/source/iceberg/iceberg_profiler.py +3 -1
- datahub/ingestion/source/identity/azure_ad.py +3 -3
- datahub/ingestion/source/identity/okta.py +3 -3
- datahub/ingestion/source/kafka/kafka.py +11 -9
- datahub/ingestion/source/kafka_connect/kafka_connect.py +3 -9
- datahub/ingestion/source/kafka_connect/sink_connectors.py +3 -3
- datahub/ingestion/source/kafka_connect/source_connectors.py +3 -3
- datahub/ingestion/source/looker/looker_common.py +19 -19
- datahub/ingestion/source/looker/looker_config.py +11 -6
- datahub/ingestion/source/looker/looker_source.py +25 -25
- datahub/ingestion/source/looker/looker_template_language.py +3 -3
- datahub/ingestion/source/looker/looker_usage.py +5 -7
- datahub/ingestion/source/looker/lookml_concept_context.py +6 -6
- datahub/ingestion/source/looker/lookml_source.py +13 -15
- datahub/ingestion/source/looker/view_upstream.py +5 -5
- datahub/ingestion/source/metabase.py +1 -6
- datahub/ingestion/source/mlflow.py +4 -9
- datahub/ingestion/source/mode.py +5 -5
- datahub/ingestion/source/mongodb.py +6 -4
- datahub/ingestion/source/neo4j/neo4j_source.py +1 -1
- datahub/ingestion/source/nifi.py +24 -31
- datahub/ingestion/source/openapi.py +9 -9
- datahub/ingestion/source/powerbi/config.py +12 -12
- datahub/ingestion/source/powerbi/m_query/parser.py +11 -11
- datahub/ingestion/source/powerbi/m_query/pattern_handler.py +26 -24
- datahub/ingestion/source/powerbi/m_query/resolver.py +13 -13
- datahub/ingestion/source/powerbi/powerbi.py +6 -6
- datahub/ingestion/source/powerbi/rest_api_wrapper/data_resolver.py +9 -9
- datahub/ingestion/source/powerbi/rest_api_wrapper/powerbi_api.py +7 -7
- datahub/ingestion/source/powerbi_report_server/report_server.py +1 -1
- datahub/ingestion/source/qlik_sense/qlik_api.py +1 -1
- datahub/ingestion/source/redash.py +0 -5
- datahub/ingestion/source/redshift/config.py +3 -3
- datahub/ingestion/source/redshift/redshift.py +45 -46
- datahub/ingestion/source/redshift/usage.py +33 -33
- datahub/ingestion/source/s3/datalake_profiler_config.py +3 -3
- datahub/ingestion/source/s3/source.py +11 -15
- datahub/ingestion/source/salesforce.py +26 -25
- datahub/ingestion/source/schema/json_schema.py +1 -1
- datahub/ingestion/source/sigma/sigma.py +3 -3
- datahub/ingestion/source/sigma/sigma_api.py +12 -10
- datahub/ingestion/source/snowflake/snowflake_config.py +30 -7
- datahub/ingestion/source/snowflake/snowflake_connection.py +6 -6
- datahub/ingestion/source/snowflake/snowflake_queries.py +2 -2
- datahub/ingestion/source/snowflake/snowflake_report.py +0 -3
- datahub/ingestion/source/snowflake/snowflake_schema.py +8 -5
- datahub/ingestion/source/snowflake/snowflake_schema_gen.py +136 -42
- datahub/ingestion/source/snowflake/snowflake_tag.py +21 -11
- datahub/ingestion/source/snowflake/snowflake_usage_v2.py +49 -50
- datahub/ingestion/source/snowflake/snowflake_utils.py +1 -2
- datahub/ingestion/source/snowflake/snowflake_v2.py +51 -47
- datahub/ingestion/source/sql/athena.py +1 -3
- datahub/ingestion/source/sql/clickhouse.py +8 -14
- datahub/ingestion/source/sql/oracle.py +1 -3
- datahub/ingestion/source/sql/sql_generic_profiler.py +1 -2
- datahub/ingestion/source/sql/sql_types.py +1 -2
- datahub/ingestion/source/sql/sql_utils.py +5 -0
- datahub/ingestion/source/sql/teradata.py +18 -5
- datahub/ingestion/source/state/profiling_state_handler.py +3 -3
- datahub/ingestion/source/state/redundant_run_skip_handler.py +5 -7
- datahub/ingestion/source/state/stale_entity_removal_handler.py +3 -3
- datahub/ingestion/source/state_provider/datahub_ingestion_checkpointing_provider.py +9 -9
- datahub/ingestion/source/state_provider/file_ingestion_checkpointing_provider.py +1 -1
- datahub/ingestion/source/superset.py +1 -6
- datahub/ingestion/source/tableau/tableau.py +343 -117
- datahub/ingestion/source/tableau/tableau_common.py +5 -2
- datahub/ingestion/source/unity/config.py +3 -1
- datahub/ingestion/source/unity/proxy.py +1 -1
- datahub/ingestion/source/unity/source.py +74 -74
- datahub/ingestion/source/unity/usage.py +3 -1
- datahub/ingestion/source/usage/clickhouse_usage.py +4 -4
- datahub/ingestion/source/usage/starburst_trino_usage.py +3 -3
- datahub/ingestion/source/usage/usage_common.py +1 -1
- datahub/ingestion/source_report/ingestion_stage.py +24 -20
- datahub/ingestion/transformer/add_dataset_dataproduct.py +4 -4
- datahub/ingestion/transformer/add_dataset_properties.py +3 -3
- datahub/ingestion/transformer/add_dataset_schema_tags.py +3 -3
- datahub/ingestion/transformer/add_dataset_schema_terms.py +3 -3
- datahub/ingestion/transformer/dataset_domain_based_on_tags.py +4 -4
- datahub/ingestion/transformer/extract_ownership_from_tags.py +3 -3
- datahub/ingestion/transformer/tags_to_terms.py +7 -7
- datahub/integrations/assertion/snowflake/compiler.py +10 -10
- datahub/lite/duckdb_lite.py +12 -10
- datahub/metadata/_schema_classes.py +317 -44
- datahub/metadata/_urns/urn_defs.py +69 -15
- datahub/metadata/com/linkedin/pegasus2avro/common/__init__.py +2 -0
- datahub/metadata/com/linkedin/pegasus2avro/metadata/key/__init__.py +2 -0
- datahub/metadata/com/linkedin/pegasus2avro/versionset/__init__.py +17 -0
- datahub/metadata/schema.avsc +302 -89
- datahub/metadata/schemas/DataFlowKey.avsc +1 -0
- datahub/metadata/schemas/DataJobKey.avsc +1 -0
- datahub/metadata/schemas/DataProcessInstanceInput.avsc +4 -2
- datahub/metadata/schemas/DataProcessInstanceOutput.avsc +2 -0
- datahub/metadata/schemas/DatasetKey.avsc +2 -1
- datahub/metadata/schemas/MLFeatureProperties.avsc +51 -0
- datahub/metadata/schemas/MLModelDeploymentProperties.avsc +51 -0
- datahub/metadata/schemas/MLModelGroupProperties.avsc +96 -23
- datahub/metadata/schemas/MLModelKey.avsc +2 -1
- datahub/metadata/schemas/MLModelProperties.avsc +96 -48
- datahub/metadata/schemas/MLPrimaryKeyProperties.avsc +51 -0
- datahub/metadata/schemas/MetadataChangeEvent.avsc +98 -71
- datahub/metadata/schemas/VersionProperties.avsc +216 -0
- datahub/metadata/schemas/VersionSetKey.avsc +26 -0
- datahub/metadata/schemas/VersionSetProperties.avsc +49 -0
- datahub/secret/datahub_secrets_client.py +12 -21
- datahub/secret/secret_common.py +14 -8
- datahub/specific/aspect_helpers/custom_properties.py +1 -2
- datahub/sql_parsing/schema_resolver.py +5 -10
- datahub/sql_parsing/sql_parsing_aggregator.py +18 -16
- datahub/sql_parsing/sqlglot_lineage.py +3 -3
- datahub/sql_parsing/sqlglot_utils.py +1 -1
- datahub/telemetry/stats.py +1 -2
- datahub/testing/mcp_diff.py +1 -1
- datahub/utilities/file_backed_collections.py +11 -11
- datahub/utilities/hive_schema_to_avro.py +2 -2
- datahub/utilities/logging_manager.py +2 -2
- datahub/utilities/lossy_collections.py +3 -3
- datahub/utilities/mapping.py +3 -3
- datahub/utilities/memory_footprint.py +3 -2
- datahub/utilities/perf_timer.py +11 -6
- datahub/utilities/serialized_lru_cache.py +3 -1
- datahub/utilities/sqlalchemy_query_combiner.py +6 -6
- datahub/utilities/sqllineage_patch.py +1 -1
- datahub/utilities/stats_collections.py +3 -1
- datahub/utilities/urns/_urn_base.py +28 -5
- datahub/utilities/urns/urn_iter.py +2 -2
- {acryl_datahub-0.15.0.1rc17.dist-info → acryl_datahub-0.15.0.2.dist-info}/entry_points.txt +0 -0
- {acryl_datahub-0.15.0.1rc17.dist-info → acryl_datahub-0.15.0.2.dist-info}/top_level.txt +0 -0
|
@@ -10,8 +10,10 @@
|
|
|
10
10
|
"Relationship": {
|
|
11
11
|
"/*": {
|
|
12
12
|
"entityTypes": [
|
|
13
|
-
"dataset"
|
|
13
|
+
"dataset",
|
|
14
|
+
"mlModel"
|
|
14
15
|
],
|
|
16
|
+
"isLineage": true,
|
|
15
17
|
"name": "Consumes"
|
|
16
18
|
}
|
|
17
19
|
},
|
|
@@ -29,7 +31,7 @@
|
|
|
29
31
|
"items": "string"
|
|
30
32
|
},
|
|
31
33
|
"name": "inputs",
|
|
32
|
-
"doc": "Input
|
|
34
|
+
"doc": "Input assets consumed",
|
|
33
35
|
"Urn": "Urn",
|
|
34
36
|
"urn_is_array": true
|
|
35
37
|
}
|
|
@@ -35,7 +35,8 @@
|
|
|
35
35
|
"access",
|
|
36
36
|
"structuredProperties",
|
|
37
37
|
"forms",
|
|
38
|
-
"partitionsSummary"
|
|
38
|
+
"partitionsSummary",
|
|
39
|
+
"versionProperties"
|
|
39
40
|
],
|
|
40
41
|
"entityDoc": "Datasets represent logical or physical data assets stored or represented in various data platforms. Tables, Views, Streams are all instances of datasets."
|
|
41
42
|
},
|
|
@@ -101,6 +101,57 @@
|
|
|
101
101
|
],
|
|
102
102
|
"name": "versionTag",
|
|
103
103
|
"default": null
|
|
104
|
+
},
|
|
105
|
+
{
|
|
106
|
+
"type": [
|
|
107
|
+
"null",
|
|
108
|
+
{
|
|
109
|
+
"type": "record",
|
|
110
|
+
"name": "MetadataAttribution",
|
|
111
|
+
"namespace": "com.linkedin.pegasus2avro.common",
|
|
112
|
+
"fields": [
|
|
113
|
+
{
|
|
114
|
+
"type": "long",
|
|
115
|
+
"name": "time",
|
|
116
|
+
"doc": "When this metadata was updated."
|
|
117
|
+
},
|
|
118
|
+
{
|
|
119
|
+
"java": {
|
|
120
|
+
"class": "com.linkedin.pegasus2avro.common.urn.Urn"
|
|
121
|
+
},
|
|
122
|
+
"type": "string",
|
|
123
|
+
"name": "actor",
|
|
124
|
+
"doc": "The entity (e.g. a member URN) responsible for applying the assocated metadata. This can\neither be a user (in case of UI edits) or the datahub system for automation.",
|
|
125
|
+
"Urn": "Urn"
|
|
126
|
+
},
|
|
127
|
+
{
|
|
128
|
+
"java": {
|
|
129
|
+
"class": "com.linkedin.pegasus2avro.common.urn.Urn"
|
|
130
|
+
},
|
|
131
|
+
"type": [
|
|
132
|
+
"null",
|
|
133
|
+
"string"
|
|
134
|
+
],
|
|
135
|
+
"name": "source",
|
|
136
|
+
"default": null,
|
|
137
|
+
"doc": "The DataHub source responsible for applying the associated metadata. This will only be filled out\nwhen a DataHub source is responsible. This includes the specific metadata test urn, the automation urn.",
|
|
138
|
+
"Urn": "Urn"
|
|
139
|
+
},
|
|
140
|
+
{
|
|
141
|
+
"type": {
|
|
142
|
+
"type": "map",
|
|
143
|
+
"values": "string"
|
|
144
|
+
},
|
|
145
|
+
"name": "sourceDetail",
|
|
146
|
+
"default": {},
|
|
147
|
+
"doc": "The details associated with why this metadata was applied. For example, this could include\nthe actual regex rule, sql statement, ingestion pipeline ID, etc."
|
|
148
|
+
}
|
|
149
|
+
],
|
|
150
|
+
"doc": "Information about who, why, and how this metadata was applied"
|
|
151
|
+
}
|
|
152
|
+
],
|
|
153
|
+
"name": "metadataAttribution",
|
|
154
|
+
"default": null
|
|
104
155
|
}
|
|
105
156
|
],
|
|
106
157
|
"doc": "A resource-defined string representing the resource state for the purpose of concurrency control"
|
|
@@ -74,6 +74,57 @@
|
|
|
74
74
|
],
|
|
75
75
|
"name": "versionTag",
|
|
76
76
|
"default": null
|
|
77
|
+
},
|
|
78
|
+
{
|
|
79
|
+
"type": [
|
|
80
|
+
"null",
|
|
81
|
+
{
|
|
82
|
+
"type": "record",
|
|
83
|
+
"name": "MetadataAttribution",
|
|
84
|
+
"namespace": "com.linkedin.pegasus2avro.common",
|
|
85
|
+
"fields": [
|
|
86
|
+
{
|
|
87
|
+
"type": "long",
|
|
88
|
+
"name": "time",
|
|
89
|
+
"doc": "When this metadata was updated."
|
|
90
|
+
},
|
|
91
|
+
{
|
|
92
|
+
"java": {
|
|
93
|
+
"class": "com.linkedin.pegasus2avro.common.urn.Urn"
|
|
94
|
+
},
|
|
95
|
+
"type": "string",
|
|
96
|
+
"name": "actor",
|
|
97
|
+
"doc": "The entity (e.g. a member URN) responsible for applying the assocated metadata. This can\neither be a user (in case of UI edits) or the datahub system for automation.",
|
|
98
|
+
"Urn": "Urn"
|
|
99
|
+
},
|
|
100
|
+
{
|
|
101
|
+
"java": {
|
|
102
|
+
"class": "com.linkedin.pegasus2avro.common.urn.Urn"
|
|
103
|
+
},
|
|
104
|
+
"type": [
|
|
105
|
+
"null",
|
|
106
|
+
"string"
|
|
107
|
+
],
|
|
108
|
+
"name": "source",
|
|
109
|
+
"default": null,
|
|
110
|
+
"doc": "The DataHub source responsible for applying the associated metadata. This will only be filled out\nwhen a DataHub source is responsible. This includes the specific metadata test urn, the automation urn.",
|
|
111
|
+
"Urn": "Urn"
|
|
112
|
+
},
|
|
113
|
+
{
|
|
114
|
+
"type": {
|
|
115
|
+
"type": "map",
|
|
116
|
+
"values": "string"
|
|
117
|
+
},
|
|
118
|
+
"name": "sourceDetail",
|
|
119
|
+
"default": {},
|
|
120
|
+
"doc": "The details associated with why this metadata was applied. For example, this could include\nthe actual regex rule, sql statement, ingestion pipeline ID, etc."
|
|
121
|
+
}
|
|
122
|
+
],
|
|
123
|
+
"doc": "Information about who, why, and how this metadata was applied"
|
|
124
|
+
}
|
|
125
|
+
],
|
|
126
|
+
"name": "metadataAttribution",
|
|
127
|
+
"default": null
|
|
77
128
|
}
|
|
78
129
|
],
|
|
79
130
|
"doc": "A resource-defined string representing the resource state for the purpose of concurrency control"
|
|
@@ -21,6 +21,51 @@
|
|
|
21
21
|
"default": {},
|
|
22
22
|
"doc": "Custom property bag."
|
|
23
23
|
},
|
|
24
|
+
{
|
|
25
|
+
"Relationship": {
|
|
26
|
+
"/*": {
|
|
27
|
+
"entityTypes": [
|
|
28
|
+
"dataJob",
|
|
29
|
+
"dataProcessInstance"
|
|
30
|
+
],
|
|
31
|
+
"isLineage": true,
|
|
32
|
+
"name": "TrainedBy"
|
|
33
|
+
}
|
|
34
|
+
},
|
|
35
|
+
"type": [
|
|
36
|
+
"null",
|
|
37
|
+
{
|
|
38
|
+
"type": "array",
|
|
39
|
+
"items": "string"
|
|
40
|
+
}
|
|
41
|
+
],
|
|
42
|
+
"name": "trainingJobs",
|
|
43
|
+
"default": null,
|
|
44
|
+
"doc": "List of jobs or process instances (if any) used to train the model or group. Visible in Lineage. Note that ML Models can also be specified as the output of a specific Data Process Instances (runs) via the DataProcessInstanceOutputs aspect."
|
|
45
|
+
},
|
|
46
|
+
{
|
|
47
|
+
"Relationship": {
|
|
48
|
+
"/*": {
|
|
49
|
+
"entityTypes": [
|
|
50
|
+
"dataJob",
|
|
51
|
+
"dataProcessInstance"
|
|
52
|
+
],
|
|
53
|
+
"isLineage": true,
|
|
54
|
+
"isUpstream": false,
|
|
55
|
+
"name": "UsedBy"
|
|
56
|
+
}
|
|
57
|
+
},
|
|
58
|
+
"type": [
|
|
59
|
+
"null",
|
|
60
|
+
{
|
|
61
|
+
"type": "array",
|
|
62
|
+
"items": "string"
|
|
63
|
+
}
|
|
64
|
+
],
|
|
65
|
+
"name": "downstreamJobs",
|
|
66
|
+
"default": null,
|
|
67
|
+
"doc": "List of jobs or process instances (if any) that use the model or group."
|
|
68
|
+
},
|
|
24
69
|
{
|
|
25
70
|
"Searchable": {
|
|
26
71
|
"boostScore": 10.0,
|
|
@@ -102,29 +147,6 @@
|
|
|
102
147
|
"default": null,
|
|
103
148
|
"doc": "Date when the MLModelGroup was last modified"
|
|
104
149
|
},
|
|
105
|
-
{
|
|
106
|
-
"Relationship": {
|
|
107
|
-
"/*": {
|
|
108
|
-
"entityTypes": [
|
|
109
|
-
"dataJob"
|
|
110
|
-
],
|
|
111
|
-
"isLineage": true,
|
|
112
|
-
"name": "TrainedBy"
|
|
113
|
-
}
|
|
114
|
-
},
|
|
115
|
-
"type": [
|
|
116
|
-
"null",
|
|
117
|
-
{
|
|
118
|
-
"type": "array",
|
|
119
|
-
"items": "string"
|
|
120
|
-
}
|
|
121
|
-
],
|
|
122
|
-
"name": "trainingJobs",
|
|
123
|
-
"default": null,
|
|
124
|
-
"doc": "List of jobs (if any) used to train the model group. Visible in Lineage.",
|
|
125
|
-
"Urn": "Urn",
|
|
126
|
-
"urn_is_array": true
|
|
127
|
-
},
|
|
128
150
|
{
|
|
129
151
|
"type": [
|
|
130
152
|
"null",
|
|
@@ -140,6 +162,57 @@
|
|
|
140
162
|
],
|
|
141
163
|
"name": "versionTag",
|
|
142
164
|
"default": null
|
|
165
|
+
},
|
|
166
|
+
{
|
|
167
|
+
"type": [
|
|
168
|
+
"null",
|
|
169
|
+
{
|
|
170
|
+
"type": "record",
|
|
171
|
+
"name": "MetadataAttribution",
|
|
172
|
+
"namespace": "com.linkedin.pegasus2avro.common",
|
|
173
|
+
"fields": [
|
|
174
|
+
{
|
|
175
|
+
"type": "long",
|
|
176
|
+
"name": "time",
|
|
177
|
+
"doc": "When this metadata was updated."
|
|
178
|
+
},
|
|
179
|
+
{
|
|
180
|
+
"java": {
|
|
181
|
+
"class": "com.linkedin.pegasus2avro.common.urn.Urn"
|
|
182
|
+
},
|
|
183
|
+
"type": "string",
|
|
184
|
+
"name": "actor",
|
|
185
|
+
"doc": "The entity (e.g. a member URN) responsible for applying the assocated metadata. This can\neither be a user (in case of UI edits) or the datahub system for automation.",
|
|
186
|
+
"Urn": "Urn"
|
|
187
|
+
},
|
|
188
|
+
{
|
|
189
|
+
"java": {
|
|
190
|
+
"class": "com.linkedin.pegasus2avro.common.urn.Urn"
|
|
191
|
+
},
|
|
192
|
+
"type": [
|
|
193
|
+
"null",
|
|
194
|
+
"string"
|
|
195
|
+
],
|
|
196
|
+
"name": "source",
|
|
197
|
+
"default": null,
|
|
198
|
+
"doc": "The DataHub source responsible for applying the associated metadata. This will only be filled out\nwhen a DataHub source is responsible. This includes the specific metadata test urn, the automation urn.",
|
|
199
|
+
"Urn": "Urn"
|
|
200
|
+
},
|
|
201
|
+
{
|
|
202
|
+
"type": {
|
|
203
|
+
"type": "map",
|
|
204
|
+
"values": "string"
|
|
205
|
+
},
|
|
206
|
+
"name": "sourceDetail",
|
|
207
|
+
"default": {},
|
|
208
|
+
"doc": "The details associated with why this metadata was applied. For example, this could include\nthe actual regex rule, sql statement, ingestion pipeline ID, etc."
|
|
209
|
+
}
|
|
210
|
+
],
|
|
211
|
+
"doc": "Information about who, why, and how this metadata was applied"
|
|
212
|
+
}
|
|
213
|
+
],
|
|
214
|
+
"name": "metadataAttribution",
|
|
215
|
+
"default": null
|
|
143
216
|
}
|
|
144
217
|
],
|
|
145
218
|
"doc": "A resource-defined string representing the resource state for the purpose of concurrency control"
|
|
@@ -37,6 +37,51 @@
|
|
|
37
37
|
"default": null,
|
|
38
38
|
"doc": "URL where the reference exist"
|
|
39
39
|
},
|
|
40
|
+
{
|
|
41
|
+
"Relationship": {
|
|
42
|
+
"/*": {
|
|
43
|
+
"entityTypes": [
|
|
44
|
+
"dataJob",
|
|
45
|
+
"dataProcessInstance"
|
|
46
|
+
],
|
|
47
|
+
"isLineage": true,
|
|
48
|
+
"name": "TrainedBy"
|
|
49
|
+
}
|
|
50
|
+
},
|
|
51
|
+
"type": [
|
|
52
|
+
"null",
|
|
53
|
+
{
|
|
54
|
+
"type": "array",
|
|
55
|
+
"items": "string"
|
|
56
|
+
}
|
|
57
|
+
],
|
|
58
|
+
"name": "trainingJobs",
|
|
59
|
+
"default": null,
|
|
60
|
+
"doc": "List of jobs or process instances (if any) used to train the model or group. Visible in Lineage. Note that ML Models can also be specified as the output of a specific Data Process Instances (runs) via the DataProcessInstanceOutputs aspect."
|
|
61
|
+
},
|
|
62
|
+
{
|
|
63
|
+
"Relationship": {
|
|
64
|
+
"/*": {
|
|
65
|
+
"entityTypes": [
|
|
66
|
+
"dataJob",
|
|
67
|
+
"dataProcessInstance"
|
|
68
|
+
],
|
|
69
|
+
"isLineage": true,
|
|
70
|
+
"isUpstream": false,
|
|
71
|
+
"name": "UsedBy"
|
|
72
|
+
}
|
|
73
|
+
},
|
|
74
|
+
"type": [
|
|
75
|
+
"null",
|
|
76
|
+
{
|
|
77
|
+
"type": "array",
|
|
78
|
+
"items": "string"
|
|
79
|
+
}
|
|
80
|
+
],
|
|
81
|
+
"name": "downstreamJobs",
|
|
82
|
+
"default": null,
|
|
83
|
+
"doc": "List of jobs or process instances (if any) that use the model or group."
|
|
84
|
+
},
|
|
40
85
|
{
|
|
41
86
|
"Searchable": {
|
|
42
87
|
"boostScore": 10.0,
|
|
@@ -133,6 +178,57 @@
|
|
|
133
178
|
],
|
|
134
179
|
"name": "versionTag",
|
|
135
180
|
"default": null
|
|
181
|
+
},
|
|
182
|
+
{
|
|
183
|
+
"type": [
|
|
184
|
+
"null",
|
|
185
|
+
{
|
|
186
|
+
"type": "record",
|
|
187
|
+
"name": "MetadataAttribution",
|
|
188
|
+
"namespace": "com.linkedin.pegasus2avro.common",
|
|
189
|
+
"fields": [
|
|
190
|
+
{
|
|
191
|
+
"type": "long",
|
|
192
|
+
"name": "time",
|
|
193
|
+
"doc": "When this metadata was updated."
|
|
194
|
+
},
|
|
195
|
+
{
|
|
196
|
+
"java": {
|
|
197
|
+
"class": "com.linkedin.pegasus2avro.common.urn.Urn"
|
|
198
|
+
},
|
|
199
|
+
"type": "string",
|
|
200
|
+
"name": "actor",
|
|
201
|
+
"doc": "The entity (e.g. a member URN) responsible for applying the assocated metadata. This can\neither be a user (in case of UI edits) or the datahub system for automation.",
|
|
202
|
+
"Urn": "Urn"
|
|
203
|
+
},
|
|
204
|
+
{
|
|
205
|
+
"java": {
|
|
206
|
+
"class": "com.linkedin.pegasus2avro.common.urn.Urn"
|
|
207
|
+
},
|
|
208
|
+
"type": [
|
|
209
|
+
"null",
|
|
210
|
+
"string"
|
|
211
|
+
],
|
|
212
|
+
"name": "source",
|
|
213
|
+
"default": null,
|
|
214
|
+
"doc": "The DataHub source responsible for applying the associated metadata. This will only be filled out\nwhen a DataHub source is responsible. This includes the specific metadata test urn, the automation urn.",
|
|
215
|
+
"Urn": "Urn"
|
|
216
|
+
},
|
|
217
|
+
{
|
|
218
|
+
"type": {
|
|
219
|
+
"type": "map",
|
|
220
|
+
"values": "string"
|
|
221
|
+
},
|
|
222
|
+
"name": "sourceDetail",
|
|
223
|
+
"default": {},
|
|
224
|
+
"doc": "The details associated with why this metadata was applied. For example, this could include\nthe actual regex rule, sql statement, ingestion pipeline ID, etc."
|
|
225
|
+
}
|
|
226
|
+
],
|
|
227
|
+
"doc": "Information about who, why, and how this metadata was applied"
|
|
228
|
+
}
|
|
229
|
+
],
|
|
230
|
+
"name": "metadataAttribution",
|
|
231
|
+
"default": null
|
|
136
232
|
}
|
|
137
233
|
],
|
|
138
234
|
"doc": "A resource-defined string representing the resource state for the purpose of concurrency control"
|
|
@@ -346,54 +442,6 @@
|
|
|
346
442
|
"Urn": "Urn",
|
|
347
443
|
"urn_is_array": true
|
|
348
444
|
},
|
|
349
|
-
{
|
|
350
|
-
"Relationship": {
|
|
351
|
-
"/*": {
|
|
352
|
-
"entityTypes": [
|
|
353
|
-
"dataJob",
|
|
354
|
-
"dataProcessInstance"
|
|
355
|
-
],
|
|
356
|
-
"isLineage": true,
|
|
357
|
-
"name": "TrainedBy"
|
|
358
|
-
}
|
|
359
|
-
},
|
|
360
|
-
"type": [
|
|
361
|
-
"null",
|
|
362
|
-
{
|
|
363
|
-
"type": "array",
|
|
364
|
-
"items": "string"
|
|
365
|
-
}
|
|
366
|
-
],
|
|
367
|
-
"name": "trainingJobs",
|
|
368
|
-
"default": null,
|
|
369
|
-
"doc": "List of jobs (if any) used to train the model. Visible in Lineage. Note that ML Models can also be specified as the output of a specific Data Process Instances (runs) via the DataProcessInstanceOutputs aspect.",
|
|
370
|
-
"Urn": "Urn",
|
|
371
|
-
"urn_is_array": true
|
|
372
|
-
},
|
|
373
|
-
{
|
|
374
|
-
"Relationship": {
|
|
375
|
-
"/*": {
|
|
376
|
-
"entityTypes": [
|
|
377
|
-
"dataJob"
|
|
378
|
-
],
|
|
379
|
-
"isLineage": true,
|
|
380
|
-
"isUpstream": false,
|
|
381
|
-
"name": "UsedBy"
|
|
382
|
-
}
|
|
383
|
-
},
|
|
384
|
-
"type": [
|
|
385
|
-
"null",
|
|
386
|
-
{
|
|
387
|
-
"type": "array",
|
|
388
|
-
"items": "string"
|
|
389
|
-
}
|
|
390
|
-
],
|
|
391
|
-
"name": "downstreamJobs",
|
|
392
|
-
"default": null,
|
|
393
|
-
"doc": "List of jobs (if any) that use the model",
|
|
394
|
-
"Urn": "Urn",
|
|
395
|
-
"urn_is_array": true
|
|
396
|
-
},
|
|
397
445
|
{
|
|
398
446
|
"Relationship": {
|
|
399
447
|
"/*": {
|
|
@@ -97,6 +97,57 @@
|
|
|
97
97
|
],
|
|
98
98
|
"name": "versionTag",
|
|
99
99
|
"default": null
|
|
100
|
+
},
|
|
101
|
+
{
|
|
102
|
+
"type": [
|
|
103
|
+
"null",
|
|
104
|
+
{
|
|
105
|
+
"type": "record",
|
|
106
|
+
"name": "MetadataAttribution",
|
|
107
|
+
"namespace": "com.linkedin.pegasus2avro.common",
|
|
108
|
+
"fields": [
|
|
109
|
+
{
|
|
110
|
+
"type": "long",
|
|
111
|
+
"name": "time",
|
|
112
|
+
"doc": "When this metadata was updated."
|
|
113
|
+
},
|
|
114
|
+
{
|
|
115
|
+
"java": {
|
|
116
|
+
"class": "com.linkedin.pegasus2avro.common.urn.Urn"
|
|
117
|
+
},
|
|
118
|
+
"type": "string",
|
|
119
|
+
"name": "actor",
|
|
120
|
+
"doc": "The entity (e.g. a member URN) responsible for applying the assocated metadata. This can\neither be a user (in case of UI edits) or the datahub system for automation.",
|
|
121
|
+
"Urn": "Urn"
|
|
122
|
+
},
|
|
123
|
+
{
|
|
124
|
+
"java": {
|
|
125
|
+
"class": "com.linkedin.pegasus2avro.common.urn.Urn"
|
|
126
|
+
},
|
|
127
|
+
"type": [
|
|
128
|
+
"null",
|
|
129
|
+
"string"
|
|
130
|
+
],
|
|
131
|
+
"name": "source",
|
|
132
|
+
"default": null,
|
|
133
|
+
"doc": "The DataHub source responsible for applying the associated metadata. This will only be filled out\nwhen a DataHub source is responsible. This includes the specific metadata test urn, the automation urn.",
|
|
134
|
+
"Urn": "Urn"
|
|
135
|
+
},
|
|
136
|
+
{
|
|
137
|
+
"type": {
|
|
138
|
+
"type": "map",
|
|
139
|
+
"values": "string"
|
|
140
|
+
},
|
|
141
|
+
"name": "sourceDetail",
|
|
142
|
+
"default": {},
|
|
143
|
+
"doc": "The details associated with why this metadata was applied. For example, this could include\nthe actual regex rule, sql statement, ingestion pipeline ID, etc."
|
|
144
|
+
}
|
|
145
|
+
],
|
|
146
|
+
"doc": "Information about who, why, and how this metadata was applied"
|
|
147
|
+
}
|
|
148
|
+
],
|
|
149
|
+
"name": "metadataAttribution",
|
|
150
|
+
"default": null
|
|
100
151
|
}
|
|
101
152
|
],
|
|
102
153
|
"doc": "A resource-defined string representing the resource state for the purpose of concurrency control"
|