acryl-datahub-cloud 0.3.9rc6__py3-none-any.whl → 0.3.9rc8__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of acryl-datahub-cloud might be problematic. Click here for more details.
- acryl_datahub_cloud/_codegen_config.json +1 -1
- acryl_datahub_cloud/datahub_reporting/datahub_form_reporting.py +2 -2
- acryl_datahub_cloud/metadata/_urns/urn_defs.py +69 -69
- acryl_datahub_cloud/metadata/schema.avsc +56 -4
- acryl_datahub_cloud/metadata/schema_classes.py +173 -1
- acryl_datahub_cloud/metadata/schemas/DataProcessInstanceInput.avsc +129 -1
- acryl_datahub_cloud/metadata/schemas/DataProcessInstanceOutput.avsc +131 -3
- {acryl_datahub_cloud-0.3.9rc6.dist-info → acryl_datahub_cloud-0.3.9rc8.dist-info}/METADATA +45 -45
- {acryl_datahub_cloud-0.3.9rc6.dist-info → acryl_datahub_cloud-0.3.9rc8.dist-info}/RECORD +12 -12
- {acryl_datahub_cloud-0.3.9rc6.dist-info → acryl_datahub_cloud-0.3.9rc8.dist-info}/WHEEL +0 -0
- {acryl_datahub_cloud-0.3.9rc6.dist-info → acryl_datahub_cloud-0.3.9rc8.dist-info}/entry_points.txt +0 -0
- {acryl_datahub_cloud-0.3.9rc6.dist-info → acryl_datahub_cloud-0.3.9rc8.dist-info}/top_level.txt +0 -0
|
@@ -22196,7 +22196,6 @@
|
|
|
22196
22196
|
"dataset",
|
|
22197
22197
|
"mlModel"
|
|
22198
22198
|
],
|
|
22199
|
-
"isLineage": true,
|
|
22200
22199
|
"name": "Consumes"
|
|
22201
22200
|
}
|
|
22202
22201
|
},
|
|
@@ -22217,6 +22216,33 @@
|
|
|
22217
22216
|
},
|
|
22218
22217
|
"name": "inputs",
|
|
22219
22218
|
"doc": "Input assets consumed"
|
|
22219
|
+
},
|
|
22220
|
+
{
|
|
22221
|
+
"Relationship": {
|
|
22222
|
+
"/*/destinationUrn": {
|
|
22223
|
+
"createdActor": "inputEdges/*/created/actor",
|
|
22224
|
+
"createdOn": "inputEdges/*/created/time",
|
|
22225
|
+
"entityTypes": [
|
|
22226
|
+
"dataset",
|
|
22227
|
+
"mlModel"
|
|
22228
|
+
],
|
|
22229
|
+
"isLineage": true,
|
|
22230
|
+
"name": "DataProcessInstanceConsumes",
|
|
22231
|
+
"properties": "inputEdges/*/properties",
|
|
22232
|
+
"updatedActor": "inputEdges/*/lastModified/actor",
|
|
22233
|
+
"updatedOn": "inputEdges/*/lastModified/time"
|
|
22234
|
+
}
|
|
22235
|
+
},
|
|
22236
|
+
"type": [
|
|
22237
|
+
"null",
|
|
22238
|
+
{
|
|
22239
|
+
"type": "array",
|
|
22240
|
+
"items": "com.linkedin.pegasus2avro.common.Edge"
|
|
22241
|
+
}
|
|
22242
|
+
],
|
|
22243
|
+
"name": "inputEdges",
|
|
22244
|
+
"default": null,
|
|
22245
|
+
"doc": "Input assets consumed by the data process instance, with additional metadata.\nCounts as lineage.\nWill eventually deprecate the inputs field."
|
|
22220
22246
|
}
|
|
22221
22247
|
],
|
|
22222
22248
|
"doc": "Information about the inputs datasets of a Data process"
|
|
@@ -22567,8 +22593,6 @@
|
|
|
22567
22593
|
"dataset",
|
|
22568
22594
|
"mlModel"
|
|
22569
22595
|
],
|
|
22570
|
-
"isLineage": true,
|
|
22571
|
-
"isUpstream": false,
|
|
22572
22596
|
"name": "Produces"
|
|
22573
22597
|
}
|
|
22574
22598
|
},
|
|
@@ -22588,7 +22612,35 @@
|
|
|
22588
22612
|
"items": "string"
|
|
22589
22613
|
},
|
|
22590
22614
|
"name": "outputs",
|
|
22591
|
-
"doc": "Output
|
|
22615
|
+
"doc": "Output assets produced"
|
|
22616
|
+
},
|
|
22617
|
+
{
|
|
22618
|
+
"Relationship": {
|
|
22619
|
+
"/*/destinationUrn": {
|
|
22620
|
+
"createdActor": "outputEdges/*/created/actor",
|
|
22621
|
+
"createdOn": "outputEdges/*/created/time",
|
|
22622
|
+
"entityTypes": [
|
|
22623
|
+
"dataset",
|
|
22624
|
+
"mlModel"
|
|
22625
|
+
],
|
|
22626
|
+
"isLineage": true,
|
|
22627
|
+
"isUpstream": false,
|
|
22628
|
+
"name": "DataProcessInstanceProduces",
|
|
22629
|
+
"properties": "outputEdges/*/properties",
|
|
22630
|
+
"updatedActor": "outputEdges/*/lastModified/actor",
|
|
22631
|
+
"updatedOn": "outputEdges/*/lastModified/time"
|
|
22632
|
+
}
|
|
22633
|
+
},
|
|
22634
|
+
"type": [
|
|
22635
|
+
"null",
|
|
22636
|
+
{
|
|
22637
|
+
"type": "array",
|
|
22638
|
+
"items": "com.linkedin.pegasus2avro.common.Edge"
|
|
22639
|
+
}
|
|
22640
|
+
],
|
|
22641
|
+
"name": "outputEdges",
|
|
22642
|
+
"default": null,
|
|
22643
|
+
"doc": "Output assets produced by the data process instance during processing, with additional metadata.\nCounts as lineage.\nWill eventually deprecate the outputs field."
|
|
22592
22644
|
}
|
|
22593
22645
|
],
|
|
22594
22646
|
"doc": "Information about the outputs of a Data process"
|
|
@@ -13563,13 +13563,16 @@ class DataProcessInstanceInputClass(_Aspect):
|
|
|
13563
13563
|
|
|
13564
13564
|
def __init__(self,
|
|
13565
13565
|
inputs: List[str],
|
|
13566
|
+
inputEdges: Union[None, List["EdgeClass"]]=None,
|
|
13566
13567
|
):
|
|
13567
13568
|
super().__init__()
|
|
13568
13569
|
|
|
13569
13570
|
self.inputs = inputs
|
|
13571
|
+
self.inputEdges = inputEdges
|
|
13570
13572
|
|
|
13571
13573
|
def _restore_defaults(self) -> None:
|
|
13572
13574
|
self.inputs = list()
|
|
13575
|
+
self.inputEdges = self.RECORD_SCHEMA.fields_dict["inputEdges"].default
|
|
13573
13576
|
|
|
13574
13577
|
|
|
13575
13578
|
@property
|
|
@@ -13582,6 +13585,18 @@ class DataProcessInstanceInputClass(_Aspect):
|
|
|
13582
13585
|
self._inner_dict['inputs'] = value
|
|
13583
13586
|
|
|
13584
13587
|
|
|
13588
|
+
@property
|
|
13589
|
+
def inputEdges(self) -> Union[None, List["EdgeClass"]]:
|
|
13590
|
+
"""Input assets consumed by the data process instance, with additional metadata.
|
|
13591
|
+
Counts as lineage.
|
|
13592
|
+
Will eventually deprecate the inputs field."""
|
|
13593
|
+
return self._inner_dict.get('inputEdges') # type: ignore
|
|
13594
|
+
|
|
13595
|
+
@inputEdges.setter
|
|
13596
|
+
def inputEdges(self, value: Union[None, List["EdgeClass"]]) -> None:
|
|
13597
|
+
self._inner_dict['inputEdges'] = value
|
|
13598
|
+
|
|
13599
|
+
|
|
13585
13600
|
class DataProcessInstanceOutputClass(_Aspect):
|
|
13586
13601
|
"""Information about the outputs of a Data process"""
|
|
13587
13602
|
|
|
@@ -13592,18 +13607,21 @@ class DataProcessInstanceOutputClass(_Aspect):
|
|
|
13592
13607
|
|
|
13593
13608
|
def __init__(self,
|
|
13594
13609
|
outputs: List[str],
|
|
13610
|
+
outputEdges: Union[None, List["EdgeClass"]]=None,
|
|
13595
13611
|
):
|
|
13596
13612
|
super().__init__()
|
|
13597
13613
|
|
|
13598
13614
|
self.outputs = outputs
|
|
13615
|
+
self.outputEdges = outputEdges
|
|
13599
13616
|
|
|
13600
13617
|
def _restore_defaults(self) -> None:
|
|
13601
13618
|
self.outputs = list()
|
|
13619
|
+
self.outputEdges = self.RECORD_SCHEMA.fields_dict["outputEdges"].default
|
|
13602
13620
|
|
|
13603
13621
|
|
|
13604
13622
|
@property
|
|
13605
13623
|
def outputs(self) -> List[str]:
|
|
13606
|
-
"""Output
|
|
13624
|
+
"""Output assets produced"""
|
|
13607
13625
|
return self._inner_dict.get('outputs') # type: ignore
|
|
13608
13626
|
|
|
13609
13627
|
@outputs.setter
|
|
@@ -13611,6 +13629,18 @@ class DataProcessInstanceOutputClass(_Aspect):
|
|
|
13611
13629
|
self._inner_dict['outputs'] = value
|
|
13612
13630
|
|
|
13613
13631
|
|
|
13632
|
+
@property
|
|
13633
|
+
def outputEdges(self) -> Union[None, List["EdgeClass"]]:
|
|
13634
|
+
"""Output assets produced by the data process instance during processing, with additional metadata.
|
|
13635
|
+
Counts as lineage.
|
|
13636
|
+
Will eventually deprecate the outputs field."""
|
|
13637
|
+
return self._inner_dict.get('outputEdges') # type: ignore
|
|
13638
|
+
|
|
13639
|
+
@outputEdges.setter
|
|
13640
|
+
def outputEdges(self, value: Union[None, List["EdgeClass"]]) -> None:
|
|
13641
|
+
self._inner_dict['outputEdges'] = value
|
|
13642
|
+
|
|
13643
|
+
|
|
13614
13644
|
class DataProcessInstancePropertiesClass(_Aspect):
|
|
13615
13645
|
"""The inputs and outputs of this data process"""
|
|
13616
13646
|
|
|
@@ -37834,6 +37864,7 @@ ASPECT_NAME_MAP: Dict[str, Type[_Aspect]] = {
|
|
|
37834
37864
|
for aspect in ASPECT_CLASSES
|
|
37835
37865
|
}
|
|
37836
37866
|
|
|
37867
|
+
from typing import Literal
|
|
37837
37868
|
from typing_extensions import TypedDict
|
|
37838
37869
|
|
|
37839
37870
|
class AspectBag(TypedDict, total=False):
|
|
@@ -38176,4 +38207,145 @@ KEY_ASPECTS: Dict[str, Type[_Aspect]] = {
|
|
|
38176
38207
|
'telemetry': TelemetryKeyClass
|
|
38177
38208
|
}
|
|
38178
38209
|
|
|
38210
|
+
ENTITY_TYPE_NAMES: List[str] = [
|
|
38211
|
+
'dataProduct',
|
|
38212
|
+
'structuredProperty',
|
|
38213
|
+
'entityType',
|
|
38214
|
+
'platformResource',
|
|
38215
|
+
'businessAttribute',
|
|
38216
|
+
'dataType',
|
|
38217
|
+
'inviteToken',
|
|
38218
|
+
'assertion',
|
|
38219
|
+
'schemaField',
|
|
38220
|
+
'corpGroup',
|
|
38221
|
+
'role',
|
|
38222
|
+
'dataProcessInstance',
|
|
38223
|
+
'dataHubSecret',
|
|
38224
|
+
'dataHubPersona',
|
|
38225
|
+
'mlFeatureTable',
|
|
38226
|
+
'glossaryTerm',
|
|
38227
|
+
'recommendationModule',
|
|
38228
|
+
'post',
|
|
38229
|
+
'mlPrimaryKey',
|
|
38230
|
+
'dataPlatformInstance',
|
|
38231
|
+
'dataHubMetricCube',
|
|
38232
|
+
'query',
|
|
38233
|
+
'dataset',
|
|
38234
|
+
'dataHubExecutionRequest',
|
|
38235
|
+
'chart',
|
|
38236
|
+
'mlModelGroup',
|
|
38237
|
+
'subscription',
|
|
38238
|
+
'anomaly',
|
|
38239
|
+
'dataHubRemoteExecutorPool',
|
|
38240
|
+
'dataJob',
|
|
38241
|
+
'domain',
|
|
38242
|
+
'erModelRelationship',
|
|
38243
|
+
'dataHubRole',
|
|
38244
|
+
'form',
|
|
38245
|
+
'dataHubAccessToken',
|
|
38246
|
+
'dataHubAction',
|
|
38247
|
+
'dataPlatform',
|
|
38248
|
+
'container',
|
|
38249
|
+
'tag',
|
|
38250
|
+
'dataHubPolicy',
|
|
38251
|
+
'constraint',
|
|
38252
|
+
'glossaryNode',
|
|
38253
|
+
'dataProcess',
|
|
38254
|
+
'dataHubStepState',
|
|
38255
|
+
'notebook',
|
|
38256
|
+
'mlFeature',
|
|
38257
|
+
'dataHubUpgrade',
|
|
38258
|
+
'dashboard',
|
|
38259
|
+
'mlModel',
|
|
38260
|
+
'incident',
|
|
38261
|
+
'globalSettings',
|
|
38262
|
+
'dataHubView',
|
|
38263
|
+
'dataHubRetention',
|
|
38264
|
+
'ownershipType',
|
|
38265
|
+
'actionRequest',
|
|
38266
|
+
'dataHubRemoteExecutorGlobalConfig',
|
|
38267
|
+
'dataFlow',
|
|
38268
|
+
'dataContract',
|
|
38269
|
+
'dataHubConnection',
|
|
38270
|
+
'dataHubRemoteExecutor',
|
|
38271
|
+
'monitor',
|
|
38272
|
+
'corpuser',
|
|
38273
|
+
'versionSet',
|
|
38274
|
+
'test',
|
|
38275
|
+
'dataHubIngestionSource',
|
|
38276
|
+
'mlModelDeployment',
|
|
38277
|
+
'linkPreview',
|
|
38278
|
+
'telemetry'
|
|
38279
|
+
]
|
|
38280
|
+
EntityTypeName = Literal[
|
|
38281
|
+
'dataProduct',
|
|
38282
|
+
'structuredProperty',
|
|
38283
|
+
'entityType',
|
|
38284
|
+
'platformResource',
|
|
38285
|
+
'businessAttribute',
|
|
38286
|
+
'dataType',
|
|
38287
|
+
'inviteToken',
|
|
38288
|
+
'assertion',
|
|
38289
|
+
'schemaField',
|
|
38290
|
+
'corpGroup',
|
|
38291
|
+
'role',
|
|
38292
|
+
'dataProcessInstance',
|
|
38293
|
+
'dataHubSecret',
|
|
38294
|
+
'dataHubPersona',
|
|
38295
|
+
'mlFeatureTable',
|
|
38296
|
+
'glossaryTerm',
|
|
38297
|
+
'recommendationModule',
|
|
38298
|
+
'post',
|
|
38299
|
+
'mlPrimaryKey',
|
|
38300
|
+
'dataPlatformInstance',
|
|
38301
|
+
'dataHubMetricCube',
|
|
38302
|
+
'query',
|
|
38303
|
+
'dataset',
|
|
38304
|
+
'dataHubExecutionRequest',
|
|
38305
|
+
'chart',
|
|
38306
|
+
'mlModelGroup',
|
|
38307
|
+
'subscription',
|
|
38308
|
+
'anomaly',
|
|
38309
|
+
'dataHubRemoteExecutorPool',
|
|
38310
|
+
'dataJob',
|
|
38311
|
+
'domain',
|
|
38312
|
+
'erModelRelationship',
|
|
38313
|
+
'dataHubRole',
|
|
38314
|
+
'form',
|
|
38315
|
+
'dataHubAccessToken',
|
|
38316
|
+
'dataHubAction',
|
|
38317
|
+
'dataPlatform',
|
|
38318
|
+
'container',
|
|
38319
|
+
'tag',
|
|
38320
|
+
'dataHubPolicy',
|
|
38321
|
+
'constraint',
|
|
38322
|
+
'glossaryNode',
|
|
38323
|
+
'dataProcess',
|
|
38324
|
+
'dataHubStepState',
|
|
38325
|
+
'notebook',
|
|
38326
|
+
'mlFeature',
|
|
38327
|
+
'dataHubUpgrade',
|
|
38328
|
+
'dashboard',
|
|
38329
|
+
'mlModel',
|
|
38330
|
+
'incident',
|
|
38331
|
+
'globalSettings',
|
|
38332
|
+
'dataHubView',
|
|
38333
|
+
'dataHubRetention',
|
|
38334
|
+
'ownershipType',
|
|
38335
|
+
'actionRequest',
|
|
38336
|
+
'dataHubRemoteExecutorGlobalConfig',
|
|
38337
|
+
'dataFlow',
|
|
38338
|
+
'dataContract',
|
|
38339
|
+
'dataHubConnection',
|
|
38340
|
+
'dataHubRemoteExecutor',
|
|
38341
|
+
'monitor',
|
|
38342
|
+
'corpuser',
|
|
38343
|
+
'versionSet',
|
|
38344
|
+
'test',
|
|
38345
|
+
'dataHubIngestionSource',
|
|
38346
|
+
'mlModelDeployment',
|
|
38347
|
+
'linkPreview',
|
|
38348
|
+
'telemetry'
|
|
38349
|
+
]
|
|
38350
|
+
|
|
38179
38351
|
# fmt: on
|
|
@@ -13,7 +13,6 @@
|
|
|
13
13
|
"dataset",
|
|
14
14
|
"mlModel"
|
|
15
15
|
],
|
|
16
|
-
"isLineage": true,
|
|
17
16
|
"name": "Consumes"
|
|
18
17
|
}
|
|
19
18
|
},
|
|
@@ -34,6 +33,135 @@
|
|
|
34
33
|
"doc": "Input assets consumed",
|
|
35
34
|
"Urn": "Urn",
|
|
36
35
|
"urn_is_array": true
|
|
36
|
+
},
|
|
37
|
+
{
|
|
38
|
+
"Relationship": {
|
|
39
|
+
"/*/destinationUrn": {
|
|
40
|
+
"createdActor": "inputEdges/*/created/actor",
|
|
41
|
+
"createdOn": "inputEdges/*/created/time",
|
|
42
|
+
"entityTypes": [
|
|
43
|
+
"dataset",
|
|
44
|
+
"mlModel"
|
|
45
|
+
],
|
|
46
|
+
"isLineage": true,
|
|
47
|
+
"name": "DataProcessInstanceConsumes",
|
|
48
|
+
"properties": "inputEdges/*/properties",
|
|
49
|
+
"updatedActor": "inputEdges/*/lastModified/actor",
|
|
50
|
+
"updatedOn": "inputEdges/*/lastModified/time"
|
|
51
|
+
}
|
|
52
|
+
},
|
|
53
|
+
"type": [
|
|
54
|
+
"null",
|
|
55
|
+
{
|
|
56
|
+
"type": "array",
|
|
57
|
+
"items": {
|
|
58
|
+
"type": "record",
|
|
59
|
+
"name": "Edge",
|
|
60
|
+
"namespace": "com.linkedin.pegasus2avro.common",
|
|
61
|
+
"fields": [
|
|
62
|
+
{
|
|
63
|
+
"java": {
|
|
64
|
+
"class": "com.linkedin.pegasus2avro.common.urn.Urn"
|
|
65
|
+
},
|
|
66
|
+
"type": [
|
|
67
|
+
"null",
|
|
68
|
+
"string"
|
|
69
|
+
],
|
|
70
|
+
"name": "sourceUrn",
|
|
71
|
+
"default": null,
|
|
72
|
+
"doc": "Urn of the source of this relationship edge.\nIf not specified, assumed to be the entity that this aspect belongs to.",
|
|
73
|
+
"Urn": "Urn"
|
|
74
|
+
},
|
|
75
|
+
{
|
|
76
|
+
"java": {
|
|
77
|
+
"class": "com.linkedin.pegasus2avro.common.urn.Urn"
|
|
78
|
+
},
|
|
79
|
+
"type": "string",
|
|
80
|
+
"name": "destinationUrn",
|
|
81
|
+
"doc": "Urn of the destination of this relationship edge.",
|
|
82
|
+
"Urn": "Urn"
|
|
83
|
+
},
|
|
84
|
+
{
|
|
85
|
+
"type": [
|
|
86
|
+
"null",
|
|
87
|
+
{
|
|
88
|
+
"type": "record",
|
|
89
|
+
"name": "AuditStamp",
|
|
90
|
+
"namespace": "com.linkedin.pegasus2avro.common",
|
|
91
|
+
"fields": [
|
|
92
|
+
{
|
|
93
|
+
"type": "long",
|
|
94
|
+
"name": "time",
|
|
95
|
+
"doc": "When did the resource/association/sub-resource move into the specific lifecycle stage represented by this AuditEvent."
|
|
96
|
+
},
|
|
97
|
+
{
|
|
98
|
+
"java": {
|
|
99
|
+
"class": "com.linkedin.pegasus2avro.common.urn.Urn"
|
|
100
|
+
},
|
|
101
|
+
"type": "string",
|
|
102
|
+
"name": "actor",
|
|
103
|
+
"doc": "The entity (e.g. a member URN) which will be credited for moving the resource/association/sub-resource into the specific lifecycle stage. It is also the one used to authorize the change.",
|
|
104
|
+
"Urn": "Urn"
|
|
105
|
+
},
|
|
106
|
+
{
|
|
107
|
+
"java": {
|
|
108
|
+
"class": "com.linkedin.pegasus2avro.common.urn.Urn"
|
|
109
|
+
},
|
|
110
|
+
"type": [
|
|
111
|
+
"null",
|
|
112
|
+
"string"
|
|
113
|
+
],
|
|
114
|
+
"name": "impersonator",
|
|
115
|
+
"default": null,
|
|
116
|
+
"doc": "The entity (e.g. a service URN) which performs the change on behalf of the Actor and must be authorized to act as the Actor.",
|
|
117
|
+
"Urn": "Urn"
|
|
118
|
+
},
|
|
119
|
+
{
|
|
120
|
+
"type": [
|
|
121
|
+
"null",
|
|
122
|
+
"string"
|
|
123
|
+
],
|
|
124
|
+
"name": "message",
|
|
125
|
+
"default": null,
|
|
126
|
+
"doc": "Additional context around how DataHub was informed of the particular change. For example: was the change created by an automated process, or manually."
|
|
127
|
+
}
|
|
128
|
+
],
|
|
129
|
+
"doc": "Data captured on a resource/association/sub-resource level giving insight into when that resource/association/sub-resource moved into a particular lifecycle stage, and who acted to move it into that specific lifecycle stage."
|
|
130
|
+
}
|
|
131
|
+
],
|
|
132
|
+
"name": "created",
|
|
133
|
+
"default": null,
|
|
134
|
+
"doc": "Audit stamp containing who created this relationship edge and when"
|
|
135
|
+
},
|
|
136
|
+
{
|
|
137
|
+
"type": [
|
|
138
|
+
"null",
|
|
139
|
+
"com.linkedin.pegasus2avro.common.AuditStamp"
|
|
140
|
+
],
|
|
141
|
+
"name": "lastModified",
|
|
142
|
+
"default": null,
|
|
143
|
+
"doc": "Audit stamp containing who last modified this relationship edge and when"
|
|
144
|
+
},
|
|
145
|
+
{
|
|
146
|
+
"type": [
|
|
147
|
+
"null",
|
|
148
|
+
{
|
|
149
|
+
"type": "map",
|
|
150
|
+
"values": "string"
|
|
151
|
+
}
|
|
152
|
+
],
|
|
153
|
+
"name": "properties",
|
|
154
|
+
"default": null,
|
|
155
|
+
"doc": "A generic properties bag that allows us to store specific information on this graph edge."
|
|
156
|
+
}
|
|
157
|
+
],
|
|
158
|
+
"doc": "A common structure to represent all edges to entities when used inside aspects as collections\nThis ensures that all edges have common structure around audit-stamps and will support PATCH, time-travel automatically."
|
|
159
|
+
}
|
|
160
|
+
}
|
|
161
|
+
],
|
|
162
|
+
"name": "inputEdges",
|
|
163
|
+
"default": null,
|
|
164
|
+
"doc": "Input assets consumed by the data process instance, with additional metadata.\nCounts as lineage.\nWill eventually deprecate the inputs field."
|
|
37
165
|
}
|
|
38
166
|
],
|
|
39
167
|
"doc": "Information about the inputs datasets of a Data process"
|
|
@@ -13,8 +13,6 @@
|
|
|
13
13
|
"dataset",
|
|
14
14
|
"mlModel"
|
|
15
15
|
],
|
|
16
|
-
"isLineage": true,
|
|
17
|
-
"isUpstream": false,
|
|
18
16
|
"name": "Produces"
|
|
19
17
|
}
|
|
20
18
|
},
|
|
@@ -32,9 +30,139 @@
|
|
|
32
30
|
"items": "string"
|
|
33
31
|
},
|
|
34
32
|
"name": "outputs",
|
|
35
|
-
"doc": "Output
|
|
33
|
+
"doc": "Output assets produced",
|
|
36
34
|
"Urn": "Urn",
|
|
37
35
|
"urn_is_array": true
|
|
36
|
+
},
|
|
37
|
+
{
|
|
38
|
+
"Relationship": {
|
|
39
|
+
"/*/destinationUrn": {
|
|
40
|
+
"createdActor": "outputEdges/*/created/actor",
|
|
41
|
+
"createdOn": "outputEdges/*/created/time",
|
|
42
|
+
"entityTypes": [
|
|
43
|
+
"dataset",
|
|
44
|
+
"mlModel"
|
|
45
|
+
],
|
|
46
|
+
"isLineage": true,
|
|
47
|
+
"isUpstream": false,
|
|
48
|
+
"name": "DataProcessInstanceProduces",
|
|
49
|
+
"properties": "outputEdges/*/properties",
|
|
50
|
+
"updatedActor": "outputEdges/*/lastModified/actor",
|
|
51
|
+
"updatedOn": "outputEdges/*/lastModified/time"
|
|
52
|
+
}
|
|
53
|
+
},
|
|
54
|
+
"type": [
|
|
55
|
+
"null",
|
|
56
|
+
{
|
|
57
|
+
"type": "array",
|
|
58
|
+
"items": {
|
|
59
|
+
"type": "record",
|
|
60
|
+
"name": "Edge",
|
|
61
|
+
"namespace": "com.linkedin.pegasus2avro.common",
|
|
62
|
+
"fields": [
|
|
63
|
+
{
|
|
64
|
+
"java": {
|
|
65
|
+
"class": "com.linkedin.pegasus2avro.common.urn.Urn"
|
|
66
|
+
},
|
|
67
|
+
"type": [
|
|
68
|
+
"null",
|
|
69
|
+
"string"
|
|
70
|
+
],
|
|
71
|
+
"name": "sourceUrn",
|
|
72
|
+
"default": null,
|
|
73
|
+
"doc": "Urn of the source of this relationship edge.\nIf not specified, assumed to be the entity that this aspect belongs to.",
|
|
74
|
+
"Urn": "Urn"
|
|
75
|
+
},
|
|
76
|
+
{
|
|
77
|
+
"java": {
|
|
78
|
+
"class": "com.linkedin.pegasus2avro.common.urn.Urn"
|
|
79
|
+
},
|
|
80
|
+
"type": "string",
|
|
81
|
+
"name": "destinationUrn",
|
|
82
|
+
"doc": "Urn of the destination of this relationship edge.",
|
|
83
|
+
"Urn": "Urn"
|
|
84
|
+
},
|
|
85
|
+
{
|
|
86
|
+
"type": [
|
|
87
|
+
"null",
|
|
88
|
+
{
|
|
89
|
+
"type": "record",
|
|
90
|
+
"name": "AuditStamp",
|
|
91
|
+
"namespace": "com.linkedin.pegasus2avro.common",
|
|
92
|
+
"fields": [
|
|
93
|
+
{
|
|
94
|
+
"type": "long",
|
|
95
|
+
"name": "time",
|
|
96
|
+
"doc": "When did the resource/association/sub-resource move into the specific lifecycle stage represented by this AuditEvent."
|
|
97
|
+
},
|
|
98
|
+
{
|
|
99
|
+
"java": {
|
|
100
|
+
"class": "com.linkedin.pegasus2avro.common.urn.Urn"
|
|
101
|
+
},
|
|
102
|
+
"type": "string",
|
|
103
|
+
"name": "actor",
|
|
104
|
+
"doc": "The entity (e.g. a member URN) which will be credited for moving the resource/association/sub-resource into the specific lifecycle stage. It is also the one used to authorize the change.",
|
|
105
|
+
"Urn": "Urn"
|
|
106
|
+
},
|
|
107
|
+
{
|
|
108
|
+
"java": {
|
|
109
|
+
"class": "com.linkedin.pegasus2avro.common.urn.Urn"
|
|
110
|
+
},
|
|
111
|
+
"type": [
|
|
112
|
+
"null",
|
|
113
|
+
"string"
|
|
114
|
+
],
|
|
115
|
+
"name": "impersonator",
|
|
116
|
+
"default": null,
|
|
117
|
+
"doc": "The entity (e.g. a service URN) which performs the change on behalf of the Actor and must be authorized to act as the Actor.",
|
|
118
|
+
"Urn": "Urn"
|
|
119
|
+
},
|
|
120
|
+
{
|
|
121
|
+
"type": [
|
|
122
|
+
"null",
|
|
123
|
+
"string"
|
|
124
|
+
],
|
|
125
|
+
"name": "message",
|
|
126
|
+
"default": null,
|
|
127
|
+
"doc": "Additional context around how DataHub was informed of the particular change. For example: was the change created by an automated process, or manually."
|
|
128
|
+
}
|
|
129
|
+
],
|
|
130
|
+
"doc": "Data captured on a resource/association/sub-resource level giving insight into when that resource/association/sub-resource moved into a particular lifecycle stage, and who acted to move it into that specific lifecycle stage."
|
|
131
|
+
}
|
|
132
|
+
],
|
|
133
|
+
"name": "created",
|
|
134
|
+
"default": null,
|
|
135
|
+
"doc": "Audit stamp containing who created this relationship edge and when"
|
|
136
|
+
},
|
|
137
|
+
{
|
|
138
|
+
"type": [
|
|
139
|
+
"null",
|
|
140
|
+
"com.linkedin.pegasus2avro.common.AuditStamp"
|
|
141
|
+
],
|
|
142
|
+
"name": "lastModified",
|
|
143
|
+
"default": null,
|
|
144
|
+
"doc": "Audit stamp containing who last modified this relationship edge and when"
|
|
145
|
+
},
|
|
146
|
+
{
|
|
147
|
+
"type": [
|
|
148
|
+
"null",
|
|
149
|
+
{
|
|
150
|
+
"type": "map",
|
|
151
|
+
"values": "string"
|
|
152
|
+
}
|
|
153
|
+
],
|
|
154
|
+
"name": "properties",
|
|
155
|
+
"default": null,
|
|
156
|
+
"doc": "A generic properties bag that allows us to store specific information on this graph edge."
|
|
157
|
+
}
|
|
158
|
+
],
|
|
159
|
+
"doc": "A common structure to represent all edges to entities when used inside aspects as collections\nThis ensures that all edges have common structure around audit-stamps and will support PATCH, time-travel automatically."
|
|
160
|
+
}
|
|
161
|
+
}
|
|
162
|
+
],
|
|
163
|
+
"name": "outputEdges",
|
|
164
|
+
"default": null,
|
|
165
|
+
"doc": "Output assets produced by the data process instance during processing, with additional metadata.\nCounts as lineage.\nWill eventually deprecate the outputs field."
|
|
38
166
|
}
|
|
39
167
|
],
|
|
40
168
|
"doc": "Information about the outputs of a Data process"
|