acryl-datahub 0.15.0.1rc3__py3-none-any.whl → 0.15.0.1rc5__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of acryl-datahub might be problematic. Click here for more details.
- {acryl_datahub-0.15.0.1rc3.dist-info → acryl_datahub-0.15.0.1rc5.dist-info}/METADATA +2447 -2447
- {acryl_datahub-0.15.0.1rc3.dist-info → acryl_datahub-0.15.0.1rc5.dist-info}/RECORD +10 -10
- datahub/__init__.py +1 -1
- datahub/ingestion/source/datahub/config.py +12 -1
- datahub/ingestion/source/snowflake/snowflake_lineage_v2.py +3 -3
- datahub/ingestion/source/sql/mssql/job_models.py +0 -26
- datahub/ingestion/source/sql/mssql/source.py +0 -10
- {acryl_datahub-0.15.0.1rc3.dist-info → acryl_datahub-0.15.0.1rc5.dist-info}/WHEEL +0 -0
- {acryl_datahub-0.15.0.1rc3.dist-info → acryl_datahub-0.15.0.1rc5.dist-info}/entry_points.txt +0 -0
- {acryl_datahub-0.15.0.1rc3.dist-info → acryl_datahub-0.15.0.1rc5.dist-info}/top_level.txt +0 -0
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
datahub/__init__.py,sha256
|
|
1
|
+
datahub/__init__.py,sha256=-18N2YVu8PrOIy0Yx0RekGYrAFfiraOziwq167Rr-A0,576
|
|
2
2
|
datahub/__main__.py,sha256=pegIvQ9hzK7IhqVeUi1MeADSZ2QlP-D3K0OQdEg55RU,106
|
|
3
3
|
datahub/entrypoints.py,sha256=3-qSfXAx3Z0FEkBV5tlO8fQr4xk4ySeDRMVTpS5Xd6A,7793
|
|
4
4
|
datahub/py.typed,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
@@ -265,7 +265,7 @@ datahub/ingestion/source/data_lake_common/config.py,sha256=qUk83B01hjuBKHvVz8SmX
|
|
|
265
265
|
datahub/ingestion/source/data_lake_common/data_lake_utils.py,sha256=nxu7osuzqxScPFc-1ODA2M1c_xPNPpRH_SMMU7zKOIE,6212
|
|
266
266
|
datahub/ingestion/source/data_lake_common/path_spec.py,sha256=u3u2eMe70V5vur-j8mYtupZdoeA2hSeK262Whdsc2YU,23506
|
|
267
267
|
datahub/ingestion/source/datahub/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
268
|
-
datahub/ingestion/source/datahub/config.py,sha256=
|
|
268
|
+
datahub/ingestion/source/datahub/config.py,sha256=rqZFvEmjxjBcW2cTEPYDVTAk3OLzuGIjEFghXPNeZNY,3955
|
|
269
269
|
datahub/ingestion/source/datahub/datahub_api_reader.py,sha256=hlKADVEPoTFiRGKqRsMF5mL4fSu_IrIW8Nx7LpEzvkM,2134
|
|
270
270
|
datahub/ingestion/source/datahub/datahub_database_reader.py,sha256=F8JrOjSrmJ2B6m1MWh83A1EYFDcGMla749HUeQWMnL0,9464
|
|
271
271
|
datahub/ingestion/source/datahub/datahub_kafka_reader.py,sha256=8x9_u5kRjgSmu7c295ZIZjxP6bgoZZbWsKRicuLStRQ,4145
|
|
@@ -432,7 +432,7 @@ datahub/ingestion/source/snowflake/snowflake_assertion.py,sha256=_l3k4aI9wvioE81
|
|
|
432
432
|
datahub/ingestion/source/snowflake/snowflake_config.py,sha256=LZqnTELtzRNf0vsKG-xXggXyt13S9RYvHOZEZHRjgNk,18851
|
|
433
433
|
datahub/ingestion/source/snowflake/snowflake_connection.py,sha256=yzv-01FdmfDSCJY5rqKNNodXxzg3SS5DF7oA4WXArOA,17793
|
|
434
434
|
datahub/ingestion/source/snowflake/snowflake_data_reader.py,sha256=ffR5E2uhD71FUMXd3XOg2rHwrp1rbbGEFTAbqKcmI2s,2195
|
|
435
|
-
datahub/ingestion/source/snowflake/snowflake_lineage_v2.py,sha256=
|
|
435
|
+
datahub/ingestion/source/snowflake/snowflake_lineage_v2.py,sha256=kpZvGbWmLMEUBslGToeA3oBO__8V2FzPvUKJSNw_3VM,21598
|
|
436
436
|
datahub/ingestion/source/snowflake/snowflake_profiler.py,sha256=0DJiSwII6FY34urlBja2FW66NaVvhbBWmG0p7u8Xyrc,7548
|
|
437
437
|
datahub/ingestion/source/snowflake/snowflake_queries.py,sha256=8QEihOfivalVR9vLo6vCUL-vnZfAGgMio0uhPYX0jTo,25883
|
|
438
438
|
datahub/ingestion/source/snowflake/snowflake_query.py,sha256=yDu_1aTAG7eLEh1w1FGmn2-c6NJZURdslnI6fC_4B_0,38723
|
|
@@ -472,8 +472,8 @@ datahub/ingestion/source/sql/trino.py,sha256=FEn_BQ3pm23hKx94ek5kk5IXGNYcBqZEhll
|
|
|
472
472
|
datahub/ingestion/source/sql/two_tier_sql_source.py,sha256=YDrGBb5WKVls6qv17QU5foKrf71SydzEltc3WsVAhQc,5732
|
|
473
473
|
datahub/ingestion/source/sql/vertica.py,sha256=_9OgSgIgqBml0av063rb8nACiT3SAmzpw0ouyF91wv8,33382
|
|
474
474
|
datahub/ingestion/source/sql/mssql/__init__.py,sha256=1agpl8S_uDW40olkhCX_W19dbr5GO9qgjS3R7pLRZSk,87
|
|
475
|
-
datahub/ingestion/source/sql/mssql/job_models.py,sha256=
|
|
476
|
-
datahub/ingestion/source/sql/mssql/source.py,sha256=
|
|
475
|
+
datahub/ingestion/source/sql/mssql/job_models.py,sha256=ztXDrD4anhzwWvACIm9fucE2WhMDMKkJ4alMYOQOqWA,7083
|
|
476
|
+
datahub/ingestion/source/sql/mssql/source.py,sha256=ODdsOIbDA3X0E7En6GT15mD49W6RW9sXLwRoUgw2a8I,30925
|
|
477
477
|
datahub/ingestion/source/sql/mssql/stored_procedure_lineage.py,sha256=RpnvKPalAAaOD_eUg8bZ4VkGTSeLFWuy0mefwc4s3x8,2837
|
|
478
478
|
datahub/ingestion/source/state/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
479
479
|
datahub/ingestion/source/state/checkpoint.py,sha256=x9Xww-MIFXSKjeg1tOZXE72LehCm5OfKy3HfucgIRWM,8833
|
|
@@ -981,8 +981,8 @@ datahub_provider/operators/datahub_assertion_operator.py,sha256=uvTQ-jk2F0sbqqxp
|
|
|
981
981
|
datahub_provider/operators/datahub_assertion_sensor.py,sha256=lCBj_3x1cf5GMNpHdfkpHuyHfVxsm6ff5x2Z5iizcAo,140
|
|
982
982
|
datahub_provider/operators/datahub_operation_operator.py,sha256=aevDp2FzX7FxGlXrR0khoHNbxbhKR2qPEX5e8O2Jyzw,174
|
|
983
983
|
datahub_provider/operators/datahub_operation_sensor.py,sha256=8fcdVBCEPgqy1etTXgLoiHoJrRt_nzFZQMdSzHqSG7M,168
|
|
984
|
-
acryl_datahub-0.15.0.
|
|
985
|
-
acryl_datahub-0.15.0.
|
|
986
|
-
acryl_datahub-0.15.0.
|
|
987
|
-
acryl_datahub-0.15.0.
|
|
988
|
-
acryl_datahub-0.15.0.
|
|
984
|
+
acryl_datahub-0.15.0.1rc5.dist-info/METADATA,sha256=wHBTsOtPztz6CEvfrpn9IJGxoQfDKocsKdaI1MZTEj8,173642
|
|
985
|
+
acryl_datahub-0.15.0.1rc5.dist-info/WHEEL,sha256=PZUExdf71Ui_so67QXpySuHtCi3-J3wvF4ORK6k_S8U,91
|
|
986
|
+
acryl_datahub-0.15.0.1rc5.dist-info/entry_points.txt,sha256=xnPSPLK3bJGADxe4TDS4wL4u0FT_PGlahDa-ENYdYCQ,9512
|
|
987
|
+
acryl_datahub-0.15.0.1rc5.dist-info/top_level.txt,sha256=iLjSrLK5ox1YVYcglRUkcvfZPvKlobBWx7CTUXx8_GI,25
|
|
988
|
+
acryl_datahub-0.15.0.1rc5.dist-info/RECORD,,
|
datahub/__init__.py
CHANGED
|
@@ -14,6 +14,17 @@ from datahub.ingestion.source.state.stateful_ingestion_base import (
|
|
|
14
14
|
DEFAULT_DATABASE_TABLE_NAME = "metadata_aspect_v2"
|
|
15
15
|
DEFAULT_KAFKA_TOPIC_NAME = "MetadataChangeLog_Timeseries_v1"
|
|
16
16
|
DEFAULT_DATABASE_BATCH_SIZE = 10_000
|
|
17
|
+
DEFAULT_EXCLUDE_ASPECTS = {
|
|
18
|
+
"dataHubIngestionSourceKey",
|
|
19
|
+
"dataHubIngestionSourceInfo",
|
|
20
|
+
"datahubIngestionRunSummary",
|
|
21
|
+
"datahubIngestionCheckpoint",
|
|
22
|
+
"dataHubSecretKey",
|
|
23
|
+
"dataHubSecretValue",
|
|
24
|
+
"globalSettingsKey",
|
|
25
|
+
"globalSettingsInfo",
|
|
26
|
+
"testResults",
|
|
27
|
+
}
|
|
17
28
|
|
|
18
29
|
|
|
19
30
|
class DataHubSourceConfig(StatefulIngestionConfigBase):
|
|
@@ -44,7 +55,7 @@ class DataHubSourceConfig(StatefulIngestionConfigBase):
|
|
|
44
55
|
)
|
|
45
56
|
|
|
46
57
|
exclude_aspects: Set[str] = Field(
|
|
47
|
-
|
|
58
|
+
default=DEFAULT_EXCLUDE_ASPECTS,
|
|
48
59
|
description="Set of aspect names to exclude from ingestion",
|
|
49
60
|
)
|
|
50
61
|
|
|
@@ -4,7 +4,7 @@ from dataclasses import dataclass
|
|
|
4
4
|
from datetime import datetime
|
|
5
5
|
from typing import Any, Collection, Iterable, List, Optional, Set, Tuple, Type
|
|
6
6
|
|
|
7
|
-
from pydantic import BaseModel, validator
|
|
7
|
+
from pydantic import BaseModel, Field, validator
|
|
8
8
|
|
|
9
9
|
from datahub.configuration.datetimes import parse_absolute_time
|
|
10
10
|
from datahub.ingestion.api.closeable import Closeable
|
|
@@ -72,8 +72,8 @@ class ColumnUpstreamJob(BaseModel):
|
|
|
72
72
|
|
|
73
73
|
|
|
74
74
|
class ColumnUpstreamLineage(BaseModel):
|
|
75
|
-
column_name: str
|
|
76
|
-
upstreams: List[ColumnUpstreamJob]
|
|
75
|
+
column_name: Optional[str]
|
|
76
|
+
upstreams: List[ColumnUpstreamJob] = Field(default_factory=list)
|
|
77
77
|
|
|
78
78
|
|
|
79
79
|
class UpstreamTableNode(BaseModel):
|
|
@@ -7,9 +7,7 @@ from datahub.emitter.mce_builder import (
|
|
|
7
7
|
make_data_platform_urn,
|
|
8
8
|
make_dataplatform_instance_urn,
|
|
9
9
|
)
|
|
10
|
-
from datahub.emitter.mcp_builder import DatabaseKey
|
|
11
10
|
from datahub.metadata.schema_classes import (
|
|
12
|
-
ContainerClass,
|
|
13
11
|
DataFlowInfoClass,
|
|
14
12
|
DataJobInfoClass,
|
|
15
13
|
DataJobInputOutputClass,
|
|
@@ -212,18 +210,6 @@ class MSSQLDataJob:
|
|
|
212
210
|
status=self.status,
|
|
213
211
|
)
|
|
214
212
|
|
|
215
|
-
@property
|
|
216
|
-
def as_container_aspect(self) -> ContainerClass:
|
|
217
|
-
databaseKey = DatabaseKey(
|
|
218
|
-
platform=self.entity.flow.orchestrator,
|
|
219
|
-
instance=self.entity.flow.platform_instance
|
|
220
|
-
if self.entity.flow.platform_instance
|
|
221
|
-
else None,
|
|
222
|
-
env=self.entity.flow.env,
|
|
223
|
-
database=self.entity.flow.db,
|
|
224
|
-
)
|
|
225
|
-
return ContainerClass(container=databaseKey.as_urn())
|
|
226
|
-
|
|
227
213
|
@property
|
|
228
214
|
def as_maybe_platform_instance_aspect(self) -> Optional[DataPlatformInstanceClass]:
|
|
229
215
|
if self.entity.flow.platform_instance:
|
|
@@ -271,18 +257,6 @@ class MSSQLDataFlow:
|
|
|
271
257
|
externalUrl=self.external_url,
|
|
272
258
|
)
|
|
273
259
|
|
|
274
|
-
@property
|
|
275
|
-
def as_container_aspect(self) -> ContainerClass:
|
|
276
|
-
databaseKey = DatabaseKey(
|
|
277
|
-
platform=self.entity.orchestrator,
|
|
278
|
-
instance=self.entity.platform_instance
|
|
279
|
-
if self.entity.platform_instance
|
|
280
|
-
else None,
|
|
281
|
-
env=self.entity.env,
|
|
282
|
-
database=self.entity.db,
|
|
283
|
-
)
|
|
284
|
-
return ContainerClass(container=databaseKey.as_urn())
|
|
285
|
-
|
|
286
260
|
@property
|
|
287
261
|
def as_maybe_platform_instance_aspect(self) -> Optional[DataPlatformInstanceClass]:
|
|
288
262
|
if self.entity.platform_instance:
|
|
@@ -639,11 +639,6 @@ class SQLServerSource(SQLAlchemySource):
|
|
|
639
639
|
aspect=data_job.as_datajob_info_aspect,
|
|
640
640
|
).as_workunit()
|
|
641
641
|
|
|
642
|
-
yield MetadataChangeProposalWrapper(
|
|
643
|
-
entityUrn=data_job.urn,
|
|
644
|
-
aspect=data_job.as_container_aspect,
|
|
645
|
-
).as_workunit()
|
|
646
|
-
|
|
647
642
|
data_platform_instance_aspect = data_job.as_maybe_platform_instance_aspect
|
|
648
643
|
if data_platform_instance_aspect:
|
|
649
644
|
yield MetadataChangeProposalWrapper(
|
|
@@ -667,11 +662,6 @@ class SQLServerSource(SQLAlchemySource):
|
|
|
667
662
|
aspect=data_flow.as_dataflow_info_aspect,
|
|
668
663
|
).as_workunit()
|
|
669
664
|
|
|
670
|
-
yield MetadataChangeProposalWrapper(
|
|
671
|
-
entityUrn=data_flow.urn,
|
|
672
|
-
aspect=data_flow.as_container_aspect,
|
|
673
|
-
).as_workunit()
|
|
674
|
-
|
|
675
665
|
data_platform_instance_aspect = data_flow.as_maybe_platform_instance_aspect
|
|
676
666
|
if data_platform_instance_aspect:
|
|
677
667
|
yield MetadataChangeProposalWrapper(
|
|
File without changes
|
{acryl_datahub-0.15.0.1rc3.dist-info → acryl_datahub-0.15.0.1rc5.dist-info}/entry_points.txt
RENAMED
|
File without changes
|
|
File without changes
|