acryl-datahub 0.15.0.1rc3__py3-none-any.whl → 0.15.0.1rc5__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of acryl-datahub might be problematic. Click here for more details.

@@ -1,4 +1,4 @@
1
- datahub/__init__.py,sha256=BqWrG3ZFOnsobExCu08Kaj1mOgrBZ-Jmo_XLdalPyI0,576
1
+ datahub/__init__.py,sha256=-18N2YVu8PrOIy0Yx0RekGYrAFfiraOziwq167Rr-A0,576
2
2
  datahub/__main__.py,sha256=pegIvQ9hzK7IhqVeUi1MeADSZ2QlP-D3K0OQdEg55RU,106
3
3
  datahub/entrypoints.py,sha256=3-qSfXAx3Z0FEkBV5tlO8fQr4xk4ySeDRMVTpS5Xd6A,7793
4
4
  datahub/py.typed,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
@@ -265,7 +265,7 @@ datahub/ingestion/source/data_lake_common/config.py,sha256=qUk83B01hjuBKHvVz8SmX
265
265
  datahub/ingestion/source/data_lake_common/data_lake_utils.py,sha256=nxu7osuzqxScPFc-1ODA2M1c_xPNPpRH_SMMU7zKOIE,6212
266
266
  datahub/ingestion/source/data_lake_common/path_spec.py,sha256=u3u2eMe70V5vur-j8mYtupZdoeA2hSeK262Whdsc2YU,23506
267
267
  datahub/ingestion/source/datahub/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
268
- datahub/ingestion/source/datahub/config.py,sha256=pOXt0b1PX6D7dtD4RuKwdmr6sQKnXSf6LHxfPUMhP8s,3658
268
+ datahub/ingestion/source/datahub/config.py,sha256=rqZFvEmjxjBcW2cTEPYDVTAk3OLzuGIjEFghXPNeZNY,3955
269
269
  datahub/ingestion/source/datahub/datahub_api_reader.py,sha256=hlKADVEPoTFiRGKqRsMF5mL4fSu_IrIW8Nx7LpEzvkM,2134
270
270
  datahub/ingestion/source/datahub/datahub_database_reader.py,sha256=F8JrOjSrmJ2B6m1MWh83A1EYFDcGMla749HUeQWMnL0,9464
271
271
  datahub/ingestion/source/datahub/datahub_kafka_reader.py,sha256=8x9_u5kRjgSmu7c295ZIZjxP6bgoZZbWsKRicuLStRQ,4145
@@ -432,7 +432,7 @@ datahub/ingestion/source/snowflake/snowflake_assertion.py,sha256=_l3k4aI9wvioE81
432
432
  datahub/ingestion/source/snowflake/snowflake_config.py,sha256=LZqnTELtzRNf0vsKG-xXggXyt13S9RYvHOZEZHRjgNk,18851
433
433
  datahub/ingestion/source/snowflake/snowflake_connection.py,sha256=yzv-01FdmfDSCJY5rqKNNodXxzg3SS5DF7oA4WXArOA,17793
434
434
  datahub/ingestion/source/snowflake/snowflake_data_reader.py,sha256=ffR5E2uhD71FUMXd3XOg2rHwrp1rbbGEFTAbqKcmI2s,2195
435
- datahub/ingestion/source/snowflake/snowflake_lineage_v2.py,sha256=uMGmMEl4hWEmN7GxMyDBdwlIPAW7WmOnu41kZ0dvCG4,21551
435
+ datahub/ingestion/source/snowflake/snowflake_lineage_v2.py,sha256=kpZvGbWmLMEUBslGToeA3oBO__8V2FzPvUKJSNw_3VM,21598
436
436
  datahub/ingestion/source/snowflake/snowflake_profiler.py,sha256=0DJiSwII6FY34urlBja2FW66NaVvhbBWmG0p7u8Xyrc,7548
437
437
  datahub/ingestion/source/snowflake/snowflake_queries.py,sha256=8QEihOfivalVR9vLo6vCUL-vnZfAGgMio0uhPYX0jTo,25883
438
438
  datahub/ingestion/source/snowflake/snowflake_query.py,sha256=yDu_1aTAG7eLEh1w1FGmn2-c6NJZURdslnI6fC_4B_0,38723
@@ -472,8 +472,8 @@ datahub/ingestion/source/sql/trino.py,sha256=FEn_BQ3pm23hKx94ek5kk5IXGNYcBqZEhll
472
472
  datahub/ingestion/source/sql/two_tier_sql_source.py,sha256=YDrGBb5WKVls6qv17QU5foKrf71SydzEltc3WsVAhQc,5732
473
473
  datahub/ingestion/source/sql/vertica.py,sha256=_9OgSgIgqBml0av063rb8nACiT3SAmzpw0ouyF91wv8,33382
474
474
  datahub/ingestion/source/sql/mssql/__init__.py,sha256=1agpl8S_uDW40olkhCX_W19dbr5GO9qgjS3R7pLRZSk,87
475
- datahub/ingestion/source/sql/mssql/job_models.py,sha256=qMA4yzRiX-60ugsFu5ob3tOSgVs0uPTW_O8OHCECS_0,8002
476
- datahub/ingestion/source/sql/mssql/source.py,sha256=0ivc6svImkYfGYuAPDX4ZsaYZTilohwaV4cg3KWOqNI,31237
475
+ datahub/ingestion/source/sql/mssql/job_models.py,sha256=ztXDrD4anhzwWvACIm9fucE2WhMDMKkJ4alMYOQOqWA,7083
476
+ datahub/ingestion/source/sql/mssql/source.py,sha256=ODdsOIbDA3X0E7En6GT15mD49W6RW9sXLwRoUgw2a8I,30925
477
477
  datahub/ingestion/source/sql/mssql/stored_procedure_lineage.py,sha256=RpnvKPalAAaOD_eUg8bZ4VkGTSeLFWuy0mefwc4s3x8,2837
478
478
  datahub/ingestion/source/state/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
479
479
  datahub/ingestion/source/state/checkpoint.py,sha256=x9Xww-MIFXSKjeg1tOZXE72LehCm5OfKy3HfucgIRWM,8833
@@ -981,8 +981,8 @@ datahub_provider/operators/datahub_assertion_operator.py,sha256=uvTQ-jk2F0sbqqxp
981
981
  datahub_provider/operators/datahub_assertion_sensor.py,sha256=lCBj_3x1cf5GMNpHdfkpHuyHfVxsm6ff5x2Z5iizcAo,140
982
982
  datahub_provider/operators/datahub_operation_operator.py,sha256=aevDp2FzX7FxGlXrR0khoHNbxbhKR2qPEX5e8O2Jyzw,174
983
983
  datahub_provider/operators/datahub_operation_sensor.py,sha256=8fcdVBCEPgqy1etTXgLoiHoJrRt_nzFZQMdSzHqSG7M,168
984
- acryl_datahub-0.15.0.1rc3.dist-info/METADATA,sha256=JxWLTgCDIjuZb3Q_cRrG3nTw6mqsweOED2pg_izLT5I,173642
985
- acryl_datahub-0.15.0.1rc3.dist-info/WHEEL,sha256=PZUExdf71Ui_so67QXpySuHtCi3-J3wvF4ORK6k_S8U,91
986
- acryl_datahub-0.15.0.1rc3.dist-info/entry_points.txt,sha256=xnPSPLK3bJGADxe4TDS4wL4u0FT_PGlahDa-ENYdYCQ,9512
987
- acryl_datahub-0.15.0.1rc3.dist-info/top_level.txt,sha256=iLjSrLK5ox1YVYcglRUkcvfZPvKlobBWx7CTUXx8_GI,25
988
- acryl_datahub-0.15.0.1rc3.dist-info/RECORD,,
984
+ acryl_datahub-0.15.0.1rc5.dist-info/METADATA,sha256=wHBTsOtPztz6CEvfrpn9IJGxoQfDKocsKdaI1MZTEj8,173642
985
+ acryl_datahub-0.15.0.1rc5.dist-info/WHEEL,sha256=PZUExdf71Ui_so67QXpySuHtCi3-J3wvF4ORK6k_S8U,91
986
+ acryl_datahub-0.15.0.1rc5.dist-info/entry_points.txt,sha256=xnPSPLK3bJGADxe4TDS4wL4u0FT_PGlahDa-ENYdYCQ,9512
987
+ acryl_datahub-0.15.0.1rc5.dist-info/top_level.txt,sha256=iLjSrLK5ox1YVYcglRUkcvfZPvKlobBWx7CTUXx8_GI,25
988
+ acryl_datahub-0.15.0.1rc5.dist-info/RECORD,,
datahub/__init__.py CHANGED
@@ -3,7 +3,7 @@ import warnings
3
3
 
4
4
  # Published at https://pypi.org/project/acryl-datahub/.
5
5
  __package_name__ = "acryl-datahub"
6
- __version__ = "0.15.0.1rc3"
6
+ __version__ = "0.15.0.1rc5"
7
7
 
8
8
 
9
9
  def is_dev_mode() -> bool:
@@ -14,6 +14,17 @@ from datahub.ingestion.source.state.stateful_ingestion_base import (
14
14
  DEFAULT_DATABASE_TABLE_NAME = "metadata_aspect_v2"
15
15
  DEFAULT_KAFKA_TOPIC_NAME = "MetadataChangeLog_Timeseries_v1"
16
16
  DEFAULT_DATABASE_BATCH_SIZE = 10_000
17
+ DEFAULT_EXCLUDE_ASPECTS = {
18
+ "dataHubIngestionSourceKey",
19
+ "dataHubIngestionSourceInfo",
20
+ "datahubIngestionRunSummary",
21
+ "datahubIngestionCheckpoint",
22
+ "dataHubSecretKey",
23
+ "dataHubSecretValue",
24
+ "globalSettingsKey",
25
+ "globalSettingsInfo",
26
+ "testResults",
27
+ }
17
28
 
18
29
 
19
30
  class DataHubSourceConfig(StatefulIngestionConfigBase):
@@ -44,7 +55,7 @@ class DataHubSourceConfig(StatefulIngestionConfigBase):
44
55
  )
45
56
 
46
57
  exclude_aspects: Set[str] = Field(
47
- default_factory=set,
58
+ default=DEFAULT_EXCLUDE_ASPECTS,
48
59
  description="Set of aspect names to exclude from ingestion",
49
60
  )
50
61
 
@@ -4,7 +4,7 @@ from dataclasses import dataclass
4
4
  from datetime import datetime
5
5
  from typing import Any, Collection, Iterable, List, Optional, Set, Tuple, Type
6
6
 
7
- from pydantic import BaseModel, validator
7
+ from pydantic import BaseModel, Field, validator
8
8
 
9
9
  from datahub.configuration.datetimes import parse_absolute_time
10
10
  from datahub.ingestion.api.closeable import Closeable
@@ -72,8 +72,8 @@ class ColumnUpstreamJob(BaseModel):
72
72
 
73
73
 
74
74
  class ColumnUpstreamLineage(BaseModel):
75
- column_name: str
76
- upstreams: List[ColumnUpstreamJob]
75
+ column_name: Optional[str]
76
+ upstreams: List[ColumnUpstreamJob] = Field(default_factory=list)
77
77
 
78
78
 
79
79
  class UpstreamTableNode(BaseModel):
@@ -7,9 +7,7 @@ from datahub.emitter.mce_builder import (
7
7
  make_data_platform_urn,
8
8
  make_dataplatform_instance_urn,
9
9
  )
10
- from datahub.emitter.mcp_builder import DatabaseKey
11
10
  from datahub.metadata.schema_classes import (
12
- ContainerClass,
13
11
  DataFlowInfoClass,
14
12
  DataJobInfoClass,
15
13
  DataJobInputOutputClass,
@@ -212,18 +210,6 @@ class MSSQLDataJob:
212
210
  status=self.status,
213
211
  )
214
212
 
215
- @property
216
- def as_container_aspect(self) -> ContainerClass:
217
- databaseKey = DatabaseKey(
218
- platform=self.entity.flow.orchestrator,
219
- instance=self.entity.flow.platform_instance
220
- if self.entity.flow.platform_instance
221
- else None,
222
- env=self.entity.flow.env,
223
- database=self.entity.flow.db,
224
- )
225
- return ContainerClass(container=databaseKey.as_urn())
226
-
227
213
  @property
228
214
  def as_maybe_platform_instance_aspect(self) -> Optional[DataPlatformInstanceClass]:
229
215
  if self.entity.flow.platform_instance:
@@ -271,18 +257,6 @@ class MSSQLDataFlow:
271
257
  externalUrl=self.external_url,
272
258
  )
273
259
 
274
- @property
275
- def as_container_aspect(self) -> ContainerClass:
276
- databaseKey = DatabaseKey(
277
- platform=self.entity.orchestrator,
278
- instance=self.entity.platform_instance
279
- if self.entity.platform_instance
280
- else None,
281
- env=self.entity.env,
282
- database=self.entity.db,
283
- )
284
- return ContainerClass(container=databaseKey.as_urn())
285
-
286
260
  @property
287
261
  def as_maybe_platform_instance_aspect(self) -> Optional[DataPlatformInstanceClass]:
288
262
  if self.entity.platform_instance:
@@ -639,11 +639,6 @@ class SQLServerSource(SQLAlchemySource):
639
639
  aspect=data_job.as_datajob_info_aspect,
640
640
  ).as_workunit()
641
641
 
642
- yield MetadataChangeProposalWrapper(
643
- entityUrn=data_job.urn,
644
- aspect=data_job.as_container_aspect,
645
- ).as_workunit()
646
-
647
642
  data_platform_instance_aspect = data_job.as_maybe_platform_instance_aspect
648
643
  if data_platform_instance_aspect:
649
644
  yield MetadataChangeProposalWrapper(
@@ -667,11 +662,6 @@ class SQLServerSource(SQLAlchemySource):
667
662
  aspect=data_flow.as_dataflow_info_aspect,
668
663
  ).as_workunit()
669
664
 
670
- yield MetadataChangeProposalWrapper(
671
- entityUrn=data_flow.urn,
672
- aspect=data_flow.as_container_aspect,
673
- ).as_workunit()
674
-
675
665
  data_platform_instance_aspect = data_flow.as_maybe_platform_instance_aspect
676
666
  if data_platform_instance_aspect:
677
667
  yield MetadataChangeProposalWrapper(