acryl-datahub 0.15.0rc18__py3-none-any.whl → 0.15.0rc19__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of acryl-datahub might be problematic. Click here for more details.
- {acryl_datahub-0.15.0rc18.dist-info → acryl_datahub-0.15.0rc19.dist-info}/METADATA +2511 -2511
- {acryl_datahub-0.15.0rc18.dist-info → acryl_datahub-0.15.0rc19.dist-info}/RECORD +11 -11
- datahub/__init__.py +1 -1
- datahub/ingestion/source/snowflake/snowflake_utils.py +1 -1
- datahub/metadata/schema.avsc +4 -0
- datahub/metadata/schemas/FormInfo.avsc +4 -0
- datahub/sql_parsing/sql_parsing_aggregator.py +1 -2
- datahub/sql_parsing/sqlglot_utils.py +8 -2
- {acryl_datahub-0.15.0rc18.dist-info → acryl_datahub-0.15.0rc19.dist-info}/WHEEL +0 -0
- {acryl_datahub-0.15.0rc18.dist-info → acryl_datahub-0.15.0rc19.dist-info}/entry_points.txt +0 -0
- {acryl_datahub-0.15.0rc18.dist-info → acryl_datahub-0.15.0rc19.dist-info}/top_level.txt +0 -0
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
datahub/__init__.py,sha256=
|
|
1
|
+
datahub/__init__.py,sha256=zTa1Zc6cS51RVM7kIIa6JgOSFayPVXd-AmsJeebmbNQ,575
|
|
2
2
|
datahub/__main__.py,sha256=pegIvQ9hzK7IhqVeUi1MeADSZ2QlP-D3K0OQdEg55RU,106
|
|
3
3
|
datahub/entrypoints.py,sha256=3-qSfXAx3Z0FEkBV5tlO8fQr4xk4ySeDRMVTpS5Xd6A,7793
|
|
4
4
|
datahub/py.typed,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
@@ -438,7 +438,7 @@ datahub/ingestion/source/snowflake/snowflake_shares.py,sha256=ud3Ah4qHrmSfpD8Od-
|
|
|
438
438
|
datahub/ingestion/source/snowflake/snowflake_summary.py,sha256=kTmuCtRnvHqM8WBYhWeK4XafJq3ssFL9kcS03jEeWT4,5506
|
|
439
439
|
datahub/ingestion/source/snowflake/snowflake_tag.py,sha256=fyfWmFVz2WZrpTJWNIe9m0WpDHgeFrGPf8diORJZUwo,6212
|
|
440
440
|
datahub/ingestion/source/snowflake/snowflake_usage_v2.py,sha256=PEmYNMXJRUvLQmVd8juVqjokfuSPuH9ppcM0ruXamxA,24807
|
|
441
|
-
datahub/ingestion/source/snowflake/snowflake_utils.py,sha256=
|
|
441
|
+
datahub/ingestion/source/snowflake/snowflake_utils.py,sha256=YczNEupY89jeegjR2_1pT4bPi9wQ69EIhGpzyCe9Jdg,12600
|
|
442
442
|
datahub/ingestion/source/snowflake/snowflake_v2.py,sha256=lo_3asTuIZbF-LuEUcYL-9NIZ720n7oB9mYA6WVTWA4,31960
|
|
443
443
|
datahub/ingestion/source/sql/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
444
444
|
datahub/ingestion/source/sql/athena.py,sha256=G3cIY8H_76lIUAzQWW2kLnZOEsfbakmojxbiHb3dYZ8,24059
|
|
@@ -560,7 +560,7 @@ datahub/lite/lite_server.py,sha256=p9Oa2nNs65mqcssSIVOr7VOzWqfVstz6ZQEdT4f82S0,1
|
|
|
560
560
|
datahub/lite/lite_util.py,sha256=pgBpT3vTO1YCQ2njZRNyicSkHYeEmQCt41BaXU8WvMo,4503
|
|
561
561
|
datahub/metadata/__init__.py,sha256=AjhXPjI6cnpdcrBRrE5gOWo15vv2TTl2ctU4UAnUN7A,238
|
|
562
562
|
datahub/metadata/_schema_classes.py,sha256=iPeBXGvbNEm0vw5pYwunnvx7bTtBdmIQVtzMOlS6bSI,955042
|
|
563
|
-
datahub/metadata/schema.avsc,sha256=
|
|
563
|
+
datahub/metadata/schema.avsc,sha256=Xx93OdPzQfBb2CtntIYE-HAeKNg-JZcCtRU95v7ZZCs,677728
|
|
564
564
|
datahub/metadata/schema_classes.py,sha256=X5Jl5EaSxyHdXOQv14pJ5WkQALun4MRpJ4q12wVFE18,1299
|
|
565
565
|
datahub/metadata/urns.py,sha256=nfrCTExR-k2P9w272WVtWSN3xW1VUJngPwP3xnvULjU,1217
|
|
566
566
|
datahub/metadata/_urns/__init__.py,sha256=cOF3GHMDgPhmbLKbN02NPpuLGHSu0qNgQyBRv08eqF0,243
|
|
@@ -757,7 +757,7 @@ datahub/metadata/schemas/ExecutionRequestKey.avsc,sha256=SvjnlTAGYsSnvVE0rZ9-7UP
|
|
|
757
757
|
datahub/metadata/schemas/ExecutionRequestResult.avsc,sha256=kg3xMNr9kYLPnFsV-iqcGm1sh1muQVGJvxUt15L1yKo,2333
|
|
758
758
|
datahub/metadata/schemas/ExecutionRequestSignal.avsc,sha256=dsIUa6tfVSXqYOgh4cW6_Hzi8RjHuJJoO-mBAuZukpA,2515
|
|
759
759
|
datahub/metadata/schemas/Filter.avsc,sha256=PU-aGkc2-sI3ZXY7ci-Y0A7zp1jux3VW_6c8MJRAokg,5933
|
|
760
|
-
datahub/metadata/schemas/FormInfo.avsc,sha256=
|
|
760
|
+
datahub/metadata/schemas/FormInfo.avsc,sha256=FbN34htiCgm3LqKDL3sVsJhMUHIyc5jYpGJtYm7Ysd4,6270
|
|
761
761
|
datahub/metadata/schemas/FormKey.avsc,sha256=1-wE28B8T3WJ3JtexreNtFvP3To3n7U-jvYudCuSM9o,437
|
|
762
762
|
datahub/metadata/schemas/Forms.avsc,sha256=shmkhRoHN2gTaTsqGrGDRoNwe_z-nrFbbLjH9MtVDCs,10955
|
|
763
763
|
datahub/metadata/schemas/GlobalSettingsInfo.avsc,sha256=OVMM6FwhHhufHkezYcVePK0zI2llzFYLVFJhmAiHoiI,10102
|
|
@@ -869,11 +869,11 @@ datahub/sql_parsing/datajob.py,sha256=1X8KpEk-y3_8xJuA_Po27EHZgOcxK9QADI6Om9gSGn
|
|
|
869
869
|
datahub/sql_parsing/query_types.py,sha256=FKjDzszZzsrCfYfm7dgD6T_8865qxWl767fdGyHWBh4,2720
|
|
870
870
|
datahub/sql_parsing/schema_resolver.py,sha256=9INZWdxA2dMSLK6RXaVqjbjyLY_VKMhCkQv_Xd6Ln3I,10848
|
|
871
871
|
datahub/sql_parsing/split_statements.py,sha256=uZhAXLaRxDfmK0lPBW2oM_YVdJfSMhdgndnfd9iIXuA,5001
|
|
872
|
-
datahub/sql_parsing/sql_parsing_aggregator.py,sha256=
|
|
872
|
+
datahub/sql_parsing/sql_parsing_aggregator.py,sha256=F-aj7yqOwbo7FpxduFO5a7cLWkojL_Npv3_dlfHPNGY,69877
|
|
873
873
|
datahub/sql_parsing/sql_parsing_common.py,sha256=h_V_m54hJ9EUh5kczq7cYOIeNeo4bgf0Px0H-Nq-UIg,2602
|
|
874
874
|
datahub/sql_parsing/sql_parsing_result_utils.py,sha256=prwWTj1EB2fRPv1eMB4EkpFNafIYAt-X8TIK0NWqank,796
|
|
875
875
|
datahub/sql_parsing/sqlglot_lineage.py,sha256=CLDOc0HNqL_539eahOP3QOoldIYC6CF29id4Xe3TlEM,47018
|
|
876
|
-
datahub/sql_parsing/sqlglot_utils.py,sha256=
|
|
876
|
+
datahub/sql_parsing/sqlglot_utils.py,sha256=n6yufzEGwSlFeCSU540hEldIuab0q8KGqm9x0vSawkc,14699
|
|
877
877
|
datahub/sql_parsing/tool_meta_extractor.py,sha256=pE-pkRKBfNTXEJkaQM9NlG807mc-X6OtetgskJySCs8,2908
|
|
878
878
|
datahub/telemetry/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
879
879
|
datahub/telemetry/stats.py,sha256=YltbtC3fe6rl1kcxn1A-mSnVpECTPm5k-brrUt7QxTI,967
|
|
@@ -974,8 +974,8 @@ datahub_provider/operators/datahub_assertion_operator.py,sha256=uvTQ-jk2F0sbqqxp
|
|
|
974
974
|
datahub_provider/operators/datahub_assertion_sensor.py,sha256=lCBj_3x1cf5GMNpHdfkpHuyHfVxsm6ff5x2Z5iizcAo,140
|
|
975
975
|
datahub_provider/operators/datahub_operation_operator.py,sha256=aevDp2FzX7FxGlXrR0khoHNbxbhKR2qPEX5e8O2Jyzw,174
|
|
976
976
|
datahub_provider/operators/datahub_operation_sensor.py,sha256=8fcdVBCEPgqy1etTXgLoiHoJrRt_nzFZQMdSzHqSG7M,168
|
|
977
|
-
acryl_datahub-0.15.
|
|
978
|
-
acryl_datahub-0.15.
|
|
979
|
-
acryl_datahub-0.15.
|
|
980
|
-
acryl_datahub-0.15.
|
|
981
|
-
acryl_datahub-0.15.
|
|
977
|
+
acryl_datahub-0.15.0rc19.dist-info/METADATA,sha256=q_LaYt6m4WYgYyJo2ZA3Gj3a7kk5MKwiWvJheDfSPc8,173559
|
|
978
|
+
acryl_datahub-0.15.0rc19.dist-info/WHEEL,sha256=PZUExdf71Ui_so67QXpySuHtCi3-J3wvF4ORK6k_S8U,91
|
|
979
|
+
acryl_datahub-0.15.0rc19.dist-info/entry_points.txt,sha256=Yj0PWB0LQOq4Rj2fyR6ETx4BUGw4TOcNL0ZNoAZ9kQg,9504
|
|
980
|
+
acryl_datahub-0.15.0rc19.dist-info/top_level.txt,sha256=iLjSrLK5ox1YVYcglRUkcvfZPvKlobBWx7CTUXx8_GI,25
|
|
981
|
+
acryl_datahub-0.15.0rc19.dist-info/RECORD,,
|
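datahub/__init__.py
CHANGED
|
(diff body for this file is missing from this capture)
|
datahub/ingestion/source/snowflake/snowflake_utils.py
CHANGED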
|
@@ -119,7 +119,6 @@ class SnowflakeFilter:
|
|
|
119
119
|
) -> bool:
|
|
120
120
|
if not dataset_type or not dataset_name:
|
|
121
121
|
return True
|
|
122
|
-
dataset_params = dataset_name.split(".")
|
|
123
122
|
if dataset_type.lower() not in (
|
|
124
123
|
SnowflakeObjectDomain.TABLE,
|
|
125
124
|
SnowflakeObjectDomain.EXTERNAL_TABLE,
|
|
@@ -131,6 +130,7 @@ class SnowflakeFilter:
|
|
|
131
130
|
if _is_sys_table(dataset_name):
|
|
132
131
|
return False
|
|
133
132
|
|
|
133
|
+
dataset_params = _split_qualified_name(dataset_name)
|
|
134
134
|
if len(dataset_params) != 3:
|
|
135
135
|
self.structured_reporter.info(
|
|
136
136
|
title="Unexpected dataset pattern",
|
datahub/metadata/schema.avsc
CHANGED
|
@@ -18518,6 +18518,10 @@
|
|
|
18518
18518
|
"namespace": "com.linkedin.pegasus2avro.form",
|
|
18519
18519
|
"fields": [
|
|
18520
18520
|
{
|
|
18521
|
+
"Searchable": {
|
|
18522
|
+
"fieldName": "structuredPropertyPromptUrns",
|
|
18523
|
+
"fieldType": "URN"
|
|
18524
|
+
},
|
|
18521
18525
|
"java": {
|
|
18522
18526
|
"class": "com.linkedin.pegasus2avro.common.urn.Urn"
|
|
18523
18527
|
},
|
|
datahub/sql_parsing/sql_parsing_aggregator.py
CHANGED
|
@@ -1383,8 +1383,7 @@ class SqlParsingAggregator(Closeable):
|
|
|
1383
1383
|
return QueryUrn(query_id).urn()
|
|
1384
1384
|
|
|
1385
1385
|
@classmethod
|
|
1386
|
-
def _composite_query_id(cls, composed_of_queries:
|
|
1387
|
-
composed_of_queries = list(composed_of_queries)
|
|
1386
|
+
def _composite_query_id(cls, composed_of_queries: List[QueryId]) -> str:
|
|
1388
1387
|
combined = json.dumps(composed_of_queries)
|
|
1389
1388
|
return f"composite_{generate_hash(combined)}"
|
|
1390
1389
|
|
|
datahub/sql_parsing/sqlglot_utils.py
CHANGED
|
@@ -121,7 +121,7 @@ _BASIC_NORMALIZATION_RULES = {
|
|
|
121
121
|
# Remove /* */ comments.
|
|
122
122
|
re.compile(r"/\*.*?\*/", re.DOTALL): "",
|
|
123
123
|
# Remove -- comments.
|
|
124
|
-
re.compile(r"--.*$"): "",
|
|
124
|
+
re.compile(r"--.*$", re.MULTILINE): "",
|
|
125
125
|
# Replace all runs of whitespace with a single space.
|
|
126
126
|
re.compile(r"\s+"): " ",
|
|
127
127
|
# Remove leading and trailing whitespace and trailing semicolons.
|
|
@@ -131,10 +131,16 @@ _BASIC_NORMALIZATION_RULES = {
|
|
|
131
131
|
# Replace anything that looks like a string with a placeholder.
|
|
132
132
|
re.compile(r"'[^']*'"): "?",
|
|
133
133
|
# Replace sequences of IN/VALUES with a single placeholder.
|
|
134
|
-
|
|
134
|
+
# The r" ?" makes it more robust to uneven spacing.
|
|
135
|
+
re.compile(r"\b(IN|VALUES)\s*\( ?\?(?:, ?\?)* ?\)", re.IGNORECASE): r"\1 (?)",
|
|
135
136
|
# Normalize parenthesis spacing.
|
|
136
137
|
re.compile(r"\( "): "(",
|
|
137
138
|
re.compile(r" \)"): ")",
|
|
139
|
+
# Fix up spaces before commas in column lists.
|
|
140
|
+
# e.g. "col1 , col2" -> "col1, col2"
|
|
141
|
+
# e.g. "col1,col2" -> "col1, col2"
|
|
142
|
+
re.compile(r"\b ,"): ",",
|
|
143
|
+
re.compile(r"\b,\b"): ", ",
|
|
138
144
|
}
|
|
139
145
|
_TABLE_NAME_NORMALIZATION_RULES = {
|
|
140
146
|
# Replace UUID-like strings with a placeholder (both - and _ variants).
|
|
File without changes
|
|
File without changes
|
|
File without changes
|