acryl-datahub 1.0.0.3rc8__py3-none-any.whl → 1.0.0.3rc10__py3-none-any.whl
This diff compares the contents of two publicly released versions of the package, as they appear in their respective public registries. It is provided for informational purposes only.
- {acryl_datahub-1.0.0.3rc8.dist-info → acryl_datahub-1.0.0.3rc10.dist-info}/METADATA +2466 -2466
- {acryl_datahub-1.0.0.3rc8.dist-info → acryl_datahub-1.0.0.3rc10.dist-info}/RECORD +60 -60
- {acryl_datahub-1.0.0.3rc8.dist-info → acryl_datahub-1.0.0.3rc10.dist-info}/WHEEL +1 -1
- datahub/_version.py +1 -1
- datahub/api/circuit_breaker/operation_circuit_breaker.py +2 -2
- datahub/api/entities/datajob/dataflow.py +3 -3
- datahub/api/entities/dataset/dataset.py +9 -11
- datahub/api/entities/forms/forms.py +34 -35
- datahub/api/graphql/assertion.py +1 -1
- datahub/api/graphql/operation.py +4 -4
- datahub/cli/delete_cli.py +1 -1
- datahub/cli/docker_cli.py +2 -2
- datahub/configuration/common.py +5 -0
- datahub/configuration/source_common.py +1 -1
- datahub/emitter/request_helper.py +116 -3
- datahub/emitter/rest_emitter.py +44 -52
- datahub/ingestion/api/source.py +2 -5
- datahub/ingestion/api/source_helpers.py +1 -0
- datahub/ingestion/glossary/classification_mixin.py +4 -2
- datahub/ingestion/graph/client.py +3 -1
- datahub/ingestion/graph/config.py +1 -0
- datahub/ingestion/graph/filters.py +1 -1
- datahub/ingestion/source/aws/sagemaker_processors/feature_groups.py +1 -1
- datahub/ingestion/source/bigquery_v2/bigquery.py +24 -23
- datahub/ingestion/source/cassandra/cassandra_profiling.py +25 -24
- datahub/ingestion/source/datahub/datahub_database_reader.py +12 -11
- datahub/ingestion/source/dbt/dbt_cloud.py +2 -6
- datahub/ingestion/source/dbt/dbt_common.py +10 -2
- datahub/ingestion/source/dbt/dbt_core.py +82 -42
- datahub/ingestion/source/feast.py +4 -4
- datahub/ingestion/source/iceberg/iceberg_common.py +2 -2
- datahub/ingestion/source/ldap.py +1 -1
- datahub/ingestion/source/looker/looker_lib_wrapper.py +1 -1
- datahub/ingestion/source/looker/lookml_source.py +7 -1
- datahub/ingestion/source/mode.py +74 -28
- datahub/ingestion/source/neo4j/neo4j_source.py +85 -55
- datahub/ingestion/source/powerbi/config.py +1 -1
- datahub/ingestion/source/powerbi/rest_api_wrapper/data_resolver.py +2 -2
- datahub/ingestion/source/redshift/usage.py +10 -9
- datahub/ingestion/source/slack/slack.py +4 -52
- datahub/ingestion/source/snowflake/snowflake_connection.py +19 -1
- datahub/ingestion/source/sql/clickhouse.py +5 -1
- datahub/ingestion/source/sql/druid.py +7 -2
- datahub/ingestion/source/sql/oracle.py +6 -2
- datahub/ingestion/source/tableau/tableau_validation.py +1 -1
- datahub/ingestion/source/usage/clickhouse_usage.py +7 -3
- datahub/ingestion/source/usage/starburst_trino_usage.py +5 -3
- datahub/metadata/{_schema_classes.py → _internal_schema_classes.py} +490 -490
- datahub/metadata/_urns/urn_defs.py +1786 -1786
- datahub/metadata/schema.avsc +17364 -16988
- datahub/metadata/schema_classes.py +3 -3
- datahub/metadata/schemas/__init__.py +3 -3
- datahub/specific/dataset.py +12 -0
- datahub/testing/check_imports.py +1 -1
- datahub/utilities/logging_manager.py +8 -1
- datahub/utilities/sqlalchemy_query_combiner.py +4 -5
- datahub/utilities/urn_encoder.py +1 -1
- {acryl_datahub-1.0.0.3rc8.dist-info → acryl_datahub-1.0.0.3rc10.dist-info}/entry_points.txt +0 -0
- {acryl_datahub-1.0.0.3rc8.dist-info → acryl_datahub-1.0.0.3rc10.dist-info}/licenses/LICENSE +0 -0
- {acryl_datahub-1.0.0.3rc8.dist-info → acryl_datahub-1.0.0.3rc10.dist-info}/top_level.txt +0 -0
datahub/metadata/schema_classes.py
CHANGED

@@ -20,16 +20,16 @@ from datahub.utilities._custom_package_loader import get_custom_models_package
 _custom_package_path = get_custom_models_package()

 if TYPE_CHECKING or not _custom_package_path:
-    from ._schema_classes import *
+    from ._internal_schema_classes import *

     # Required explicitly because __all__ doesn't include _ prefixed names.
-    from ._schema_classes import __SCHEMA_TYPES
+    from ._internal_schema_classes import __SCHEMA_TYPES

     if IS_SPHINX_BUILD:
         # Set __module__ to the current module so that Sphinx will document the
         # classes as belonging to this module instead of the custom package.
         for _cls in list(globals().values()):
-            if hasattr(_cls, "__module__") and "datahub.metadata._schema_classes" in _cls.__module__:
+            if hasattr(_cls, "__module__") and "datahub.metadata._internal_schema_classes" in _cls.__module__:
                 _cls.__module__ = __name__
 else:
     _custom_package = importlib.import_module(_custom_package_path)
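The module rename is invisible to consumers: datahub.metadata.schema_classes remains the public facade and re-exports every generated class through the star import above. A minimal sketch of the intended import path (DatasetPropertiesClass is one of the generated classes; any other works the same way):

# Always import generated models through the public facade,
# never from _internal_schema_classes directly.
from datahub.metadata.schema_classes import DatasetPropertiesClass

props = DatasetPropertiesClass(description="An example dataset")
print(props.description)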
datahub/metadata/schemas/__init__.py
CHANGED

@@ -15,10 +15,10 @@ import pathlib
 def _load_schema(schema_name: str) -> str:
     return (pathlib.Path(__file__).parent / f"{schema_name}.avsc").read_text()

-def getMetadataChangeProposalSchema() -> str:
-    return _load_schema("MetadataChangeProposal")
-
 def getMetadataChangeEventSchema() -> str:
     return _load_schema("MetadataChangeEvent")

+def getMetadataChangeProposalSchema() -> str:
+    return _load_schema("MetadataChangeProposal")
+
 # fmt: on
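This hunk only reorders the two getters; both still return the raw .avsc text read from disk. A small usage sketch (the "name" key is standard for an Avro record schema):

import json

from datahub.metadata.schemas import getMetadataChangeProposalSchema

# The getter returns the Avro schema definition as a JSON string.
schema = json.loads(getMetadataChangeProposalSchema())
print(schema["name"])  # MetadataChangeProposal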
datahub/specific/dataset.py
CHANGED
@@ -292,3 +292,15 @@ class DatasetPatchBuilder(
             value=timestamp,
         )
         return self
+
+    def set_external_url(
+        self, external_url: Optional[str] = None
+    ) -> "DatasetPatchBuilder":
+        if external_url is not None:
+            self._add_patch(
+                DatasetProperties.ASPECT_NAME,
+                "add",
+                path=("externalUrl",),
+                value=external_url,
+            )
+        return self
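The new set_external_url method follows the builder's existing fluent pattern: it stages a patch on the dataset properties aspect and returns self for chaining. A usage sketch, assuming the standard patch-builder flow where build() yields the patch proposals to emit (the URN and URL are illustrative):

from datahub.specific.dataset import DatasetPatchBuilder

patch_builder = DatasetPatchBuilder(
    "urn:li:dataset:(urn:li:dataPlatform:hive,example.table,PROD)"
)
patch_builder.set_external_url("https://example.com/tables/example.table")

# In real usage, each proposal would be sent through a DataHub emitter.
for mcp in patch_builder.build():
    print(mcp)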
datahub/testing/check_imports.py
CHANGED
@@ -9,7 +9,7 @@ def ensure_no_indirect_model_imports(dirs: List[pathlib.Path]) -> None:
     # If our needs become more complex, we should move to a proper linter.
     denied_imports = {
         "src.": "datahub.*",
-        "datahub.metadata._schema_classes": "datahub.metadata.schema_classes",
+        "datahub.metadata._internal_schema_classes": "datahub.metadata.schema_classes",
         "datahub.metadata._urns": "datahub.metadata.urns",
     }
     ignored_files = {
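denied_imports maps a banned import prefix to the module callers should use instead, keeping the check in lockstep with the rename above. A standalone sketch of the same idea (scan_files and its message format are illustrative, not the module's actual implementation):

import pathlib
from typing import Dict, List

denied_imports: Dict[str, str] = {
    "datahub.metadata._internal_schema_classes": "datahub.metadata.schema_classes",
    "datahub.metadata._urns": "datahub.metadata.urns",
}

def scan_files(paths: List[pathlib.Path]) -> List[str]:
    errors = []
    for path in paths:
        content = path.read_text()
        for denied, replacement in denied_imports.items():
            if denied in content:
                errors.append(f"{path}: use {replacement} instead of {denied}")
    return errors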
datahub/utilities/logging_manager.py
CHANGED

@@ -161,6 +161,7 @@ class _LogBuffer:
         self._buffer: Deque[str] = collections.deque(maxlen=maxlen)

     def write(self, line: str) -> None:
+        # We do not expect `line` to have a trailing newline.
         if len(line) > IN_MEMORY_LOG_BUFFER_MAX_LINE_LENGTH:
             line = line[:IN_MEMORY_LOG_BUFFER_MAX_LINE_LENGTH] + "[truncated]"

@@ -188,7 +189,13 @@ class _BufferLogHandler(logging.Handler):
             message = self.format(record)
         except TypeError as e:
             message = f"Error formatting log message: {e}\nMessage: {record.msg}, Args: {record.args}"
-        self._storage.write(message)
+
+        # For exception stack traces, the message is split over multiple lines,
+        # but we store it as a single string. Because we truncate based on line
+        # length, it's better for us to split it into multiple lines so that we
+        # don't lose any information on deeper stack traces.
+        for line in message.split("\n"):
+            self._storage.write(line)


 def _remove_all_handlers(logger: logging.Logger) -> None:
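The motivation for the per-line split: write() truncates each stored line independently, so writing a multi-line stack trace as a single string would cut everything past the length limit, including the deepest frames. Splitting first means only individually over-long lines are truncated. A standalone sketch of the interaction (the constants are assumptions, not the module's actual values):

import collections
from typing import Deque

MAX_LINE_LENGTH = 2000  # assumed limit for illustration
buffer: Deque[str] = collections.deque(maxlen=1000)

def write(line: str) -> None:
    # Truncation applies per line, mirroring _LogBuffer.write.
    if len(line) > MAX_LINE_LENGTH:
        line = line[:MAX_LINE_LENGTH] + "[truncated]"
    buffer.append(line)

traceback_text = "Traceback (most recent call last):\n  ...\nValueError: boom"
for line in traceback_text.split("\n"):
    write(line)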
datahub/utilities/sqlalchemy_query_combiner.py
CHANGED

@@ -272,11 +272,10 @@ class SQLAlchemyQueryCombiner:
             self.report.uncombined_queries_issued += 1
             return _sa_execute_underlying_method(conn, query, *args, **kwargs)

-        with _sa_execute_method_patching_lock
-
-
-
-            yield self
+        with _sa_execute_method_patching_lock, unittest.mock.patch(
+            "sqlalchemy.engine.Connection.execute", _sa_execute_fake
+        ):
+            yield self

     def run(self, method: Callable[[], None]) -> None:
         """
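The rewrite folds the two context managers into one with statement; they are entered left to right and exited in reverse order, exactly as if nested. A self-contained sketch of the pattern, patching a stdlib function instead of sqlalchemy:

import json
import threading
import unittest.mock

_patch_lock = threading.Lock()

def _fake_dumps(obj, **kwargs):
    return "<patched>"

# The lock is acquired first, then the patch is applied; both are
# released in reverse order when the block exits.
with _patch_lock, unittest.mock.patch("json.dumps", _fake_dumps):
    assert json.dumps({"a": 1}) == "<patched>"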
datahub/utilities/urn_encoder.py
CHANGED
@@ -4,7 +4,7 @@ from typing import List
 # NOTE: Frontend relies on encoding these three characters. Specifically, we decode and encode schema fields for column level lineage.
 # If this changes, make appropriate changes to datahub-web-react/src/app/lineage/utils/columnLineageUtils.ts
 # We also rely on encoding these exact three characters when generating schemaField urns in our graphQL layer. Update SchemaFieldUtils if this changes.
-# Also see https://
+# Also see https://docs.datahub.com/docs/what/urn/#restrictions
 RESERVED_CHARS = {",", "(", ")", "␟"}
 RESERVED_CHARS_EXTENDED = RESERVED_CHARS.union({"%"})

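For context, these are the characters percent-encoded when they appear in urn parts. A hypothetical helper showing the effect (it mirrors the reserved set above but is not the module's actual API):

from urllib.parse import quote

RESERVED_CHARS = {",", "(", ")", "␟"}

def encode_reserved(value: str) -> str:
    # Percent-encode only the reserved characters, leaving everything else intact.
    return "".join(quote(c, safe="") if c in RESERVED_CHARS else c for c in value)

print(encode_reserved("orders(daily),v1"))  # orders%28daily%29%2Cv1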