acryl-datahub 1.1.0rc3__py3-none-any.whl → 1.1.0.1__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release: this version of acryl-datahub might be problematic.
- {acryl_datahub-1.1.0rc3.dist-info → acryl_datahub-1.1.0.1.dist-info}/METADATA +2532 -2530
- {acryl_datahub-1.1.0rc3.dist-info → acryl_datahub-1.1.0.1.dist-info}/RECORD +87 -70
- {acryl_datahub-1.1.0rc3.dist-info → acryl_datahub-1.1.0.1.dist-info}/WHEEL +1 -1
- datahub/_version.py +1 -1
- datahub/api/entities/dataset/dataset.py +9 -8
- datahub/api/entities/external/__init__.py +0 -0
- datahub/api/entities/external/external_entities.py +239 -0
- datahub/api/entities/external/external_tag.py +145 -0
- datahub/api/entities/external/restricted_text.py +247 -0
- datahub/api/entities/external/unity_catalog_external_entites.py +170 -0
- datahub/api/entities/structuredproperties/structuredproperties.py +2 -2
- datahub/cli/delete_cli.py +4 -4
- datahub/cli/ingest_cli.py +9 -1
- datahub/emitter/mce_builder.py +3 -1
- datahub/emitter/response_helper.py +86 -1
- datahub/emitter/rest_emitter.py +1 -1
- datahub/ingestion/graph/client.py +3 -3
- datahub/ingestion/source/apply/datahub_apply.py +4 -4
- datahub/ingestion/source/data_lake_common/data_lake_utils.py +22 -10
- datahub/ingestion/source/data_lake_common/object_store.py +644 -0
- datahub/ingestion/source/datahub/config.py +11 -0
- datahub/ingestion/source/datahub/datahub_database_reader.py +186 -33
- datahub/ingestion/source/datahub/datahub_source.py +1 -1
- datahub/ingestion/source/dbt/dbt_common.py +30 -11
- datahub/ingestion/source/gcs/gcs_source.py +22 -7
- datahub/ingestion/source/gcs/gcs_utils.py +36 -9
- datahub/ingestion/source/hex/query_fetcher.py +9 -3
- datahub/ingestion/source/openapi.py +12 -0
- datahub/ingestion/source/openapi_parser.py +56 -37
- datahub/ingestion/source/s3/source.py +65 -6
- datahub/ingestion/source/snowflake/snowflake_config.py +13 -0
- datahub/ingestion/source/snowflake/snowflake_queries.py +44 -21
- datahub/ingestion/source/snowflake/snowflake_query.py +0 -7
- datahub/ingestion/source/snowflake/snowflake_v2.py +17 -6
- datahub/ingestion/source/sql/athena.py +1 -0
- datahub/ingestion/source/sql/hive.py +2 -3
- datahub/ingestion/source/sql/sql_common.py +98 -34
- datahub/ingestion/source/sql/sql_types.py +5 -2
- datahub/ingestion/source/unity/config.py +5 -0
- datahub/ingestion/source/unity/proxy.py +117 -0
- datahub/ingestion/source/unity/source.py +167 -15
- datahub/ingestion/source/unity/tag_entities.py +295 -0
- datahub/metadata/_internal_schema_classes.py +667 -522
- datahub/metadata/_urns/urn_defs.py +1804 -1748
- datahub/metadata/com/linkedin/pegasus2avro/application/__init__.py +19 -0
- datahub/metadata/schema.avsc +17358 -17584
- datahub/metadata/schemas/ApplicationKey.avsc +31 -0
- datahub/metadata/schemas/ApplicationProperties.avsc +72 -0
- datahub/metadata/schemas/Applications.avsc +38 -0
- datahub/metadata/schemas/ChartKey.avsc +1 -0
- datahub/metadata/schemas/ContainerKey.avsc +1 -0
- datahub/metadata/schemas/DashboardKey.avsc +1 -0
- datahub/metadata/schemas/DataFlowKey.avsc +1 -0
- datahub/metadata/schemas/DataHubIngestionSourceKey.avsc +2 -1
- datahub/metadata/schemas/DataJobKey.avsc +1 -0
- datahub/metadata/schemas/DataProductKey.avsc +1 -0
- datahub/metadata/schemas/DataProductProperties.avsc +1 -1
- datahub/metadata/schemas/DatasetKey.avsc +1 -0
- datahub/metadata/schemas/ExecutionRequestInput.avsc +5 -0
- datahub/metadata/schemas/GlossaryTermKey.avsc +1 -0
- datahub/metadata/schemas/MLFeatureKey.avsc +1 -0
- datahub/metadata/schemas/MLFeatureTableKey.avsc +1 -0
- datahub/metadata/schemas/MLModelGroupKey.avsc +1 -0
- datahub/metadata/schemas/MLModelKey.avsc +1 -0
- datahub/metadata/schemas/MLPrimaryKeyKey.avsc +1 -0
- datahub/metadata/schemas/NotebookKey.avsc +1 -0
- datahub/metadata/schemas/__init__.py +3 -3
- datahub/sdk/__init__.py +6 -0
- datahub/sdk/_all_entities.py +11 -0
- datahub/sdk/_shared.py +118 -1
- datahub/sdk/chart.py +315 -0
- datahub/sdk/container.py +7 -0
- datahub/sdk/dashboard.py +432 -0
- datahub/sdk/dataflow.py +309 -0
- datahub/sdk/datajob.py +342 -0
- datahub/sdk/dataset.py +8 -2
- datahub/sdk/entity_client.py +90 -2
- datahub/sdk/lineage_client.py +681 -82
- datahub/sdk/main_client.py +27 -8
- datahub/sdk/mlmodel.py +101 -38
- datahub/sdk/mlmodelgroup.py +7 -0
- datahub/sql_parsing/sql_parsing_aggregator.py +1 -1
- datahub/testing/mce_helpers.py +421 -0
- datahub/testing/sdk_v2_helpers.py +18 -0
- {acryl_datahub-1.1.0rc3.dist-info → acryl_datahub-1.1.0.1.dist-info}/entry_points.txt +0 -0
- {acryl_datahub-1.1.0rc3.dist-info → acryl_datahub-1.1.0.1.dist-info}/licenses/LICENSE +0 -0
- {acryl_datahub-1.1.0rc3.dist-info → acryl_datahub-1.1.0.1.dist-info}/top_level.txt +0 -0
datahub/api/entities/external/unity_catalog_external_entites.py
ADDED
@@ -0,0 +1,170 @@
+# Import RestrictedText from your existing module
+# Uncomment and adjust the import path as needed:
+# from your_restricted_text_module import RestrictedText
+# The following is a list of tag constraints:
+# You can assign a maximum of 50 tags to a single securable object.
+# The maximum length of a tag key is 255 characters.
+# The maximum length of a tag value is 1000 characters.
+# The following characters are not allowed in tag keys:
+# . , - = / :
+# Tag search using the workspace search UI is supported only for tables, views, and table columns.
+# Tag search requires exact term matching.
+# https://learn.microsoft.com/en-us/azure/databricks/database-objects/tags#constraint
+from typing import Any, Dict, Optional, Set, Union
+
+from typing_extensions import ClassVar
+
+from datahub.api.entities.external.external_tag import ExternalTag
+from datahub.api.entities.external.restricted_text import RestrictedText
+
+
+class UnityCatalogTagKeyText(RestrictedText):
+    """RestrictedText configured for Unity Catalog tag keys."""
+
+    _default_max_length: ClassVar[int] = 255
+    # Unity Catalog tag keys: alphanumeric, hyphens, underscores, periods only
+    _default_replace_chars: ClassVar[Set[str]] = {
+        "\t",
+        "\n",
+        "\r",
+        ".",
+        ",",
+        "-",
+        "=",
+        "/",
+        ":",
+    }
+    _default_replacement_char: ClassVar[str] = "_"
+    _default_truncation_suffix: ClassVar[str] = ""  # No suffix for clean identifiers
+
+
+class UnityCatalogTagValueText(RestrictedText):
+    """RestrictedText configured for Unity Catalog tag values."""
+
+    _default_max_length: ClassVar[int] = 1000
+    # Unity Catalog tag values are more permissive but still have some restrictions
+    _default_replace_chars: ClassVar[Set[str]] = {"\t", "\n", "\r"}
+    _default_replacement_char: ClassVar[str] = " "
+    _default_truncation_suffix: ClassVar[str] = "..."
+
+
+class UnityCatalogTag(ExternalTag):
+    """
+    A tag type specifically designed for Unity Catalog tag restrictions.
+
+    Unity Catalog Tag Restrictions:
+    - Key: Max 127 characters, alphanumeric + hyphens, underscores, periods only
+    - Value: Max 256 characters, more permissive but no control characters
+    """
+
+    key: UnityCatalogTagKeyText
+    value: Optional[UnityCatalogTagValueText] = None
+
+    def __init__(
+        self,
+        key: Optional[Union[str, UnityCatalogTagKeyText]] = None,
+        value: Optional[Union[str, UnityCatalogTagValueText]] = None,
+        **data: Any,
+    ) -> None:
+        """
+        Initialize UnityCatalogTag from either a DataHub Tag URN or explicit key/value.
+
+        Args:
+            key: Explicit key value (optional for Pydantic initialization)
+            value: Explicit value (optional)
+            **data: Additional Pydantic data
+        """
+        if key is not None:
+            # Direct initialization with key/value
+            processed_key = (
+                UnityCatalogTagKeyText(key)
+                if not isinstance(key, UnityCatalogTagKeyText)
+                else key
+            )
+            processed_value = None
+            if value is not None:
+                processed_value = (
+                    UnityCatalogTagValueText(value)
+                    if not isinstance(value, UnityCatalogTagValueText)
+                    else value
+                )
+
+            super().__init__(
+                key=processed_key,
+                value=processed_value,
+                **data,
+            )
+        else:
+            # Standard pydantic initialization
+            super().__init__(**data)
+
+    def __eq__(self, other: object) -> bool:
+        """Check equality based on key and value."""
+        if not isinstance(other, UnityCatalogTag):
+            return False
+        return str(self.key) == str(other.key) and (
+            str(self.value) if self.value else None
+        ) == (str(other.value) if other.value else None)
+
+    def __hash__(self) -> int:
+        """Make UnityCatalogTag hashable based on key and value."""
+        return hash((str(self.key), str(self.value) if self.value else None))
+
+    @classmethod
+    def from_dict(cls, tag_dict: Dict[str, Any]) -> "UnityCatalogTag":
+        """
+        Create a UnityCatalogTag from a dictionary with 'key' and optional 'value'.
+
+        Args:
+            tag_dict: Dictionary with 'key' and optional 'value' keys
+
+        Returns:
+            UnityCatalogTag instance
+        """
+        return cls(key=tag_dict["key"], value=tag_dict.get("value"))
+
+    @classmethod
+    def from_key_value(cls, key: str, value: Optional[str] = None) -> "UnityCatalogTag":
+        """
+        Create a UnityCatalogTag from explicit key and value.
+
+        Overrides the parent method to return the correct type.
+
+        Args:
+            key: Tag key
+            value: Optional tag value
+
+        Returns:
+            UnityCatalogTag instance
+        """
+        return cls(key=key, value=value)
+
+    def to_dict(self) -> Dict[str, str]:
+        """
+        Convert to dictionary format suitable for Unity Catalog API.
+
+        Returns:
+            Dictionary with 'key' and optionally 'value'
+        """
+        result: Dict[str, str] = {"key": self.key.original}
+        if self.value is not None:
+            result["value"] = self.value.original
+        return result
+
+    def to_display_dict(self) -> Dict[str, str]:
+        """
+        Convert to dictionary format showing processed values.
+
+        Returns:
+            Dictionary with processed 'key' and optional 'value'
+        """
+        result: Dict[str, str] = {"key": str(self.key)}
+        if self.value is not None:
+            result["value"] = str(self.value)
+        return result
+
+    def __repr__(self) -> str:
+        if self.value:
+            return f"UnityCatalogTag(key={self.key!r}, value={self.value!r})"
+        else:
+            return f"UnityCatalogTag(key={self.key!r})"
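A minimal usage sketch (not part of the diff): the sanitized output shown in the comments is an assumption about how RestrictedText applies the replacement rules configured above.

# Hypothetical usage; import path taken from the new module above.
from datahub.api.entities.external.unity_catalog_external_entites import UnityCatalogTag

tag = UnityCatalogTag(key="cost-center/finance", value="quarterly\nbudget")
print(tag.to_dict())          # original key/value, as sent to the Unity Catalog API
print(tag.to_display_dict())  # sanitized values, e.g. key -> "cost_center_finance"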
datahub/api/entities/structuredproperties/structuredproperties.py
CHANGED
@@ -4,7 +4,7 @@ from pathlib import Path
 from typing import Iterable, List, Optional, Union
 
 import yaml
-from pydantic import validator
+from pydantic import StrictStr, validator
 from ruamel.yaml import YAML
 
 from datahub.configuration.common import ConfigModel
@@ -38,7 +38,7 @@ class AllowedTypes(Enum):
 
 
 class AllowedValue(ConfigModel):
-    value: Union[
+    value: Union[StrictStr, float]
     description: Optional[str] = None
 
 
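The move to StrictStr in AllowedValue matters because pydantic unions otherwise coerce values between types; a standalone sketch with plain pydantic (illustrative model name, not DataHub code) of the intended behaviour:

from typing import Optional, Union
from pydantic import BaseModel, StrictStr

class AllowedValueSketch(BaseModel):
    # Mirrors the changed field: strings are kept as-is, everything else must be a float.
    value: Union[StrictStr, float]
    description: Optional[str] = None

print(AllowedValueSketch(value="42").value)  # stays the string "42"
print(AllowedValueSketch(value=42).value)    # not a str, so it is validated as 42.0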
datahub/cli/delete_cli.py
CHANGED
@@ -231,7 +231,7 @@ def references(urn: str, dry_run: bool, force: bool) -> None:
     default=3000,
     type=int,
     help="Batch size when querying for entities to un-soft delete."
-    "Maximum
+    "Maximum 5000. Large batch sizes may cause timeouts.",
 )
 def undo_by_filter(
     urn: Optional[str], platform: Optional[str], batch_size: int
@@ -336,7 +336,7 @@ def undo_by_filter(
     default=3000,
     type=int,
     help="Batch size when querying for entities to delete."
-    "Maximum
+    "Maximum 5000. Large batch sizes may cause timeouts.",
 )
 @click.option(
     "-n",
@@ -654,8 +654,8 @@ def _validate_user_aspect_flags(
 def _validate_batch_size(batch_size: int) -> None:
     if batch_size <= 0:
         raise click.UsageError("Batch size must be a positive integer.")
-    elif batch_size >
-        raise click.UsageError("Batch size cannot exceed
+    elif batch_size > 5000:
+        raise click.UsageError("Batch size cannot exceed 5,000.")
 
 
 def _delete_one_urn(
datahub/cli/ingest_cli.py
CHANGED
@@ -388,7 +388,10 @@ def mcps(path: str) -> None:
 @upgrade.check_upgrade
 @telemetry.with_telemetry()
 def list_source_runs(page_offset: int, page_size: int, urn: str, source: str) -> None:
-    """
+    """
+    List ingestion source runs with their details, optionally filtered by URN or source.
+    Required the Manage Metadata Ingestion permission.
+    """
 
     query = """
     query listIngestionRuns($input: ListIngestionSourcesInput!) {
@@ -446,6 +449,11 @@ def list_source_runs(page_offset: int, page_size: int, urn: str, source: str) -> None:
     if not data:
         click.echo("No response received from the server.")
         return
+    if "errors" in data:
+        click.echo("Errors in response:")
+        for error in data["errors"]:
+            click.echo(f"- {error.get('message', 'Unknown error')}")
+        return
 
     # a lot of responses can be null if there's errors in the run
     ingestion_sources = (
datahub/emitter/mce_builder.py
CHANGED
@@ -59,6 +59,7 @@ from datahub.metadata.urns import (
     DataJobUrn,
     DataPlatformUrn,
     DatasetUrn,
+    OwnershipTypeUrn,
     TagUrn,
 )
 from datahub.utilities.urn_encoder import UrnEncoder
@@ -406,7 +407,8 @@ def make_ml_model_group_urn(platform: str, group_name: str, env: str) -> str:
 
 def validate_ownership_type(ownership_type: str) -> Tuple[str, Optional[str]]:
     if ownership_type.startswith("urn:li:"):
-
+        ownership_type_urn = OwnershipTypeUrn.from_string(ownership_type)
+        return OwnershipTypeClass.CUSTOM, ownership_type_urn.urn()
     ownership_type = ownership_type.upper()
     if ownership_type in get_enum_options(OwnershipTypeClass):
         return ownership_type, None
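A short sketch (not part of the diff) of what the new branch is expected to return; the example URN is an assumption about a valid ownershipType URN:

from datahub.emitter.mce_builder import validate_ownership_type

print(validate_ownership_type("TECHNICAL_OWNER"))
# expected: ("TECHNICAL_OWNER", None)
print(validate_ownership_type("urn:li:ownershipType:__system__technical_owner"))
# expected: ("CUSTOM", "urn:li:ownershipType:__system__technical_owner")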
datahub/emitter/response_helper.py
CHANGED
@@ -1,7 +1,9 @@
 import json
 import logging
+import re
 import warnings
 from dataclasses import dataclass
+from datetime import datetime, timezone
 from typing import Dict, List, Optional, Sequence, Union
 
 from requests import Response
@@ -22,12 +24,95 @@ class TraceData:
     trace_id: str
     data: Dict[str, List[str]]
 
+    @staticmethod
+    def extract_trace_id(input_str: Optional[str]) -> Optional[str]:
+        """
+        Extract the trace ID from various input formats.
+
+        Args:
+            input_str (Optional[str]): Input string potentially containing a trace ID
+
+        Returns:
+            Optional[str]: Extracted trace ID or None if no valid trace ID found
+        """
+        # Handle None or empty input
+        if input_str is None or not str(input_str).strip():
+            return None
+
+        # Convert to string and clean
+        input_str = str(input_str).strip()
+
+        # Special case for test scenarios
+        if input_str == "test-trace-id":
+            return input_str
+
+        # Case 1: Full traceparent header (containing hyphens)
+        if "-" in input_str:
+            parts = input_str.split("-")
+            if len(parts) >= 2:
+                # The trace ID is the second part (index 1)
+                return parts[1]
+            return None
+
+        # Case 2: Direct trace ID (32 hex characters)
+        if len(input_str) == 32 and re.match(r"^[0-9a-fA-F]+$", input_str):
+            return input_str
+
+        # Fallback: return the original input if it doesn't match strict criteria
+        return input_str
+
     def __post_init__(self) -> None:
-
+        """
+        Validate and potentially process the trace_id during initialization.
+        """
+        # Explicitly check for None or empty string
+        if self.trace_id is None or self.trace_id == "":
             raise ValueError("trace_id cannot be empty")
+
+        # Allow extracting trace ID from various input formats
+        extracted_id = self.extract_trace_id(self.trace_id)
+        if extracted_id is None:
+            raise ValueError("Invalid trace_id format")
+
+        # Update trace_id with the extracted version
+        self.trace_id = extracted_id
+
+        # Validate data
         if not isinstance(self.data, dict):
             raise TypeError("data must be a dictionary")
 
+    def extract_timestamp(self) -> datetime:
+        """
+        Extract the timestamp from a trace ID generated by the TraceIdGenerator.
+
+        Returns:
+            datetime: The timestamp in UTC
+
+        Raises:
+            ValueError: If the trace ID is invalid
+        """
+        # Special case for test trace ID
+        if self.trace_id == "test-trace-id":
+            return datetime.fromtimestamp(0, tz=timezone.utc)
+
+        # Validate trace ID length for hex-based trace IDs
+        if len(self.trace_id) < 16 or not re.match(
+            r"^[0-9a-fA-F]+$", self.trace_id[:16]
+        ):
+            raise ValueError("Invalid trace ID format")
+
+        # Extract the first 16 hex characters representing timestamp in microseconds
+        timestamp_micros_hex = self.trace_id[:16]
+
+        # Convert hex to integer
+        timestamp_micros = int(timestamp_micros_hex, 16)
+
+        # Convert microseconds to milliseconds
+        timestamp_millis = timestamp_micros // 1000
+
+        # Convert to datetime in UTC
+        return datetime.fromtimestamp(timestamp_millis / 1000, tz=timezone.utc)
+
 
 def _extract_trace_id(response: Response) -> Optional[str]:
     """
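The new extract_timestamp relies on the first 16 hex characters of a trace ID encoding microseconds since the epoch; a standalone sketch of that arithmetic with an illustrative, made-up trace ID:

from datetime import datetime, timezone

# Encode 2024-01-01T00:00:00 UTC in microseconds as the first 16 hex chars,
# then pad to a 32-character trace ID, mirroring TraceData.extract_timestamp.
micros = 1_704_067_200_000_000
trace_id = f"{micros:016x}" + "0" * 16

decoded_millis = int(trace_id[:16], 16) // 1000
print(datetime.fromtimestamp(decoded_millis / 1000, tz=timezone.utc))
# 2024-01-01 00:00:00+00:00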
datahub/emitter/rest_emitter.py
CHANGED
@@ -852,7 +852,7 @@ class DataHubRestEmitter(Closeable, Emitter):
         for aspect_name, aspect_status in aspects.items():
             if not aspect_status["success"]:
                 error_msg = (
-                    f"Unable to validate async write to DataHub GMS: "
+                    f"Unable to validate async write {trace.trace_id} ({trace.extract_timestamp()}) to DataHub GMS: "
                     f"Persistence failure for URN '{urn}' aspect '{aspect_name}'. "
                     f"Status: {aspect_status}"
                 )
datahub/ingestion/graph/client.py
CHANGED
@@ -806,7 +806,7 @@ class DataHubGraph(DatahubRestEmitter, EntityVersioningAPI):
             "input": search_query,
             "entity": "container",
             "start": 0,
-            "count":
+            "count": 5000,
             "filter": {"or": container_filters},
         }
         results: Dict = self._post_generic(url, search_body)
@@ -901,7 +901,7 @@ class DataHubGraph(DatahubRestEmitter, EntityVersioningAPI):
         query: Optional[str] = None,
         container: Optional[str] = None,
         status: Optional[RemovedStatusFilter] = RemovedStatusFilter.NOT_SOFT_DELETED,
-        batch_size: int =
+        batch_size: int = 5000,
         extraFilters: Optional[List[RawSearchFilterRule]] = None,
         extra_or_filters: Optional[RawSearchFilter] = None,
     ) -> Iterable[str]:
@@ -993,7 +993,7 @@ class DataHubGraph(DatahubRestEmitter, EntityVersioningAPI):
         query: Optional[str] = None,
         container: Optional[str] = None,
         status: RemovedStatusFilter = RemovedStatusFilter.NOT_SOFT_DELETED,
-        batch_size: int =
+        batch_size: int = 5000,
         extra_and_filters: Optional[List[RawSearchFilterRule]] = None,
         extra_or_filters: Optional[RawSearchFilter] = None,
         extra_source_fields: Optional[List[str]] = None,
datahub/ingestion/source/apply/datahub_apply.py
CHANGED
@@ -96,7 +96,7 @@ def apply_association_to_container(
 class DomainApplyConfig(ConfigModel):
     assets: List[str] = Field(
         default_factory=list,
-        description="List of assets to apply domain
+        description="List of assets to apply domain hierarchically. Currently only containers and datasets are supported",
     )
     domain_urn: str = Field(default="")
 
@@ -104,7 +104,7 @@ class DomainApplyConfig(ConfigModel):
 class TagApplyConfig(ConfigModel):
     assets: List[str] = Field(
         default_factory=list,
-        description="List of assets to apply tag
+        description="List of assets to apply tag hierarchically. Currently only containers and datasets are supported",
     )
     tag_urn: str = Field(default="")
 
@@ -112,7 +112,7 @@ class TagApplyConfig(ConfigModel):
 class TermApplyConfig(ConfigModel):
     assets: List[str] = Field(
         default_factory=list,
-        description="List of assets to apply term
+        description="List of assets to apply term hierarchically. Currently only containers and datasets are supported",
     )
     term_urn: str = Field(default="")
 
@@ -120,7 +120,7 @@ class TermApplyConfig(ConfigModel):
 class OwnerApplyConfig(ConfigModel):
     assets: List[str] = Field(
         default_factory=list,
-        description="List of assets to apply owner
+        description="List of assets to apply owner hierarchically. Currently only containers and datasets are supported",
     )
     owner_urn: str = Field(default="")
 
datahub/ingestion/source/data_lake_common/data_lake_utils.py
CHANGED
@@ -11,20 +11,21 @@ from datahub.emitter.mcp_builder import (
 )
 from datahub.ingestion.api.workunit import MetadataWorkUnit
 from datahub.ingestion.source.aws.s3_util import (
-    get_bucket_name,
     get_bucket_relative_path,
     get_s3_prefix,
     is_s3_uri,
 )
 from datahub.ingestion.source.azure.abs_utils import (
     get_abs_prefix,
-    get_container_name,
     get_container_relative_path,
     is_abs_uri,
 )
 from datahub.ingestion.source.common.subtypes import DatasetContainerSubTypes
+from datahub.ingestion.source.data_lake_common.object_store import (
+    get_object_store_bucket_name,
+    get_object_store_for_uri,
+)
 from datahub.ingestion.source.gcs.gcs_utils import (
-    get_gcs_bucket_name,
     get_gcs_prefix,
     is_gcs_uri,
 )
@@ -87,6 +88,13 @@ class ContainerWUCreator:
 
     @staticmethod
     def get_protocol(path: str) -> str:
+        object_store = get_object_store_for_uri(path)
+        if object_store:
+            prefix = object_store.get_prefix(path)
+            if prefix:
+                return prefix
+
+        # Legacy fallback
         protocol: Optional[str] = None
         if is_s3_uri(path):
             protocol = get_s3_prefix(path)
@@ -104,13 +112,12 @@ class ContainerWUCreator:
 
     @staticmethod
     def get_bucket_name(path: str) -> str:
-
-
-
-
-
-
-        raise ValueError(f"Unable to get bucket name from path: {path}")
+        """
+        Get the bucket/container name from any supported object store URI.
+
+        Delegates to the abstract get_object_store_bucket_name function.
+        """
+        return get_object_store_bucket_name(path)
 
     def get_sub_types(self) -> str:
         if self.platform == PLATFORM_S3:
@@ -122,6 +129,11 @@ class ContainerWUCreator:
         raise ValueError(f"Unable to sub type for platform: {self.platform}")
 
     def get_base_full_path(self, path: str) -> str:
+        object_store = get_object_store_for_uri(path)
+        if object_store:
+            return object_store.get_object_key(path)
+
+        # Legacy fallback
         if self.platform == "s3" or self.platform == "gcs":
             return get_bucket_relative_path(path)
         elif self.platform == "abs":