castor-extractor 0.17.0__py3-none-any.whl → 0.17.3__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release: this version of castor-extractor might be problematic.
- CHANGELOG.md +12 -0
- castor_extractor/uploader/upload.py +1 -1
- castor_extractor/utils/client/api.py +7 -2
- castor_extractor/warehouse/databricks/__init__.py +1 -1
- castor_extractor/warehouse/databricks/client.py +110 -5
- castor_extractor/warehouse/databricks/credentials.py +9 -10
- castor_extractor/warehouse/databricks/extract.py +2 -2
- castor_extractor/warehouse/databricks/format.py +54 -9
- castor_extractor/warehouse/databricks/format_test.py +77 -18
- castor_extractor/warehouse/databricks/utils.py +27 -0
- castor_extractor/warehouse/databricks/utils_test.py +25 -0
- {castor_extractor-0.17.0.dist-info → castor_extractor-0.17.3.dist-info}/METADATA +6 -1
- {castor_extractor-0.17.0.dist-info → castor_extractor-0.17.3.dist-info}/RECORD +16 -14
- {castor_extractor-0.17.0.dist-info → castor_extractor-0.17.3.dist-info}/LICENCE +0 -0
- {castor_extractor-0.17.0.dist-info → castor_extractor-0.17.3.dist-info}/WHEEL +0 -0
- {castor_extractor-0.17.0.dist-info → castor_extractor-0.17.3.dist-info}/entry_points.txt +0 -0
CHANGELOG.md
CHANGED

@@ -1,5 +1,17 @@
 # Changelog
 
+## 0.17.3 - 2024-06-24
+
+* Databricks: extract tags for tables and column
+
+## 0.17.2 - 2024-06-14
+
+* Uploader: support multipart
+
+## 0.17.1 - 2024-06-12
+
+* Databricks: extract table source links
+
 ## 0.17.0 - 2024-06-10
 
 * Uploader: redirect to the proxy, replace credentials with token
castor_extractor/utils/client/api.py
CHANGED

@@ -58,7 +58,12 @@ class APIClient:
 
         return result.json()
 
-    def get(self, path: str, payload: Optional[dict] = None) -> dict:
+    def get(
+        self,
+        path: str,
+        payload: Optional[dict] = None,
+        processor: Optional[Callable] = None,
+    ) -> dict:
         """path: REST API operation path, such as /api/2.0/clusters/get"""
         url = self.build_url(self._host, path)
-        return self._call(url=url, data=payload)
+        return self._call(url=url, data=payload, processor=processor)
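The new optional `processor` argument lets callers reshape the raw HTTP response before `get` returns, instead of always receiving plain JSON. A minimal sketch of the calling convention, assuming `_call` (not shown in this diff) simply hands the `requests.Response` to the processor; the helper name and the commented usage are illustrative only:

```python
from typing import Tuple

import requests


def json_and_workspace_id(response: requests.Response) -> Tuple[dict, str]:
    # Mirrors _process_table_response in the Databricks client below:
    # return the JSON body plus a value read from the response headers.
    return response.json(), response.headers["X-Databricks-Org-Id"]


# Hypothetical usage, assuming `client` is an APIClient instance:
# content, workspace_id = client.get(
#     path="api/2.1/unity-catalog/tables",
#     payload={"catalog_name": "foo", "schema_name": "bar"},
#     processor=json_and_workspace_id,
# )
```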
castor_extractor/warehouse/databricks/client.py
CHANGED

@@ -1,10 +1,14 @@
 import logging
+from collections import defaultdict
 from concurrent.futures import ThreadPoolExecutor
 from datetime import date
+from enum import Enum
 from functools import partial
 from typing import Any, Dict, List, Optional, Set, Tuple, cast
 
 import requests
+from databricks import sql  # type: ignore
+from requests import Response
 
 from ...utils import (
     SafeMode,

@@ -18,8 +22,9 @@ from ...utils.client.api import APIClient
 from ...utils.pager import PagerOnToken
 from ..abstract.time_filter import TimeFilter
 from .credentials import DatabricksCredentials
-from .format import DatabricksFormatter
+from .format import DatabricksFormatter, TagMapping
 from .types import Link, Ostr, OTimestampedLink, TablesColumns, TimestampedLink
+from .utils import build_path, tag_label
 
 logger = logging.getLogger(__name__)
 

@@ -30,10 +35,20 @@ _RETRY_BASE_MS = 1000
 _RETRY_EXCEPTIONS = [
     requests.exceptions.ConnectTimeout,
 ]
+_WORKSPACE_ID_HEADER = "X-Databricks-Org-Id"
+
+_INFORMATION_SCHEMA_SQL = "SELECT * FROM system.information_schema"
 
 safe_params = SafeMode((BaseException,), _MAX_NUMBER_OF_LINEAGE_ERRORS)
 
 
+class TagEntity(Enum):
+    """Entities that can be tagged in Databricks"""
+
+    COLUMN = "COLUMN"
+    TABLE = "TABLE"
+
+
 def _day_to_epoch_ms(day: date) -> int:
     return int(at_midnight(day).timestamp() * 1000)
 

@@ -74,12 +89,38 @@ class DatabricksClient(APIClient):
         credentials: DatabricksCredentials,
         db_allowed: Optional[Set[str]] = None,
         db_blocked: Optional[Set[str]] = None,
+        has_table_tags: bool = False,
+        has_column_tags: bool = False,
     ):
         super().__init__(host=credentials.host, token=credentials.token)
+        self._http_path = credentials.http_path
         self._db_allowed = db_allowed
         self._db_blocked = db_blocked
+        self._has_table_tags = has_table_tags
+        self._has_column_tags = has_column_tags
         self.formatter = DatabricksFormatter()
 
+    def execute_sql(
+        self,
+        query: str,
+        params: Optional[dict] = None,
+    ):
+        """
+        Execute a SQL query on Databricks system tables and return the results.
+        https://docs.databricks.com/en/dev-tools/python-sql-connector.html
+
+        /!\ credentials.http_path is required in order to run SQL queries
+        """
+        assert self._http_path, "HTTP_PATH is required to run SQL queries"
+        with sql.connect(
+            server_hostname=self._host,
+            http_path=self._http_path,
+            access_token=self._token,
+        ) as connection:
+            with connection.cursor() as cursor:
+                cursor.execute(query, params)
+                return cursor.fetchall()
+
     @staticmethod
     def name() -> str:
         return "Databricks"
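The new `execute_sql` method runs queries against Databricks system tables through the databricks-sql-connector package (hence the new `databricks` extra and the `http_path` credential). A standalone sketch of the same connector flow, with placeholder connection values:

```python
from databricks import sql  # provided by databricks-sql-connector

# Placeholder values; in the client these come from DatabricksCredentials.
with sql.connect(
    server_hostname="dbc-example.cloud.databricks.com",
    http_path="/sql/1.0/warehouses/abc123",  # required to run SQL queries
    access_token="dapi-...",
) as connection:
    with connection.cursor() as cursor:
        cursor.execute("SELECT * FROM system.information_schema.table_tags")
        rows = cursor.fetchall()  # list of Row objects
```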
@@ -120,15 +161,38 @@ class DatabricksClient(APIClient):
             for schema in self._schemas_of_database(database)
         ]
 
-    def _tables_columns_of_schema(self, schema: dict) -> TablesColumns:
+    @staticmethod
+    def _process_table_response(response: Response) -> Tuple[dict, str]:
+        """
+        Returns both the JSON content and the Workspace ID, which is found
+        in the response's headers.
+        """
+        return response.json(), response.headers[_WORKSPACE_ID_HEADER]
+
+    def _tables_columns_of_schema(
+        self,
+        schema: dict,
+        table_tags: TagMapping,
+        column_tags: TagMapping,
+    ) -> TablesColumns:
         path = "api/2.1/unity-catalog/tables"
         payload = {
             "catalog_name": schema["database_id"],
             "schema_name": schema["schema_name"],
         }
-        content = self.get(path=path, payload=payload)
+        content, workspace_id = self.get(
+            path=path,
+            payload=payload,
+            processor=self._process_table_response,
+        )
+        host = self.build_url(self._host, path="")
         return self.formatter.format_table_column(
-            content.get("tables", []),
+            raw_tables=content.get("tables", []),
+            schema=schema,
+            host=host,
+            workspace_id=workspace_id,
+            table_tags=table_tags,
+            column_tags=column_tags,
         )
 
     @staticmethod
@@ -141,6 +205,40 @@ class DatabricksClient(APIClient):
             return table
         return {**table, "owner_external_id": owner_external_id}
 
+    def _needs_extraction(self, entity: TagEntity) -> bool:
+        if entity == TagEntity.TABLE:
+            return self._has_table_tags
+        if entity == TagEntity.COLUMN:
+            return self._has_column_tags
+        raise AssertionError(f"Entity not supported: {entity}")
+
+    def _get_tags_mapping(self, entity: TagEntity) -> TagMapping:
+        """
+        Fetch tags of the given entity and build a mapping:
+        { path: list[tags] }
+
+        https://docs.databricks.com/en/sql/language-manual/information-schema/table_tags.html
+        https://docs.databricks.com/en/sql/language-manual/information-schema/column_tags.html
+        """
+        if not self._needs_extraction(entity):
+            # extracting tags require additional credentials (http_path)
+            return dict()
+
+        table = f"{entity.value.lower()}_tags"
+        query = f"{_INFORMATION_SCHEMA_SQL}.{table}"
+        result = self.execute_sql(query)
+        mapping = defaultdict(list)
+        for row in result:
+            dict_row = row.asDict()
+            keys = ["catalog_name", "schema_name", "table_name"]
+            if entity == TagEntity.COLUMN:
+                keys.append("column_name")
+            path = build_path(dict_row, keys)
+            label = tag_label(dict_row)
+            mapping[path].append(label)
+
+        return mapping
+
     @staticmethod
     def _get_user_mapping(users: List[dict]) -> dict:
         return {
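`_get_tags_mapping` folds one label per tag row into a dotted asset path, producing the `TagMapping` (`{path: [labels]}`) consumed by the formatter. A sketch of that grouping with made-up rows; plain dicts stand in for the connector's `Row` objects, which the client converts with `row.asDict()`:

```python
from collections import defaultdict

# Made-up rows shaped like system.information_schema.table_tags.
rows = [
    {"catalog_name": "foo", "schema_name": "bar", "table_name": "baz",
     "tag_name": "pii", "tag_value": ""},
    {"catalog_name": "foo", "schema_name": "bar", "table_name": "baz",
     "tag_name": "tier", "tag_value": "gold"},
]

mapping = defaultdict(list)
for row in rows:
    path = ".".join(row[k] for k in ("catalog_name", "schema_name", "table_name"))
    # tag_label: bare name when the value is empty, "name:value" otherwise.
    label = row["tag_name"] if not row["tag_value"] else f"{row['tag_name']}:{row['tag_value']}"
    mapping[path].append(label)

assert mapping == {"foo.bar.baz": ["pii", "tier:gold"]}
```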
@@ -157,8 +255,15 @@ class DatabricksClient(APIClient):
         tables: List[dict] = []
         columns: List[dict] = []
         user_mapping = self._get_user_mapping(users)
+        table_tags = self._get_tags_mapping(TagEntity.TABLE)
+        column_tags = self._get_tags_mapping(TagEntity.COLUMN)
         for schema in schemas:
-            t_to_add, c_to_add = self._tables_columns_of_schema(schema)
+
+            t_to_add, c_to_add = self._tables_columns_of_schema(
+                schema=schema,
+                table_tags=table_tags,
+                column_tags=column_tags,
+            )
             t_with_owner = [
                 self._match_table_with_user(table, user_mapping)
                 for table in t_to_add
castor_extractor/warehouse/databricks/credentials.py
CHANGED

@@ -1,11 +1,10 @@
 from dataclasses import field
+from typing import Optional
 
 from pydantic.dataclasses import dataclass
+from pydantic_settings import SettingsConfigDict
 
-
-
-_HOST = "CASTOR_DATABRICKS_HOST"
-_TOKEN = "CASTOR_DATABRICKS_TOKEN"  # noqa: S105
+DATABRICKS_ENV_PREFIX = "CASTOR_DATABRICKS_"
 
 
 @dataclass

@@ -19,10 +18,10 @@ class DatabricksCredentials:
 
     host: str
     token: str = field(metadata={"sensitive": True})
+    http_path: Optional[str] = field(default=None)
 
-
-
-
-
-        return DatabricksCredentials(host=host, token=token)
+    model_config = SettingsConfigDict(
+        env_prefix=DATABRICKS_ENV_PREFIX,
+        extra="ignore",
+        populate_by_name=True,
+    )
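With `env_prefix` set to `CASTOR_DATABRICKS_`, the credential fields map onto prefixed environment variables; the removed `_HOST`/`_TOKEN` constants confirm that naming for host and token. A sketch with placeholder values, assuming the settings are populated from the environment:

```python
import os

# Placeholder values only.
os.environ["CASTOR_DATABRICKS_HOST"] = "dbc-example.cloud.databricks.com"
os.environ["CASTOR_DATABRICKS_TOKEN"] = "dapi-..."
# Optional field, but needed for tag extraction via execute_sql:
os.environ["CASTOR_DATABRICKS_HTTP_PATH"] = "/sql/1.0/warehouses/abc123"
```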
castor_extractor/warehouse/databricks/extract.py
CHANGED

@@ -15,7 +15,7 @@ from ..abstract import (
     common_args,
 )
 from .client import DatabricksClient
-from .credentials import
+from .credentials import DatabricksCredentials
 
 DATABRICKS_ASSETS: SupportedAssets = {
     WarehouseAssetGroup.ADDITIONAL_LINEAGE: ADDITIONAL_LINEAGE_ASSETS,

@@ -170,7 +170,7 @@ def extract_all(**kwargs) -> None:
     output_directory, skip_existing = common_args(kwargs)
 
     client = DatabricksClient(
-        credentials=
+        credentials=DatabricksCredentials(**kwargs),
         db_allowed=kwargs.get("db_allowed"),
         db_blocked=kwargs.get("db_blocked"),
     )
castor_extractor/warehouse/databricks/format.py
CHANGED

@@ -1,14 +1,19 @@
 import logging
 from datetime import datetime
-from typing import List, Optional
+from typing import Dict, List, Optional
 
 from .types import TablesColumns
+from .utils import build_path
 
 logger = logging.getLogger(__name__)
 
 EXCLUDED_DATABASES = {"system"}
 EXCLUDED_SCHEMAS = {"information_schema", "default"}
 
+TABLE_URL_TPL = "{host}explore/data/{catalog_name}/{schema_name}/{table_name}?o={workspace_id}"
+
+TagMapping = Dict[str, List[str]]
+
 
 def _to_datetime_or_none(time_ms: Optional[int]) -> Optional[datetime]:
     """return time in ms as datetime or None"""
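`TABLE_URL_TPL` assembles the table source link from the workspace host and the workspace ID returned in the API response headers. A quick check of the template, reusing the placeholder values from `format_test.py` below:

```python
TABLE_URL_TPL = "{host}explore/data/{catalog_name}/{schema_name}/{table_name}?o={workspace_id}"

url = TABLE_URL_TPL.format(
    host="https://some.cloud.databricks.net/",  # host already ends with "/"
    catalog_name="foo",
    schema_name="bar",
    table_name="baz",
    workspace_id="123456",
)
assert url == "https://some.cloud.databricks.net/explore/data/foo/bar/baz?o=123456"
```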
@@ -17,26 +22,61 @@ def _to_datetime_or_none(time_ms: Optional[int]) -> Optional[datetime]:
     return datetime.fromtimestamp(time_ms / 1000.0)
 
 
-def _table_payload(schema: dict, table: dict) -> dict:
+def _table_payload(
+    schema: dict,
+    table: dict,
+    host: str,
+    workspace_id: str,
+    tags: TagMapping,
+) -> dict:
+    """
+    Prepares the table payload. This also includes a source link which is built
+    here using the host and workspace_id.
+    """
+    url = TABLE_URL_TPL.format(
+        host=host,
+        catalog_name=table["catalog_name"],
+        schema_name=table["schema_name"],
+        table_name=table["name"],
+        workspace_id=workspace_id,
+    )
+
+    keys = ["catalog_name", "schema_name", "name"]
+    path = build_path(table, keys)
+
     return {
         "description": table.get("comment"),
         "id": table["table_id"],
         "owner_email": table.get("owner"),
         "schema_id": f"{schema['id']}",
         "table_name": table["name"],
-        "tags": [],
+        "tags": tags.get(path, []),
         "type": table.get("table_type"),
+        "url": url,
     }
 
 
-def _column_payload(table: dict, column: dict) -> dict:
+def _column_path(table: dict, column: dict) -> str:
+    keys = ["catalog_name", "schema_name", "name"]
+    table_path = build_path(table, keys)
+    column_name = column["name"]
+    return f"{table_path}.{column_name}"
+
+
+def _column_payload(
+    table: dict,
+    column: dict,
+    tags: TagMapping,
+) -> dict:
+    path = _column_path(table, column)
     return {
         "column_name": column["name"],
         "data_type": column["type_name"],
         "description": column.get("comment"),
-        "id": f"`{table['
+        "id": f"`{table['table_id']}`.`{column['name']}`",
         "ordinal_position": column["position"],
-        "table_id": table["
+        "table_id": table["table_id"],
+        "tags": tags.get(path, []),
     }
 
@@ -78,19 +118,24 @@ class DatabricksFormatter:
 
     @staticmethod
     def format_table_column(
-        raw_tables: List[dict],
+        raw_tables: List[dict],
+        schema: dict,
+        host: str,
+        workspace_id: str,
+        table_tags: TagMapping,
+        column_tags: TagMapping,
     ) -> TablesColumns:
         tables = []
         columns = []
         if not raw_tables:
             return [], []
         for table in raw_tables:
-            t = _table_payload(schema, table)
+            t = _table_payload(schema, table, host, workspace_id, table_tags)
             tables.append(t)
             if not table.get("columns"):
                 continue
             for column in table["columns"]:
-                c = _column_payload(table, column)
+                c = _column_payload(table, column, column_tags)
                 columns.append(c)
 
         return tables, columns
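End to end, `format_table_column` now threads the host, workspace ID and both tag mappings down to the per-table and per-column payloads. A hedged sketch with minimal made-up inputs (real ones come from the Unity Catalog tables endpoint):

```python
from castor_extractor.warehouse.databricks.format import DatabricksFormatter

raw_tables = [{
    "catalog_name": "foo",
    "schema_name": "bar",
    "name": "baz",
    "table_id": "t-1",
    "columns": [{"name": "Uid", "type_name": "STRING", "position": 0}],
}]

tables, columns = DatabricksFormatter.format_table_column(
    raw_tables=raw_tables,
    schema={"id": "id123", "database_id": "foo", "schema_name": "bar"},
    host="https://some.cloud.databricks.net/",
    workspace_id="123456",
    table_tags={"foo.bar.baz": ["tier:gold"]},  # keyed by dotted path
    column_tags={},
)
assert tables[0]["tags"] == ["tier:gold"] and len(columns) == 1
```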
castor_extractor/warehouse/databricks/format_test.py
CHANGED

@@ -1,6 +1,12 @@
 from datetime import datetime
 
-from .format import
+from .format import (
+    DatabricksFormatter,
+    _column_path,
+    _column_payload,
+    _table_payload,
+    _to_datetime_or_none,
+)
 
 
 def test__to_datetime_or_none():

@@ -23,42 +29,95 @@ def test_DatabricksFormatter__primary():
     assert DatabricksFormatter._primary([]) is None
 
 
+def test__table_payload():
+    schema = {"id": "id123"}
+
+    table = {
+        "name": "baz",
+        "catalog_name": "foo",
+        "schema_name": "bar",
+        "table_type": "MANAGED",
+        "owner": "pot@ato.com",
+        "table_id": "732pot5e-8ato-4c27-b701-9fa51febc192",
+    }
+    host = "https://some.cloud.databricks.net/"
+    workspace_id = "123456"
+
+    tags = {
+        "foo.bar.baz": ["riri", "fifi"],
+        "dummy.path": ["loulou"],
+    }
+
+    payload = _table_payload(schema, table, host, workspace_id, tags)
+
+    expected = {
+        "description": None,
+        "id": "732pot5e-8ato-4c27-b701-9fa51febc192",
+        "owner_email": "pot@ato.com",
+        "schema_id": "id123",
+        "table_name": "baz",
+        "tags": ["riri", "fifi"],
+        "type": "MANAGED",
+        "url": "https://some.cloud.databricks.net/explore/data/foo/bar/baz?o=123456",
+    }
+    assert payload == expected
+
+
 def test__column_payload():
     table = {
-        "
-        "
-        "
-        "
-        "
-        "
+        "catalog_name": "foo",
+        "name": "baz",
+        "owner": "pot@ato.com",
+        "schema_name": "bar",
+        "table_id": "732pot5e-8ato-4c27-b701-9fa51febc192",
+        "table_type": "MANAGED",
     }
     column = {
+        "comment": "some description",
         "name": "Uid",
-        "
-        "type_name": "STRING",
+        "nullable": True,
         "position": 0,
+        "type_json": '{"name":"Uid","type":"string","nullable":true,"metadata":{}}',
+        "type_name": "STRING",
         "type_precision": 0,
         "type_scale": 0,
-        "
-        "nullable": True,
-        "comment": "some description",
+        "type_text": "string",
     }
-    payload = _column_payload(table, column)
+    tags = {
+        "foo.bar.baz.Uid": ["riri", "fifi"],
+        "dummy.path": ["loulou"],
+    }
+    payload = _column_payload(table, column, tags)
 
     expected = {
-        "id": "`18175cd5-9b9b-4d78-9d28-caaa12c21ce0`.`Uid`",
         "column_name": "Uid",
-        "table_id": "18175cd5-9b9b-4d78-9d28-caaa12c21ce0",
-        "description": "some description",
         "data_type": "STRING",
+        "description": "some description",
+        "id": "`732pot5e-8ato-4c27-b701-9fa51febc192`.`Uid`",
         "ordinal_position": 0,
+        "table_id": "732pot5e-8ato-4c27-b701-9fa51febc192",
+        "tags": ["riri", "fifi"],
     }
     assert payload == expected
 
     # case where there are spaces in the name
     column["name"] = "column name with spaces"
-    payload = _column_payload(table, column)
+    payload = _column_payload(table, column, tags)
     expected_id = (
-        "`
+        "`732pot5e-8ato-4c27-b701-9fa51febc192`.`column name with spaces`"
     )
     assert payload["id"] == expected_id
+
+
+def test__column_path():
+    table = {
+        "catalog_name": "Jo",
+        "schema_name": "William",
+        "name": "Jack",
+    }
+    column = {
+        "name": "Averell",
+    }
+
+    expected = "Jo.William.Jack.Averell"
+    assert _column_path(table=table, column=column) == expected
castor_extractor/warehouse/databricks/utils.py
ADDED

@@ -0,0 +1,27 @@
+from typing import Dict, List
+
+
+def build_path(
+    row: Dict,
+    keys: List[str],
+) -> str:
+    """
+    format an asset's path:
+    - picks the given keys from dict
+    - join keys with a dot "."
+    """
+    key_values = [row[key] for key in keys]
+    return ".".join(key_values)
+
+
+def tag_label(row: Dict) -> str:
+    """
+    format the tag's label:
+    - {key:value} when the value is not empty
+    - {key} otherwise
+    """
+    tag_name = row["tag_name"]
+    tag_value = row["tag_value"]
+    if not tag_value:
+        return tag_name
+    return f"{tag_name}:{tag_value}"
castor_extractor/warehouse/databricks/utils_test.py
ADDED

@@ -0,0 +1,25 @@
+from .utils import build_path, tag_label
+
+
+def test_build_path():
+    row = {
+        "bigflo": "oli",
+        "laurel": "hardy",
+        "dupond": "dupont",
+    }
+    keys = ["laurel", "dupond"]
+    assert build_path(row, keys) == "hardy.dupont"
+
+
+def test_tag_label():
+    row = {
+        "tag_name": "marketplace",
+        "tag_value": "",
+    }
+    assert tag_label(row) == "marketplace"
+
+    row = {
+        "tag_name": "fi",
+        "tag_value": "fou",
+    }
+    assert tag_label(row) == "fi:fou"
{castor_extractor-0.17.0.dist-info → castor_extractor-0.17.3.dist-info}/METADATA
CHANGED

@@ -1,6 +1,6 @@
 Metadata-Version: 2.1
 Name: castor-extractor
-Version: 0.17.0
+Version: 0.17.3
 Summary: Extract your metadata assets.
 Home-page: https://www.castordoc.com/
 License: EULA

@@ -17,6 +17,7 @@ Classifier: Programming Language :: Python :: 3.11
 Classifier: Programming Language :: Python :: 3.12
 Provides-Extra: all
 Provides-Extra: bigquery
+Provides-Extra: databricks
 Provides-Extra: dbt
 Provides-Extra: looker
 Provides-Extra: metabase

@@ -29,6 +30,7 @@ Provides-Extra: snowflake
 Provides-Extra: sqlserver
 Provides-Extra: tableau
 Requires-Dist: cryptography (>=41.0.5) ; extra == "snowflake"
+Requires-Dist: databricks-sql-connector (>=3.2.0,<4.0.0) ; extra == "databricks" or extra == "all"
 Requires-Dist: google-api-core (>=2.1.1,<3.0.0)
 Requires-Dist: google-auth (>=2,<3)
 Requires-Dist: google-cloud-core (>=2.1.0,<3.0.0)

@@ -39,6 +41,9 @@ Requires-Dist: looker-sdk (>=23.0.0) ; extra == "looker" or extra == "all"
 Requires-Dist: msal (>=1.20.0,<2.0.0) ; extra == "powerbi" or extra == "all"
 Requires-Dist: numpy (<1.25) ; python_version >= "3.8" and python_version < "3.9"
 Requires-Dist: numpy (>=1.26,<2) ; python_version >= "3.12" and python_version < "3.13"
+Requires-Dist: pandas (>=2,<2.2.0) ; python_version >= "3.9" and python_full_version <= "3.11.0"
+Requires-Dist: pandas (>=2.0,<2.1) ; python_version >= "3.8" and python_version < "3.9"
+Requires-Dist: pandas (>=2.1,<2.2.0) ; python_version >= "3.12" and python_version < "3.13"
 Requires-Dist: psycopg2-binary (>=2.0.0,<3.0.0) ; extra == "metabase" or extra == "postgres" or extra == "redshift" or extra == "all"
 Requires-Dist: pycryptodome (>=3.0.0,<4.0.0) ; extra == "metabase" or extra == "all"
 Requires-Dist: pydantic (>=2.6,<3.0)
{castor_extractor-0.17.0.dist-info → castor_extractor-0.17.3.dist-info}/RECORD
CHANGED

@@ -1,4 +1,4 @@
-CHANGELOG.md,sha256=
+CHANGELOG.md,sha256=dxvJYXKwACP7txJdP-1Ug0G6tj34Vsd8TkEn1uuhLgs,11152
 Dockerfile,sha256=HcX5z8OpeSvkScQsN-Y7CNMUig_UB6vTMDl7uqzuLGE,303
 LICENCE,sha256=sL-IGa4hweyya1HgzMskrRdybbIa2cktzxb5qmUgDg8,8254
 README.md,sha256=uF6PXm9ocPITlKVSh9afTakHmpLx3TvawLf-CbMP3wM,3578

@@ -41,13 +41,13 @@ castor_extractor/uploader/__init__.py,sha256=SSRtwjg-dNoxME-RJy9G1flASiUKAC5bH1h
 castor_extractor/uploader/constant.py,sha256=yTigLHDlYwoRr6CpFIl7ReElFsQd4H-qkluMZJPWSx0,865
 castor_extractor/uploader/env.py,sha256=5HSniVSOYVg4u38O4k8TB_qaJq9s8yJ1hjedkq_gdVg,878
 castor_extractor/uploader/env_test.py,sha256=ClCWWtwd2N-5ClIDUxVMeKkWfhhOTxpppsXUDmdjxSg,472
-castor_extractor/uploader/upload.py,sha256=
+castor_extractor/uploader/upload.py,sha256=W1TGqO8_PtFdR661qNlh6v-LOIRvoJoda65-5OujFXs,3239
 castor_extractor/uploader/upload_test.py,sha256=7fwstdQe7FjuwGilsCdFpEQr1qLoR2WTRUzyy93fISw,402
 castor_extractor/uploader/utils.py,sha256=Tx_i875L2vJ8btOLV3-L0UMEFiyhH8E5n0XXRyLjO0Y,793
 castor_extractor/utils/__init__.py,sha256=bmzAOc-PKsVreMJtF7DGpPQeHrVqxWel_BblRftt6Ag,1186
 castor_extractor/utils/client/__init__.py,sha256=CRE-xJKm6fVV9dB8ljzB5YoOxX4I1sCD1KSgqs3Y8_Y,161
 castor_extractor/utils/client/abstract.py,sha256=aA5Qcb9TwWDSMq8WpXbGkOB20hehwX2VTpqQAwV76wk,2048
-castor_extractor/utils/client/api.py,sha256=
+castor_extractor/utils/client/api.py,sha256=AGDj2JH__Q_x7RQdodoVazGvjGQJ9TzNqs-XEX6Hrms,1840
 castor_extractor/utils/client/api_test.py,sha256=NSMdXg1FLc37erqHp2FZsIsogWVv6lFSs7rDXHikr-E,542
 castor_extractor/utils/client/postgres.py,sha256=n6ulaT222WWPY0_6qAZ0MHF0m91HtI9mMqL71nyygo0,866
 castor_extractor/utils/client/query.py,sha256=O6D5EjD1KmBlwa786Uw4D4kzxx97_HH50xIIeSWt0B8,205

@@ -276,15 +276,17 @@ castor_extractor/warehouse/bigquery/queries/user.sql,sha256=l-fkNGWJVdZwVhbFZL23
 castor_extractor/warehouse/bigquery/queries/view_ddl.sql,sha256=obCm-IN9V8_YSZTwcgNSBDD0ZXPgRjlxJjrZDSEH2MU,326
 castor_extractor/warehouse/bigquery/query.py,sha256=hrFfjd5jW2oQnZ6ozlkn-gDe6sCIzu5zSX19T9W6fIk,4162
 castor_extractor/warehouse/bigquery/types.py,sha256=LZVWSmE57lOemNbB5hBRyYmDk9bFAU4nbRaJWALl6N8,140
-castor_extractor/warehouse/databricks/__init__.py,sha256=
-castor_extractor/warehouse/databricks/client.py,sha256=
+castor_extractor/warehouse/databricks/__init__.py,sha256=YG3YSIJgCFRjjI8eExy9T7qGnfnjWhMFh8c15KTs_BA,184
+castor_extractor/warehouse/databricks/client.py,sha256=pnYb6nl9U33nH6UukYP5piWGYF-m1SP2TYiWiUozM_4,20552
 castor_extractor/warehouse/databricks/client_test.py,sha256=KNp4Hi_CC6GwiW2QDJQQwqALfUebuT9D_qL6FuP_8tY,5246
-castor_extractor/warehouse/databricks/credentials.py,sha256=
-castor_extractor/warehouse/databricks/extract.py,sha256=
-castor_extractor/warehouse/databricks/format.py,sha256=
-castor_extractor/warehouse/databricks/format_test.py,sha256=
+castor_extractor/warehouse/databricks/credentials.py,sha256=iphbVynVTQXMEbJy4QaT5fer-GpOi7QtbAlg8R7-Lj4,598
+castor_extractor/warehouse/databricks/extract.py,sha256=VYygE06f7ngYWVlRa48O6drLIZF-_4IBJdyXTYfxZQU,7395
+castor_extractor/warehouse/databricks/format.py,sha256=p252NFzQN1uZdsu5wpP-bMHK0rBBVzallX3-o92Mvh4,6744
+castor_extractor/warehouse/databricks/format_test.py,sha256=ls0IcOElqp_qecAzNbK0zdca7Pms4seCHimbw8NAoAI,3322
 castor_extractor/warehouse/databricks/test_constants.py,sha256=Hm96yq_ltVAKv7WYhYz637r4Cuj-1cCdyOuxMEe3J-Q,2246
 castor_extractor/warehouse/databricks/types.py,sha256=hD6gC8oiT3QSWEvbtgUOGK_lLzzz36sEauB3lS_wxlE,218
+castor_extractor/warehouse/databricks/utils.py,sha256=RWRViqLaj2K0in5T5F6OLp7HCm554BCh3zi4CJqOEt8,576
+castor_extractor/warehouse/databricks/utils_test.py,sha256=5Qrd_tLNLWrDHX2uQyVUf0vqXJzD44uQGGxDBOkwvUU,503
 castor_extractor/warehouse/mysql/__init__.py,sha256=2KFDogo9GNbApHqw3Vm5t_uNmIRjdp76nmP_WQQMfQY,116
 castor_extractor/warehouse/mysql/client.py,sha256=IwoJvbmE5VZkMCP9yHf6ta3_AQPEuBPrZZ3meefbcJs,974
 castor_extractor/warehouse/mysql/client_test.py,sha256=wRTv-3c5chy_HKj-buasNiYOOCIfynYqbabM4Hxdh5E,1052

@@ -370,8 +372,8 @@ castor_extractor/warehouse/synapse/queries/schema.sql,sha256=aX9xNrBD_ydwl-znGSF
 castor_extractor/warehouse/synapse/queries/table.sql,sha256=mCE8bR1Vb7j7SwZW2gafcXidQ2fo1HwxcybA8wP2Kfs,1049
 castor_extractor/warehouse/synapse/queries/user.sql,sha256=sTb_SS7Zj3AXW1SggKPLNMCd0qoTpL7XI_BJRMaEpBg,67
 castor_extractor/warehouse/synapse/queries/view_ddl.sql,sha256=3EVbp5_yTgdByHFIPLHmnoOnqqLE77SrjAwFDvu4e54,249
-castor_extractor-0.17.
-castor_extractor-0.17.
-castor_extractor-0.17.
-castor_extractor-0.17.
-castor_extractor-0.17.
+castor_extractor-0.17.3.dist-info/LICENCE,sha256=sL-IGa4hweyya1HgzMskrRdybbIa2cktzxb5qmUgDg8,8254
+castor_extractor-0.17.3.dist-info/METADATA,sha256=v_xgS6DS7FC1kVzma9Z69XiMOjDn6BHckEJJ-rJ5TZI,6985
+castor_extractor-0.17.3.dist-info/WHEEL,sha256=sP946D7jFCHeNz5Iq4fL4Lu-PrWrFsgfLXbbkciIZwg,88
+castor_extractor-0.17.3.dist-info/entry_points.txt,sha256=SbyPk58Gh-FRztfCNnUZQ6w7SatzNJFZ6GIJLNsy7tI,1427
+castor_extractor-0.17.3.dist-info/RECORD,,

{castor_extractor-0.17.0.dist-info → castor_extractor-0.17.3.dist-info}/LICENCE
File without changes

{castor_extractor-0.17.0.dist-info → castor_extractor-0.17.3.dist-info}/WHEEL
File without changes

{castor_extractor-0.17.0.dist-info → castor_extractor-0.17.3.dist-info}/entry_points.txt
File without changes