PyPI - castor-extractor - Versions diffs - 0.21.9__py3-none-any.whl → 0.22.0__py3-none-any.whl - Mend

castor-extractor 0.21.9__py3-none-any.whl → 0.22.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of castor-extractor might be problematic. Click here for more details.

Files changed (128) hide show

castor_extractor/visualization/tableau/client/client_utils.py CHANGED Viewed

@@ -1,4 +1,5 @@
-from typing import Dict, Iterator, Optional
+from collections.abc import Iterator
+from typing import Optional
 from ....utils import SerializedAsset
 from ..assets import TableauAsset
@@ -69,6 +70,6 @@ def query_scroll(
             break
-def extract_asset(asset: Dict, asset_type: TableauAsset) -> Dict:
+def extract_asset(asset: dict, asset_type: TableauAsset) -> dict:
     """Agnostic function extracting dedicated attributes with define asset"""
     return {key: getattr(asset, key) for key in TSC_FIELDS[asset_type]}

castor_extractor/visualization/tableau/client/credentials.py CHANGED Viewed

@@ -1,5 +1,5 @@
 from enum import Enum
-from typing import Dict, Optional
+from typing import Optional
 from ....utils import from_env
@@ -20,7 +20,7 @@ class CredentialsKey(Enum):
     TABLEAU_SERVER_URL = "server_url"
-CREDENTIALS_ENV: Dict[CredentialsKey, str] = {
+CREDENTIALS_ENV: dict[CredentialsKey, str] = {
     CredentialsKey.TABLEAU_USER: "CASTOR_TABLEAU_USER",
     CredentialsKey.TABLEAU_PASSWORD: "CASTOR_TABLEAU_PASSWORD",
     CredentialsKey.TABLEAU_TOKEN_NAME: "CASTOR_TABLEAU_TOKEN_NAME",
@@ -89,7 +89,7 @@ class CredentialsApi:
             CredentialsKey.TABLEAU_TOKEN: token,
         }
-    def to_dict(self, hide: bool = False) -> Dict[str, str]:
+    def to_dict(self, hide: bool = False) -> dict[str, str]:
         safe = (
             CredentialsKey.TABLEAU_USER,
             CredentialsKey.TABLEAU_SITE_ID,

castor_extractor/visualization/tableau/client/safe_mode.py CHANGED Viewed

@@ -1,5 +1,4 @@
 import logging
-from typing import Dict, List
 import tableauserverclient as TSC  # type: ignore
@@ -48,7 +47,7 @@ def safe_mode_fetch_usage(client) -> SerializedAsset:
     Returns computed usages when page number is not found
     Log errors if ServerResponseError is return
     """
-    list_usages: List[Dict] = []
+    list_usages: list[dict] = []
     page_number: int = 0
     while True:

castor_extractor/visualization/tableau/extract.py CHANGED Viewed

@@ -1,5 +1,5 @@
 import logging
-from typing import Iterable, Tuple
+from collections.abc import Iterable
 from ...utils import (
     OUTPUT_DIR,
@@ -19,7 +19,7 @@ logger = logging.getLogger(__name__)
 def iterate_all_data(
     client: Client,
-) -> Iterable[Tuple[TableauAsset, list]]:
+) -> Iterable[tuple[TableauAsset, list]]:
     """Iterate over the extracted Data from Tableau"""
     logger.info("Extracting USER from Tableau API")

castor_extractor/visualization/tableau/gql_fields.py CHANGED Viewed

@@ -1,6 +1,6 @@
 # Fields which will be use for Tableau GraphQL API
 from enum import Enum
-from typing import Dict, List, Union
+from typing import Union
 from .assets import TableauAsset, TableauGraphqlAsset
@@ -189,9 +189,9 @@ class GQLQueryFields(Enum):
     """
-QueryInfo = List[Dict[str, Union[GQLQueryFields, TableauGraphqlAsset]]]
+QueryInfo = list[dict[str, Union[GQLQueryFields, TableauGraphqlAsset]]]
-QUERY_FIELDS: Dict[TableauAsset, QueryInfo] = {
+QUERY_FIELDS: dict[TableauAsset, QueryInfo] = {
     TableauAsset.CUSTOM_SQL_TABLE: [
         {
             FIELDS: GQLQueryFields.CUSTOM_SQL_TABLE,

castor_extractor/visualization/tableau/tsc_fields.py CHANGED Viewed

@@ -1,10 +1,9 @@
 # TSC for TableauServerClient: basic REST API to extracting core objects
-from typing import Dict, Set
 from .assets import TableauAsset
 # TSC fields extracted per assets
-TSC_FIELDS: Dict[TableauAsset, Set[str]] = {
+TSC_FIELDS: dict[TableauAsset, set[str]] = {
     TableauAsset.PROJECT: {
         "id",
         "name",

castor_extractor/visualization/tableau/types.py CHANGED Viewed

@@ -1,4 +1,4 @@
-from typing import Dict, List, Tuple, Union
+from typing import Union
 from tableauserverclient import ServerResponseError  # type: ignore
 from typing_extensions import Literal
@@ -6,6 +6,6 @@ from typing_extensions import Literal
 from .errors import TableauErrorCode
 PageReturn = Union[
-    Tuple[List[Dict], Literal[None]],
-    Tuple[Literal[None], Union[TableauErrorCode, ServerResponseError]],
+    tuple[list[dict], Literal[None]],
+    tuple[Literal[None], Union[TableauErrorCode, ServerResponseError]],
 ]

castor_extractor/visualization/tableau_revamp/client/client_metadata_api.py CHANGED Viewed

@@ -1,4 +1,5 @@
-from typing import Dict, Iterator, Optional
+from collections.abc import Iterator
+from typing import Optional
 import tableauserverclient as TSC  # type: ignore
@@ -10,7 +11,7 @@ from .gql_queries import FIELDS_QUERIES, GQL_QUERIES, QUERY_TEMPLATE
 # increase the value when extraction is too slow
 # decrease the value when timeouts arise
-_CUSTOM_PAGE_SIZE: Dict[TableauRevampAsset, int] = {
+_CUSTOM_PAGE_SIZE: dict[TableauRevampAsset, int] = {
     # for some clients, extraction of columns tend to hit the node limit
     # https://community.tableau.com/s/question/0D54T00000YuK60SAF/metadata-query-nodelimitexceeded-error
     # the workaround is to reduce pagination

castor_extractor/visualization/tableau_revamp/client/client_rest_api.py CHANGED Viewed

@@ -1,5 +1,5 @@
 import logging
-from typing import Dict, Optional
+from typing import Optional
 import requests
 import tableauserverclient as TSC  # type: ignore
@@ -40,7 +40,7 @@ class TableauClientRestApi:
         return self._server.http_options["timeout"]
     @property
-    def headers(self) -> Dict[str, str]:
+    def headers(self) -> dict[str, str]:
         return {"x-tableau-auth": self._server.auth_token}
     def _get_site_name(self) -> str:
@@ -52,7 +52,7 @@ class TableauClientRestApi:
         self,
         url: str,
         page_token: Optional[str] = None,
-    ) -> Dict:
+    ) -> dict:
         if page_token:
             url += f"?page_token={page_token}"

castor_extractor/visualization/tableau_revamp/client/client_tsc.py CHANGED Viewed

@@ -1,4 +1,5 @@
-from typing import Any, Dict, Iterable, Iterator
+from collections.abc import Iterable, Iterator
+from typing import Any
 import tableauserverclient as TSC  # type: ignore
@@ -30,7 +31,7 @@ class TableauClientTSC:
         self,
         data: Iterable,
         asset: TableauRevampAsset,
-    ) -> Iterator[Dict]:
+    ) -> Iterator[dict]:
         keys = REST_FIELDS[asset]
         for row in data:

castor_extractor/visualization/tableau_revamp/client/gql_queries.py CHANGED Viewed

@@ -1,5 +1,3 @@
-from typing import Dict, Tuple
 from ..assets import TableauRevampAsset
 QUERY_TEMPLATE = """
@@ -130,7 +128,7 @@ workbook { id }
 """
-GQL_QUERIES: Dict[TableauRevampAsset, Tuple[str, str]] = {
+GQL_QUERIES: dict[TableauRevampAsset, tuple[str, str]] = {
     TableauRevampAsset.COLUMN: ("columns", _COLUMNS_QUERY),
     TableauRevampAsset.DASHBOARD: ("dashboards", _DASHBOARDS_QUERY),
     TableauRevampAsset.DATASOURCE: ("datasources", _DATASOURCES_QUERY),

castor_extractor/visualization/tableau_revamp/client/rest_fields.py CHANGED Viewed

@@ -1,9 +1,7 @@
-from typing import Dict, Set
 from ..assets import TableauRevampAsset
 # list of fields to pick in REST API or TSC responses
-REST_FIELDS: Dict[TableauRevampAsset, Set[str]] = {
+REST_FIELDS: dict[TableauRevampAsset, set[str]] = {
     TableauRevampAsset.DATASOURCE: {
         "id",
         "project_id",

castor_extractor/visualization/tableau_revamp/extract.py CHANGED Viewed

@@ -1,5 +1,5 @@
 import logging
-from typing import Iterable, Tuple
+from collections.abc import Iterable
 from ...utils import (
     OUTPUT_DIR,
@@ -18,7 +18,7 @@ logger = logging.getLogger(__name__)
 def iterate_all_data(
     client: TableauRevampClient,
-) -> Iterable[Tuple[TableauRevampAsset, list]]:
+) -> Iterable[tuple[TableauRevampAsset, list]]:
     """Iterate over the extracted Data from Tableau"""
     for asset in TableauRevampAsset:

castor_extractor/visualization/thoughtspot/client/client.py CHANGED Viewed

@@ -1,4 +1,5 @@
-from typing import Dict, Iterator, Optional
+from collections.abc import Iterator
+from typing import Optional
 import requests
@@ -35,7 +36,7 @@ THOUGHTSPOT_SAFE_MODE = RequestSafeMode()
 class ThoughtspotBearerAuth(BearerAuth):
-    def __init__(self, host: str, token_payload: Dict[str, str]):
+    def __init__(self, host: str, token_payload: dict[str, str]):
         auth_endpoint = ThoughtspotEndpointFactory.authentication()
         self.authentication_url = build_url(host, auth_endpoint)
         self.token_payload = token_payload

castor_extractor/visualization/thoughtspot/client/utils.py CHANGED Viewed

@@ -1,6 +1,6 @@
 import csv
+from collections.abc import Iterator
 from io import StringIO
-from typing import Iterator
 def usage_liveboard_reader(usage_liveboard_csv: str) -> Iterator[dict]:

castor_extractor/visualization/thoughtspot/extract.py CHANGED Viewed

@@ -1,5 +1,6 @@
 import logging
-from typing import Iterable, Iterator, Tuple, Union
+from collections.abc import Iterable, Iterator
+from typing import Union
 from ...utils import (
     OUTPUT_DIR,
@@ -21,7 +22,7 @@ logger = logging.getLogger(__name__)
 def iterate_all_data(
     client: ThoughtspotClient,
-) -> Iterable[Tuple[ThoughtspotAsset, Union[list, Iterator, dict]]]:
+) -> Iterable[tuple[ThoughtspotAsset, Union[list, Iterator, dict]]]:
     """Iterate over the extracted data from Thoughtspot"""
     for asset in ThoughtspotAsset:

castor_extractor/warehouse/abstract/asset.py CHANGED Viewed

@@ -1,5 +1,4 @@
 from enum import Enum
-from typing import Dict, List, Set, Tuple
 from ...types import ExternalAsset, classproperty
@@ -26,7 +25,7 @@ class WarehouseAsset(ExternalAsset):
     VIEW_DDL = "view_ddl"
     @classproperty
-    def optional(cls) -> Set["WarehouseAsset"]:
+    def optional(cls) -> set["WarehouseAsset"]:
         return {
             WarehouseAsset.ADDITIONAL_COLUMN_LINEAGE,
             WarehouseAsset.ADDITIONAL_TABLE_LINEAGE,
@@ -50,7 +49,7 @@ class WarehouseAssetGroup(Enum):
 # tuple of supported assets for each group (depends on the technology)
-SupportedAssets = Dict[WarehouseAssetGroup, Tuple[WarehouseAsset, ...]]
+SupportedAssets = dict[WarehouseAssetGroup, tuple[WarehouseAsset, ...]]
 # shared by all technologies
 CATALOG_ASSETS = (
@@ -80,13 +79,13 @@ NON_EXTRACTABLE_ASSETS = {WarehouseAssetGroup.EXTERNAL_LINEAGE}
 def extractable_asset_groups(
     supported_assets: SupportedAssets,
-) -> List[Tuple[WarehouseAsset, ...]]:
+) -> list[tuple[WarehouseAsset, ...]]:
     """
     helper function to differentiate
     extractable assets vs supported (ingest-able) assets
     """
     groups = set(supported_assets).difference(NON_EXTRACTABLE_ASSETS)
-    extractable: Set[Tuple[WarehouseAsset, ...]] = {
+    extractable: set[tuple[WarehouseAsset, ...]] = {
         supported_assets[group] for group in groups
     }
     return list(extractable)

castor_extractor/warehouse/abstract/extract.py CHANGED Viewed

@@ -1,6 +1,7 @@
 import logging
+from collections.abc import Iterator
 from itertools import chain
-from typing import Callable, Iterator, List, Optional, Tuple
+from typing import Callable, Optional
 from ...utils import (
     OUTPUT_DIR,
@@ -16,7 +17,7 @@ from .query import AbstractQueryBuilder, ExtractionQuery
 logger = logging.getLogger(__name__)
-def common_args(kwargs: dict) -> Tuple[str, bool]:
+def common_args(kwargs: dict) -> tuple[str, bool]:
     """Args used by all technologies"""
     output_directory = kwargs.get("output_directory") or from_env(OUTPUT_DIR)
     skip_existing = kwargs.get("skip_existing") or False
@@ -39,7 +40,7 @@ class SQLExtractionProcessor:
         self._safe_mode = safe_mode
     @staticmethod
-    def _unique(data: Iterator[dict]) -> List[dict]:
+    def _unique(data: Iterator[dict]) -> list[dict]:
         """
         Remove duplicate in the given data.
         Remark: this method implies loading all data in memory: it breaks the streaming pipeline !

castor_extractor/warehouse/abstract/query.py CHANGED Viewed

@@ -1,7 +1,7 @@
 import inspect
 import os
 from abc import ABC, abstractmethod
-from typing import List, Optional, Tuple
+from typing import Optional
 from .asset import WarehouseAsset
 from .time_filter import TimeFilter
@@ -37,7 +37,7 @@ class AbstractQueryBuilder(ABC):
     def __init__(
         self,
         time_filter: Optional[TimeFilter],
-        duplicated: Optional[Tuple[WarehouseAsset, ...]] = None,
+        duplicated: Optional[tuple[WarehouseAsset, ...]] = None,
     ):
         self._time_filter = time_filter or TimeFilter.default()
         self._duplicated = duplicated
@@ -55,7 +55,7 @@ class AbstractQueryBuilder(ABC):
         """read from a file located in queries directory"""
         root = os.path.dirname(inspect.getfile(self.__class__))
         path = os.path.join(root, QUERIES_DIR, filename)
-        with open(path, "r") as f:
+        with open(path) as f:
             return f.read()
     def load_statement(self, asset: WarehouseAsset) -> str:
@@ -75,7 +75,7 @@ class AbstractQueryBuilder(ABC):
         return ExtractionQuery(statement, params)
     @abstractmethod
-    def build(self, asset: WarehouseAsset) -> List[ExtractionQuery]:
+    def build(self, asset: WarehouseAsset) -> list[ExtractionQuery]:
         """
         Build the Query allowing extraction of the given asset
         - Most of the time, returns a single query

castor_extractor/warehouse/bigquery/client.py CHANGED Viewed

@@ -1,6 +1,6 @@
 import itertools
 import logging
-from typing import List, Optional, Set
+from typing import Optional
 from google.api_core.exceptions import Forbidden  # type: ignore
 from google.cloud.bigquery import Client as GoogleCloudClient  # type: ignore
@@ -27,9 +27,9 @@ class BigQueryClient(SqlalchemyClient):
     def __init__(
         self,
         credentials: dict,
-        db_allowed: Optional[Set[str]] = None,
-        db_blocked: Optional[Set[str]] = None,
-        dataset_blocked: Optional[Set[str]] = None,
+        db_allowed: Optional[set[str]] = None,
+        db_blocked: Optional[set[str]] = None,
+        dataset_blocked: Optional[set[str]] = None,
     ):
         super().__init__(credentials)
         self._db_allowed = db_allowed
@@ -37,8 +37,8 @@ class BigQueryClient(SqlalchemyClient):
         self._dataset_blocked = dataset_blocked
         self.credentials = self._credentials()
         self.client = self._client()
-        self._projects: List[str] | None = None
-        self._datasets: List[Dataset] | None = None
+        self._projects: list[str] | None = None
+        self._datasets: list[Dataset] | None = None
     @staticmethod
     def name() -> str:
@@ -78,7 +78,7 @@ class BigQueryClient(SqlalchemyClient):
             credentials=self.credentials,
         )
-    def _list_datasets(self) -> List[Dataset]:
+    def _list_datasets(self) -> list[Dataset]:
         """
         Returns datasets available for the given GCP client
         Cache the result in self._datasets to reduce number of API calls
@@ -98,7 +98,7 @@ class BigQueryClient(SqlalchemyClient):
         base_ms=_RETRY_BASE_MS,
         log_exc_info=True,
     )
-    def get_projects(self) -> List[str]:
+    def get_projects(self) -> list[str]:
         """
         Returns distinct project_id available for the given GCP client
         Cache the result in self._projects to reduce number of API calls.

castor_extractor/warehouse/bigquery/extract.py CHANGED Viewed

@@ -38,7 +38,7 @@ def _credentials(params: dict) -> dict:
     """extract GCP credentials"""
     path = params.get("credentials") or from_env(BIGQUERY_CREDENTIALS)
     logger.info(f"Credentials fetched from {path}")
-    with open(path, "r") as file:
+    with open(path) as file:
         return cast(dict, json.load(file))

castor_extractor/warehouse/bigquery/query.py CHANGED Viewed

@@ -1,5 +1,5 @@
 import logging
-from typing import List, Optional
+from typing import Optional
 from ..abstract import (
     AbstractQueryBuilder,
@@ -109,7 +109,7 @@ class BigQueryQueryBuilder(AbstractQueryBuilder):
             else self._regions
         )
-    def build(self, asset: WarehouseAsset) -> List[ExtractionQuery]:
+    def build(self, asset: WarehouseAsset) -> list[ExtractionQuery]:
         """
         It would be easier to stitch data directly in the query statement (UNION ALL).
         Unfortunately, querying INFORMATION_SCHEMA on multiple regions

castor_extractor/warehouse/bigquery/types.py CHANGED Viewed

@@ -1,4 +1,2 @@
-from typing import Set, Tuple
-SetString = Set[str]
-SetTwoString = Set[Tuple[str, str]]
+SetString = set[str]
+SetTwoString = set[tuple[str, str]]

castor_extractor/warehouse/databricks/api_client.py CHANGED Viewed

@@ -1,7 +1,8 @@
 import logging
+from collections.abc import Iterator
 from functools import partial
 from http import HTTPStatus
-from typing import Iterator, List, Optional, Set, Tuple
+from typing import Optional
 import requests
@@ -55,8 +56,8 @@ class DatabricksAPIClient(APIClient):
     def __init__(
         self,
         credentials: DatabricksCredentials,
-        db_allowed: Optional[Set[str]] = None,
-        db_blocked: Optional[Set[str]] = None,
+        db_allowed: Optional[set[str]] = None,
+        db_blocked: Optional[set[str]] = None,
     ):
         auth = DatabricksAuth(credentials)
         super().__init__(
@@ -81,18 +82,18 @@ class DatabricksAPIClient(APIClient):
             return False
         return True
-    def databases(self) -> List[dict]:
+    def databases(self) -> list[dict]:
         content = self._get(DatabricksEndpointFactory.databases())
         _databases = self.formatter.format_database(content.get("catalogs", []))
         return [d for d in _databases if self._keep_catalog(d["database_name"])]
-    def _schemas_of_database(self, database: dict) -> List[dict]:
+    def _schemas_of_database(self, database: dict) -> list[dict]:
         payload = {"catalog_name": database["database_name"]}
         content = self._get(DatabricksEndpointFactory.schemas(), params=payload)
         schemas = content.get("schemas", [])
         return self.formatter.format_schema(schemas, database)
-    def schemas(self, databases: List[dict]) -> List[dict]:
+    def schemas(self, databases: list[dict]) -> list[dict]:
         """
         Get the databricks schemas (also sometimes called databases)
         (which correspond to the schemas in Castor)
@@ -143,8 +144,8 @@ class DatabricksAPIClient(APIClient):
     )
     def get_single_column_lineage(
         self,
-        names: Tuple[str, str],
-    ) -> List[TimestampedLink]:
+        names: tuple[str, str],
+    ) -> list[TimestampedLink]:
         """
         Helper function used in get_lineage_links.
         Call data lineage API and return the content of the result
@@ -172,7 +173,7 @@ class DatabricksAPIClient(APIClient):
     )
     def get_single_table_lineage(
         self, table_path: str
-    ) -> List[TimestampedLink]:
+    ) -> list[TimestampedLink]:
         """
         Helper function used in get_lineage_links.
         Call data lineage API and return the content of the result
@@ -210,7 +211,7 @@ class DatabricksAPIClient(APIClient):
         queries = fetch_all_pages(request, DatabricksPagination)
         return queries
-    def queries(self, time_filter: Optional[TimeFilter] = None) -> List[dict]:
+    def queries(self, time_filter: Optional[TimeFilter] = None) -> list[dict]:
         """get all queries, hour per hour"""
         time_range_filters = hourly_time_filters(time_filter)
         raw_queries = []
@@ -220,14 +221,14 @@ class DatabricksAPIClient(APIClient):
             raw_queries.extend(hourly)
         return self.formatter.format_query(raw_queries)
-    def users(self) -> List[dict]:
+    def users(self) -> list[dict]:
         """
         retrieve user from api
         """
         content = self._get(DatabricksEndpointFactory.users())
         return self.formatter.format_user(content.get("Resources", []))
-    def _view_ddl_per_schema(self, schema: dict) -> List[dict]:
+    def _view_ddl_per_schema(self, schema: dict) -> list[dict]:
         payload = {
             "catalog_name": schema["database_id"],
             "schema_name": schema["schema_name"],
@@ -236,9 +237,9 @@ class DatabricksAPIClient(APIClient):
         content = self._get(DatabricksEndpointFactory.tables(), params=payload)
         return self.formatter.format_view_ddl(content.get("tables", []), schema)
-    def view_ddl(self, schemas: List[dict]) -> List[dict]:
+    def view_ddl(self, schemas: list[dict]) -> list[dict]:
         """retrieve view ddl"""
-        view_ddl: List[dict] = []
+        view_ddl: list[dict] = []
         for schema in schemas:
             v_to_add = self._view_ddl_per_schema(schema)
             view_ddl.extend(v_to_add)

castor_extractor/warehouse/databricks/client.py CHANGED Viewed

@@ -1,6 +1,6 @@
 import logging
 from concurrent.futures import ThreadPoolExecutor
-from typing import List, Optional, Set
+from typing import Optional
 from ...utils import (
     mapping_from_rows,
@@ -25,8 +25,8 @@ class DatabricksClient:
     def __init__(
         self,
         credentials: DatabricksCredentials,
-        db_allowed: Optional[Set[str]] = None,
-        db_blocked: Optional[Set[str]] = None,
+        db_allowed: Optional[set[str]] = None,
+        db_blocked: Optional[set[str]] = None,
         has_table_tags: bool = False,
         has_column_tags: bool = False,
     ):
@@ -58,26 +58,26 @@ class DatabricksClient:
         return {**table, "owner_external_id": owner_external_id}
     @staticmethod
-    def _get_user_mapping(users: List[dict]) -> dict:
+    def _get_user_mapping(users: list[dict]) -> dict:
         return {
             **mapping_from_rows(users, "email", "id"),
             **mapping_from_rows(users, "user_name", "id"),
         }
-    def schemas(self, databases: List[dict]) -> List[dict]:
+    def schemas(self, databases: list[dict]) -> list[dict]:
         return self.api_client.schemas(databases)
-    def databases(self) -> List[dict]:
+    def databases(self) -> list[dict]:
         return self.api_client.databases()
     def tables_and_columns(
-        self, schemas: List[dict], users: List[dict]
+        self, schemas: list[dict], users: list[dict]
     ) -> TablesColumns:
         """
         Get the databricks tables & columns leveraging the unity catalog API
         """
-        tables: List[dict] = []
-        columns: List[dict] = []
+        tables: list[dict] = []
+        columns: list[dict] = []
         user_mapping = self._get_user_mapping(users)
         table_tags = self.sql_client.get_tags_mapping(TagEntity.TABLE)
         column_tags = self.sql_client.get_tags_mapping(TagEntity.COLUMN)
@@ -95,7 +95,7 @@ class DatabricksClient:
             columns.extend(c_to_add)
         return tables, columns
-    def table_lineage(self, tables: List[dict]) -> List[dict]:
+    def table_lineage(self, tables: list[dict]) -> list[dict]:
         """
         Wrapper function that retrieves all table lineage
         """
@@ -113,8 +113,8 @@ class DatabricksClient:
         return self.formatter.format_lineage(deduplicated)
     def column_lineage(
-        self, tables: List[dict], columns: List[dict], table_lineage: List[dict]
-    ) -> List[dict]:
+        self, tables: list[dict], columns: list[dict], table_lineage: list[dict]
+    ) -> list[dict]:
         """
         Wrapper function that retrieves all column lineage
         we only try to retrieve column lineage if we found table lineage
@@ -129,17 +129,17 @@ class DatabricksClient:
             results = executor.map(
                 self.api_client.get_single_column_lineage, candidate_paths
             )
-        lineages: List[TimestampedLink] = [
+        lineages: list[TimestampedLink] = [
             link for links in results for link in links
         ]
         deduplicated = deduplicate_lineage(lineages)
         return self.formatter.format_lineage(deduplicated)
-    def queries(self, time_filter: Optional[TimeFilter] = None) -> List[dict]:
+    def queries(self, time_filter: Optional[TimeFilter] = None) -> list[dict]:
         return self.api_client.queries(time_filter)
-    def users(self) -> List[dict]:
+    def users(self) -> list[dict]:
         return self.api_client.users()
-    def view_ddl(self, schemas: List[dict]) -> List[dict]:
+    def view_ddl(self, schemas: list[dict]) -> list[dict]:
         return self.api_client.view_ddl(schemas)

castor-extractor 0.21.9__py3-none-any.whl → 0.22.0__py3-none-any.whl

Potentially problematic release.

castor-extractor 0.21.9__py3-none-any.whl → 0.22.0__py3-none-any.whl