ygg 0.1.56__py3-none-any.whl → 0.1.60__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {ygg-0.1.56.dist-info → ygg-0.1.60.dist-info}/METADATA +1 -1
- ygg-0.1.60.dist-info/RECORD +74 -0
- {ygg-0.1.56.dist-info → ygg-0.1.60.dist-info}/WHEEL +1 -1
- yggdrasil/ai/__init__.py +2 -0
- yggdrasil/ai/session.py +89 -0
- yggdrasil/ai/sql_session.py +310 -0
- yggdrasil/databricks/__init__.py +0 -3
- yggdrasil/databricks/compute/cluster.py +68 -113
- yggdrasil/databricks/compute/command_execution.py +674 -0
- yggdrasil/databricks/compute/exceptions.py +7 -2
- yggdrasil/databricks/compute/execution_context.py +465 -277
- yggdrasil/databricks/compute/remote.py +4 -14
- yggdrasil/databricks/exceptions.py +10 -0
- yggdrasil/databricks/sql/__init__.py +0 -4
- yggdrasil/databricks/sql/engine.py +161 -173
- yggdrasil/databricks/sql/exceptions.py +9 -1
- yggdrasil/databricks/sql/statement_result.py +108 -120
- yggdrasil/databricks/sql/warehouse.py +331 -92
- yggdrasil/databricks/workspaces/io.py +92 -9
- yggdrasil/databricks/workspaces/path.py +120 -74
- yggdrasil/databricks/workspaces/workspace.py +212 -68
- yggdrasil/libs/databrickslib.py +23 -18
- yggdrasil/libs/extensions/spark_extensions.py +1 -1
- yggdrasil/libs/pandaslib.py +15 -6
- yggdrasil/libs/polarslib.py +49 -13
- yggdrasil/pyutils/__init__.py +1 -0
- yggdrasil/pyutils/callable_serde.py +12 -19
- yggdrasil/pyutils/exceptions.py +16 -0
- yggdrasil/pyutils/mimetypes.py +0 -0
- yggdrasil/pyutils/python_env.py +13 -12
- yggdrasil/pyutils/waiting_config.py +171 -0
- yggdrasil/types/cast/arrow_cast.py +3 -0
- yggdrasil/types/cast/pandas_cast.py +157 -169
- yggdrasil/types/cast/polars_cast.py +11 -43
- yggdrasil/types/dummy_class.py +81 -0
- yggdrasil/version.py +1 -1
- ygg-0.1.56.dist-info/RECORD +0 -68
- yggdrasil/databricks/ai/__init__.py +0 -1
- yggdrasil/databricks/ai/loki.py +0 -374
- {ygg-0.1.56.dist-info → ygg-0.1.60.dist-info}/entry_points.txt +0 -0
- {ygg-0.1.56.dist-info → ygg-0.1.60.dist-info}/licenses/LICENSE +0 -0
- {ygg-0.1.56.dist-info → ygg-0.1.60.dist-info}/top_level.txt +0 -0
@@ -36,11 +36,8 @@ def databricks_remote_compute(
     cluster_name: Optional[str] = None,
     workspace: Optional[Union[Workspace, str]] = None,
     cluster: Optional["Cluster"] = None,
-    timeout: Optional[dt.timedelta] = None,
     env_keys: Optional[List[str]] = None,
     force_local: bool = False,
-    update_timeout: Optional[Union[float, dt.timedelta]] = None,
-    **options
 ) -> Callable[[Callable[..., ReturnType]], Callable[..., ReturnType]]:
     """Return a decorator that executes functions on a remote cluster.
 
@@ -50,11 +47,8 @@ def databricks_remote_compute(
         cluster_name: Optional cluster name to target.
         workspace: Workspace instance or host string for lookup.
         cluster: Pre-configured Cluster instance to reuse.
-        timeout: Optional execution timeout for remote calls.
         env_keys: Optional environment variable names to forward.
         force_local: Force local execution
-        update_timeout: creation or update wait timeout
-        **options: Extra options forwarded to the execution decorator.
 
     Returns:
         A decorator that runs functions on the resolved Databricks cluster.
@@ -85,14 +79,10 @@ def databricks_remote_compute(
         workspace=workspace,
         cluster_name=cluster_name,
         single_user_name=workspace.current_user.user_name,
-
+        wait_update=False
     )
 
-    cluster.
-
-
-        _func=_func,
-        env_keys=env_keys,
-        timeout=timeout,
-        **options
+    return cluster.system_context.decorate(
+        func=_func,
+        environ=env_keys,
     )
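The three hunks above (matching the `+4 -14` change to `yggdrasil/databricks/compute/remote.py`) drop the `timeout`, `update_timeout` and `**options` arguments and route execution through `cluster.system_context.decorate(func=..., environ=...)`. A hypothetical usage sketch of the slimmed-down decorator; the import path and argument values are assumptions, not taken from package documentation:

```python
# Sketch only: module path and values below are assumed for illustration.
from yggdrasil.databricks.compute.remote import databricks_remote_compute

@databricks_remote_compute(
    cluster_name="shared-dev-cluster",                        # assumed cluster name
    workspace="https://adb-1234567890.azuredatabricks.net",   # assumed workspace host
    env_keys=["FEATURE_FLAGS"],                               # environment variables to forward
    force_local=False,
)
def heavy_transform(n: int) -> int:
    # Body executes on the resolved Databricks cluster via its system execution context.
    return sum(range(n))
```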
@@ -16,16 +16,20 @@ import logging
 import random
 import string
 import time
+from threading import Thread
 from typing import Optional, Union, Any, Dict, List, Literal
 
 import pyarrow as pa
+import pyarrow.dataset as pds
 
 from .statement_result import StatementResult
 from .types import column_info_to_arrow_field
-from
-from ..workspaces import WorkspaceService
-from ...
+from .warehouse import SQLWarehouse
+from ..workspaces import WorkspaceService, DatabricksPath
+from ...ai.sql_session import SQLAISession, SQLFlavor
+from ...libs.databrickslib import databricks_sdk, DatabricksDummyClass
 from ...libs.sparklib import SparkSession, SparkDataFrame, pyspark
+from ...pyutils.waiting_config import WaitingConfigArg
 from ...types import is_arrow_type_string_like, is_arrow_type_binary_like
 from ...types.cast.cast_options import CastOptions
 from ...types.cast.registry import convert
@@ -43,13 +47,14 @@ except ImportError:
 
 if databricks_sdk is not None:
     from databricks.sdk.service.sql import (
-
+        Disposition, Format,
        ExecuteStatementRequestOnWaitTimeout, StatementParameterListItem
     )
-    StatementResponse = StatementResponse
 else:
-
-
+    Disposition = DatabricksDummyClass
+    Format = DatabricksDummyClass
+    ExecuteStatementRequestOnWaitTimeout = DatabricksDummyClass
+    StatementParameterListItem = DatabricksDummyClass
 
 
 logger = logging.getLogger(__name__)
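When `databricks_sdk` is missing, the SDK type names above are bound to `DatabricksDummyClass` (the new `yggdrasil/types/dummy_class.py` in the file list) so that module import and annotations keep working. A minimal, self-contained sketch of that placeholder pattern, using a generic stand-in rather than the package's actual implementation:

```python
# Generic optional-dependency placeholder; the real DatabricksDummyClass may behave differently.
class _MissingDependency:
    """Stand-in for symbols of an optional dependency that is not installed."""

    def __init__(self, *args, **kwargs):
        raise ImportError("databricks-sdk is required for this feature: pip install databricks-sdk")


try:
    from databricks.sdk.service.sql import Disposition, Format  # real names when the SDK is present
except ImportError:
    Disposition = _MissingDependency
    Format = _MissingDependency


def is_external(disposition) -> bool:
    # Annotations and comparisons work at import time; only instantiation fails loudly.
    return disposition == getattr(Disposition, "EXTERNAL_LINKS", None)
```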
@@ -57,7 +62,11 @@ logger = logging.getLogger(__name__)
 if pyspark is not None:
     import pyspark.sql.functions as F
 
-
+
+__all__ = [
+    "SQLEngine",
+    "StatementResult"
+]
 
 
 @dataclasses.dataclass
@@ -88,10 +97,12 @@ def _needs_column_mapping(col_name: str) -> bool:
 @dataclasses.dataclass
 class SQLEngine(WorkspaceService):
     """Execute SQL statements and manage tables via Databricks SQL / Spark."""
-    warehouse_id: Optional[str] = None
     catalog_name: Optional[str] = None
     schema_name: Optional[str] = None
 
+    _warehouse: Optional[SQLWarehouse] = dataclasses.field(default=None, repr=False, hash=False, compare=False)
+    _ai_session: Optional[SQLAISession] = dataclasses.field(default=None, repr=False, hash=False, compare=False)
+
     def table_full_name(
         self,
         catalog_name: Optional[str] = None,
@@ -147,68 +158,8 @@ class SQLEngine(WorkspaceService):
             return self.catalog_name, parts[0], parts[1]
 
         catalog_name, schema_name, table_name = parts[-3], parts[-2], parts[-1]
-        catalog_name = catalog_name or self.catalog_name
-        schema_name = schema_name or self.schema_name
-        return catalog_name, schema_name, table_name
-
-    def _default_warehouse(
-        self,
-        cluster_size: str = "Small"
-    ):
-        """Pick a default SQL warehouse (best-effort) matching the desired size.
-
-        Args:
-            cluster_size: Desired warehouse size (Databricks "cluster_size"), e.g. "Small".
-                If empty/None, returns the first warehouse encountered.
 
-
-            Warehouse object.
-
-        Raises:
-            ValueError: If no warehouses exist in the workspace.
-        """
-        wk = self.workspace.sdk()
-        existing = list(wk.warehouses.list())
-        first = None
-
-        for warehouse in existing:
-            if first is None:
-                first = warehouse
-
-            if cluster_size:
-                if getattr(warehouse, "cluster_size", None) == cluster_size:
-                    logger.debug("Default warehouse match found: id=%s cluster_size=%s", warehouse.id, warehouse.cluster_size)
-                    return warehouse
-            else:
-                logger.debug("Default warehouse selected (first): id=%s", warehouse.id)
-                return warehouse
-
-        if first is not None:
-            logger.info(
-                "No warehouse matched cluster_size=%s; falling back to first warehouse id=%s cluster_size=%s",
-                cluster_size,
-                getattr(first, "id", None),
-                getattr(first, "cluster_size", None),
-            )
-            return first
-
-        raise ValueError(f"No default warehouse found in {wk.config.host}")
-
-    def _get_or_default_warehouse_id(self, cluster_size: str = "Small") -> str:
-        """Return configured warehouse_id or resolve a default one.
-
-        Args:
-            cluster_size: Desired warehouse size filter used when resolving defaults.
-
-        Returns:
-            Warehouse id string.
-        """
-        if not self.warehouse_id:
-            dft = self._default_warehouse(cluster_size=cluster_size)
-            self.warehouse_id = dft.id
-            logger.info("Resolved default warehouse_id=%s (cluster_size=%s)", self.warehouse_id, cluster_size)
-
-        return self.warehouse_id
+        return catalog_name or self.catalog_name, schema_name or self.schema_name, table_name
 
     @staticmethod
     def _random_suffix(prefix: str = "") -> str:
@@ -217,12 +168,44 @@ class SQLEngine(WorkspaceService):
         timestamp = int(time.time() * 1000)
         return f"{prefix}{timestamp}_{unique}"
 
-
-
-
-
-
-
+    def warehouse(
+        self,
+        warehouse_id: Optional[str] = None,
+        warehouse_name: Optional[str] = None,
+    ) -> SQLWarehouse:
+        if self._warehouse is None:
+            wh = SQLWarehouse(
+                workspace=self.workspace,
+                warehouse_id=warehouse_id,
+                warehouse_name=warehouse_name
+            )
+
+            self._warehouse = wh.find_warehouse(
+                warehouse_id=warehouse_id,
+                warehouse_name=warehouse_name,
+                raise_error=False
+            )
+
+            if self._warehouse is None:
+                self._warehouse = wh.create_or_update()
+
+        return self._warehouse.find_warehouse(
+            warehouse_id=warehouse_id,
+            warehouse_name=warehouse_name,
+            raise_error=True
+        )
+
+    def ai_session(
+        self,
+        model: str = "databricks-gemini-2-5-pro",
+        flavor: SQLFlavor = SQLFlavor.DATABRICKS
+    ):
+        return SQLAISession(
+            model=model,
+            api_key=self.workspace.current_token(),
+            base_url="%s/serving-endpoints" % self.workspace.safe_host,
+            flavor=flavor
+        )
 
     def execute(
         self,
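The new `warehouse()` helper lazily resolves (or creates) a `SQLWarehouse` and caches it on the engine, while `ai_session()` wraps the workspace's serving endpoints in a `SQLAISession`. A hypothetical usage sketch based only on the signatures in this hunk; the import path, the `workspace` object and all argument values are assumptions:

```python
# Sketch only: SQLEngine/Workspace wiring is assumed, not taken from package docs.
from yggdrasil.databricks.sql.engine import SQLEngine

# `workspace` is an already-configured yggdrasil Workspace object (construction not shown here).
engine = SQLEngine(workspace=workspace, catalog_name="main", schema_name="analytics")

wh = engine.warehouse(warehouse_name="shared-endpoint")  # resolved once, then cached on the engine
ai = engine.ai_session()                                 # defaults to databricks-gemini-2-5-pro
```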
@@ -230,17 +213,17 @@ class SQLEngine(WorkspaceService):
         *,
         engine: Optional[Literal["spark", "api"]] = None,
         warehouse_id: Optional[str] = None,
+        warehouse_name: Optional[str] = None,
         byte_limit: Optional[int] = None,
-        disposition: Optional[
-        format: Optional[
-        on_wait_timeout: Optional[
-        parameters: Optional[List[
+        disposition: Optional[Disposition] = None,
+        format: Optional[Format] = None,
+        on_wait_timeout: Optional[ExecuteStatementRequestOnWaitTimeout] = None,
+        parameters: Optional[List[StatementParameterListItem]] = None,
         row_limit: Optional[int] = None,
         wait_timeout: Optional[str] = None,
         catalog_name: Optional[str] = None,
         schema_name: Optional[str] = None,
-
-        wait_result: bool = True,
+        wait: Optional[WaitingConfigArg] = True
     ) -> "StatementResult":
         """Execute a SQL statement via Spark or Databricks SQL Statement Execution API.
 
@@ -256,6 +239,7 @@ class SQLEngine(WorkspaceService):
             statement: SQL statement to execute. If None, a `SELECT *` is generated from the table params.
             engine: "spark" or "api".
             warehouse_id: Warehouse override (for API engine).
+            warehouse_name: Warehouse name override (for API engine).
             byte_limit: Optional byte limit for results.
             disposition: Result disposition mode (API engine).
             format: Result format (API engine).
@@ -265,8 +249,7 @@ class SQLEngine(WorkspaceService):
             wait_timeout: API wait timeout value.
             catalog_name: Optional catalog override for API engine.
             schema_name: Optional schema override for API engine.
-
-            wait_result: Whether to block until completion (API engine).
+            wait: Whether to block until completion (API engine).
 
         Returns:
             StatementResult.
@@ -284,72 +267,44 @@ class SQLEngine(WorkspaceService):
             if spark_session is None:
                 raise ValueError("No spark session found to run sql query")
 
-            df: SparkDataFrame = spark_session.sql(statement)
-
-            if row_limit:
-                df = df.limit(row_limit)
-
             logger.debug(
-                "SPARK SQL
+                "SPARK SQL executing query:\n%s",
                 statement
             )
 
-
-
+            df: SparkDataFrame = spark_session.sql(statement)
+
+            if row_limit:
+                df = df.limit(row_limit)
 
             return StatementResult(
-
-
-
+                workspace_client=self.workspace.sdk(),
+                warehouse_id="SparkSQL",
+                statement_id="SparkSQL",
+                disposition=Disposition.EXTERNAL_LINKS,
                 _spark_df=df,
             )
 
-
-
-
-
-        if (disposition is None or disposition == Disposition.INLINE) and format in [Format.CSV, Format.ARROW_STREAM]:
-            disposition = Disposition.EXTERNAL_LINKS
-
-        if not statement:
-            full_name = self.table_full_name(catalog_name=catalog_name, schema_name=schema_name, table_name=table_name)
-            statement = f"SELECT * FROM {full_name}"
-
-        if not warehouse_id:
-            warehouse_id = self._get_or_default_warehouse_id()
+        wh = self.warehouse(
+            warehouse_id=warehouse_id,
+            warehouse_name=warehouse_name,
+        )
 
-
+        return wh.execute(
             statement=statement,
             warehouse_id=warehouse_id,
+            warehouse_name=warehouse_name,
             byte_limit=byte_limit,
             disposition=disposition,
             format=format,
             on_wait_timeout=on_wait_timeout,
             parameters=parameters,
-            row_limit=row_limit,
             wait_timeout=wait_timeout,
-
-
-
-
-        execution = StatementResult(
-            engine=self,
-            statement_id=response.statement_id,
-            _response=response,
-            disposition=disposition,
-        )
-
-        logger.info(
-            "API SQL executed statement '%s'",
-            execution.statement_id
-        )
-        logger.debug(
-            "API SQL executed query:\n%s",
-            statement
+            catalog_name=catalog_name,
+            schema_name=schema_name,
+            wait=wait
         )
 
-        return execution.wait() if wait_result else execution
-
     def spark_table(
         self,
         full_name: Optional[str] = None,
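After this change `execute()` no longer resolves warehouse IDs or builds API `StatementResult` objects itself; the API path is delegated to `SQLWarehouse.execute()` and `wait` replaces `wait_result`. A hypothetical call sketch continuing the assumed `engine` object from the earlier sketch; only the parameter names come from the signature shown in this diff:

```python
# Assumed statement and warehouse name, for illustration only.
result = engine.execute(
    "SELECT COUNT(*) AS n FROM main.analytics.events",
    engine="api",                      # route through the SQL Statement Execution API
    warehouse_name="shared-endpoint",
    wait=True,                         # block until the statement completes
)

pending = engine.execute("OPTIMIZE main.analytics.events", wait=False)  # returns without waiting
```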
@@ -412,7 +367,7 @@ class SQLEngine(WorkspaceService):
             None (mutates the destination table).
         """
 
-        if pyspark is not None:
+        if pyspark is not None or spark_session is not None:
             spark_session = SparkSession.getActiveSession() if spark_session is None else spark_session
 
             if spark_session is not None or isinstance(data, SparkDataFrame):
@@ -502,6 +457,7 @@ class SQLEngine(WorkspaceService):
         if existing_schema is None:
             try:
                 existing_schema = connected.get_table_schema(
+                    location=location,
                     catalog_name=catalog_name,
                     schema_name=schema_name,
                     table_name=table_name,
@@ -511,8 +467,7 @@ class SQLEngine(WorkspaceService):
                 data_tbl = convert(data, pa.Table)
                 existing_schema = data_tbl.schema
                 logger.warning(
-                    "
-                    location,
+                    "%s, creating it from input schema (columns=%s)",
                     exc,
                     existing_schema.names,
                 )
@@ -544,13 +499,11 @@ class SQLEngine(WorkspaceService):
             except Exception:
                 logger.exception("Arrow insert failed after auto-creating %s; attempting cleanup (DROP TABLE)", location)
                 try:
-                    connected.drop_table(location=location)
+                    connected.drop_table(location=location, wait=True)
                 except Exception:
                     logger.exception("Failed to drop table %s after auto creation error", location)
                 raise
 
-        transaction_id = self._random_suffix()
-
         data_tbl = convert(
             data, pa.Table,
             options=cast_options, target_field=existing_schema
@@ -567,14 +520,15 @@ class SQLEngine(WorkspaceService):
         )
 
         # Write in temp volume
-        temp_volume_path =
-
-
+        temp_volume_path = self.workspace.tmp_path(
+            catalog_name=catalog_name,
+            schema_name=schema_name,
+            volume_name="tmp",
+            extension="parquet"
         ) if temp_volume_path is None else DatabricksPath.parse(obj=temp_volume_path, workspace=connected.workspace)
 
         logger.debug("Staging Parquet to temp volume: %s", temp_volume_path)
-        temp_volume_path.
-        temp_volume_path.write_arrow_table(data_tbl)
+        temp_volume_path.write_arrow_table(data_tbl, file_format=pds.ParquetFileFormat())
 
         columns = list(existing_schema.names)
         cols_quoted = ", ".join([f"`{c}`" for c in columns])
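The Arrow payload is staged as Parquet in a temporary Unity Catalog volume and then loaded into the target table with a single SQL statement that reads directly from the staged Parquet files. A standalone sketch of that pattern using plain `pyarrow`; the statement wording, path and table name are placeholders, not values from the package:

```python
import tempfile

import pyarrow as pa
import pyarrow.dataset as pds

data_tbl = pa.table({"id": [1, 2, 3], "name": ["a", "b", "c"]})

# In the package this is a Unity Catalog volume path; a local temp dir keeps the sketch runnable.
temp_volume_path = tempfile.mkdtemp(prefix="stage_")
pds.write_dataset(data_tbl, temp_volume_path, format=pds.ParquetFileFormat())

cols_quoted = ", ".join(f"`{c}`" for c in data_tbl.schema.names)
stmt = f"""INSERT INTO `main`.`analytics`.`events` ({cols_quoted})
SELECT {cols_quoted}
FROM parquet.`{temp_volume_path}`"""
print(stmt)  # engine.execute(stmt) would run this against the warehouse
```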
@@ -620,7 +574,12 @@ FROM parquet.`{temp_volume_path}`"""
             connected.execute(stmt.strip())
         finally:
             try:
-
+                Thread(
+                    target=temp_volume_path.rmdir,
+                    kwargs={
+                        "recursive": True
+                    }
+                ).start()
             except Exception:
                 logger.exception("Failed cleaning temp volume: %s", temp_volume_path)
 
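Cleanup of the staging directory now runs on a background thread so the insert call does not wait for the volume deletion. A standalone sketch of the same fire-and-forget pattern, with `shutil.rmtree` standing in for `DatabricksPath.rmdir(recursive=True)`:

```python
import shutil
import tempfile
from threading import Thread

staging_dir = tempfile.mkdtemp(prefix="stage_")

# Start the removal and return immediately; errors inside the thread do not propagate here.
cleanup = Thread(target=shutil.rmtree, kwargs={"path": staging_dir, "ignore_errors": True})
cleanup.start()

cleanup.join()  # only so this sketch exits after cleanup; the package code does not join
```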
@@ -732,8 +691,6 @@ FROM parquet.`{temp_volume_path}`"""
         cast_options = CastOptions.check_arg(options=cast_options, target_field=existing_schema)
         data = cast_spark_dataframe(data, options=cast_options)
 
-        logger.debug("Incoming Spark columns: %s", data.columns)
-
         if match_by:
             notnull = None
             for k in match_by:
@@ -788,6 +745,7 @@ FROM parquet.`{temp_volume_path}`"""
 
     def get_table_schema(
         self,
+        location: Optional[str] = None,
         catalog_name: Optional[str] = None,
         schema_name: Optional[str] = None,
         table_name: Optional[str] = None,
@@ -796,6 +754,7 @@ FROM parquet.`{temp_volume_path}`"""
         """Fetch a table schema from Unity Catalog and convert it to Arrow types.
 
         Args:
+            location: Optional Fully qualified location name
             catalog_name: Optional catalog override.
             schema_name: Optional schema override.
             table_name: Optional table name override.
@@ -804,25 +763,44 @@ FROM parquet.`{temp_volume_path}`"""
         Returns:
             Arrow Schema or a STRUCT Field representing the table.
         """
-
+        location, catalog_name, schema_name, table_name = self._check_location_params(
+            location=location,
             catalog_name=catalog_name,
             schema_name=schema_name,
             table_name=table_name,
             safe_chars=False,
         )
 
-
+        client = self.workspace.sdk().tables
 
         try:
-            table =
+            table = client.get(location)
         except Exception as e:
-            raise ValueError(f"Table %s not found, {type(e)} {e}" %
+            raise ValueError(f"Table %s not found, {type(e)} {e}" % location)
 
-        fields = [
+        fields = [
+            column_info_to_arrow_field(_) for _ in table.columns
+        ]
+
+        metadata = {
+            b"engine": b"databricks",
+            b"full_name": location,
+            b"catalog_name": catalog_name,
+            b"schema_name": schema_name,
+            b"table_name": table_name,
+        }
 
         if to_arrow_schema:
-            return pa.schema(
-
+            return pa.schema(
+                fields,
+                metadata=metadata
+            )
+
+        return pa.field(
+            location,
+            pa.struct(fields),
+            metadata=metadata
+        )
 
     def drop_table(
         self,
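The rewritten `get_table_schema()` builds Arrow fields from the Unity Catalog column info and attaches the table coordinates as schema metadata, returning either a `pa.Schema` or a struct `pa.Field`. A standalone sketch of the resulting shape using plain `pyarrow`, with placeholder column types standing in for `column_info_to_arrow_field` output:

```python
import pyarrow as pa

location = "main.analytics.events"  # assumed fully qualified table name
fields = [pa.field("id", pa.int64()), pa.field("name", pa.string())]  # placeholder columns

metadata = {
    b"engine": b"databricks",
    b"full_name": location,
    b"catalog_name": "main",
    b"schema_name": "analytics",
    b"table_name": "events",
}

schema = pa.schema(fields, metadata=metadata)                            # to_arrow_schema=True branch
struct_field = pa.field(location, pa.struct(fields), metadata=metadata)  # default branch
print(schema.metadata[b"full_name"])
```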
@@ -830,6 +808,7 @@ FROM parquet.`{temp_volume_path}`"""
         catalog_name: Optional[str] = None,
         schema_name: Optional[str] = None,
         table_name: Optional[str] = None,
+        wait: Optional[WaitingConfigArg] = True
     ):
         """Drop a table if it exists."""
         location, _, _, _ = self._check_location_params(
@@ -839,13 +818,17 @@ FROM parquet.`{temp_volume_path}`"""
             table_name=table_name,
             safe_chars=True,
         )
-
-
+
+        logger.debug("Dropping table if exists: %s", location)
+
+        self.execute(f"DROP TABLE IF EXISTS {location}", wait=wait)
+
+        logger.info("Dropped table if exists: %s", location)
 
     def create_table(
         self,
         field: Union[pa.Field, pa.Schema],
-
+        full_name: Optional[str] = None,  # e.g. catalog.schema.table
         catalog_name: Optional[str] = None,
         schema_name: Optional[str] = None,
         table_name: Optional[str] = None,
@@ -853,7 +836,7 @@ FROM parquet.`{temp_volume_path}`"""
         partition_by: Optional[list[str]] = None,
         cluster_by: Optional[bool | list[str]] = True,
         comment: Optional[str] = None,
-
+        properties: Optional[dict[str, Any]] = None,
         if_not_exists: bool = True,
         or_replace: bool = False,
         using: str = "DELTA",
@@ -886,7 +869,7 @@ FROM parquet.`{temp_volume_path}`"""
             - If `pa.Schema`, all schema fields are used as columns.
             - If `pa.Field` with struct type, its children become columns.
             - If `pa.Field` non-struct, it becomes a single-column table.
-
+        full_name:
             Fully-qualified table name, e.g. `"catalog.schema.table"`.
             If provided, it takes precedence over `catalog_name`/`schema_name`/`table_name`.
             Parts are quoted as needed.
@@ -906,7 +889,7 @@ FROM parquet.`{temp_volume_path}`"""
             - list[str] -> emits `CLUSTER BY (<cols...>)` (all cols must exist in schema)
         comment:
             Optional table comment. If not provided and Arrow metadata contains `b"comment"`, that is used.
-
+        properties:
             Additional/override Delta table properties (final say).
             Example: `{"delta.enableChangeDataFeed": "true"}` or `{"delta.logRetentionDuration": "30 days"}`
         if_not_exists:
@@ -973,19 +956,22 @@ FROM parquet.`{temp_volume_path}`"""
         Examples
         --------
         Create a managed Delta table with auto clustering and auto column mapping:
-        >>> plan = client.create_table(schema,
+        >>> plan = client.create_table(schema, full_name="main.analytics.events", execute=False, return_plan=True)
         >>> print(plan.sql)
 
         External table with explicit partitioning and CDF:
         >>> client.create_table(
         ...     schema,
-        ...
+        ...     full_name="main.analytics.events",
         ...     storage_location="abfss://.../events",
         ...     partition_by=["event_date"],
         ...     enable_cdf=True,
         ... )
         """
 
+        if not isinstance(field, (pa.Field, pa.Schema)):
+            field = convert(field, pa.Field)
+
         # ---- Normalize Arrow input ----
         if isinstance(field, pa.Schema):
             arrow_fields = list(field)
@@ -998,16 +984,13 @@ FROM parquet.`{temp_volume_path}`"""
         else:
             arrow_fields = [field]
 
-
-
-
-
-
-
-
-        # If caller passes raw "cat.schema.table", quote each part safely
-        parts = table_fqn.split(".")
-        table_fqn = ".".join(_quote_ident(p) for p in parts)
+        full_name, catalog_name, schema_name, table_name = self._check_location_params(
+            location=full_name,
+            catalog_name=catalog_name,
+            schema_name=schema_name,
+            table_name=table_name,
+            safe_chars=True
+        )
 
         # ---- Comments ----
         if comment is None and schema_metadata:
@@ -1051,7 +1034,7 @@ FROM parquet.`{temp_volume_path}`"""
             create_kw = "CREATE TABLE IF NOT EXISTS"
 
         sql_parts: list[str] = [
-            f"{create_kw} {
+            f"{create_kw} {full_name} (",
            " " + ",\n ".join(column_definitions),
             ")",
             f"USING {using}",
@@ -1096,8 +1079,8 @@ FROM parquet.`{temp_volume_path}`"""
                 pass
 
         # Let caller override anything (final say)
-        if
-            props.update(
+        if properties:
+            props.update(properties)
 
         if any_invalid and column_mapping_mode == "none":
             warnings.append(
@@ -1105,6 +1088,11 @@ FROM parquet.`{temp_volume_path}`"""
                 "This will fail unless you rename/escape columns."
             )
 
+        default_tags = self.workspace.default_tags()
+
+        for k, v in default_tags.items():
+            props[f"tags.{k}"] = v
+
         if props:
             def fmt(k: str, v: Any) -> str:
                 if isinstance(v, str):
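Workspace default tags are now folded into the table properties as `tags.<key>` entries before the `TBLPROPERTIES` clause is rendered. A standalone sketch of that merge with placeholder tag values; the `fmt()` body below is only a plausible rendering, since the hunk shows just its signature:

```python
from typing import Any

props = {"delta.enableChangeDataFeed": "true"}
default_tags = {"owner": "data-platform", "env": "dev"}  # assumed output of workspace.default_tags()

for k, v in default_tags.items():
    props[f"tags.{k}"] = v

def fmt(k: str, v: Any) -> str:
    # Quote string values; render everything else as-is (assumed behaviour).
    return f"'{k}' = '{v}'" if isinstance(v, str) else f"'{k}' = {v}"

tblproperties = "TBLPROPERTIES (\n  " + ",\n  ".join(fmt(k, v) for k, v in props.items()) + "\n)"
print(tblproperties)
```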
@@ -1122,7 +1110,7 @@ FROM parquet.`{temp_volume_path}`"""
         if not execute:
             return plan if return_plan else statement
 
-        res = self.execute(statement,
+        res = self.execute(statement, wait=wait_result)
         plan.result = res
         return plan if return_plan else res
 