duckdb-1.5.0.dev44-cp313-cp313-win_amd64.whl → duckdb-1.5.0.dev94-cp313-cp313-win_amd64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release: this version of duckdb might be problematic.

Files changed (56)
  1. _duckdb-stubs/__init__.pyi +1443 -0
  2. _duckdb-stubs/_func.pyi +46 -0
  3. _duckdb-stubs/_sqltypes.pyi +75 -0
  4. _duckdb.cp313-win_amd64.pyd +0 -0
  5. adbc_driver_duckdb/__init__.py +49 -0
  6. adbc_driver_duckdb/dbapi.py +115 -0
  7. duckdb/__init__.py +341 -435
  8. duckdb/_dbapi_type_object.py +231 -0
  9. duckdb/_version.py +22 -0
  10. duckdb/bytes_io_wrapper.py +12 -9
  11. duckdb/experimental/__init__.py +2 -1
  12. duckdb/experimental/spark/__init__.py +3 -4
  13. duckdb/experimental/spark/_globals.py +8 -8
  14. duckdb/experimental/spark/_typing.py +7 -9
  15. duckdb/experimental/spark/conf.py +16 -15
  16. duckdb/experimental/spark/context.py +60 -44
  17. duckdb/experimental/spark/errors/__init__.py +33 -35
  18. duckdb/experimental/spark/errors/error_classes.py +1 -1
  19. duckdb/experimental/spark/errors/exceptions/__init__.py +1 -1
  20. duckdb/experimental/spark/errors/exceptions/base.py +39 -88
  21. duckdb/experimental/spark/errors/utils.py +11 -16
  22. duckdb/experimental/spark/exception.py +9 -6
  23. duckdb/experimental/spark/sql/__init__.py +5 -5
  24. duckdb/experimental/spark/sql/_typing.py +8 -15
  25. duckdb/experimental/spark/sql/catalog.py +21 -20
  26. duckdb/experimental/spark/sql/column.py +48 -55
  27. duckdb/experimental/spark/sql/conf.py +9 -8
  28. duckdb/experimental/spark/sql/dataframe.py +185 -233
  29. duckdb/experimental/spark/sql/functions.py +1222 -1248
  30. duckdb/experimental/spark/sql/group.py +56 -52
  31. duckdb/experimental/spark/sql/readwriter.py +80 -94
  32. duckdb/experimental/spark/sql/session.py +64 -59
  33. duckdb/experimental/spark/sql/streaming.py +9 -10
  34. duckdb/experimental/spark/sql/type_utils.py +67 -65
  35. duckdb/experimental/spark/sql/types.py +309 -345
  36. duckdb/experimental/spark/sql/udf.py +6 -6
  37. duckdb/filesystem.py +26 -16
  38. duckdb/func/__init__.py +3 -0
  39. duckdb/functional/__init__.py +12 -16
  40. duckdb/polars_io.py +130 -83
  41. duckdb/query_graph/__main__.py +91 -96
  42. duckdb/sqltypes/__init__.py +63 -0
  43. duckdb/typing/__init__.py +18 -8
  44. duckdb/udf.py +10 -5
  45. duckdb/value/__init__.py +1 -0
  46. duckdb/value/constant/__init__.py +62 -60
  47. {duckdb-1.5.0.dev44.dist-info → duckdb-1.5.0.dev94.dist-info}/METADATA +12 -4
  48. duckdb-1.5.0.dev94.dist-info/RECORD +52 -0
  49. duckdb/__init__.pyi +0 -713
  50. duckdb/functional/__init__.pyi +0 -31
  51. duckdb/typing/__init__.pyi +0 -36
  52. duckdb/value/constant/__init__.pyi +0 -115
  53. duckdb-1.5.0.dev44.dist-info/RECORD +0 -47
  54. /duckdb/{value/__init__.pyi → py.typed} +0 -0
  55. {duckdb-1.5.0.dev44.dist-info → duckdb-1.5.0.dev94.dist-info}/WHEEL +0 -0
  56. {duckdb-1.5.0.dev44.dist-info → duckdb-1.5.0.dev94.dist-info}/licenses/LICENSE +0 -0
duckdb/experimental/spark/sql/__init__.py
@@ -1,7 +1,7 @@
-from .session import SparkSession
-from .readwriter import DataFrameWriter
-from .dataframe import DataFrame
+from .catalog import Catalog  # noqa: D104
 from .conf import RuntimeConfig
-from .catalog import Catalog
+from .dataframe import DataFrame
+from .readwriter import DataFrameWriter
+from .session import SparkSession
 
-__all__ = ["SparkSession", "DataFrame", "RuntimeConfig", "DataFrameWriter", "Catalog"]
+__all__ = ["Catalog", "DataFrame", "DataFrameWriter", "RuntimeConfig", "SparkSession"]
duckdb/experimental/spark/sql/_typing.py
@@ -19,12 +19,11 @@
 from typing import (
     Any,
     Callable,
-    List,
     Optional,
-    Tuple,
     TypeVar,
     Union,
 )
+
 try:
     from typing import Literal, Protocol
 except ImportError:
@@ -57,24 +56,21 @@ AtomicValue = TypeVar(
     float,
 )
 
-RowLike = TypeVar("RowLike", List[Any], Tuple[Any, ...], types.Row)
+RowLike = TypeVar("RowLike", list[Any], tuple[Any, ...], types.Row)
 
 SQLBatchedUDFType = Literal[100]
 
 
 class SupportsOpen(Protocol):
-    def open(self, partition_id: int, epoch_id: int) -> bool:
-        ...
+    def open(self, partition_id: int, epoch_id: int) -> bool: ...
 
 
 class SupportsProcess(Protocol):
-    def process(self, row: types.Row) -> None:
-        ...
+    def process(self, row: types.Row) -> None: ...
 
 
 class SupportsClose(Protocol):
-    def close(self, error: Exception) -> None:
-        ...
+    def close(self, error: Exception) -> None: ...
 
 
 class UserDefinedFunctionLike(Protocol):
@@ -83,11 +79,8 @@ class UserDefinedFunctionLike(Protocol):
     deterministic: bool
 
     @property
-    def returnType(self) -> types.DataType:
-        ...
+    def returnType(self) -> types.DataType: ...
 
-    def __call__(self, *args: ColumnOrName) -> Column:
-        ...
+    def __call__(self, *args: ColumnOrName) -> Column: ...
 
-    def asNondeterministic(self) -> "UserDefinedFunctionLike":
-        ...
+    def asNondeterministic(self) -> "UserDefinedFunctionLike": ...
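
Both _typing.py changes above are typing-level only: built-in generics (list, tuple; PEP 585) replace typing.List/typing.Tuple, and the protocol method stubs collapse to one-line `...` bodies. As a reminder of how such PEP 544 protocols are consumed, here is a minimal runnable sketch; the class and function names are hypothetical, and types.Row is simplified to a plain tuple:

    from typing import Protocol


    class SupportsProcess(Protocol):
        def process(self, row: tuple) -> None: ...


    # Structural typing: any class with a matching process() method
    # satisfies the protocol without inheriting from it.
    class RowPrinter:
        def process(self, row: tuple) -> None:
            print(row)


    def drain(sink: SupportsProcess, rows: list[tuple]) -> None:
        for row in rows:
            sink.process(row)


    drain(RowPrinter(), [(1, "a"), (2, "b")])
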
duckdb/experimental/spark/sql/catalog.py
@@ -1,14 +1,15 @@
-from typing import List, NamedTuple, Optional
+from typing import NamedTuple, Optional, Union  # noqa: D100
+
 from .session import SparkSession
 
 
-class Database(NamedTuple):
+class Database(NamedTuple):  # noqa: D101
     name: str
     description: Optional[str]
     locationUri: str
 
 
-class Table(NamedTuple):
+class Table(NamedTuple):  # noqa: D101
     name: str
     database: Optional[str]
     description: Optional[str]
@@ -16,7 +17,7 @@ class Table(NamedTuple):
     isTemporary: bool
 
 
-class Column(NamedTuple):
+class Column(NamedTuple):  # noqa: D101
     name: str
     description: Optional[str]
     dataType: str
@@ -25,36 +26,36 @@ class Column(NamedTuple):
     isBucket: bool
 
 
-class Function(NamedTuple):
+class Function(NamedTuple):  # noqa: D101
     name: str
     description: Optional[str]
     className: str
     isTemporary: bool
 
 
-class Catalog:
-    def __init__(self, session: SparkSession):
+class Catalog:  # noqa: D101
+    def __init__(self, session: SparkSession) -> None:  # noqa: D107
         self._session = session
 
-    def listDatabases(self) -> List[Database]:
-        res = self._session.conn.sql('select database_name from duckdb_databases()').fetchall()
+    def listDatabases(self) -> list[Database]:  # noqa: D102
+        res = self._session.conn.sql("select database_name from duckdb_databases()").fetchall()
 
-        def transform_to_database(x) -> Database:
-            return Database(name=x[0], description=None, locationUri='')
+        def transform_to_database(x: list[str]) -> Database:
+            return Database(name=x[0], description=None, locationUri="")
 
         databases = [transform_to_database(x) for x in res]
         return databases
 
-    def listTables(self) -> List[Table]:
-        res = self._session.conn.sql('select table_name, database_name, sql, temporary from duckdb_tables()').fetchall()
+    def listTables(self) -> list[Table]:  # noqa: D102
+        res = self._session.conn.sql("select table_name, database_name, sql, temporary from duckdb_tables()").fetchall()
 
-        def transform_to_table(x) -> Table:
-            return Table(name=x[0], database=x[1], description=x[2], tableType='', isTemporary=x[3])
+        def transform_to_table(x: list[str]) -> Table:
+            return Table(name=x[0], database=x[1], description=x[2], tableType="", isTemporary=x[3])
 
         tables = [transform_to_table(x) for x in res]
         return tables
 
-    def listColumns(self, tableName: str, dbName: Optional[str] = None) -> List[Column]:
+    def listColumns(self, tableName: str, dbName: Optional[str] = None) -> list[Column]:  # noqa: D102
         query = f"""
         select column_name, data_type, is_nullable from duckdb_columns() where table_name = '{tableName}'
         """
@@ -62,17 +63,17 @@ class Catalog:
             query += f" and database_name = '{dbName}'"
         res = self._session.conn.sql(query).fetchall()
 
-        def transform_to_column(x) -> Column:
+        def transform_to_column(x: list[Union[str, bool]]) -> Column:
            return Column(name=x[0], description=None, dataType=x[1], nullable=x[2], isPartition=False, isBucket=False)
 
         columns = [transform_to_column(x) for x in res]
         return columns
 
-    def listFunctions(self, dbName: Optional[str] = None) -> List[Function]:
+    def listFunctions(self, dbName: Optional[str] = None) -> list[Function]:  # noqa: D102
         raise NotImplementedError
 
-    def setCurrentDatabase(self, dbName: str) -> None:
+    def setCurrentDatabase(self, dbName: str) -> None:  # noqa: D102
         raise NotImplementedError
 
 
-__all__ = ["Catalog", "Table", "Column", "Function", "Database"]
+__all__ = ["Catalog", "Column", "Database", "Function", "Table"]
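
For context, these Catalog methods are thin wrappers over DuckDB's duckdb_databases(), duckdb_tables(), and duckdb_columns() table functions. A hedged usage sketch, assuming the PySpark-style SparkSession.builder entry point of the experimental Spark API; Catalog(session) is the constructor shown in the hunk above:

    from duckdb.experimental.spark.sql import SparkSession
    from duckdb.experimental.spark.sql.catalog import Catalog

    spark = SparkSession.builder.getOrCreate()
    spark.sql("CREATE TABLE t (a INTEGER, b VARCHAR)")

    catalog = Catalog(spark)
    print(catalog.listDatabases())   # e.g. [Database(name='memory', ...)]
    print(catalog.listTables())      # e.g. [Table(name='t', database='memory', ...)]
    print(catalog.listColumns("t"))  # e.g. [Column(name='a', dataType='INTEGER', ...)]
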
duckdb/experimental/spark/sql/column.py
@@ -1,19 +1,19 @@
-from typing import Union, TYPE_CHECKING, Any, cast, Callable, Tuple
-from ..exception import ContributionsAcceptedError
+from collections.abc import Iterable  # noqa: D100
+from typing import TYPE_CHECKING, Any, Callable, Union, cast
 
+from ..exception import ContributionsAcceptedError
 from .types import DataType
 
 if TYPE_CHECKING:
-    from ._typing import ColumnOrName, LiteralType, DecimalLiteral, DateTimeLiteral
+    from ._typing import DateTimeLiteral, DecimalLiteral, LiteralType
 
-from duckdb import ConstantExpression, ColumnExpression, FunctionExpression, Expression
-
-from duckdb.typing import DuckDBPyType
+from duckdb import ColumnExpression, ConstantExpression, Expression, FunctionExpression
+from duckdb.sqltypes import DuckDBPyType
 
 __all__ = ["Column"]
 
 
-def _get_expr(x) -> Expression:
+def _get_expr(x: Union["Column", str]) -> Expression:
     return x.expr if isinstance(x, Column) else ConstantExpression(x)
 
 
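
Note the import move in this hunk: DuckDBPyType now comes from the new duckdb.sqltypes module (duckdb/sqltypes/__init__.py in the file list) rather than duckdb.typing; duckdb/typing/__init__.py is still shipped in this wheel (its +18 -8 entry above), presumably as a compatibility shim. For downstream code, hedged on that assumption:

    # New import path as of 1.5.0.dev94, per this diff:
    from duckdb.sqltypes import DuckDBPyType

    # Old path, still present in this wheel:
    #   from duckdb.typing import DuckDBPyType

    # String-to-type construction, as Column.cast() uses it below:
    print(DuckDBPyType("VARCHAR"))
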
@@ -30,7 +30,7 @@ def _unary_op(
     name: str,
     doc: str = "unary operator",
 ) -> Callable[["Column"], "Column"]:
-    """Create a method for given unary operator"""
+    """Create a method for given unary operator."""
 
     def _(self: "Column") -> "Column":
         # Call the function identified by 'name' on the internal Expression object
@@ -45,7 +45,7 @@ def _bin_op(
     name: str,
     doc: str = "binary operator",
 ) -> Callable[["Column", Union["Column", "LiteralType", "DecimalLiteral", "DateTimeLiteral"]], "Column"]:
-    """Create a method for given binary operator"""
+    """Create a method for given binary operator."""
 
     def _(
         self: "Column",
@@ -63,7 +63,7 @@ def _bin_func(
     name: str,
     doc: str = "binary function",
 ) -> Callable[["Column", Union["Column", "LiteralType", "DecimalLiteral", "DateTimeLiteral"]], "Column"]:
-    """Create a function expression for the given binary function"""
+    """Create a function expression for the given binary function."""
 
     def _(
         self: "Column",
@@ -78,8 +78,7 @@ def _bin_func(
 
 
 class Column:
-    """
-    A column in a DataFrame.
+    """A column in a DataFrame.
 
     :class:`Column` instances can be created by::
 
@@ -95,11 +94,11 @@ class Column:
     .. versionadded:: 1.3.0
     """
 
-    def __init__(self, expr: Expression):
+    def __init__(self, expr: Expression) -> None:  # noqa: D107
         self.expr = expr
 
     # arithmetic operators
-    def __neg__(self):
+    def __neg__(self) -> "Column":  # noqa: D105
         return Column(-self.expr)
 
     # `and`, `or`, `not` cannot be overloaded in Python,
@@ -138,9 +137,8 @@ class Column:
 
     __rpow__ = _bin_op("__rpow__")
 
-    def __getitem__(self, k: Any) -> "Column":
-        """
-        An expression that gets an item at position ``ordinal`` out of a list,
+    def __getitem__(self, k: Any) -> "Column":  # noqa: ANN401
+        """An expression that gets an item at position ``ordinal`` out of a list,
         or gets an item by key out of a dict.
 
         .. versionadded:: 1.3.0
@@ -153,35 +151,34 @@ class Column:
         k
             a literal value, or a slice object without step.
 
-        Returns
+        Returns:
         -------
         :class:`Column`
             Column representing the item got by key out of a dict, or substrings sliced by
             the given slice object.
 
-        Examples
+        Examples:
         --------
-        >>> df = spark.createDataFrame([('abcedfg', {"key": "value"})], ["l", "d"])
-        >>> df.select(df.l[slice(1, 3)], df.d['key']).show()
+        >>> df = spark.createDataFrame([("abcedfg", {"key": "value"})], ["l", "d"])
+        >>> df.select(df.l[slice(1, 3)], df.d["key"]).show()
         +------------------+------+
         |substring(l, 1, 3)|d[key]|
         +------------------+------+
         |               abc| value|
         +------------------+------+
-        """
+        """  # noqa: D205
         if isinstance(k, slice):
             raise ContributionsAcceptedError
             # if k.step is not None:
             #     raise ValueError("Using a slice with a step value is not supported")
             # return self.substr(k.start, k.stop)
         else:
-            # FIXME: this is super hacky
+            # TODO: this is super hacky  # noqa: TD002, TD003
             expr_str = str(self.expr) + "." + str(k)
             return Column(ColumnExpression(expr_str))
 
-    def __getattr__(self, item: Any) -> "Column":
-        """
-        An expression that gets an item at position ``ordinal`` out of a list,
+    def __getattr__(self, item: Any) -> "Column":  # noqa: ANN401
+        """An expression that gets an item at position ``ordinal`` out of a list,
         or gets an item by key out of a dict.
 
         Parameters
@@ -189,55 +186,53 @@ class Column:
         item
             a literal value.
 
-        Returns
+        Returns:
         -------
         :class:`Column`
             Column representing the item got by key out of a dict.
 
-        Examples
+        Examples:
         --------
-        >>> df = spark.createDataFrame([('abcedfg', {"key": "value"})], ["l", "d"])
+        >>> df = spark.createDataFrame([("abcedfg", {"key": "value"})], ["l", "d"])
         >>> df.select(df.d.key).show()
         +------+
         |d[key]|
         +------+
         | value|
         +------+
-        """
+        """  # noqa: D205
         if item.startswith("__"):
-            raise AttributeError("Can not access __ (dunder) method")
+            msg = "Can not access __ (dunder) method"
+            raise AttributeError(msg)
         return self[item]
 
-    def alias(self, alias: str):
+    def alias(self, alias: str) -> "Column":  # noqa: D102
         return Column(self.expr.alias(alias))
 
-    def when(self, condition: "Column", value: Any):
+    def when(self, condition: "Column", value: Union["Column", str]) -> "Column":  # noqa: D102
         if not isinstance(condition, Column):
-            raise TypeError("condition should be a Column")
+            msg = "condition should be a Column"
+            raise TypeError(msg)
         v = _get_expr(value)
         expr = self.expr.when(condition.expr, v)
         return Column(expr)
 
-    def otherwise(self, value: Any):
+    def otherwise(self, value: Union["Column", str]) -> "Column":  # noqa: D102
         v = _get_expr(value)
         expr = self.expr.otherwise(v)
         return Column(expr)
 
-    def cast(self, dataType: Union[DataType, str]) -> "Column":
-        if isinstance(dataType, str):
-            # Try to construct a default DuckDBPyType from it
-            internal_type = DuckDBPyType(dataType)
-        else:
-            internal_type = dataType.duckdb_type
+    def cast(self, dataType: Union[DataType, str]) -> "Column":  # noqa: D102
+        internal_type = DuckDBPyType(dataType) if isinstance(dataType, str) else dataType.duckdb_type
         return Column(self.expr.cast(internal_type))
 
-    def isin(self, *cols: Any) -> "Column":
+    def isin(self, *cols: Union[Iterable[Union["Column", str]], Union["Column", str]]) -> "Column":  # noqa: D102
         if len(cols) == 1 and isinstance(cols[0], (list, set)):
             # Only one argument supplied, it's a list
-            cols = cast(Tuple, cols[0])
+            cols = cast("tuple", cols[0])
 
         cols = cast(
-            Tuple,
+            "tuple",
             [_get_expr(c) for c in cols],
         )
         return Column(self.expr.isin(*cols))
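
A short sketch exercising the methods rewritten above (cast from a type string, when/otherwise chaining, isin); it assumes the PySpark-compatible col() and when() helpers that duckdb.experimental.spark.sql.functions provides:

    from duckdb.experimental.spark.sql import SparkSession
    from duckdb.experimental.spark.sql import functions as F

    spark = SparkSession.builder.getOrCreate()
    df = spark.createDataFrame([(1, "a"), (2, "b")], ["id", "tag"])

    out = df.select(
        F.col("id").cast("VARCHAR").alias("id_str"),                # str resolved via DuckDBPyType
        F.when(F.col("tag") == "a", 1).otherwise(0).alias("is_a"),  # case expression
        F.col("id").isin(1, 2).alias("known_id"),
    )
    out.show()
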
@@ -247,14 +242,14 @@ class Column:
         self,
         other: Union["Column", "LiteralType", "DecimalLiteral", "DateTimeLiteral"],
     ) -> "Column":
-        """binary function"""
+        """Binary function."""
         return Column(self.expr == (_get_expr(other)))
 
     def __ne__(  # type: ignore[override]
         self,
-        other: Any,
+        other: object,
     ) -> "Column":
-        """binary function"""
+        """Binary function."""
         return Column(self.expr != (_get_expr(other)))
 
     __lt__ = _bin_op("__lt__")
@@ -347,22 +342,20 @@ class Column:
     nulls_first = _unary_op("nulls_first")
     nulls_last = _unary_op("nulls_last")
 
-
-    def asc_nulls_first(self) -> "Column":
+    def asc_nulls_first(self) -> "Column":  # noqa: D102
         return self.asc().nulls_first()
 
-    def asc_nulls_last(self) -> "Column":
+    def asc_nulls_last(self) -> "Column":  # noqa: D102
         return self.asc().nulls_last()
 
-    def desc_nulls_first(self) -> "Column":
+    def desc_nulls_first(self) -> "Column":  # noqa: D102
         return self.desc().nulls_first()
 
-    def desc_nulls_last(self) -> "Column":
+    def desc_nulls_last(self) -> "Column":  # noqa: D102
         return self.desc().nulls_last()
 
-    def isNull(self) -> "Column":
+    def isNull(self) -> "Column":  # noqa: D102
         return Column(self.expr.isnull())
 
-    def isNotNull(self) -> "Column":
+    def isNotNull(self) -> "Column":  # noqa: D102
         return Column(self.expr.isnotnull())
-
duckdb/experimental/spark/sql/conf.py
@@ -1,22 +1,23 @@
-from typing import Optional, Union
-from duckdb.experimental.spark._globals import _NoValueType, _NoValue
+from typing import Optional, Union  # noqa: D100
+
 from duckdb import DuckDBPyConnection
+from duckdb.experimental.spark._globals import _NoValue, _NoValueType
 
 
-class RuntimeConfig:
-    def __init__(self, connection: DuckDBPyConnection):
+class RuntimeConfig:  # noqa: D101
+    def __init__(self, connection: DuckDBPyConnection) -> None:  # noqa: D107
         self._connection = connection
 
-    def set(self, key: str, value: str) -> None:
+    def set(self, key: str, value: str) -> None:  # noqa: D102
         raise NotImplementedError
 
-    def isModifiable(self, key: str) -> bool:
+    def isModifiable(self, key: str) -> bool:  # noqa: D102
         raise NotImplementedError
 
-    def unset(self, key: str) -> None:
+    def unset(self, key: str) -> None:  # noqa: D102
         raise NotImplementedError
 
-    def get(self, key: str, default: Union[Optional[str], _NoValueType] = _NoValue) -> str:
+    def get(self, key: str, default: Union[Optional[str], _NoValueType] = _NoValue) -> str:  # noqa: D102
         raise NotImplementedError
 