polars-runtime-compat 1.34.0b2-cp39-abi3-win_amd64.whl → 1.34.0b4-cp39-abi3-win_amd64.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release: this version of polars-runtime-compat might be problematic.
- _polars_runtime_compat/_polars_runtime_compat.pyd +0 -0
- {polars_runtime_compat-1.34.0b2.dist-info → polars_runtime_compat-1.34.0b4.dist-info}/METADATA +1 -1
- polars_runtime_compat-1.34.0b4.dist-info/RECORD +6 -0
- polars/__init__.py +0 -528
- polars/_cpu_check.py +0 -265
- polars/_dependencies.py +0 -355
- polars/_plr.py +0 -99
- polars/_plr.pyi +0 -2496
- polars/_reexport.py +0 -23
- polars/_typing.py +0 -478
- polars/_utils/__init__.py +0 -37
- polars/_utils/async_.py +0 -102
- polars/_utils/cache.py +0 -176
- polars/_utils/cloud.py +0 -40
- polars/_utils/constants.py +0 -29
- polars/_utils/construction/__init__.py +0 -46
- polars/_utils/construction/dataframe.py +0 -1397
- polars/_utils/construction/other.py +0 -72
- polars/_utils/construction/series.py +0 -560
- polars/_utils/construction/utils.py +0 -118
- polars/_utils/convert.py +0 -224
- polars/_utils/deprecation.py +0 -406
- polars/_utils/getitem.py +0 -457
- polars/_utils/logging.py +0 -11
- polars/_utils/nest_asyncio.py +0 -264
- polars/_utils/parquet.py +0 -15
- polars/_utils/parse/__init__.py +0 -12
- polars/_utils/parse/expr.py +0 -242
- polars/_utils/polars_version.py +0 -19
- polars/_utils/pycapsule.py +0 -53
- polars/_utils/scan.py +0 -27
- polars/_utils/serde.py +0 -63
- polars/_utils/slice.py +0 -215
- polars/_utils/udfs.py +0 -1251
- polars/_utils/unstable.py +0 -63
- polars/_utils/various.py +0 -782
- polars/_utils/wrap.py +0 -25
- polars/api.py +0 -370
- polars/catalog/__init__.py +0 -0
- polars/catalog/unity/__init__.py +0 -19
- polars/catalog/unity/client.py +0 -733
- polars/catalog/unity/models.py +0 -152
- polars/config.py +0 -1571
- polars/convert/__init__.py +0 -25
- polars/convert/general.py +0 -1046
- polars/convert/normalize.py +0 -261
- polars/dataframe/__init__.py +0 -5
- polars/dataframe/_html.py +0 -186
- polars/dataframe/frame.py +0 -12582
- polars/dataframe/group_by.py +0 -1067
- polars/dataframe/plotting.py +0 -257
- polars/datatype_expr/__init__.py +0 -5
- polars/datatype_expr/array.py +0 -56
- polars/datatype_expr/datatype_expr.py +0 -304
- polars/datatype_expr/list.py +0 -18
- polars/datatype_expr/struct.py +0 -69
- polars/datatypes/__init__.py +0 -122
- polars/datatypes/_parse.py +0 -195
- polars/datatypes/_utils.py +0 -48
- polars/datatypes/classes.py +0 -1213
- polars/datatypes/constants.py +0 -11
- polars/datatypes/constructor.py +0 -172
- polars/datatypes/convert.py +0 -366
- polars/datatypes/group.py +0 -130
- polars/exceptions.py +0 -230
- polars/expr/__init__.py +0 -7
- polars/expr/array.py +0 -964
- polars/expr/binary.py +0 -346
- polars/expr/categorical.py +0 -306
- polars/expr/datetime.py +0 -2620
- polars/expr/expr.py +0 -11272
- polars/expr/list.py +0 -1408
- polars/expr/meta.py +0 -444
- polars/expr/name.py +0 -321
- polars/expr/string.py +0 -3045
- polars/expr/struct.py +0 -357
- polars/expr/whenthen.py +0 -185
- polars/functions/__init__.py +0 -193
- polars/functions/aggregation/__init__.py +0 -33
- polars/functions/aggregation/horizontal.py +0 -298
- polars/functions/aggregation/vertical.py +0 -341
- polars/functions/as_datatype.py +0 -848
- polars/functions/business.py +0 -138
- polars/functions/col.py +0 -384
- polars/functions/datatype.py +0 -121
- polars/functions/eager.py +0 -524
- polars/functions/escape_regex.py +0 -29
- polars/functions/lazy.py +0 -2751
- polars/functions/len.py +0 -68
- polars/functions/lit.py +0 -210
- polars/functions/random.py +0 -22
- polars/functions/range/__init__.py +0 -19
- polars/functions/range/_utils.py +0 -15
- polars/functions/range/date_range.py +0 -303
- polars/functions/range/datetime_range.py +0 -370
- polars/functions/range/int_range.py +0 -348
- polars/functions/range/linear_space.py +0 -311
- polars/functions/range/time_range.py +0 -287
- polars/functions/repeat.py +0 -301
- polars/functions/whenthen.py +0 -353
- polars/interchange/__init__.py +0 -10
- polars/interchange/buffer.py +0 -77
- polars/interchange/column.py +0 -190
- polars/interchange/dataframe.py +0 -230
- polars/interchange/from_dataframe.py +0 -328
- polars/interchange/protocol.py +0 -303
- polars/interchange/utils.py +0 -170
- polars/io/__init__.py +0 -64
- polars/io/_utils.py +0 -317
- polars/io/avro.py +0 -49
- polars/io/clipboard.py +0 -36
- polars/io/cloud/__init__.py +0 -17
- polars/io/cloud/_utils.py +0 -80
- polars/io/cloud/credential_provider/__init__.py +0 -17
- polars/io/cloud/credential_provider/_builder.py +0 -520
- polars/io/cloud/credential_provider/_providers.py +0 -618
- polars/io/csv/__init__.py +0 -9
- polars/io/csv/_utils.py +0 -38
- polars/io/csv/batched_reader.py +0 -142
- polars/io/csv/functions.py +0 -1495
- polars/io/database/__init__.py +0 -6
- polars/io/database/_arrow_registry.py +0 -70
- polars/io/database/_cursor_proxies.py +0 -147
- polars/io/database/_executor.py +0 -578
- polars/io/database/_inference.py +0 -314
- polars/io/database/_utils.py +0 -144
- polars/io/database/functions.py +0 -516
- polars/io/delta.py +0 -499
- polars/io/iceberg/__init__.py +0 -3
- polars/io/iceberg/_utils.py +0 -697
- polars/io/iceberg/dataset.py +0 -556
- polars/io/iceberg/functions.py +0 -151
- polars/io/ipc/__init__.py +0 -8
- polars/io/ipc/functions.py +0 -514
- polars/io/json/__init__.py +0 -3
- polars/io/json/read.py +0 -101
- polars/io/ndjson.py +0 -332
- polars/io/parquet/__init__.py +0 -17
- polars/io/parquet/field_overwrites.py +0 -140
- polars/io/parquet/functions.py +0 -722
- polars/io/partition.py +0 -491
- polars/io/plugins.py +0 -187
- polars/io/pyarrow_dataset/__init__.py +0 -5
- polars/io/pyarrow_dataset/anonymous_scan.py +0 -109
- polars/io/pyarrow_dataset/functions.py +0 -79
- polars/io/scan_options/__init__.py +0 -5
- polars/io/scan_options/_options.py +0 -59
- polars/io/scan_options/cast_options.py +0 -126
- polars/io/spreadsheet/__init__.py +0 -6
- polars/io/spreadsheet/_utils.py +0 -52
- polars/io/spreadsheet/_write_utils.py +0 -647
- polars/io/spreadsheet/functions.py +0 -1323
- polars/lazyframe/__init__.py +0 -9
- polars/lazyframe/engine_config.py +0 -61
- polars/lazyframe/frame.py +0 -8564
- polars/lazyframe/group_by.py +0 -669
- polars/lazyframe/in_process.py +0 -42
- polars/lazyframe/opt_flags.py +0 -333
- polars/meta/__init__.py +0 -14
- polars/meta/build.py +0 -33
- polars/meta/index_type.py +0 -27
- polars/meta/thread_pool.py +0 -50
- polars/meta/versions.py +0 -120
- polars/ml/__init__.py +0 -0
- polars/ml/torch.py +0 -213
- polars/ml/utilities.py +0 -30
- polars/plugins.py +0 -155
- polars/py.typed +0 -0
- polars/pyproject.toml +0 -96
- polars/schema.py +0 -265
- polars/selectors.py +0 -3117
- polars/series/__init__.py +0 -5
- polars/series/array.py +0 -776
- polars/series/binary.py +0 -254
- polars/series/categorical.py +0 -246
- polars/series/datetime.py +0 -2275
- polars/series/list.py +0 -1087
- polars/series/plotting.py +0 -191
- polars/series/series.py +0 -9197
- polars/series/string.py +0 -2367
- polars/series/struct.py +0 -154
- polars/series/utils.py +0 -191
- polars/sql/__init__.py +0 -7
- polars/sql/context.py +0 -677
- polars/sql/functions.py +0 -139
- polars/string_cache.py +0 -185
- polars/testing/__init__.py +0 -13
- polars/testing/asserts/__init__.py +0 -9
- polars/testing/asserts/frame.py +0 -231
- polars/testing/asserts/series.py +0 -219
- polars/testing/asserts/utils.py +0 -12
- polars/testing/parametric/__init__.py +0 -33
- polars/testing/parametric/profiles.py +0 -107
- polars/testing/parametric/strategies/__init__.py +0 -22
- polars/testing/parametric/strategies/_utils.py +0 -14
- polars/testing/parametric/strategies/core.py +0 -615
- polars/testing/parametric/strategies/data.py +0 -452
- polars/testing/parametric/strategies/dtype.py +0 -436
- polars/testing/parametric/strategies/legacy.py +0 -169
- polars/type_aliases.py +0 -24
- polars_runtime_compat-1.34.0b2.dist-info/RECORD +0 -203
- {polars_runtime_compat-1.34.0b2.dist-info → polars_runtime_compat-1.34.0b4.dist-info}/WHEEL +0 -0
- {polars_runtime_compat-1.34.0b2.dist-info → polars_runtime_compat-1.34.0b4.dist-info}/licenses/LICENSE +0 -0
polars/io/iceberg/_utils.py
DELETED
@@ -1,697 +0,0 @@
-from __future__ import annotations
-
-import abc
-import ast
-import contextlib
-from _ast import GtE, Lt, LtE
-from ast import (
-    Attribute,
-    BinOp,
-    BitAnd,
-    BitOr,
-    Call,
-    Compare,
-    Constant,
-    Eq,
-    Gt,
-    Invert,
-    List,
-    Name,
-    UnaryOp,
-)
-from dataclasses import dataclass
-from functools import cache, singledispatch
-from typing import TYPE_CHECKING, Any, Callable
-
-import polars._reexport as pl
-from polars._utils.convert import to_py_date, to_py_datetime
-from polars._utils.logging import eprint
-from polars._utils.wrap import wrap_s
-from polars.exceptions import ComputeError
-
-if TYPE_CHECKING:
-    from collections.abc import Sequence
-    from datetime import date, datetime
-
-    import pyiceberg
-    import pyiceberg.schema
-    from pyiceberg.manifest import DataFile
-    from pyiceberg.table import Table
-    from pyiceberg.types import IcebergType
-
-    from polars import DataFrame, Series
-else:
-    from polars._dependencies import pyiceberg
-
-_temporal_conversions: dict[str, Callable[..., datetime | date]] = {
-    "to_py_date": to_py_date,
-    "to_py_datetime": to_py_datetime,
-}
-
-ICEBERG_TIME_TO_NS: int = 1000
-
-
-def _scan_pyarrow_dataset_impl(
-    tbl: Table,
-    with_columns: list[str] | None = None,
-    predicate: str | None = None,
-    n_rows: int | None = None,
-    snapshot_id: int | None = None,
-    **kwargs: Any,
-) -> DataFrame | Series:
-    """
-    Take the projected columns and materialize an arrow table.
-
-    Parameters
-    ----------
-    tbl
-        pyarrow dataset
-    with_columns
-        Columns that are projected
-    predicate
-        pyarrow expression that can be evaluated with eval
-    n_rows:
-        Materialize only n rows from the arrow dataset.
-    snapshot_id:
-        The snapshot ID to scan from.
-    batch_size
-        The maximum row count for scanned pyarrow record batches.
-    kwargs:
-        For backward compatibility
-
-    Returns
-    -------
-    DataFrame
-    """
-    from polars import from_arrow
-
-    scan = tbl.scan(limit=n_rows, snapshot_id=snapshot_id)
-
-    if with_columns is not None:
-        scan = scan.select(*with_columns)
-
-    if predicate is not None:
-        try:
-            expr_ast = _to_ast(predicate)
-            pyiceberg_expr = _convert_predicate(expr_ast)
-        except ValueError as e:
-            msg = f"Could not convert predicate to PyIceberg: {predicate}"
-            raise ValueError(msg) from e
-
-        scan = scan.filter(pyiceberg_expr)
-
-    return from_arrow(scan.to_arrow())
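A minimal usage sketch for the entry point above, assuming tbl is a pyiceberg.table.Table; the predicate string is hypothetical, standing in for whatever the polars scan layer serializes and the _to_ast / _convert_predicate helpers below parse:

    df = _scan_pyarrow_dataset_impl(
        tbl,
        with_columns=["a", "b"],               # projection pushed into tbl.scan()
        predicate="(field('a') > scalar(1))",  # hypothetical serialized predicate
        n_rows=10,                             # becomes tbl.scan(limit=10)
    )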
-
-
-def _to_ast(expr: str) -> ast.expr:
-    """
-    Converts a Python string to an AST.
-
-    This will take the Python Arrow expression (as a string), and it will
-    be converted into a Python AST that can be traversed to convert it to a PyIceberg
-    expression.
-
-    The reason to convert it to an AST is because the PyArrow expression
-    itself doesn't have any methods/properties to traverse the expression.
-    We need this to convert it into a PyIceberg expression.
-
-    Parameters
-    ----------
-    expr
-        The string expression
-
-    Returns
-    -------
-    The AST representing the Arrow expression
-    """
-    return ast.parse(expr, mode="eval").body
-
-
-@singledispatch
-def _convert_predicate(a: Any) -> Any:
-    """Walks the AST to convert the PyArrow expression to a PyIceberg expression."""
-    msg = f"Unexpected symbol: {a}"
-    raise ValueError(msg)
-
-
-@_convert_predicate.register(Constant)
-def _(a: Constant) -> Any:
-    return a.value
-
-
-@_convert_predicate.register(Name)
-def _(a: Name) -> Any:
-    return a.id
-
-
-@_convert_predicate.register(UnaryOp)
-def _(a: UnaryOp) -> Any:
-    if isinstance(a.op, Invert):
-        return pyiceberg.expressions.Not(_convert_predicate(a.operand))
-    else:
-        msg = f"Unexpected UnaryOp: {a}"
-        raise TypeError(msg)
-
-
-@_convert_predicate.register(Call)
-def _(a: Call) -> Any:
-    args = [_convert_predicate(arg) for arg in a.args]
-    f = _convert_predicate(a.func)
-    if f == "field":
-        return args
-    elif f == "scalar":
-        return args[0]
-    elif f in _temporal_conversions:
-        # convert from polars-native i64 to ISO8601 string
-        return _temporal_conversions[f](*args).isoformat()
-    else:
-        ref = _convert_predicate(a.func.value)[0]  # type: ignore[attr-defined]
-        if f == "isin":
-            return pyiceberg.expressions.In(ref, args[0])
-        elif f == "is_null":
-            return pyiceberg.expressions.IsNull(ref)
-        elif f == "is_nan":
-            return pyiceberg.expressions.IsNaN(ref)
-
-    msg = f"Unknown call: {f!r}"
-    raise ValueError(msg)
-
-
-@_convert_predicate.register(Attribute)
-def _(a: Attribute) -> Any:
-    return a.attr
-
-
-@_convert_predicate.register(BinOp)
-def _(a: BinOp) -> Any:
-    lhs = _convert_predicate(a.left)
-    rhs = _convert_predicate(a.right)
-
-    op = a.op
-    if isinstance(op, BitAnd):
-        return pyiceberg.expressions.And(lhs, rhs)
-    if isinstance(op, BitOr):
-        return pyiceberg.expressions.Or(lhs, rhs)
-    else:
-        msg = f"Unknown: {lhs} {op} {rhs}"
-        raise TypeError(msg)
-
-
-@_convert_predicate.register(Compare)
-def _(a: Compare) -> Any:
-    op = a.ops[0]
-    lhs = _convert_predicate(a.left)[0]
-    rhs = _convert_predicate(a.comparators[0])
-
-    if isinstance(op, Gt):
-        return pyiceberg.expressions.GreaterThan(lhs, rhs)
-    if isinstance(op, GtE):
-        return pyiceberg.expressions.GreaterThanOrEqual(lhs, rhs)
-    if isinstance(op, Eq):
-        return pyiceberg.expressions.EqualTo(lhs, rhs)
-    if isinstance(op, Lt):
-        return pyiceberg.expressions.LessThan(lhs, rhs)
-    if isinstance(op, LtE):
-        return pyiceberg.expressions.LessThanOrEqual(lhs, rhs)
-    else:
-        msg = f"Unknown comparison: {op}"
-        raise TypeError(msg)
-
-
-@_convert_predicate.register(List)
-def _(a: List) -> Any:
-    return [_convert_predicate(e) for e in a.elts]
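The singledispatch handlers above walk that AST node by node: field(...) calls collect column references, scalar(...) unwraps literals, BitAnd/BitOr become And/Or, and comparison operators map onto the corresponding PyIceberg expressions. A round-trip sketch with a hypothetical predicate string (assumes pyiceberg is installed):

    import ast

    predicate = "(field('a') > scalar(1)) & field('b').is_null()"
    tree = ast.parse(predicate, mode="eval").body  # equivalent to _to_ast(predicate)
    converted = _convert_predicate(tree)
    # equivalent to:
    # pyiceberg.expressions.And(GreaterThan("a", 1), IsNull("b"))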
-
-
-class IdentityTransformedPartitionValuesBuilder:
-    def __init__(
-        self,
-        table: Table,
-        projected_schema: pyiceberg.schema.Schema,
-    ) -> None:
-        import pyiceberg.schema
-        from pyiceberg.io.pyarrow import schema_to_pyarrow
-        from pyiceberg.transforms import IdentityTransform
-        from pyiceberg.types import (
-            DoubleType,
-            FloatType,
-            IntegerType,
-            LongType,
-        )
-
-        projected_ids: set[int] = projected_schema.field_ids
-
-        # {source_field_id: [values] | error_message}
-        self.partition_values: dict[int, list[Any] | str] = {}
-        # Logical types will have length-2 list [<constructor type>, <cast type>].
-        # E.g. for Datetime it will be [Int64, Datetime]
-        self.partition_values_dtypes: dict[int, pl.DataType] = {}
-
-        # {spec_id: [partition_value_index, source_field_id]}
-        self.partition_spec_id_to_identity_transforms: dict[
-            int, list[tuple[int, int]]
-        ] = {}
-
-        partition_specs = table.specs()
-
-        for spec_id, spec in partition_specs.items():
-            out = []
-
-            for field_index, field in enumerate(spec.fields):
-                if field.source_id in projected_ids and isinstance(
-                    field.transform, IdentityTransform
-                ):
-                    out.append((field_index, field.source_id))
-                    self.partition_values[field.source_id] = []
-
-            self.partition_spec_id_to_identity_transforms[spec_id] = out
-
-        for field_id in self.partition_values:
-            projected_field = projected_schema.find_field(field_id)
-            projected_type = projected_field.field_type
-
-            _, output_dtype = pl.Schema(
-                schema_to_pyarrow(pyiceberg.schema.Schema(projected_field))
-            ).popitem()
-
-            self.partition_values_dtypes[field_id] = output_dtype
-
-            if not projected_type.is_primitive or output_dtype.is_nested():
-                self.partition_values[field_id] = (
-                    f"non-primitive type: {projected_type = } {output_dtype = }"
-                )
-
-            for schema in table.schemas().values():
-                try:
-                    type_this_schema = schema.find_field(field_id).field_type
-                except ValueError:
-                    continue
-
-                if not (
-                    projected_type == type_this_schema
-                    or (
-                        isinstance(projected_type, LongType)
-                        and isinstance(type_this_schema, IntegerType)
-                    )
-                    or (
-                        isinstance(projected_type, (DoubleType, FloatType))
-                        and isinstance(type_this_schema, (DoubleType, FloatType))
-                    )
-                ):
-                    self.partition_values[field_id] = (
-                        f"unsupported type change: from: {type_this_schema}, "
-                        f"to: {projected_type}"
-                    )
-
-    def push_partition_values(
-        self,
-        *,
-        current_index: int,
-        partition_spec_id: int,
-        partition_values: pyiceberg.typedef.Record,
-    ) -> None:
-        try:
-            identity_transforms = self.partition_spec_id_to_identity_transforms[
-                partition_spec_id
-            ]
-        except KeyError:
-            self.partition_values = {
-                k: f"partition spec ID not found: {partition_spec_id}"
-                for k in self.partition_values
-            }
-            return
-
-        for i, source_field_id in identity_transforms:
-            partition_value = partition_values[i]
-
-            if isinstance(values := self.partition_values[source_field_id], list):
-                # extend() - there can be gaps from partitions being
-                # added/removed/re-added
-                values.extend(None for _ in range(current_index - len(values)))
-                values.append(partition_value)
-
-    def finish(self) -> dict[int, pl.Series | str]:
-        from polars.datatypes import Date, Datetime, Duration, Int32, Int64, Time
-
-        out: dict[int, pl.Series | str] = {}
-
-        for field_id, v in self.partition_values.items():
-            if isinstance(v, str):
-                out[field_id] = v
-            else:
-                try:
-                    output_dtype = self.partition_values_dtypes[field_id]
-
-                    constructor_dtype = (
-                        Int64
-                        if isinstance(output_dtype, (Datetime, Duration, Time))
-                        else Int32
-                        if isinstance(output_dtype, Date)
-                        else output_dtype
-                    )
-
-                    s = pl.Series(v, dtype=constructor_dtype)
-
-                    assert not s.dtype.is_nested()
-
-                    if isinstance(output_dtype, Time):
-                        # Physical from PyIceberg is in microseconds, physical
-                        # used by polars is in nanoseconds.
-                        s = s * ICEBERG_TIME_TO_NS
-
-                    s = s.cast(output_dtype)
-
-                    out[field_id] = s
-
-                except Exception as e:
-                    out[field_id] = f"failed to load partition values: {e}"
-
-        return out
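The Time branch in finish() exists because Iceberg stores time-of-day values as microseconds since midnight while the polars physical representation is nanoseconds, hence the multiplication by ICEBERG_TIME_TO_NS (1000). A standalone sketch of that conversion, with a made-up sample value:

    import polars as pl

    micros = 45_296_000_000                         # 12:34:56 as Iceberg time (us)
    s = pl.Series([micros], dtype=pl.Int64) * 1000  # * ICEBERG_TIME_TO_NS
    print(s.cast(pl.Time))                          # [12:34:56]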
-
-
-class IcebergStatisticsLoader:
-    def __init__(
-        self,
-        table: Table,
-        projected_filter_schema: pyiceberg.schema.Schema,
-    ) -> None:
-        import pyiceberg.schema
-        from pyiceberg.io.pyarrow import schema_to_pyarrow
-
-        import polars as pl
-        import polars._utils.logging
-
-        verbose = polars._utils.logging.verbose()
-
-        self.file_column_statistics: dict[int, IcebergColumnStatisticsLoader] = {}
-        self.load_as_empty_statistics: list[str] = []
-        self.file_lengths: list[int] = []
-        self.projected_filter_schema = projected_filter_schema
-
-        for field in projected_filter_schema.fields:
-            field_all_types = set()
-
-            for schema in table.schemas().values():
-                with contextlib.suppress(ValueError):
-                    field_all_types.add(schema.find_field(field.field_id).field_type)
-
-            _, field_polars_dtype = pl.Schema(
-                schema_to_pyarrow(pyiceberg.schema.Schema(field))
-            ).popitem()
-
-            load_from_bytes_impl = LoadFromBytesImpl.init_for_field_type(
-                field.field_type,
-                field_all_types,
-                field_polars_dtype,
-            )
-
-            if verbose:
-                _load_from_bytes_impl = (
-                    type(load_from_bytes_impl).__name__
-                    if load_from_bytes_impl is not None
-                    else "None"
-                )
-
-                eprint(
-                    "IcebergStatisticsLoader: "
-                    f"{field.name = }, "
-                    f"{field.field_id = }, "
-                    f"{field.field_type = }, "
-                    f"{field_all_types = }, "
-                    f"{field_polars_dtype = }, "
-                    f"{_load_from_bytes_impl = }"
-                )
-
-            self.file_column_statistics[field.field_id] = IcebergColumnStatisticsLoader(
-                field_id=field.field_id,
-                column_name=field.name,
-                column_dtype=field_polars_dtype,
-                load_from_bytes_impl=load_from_bytes_impl,
-                min_values=[],
-                max_values=[],
-                null_count=[],
-            )
-
-    def push_file_statistics(self, file: DataFile) -> None:
-        self.file_lengths.append(file.record_count)
-
-        for stats in self.file_column_statistics.values():
-            stats.push_file_statistics(file)
-
-    def finish(
-        self,
-        expected_height: int,
-        identity_transformed_values: dict[int, pl.Series | str],
-    ) -> pl.DataFrame:
-        import polars as pl
-
-        out: list[pl.DataFrame] = [
-            pl.Series("len", self.file_lengths, dtype=pl.UInt32).to_frame()
-        ]
-
-        for field_id, stat_builder in self.file_column_statistics.items():
-            if (p := identity_transformed_values.get(field_id)) is not None:
-                if isinstance(p, str):
-                    msg = f"statistics load failure for filter column: {p}"
-                    raise ComputeError(msg)
-
-            column_stats_df = stat_builder.finish(expected_height, p)
-            out.append(column_stats_df)
-
-        return pl.concat(out, how="horizontal")
-
-
-@dataclass
-class IcebergColumnStatisticsLoader:
-    column_name: str
-    column_dtype: pl.DataType
-    field_id: int
-    load_from_bytes_impl: LoadFromBytesImpl | None
-    null_count: list[int | None]
-    min_values: list[bytes | None]
-    max_values: list[bytes | None]
-
-    def push_file_statistics(self, file: DataFile) -> None:
-        self.null_count.append(file.null_value_counts.get(self.field_id))
-
-        if self.load_from_bytes_impl is not None:
-            self.min_values.append(file.lower_bounds.get(self.field_id))
-            self.max_values.append(file.upper_bounds.get(self.field_id))
-
-    def finish(
-        self,
-        expected_height: int,
-        identity_transformed_values: pl.Series | None,
-    ) -> pl.DataFrame:
-        import polars as pl
-
-        c = self.column_name
-        assert len(self.null_count) == expected_height
-
-        out = pl.Series(f"{c}_nc", self.null_count, dtype=pl.UInt32).to_frame()
-
-        if self.load_from_bytes_impl is None:
-            s = (
-                identity_transformed_values
-                if identity_transformed_values is not None
-                else pl.repeat(None, expected_height, dtype=self.column_dtype)
-            )
-
-            return out.with_columns(s.alias(f"{c}_min"), s.alias(f"{c}_max"))
-
-        assert len(self.min_values) == expected_height
-        assert len(self.max_values) == expected_height
-
-        if self.column_dtype.is_nested():
-            raise NotImplementedError
-
-        min_values = self.load_from_bytes_impl.load_from_bytes(self.min_values)
-        max_values = self.load_from_bytes_impl.load_from_bytes(self.max_values)
-
-        if identity_transformed_values is not None:
-            assert identity_transformed_values.dtype == self.column_dtype
-
-            identity_transformed_values = identity_transformed_values.extend_constant(
-                None, expected_height - identity_transformed_values.len()
-            )
-
-            min_values = identity_transformed_values.fill_null(min_values)
-            max_values = identity_transformed_values.fill_null(max_values)
-
-        return out.with_columns(
-            min_values.alias(f"{c}_min"), max_values.alias(f"{c}_max")
-        )
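Column naming in the per-file statistics frame follows the two finish() methods above: one row per data file, a UInt32 "len" column from record_count, plus "<name>_nc" / "<name>_min" / "<name>_max" columns per filter field. An illustrative frame for a single integer column "a" across two data files (all values hypothetical):

    import polars as pl

    stats = pl.DataFrame(
        {
            "len":   pl.Series([100, 80], dtype=pl.UInt32),  # record_count per file
            "a_nc":  pl.Series([0, 5], dtype=pl.UInt32),     # null_value_counts
            "a_min": [1, 42],                                # decoded lower_bounds
            "a_max": [10, 99],                               # decoded upper_bounds
        }
    )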
-
-
-# Lazy init instead of global const as PyIceberg is an optional dependency
-@cache
-def _bytes_loader_lookup() -> dict[
-    type[IcebergType],
-    tuple[type[LoadFromBytesImpl], type[IcebergType] | Sequence[type[IcebergType]]],
-]:
-    from pyiceberg.types import (
-        BinaryType,
-        BooleanType,
-        DateType,
-        DecimalType,
-        FixedType,
-        IntegerType,
-        LongType,
-        StringType,
-        TimestampType,
-        TimestamptzType,
-        TimeType,
-    )
-
-    # TODO: Float statistics
-    return {
-        BooleanType: (LoadBooleanFromBytes, BooleanType),
-        DateType: (LoadDateFromBytes, DateType),
-        TimeType: (LoadTimeFromBytes, TimeType),
-        TimestampType: (LoadTimestampFromBytes, TimestampType),
-        TimestamptzType: (LoadTimestamptzFromBytes, TimestamptzType),
-        IntegerType: (LoadInt32FromBytes, IntegerType),
-        LongType: (LoadInt64FromBytes, (LongType, IntegerType)),
-        StringType: (LoadStringFromBytes, StringType),
-        BinaryType: (LoadBinaryFromBytes, BinaryType),
-        DecimalType: (LoadDecimalFromBytes, DecimalType),
-        FixedType: (LoadFixedFromBytes, FixedType),
-    }
-
-
-class LoadFromBytesImpl(abc.ABC):
-    def __init__(self, polars_dtype: pl.DataType) -> None:
-        self.polars_dtype = polars_dtype
-
-    @staticmethod
-    def init_for_field_type(
-        current_field_type: IcebergType,
-        # All types that this field ID has been set to across schema changes.
-        all_field_types: set[IcebergType],
-        field_polars_dtype: pl.DataType,
-    ) -> LoadFromBytesImpl | None:
-        if (v := _bytes_loader_lookup().get(type(current_field_type))) is None:
-            return None
-
-        loader_impl, allowed_field_types = v
-
-        return (
-            loader_impl(field_polars_dtype)
-            if all(isinstance(x, allowed_field_types) for x in all_field_types)  # type: ignore[arg-type]
-            else None
-        )
-
-    @abc.abstractmethod
-    def load_from_bytes(self, byte_values: list[bytes | None]) -> pl.Series:
-        """`bytes_values` should be of binary type."""
-
-
-class LoadBinaryFromBytes(LoadFromBytesImpl):
-    def load_from_bytes(self, byte_values: list[bytes | None]) -> pl.Series:
-        import polars as pl
-
-        return pl.Series(byte_values, dtype=pl.Binary)
-
-
-class LoadDateFromBytes(LoadFromBytesImpl):
-    def load_from_bytes(self, byte_values: list[bytes | None]) -> pl.Series:
-        import polars as pl
-
-        return (
-            pl.Series(byte_values, dtype=pl.Binary)
-            .bin.reinterpret(dtype=pl.Int32, endianness="little")
-            .cast(pl.Date)
-        )
-
-
-class LoadTimeFromBytes(LoadFromBytesImpl):
-    def load_from_bytes(self, byte_values: list[bytes | None]) -> pl.Series:
-        import polars as pl
-
-        return (
-            pl.Series(byte_values, dtype=pl.Binary).bin.reinterpret(
-                dtype=pl.Int64, endianness="little"
-            )
-            * ICEBERG_TIME_TO_NS
-        ).cast(pl.Time)
-
-
-class LoadTimestampFromBytes(LoadFromBytesImpl):
-    def load_from_bytes(self, byte_values: list[bytes | None]) -> pl.Series:
-        import polars as pl
-
-        return (
-            pl.Series(byte_values, dtype=pl.Binary)
-            .bin.reinterpret(dtype=pl.Int64, endianness="little")
-            .cast(pl.Datetime("us"))
-        )
-
-
-class LoadTimestamptzFromBytes(LoadFromBytesImpl):
-    def load_from_bytes(self, byte_values: list[bytes | None]) -> pl.Series:
-        import polars as pl
-
-        return (
-            pl.Series(byte_values, dtype=pl.Binary)
-            .bin.reinterpret(dtype=pl.Int64, endianness="little")
-            .cast(pl.Datetime("us", time_zone="UTC"))
-        )
-
-
-class LoadBooleanFromBytes(LoadFromBytesImpl):
-    def load_from_bytes(self, byte_values: list[bytes | None]) -> pl.Series:
-        import polars as pl
-
-        return (
-            pl.Series(byte_values, dtype=pl.Binary)
-            .bin.reinterpret(dtype=pl.UInt8, endianness="little")
-            .cast(pl.Boolean)
-        )
-
-
-class LoadDecimalFromBytes(LoadFromBytesImpl):
-    def load_from_bytes(self, byte_values: list[bytes | None]) -> pl.Series:
-        import polars as pl
-        from polars._plr import PySeries
-
-        dtype = self.polars_dtype
-        assert isinstance(dtype, pl.Decimal)
-        assert dtype.precision is not None
-
-        return wrap_s(
-            PySeries._import_decimal_from_iceberg_binary_repr(
-                bytes_list=byte_values,
-                precision=dtype.precision,
-                scale=dtype.scale,
-            )
-        )
-
-
-class LoadFixedFromBytes(LoadBinaryFromBytes): ...
-
-
-class LoadInt32FromBytes(LoadFromBytesImpl):
-    def load_from_bytes(self, byte_values: list[bytes | None]) -> pl.Series:
-        import polars as pl
-
-        return pl.Series(byte_values, dtype=pl.Binary).bin.reinterpret(
-            dtype=pl.Int32, endianness="little"
-        )
-
-
-class LoadInt64FromBytes(LoadFromBytesImpl):
-    def load_from_bytes(self, byte_values: list[bytes | None]) -> pl.Series:
-        import polars as pl
-
-        s = pl.Series(byte_values, dtype=pl.Binary)
-
-        return s.bin.reinterpret(dtype=pl.Int64, endianness="little").fill_null(
-            s.bin.reinterpret(dtype=pl.Int32, endianness="little").cast(pl.Int64)
-        )
-
-
-class LoadStringFromBytes(LoadFromBytesImpl):
-    def load_from_bytes(self, byte_values: list[bytes | None]) -> pl.Series:
-        import polars as pl
-
-        return pl.Series(byte_values, dtype=pl.Binary).cast(pl.String)
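All of the integer-backed loaders above decode the little-endian bound bytes that Iceberg keeps in lower_bounds/upper_bounds via Series.bin.reinterpret; LoadInt64FromBytes additionally fill-nulls with a 4-byte read, covering bounds written while the field was still an IntegerType. A self-contained sketch of the same decoding (sample bytes made up):

    import polars as pl

    raw = [(1234).to_bytes(4, "little"), None]  # 4-byte little-endian payloads
    decoded = pl.Series(raw, dtype=pl.Binary).bin.reinterpret(
        dtype=pl.Int32, endianness="little"
    )
    print(decoded.to_list())  # [1234, None]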