polars-runtime-compat 1.34.0b3__cp39-abi3-macosx_11_0_arm64.whl → 1.34.0b5__cp39-abi3-macosx_11_0_arm64.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of polars-runtime-compat might be problematic. Click here for more details.
- _polars_runtime_compat/_polars_runtime_compat.abi3.so +0 -0
- polars_runtime_compat-1.34.0b5.dist-info/METADATA +35 -0
- polars_runtime_compat-1.34.0b5.dist-info/RECORD +6 -0
- polars/__init__.py +0 -528
- polars/_cpu_check.py +0 -265
- polars/_dependencies.py +0 -355
- polars/_plr.py +0 -99
- polars/_plr.pyi +0 -2496
- polars/_reexport.py +0 -23
- polars/_typing.py +0 -478
- polars/_utils/__init__.py +0 -37
- polars/_utils/async_.py +0 -102
- polars/_utils/cache.py +0 -176
- polars/_utils/cloud.py +0 -40
- polars/_utils/constants.py +0 -29
- polars/_utils/construction/__init__.py +0 -46
- polars/_utils/construction/dataframe.py +0 -1397
- polars/_utils/construction/other.py +0 -72
- polars/_utils/construction/series.py +0 -560
- polars/_utils/construction/utils.py +0 -118
- polars/_utils/convert.py +0 -224
- polars/_utils/deprecation.py +0 -406
- polars/_utils/getitem.py +0 -457
- polars/_utils/logging.py +0 -11
- polars/_utils/nest_asyncio.py +0 -264
- polars/_utils/parquet.py +0 -15
- polars/_utils/parse/__init__.py +0 -12
- polars/_utils/parse/expr.py +0 -242
- polars/_utils/polars_version.py +0 -19
- polars/_utils/pycapsule.py +0 -53
- polars/_utils/scan.py +0 -27
- polars/_utils/serde.py +0 -63
- polars/_utils/slice.py +0 -215
- polars/_utils/udfs.py +0 -1251
- polars/_utils/unstable.py +0 -63
- polars/_utils/various.py +0 -782
- polars/_utils/wrap.py +0 -25
- polars/api.py +0 -370
- polars/catalog/__init__.py +0 -0
- polars/catalog/unity/__init__.py +0 -19
- polars/catalog/unity/client.py +0 -733
- polars/catalog/unity/models.py +0 -152
- polars/config.py +0 -1571
- polars/convert/__init__.py +0 -25
- polars/convert/general.py +0 -1046
- polars/convert/normalize.py +0 -261
- polars/dataframe/__init__.py +0 -5
- polars/dataframe/_html.py +0 -186
- polars/dataframe/frame.py +0 -12582
- polars/dataframe/group_by.py +0 -1067
- polars/dataframe/plotting.py +0 -257
- polars/datatype_expr/__init__.py +0 -5
- polars/datatype_expr/array.py +0 -56
- polars/datatype_expr/datatype_expr.py +0 -304
- polars/datatype_expr/list.py +0 -18
- polars/datatype_expr/struct.py +0 -69
- polars/datatypes/__init__.py +0 -122
- polars/datatypes/_parse.py +0 -195
- polars/datatypes/_utils.py +0 -48
- polars/datatypes/classes.py +0 -1213
- polars/datatypes/constants.py +0 -11
- polars/datatypes/constructor.py +0 -172
- polars/datatypes/convert.py +0 -366
- polars/datatypes/group.py +0 -130
- polars/exceptions.py +0 -230
- polars/expr/__init__.py +0 -7
- polars/expr/array.py +0 -964
- polars/expr/binary.py +0 -346
- polars/expr/categorical.py +0 -306
- polars/expr/datetime.py +0 -2620
- polars/expr/expr.py +0 -11272
- polars/expr/list.py +0 -1408
- polars/expr/meta.py +0 -444
- polars/expr/name.py +0 -321
- polars/expr/string.py +0 -3045
- polars/expr/struct.py +0 -357
- polars/expr/whenthen.py +0 -185
- polars/functions/__init__.py +0 -193
- polars/functions/aggregation/__init__.py +0 -33
- polars/functions/aggregation/horizontal.py +0 -298
- polars/functions/aggregation/vertical.py +0 -341
- polars/functions/as_datatype.py +0 -848
- polars/functions/business.py +0 -138
- polars/functions/col.py +0 -384
- polars/functions/datatype.py +0 -121
- polars/functions/eager.py +0 -524
- polars/functions/escape_regex.py +0 -29
- polars/functions/lazy.py +0 -2751
- polars/functions/len.py +0 -68
- polars/functions/lit.py +0 -210
- polars/functions/random.py +0 -22
- polars/functions/range/__init__.py +0 -19
- polars/functions/range/_utils.py +0 -15
- polars/functions/range/date_range.py +0 -303
- polars/functions/range/datetime_range.py +0 -370
- polars/functions/range/int_range.py +0 -348
- polars/functions/range/linear_space.py +0 -311
- polars/functions/range/time_range.py +0 -287
- polars/functions/repeat.py +0 -301
- polars/functions/whenthen.py +0 -353
- polars/interchange/__init__.py +0 -10
- polars/interchange/buffer.py +0 -77
- polars/interchange/column.py +0 -190
- polars/interchange/dataframe.py +0 -230
- polars/interchange/from_dataframe.py +0 -328
- polars/interchange/protocol.py +0 -303
- polars/interchange/utils.py +0 -170
- polars/io/__init__.py +0 -64
- polars/io/_utils.py +0 -317
- polars/io/avro.py +0 -49
- polars/io/clipboard.py +0 -36
- polars/io/cloud/__init__.py +0 -17
- polars/io/cloud/_utils.py +0 -80
- polars/io/cloud/credential_provider/__init__.py +0 -17
- polars/io/cloud/credential_provider/_builder.py +0 -520
- polars/io/cloud/credential_provider/_providers.py +0 -618
- polars/io/csv/__init__.py +0 -9
- polars/io/csv/_utils.py +0 -38
- polars/io/csv/batched_reader.py +0 -142
- polars/io/csv/functions.py +0 -1495
- polars/io/database/__init__.py +0 -6
- polars/io/database/_arrow_registry.py +0 -70
- polars/io/database/_cursor_proxies.py +0 -147
- polars/io/database/_executor.py +0 -578
- polars/io/database/_inference.py +0 -314
- polars/io/database/_utils.py +0 -144
- polars/io/database/functions.py +0 -516
- polars/io/delta.py +0 -499
- polars/io/iceberg/__init__.py +0 -3
- polars/io/iceberg/_utils.py +0 -697
- polars/io/iceberg/dataset.py +0 -556
- polars/io/iceberg/functions.py +0 -151
- polars/io/ipc/__init__.py +0 -8
- polars/io/ipc/functions.py +0 -514
- polars/io/json/__init__.py +0 -3
- polars/io/json/read.py +0 -101
- polars/io/ndjson.py +0 -332
- polars/io/parquet/__init__.py +0 -17
- polars/io/parquet/field_overwrites.py +0 -140
- polars/io/parquet/functions.py +0 -722
- polars/io/partition.py +0 -491
- polars/io/plugins.py +0 -187
- polars/io/pyarrow_dataset/__init__.py +0 -5
- polars/io/pyarrow_dataset/anonymous_scan.py +0 -109
- polars/io/pyarrow_dataset/functions.py +0 -79
- polars/io/scan_options/__init__.py +0 -5
- polars/io/scan_options/_options.py +0 -59
- polars/io/scan_options/cast_options.py +0 -126
- polars/io/spreadsheet/__init__.py +0 -6
- polars/io/spreadsheet/_utils.py +0 -52
- polars/io/spreadsheet/_write_utils.py +0 -647
- polars/io/spreadsheet/functions.py +0 -1323
- polars/lazyframe/__init__.py +0 -9
- polars/lazyframe/engine_config.py +0 -61
- polars/lazyframe/frame.py +0 -8564
- polars/lazyframe/group_by.py +0 -669
- polars/lazyframe/in_process.py +0 -42
- polars/lazyframe/opt_flags.py +0 -333
- polars/meta/__init__.py +0 -14
- polars/meta/build.py +0 -33
- polars/meta/index_type.py +0 -27
- polars/meta/thread_pool.py +0 -50
- polars/meta/versions.py +0 -120
- polars/ml/__init__.py +0 -0
- polars/ml/torch.py +0 -213
- polars/ml/utilities.py +0 -30
- polars/plugins.py +0 -155
- polars/py.typed +0 -0
- polars/pyproject.toml +0 -103
- polars/schema.py +0 -265
- polars/selectors.py +0 -3117
- polars/series/__init__.py +0 -5
- polars/series/array.py +0 -776
- polars/series/binary.py +0 -254
- polars/series/categorical.py +0 -246
- polars/series/datetime.py +0 -2275
- polars/series/list.py +0 -1087
- polars/series/plotting.py +0 -191
- polars/series/series.py +0 -9197
- polars/series/string.py +0 -2367
- polars/series/struct.py +0 -154
- polars/series/utils.py +0 -191
- polars/sql/__init__.py +0 -7
- polars/sql/context.py +0 -677
- polars/sql/functions.py +0 -139
- polars/string_cache.py +0 -185
- polars/testing/__init__.py +0 -13
- polars/testing/asserts/__init__.py +0 -9
- polars/testing/asserts/frame.py +0 -231
- polars/testing/asserts/series.py +0 -219
- polars/testing/asserts/utils.py +0 -12
- polars/testing/parametric/__init__.py +0 -33
- polars/testing/parametric/profiles.py +0 -107
- polars/testing/parametric/strategies/__init__.py +0 -22
- polars/testing/parametric/strategies/_utils.py +0 -14
- polars/testing/parametric/strategies/core.py +0 -615
- polars/testing/parametric/strategies/data.py +0 -452
- polars/testing/parametric/strategies/dtype.py +0 -436
- polars/testing/parametric/strategies/legacy.py +0 -169
- polars/type_aliases.py +0 -24
- polars_runtime_compat-1.34.0b3.dist-info/METADATA +0 -190
- polars_runtime_compat-1.34.0b3.dist-info/RECORD +0 -203
- {polars_runtime_compat-1.34.0b3.dist-info → polars_runtime_compat-1.34.0b5.dist-info}/WHEEL +0 -0
- {polars_runtime_compat-1.34.0b3.dist-info → polars_runtime_compat-1.34.0b5.dist-info}/licenses/LICENSE +0 -0
polars/datatype_expr/struct.py
DELETED
|
@@ -1,69 +0,0 @@
|
|
|
1
|
-
from __future__ import annotations
|
|
2
|
-
|
|
3
|
-
import polars._reexport as pl
|
|
4
|
-
from polars._utils.various import qualified_type_name
|
|
5
|
-
|
|
6
|
-
|
|
7
|
-
class DataTypeExprStructNameSpace:
|
|
8
|
-
"""Namespace for struct datatype expressions."""
|
|
9
|
-
|
|
10
|
-
_accessor = "struct"
|
|
11
|
-
|
|
12
|
-
def __init__(self, expr: pl.DataTypeExpr) -> None:
|
|
13
|
-
self._pydatatype_expr = expr._pydatatype_expr
|
|
14
|
-
|
|
15
|
-
def __getitem__(self, item: str | int) -> pl.DataTypeExpr:
|
|
16
|
-
if isinstance(item, str):
|
|
17
|
-
return self.field_dtype(item)
|
|
18
|
-
elif isinstance(item, int):
|
|
19
|
-
return pl.DataTypeExpr._from_pydatatype_expr(
|
|
20
|
-
self._pydatatype_expr.struct_field_dtype_by_index(item)
|
|
21
|
-
)
|
|
22
|
-
else:
|
|
23
|
-
msg = f"expected type 'int | str', got {qualified_type_name(item)!r} ({item!r})"
|
|
24
|
-
raise TypeError(msg)
|
|
25
|
-
|
|
26
|
-
def field_dtype(self, field_name: str) -> pl.DataTypeExpr:
|
|
27
|
-
"""
|
|
28
|
-
|
|
29
|
-
Get the DataType of field with a specific field name.
|
|
30
|
-
|
|
31
|
-
Notes
|
|
32
|
-
-----
|
|
33
|
-
The `struct` namespace has implemented `__getitem__` so you can also access
|
|
34
|
-
fields by index:
|
|
35
|
-
|
|
36
|
-
>>> (
|
|
37
|
-
... pl.Struct({"x": pl.Int64, "y": pl.String})
|
|
38
|
-
... .to_dtype_expr()
|
|
39
|
-
... .struct[1]
|
|
40
|
-
... .collect_dtype({})
|
|
41
|
-
... )
|
|
42
|
-
String
|
|
43
|
-
"""
|
|
44
|
-
return pl.DataTypeExpr._from_pydatatype_expr(
|
|
45
|
-
self._pydatatype_expr.struct_field_dtype_by_name(field_name)
|
|
46
|
-
)
|
|
47
|
-
|
|
48
|
-
def field_names(self) -> pl.Expr:
|
|
49
|
-
"""
|
|
50
|
-
Get the field names in a struct as a list.
|
|
51
|
-
|
|
52
|
-
Examples
|
|
53
|
-
--------
|
|
54
|
-
>>> pl.select(
|
|
55
|
-
... pl.Struct({"x": pl.Int64, "y": pl.String})
|
|
56
|
-
... .to_dtype_expr()
|
|
57
|
-
... .struct.field_names()
|
|
58
|
-
... )
|
|
59
|
-
shape: (2, 1)
|
|
60
|
-
┌─────────┐
|
|
61
|
-
│ literal │
|
|
62
|
-
│ --- │
|
|
63
|
-
│ str │
|
|
64
|
-
╞═════════╡
|
|
65
|
-
│ x │
|
|
66
|
-
│ y │
|
|
67
|
-
└─────────┘
|
|
68
|
-
"""
|
|
69
|
-
return pl.Expr._from_pyexpr(self._pydatatype_expr.struct_field_names())
|
polars/datatypes/__init__.py
DELETED
|
@@ -1,122 +0,0 @@
|
|
|
1
|
-
from polars.datatypes._parse import (
|
|
2
|
-
parse_into_datatype_expr,
|
|
3
|
-
parse_into_dtype,
|
|
4
|
-
try_parse_into_dtype,
|
|
5
|
-
)
|
|
6
|
-
from polars.datatypes.classes import (
|
|
7
|
-
Array,
|
|
8
|
-
Binary,
|
|
9
|
-
Boolean,
|
|
10
|
-
Categorical,
|
|
11
|
-
Categories,
|
|
12
|
-
DataType,
|
|
13
|
-
DataTypeClass,
|
|
14
|
-
Date,
|
|
15
|
-
Datetime,
|
|
16
|
-
Decimal,
|
|
17
|
-
Duration,
|
|
18
|
-
Enum,
|
|
19
|
-
Field,
|
|
20
|
-
Float32,
|
|
21
|
-
Float64,
|
|
22
|
-
Int8,
|
|
23
|
-
Int16,
|
|
24
|
-
Int32,
|
|
25
|
-
Int64,
|
|
26
|
-
Int128,
|
|
27
|
-
IntegerType,
|
|
28
|
-
List,
|
|
29
|
-
Null,
|
|
30
|
-
Object,
|
|
31
|
-
String,
|
|
32
|
-
Struct,
|
|
33
|
-
TemporalType,
|
|
34
|
-
Time,
|
|
35
|
-
UInt8,
|
|
36
|
-
UInt16,
|
|
37
|
-
UInt32,
|
|
38
|
-
UInt64,
|
|
39
|
-
UInt128,
|
|
40
|
-
Unknown,
|
|
41
|
-
Utf8,
|
|
42
|
-
)
|
|
43
|
-
from polars.datatypes.constants import (
|
|
44
|
-
DTYPE_TEMPORAL_UNITS,
|
|
45
|
-
N_INFER_DEFAULT,
|
|
46
|
-
)
|
|
47
|
-
from polars.datatypes.constructor import (
|
|
48
|
-
numpy_type_to_constructor,
|
|
49
|
-
numpy_values_and_dtype,
|
|
50
|
-
polars_type_to_constructor,
|
|
51
|
-
py_type_to_constructor,
|
|
52
|
-
)
|
|
53
|
-
from polars.datatypes.convert import (
|
|
54
|
-
dtype_to_ffiname,
|
|
55
|
-
dtype_to_py_type,
|
|
56
|
-
is_polars_dtype,
|
|
57
|
-
maybe_cast,
|
|
58
|
-
numpy_char_code_to_dtype,
|
|
59
|
-
py_type_to_arrow_type,
|
|
60
|
-
supported_numpy_char_code,
|
|
61
|
-
unpack_dtypes,
|
|
62
|
-
)
|
|
63
|
-
|
|
64
|
-
__all__ = [
|
|
65
|
-
# classes
|
|
66
|
-
"Array",
|
|
67
|
-
"Binary",
|
|
68
|
-
"Boolean",
|
|
69
|
-
"Categorical",
|
|
70
|
-
"Categories",
|
|
71
|
-
"DataType",
|
|
72
|
-
"DataTypeClass",
|
|
73
|
-
"Date",
|
|
74
|
-
"Datetime",
|
|
75
|
-
"Decimal",
|
|
76
|
-
"Duration",
|
|
77
|
-
"Enum",
|
|
78
|
-
"Field",
|
|
79
|
-
"Float32",
|
|
80
|
-
"Float64",
|
|
81
|
-
"Int16",
|
|
82
|
-
"Int128",
|
|
83
|
-
"Int32",
|
|
84
|
-
"Int64",
|
|
85
|
-
"Int8",
|
|
86
|
-
"IntegerType",
|
|
87
|
-
"List",
|
|
88
|
-
"Null",
|
|
89
|
-
"Object",
|
|
90
|
-
"String",
|
|
91
|
-
"Struct",
|
|
92
|
-
"TemporalType",
|
|
93
|
-
"Time",
|
|
94
|
-
"UInt16",
|
|
95
|
-
"UInt128",
|
|
96
|
-
"UInt32",
|
|
97
|
-
"UInt64",
|
|
98
|
-
"UInt8",
|
|
99
|
-
"Unknown",
|
|
100
|
-
"Utf8",
|
|
101
|
-
# constants
|
|
102
|
-
"N_INFER_DEFAULT",
|
|
103
|
-
"DTYPE_TEMPORAL_UNITS",
|
|
104
|
-
# constructor
|
|
105
|
-
"numpy_type_to_constructor",
|
|
106
|
-
"numpy_values_and_dtype",
|
|
107
|
-
"polars_type_to_constructor",
|
|
108
|
-
"py_type_to_constructor",
|
|
109
|
-
# convert
|
|
110
|
-
"dtype_to_ffiname",
|
|
111
|
-
"dtype_to_py_type",
|
|
112
|
-
"is_polars_dtype",
|
|
113
|
-
"maybe_cast",
|
|
114
|
-
"numpy_char_code_to_dtype",
|
|
115
|
-
"py_type_to_arrow_type",
|
|
116
|
-
"supported_numpy_char_code",
|
|
117
|
-
"unpack_dtypes",
|
|
118
|
-
# _parse
|
|
119
|
-
"parse_into_dtype",
|
|
120
|
-
"parse_into_datatype_expr",
|
|
121
|
-
"try_parse_into_dtype",
|
|
122
|
-
]
|
polars/datatypes/_parse.py
DELETED
|
@@ -1,195 +0,0 @@
|
|
|
1
|
-
from __future__ import annotations
|
|
2
|
-
|
|
3
|
-
import enum
|
|
4
|
-
import functools
|
|
5
|
-
import re
|
|
6
|
-
import sys
|
|
7
|
-
from datetime import date, datetime, time, timedelta
|
|
8
|
-
from decimal import Decimal as PyDecimal
|
|
9
|
-
from inspect import isclass
|
|
10
|
-
from typing import TYPE_CHECKING, Any, ForwardRef, NoReturn, Union, get_args
|
|
11
|
-
|
|
12
|
-
import polars._reexport as pl
|
|
13
|
-
from polars.datatypes.classes import (
|
|
14
|
-
Binary,
|
|
15
|
-
Boolean,
|
|
16
|
-
Date,
|
|
17
|
-
Datetime,
|
|
18
|
-
Decimal,
|
|
19
|
-
Duration,
|
|
20
|
-
Enum,
|
|
21
|
-
Float64,
|
|
22
|
-
Int64,
|
|
23
|
-
List,
|
|
24
|
-
Null,
|
|
25
|
-
Object,
|
|
26
|
-
String,
|
|
27
|
-
Time,
|
|
28
|
-
Unknown,
|
|
29
|
-
)
|
|
30
|
-
from polars.datatypes.convert import is_polars_dtype
|
|
31
|
-
|
|
32
|
-
if TYPE_CHECKING:
|
|
33
|
-
from polars._typing import PolarsDataType, PythonDataType, SchemaDict
|
|
34
|
-
|
|
35
|
-
|
|
36
|
-
UnionTypeOld = type(Union[int, str])
|
|
37
|
-
if sys.version_info >= (3, 10):
|
|
38
|
-
from types import NoneType, UnionType
|
|
39
|
-
else: # pragma: no cover
|
|
40
|
-
# Define equivalent for older Python versions
|
|
41
|
-
NoneType = type(None)
|
|
42
|
-
UnionType = UnionTypeOld
|
|
43
|
-
|
|
44
|
-
|
|
45
|
-
def parse_into_datatype_expr(input: Any) -> pl.DataTypeExpr:
|
|
46
|
-
"""Parse an input into a DataTypeExpr."""
|
|
47
|
-
if isinstance(input, pl.DataTypeExpr):
|
|
48
|
-
return input
|
|
49
|
-
else:
|
|
50
|
-
return parse_into_dtype(input).to_dtype_expr()
|
|
51
|
-
|
|
52
|
-
|
|
53
|
-
def parse_into_dtype(input: Any) -> PolarsDataType:
|
|
54
|
-
"""
|
|
55
|
-
Parse an input into a Polars data type.
|
|
56
|
-
|
|
57
|
-
Raises
|
|
58
|
-
------
|
|
59
|
-
TypeError
|
|
60
|
-
If the input cannot be parsed into a Polars data type.
|
|
61
|
-
"""
|
|
62
|
-
if is_polars_dtype(input):
|
|
63
|
-
return input
|
|
64
|
-
elif isinstance(input, ForwardRef):
|
|
65
|
-
return _parse_forward_ref_into_dtype(input)
|
|
66
|
-
elif isinstance(input, (UnionType, UnionTypeOld)):
|
|
67
|
-
return _parse_union_type_into_dtype(input)
|
|
68
|
-
else:
|
|
69
|
-
return parse_py_type_into_dtype(input)
|
|
70
|
-
|
|
71
|
-
|
|
72
|
-
def try_parse_into_dtype(input: Any) -> PolarsDataType | None:
|
|
73
|
-
"""Try parsing an input into a Polars data type, returning None on failure."""
|
|
74
|
-
try:
|
|
75
|
-
return parse_into_dtype(input)
|
|
76
|
-
except TypeError:
|
|
77
|
-
return None
|
|
78
|
-
|
|
79
|
-
|
|
80
|
-
@functools.lru_cache(16)
|
|
81
|
-
def parse_py_type_into_dtype(input: PythonDataType | type[object]) -> PolarsDataType:
|
|
82
|
-
"""Convert Python data type to Polars data type."""
|
|
83
|
-
if input is int:
|
|
84
|
-
return Int64()
|
|
85
|
-
elif input is float:
|
|
86
|
-
return Float64()
|
|
87
|
-
elif input is str:
|
|
88
|
-
return String()
|
|
89
|
-
elif input is bool:
|
|
90
|
-
return Boolean()
|
|
91
|
-
elif isinstance(input, type) and issubclass(input, datetime): # type: ignore[redundant-expr]
|
|
92
|
-
return Datetime("us")
|
|
93
|
-
elif isinstance(input, type) and issubclass(input, date): # type: ignore[redundant-expr]
|
|
94
|
-
return Date()
|
|
95
|
-
elif input is timedelta:
|
|
96
|
-
return Duration
|
|
97
|
-
elif input is time:
|
|
98
|
-
return Time()
|
|
99
|
-
elif input is PyDecimal:
|
|
100
|
-
return Decimal
|
|
101
|
-
elif input is bytes:
|
|
102
|
-
return Binary()
|
|
103
|
-
elif input is object:
|
|
104
|
-
return Object()
|
|
105
|
-
elif input is NoneType:
|
|
106
|
-
return Null()
|
|
107
|
-
elif input is list or input is tuple:
|
|
108
|
-
return List
|
|
109
|
-
elif isclass(input) and issubclass(input, enum.Enum):
|
|
110
|
-
return Enum(input)
|
|
111
|
-
# this is required as pass through. Don't remove
|
|
112
|
-
elif input == Unknown:
|
|
113
|
-
return Unknown
|
|
114
|
-
elif hasattr(input, "__origin__") and hasattr(input, "__args__"):
|
|
115
|
-
return _parse_generic_into_dtype(input)
|
|
116
|
-
else:
|
|
117
|
-
_raise_on_invalid_dtype(input)
|
|
118
|
-
|
|
119
|
-
|
|
120
|
-
def _parse_generic_into_dtype(input: Any) -> PolarsDataType:
|
|
121
|
-
"""Parse a generic type (from typing annotation) into a Polars data type."""
|
|
122
|
-
base_type = input.__origin__
|
|
123
|
-
if base_type not in (tuple, list):
|
|
124
|
-
_raise_on_invalid_dtype(input)
|
|
125
|
-
|
|
126
|
-
inner_types = input.__args__
|
|
127
|
-
inner_type = inner_types[0]
|
|
128
|
-
if len(inner_types) > 1:
|
|
129
|
-
all_equal = all(t in (inner_type, ...) for t in inner_types)
|
|
130
|
-
if not all_equal:
|
|
131
|
-
_raise_on_invalid_dtype(input)
|
|
132
|
-
|
|
133
|
-
inner_type = inner_types[0]
|
|
134
|
-
inner_dtype = parse_py_type_into_dtype(inner_type)
|
|
135
|
-
return List(inner_dtype)
|
|
136
|
-
|
|
137
|
-
|
|
138
|
-
PY_TYPE_STR_TO_DTYPE: SchemaDict = {
|
|
139
|
-
"Decimal": Decimal,
|
|
140
|
-
"NoneType": Null(),
|
|
141
|
-
"bool": Boolean(),
|
|
142
|
-
"bytes": Binary(),
|
|
143
|
-
"date": Date(),
|
|
144
|
-
"datetime": Datetime("us"),
|
|
145
|
-
"float": Float64(),
|
|
146
|
-
"int": Int64(),
|
|
147
|
-
"list": List,
|
|
148
|
-
"object": Object(),
|
|
149
|
-
"str": String(),
|
|
150
|
-
"time": Time(),
|
|
151
|
-
"timedelta": Duration,
|
|
152
|
-
"tuple": List,
|
|
153
|
-
}
|
|
154
|
-
|
|
155
|
-
|
|
156
|
-
def _parse_forward_ref_into_dtype(input: ForwardRef) -> PolarsDataType:
|
|
157
|
-
"""Parse a ForwardRef into a Polars data type."""
|
|
158
|
-
annotation = input.__forward_arg__
|
|
159
|
-
|
|
160
|
-
# Strip "optional" designation - Polars data types are always nullable
|
|
161
|
-
formatted = re.sub(r"(^None \|)|(\| None$)", "", annotation).strip()
|
|
162
|
-
|
|
163
|
-
try:
|
|
164
|
-
return PY_TYPE_STR_TO_DTYPE[formatted]
|
|
165
|
-
except KeyError:
|
|
166
|
-
_raise_on_invalid_dtype(input)
|
|
167
|
-
|
|
168
|
-
|
|
169
|
-
def _parse_union_type_into_dtype(input: Any) -> PolarsDataType:
|
|
170
|
-
"""
|
|
171
|
-
Parse a union of types into a Polars data type.
|
|
172
|
-
|
|
173
|
-
Unions of multiple non-null types (e.g. `int | float`) are not supported.
|
|
174
|
-
|
|
175
|
-
Parameters
|
|
176
|
-
----------
|
|
177
|
-
input
|
|
178
|
-
A union type, e.g. `str | None` (new syntax) or `Union[str, None]` (old syntax).
|
|
179
|
-
"""
|
|
180
|
-
# Strip "optional" designation - Polars data types are always nullable
|
|
181
|
-
inner_types = [tp for tp in get_args(input) if tp is not NoneType]
|
|
182
|
-
|
|
183
|
-
if len(inner_types) != 1:
|
|
184
|
-
_raise_on_invalid_dtype(input)
|
|
185
|
-
|
|
186
|
-
input = inner_types[0]
|
|
187
|
-
return parse_into_dtype(input)
|
|
188
|
-
|
|
189
|
-
|
|
190
|
-
def _raise_on_invalid_dtype(input: Any) -> NoReturn:
|
|
191
|
-
"""Raise an informative error if the input could not be parsed."""
|
|
192
|
-
input_type = input if type(input) is type else f"of type {type(input).__name__!r}"
|
|
193
|
-
input_detail = "" if type(input) is type else f" (given: {input!r})"
|
|
194
|
-
msg = f"cannot parse input {input_type} into Polars data type{input_detail}"
|
|
195
|
-
raise TypeError(msg) from None
|
polars/datatypes/_utils.py
DELETED
|
@@ -1,48 +0,0 @@
|
|
|
1
|
-
"""Utility functions for handling and processing of datatypes."""
|
|
2
|
-
|
|
3
|
-
from polars._typing import PolarsDataType
|
|
4
|
-
from polars.datatypes.classes import Array, List, Struct
|
|
5
|
-
|
|
6
|
-
|
|
7
|
-
def dtype_to_init_repr(dtype: PolarsDataType, prefix: str = "pl.") -> str:
|
|
8
|
-
"""Convert a Polars dtype to a prefixed string representation."""
|
|
9
|
-
if isinstance(dtype, List):
|
|
10
|
-
init_repr = _dtype_to_init_repr_list(dtype, prefix)
|
|
11
|
-
elif isinstance(dtype, Array):
|
|
12
|
-
init_repr = _dtype_to_init_repr_array(dtype, prefix)
|
|
13
|
-
elif isinstance(dtype, Struct):
|
|
14
|
-
init_repr = _dtype_to_init_repr_struct(dtype, prefix)
|
|
15
|
-
else:
|
|
16
|
-
init_repr = f"{prefix}{dtype!r}"
|
|
17
|
-
return init_repr
|
|
18
|
-
|
|
19
|
-
|
|
20
|
-
def _dtype_to_init_repr_list(dtype: List, prefix: str) -> str:
|
|
21
|
-
class_name = dtype.__class__.__name__
|
|
22
|
-
if dtype.inner is not None:
|
|
23
|
-
inner_repr = dtype_to_init_repr(dtype.inner, prefix)
|
|
24
|
-
else:
|
|
25
|
-
inner_repr = ""
|
|
26
|
-
init_repr = f"{prefix}{class_name}({inner_repr})"
|
|
27
|
-
return init_repr
|
|
28
|
-
|
|
29
|
-
|
|
30
|
-
def _dtype_to_init_repr_array(dtype: Array, prefix: str) -> str:
|
|
31
|
-
class_name = dtype.__class__.__name__
|
|
32
|
-
if dtype.inner is not None:
|
|
33
|
-
inner_repr = dtype_to_init_repr(dtype.inner, prefix)
|
|
34
|
-
else:
|
|
35
|
-
inner_repr = ""
|
|
36
|
-
init_repr = f"{prefix}{class_name}({inner_repr}, shape={dtype.shape})"
|
|
37
|
-
return init_repr
|
|
38
|
-
|
|
39
|
-
|
|
40
|
-
def _dtype_to_init_repr_struct(dtype: Struct, prefix: str) -> str:
|
|
41
|
-
class_name = dtype.__class__.__name__
|
|
42
|
-
inner_list = [
|
|
43
|
-
f"{field_name!r}: {dtype_to_init_repr(inner_dtype, prefix)}"
|
|
44
|
-
for field_name, inner_dtype in dict(dtype).items()
|
|
45
|
-
]
|
|
46
|
-
inner_repr = "{" + ", ".join(inner_list) + "}"
|
|
47
|
-
init_repr = f"{prefix}{class_name}({inner_repr})"
|
|
48
|
-
return init_repr
|