polars-runtime-compat 1.34.0b3__cp39-abi3-win_amd64.whl → 1.34.0b5__cp39-abi3-win_amd64.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of polars-runtime-compat might be problematic. Click here for more details.
- _polars_runtime_compat/_polars_runtime_compat.pyd +0 -0
- polars_runtime_compat-1.34.0b5.dist-info/METADATA +35 -0
- polars_runtime_compat-1.34.0b5.dist-info/RECORD +6 -0
- polars/__init__.py +0 -528
- polars/_cpu_check.py +0 -265
- polars/_dependencies.py +0 -355
- polars/_plr.py +0 -99
- polars/_plr.pyi +0 -2496
- polars/_reexport.py +0 -23
- polars/_typing.py +0 -478
- polars/_utils/__init__.py +0 -37
- polars/_utils/async_.py +0 -102
- polars/_utils/cache.py +0 -176
- polars/_utils/cloud.py +0 -40
- polars/_utils/constants.py +0 -29
- polars/_utils/construction/__init__.py +0 -46
- polars/_utils/construction/dataframe.py +0 -1397
- polars/_utils/construction/other.py +0 -72
- polars/_utils/construction/series.py +0 -560
- polars/_utils/construction/utils.py +0 -118
- polars/_utils/convert.py +0 -224
- polars/_utils/deprecation.py +0 -406
- polars/_utils/getitem.py +0 -457
- polars/_utils/logging.py +0 -11
- polars/_utils/nest_asyncio.py +0 -264
- polars/_utils/parquet.py +0 -15
- polars/_utils/parse/__init__.py +0 -12
- polars/_utils/parse/expr.py +0 -242
- polars/_utils/polars_version.py +0 -19
- polars/_utils/pycapsule.py +0 -53
- polars/_utils/scan.py +0 -27
- polars/_utils/serde.py +0 -63
- polars/_utils/slice.py +0 -215
- polars/_utils/udfs.py +0 -1251
- polars/_utils/unstable.py +0 -63
- polars/_utils/various.py +0 -782
- polars/_utils/wrap.py +0 -25
- polars/api.py +0 -370
- polars/catalog/__init__.py +0 -0
- polars/catalog/unity/__init__.py +0 -19
- polars/catalog/unity/client.py +0 -733
- polars/catalog/unity/models.py +0 -152
- polars/config.py +0 -1571
- polars/convert/__init__.py +0 -25
- polars/convert/general.py +0 -1046
- polars/convert/normalize.py +0 -261
- polars/dataframe/__init__.py +0 -5
- polars/dataframe/_html.py +0 -186
- polars/dataframe/frame.py +0 -12582
- polars/dataframe/group_by.py +0 -1067
- polars/dataframe/plotting.py +0 -257
- polars/datatype_expr/__init__.py +0 -5
- polars/datatype_expr/array.py +0 -56
- polars/datatype_expr/datatype_expr.py +0 -304
- polars/datatype_expr/list.py +0 -18
- polars/datatype_expr/struct.py +0 -69
- polars/datatypes/__init__.py +0 -122
- polars/datatypes/_parse.py +0 -195
- polars/datatypes/_utils.py +0 -48
- polars/datatypes/classes.py +0 -1213
- polars/datatypes/constants.py +0 -11
- polars/datatypes/constructor.py +0 -172
- polars/datatypes/convert.py +0 -366
- polars/datatypes/group.py +0 -130
- polars/exceptions.py +0 -230
- polars/expr/__init__.py +0 -7
- polars/expr/array.py +0 -964
- polars/expr/binary.py +0 -346
- polars/expr/categorical.py +0 -306
- polars/expr/datetime.py +0 -2620
- polars/expr/expr.py +0 -11272
- polars/expr/list.py +0 -1408
- polars/expr/meta.py +0 -444
- polars/expr/name.py +0 -321
- polars/expr/string.py +0 -3045
- polars/expr/struct.py +0 -357
- polars/expr/whenthen.py +0 -185
- polars/functions/__init__.py +0 -193
- polars/functions/aggregation/__init__.py +0 -33
- polars/functions/aggregation/horizontal.py +0 -298
- polars/functions/aggregation/vertical.py +0 -341
- polars/functions/as_datatype.py +0 -848
- polars/functions/business.py +0 -138
- polars/functions/col.py +0 -384
- polars/functions/datatype.py +0 -121
- polars/functions/eager.py +0 -524
- polars/functions/escape_regex.py +0 -29
- polars/functions/lazy.py +0 -2751
- polars/functions/len.py +0 -68
- polars/functions/lit.py +0 -210
- polars/functions/random.py +0 -22
- polars/functions/range/__init__.py +0 -19
- polars/functions/range/_utils.py +0 -15
- polars/functions/range/date_range.py +0 -303
- polars/functions/range/datetime_range.py +0 -370
- polars/functions/range/int_range.py +0 -348
- polars/functions/range/linear_space.py +0 -311
- polars/functions/range/time_range.py +0 -287
- polars/functions/repeat.py +0 -301
- polars/functions/whenthen.py +0 -353
- polars/interchange/__init__.py +0 -10
- polars/interchange/buffer.py +0 -77
- polars/interchange/column.py +0 -190
- polars/interchange/dataframe.py +0 -230
- polars/interchange/from_dataframe.py +0 -328
- polars/interchange/protocol.py +0 -303
- polars/interchange/utils.py +0 -170
- polars/io/__init__.py +0 -64
- polars/io/_utils.py +0 -317
- polars/io/avro.py +0 -49
- polars/io/clipboard.py +0 -36
- polars/io/cloud/__init__.py +0 -17
- polars/io/cloud/_utils.py +0 -80
- polars/io/cloud/credential_provider/__init__.py +0 -17
- polars/io/cloud/credential_provider/_builder.py +0 -520
- polars/io/cloud/credential_provider/_providers.py +0 -618
- polars/io/csv/__init__.py +0 -9
- polars/io/csv/_utils.py +0 -38
- polars/io/csv/batched_reader.py +0 -142
- polars/io/csv/functions.py +0 -1495
- polars/io/database/__init__.py +0 -6
- polars/io/database/_arrow_registry.py +0 -70
- polars/io/database/_cursor_proxies.py +0 -147
- polars/io/database/_executor.py +0 -578
- polars/io/database/_inference.py +0 -314
- polars/io/database/_utils.py +0 -144
- polars/io/database/functions.py +0 -516
- polars/io/delta.py +0 -499
- polars/io/iceberg/__init__.py +0 -3
- polars/io/iceberg/_utils.py +0 -697
- polars/io/iceberg/dataset.py +0 -556
- polars/io/iceberg/functions.py +0 -151
- polars/io/ipc/__init__.py +0 -8
- polars/io/ipc/functions.py +0 -514
- polars/io/json/__init__.py +0 -3
- polars/io/json/read.py +0 -101
- polars/io/ndjson.py +0 -332
- polars/io/parquet/__init__.py +0 -17
- polars/io/parquet/field_overwrites.py +0 -140
- polars/io/parquet/functions.py +0 -722
- polars/io/partition.py +0 -491
- polars/io/plugins.py +0 -187
- polars/io/pyarrow_dataset/__init__.py +0 -5
- polars/io/pyarrow_dataset/anonymous_scan.py +0 -109
- polars/io/pyarrow_dataset/functions.py +0 -79
- polars/io/scan_options/__init__.py +0 -5
- polars/io/scan_options/_options.py +0 -59
- polars/io/scan_options/cast_options.py +0 -126
- polars/io/spreadsheet/__init__.py +0 -6
- polars/io/spreadsheet/_utils.py +0 -52
- polars/io/spreadsheet/_write_utils.py +0 -647
- polars/io/spreadsheet/functions.py +0 -1323
- polars/lazyframe/__init__.py +0 -9
- polars/lazyframe/engine_config.py +0 -61
- polars/lazyframe/frame.py +0 -8564
- polars/lazyframe/group_by.py +0 -669
- polars/lazyframe/in_process.py +0 -42
- polars/lazyframe/opt_flags.py +0 -333
- polars/meta/__init__.py +0 -14
- polars/meta/build.py +0 -33
- polars/meta/index_type.py +0 -27
- polars/meta/thread_pool.py +0 -50
- polars/meta/versions.py +0 -120
- polars/ml/__init__.py +0 -0
- polars/ml/torch.py +0 -213
- polars/ml/utilities.py +0 -30
- polars/plugins.py +0 -155
- polars/py.typed +0 -0
- polars/pyproject.toml +0 -103
- polars/schema.py +0 -265
- polars/selectors.py +0 -3117
- polars/series/__init__.py +0 -5
- polars/series/array.py +0 -776
- polars/series/binary.py +0 -254
- polars/series/categorical.py +0 -246
- polars/series/datetime.py +0 -2275
- polars/series/list.py +0 -1087
- polars/series/plotting.py +0 -191
- polars/series/series.py +0 -9197
- polars/series/string.py +0 -2367
- polars/series/struct.py +0 -154
- polars/series/utils.py +0 -191
- polars/sql/__init__.py +0 -7
- polars/sql/context.py +0 -677
- polars/sql/functions.py +0 -139
- polars/string_cache.py +0 -185
- polars/testing/__init__.py +0 -13
- polars/testing/asserts/__init__.py +0 -9
- polars/testing/asserts/frame.py +0 -231
- polars/testing/asserts/series.py +0 -219
- polars/testing/asserts/utils.py +0 -12
- polars/testing/parametric/__init__.py +0 -33
- polars/testing/parametric/profiles.py +0 -107
- polars/testing/parametric/strategies/__init__.py +0 -22
- polars/testing/parametric/strategies/_utils.py +0 -14
- polars/testing/parametric/strategies/core.py +0 -615
- polars/testing/parametric/strategies/data.py +0 -452
- polars/testing/parametric/strategies/dtype.py +0 -436
- polars/testing/parametric/strategies/legacy.py +0 -169
- polars/type_aliases.py +0 -24
- polars_runtime_compat-1.34.0b3.dist-info/METADATA +0 -190
- polars_runtime_compat-1.34.0b3.dist-info/RECORD +0 -203
- {polars_runtime_compat-1.34.0b3.dist-info → polars_runtime_compat-1.34.0b5.dist-info}/WHEEL +0 -0
- {polars_runtime_compat-1.34.0b3.dist-info → polars_runtime_compat-1.34.0b5.dist-info}/licenses/LICENSE +0 -0
polars/dataframe/plotting.py
DELETED
|
@@ -1,257 +0,0 @@
|
|
|
1
|
-
from __future__ import annotations
|
|
2
|
-
|
|
3
|
-
import inspect
|
|
4
|
-
from typing import TYPE_CHECKING, Callable, Union
|
|
5
|
-
|
|
6
|
-
from polars._dependencies import altair as alt
|
|
7
|
-
|
|
8
|
-
if TYPE_CHECKING:
|
|
9
|
-
import sys
|
|
10
|
-
|
|
11
|
-
from altair.typing import ChannelColor as Color
|
|
12
|
-
from altair.typing import ChannelOrder as Order
|
|
13
|
-
from altair.typing import ChannelSize as Size
|
|
14
|
-
from altair.typing import ChannelTooltip as Tooltip
|
|
15
|
-
from altair.typing import ChannelX as X
|
|
16
|
-
from altair.typing import ChannelY as Y
|
|
17
|
-
from altair.typing import EncodeKwds
|
|
18
|
-
|
|
19
|
-
from polars import DataFrame
|
|
20
|
-
|
|
21
|
-
if sys.version_info >= (3, 10):
|
|
22
|
-
from typing import TypeAlias
|
|
23
|
-
else:
|
|
24
|
-
from typing_extensions import TypeAlias
|
|
25
|
-
if sys.version_info >= (3, 11):
|
|
26
|
-
from typing import Unpack
|
|
27
|
-
else:
|
|
28
|
-
from typing_extensions import Unpack
|
|
29
|
-
|
|
30
|
-
Encoding: TypeAlias = Union[X, Y, Color, Order, Size, Tooltip]
|
|
31
|
-
Encodings: TypeAlias = dict[str, Encoding]
|
|
32
|
-
|
|
33
|
-
|
|
34
|
-
class DataFramePlot:
|
|
35
|
-
"""DataFrame.plot namespace."""
|
|
36
|
-
|
|
37
|
-
def __init__(self, df: DataFrame) -> None:
|
|
38
|
-
self._chart = alt.Chart(df)
|
|
39
|
-
|
|
40
|
-
def bar(
|
|
41
|
-
self,
|
|
42
|
-
x: X | None = None,
|
|
43
|
-
y: Y | None = None,
|
|
44
|
-
color: Color | None = None,
|
|
45
|
-
/,
|
|
46
|
-
**kwargs: Unpack[EncodeKwds],
|
|
47
|
-
) -> alt.Chart:
|
|
48
|
-
"""
|
|
49
|
-
Draw bar plot.
|
|
50
|
-
|
|
51
|
-
Polars does not implement plotting logic itself but instead defers to
|
|
52
|
-
`Altair <https://altair-viz.github.io/>`_.
|
|
53
|
-
|
|
54
|
-
`df.plot.bar(**kwargs)` is shorthand for
|
|
55
|
-
`alt.Chart(df).mark_bar().encode(**kwargs).interactive()`,
|
|
56
|
-
and is provided for convenience - for full customisability, use a plotting
|
|
57
|
-
library directly.
|
|
58
|
-
|
|
59
|
-
.. versionchanged:: 1.6.0
|
|
60
|
-
In prior versions of Polars, HvPlot was the plotting backend. If you would
|
|
61
|
-
like to restore the previous plotting functionality, all you need to do
|
|
62
|
-
is add `import hvplot.polars` at the top of your script and replace
|
|
63
|
-
`df.plot` with `df.hvplot`.
|
|
64
|
-
|
|
65
|
-
Parameters
|
|
66
|
-
----------
|
|
67
|
-
x
|
|
68
|
-
Column with x-coordinates of bars.
|
|
69
|
-
y
|
|
70
|
-
Column with y-coordinates of bars.
|
|
71
|
-
color
|
|
72
|
-
Column to color bars by.
|
|
73
|
-
**kwargs
|
|
74
|
-
Additional keyword arguments passed to Altair.
|
|
75
|
-
|
|
76
|
-
Examples
|
|
77
|
-
--------
|
|
78
|
-
>>> df = pl.DataFrame(
|
|
79
|
-
... {
|
|
80
|
-
... "day": ["Mon", "Tue", "Wed", "Thu", "Fri", "Sat", "Sun"] * 2,
|
|
81
|
-
... "group": ["a"] * 7 + ["b"] * 7,
|
|
82
|
-
... "value": [1, 3, 2, 4, 5, 6, 1, 1, 3, 2, 4, 5, 1, 2],
|
|
83
|
-
... }
|
|
84
|
-
... )
|
|
85
|
-
>>> df.plot.bar(
|
|
86
|
-
... x="day", y="value", color="day", column="group"
|
|
87
|
-
... ) # doctest: +SKIP
|
|
88
|
-
"""
|
|
89
|
-
encodings: Encodings = {}
|
|
90
|
-
if x is not None:
|
|
91
|
-
encodings["x"] = x
|
|
92
|
-
if y is not None:
|
|
93
|
-
encodings["y"] = y
|
|
94
|
-
if color is not None:
|
|
95
|
-
encodings["color"] = color
|
|
96
|
-
return (
|
|
97
|
-
self._chart.mark_bar(tooltip=True)
|
|
98
|
-
.encode(**encodings, **kwargs)
|
|
99
|
-
.interactive()
|
|
100
|
-
)
|
|
101
|
-
|
|
102
|
-
def line(
|
|
103
|
-
self,
|
|
104
|
-
x: X | None = None,
|
|
105
|
-
y: Y | None = None,
|
|
106
|
-
color: Color | None = None,
|
|
107
|
-
order: Order | None = None,
|
|
108
|
-
/,
|
|
109
|
-
**kwargs: Unpack[EncodeKwds],
|
|
110
|
-
) -> alt.Chart:
|
|
111
|
-
"""
|
|
112
|
-
Draw line plot.
|
|
113
|
-
|
|
114
|
-
Polars does not implement plotting logic itself but instead defers to
|
|
115
|
-
`Altair <https://altair-viz.github.io/>`_.
|
|
116
|
-
|
|
117
|
-
`df.plot.line(**kwargs)` is shorthand for
|
|
118
|
-
`alt.Chart(df).mark_line().encode(**kwargs).interactive()`,
|
|
119
|
-
and is provided for convenience - for full customisability, use a plotting
|
|
120
|
-
library directly.
|
|
121
|
-
|
|
122
|
-
.. versionchanged:: 1.6.0
|
|
123
|
-
In prior versions of Polars, HvPlot was the plotting backend. If you would
|
|
124
|
-
like to restore the previous plotting functionality, all you need to do
|
|
125
|
-
is add `import hvplot.polars` at the top of your script and replace
|
|
126
|
-
`df.plot` with `df.hvplot`.
|
|
127
|
-
|
|
128
|
-
Parameters
|
|
129
|
-
----------
|
|
130
|
-
x
|
|
131
|
-
Column with x-coordinates of lines.
|
|
132
|
-
y
|
|
133
|
-
Column with y-coordinates of lines.
|
|
134
|
-
color
|
|
135
|
-
Column to color lines by.
|
|
136
|
-
order
|
|
137
|
-
Column to use for order of data points in lines.
|
|
138
|
-
**kwargs
|
|
139
|
-
Additional keyword arguments passed to Altair.
|
|
140
|
-
|
|
141
|
-
Examples
|
|
142
|
-
--------
|
|
143
|
-
>>> from datetime import date
|
|
144
|
-
>>> df = pl.DataFrame(
|
|
145
|
-
... {
|
|
146
|
-
... "date": [date(2020, 1, 2), date(2020, 1, 3), date(2020, 1, 4)] * 2,
|
|
147
|
-
... "price": [1, 4, 6, 1, 5, 2],
|
|
148
|
-
... "stock": ["a", "a", "a", "b", "b", "b"],
|
|
149
|
-
... }
|
|
150
|
-
... )
|
|
151
|
-
>>> df.plot.line(x="date", y="price", color="stock") # doctest: +SKIP
|
|
152
|
-
"""
|
|
153
|
-
encodings: Encodings = {}
|
|
154
|
-
if x is not None:
|
|
155
|
-
encodings["x"] = x
|
|
156
|
-
if y is not None:
|
|
157
|
-
encodings["y"] = y
|
|
158
|
-
if color is not None:
|
|
159
|
-
encodings["color"] = color
|
|
160
|
-
if order is not None:
|
|
161
|
-
encodings["order"] = order
|
|
162
|
-
return (
|
|
163
|
-
self._chart.mark_line(tooltip=True)
|
|
164
|
-
.encode(**encodings, **kwargs)
|
|
165
|
-
.interactive()
|
|
166
|
-
)
|
|
167
|
-
|
|
168
|
-
def point(
|
|
169
|
-
self,
|
|
170
|
-
x: X | None = None,
|
|
171
|
-
y: Y | None = None,
|
|
172
|
-
color: Color | None = None,
|
|
173
|
-
size: Size | None = None,
|
|
174
|
-
/,
|
|
175
|
-
**kwargs: Unpack[EncodeKwds],
|
|
176
|
-
) -> alt.Chart:
|
|
177
|
-
"""
|
|
178
|
-
Draw scatter plot.
|
|
179
|
-
|
|
180
|
-
Polars does not implement plotting logic itself but instead defers to
|
|
181
|
-
`Altair <https://altair-viz.github.io/>`_.
|
|
182
|
-
|
|
183
|
-
`df.plot.point(**kwargs)` is shorthand for
|
|
184
|
-
`alt.Chart(df).mark_point().encode(**kwargs).interactive()`,
|
|
185
|
-
and is provided for convenience - for full customisability, use a plotting
|
|
186
|
-
library directly.
|
|
187
|
-
|
|
188
|
-
.. versionchanged:: 1.6.0
|
|
189
|
-
In prior versions of Polars, HvPlot was the plotting backend. If you would
|
|
190
|
-
like to restore the previous plotting functionality, all you need to do
|
|
191
|
-
is add `import hvplot.polars` at the top of your script and replace
|
|
192
|
-
`df.plot` with `df.hvplot`.
|
|
193
|
-
|
|
194
|
-
Parameters
|
|
195
|
-
----------
|
|
196
|
-
x
|
|
197
|
-
Column with x-coordinates of points.
|
|
198
|
-
y
|
|
199
|
-
Column with y-coordinates of points.
|
|
200
|
-
color
|
|
201
|
-
Column to color points by.
|
|
202
|
-
size
|
|
203
|
-
Column which determines points' sizes.
|
|
204
|
-
**kwargs
|
|
205
|
-
Additional keyword arguments passed to Altair.
|
|
206
|
-
|
|
207
|
-
Examples
|
|
208
|
-
--------
|
|
209
|
-
>>> df = pl.DataFrame(
|
|
210
|
-
... {
|
|
211
|
-
... "length": [1, 4, 6],
|
|
212
|
-
... "width": [4, 5, 6],
|
|
213
|
-
... "species": ["setosa", "setosa", "versicolor"],
|
|
214
|
-
... }
|
|
215
|
-
... )
|
|
216
|
-
>>> df.plot.point(x="length", y="width", color="species") # doctest: +SKIP
|
|
217
|
-
"""
|
|
218
|
-
encodings: Encodings = {}
|
|
219
|
-
if x is not None:
|
|
220
|
-
encodings["x"] = x
|
|
221
|
-
if y is not None:
|
|
222
|
-
encodings["y"] = y
|
|
223
|
-
if color is not None:
|
|
224
|
-
encodings["color"] = color
|
|
225
|
-
if size is not None:
|
|
226
|
-
encodings["size"] = size
|
|
227
|
-
return (
|
|
228
|
-
self._chart.mark_point(tooltip=True)
|
|
229
|
-
.encode(
|
|
230
|
-
**encodings,
|
|
231
|
-
**kwargs,
|
|
232
|
-
)
|
|
233
|
-
.interactive()
|
|
234
|
-
)
|
|
235
|
-
|
|
236
|
-
# Alias to `point` because of how common it is.
|
|
237
|
-
scatter = point
|
|
238
|
-
|
|
239
|
-
def __getattr__(self, attr: str) -> Callable[..., alt.Chart]:
|
|
240
|
-
method = getattr(self._chart, f"mark_{attr}", None)
|
|
241
|
-
if method is None:
|
|
242
|
-
msg = f"Altair has no method 'mark_{attr}'"
|
|
243
|
-
raise AttributeError(msg)
|
|
244
|
-
|
|
245
|
-
accepts_tooltip_argument = "tooltip" in {
|
|
246
|
-
value.name for value in inspect.signature(method).parameters.values()
|
|
247
|
-
}
|
|
248
|
-
if accepts_tooltip_argument:
|
|
249
|
-
|
|
250
|
-
def func(**kwargs: EncodeKwds) -> alt.Chart:
|
|
251
|
-
return method(tooltip=True).encode(**kwargs).interactive()
|
|
252
|
-
else:
|
|
253
|
-
|
|
254
|
-
def func(**kwargs: EncodeKwds) -> alt.Chart:
|
|
255
|
-
return method().encode(**kwargs).interactive()
|
|
256
|
-
|
|
257
|
-
return func
|
polars/datatype_expr/__init__.py
DELETED
polars/datatype_expr/array.py
DELETED
|
@@ -1,56 +0,0 @@
|
|
|
1
|
-
from __future__ import annotations
|
|
2
|
-
|
|
3
|
-
import polars._reexport as pl
|
|
4
|
-
|
|
5
|
-
|
|
6
|
-
class DataTypeExprArrNameSpace:
|
|
7
|
-
"""Namespace for arr datatype expressions."""
|
|
8
|
-
|
|
9
|
-
_accessor = "arr"
|
|
10
|
-
|
|
11
|
-
def __init__(self, expr: pl.DataTypeExpr) -> None:
|
|
12
|
-
self._pydatatype_expr = expr._pydatatype_expr
|
|
13
|
-
|
|
14
|
-
def inner_dtype(self) -> pl.DataTypeExpr:
|
|
15
|
-
"""Get the inner DataType of array."""
|
|
16
|
-
return pl.DataTypeExpr._from_pydatatype_expr(
|
|
17
|
-
self._pydatatype_expr.arr_inner_dtype()
|
|
18
|
-
)
|
|
19
|
-
|
|
20
|
-
def width(self) -> pl.Expr:
|
|
21
|
-
"""
|
|
22
|
-
Get the array width.
|
|
23
|
-
|
|
24
|
-
Examples
|
|
25
|
-
--------
|
|
26
|
-
>>> pl.select(pl.Array(pl.Int8, (1, 2, 3)).to_dtype_expr().arr.width())
|
|
27
|
-
shape: (1, 1)
|
|
28
|
-
┌─────────┐
|
|
29
|
-
│ literal │
|
|
30
|
-
│ --- │
|
|
31
|
-
│ u32 │
|
|
32
|
-
╞═════════╡
|
|
33
|
-
│ 1 │
|
|
34
|
-
└─────────┘
|
|
35
|
-
"""
|
|
36
|
-
return pl.Expr._from_pyexpr(self._pydatatype_expr.arr_width())
|
|
37
|
-
|
|
38
|
-
def shape(self) -> pl.Expr:
|
|
39
|
-
"""
|
|
40
|
-
Get the array shape.
|
|
41
|
-
|
|
42
|
-
Examples
|
|
43
|
-
--------
|
|
44
|
-
>>> pl.select(pl.Array(pl.Int8, (1, 2, 3)).to_dtype_expr().arr.shape())
|
|
45
|
-
shape: (3, 1)
|
|
46
|
-
┌─────────┐
|
|
47
|
-
│ literal │
|
|
48
|
-
│ --- │
|
|
49
|
-
│ u32 │
|
|
50
|
-
╞═════════╡
|
|
51
|
-
│ 1 │
|
|
52
|
-
│ 2 │
|
|
53
|
-
│ 3 │
|
|
54
|
-
└─────────┘
|
|
55
|
-
"""
|
|
56
|
-
return pl.Expr._from_pyexpr(self._pydatatype_expr.arr_shape())
|
polars/datatype_expr/datatype_expr.py
DELETED
|
@@ -1,304 +0,0 @@
|
|
|
1
|
-
from __future__ import annotations
|
|
2
|
-
|
|
3
|
-
from collections.abc import Mapping
|
|
4
|
-
from typing import TYPE_CHECKING
|
|
5
|
-
|
|
6
|
-
import polars._reexport as pl
|
|
7
|
-
from polars._utils.various import BUILDING_SPHINX_DOCS, sphinx_accessor
|
|
8
|
-
from polars.datatype_expr.array import DataTypeExprArrNameSpace
|
|
9
|
-
from polars.datatype_expr.list import DataTypeExprListNameSpace
|
|
10
|
-
from polars.datatype_expr.struct import DataTypeExprStructNameSpace
|
|
11
|
-
|
|
12
|
-
if TYPE_CHECKING:
|
|
13
|
-
import contextlib
|
|
14
|
-
from typing import ClassVar
|
|
15
|
-
|
|
16
|
-
from polars import DataType
|
|
17
|
-
from polars._typing import PolarsDataType, SchemaDict
|
|
18
|
-
|
|
19
|
-
with contextlib.suppress(ImportError): # Module not available when building docs
|
|
20
|
-
from polars._plr import PyDataTypeExpr
|
|
21
|
-
elif BUILDING_SPHINX_DOCS:
|
|
22
|
-
import sys
|
|
23
|
-
|
|
24
|
-
# note: we assign this way to work around an autocomplete issue in ipython/jedi
|
|
25
|
-
# (ref: https://github.com/davidhalter/jedi/issues/2057)
|
|
26
|
-
current_module = sys.modules[__name__]
|
|
27
|
-
current_module.property = sphinx_accessor
|
|
28
|
-
|
|
29
|
-
|
|
30
|
-
class DataTypeExpr:
|
|
31
|
-
"""
|
|
32
|
-
A lazily instantiated :class:`DataType` that can be used in an :class:`Expr`.
|
|
33
|
-
|
|
34
|
-
.. warning::
|
|
35
|
-
This functionality is considered **unstable**. It may be changed
|
|
36
|
-
at any point without it being considered a breaking change.
|
|
37
|
-
|
|
38
|
-
This expression is made to represent a :class:`DataType` that can be used to
|
|
39
|
-
reference a datatype in a lazy context.
|
|
40
|
-
|
|
41
|
-
Examples
|
|
42
|
-
--------
|
|
43
|
-
>>> lf = pl.LazyFrame({"a": [1, 2, 3]})
|
|
44
|
-
>>> lf.with_columns(
|
|
45
|
-
... pl.col.a.map_batches(lambda x: x * 2, return_dtype=pl.dtype_of("a"))
|
|
46
|
-
... ).collect()
|
|
47
|
-
shape: (3, 1)
|
|
48
|
-
┌─────┐
|
|
49
|
-
│ a │
|
|
50
|
-
│ --- │
|
|
51
|
-
│ i64 │
|
|
52
|
-
╞═════╡
|
|
53
|
-
│ 2 │
|
|
54
|
-
│ 4 │
|
|
55
|
-
│ 6 │
|
|
56
|
-
└─────┘
|
|
57
|
-
"""
|
|
58
|
-
|
|
59
|
-
# NOTE: This `= None` is needed to generate the docs with sphinx_accessor.
|
|
60
|
-
_pydatatype_expr: PyDataTypeExpr = None # type: ignore[assignment]
|
|
61
|
-
_accessors: ClassVar[set[str]] = {
|
|
62
|
-
"arr",
|
|
63
|
-
"enum",
|
|
64
|
-
"list",
|
|
65
|
-
"struct",
|
|
66
|
-
}
|
|
67
|
-
|
|
68
|
-
def __eq__(self, value: PolarsDataType | DataTypeExpr) -> pl.Expr: # type: ignore[override]
|
|
69
|
-
cmp_with: DataTypeExpr
|
|
70
|
-
if isinstance(value, pl.DataType):
|
|
71
|
-
cmp_with = value.to_dtype_expr()
|
|
72
|
-
elif isinstance(value, pl.DataTypeClass):
|
|
73
|
-
cmp_with = value.to_dtype_expr()
|
|
74
|
-
elif isinstance(value, DataTypeExpr):
|
|
75
|
-
cmp_with = value
|
|
76
|
-
else:
|
|
77
|
-
msg = f"cannot compare {self!r} to {value!r}"
|
|
78
|
-
raise TypeError(msg) from None
|
|
79
|
-
|
|
80
|
-
return pl.Expr._from_pyexpr(
|
|
81
|
-
self._pydatatype_expr.equals(cmp_with._pydatatype_expr)
|
|
82
|
-
)
|
|
83
|
-
|
|
84
|
-
def __ne__(self, value: PolarsDataType | DataTypeExpr) -> pl.Expr: # type: ignore[override]
|
|
85
|
-
return (self == value).not_()
|
|
86
|
-
|
|
87
|
-
@classmethod
|
|
88
|
-
def _from_pydatatype_expr(cls, pydatatype_expr: PyDataTypeExpr) -> DataTypeExpr:
|
|
89
|
-
slf = cls()
|
|
90
|
-
slf._pydatatype_expr = pydatatype_expr
|
|
91
|
-
return slf
|
|
92
|
-
|
|
93
|
-
def inner_dtype(self) -> DataTypeExpr:
|
|
94
|
-
"""Get the inner DataType of a List or Array."""
|
|
95
|
-
return DataTypeExpr._from_pydatatype_expr(self._pydatatype_expr.inner_dtype())
|
|
96
|
-
|
|
97
|
-
def display(self) -> pl.Expr:
|
|
98
|
-
"""
|
|
99
|
-
Get a formatted version of the output DataType.
|
|
100
|
-
|
|
101
|
-
Examples
|
|
102
|
-
--------
|
|
103
|
-
>>> df = pl.DataFrame(
|
|
104
|
-
... {
|
|
105
|
-
... "a": [1, 2, 3],
|
|
106
|
-
... "b": ["X", "Y", "Z"],
|
|
107
|
-
... "c": [1.3, 3.7, 4.2],
|
|
108
|
-
... }
|
|
109
|
-
... )
|
|
110
|
-
>>> df.select(
|
|
111
|
-
... a=pl.dtype_of("a").display(),
|
|
112
|
-
... b=pl.dtype_of("b").display(),
|
|
113
|
-
... c=pl.dtype_of("c").display(),
|
|
114
|
-
... ).transpose(include_header=True, column_names=["dtype"])
|
|
115
|
-
shape: (3, 2)
|
|
116
|
-
┌────────┬───────┐
|
|
117
|
-
│ column ┆ dtype │
|
|
118
|
-
│ --- ┆ --- │
|
|
119
|
-
│ str ┆ str │
|
|
120
|
-
╞════════╪═══════╡
|
|
121
|
-
│ a ┆ i64 │
|
|
122
|
-
│ b ┆ str │
|
|
123
|
-
│ c ┆ f64 │
|
|
124
|
-
└────────┴───────┘
|
|
125
|
-
"""
|
|
126
|
-
return pl.Expr._from_pyexpr(self._pydatatype_expr.display())
|
|
127
|
-
|
|
128
|
-
def matches(self, selector: pl.Selector) -> pl.Expr:
|
|
129
|
-
"""
|
|
130
|
-
Get whether the output DataType matches a certain selector.
|
|
131
|
-
|
|
132
|
-
Examples
|
|
133
|
-
--------
|
|
134
|
-
>>> import polars.selectors as cs
|
|
135
|
-
>>> pl.DataFrame(
|
|
136
|
-
... {
|
|
137
|
-
... "a": [1, 2, 3],
|
|
138
|
-
... }
|
|
139
|
-
... ).select(
|
|
140
|
-
... a_is_string=pl.dtype_of("a").matches(cs.string()),
|
|
141
|
-
... a_is_integer=pl.dtype_of("a").matches(cs.integer()),
|
|
142
|
-
... )
|
|
143
|
-
shape: (1, 2)
|
|
144
|
-
┌─────────────┬──────────────┐
|
|
145
|
-
│ a_is_string ┆ a_is_integer │
|
|
146
|
-
│ --- ┆ --- │
|
|
147
|
-
│ bool ┆ bool │
|
|
148
|
-
╞═════════════╪══════════════╡
|
|
149
|
-
│ false ┆ true │
|
|
150
|
-
└─────────────┴──────────────┘
|
|
151
|
-
"""
|
|
152
|
-
return pl.Expr._from_pyexpr(self._pydatatype_expr.matches(selector._pyselector))
|
|
153
|
-
|
|
154
|
-
def wrap_in_list(self) -> DataTypeExpr:
|
|
155
|
-
"""
|
|
156
|
-
Get the DataType wrapped in a list.
|
|
157
|
-
|
|
158
|
-
Examples
|
|
159
|
-
--------
|
|
160
|
-
>>> pl.Int32.to_dtype_expr().wrap_in_list().collect_dtype({})
|
|
161
|
-
List(Int32)
|
|
162
|
-
|
|
163
|
-
"""
|
|
164
|
-
return DataTypeExpr._from_pydatatype_expr(self._pydatatype_expr.wrap_in_list())
|
|
165
|
-
|
|
166
|
-
def wrap_in_array(self, *, width: int) -> DataTypeExpr:
|
|
167
|
-
"""
|
|
168
|
-
Get the DataType wrapped in an array.
|
|
169
|
-
|
|
170
|
-
Examples
|
|
171
|
-
--------
|
|
172
|
-
>>> pl.Int32.to_dtype_expr().wrap_in_array(width=5).collect_dtype({})
|
|
173
|
-
Array(Int32, shape=(5,))
|
|
174
|
-
"""
|
|
175
|
-
return DataTypeExpr._from_pydatatype_expr(
|
|
176
|
-
self._pydatatype_expr.wrap_in_array(width)
|
|
177
|
-
)
|
|
178
|
-
|
|
179
|
-
def to_unsigned_integer(self) -> pl.DataTypeExpr:
|
|
180
|
-
"""
|
|
181
|
-
Get the unsigned integer version of the same bitsize.
|
|
182
|
-
|
|
183
|
-
Examples
|
|
184
|
-
--------
|
|
185
|
-
>>> int32 = pl.Int32.to_dtype_expr()
|
|
186
|
-
>>> int32.to_unsigned_integer().collect_dtype({})
|
|
187
|
-
UInt32
|
|
188
|
-
"""
|
|
189
|
-
return pl.DataTypeExpr._from_pydatatype_expr(
|
|
190
|
-
self._pydatatype_expr.to_unsigned_integer()
|
|
191
|
-
)
|
|
192
|
-
|
|
193
|
-
def to_signed_integer(self) -> pl.DataTypeExpr:
|
|
194
|
-
"""
|
|
195
|
-
Get the signed integer version of the same bitsize.
|
|
196
|
-
|
|
197
|
-
Examples
|
|
198
|
-
--------
|
|
199
|
-
>>> uint32 = pl.UInt32.to_dtype_expr()
|
|
200
|
-
>>> uint32.to_signed_integer().collect_dtype({})
|
|
201
|
-
Int32
|
|
202
|
-
"""
|
|
203
|
-
return pl.DataTypeExpr._from_pydatatype_expr(
|
|
204
|
-
self._pydatatype_expr.to_signed_integer()
|
|
205
|
-
)
|
|
206
|
-
|
|
207
|
-
def default_value(
|
|
208
|
-
self,
|
|
209
|
-
n: int = 1,
|
|
210
|
-
*,
|
|
211
|
-
numeric_to_one: bool = False,
|
|
212
|
-
num_list_values: int = 0,
|
|
213
|
-
) -> pl.Expr:
|
|
214
|
-
"""
|
|
215
|
-
Get a default value of a specific type.
|
|
216
|
-
|
|
217
|
-
- Integers and floats are their zero value as default, unless otherwise
|
|
218
|
-
specified
|
|
219
|
-
- Temporals are a physical zero as default
|
|
220
|
-
- `pl.Decimal` is zero as default
|
|
221
|
-
- `pl.String` and `pl.Binary` are an empty string
|
|
222
|
-
- `pl.List` is an empty list, unless otherwise specified
|
|
223
|
-
- `pl.Array` is the inner default value repeated over the shape
|
|
224
|
-
- `pl.Struct` is the inner default value for all fields
|
|
225
|
-
- `pl.Enum` is the first category if it exists
|
|
226
|
-
- `pl.Null`, `pl.Object` and `pl.Categorical` are `null`.
|
|
227
|
-
|
|
228
|
-
Parameters
|
|
229
|
-
----------
|
|
230
|
-
n
|
|
231
|
-
Number of times you want the value
|
|
232
|
-
numeric_to_one
|
|
233
|
-
Use `1` instead of `0` as the default value for numeric types
|
|
234
|
-
num_list_values
|
|
235
|
-
The amount of values a list contains
|
|
236
|
-
|
|
237
|
-
Examples
|
|
238
|
-
--------
|
|
239
|
-
>>> uint32 = pl.UInt32.to_dtype_expr()
|
|
240
|
-
>>> pl.select(default=uint32.default_value())
|
|
241
|
-
shape: (1, 1)
|
|
242
|
-
┌─────────┐
|
|
243
|
-
│ default │
|
|
244
|
-
│ --- │
|
|
245
|
-
│ u32 │
|
|
246
|
-
╞═════════╡
|
|
247
|
-
│ 0 │
|
|
248
|
-
└─────────┘
|
|
249
|
-
"""
|
|
250
|
-
return pl.Expr._from_pyexpr(
|
|
251
|
-
self._pydatatype_expr.default_value(
|
|
252
|
-
n=n, numeric_to_one=numeric_to_one, num_list_values=num_list_values
|
|
253
|
-
)
|
|
254
|
-
)
|
|
255
|
-
|
|
256
|
-
@property
|
|
257
|
-
def list(self) -> DataTypeExprListNameSpace:
|
|
258
|
-
"""Create an object namespace of all list related methods."""
|
|
259
|
-
return DataTypeExprListNameSpace(self)
|
|
260
|
-
|
|
261
|
-
@property
|
|
262
|
-
def arr(self) -> DataTypeExprArrNameSpace:
|
|
263
|
-
"""Create an object namespace of all array related methods."""
|
|
264
|
-
return DataTypeExprArrNameSpace(self)
|
|
265
|
-
|
|
266
|
-
@property
|
|
267
|
-
def struct(self) -> DataTypeExprStructNameSpace:
|
|
268
|
-
"""Create an object namespace of all struct related methods."""
|
|
269
|
-
return DataTypeExprStructNameSpace(self)
|
|
270
|
-
|
|
271
|
-
def collect_dtype(
|
|
272
|
-
self, context: SchemaDict | pl.Schema | pl.DataFrame | pl.LazyFrame
|
|
273
|
-
) -> DataType:
|
|
274
|
-
"""
|
|
275
|
-
Materialize the :class:`DataTypeExpr` in a specific context.
|
|
276
|
-
|
|
277
|
-
This is a useful function when debugging datatype expressions.
|
|
278
|
-
|
|
279
|
-
Examples
|
|
280
|
-
--------
|
|
281
|
-
>>> lf = pl.LazyFrame(
|
|
282
|
-
... {
|
|
283
|
-
... "a": [1, 2, 3],
|
|
284
|
-
... }
|
|
285
|
-
... )
|
|
286
|
-
>>> pl.dtype_of("a").collect_dtype(lf)
|
|
287
|
-
Int64
|
|
288
|
-
>>> pl.dtype_of("a").collect_dtype({"a": pl.String})
|
|
289
|
-
String
|
|
290
|
-
"""
|
|
291
|
-
schema: pl.Schema
|
|
292
|
-
if isinstance(context, pl.Schema):
|
|
293
|
-
schema = context
|
|
294
|
-
elif isinstance(context, Mapping):
|
|
295
|
-
schema = pl.Schema(context)
|
|
296
|
-
elif isinstance(context, pl.DataFrame):
|
|
297
|
-
schema = context.schema
|
|
298
|
-
elif isinstance(context, pl.LazyFrame):
|
|
299
|
-
schema = context.collect_schema()
|
|
300
|
-
else:
|
|
301
|
-
msg = f"DataTypeExpr.collect_dtype did not expect {context!r}"
|
|
302
|
-
raise TypeError(msg)
|
|
303
|
-
|
|
304
|
-
return self._pydatatype_expr.collect_dtype(schema)
|
polars/datatype_expr/list.py
DELETED
|
@@ -1,18 +0,0 @@
|
|
|
1
|
-
from __future__ import annotations
|
|
2
|
-
|
|
3
|
-
import polars._reexport as pl
|
|
4
|
-
|
|
5
|
-
|
|
6
|
-
class DataTypeExprListNameSpace:
|
|
7
|
-
"""Namespace for list datatype expressions."""
|
|
8
|
-
|
|
9
|
-
_accessor = "list"
|
|
10
|
-
|
|
11
|
-
def __init__(self, expr: pl.DataTypeExpr) -> None:
|
|
12
|
-
self._pydatatype_expr = expr._pydatatype_expr
|
|
13
|
-
|
|
14
|
-
def inner_dtype(self) -> pl.DataTypeExpr:
|
|
15
|
-
"""Get the inner DataType of list."""
|
|
16
|
-
return pl.DataTypeExpr._from_pydatatype_expr(
|
|
17
|
-
self._pydatatype_expr.list_inner_dtype()
|
|
18
|
-
)
|