polars-df 0.12.0-arm64-darwin → 0.14.0-arm64-darwin
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/CHANGELOG.md +11 -0
- data/Cargo.lock +331 -316
- data/LICENSE-THIRD-PARTY.txt +1095 -1301
- data/lib/polars/3.1/polars.bundle +0 -0
- data/lib/polars/3.2/polars.bundle +0 -0
- data/lib/polars/3.3/polars.bundle +0 -0
- data/lib/polars/data_frame.rb +10 -10
- data/lib/polars/expr.rb +6 -6
- data/lib/polars/io/ipc.rb +28 -8
- data/lib/polars/io/parquet.rb +10 -4
- data/lib/polars/lazy_frame.rb +5 -1
- data/lib/polars/series.rb +8 -7
- data/lib/polars/string_expr.rb +9 -9
- data/lib/polars/version.rb +1 -1
- metadata +2 -2
Binary file
|
Binary file
|
Binary file
|
data/lib/polars/data_frame.rb
CHANGED
@@ -2426,15 +2426,15 @@ module Polars
|
|
2426
2426
|
# df.map_rows { |t| t[0] * 2 + t[1] }
|
2427
2427
|
# # =>
|
2428
2428
|
# # shape: (3, 1)
|
2429
|
-
# #
|
2430
|
-
# # │
|
2431
|
-
# # │ ---
|
2432
|
-
# # │ i64
|
2433
|
-
# #
|
2434
|
-
# # │ 1
|
2435
|
-
# # │ 9
|
2436
|
-
# # │ 14
|
2437
|
-
# #
|
2429
|
+
# # ┌─────┐
|
2430
|
+
# # │ map │
|
2431
|
+
# # │ --- │
|
2432
|
+
# # │ i64 │
|
2433
|
+
# # ╞═════╡
|
2434
|
+
# # │ 1 │
|
2435
|
+
# # │ 9 │
|
2436
|
+
# # │ 14 │
|
2437
|
+
# # └─────┘
|
2438
2438
|
def map_rows(return_dtype: nil, inference_size: 256, &f)
|
2439
2439
|
out, is_df = _df.map_rows(f, return_dtype, inference_size)
|
2440
2440
|
if is_df
|
@@ -4234,7 +4234,7 @@ module Polars
|
|
4234
4234
|
if n.nil? && !frac.nil?
|
4235
4235
|
frac = Series.new("frac", [frac]) unless frac.is_a?(Series)
|
4236
4236
|
|
4237
|
-
_from_rbdf(
|
4237
|
+
return _from_rbdf(
|
4238
4238
|
_df.sample_frac(frac._s, with_replacement, shuffle, seed)
|
4239
4239
|
)
|
4240
4240
|
end
|
data/lib/polars/expr.rb
CHANGED
@@ -1182,7 +1182,7 @@ module Polars
|
|
1182
1182
|
# "b" => [1, 1, 2, 2]
|
1183
1183
|
# }
|
1184
1184
|
# )
|
1185
|
-
# df.select(Polars.all.mode)
|
1185
|
+
# df.select(Polars.all.mode.first)
|
1186
1186
|
# # =>
|
1187
1187
|
# # shape: (2, 2)
|
1188
1188
|
# # ┌─────┬─────┐
|
@@ -6015,12 +6015,12 @@ module Polars
|
|
6015
6015
|
# # ┌──────┐
|
6016
6016
|
# # │ a │
|
6017
6017
|
# # │ --- │
|
6018
|
-
# # │
|
6018
|
+
# # │ f64 │
|
6019
6019
|
# # ╞══════╡
|
6020
|
-
# # │ -1
|
6021
|
-
# # │ 0
|
6022
|
-
# # │ 0
|
6023
|
-
# # │ 1
|
6020
|
+
# # │ -1.0 │
|
6021
|
+
# # │ -0.0 │
|
6022
|
+
# # │ 0.0 │
|
6023
|
+
# # │ 1.0 │
|
6024
6024
|
# # │ null │
|
6025
6025
|
# # └──────┘
|
6026
6026
|
def sign
|
data/lib/polars/io/ipc.rb
CHANGED
@@ -189,10 +189,18 @@ module Polars
|
|
189
189
|
# Offset to start the row_count column (only use if the name is set).
|
190
190
|
# @param storage_options [Hash]
|
191
191
|
# Extra options that make sense for a particular storage connection.
|
192
|
-
# @param
|
193
|
-
#
|
194
|
-
#
|
195
|
-
#
|
192
|
+
# @param hive_partitioning [Boolean]
|
193
|
+
# Infer statistics and schema from Hive partitioned URL and use them
|
194
|
+
# to prune reads. This is unset by default (i.e. `nil`), meaning it is
|
195
|
+
# automatically enabled when a single directory is passed, and otherwise
|
196
|
+
# disabled.
|
197
|
+
# @param hive_schema [Hash]
|
198
|
+
# The column names and data types of the columns by which the data is partitioned.
|
199
|
+
# If set to `nil` (default), the schema of the Hive partitions is inferred.
|
200
|
+
# @param try_parse_hive_dates [Boolean]
|
201
|
+
# Whether to try parsing hive values as date/datetime types.
|
202
|
+
# @param include_file_paths [String]
|
203
|
+
# Include the path of the source file(s) as a column with this name.
|
196
204
|
#
|
197
205
|
# @return [LazyFrame]
|
198
206
|
def scan_ipc(
|
@@ -203,7 +211,10 @@ module Polars
|
|
203
211
|
row_count_name: nil,
|
204
212
|
row_count_offset: 0,
|
205
213
|
storage_options: nil,
|
206
|
-
|
214
|
+
hive_partitioning: nil,
|
215
|
+
hive_schema: nil,
|
216
|
+
try_parse_hive_dates: true,
|
217
|
+
include_file_paths: nil
|
207
218
|
)
|
208
219
|
_scan_ipc_impl(
|
209
220
|
source,
|
@@ -213,7 +224,10 @@ module Polars
|
|
213
224
|
row_count_name: row_count_name,
|
214
225
|
row_count_offset: row_count_offset,
|
215
226
|
storage_options: storage_options,
|
216
|
-
|
227
|
+
hive_partitioning: hive_partitioning,
|
228
|
+
hive_schema: hive_schema,
|
229
|
+
try_parse_hive_dates: try_parse_hive_dates,
|
230
|
+
include_file_paths: include_file_paths
|
217
231
|
)
|
218
232
|
end
|
219
233
|
|
@@ -226,7 +240,10 @@ module Polars
|
|
226
240
|
row_count_name: nil,
|
227
241
|
row_count_offset: 0,
|
228
242
|
storage_options: nil,
|
229
|
-
|
243
|
+
hive_partitioning: nil,
|
244
|
+
hive_schema: nil,
|
245
|
+
try_parse_hive_dates: true,
|
246
|
+
include_file_paths: nil
|
230
247
|
)
|
231
248
|
if Utils.pathlike?(file)
|
232
249
|
file = Utils.normalize_filepath(file)
|
@@ -239,7 +256,10 @@ module Polars
|
|
239
256
|
cache,
|
240
257
|
rechunk,
|
241
258
|
Utils.parse_row_index_args(row_count_name, row_count_offset),
|
242
|
-
|
259
|
+
hive_partitioning,
|
260
|
+
hive_schema,
|
261
|
+
try_parse_hive_dates,
|
262
|
+
include_file_paths
|
243
263
|
)
|
244
264
|
Utils.wrap_ldf(rblf)
|
245
265
|
end
|
data/lib/polars/io/parquet.rb
CHANGED
@@ -158,6 +158,8 @@ module Polars
|
|
158
158
|
# Extra options that make sense for a particular storage connection.
|
159
159
|
# @param low_memory [Boolean]
|
160
160
|
# Reduce memory pressure at the expense of performance.
|
161
|
+
# @param include_file_paths [String]
|
162
|
+
# Include the path of the source file(s) as a column with this name.
|
161
163
|
#
|
162
164
|
# @return [LazyFrame]
|
163
165
|
def scan_parquet(
|
@@ -170,7 +172,8 @@ module Polars
|
|
170
172
|
row_count_name: nil,
|
171
173
|
row_count_offset: 0,
|
172
174
|
storage_options: nil,
|
173
|
-
low_memory: false
|
175
|
+
low_memory: false,
|
176
|
+
include_file_paths: nil
|
174
177
|
)
|
175
178
|
if Utils.pathlike?(source)
|
176
179
|
source = Utils.normalize_filepath(source)
|
@@ -186,7 +189,8 @@ module Polars
|
|
186
189
|
row_count_offset: row_count_offset,
|
187
190
|
storage_options: storage_options,
|
188
191
|
low_memory: low_memory,
|
189
|
-
glob: glob
|
192
|
+
glob: glob,
|
193
|
+
include_file_paths: include_file_paths
|
190
194
|
)
|
191
195
|
end
|
192
196
|
|
@@ -203,7 +207,8 @@ module Polars
|
|
203
207
|
low_memory: false,
|
204
208
|
use_statistics: true,
|
205
209
|
hive_partitioning: nil,
|
206
|
-
glob: true
|
210
|
+
glob: true,
|
211
|
+
include_file_paths: nil
|
207
212
|
)
|
208
213
|
rblf =
|
209
214
|
RbLazyFrame.new_from_parquet(
|
@@ -219,7 +224,8 @@ module Polars
|
|
219
224
|
hive_partitioning,
|
220
225
|
nil,
|
221
226
|
true,
|
222
|
-
glob
|
227
|
+
glob,
|
228
|
+
include_file_paths
|
223
229
|
)
|
224
230
|
Utils.wrap_ldf(rblf)
|
225
231
|
end
|
data/lib/polars/lazy_frame.rb
CHANGED
@@ -2526,11 +2526,15 @@ module Polars
|
|
2526
2526
|
value_name: nil,
|
2527
2527
|
streamable: true
|
2528
2528
|
)
|
2529
|
+
if !streamable
|
2530
|
+
warn "The `streamable` parameter for `LazyFrame.unpivot` is deprecated"
|
2531
|
+
end
|
2532
|
+
|
2529
2533
|
on = on.nil? ? [] : Utils._expand_selectors(self, on)
|
2530
2534
|
index = index.nil? ? [] : Utils._expand_selectors(self, index)
|
2531
2535
|
|
2532
2536
|
_from_rbldf(
|
2533
|
-
_ldf.unpivot(on, index, value_name, variable_name
|
2537
|
+
_ldf.unpivot(on, index, value_name, variable_name)
|
2534
2538
|
)
|
2535
2539
|
end
|
2536
2540
|
alias_method :melt, :unpivot
|
data/lib/polars/series.rb
CHANGED
@@ -1790,9 +1790,10 @@ module Polars
|
|
1790
1790
|
# Use this to swiftly assert a Series does not have null values.
|
1791
1791
|
#
|
1792
1792
|
# @return [Boolean]
|
1793
|
-
def
|
1794
|
-
_s.
|
1793
|
+
def has_nulls
|
1794
|
+
_s.has_nulls
|
1795
1795
|
end
|
1796
|
+
alias_method :has_validity, :has_nulls
|
1796
1797
|
|
1797
1798
|
# Check if the Series is empty.
|
1798
1799
|
#
|
@@ -2605,12 +2606,12 @@ module Polars
|
|
2605
2606
|
# s.sign
|
2606
2607
|
# # =>
|
2607
2608
|
# # shape: (5,)
|
2608
|
-
# # Series: 'a' [
|
2609
|
+
# # Series: 'a' [f64]
|
2609
2610
|
# # [
|
2610
|
-
# # -1
|
2611
|
-
# # 0
|
2612
|
-
# # 0
|
2613
|
-
# # 1
|
2611
|
+
# # -1.0
|
2612
|
+
# # -0.0
|
2613
|
+
# # 0.0
|
2614
|
+
# # 1.0
|
2614
2615
|
# # null
|
2615
2616
|
# # ]
|
2616
2617
|
def sign
|
data/lib/polars/string_expr.rb
CHANGED
@@ -792,15 +792,15 @@ module Polars
|
|
792
792
|
# df.select(Polars.col("json").str.json_decode(dtype))
|
793
793
|
# # =>
|
794
794
|
# # shape: (3, 1)
|
795
|
-
# #
|
796
|
-
# # │ json
|
797
|
-
# # │ ---
|
798
|
-
# # │ struct[2]
|
799
|
-
# #
|
800
|
-
# # │ {1,true}
|
801
|
-
# # │
|
802
|
-
# # │ {2,false}
|
803
|
-
# #
|
795
|
+
# # ┌───────────┐
|
796
|
+
# # │ json │
|
797
|
+
# # │ --- │
|
798
|
+
# # │ struct[2] │
|
799
|
+
# # ╞═══════════╡
|
800
|
+
# # │ {1,true} │
|
801
|
+
# # │ null │
|
802
|
+
# # │ {2,false} │
|
803
|
+
# # └───────────┘
|
804
804
|
def json_decode(dtype = nil, infer_schema_length: 100)
|
805
805
|
if !dtype.nil?
|
806
806
|
dtype = Utils.rb_type_to_dtype(dtype)
|
data/lib/polars/version.rb
CHANGED
metadata
CHANGED
@@ -1,14 +1,14 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: polars-df
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 0.
|
4
|
+
version: 0.14.0
|
5
5
|
platform: arm64-darwin
|
6
6
|
authors:
|
7
7
|
- Andrew Kane
|
8
8
|
autorequire:
|
9
9
|
bindir: bin
|
10
10
|
cert_chain: []
|
11
|
-
date: 2024-
|
11
|
+
date: 2024-09-17 00:00:00.000000000 Z
|
12
12
|
dependencies:
|
13
13
|
- !ruby/object:Gem::Dependency
|
14
14
|
name: bigdecimal
|