polars-df 0.12.0-arm64-darwin → 0.14.0-arm64-darwin
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/CHANGELOG.md +11 -0
- data/Cargo.lock +331 -316
- data/LICENSE-THIRD-PARTY.txt +1095 -1301
- data/lib/polars/3.1/polars.bundle +0 -0
- data/lib/polars/3.2/polars.bundle +0 -0
- data/lib/polars/3.3/polars.bundle +0 -0
- data/lib/polars/data_frame.rb +10 -10
- data/lib/polars/expr.rb +6 -6
- data/lib/polars/io/ipc.rb +28 -8
- data/lib/polars/io/parquet.rb +10 -4
- data/lib/polars/lazy_frame.rb +5 -1
- data/lib/polars/series.rb +8 -7
- data/lib/polars/string_expr.rb +9 -9
- data/lib/polars/version.rb +1 -1
- metadata +2 -2
| Binary file | 
| Binary file | 
| Binary file | 
    
        data/lib/polars/data_frame.rb
    CHANGED
    
    | @@ -2426,15 +2426,15 @@ module Polars | |
| 2426 2426 | 
             
                #   df.map_rows { |t| t[0] * 2 + t[1] }
         | 
| 2427 2427 | 
             
                #   # =>
         | 
| 2428 2428 | 
             
                #   # shape: (3, 1)
         | 
| 2429 | 
            -
                #   #  | 
| 2430 | 
            -
                #   # │  | 
| 2431 | 
            -
                #   # │ --- | 
| 2432 | 
            -
                #   # │ i64 | 
| 2433 | 
            -
                #   #  | 
| 2434 | 
            -
                #   # │ 1 | 
| 2435 | 
            -
                #   # │ 9 | 
| 2436 | 
            -
                #   # │ 14 | 
| 2437 | 
            -
                #   #  | 
| 2429 | 
            +
                #   # ┌─────┐
         | 
| 2430 | 
            +
                #   # │ map │
         | 
| 2431 | 
            +
                #   # │ --- │
         | 
| 2432 | 
            +
                #   # │ i64 │
         | 
| 2433 | 
            +
                #   # ╞═════╡
         | 
| 2434 | 
            +
                #   # │ 1   │
         | 
| 2435 | 
            +
                #   # │ 9   │
         | 
| 2436 | 
            +
                #   # │ 14  │
         | 
| 2437 | 
            +
                #   # └─────┘
         | 
| 2438 2438 | 
             
                def map_rows(return_dtype: nil, inference_size: 256, &f)
         | 
| 2439 2439 | 
             
                  out, is_df = _df.map_rows(f, return_dtype, inference_size)
         | 
| 2440 2440 | 
             
                  if is_df
         | 
| @@ -4234,7 +4234,7 @@ module Polars | |
| 4234 4234 | 
             
                  if n.nil? && !frac.nil?
         | 
| 4235 4235 | 
             
                    frac = Series.new("frac", [frac]) unless frac.is_a?(Series)
         | 
| 4236 4236 |  | 
| 4237 | 
            -
                    _from_rbdf(
         | 
| 4237 | 
            +
                    return _from_rbdf(
         | 
| 4238 4238 | 
             
                      _df.sample_frac(frac._s, with_replacement, shuffle, seed)
         | 
| 4239 4239 | 
             
                    )
         | 
| 4240 4240 | 
             
                  end
         | 
    
        data/lib/polars/expr.rb
    CHANGED
    
    | @@ -1182,7 +1182,7 @@ module Polars | |
| 1182 1182 | 
             
                #       "b" => [1, 1, 2, 2]
         | 
| 1183 1183 | 
             
                #     }
         | 
| 1184 1184 | 
             
                #   )
         | 
| 1185 | 
            -
                #   df.select(Polars.all.mode)
         | 
| 1185 | 
            +
                #   df.select(Polars.all.mode.first)
         | 
| 1186 1186 | 
             
                #   # =>
         | 
| 1187 1187 | 
             
                #   # shape: (2, 2)
         | 
| 1188 1188 | 
             
                #   # ┌─────┬─────┐
         | 
| @@ -6015,12 +6015,12 @@ module Polars | |
| 6015 6015 | 
             
                #   # ┌──────┐
         | 
| 6016 6016 | 
             
                #   # │ a    │
         | 
| 6017 6017 | 
             
                #   # │ ---  │
         | 
| 6018 | 
            -
                #   # │  | 
| 6018 | 
            +
                #   # │ f64  │
         | 
| 6019 6019 | 
             
                #   # ╞══════╡
         | 
| 6020 | 
            -
                #   # │ -1 | 
| 6021 | 
            -
                #   # │ 0 | 
| 6022 | 
            -
                #   # │ 0 | 
| 6023 | 
            -
                #   # │ 1 | 
| 6020 | 
            +
                #   # │ -1.0 │
         | 
| 6021 | 
            +
                #   # │ -0.0 │
         | 
| 6022 | 
            +
                #   # │ 0.0  │
         | 
| 6023 | 
            +
                #   # │ 1.0  │
         | 
| 6024 6024 | 
             
                #   # │ null │
         | 
| 6025 6025 | 
             
                #   # └──────┘
         | 
| 6026 6026 | 
             
                def sign
         | 
    
        data/lib/polars/io/ipc.rb
    CHANGED
    
    | @@ -189,10 +189,18 @@ module Polars | |
| 189 189 | 
             
                #   Offset to start the row_count column (only use if the name is set).
         | 
| 190 190 | 
             
                # @param storage_options [Hash]
         | 
| 191 191 | 
             
                #   Extra options that make sense for a particular storage connection.
         | 
| 192 | 
            -
                # @param  | 
| 193 | 
            -
                #    | 
| 194 | 
            -
                #    | 
| 195 | 
            -
                #    | 
| 192 | 
            +
                # @param hive_partitioning [Boolean]
         | 
| 193 | 
            +
                #   Infer statistics and schema from Hive partitioned URL and use them
         | 
| 194 | 
            +
                #   to prune reads. This is unset by default (i.e. `nil`), meaning it is
         | 
| 195 | 
            +
                #   automatically enabled when a single directory is passed, and otherwise
         | 
| 196 | 
            +
                #   disabled.
         | 
| 197 | 
            +
                # @param hive_schema [Hash]
         | 
| 198 | 
            +
                #   The column names and data types of the columns by which the data is partitioned.
         | 
| 199 | 
            +
                #   If set to `nil` (default), the schema of the Hive partitions is inferred.
         | 
| 200 | 
            +
                # @param try_parse_hive_dates [Boolean]
         | 
| 201 | 
            +
                #   Whether to try parsing hive values as date/datetime types.
         | 
| 202 | 
            +
                # @param include_file_paths [String]
         | 
| 203 | 
            +
                #   Include the path of the source file(s) as a column with this name.
         | 
| 196 204 | 
             
                #
         | 
| 197 205 | 
             
                # @return [LazyFrame]
         | 
| 198 206 | 
             
                def scan_ipc(
         | 
| @@ -203,7 +211,10 @@ module Polars | |
| 203 211 | 
             
                  row_count_name: nil,
         | 
| 204 212 | 
             
                  row_count_offset: 0,
         | 
| 205 213 | 
             
                  storage_options: nil,
         | 
| 206 | 
            -
                   | 
| 214 | 
            +
                  hive_partitioning: nil,
         | 
| 215 | 
            +
                  hive_schema: nil,
         | 
| 216 | 
            +
                  try_parse_hive_dates: true,
         | 
| 217 | 
            +
                  include_file_paths: nil
         | 
| 207 218 | 
             
                )
         | 
| 208 219 | 
             
                  _scan_ipc_impl(
         | 
| 209 220 | 
             
                    source,
         | 
| @@ -213,7 +224,10 @@ module Polars | |
| 213 224 | 
             
                    row_count_name: row_count_name,
         | 
| 214 225 | 
             
                    row_count_offset: row_count_offset,
         | 
| 215 226 | 
             
                    storage_options: storage_options,
         | 
| 216 | 
            -
                     | 
| 227 | 
            +
                    hive_partitioning: hive_partitioning,
         | 
| 228 | 
            +
                    hive_schema: hive_schema,
         | 
| 229 | 
            +
                    try_parse_hive_dates: try_parse_hive_dates,
         | 
| 230 | 
            +
                    include_file_paths: include_file_paths
         | 
| 217 231 | 
             
                  )
         | 
| 218 232 | 
             
                end
         | 
| 219 233 |  | 
| @@ -226,7 +240,10 @@ module Polars | |
| 226 240 | 
             
                  row_count_name: nil,
         | 
| 227 241 | 
             
                  row_count_offset: 0,
         | 
| 228 242 | 
             
                  storage_options: nil,
         | 
| 229 | 
            -
                   | 
| 243 | 
            +
                  hive_partitioning: nil,
         | 
| 244 | 
            +
                  hive_schema: nil,
         | 
| 245 | 
            +
                  try_parse_hive_dates: true,
         | 
| 246 | 
            +
                  include_file_paths: nil
         | 
| 230 247 | 
             
                )
         | 
| 231 248 | 
             
                  if Utils.pathlike?(file)
         | 
| 232 249 | 
             
                    file = Utils.normalize_filepath(file)
         | 
| @@ -239,7 +256,10 @@ module Polars | |
| 239 256 | 
             
                      cache,
         | 
| 240 257 | 
             
                      rechunk,
         | 
| 241 258 | 
             
                      Utils.parse_row_index_args(row_count_name, row_count_offset),
         | 
| 242 | 
            -
                       | 
| 259 | 
            +
                      hive_partitioning,
         | 
| 260 | 
            +
                      hive_schema,
         | 
| 261 | 
            +
                      try_parse_hive_dates,
         | 
| 262 | 
            +
                      include_file_paths
         | 
| 243 263 | 
             
                    )
         | 
| 244 264 | 
             
                  Utils.wrap_ldf(rblf)
         | 
| 245 265 | 
             
                end
         | 
    
        data/lib/polars/io/parquet.rb
    CHANGED
    
    | @@ -158,6 +158,8 @@ module Polars | |
| 158 158 | 
             
                #   Extra options that make sense for a particular storage connection.
         | 
| 159 159 | 
             
                # @param low_memory [Boolean]
         | 
| 160 160 | 
             
                #   Reduce memory pressure at the expense of performance.
         | 
| 161 | 
            +
                # @param include_file_paths [String]
         | 
| 162 | 
            +
                #  Include the path of the source file(s) as a column with this name.
         | 
| 161 163 | 
             
                #
         | 
| 162 164 | 
             
                # @return [LazyFrame]
         | 
| 163 165 | 
             
                def scan_parquet(
         | 
| @@ -170,7 +172,8 @@ module Polars | |
| 170 172 | 
             
                  row_count_name: nil,
         | 
| 171 173 | 
             
                  row_count_offset: 0,
         | 
| 172 174 | 
             
                  storage_options: nil,
         | 
| 173 | 
            -
                  low_memory: false
         | 
| 175 | 
            +
                  low_memory: false,
         | 
| 176 | 
            +
                  include_file_paths: nil
         | 
| 174 177 | 
             
                )
         | 
| 175 178 | 
             
                  if Utils.pathlike?(source)
         | 
| 176 179 | 
             
                    source = Utils.normalize_filepath(source)
         | 
| @@ -186,7 +189,8 @@ module Polars | |
| 186 189 | 
             
                    row_count_offset: row_count_offset,
         | 
| 187 190 | 
             
                    storage_options: storage_options,
         | 
| 188 191 | 
             
                    low_memory: low_memory,
         | 
| 189 | 
            -
                    glob: glob
         | 
| 192 | 
            +
                    glob: glob,
         | 
| 193 | 
            +
                    include_file_paths: include_file_paths
         | 
| 190 194 | 
             
                  )
         | 
| 191 195 | 
             
                end
         | 
| 192 196 |  | 
| @@ -203,7 +207,8 @@ module Polars | |
| 203 207 | 
             
                  low_memory: false,
         | 
| 204 208 | 
             
                  use_statistics: true,
         | 
| 205 209 | 
             
                  hive_partitioning: nil,
         | 
| 206 | 
            -
                  glob: true
         | 
| 210 | 
            +
                  glob: true,
         | 
| 211 | 
            +
                  include_file_paths: nil
         | 
| 207 212 | 
             
                )
         | 
| 208 213 | 
             
                  rblf =
         | 
| 209 214 | 
             
                    RbLazyFrame.new_from_parquet(
         | 
| @@ -219,7 +224,8 @@ module Polars | |
| 219 224 | 
             
                      hive_partitioning,
         | 
| 220 225 | 
             
                      nil,
         | 
| 221 226 | 
             
                      true,
         | 
| 222 | 
            -
                      glob
         | 
| 227 | 
            +
                      glob,
         | 
| 228 | 
            +
                      include_file_paths
         | 
| 223 229 | 
             
                    )
         | 
| 224 230 | 
             
                  Utils.wrap_ldf(rblf)
         | 
| 225 231 | 
             
                end
         | 
    
        data/lib/polars/lazy_frame.rb
    CHANGED
    
    | @@ -2526,11 +2526,15 @@ module Polars | |
| 2526 2526 | 
             
                  value_name: nil,
         | 
| 2527 2527 | 
             
                  streamable: true
         | 
| 2528 2528 | 
             
                )
         | 
| 2529 | 
            +
                  if !streamable
         | 
| 2530 | 
            +
                    warn "The `streamable` parameter for `LazyFrame.unpivot` is deprecated"
         | 
| 2531 | 
            +
                  end
         | 
| 2532 | 
            +
             | 
| 2529 2533 | 
             
                  on = on.nil? ? [] : Utils._expand_selectors(self, on)
         | 
| 2530 2534 | 
             
                  index = index.nil? ? [] : Utils._expand_selectors(self, index)
         | 
| 2531 2535 |  | 
| 2532 2536 | 
             
                  _from_rbldf(
         | 
| 2533 | 
            -
                    _ldf.unpivot(on, index, value_name, variable_name | 
| 2537 | 
            +
                    _ldf.unpivot(on, index, value_name, variable_name)
         | 
| 2534 2538 | 
             
                  )
         | 
| 2535 2539 | 
             
                end
         | 
| 2536 2540 | 
             
                alias_method :melt, :unpivot
         | 
    
        data/lib/polars/series.rb
    CHANGED
    
    | @@ -1790,9 +1790,10 @@ module Polars | |
| 1790 1790 | 
             
                # Use this to swiftly assert a Series does not have null values.
         | 
| 1791 1791 | 
             
                #
         | 
| 1792 1792 | 
             
                # @return [Boolean]
         | 
| 1793 | 
            -
                def  | 
| 1794 | 
            -
                  _s. | 
| 1793 | 
            +
                def has_nulls
         | 
| 1794 | 
            +
                  _s.has_nulls
         | 
| 1795 1795 | 
             
                end
         | 
| 1796 | 
            +
                alias_method :has_validity, :has_nulls
         | 
| 1796 1797 |  | 
| 1797 1798 | 
             
                # Check if the Series is empty.
         | 
| 1798 1799 | 
             
                #
         | 
| @@ -2605,12 +2606,12 @@ module Polars | |
| 2605 2606 | 
             
                #   s.sign
         | 
| 2606 2607 | 
             
                #   # =>
         | 
| 2607 2608 | 
             
                #   # shape: (5,)
         | 
| 2608 | 
            -
                #   # Series: 'a' [ | 
| 2609 | 
            +
                #   # Series: 'a' [f64]
         | 
| 2609 2610 | 
             
                #   # [
         | 
| 2610 | 
            -
                #   #         -1
         | 
| 2611 | 
            -
                #   #         0
         | 
| 2612 | 
            -
                #   #         0
         | 
| 2613 | 
            -
                #   #         1
         | 
| 2611 | 
            +
                #   #         -1.0
         | 
| 2612 | 
            +
                #   #         -0.0
         | 
| 2613 | 
            +
                #   #         0.0
         | 
| 2614 | 
            +
                #   #         1.0
         | 
| 2614 2615 | 
             
                #   #         null
         | 
| 2615 2616 | 
             
                #   # ]
         | 
| 2616 2617 | 
             
                def sign
         | 
    
        data/lib/polars/string_expr.rb
    CHANGED
    
    | @@ -792,15 +792,15 @@ module Polars | |
| 792 792 | 
             
                #   df.select(Polars.col("json").str.json_decode(dtype))
         | 
| 793 793 | 
             
                #   # =>
         | 
| 794 794 | 
             
                #   # shape: (3, 1)
         | 
| 795 | 
            -
                #   #  | 
| 796 | 
            -
                #   # │ json | 
| 797 | 
            -
                #   # │ --- | 
| 798 | 
            -
                #   # │ struct[2] | 
| 799 | 
            -
                #   #  | 
| 800 | 
            -
                #   # │ {1,true} | 
| 801 | 
            -
                #   # │  | 
| 802 | 
            -
                #   # │ {2,false} | 
| 803 | 
            -
                #   #  | 
| 795 | 
            +
                #   # ┌───────────┐
         | 
| 796 | 
            +
                #   # │ json      │
         | 
| 797 | 
            +
                #   # │ ---       │
         | 
| 798 | 
            +
                #   # │ struct[2] │
         | 
| 799 | 
            +
                #   # ╞═══════════╡
         | 
| 800 | 
            +
                #   # │ {1,true}  │
         | 
| 801 | 
            +
                #   # │ null      │
         | 
| 802 | 
            +
                #   # │ {2,false} │
         | 
| 803 | 
            +
                #   # └───────────┘
         | 
| 804 804 | 
             
                def json_decode(dtype = nil, infer_schema_length: 100)
         | 
| 805 805 | 
             
                  if !dtype.nil?
         | 
| 806 806 | 
             
                    dtype = Utils.rb_type_to_dtype(dtype)
         | 
    
        data/lib/polars/version.rb
    CHANGED
    
    
    
        metadata
    CHANGED
    
    | @@ -1,14 +1,14 @@ | |
| 1 1 | 
             
            --- !ruby/object:Gem::Specification
         | 
| 2 2 | 
             
            name: polars-df
         | 
| 3 3 | 
             
            version: !ruby/object:Gem::Version
         | 
| 4 | 
            -
              version: 0. | 
| 4 | 
            +
              version: 0.14.0
         | 
| 5 5 | 
             
            platform: arm64-darwin
         | 
| 6 6 | 
             
            authors:
         | 
| 7 7 | 
             
            - Andrew Kane
         | 
| 8 8 | 
             
            autorequire: 
         | 
| 9 9 | 
             
            bindir: bin
         | 
| 10 10 | 
             
            cert_chain: []
         | 
| 11 | 
            -
            date: 2024- | 
| 11 | 
            +
            date: 2024-09-17 00:00:00.000000000 Z
         | 
| 12 12 | 
             
            dependencies:
         | 
| 13 13 | 
             
            - !ruby/object:Gem::Dependency
         | 
| 14 14 | 
             
              name: bigdecimal
         |