RubyGems - red_amber - Versions diffs - 0.3.0 → 0.4.1 - Mend

red_amber 0.3.0 → 0.4.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (42) hide show

checksums.yaml +4 -4
data/.rubocop.yml +56 -22
data/.yardopts +2 -0
data/CHANGELOG.md +178 -0
data/Gemfile +1 -1
data/LICENSE +1 -1
data/README.md +29 -30
data/benchmark/basic.yml +7 -7
data/benchmark/combine.yml +3 -3
data/benchmark/dataframe.yml +15 -9
data/benchmark/group.yml +6 -6
data/benchmark/reshape.yml +6 -6
data/benchmark/vector.yml +6 -3
data/doc/DataFrame.md +32 -12
data/doc/DataFrame_Comparison.md +65 -0
data/doc/SubFrames.md +11 -0
data/doc/Vector.md +207 -1
data/doc/yard-templates/default/fulldoc/html/css/common.css +6 -0
data/lib/red_amber/data_frame.rb +454 -85
data/lib/red_amber/data_frame_combinable.rb +609 -115
data/lib/red_amber/data_frame_displayable.rb +313 -34
data/lib/red_amber/data_frame_indexable.rb +122 -19
data/lib/red_amber/data_frame_loadsave.rb +78 -10
data/lib/red_amber/data_frame_reshaping.rb +184 -14
data/lib/red_amber/data_frame_selectable.rb +623 -70
data/lib/red_amber/data_frame_variable_operation.rb +452 -35
data/lib/red_amber/group.rb +186 -22
data/lib/red_amber/helper.rb +74 -14
data/lib/red_amber/refinements.rb +26 -6
data/lib/red_amber/subframes.rb +1101 -0
data/lib/red_amber/vector.rb +362 -11
data/lib/red_amber/vector_aggregation.rb +312 -0
data/lib/red_amber/vector_binary_element_wise.rb +506 -0
data/lib/red_amber/vector_selectable.rb +265 -23
data/lib/red_amber/vector_unary_element_wise.rb +529 -0
data/lib/red_amber/vector_updatable.rb +278 -34
data/lib/red_amber/version.rb +2 -1
data/lib/red_amber.rb +13 -1
data/red_amber.gemspec +2 -2
metadata +13 -8
data/doc/image/dataframe/reshaping_DataFrames.png +0 -0
data/lib/red_amber/vector_functions.rb +0 -242

checksums.yaml CHANGED Viewed

@@ -1,7 +1,7 @@
 ---
 SHA256:
-  metadata.gz: 78fa72064f9494f0f756f15cf1daaacb3640535e899ba71ab080730c0d61b0b2
-  data.tar.gz: 3f2de4a449c38eb995ebcc0394a1a93633f097e533696edfa91267a596dcb580
+  metadata.gz: 264e7637475fd01946900335751a1592a3859e9bfa772ecc0800ab05c4d852f0
+  data.tar.gz: a57400445419698a66d6b5c94e15fa8c040f2f3930f9fbf75603ffb6e18bd9cf
 SHA512:
-  metadata.gz: 45a7c37cc746c606e8d4d2a43005da8154b60df21bf2cf6b2bafa9f7ad5f962a3e3c8e2f931e6543b20b8f6cd8c8a447b99b7f0127854d3bb716ea763ab3cae5
-  data.tar.gz: b3ac4479df1e30b75e7ccfcc48b09f709cea536c98072bfe937ae283c0cc1d203ab97388cf6f57c39fd31c6beceadcb850c3f14e8e07e5e196cc0c862634f36d
+  metadata.gz: 0fdbcdb732e36bb866a8251800ab3fa1a714fa075234bf8cd516f2542ab6704ebfa429a7177da2bd8cd6fa6eb1158efb0d68f46f43d1dc088a9a0f0debdc5c54
+  data.tar.gz: f9c1dffaa157ecf34b0b4fec6c1d7972b4773bbf7a11101a345172d621753cd9fc3818753b329dd2906a506af294d6a96c0180a0fb4dc84c2b54bceef6b520f5

data/.rubocop.yml CHANGED Viewed

@@ -31,16 +31,28 @@ Style/TrailingCommaInHashLiteral:
 # To let you know the possibility of refactoring ===
-# avoid unused variable asignment
-Rubycw/Rubycw:
+# Max: 120
+# This cop supports safe autocorrection (--autocorrect).
+# Configuration parameters: AllowHeredoc, AllowURI, URISchemes, IgnoreCopDirectives, AllowedPatterns, IgnoredPatterns.
+# URISchemes: http, https
+Layout/LineLength:
+  Max: 90
   Exclude:
     - 'test/**/*'
+# EnforcedStyle: aligned
+Layout/MultilineMethodCallIndentation:
+  EnforcedStyle: indented_relative_to_receiver
 # Disabled to define Vector operators
 # Offense count: 38
 Lint/BinaryOperatorWithIdenticalOperands:
   Exclude:
-    - 'test/test_vector_function.rb'
+    - 'test/test_vector_binary_element_wise.rb'
+Lint/Debugger:
+  Exclude:
+    - 'bin/example'
 # Need for test with empty block
 # Offense count: 1
@@ -55,15 +67,6 @@ Lint/UselessAssignment:
   Exclude:
     - 'test/**/*'
-# Max: 120
-# This cop supports safe autocorrection (--autocorrect).
-# Configuration parameters: AllowHeredoc, AllowURI, URISchemes, IgnoreCopDirectives, AllowedPatterns, IgnoredPatterns.
-# URISchemes: http, https
-Layout/LineLength:
-  Max: 90
-  Exclude:
-    - 'test/**/*'
 # <= 17 satisfactory
 # 18..30 unsatisfactory
 # > 30 dangerous
@@ -83,6 +86,7 @@ Metrics/AbcSize:
     'drop', # 31.42
     '[]', # 33.76
     'split', # 37.35
+    'aggregate', # 38.13
   ]
 # Max: 25
@@ -104,7 +108,9 @@ Metrics/ClassLength:
     - 'test/**/*'
     - 'lib/red_amber/data_frame.rb' # 162
     - 'lib/red_amber/group.rb' # 105
+    - 'lib/red_amber/subframes.rb' # 110
     - 'lib/red_amber/vector.rb' # 152
+    - 'lib/red_amber/vector_binary_element_wise.rb' # 109
 # Only for monitoring. I will measure by PerceivedComplexity.
 # Max: 7
@@ -113,14 +119,17 @@ Metrics/ClassLength:
 Metrics/CyclomaticComplexity:
   Max: 12
   AllowedMethods: [
-    'join', # 14
+    'split', # 33
     'format_table', # 21
+    'normalize_element', # 17
     'slice_by', # 16
+    'assign_update', # 14
+    'join', # 14
+    'parse_range', # 14
     'remove', # 14
-    'normalize_element', # 17
     '[]', # 13
-    'parse_range', # 14
-    'split', # 33
+    'drop', # 13
+    'aggregate', # 13
   ]
 # Max: 10
@@ -134,6 +143,8 @@ Metrics/MethodLength:
     'format_table', # 53
     'slice_by', # 38
     'assign_update', # 35
+    'drop', # 32
+    'aggregate', # 31
   ]
 # Max: 100
@@ -163,17 +174,24 @@ Metrics/ParameterLists:
 Metrics/PerceivedComplexity:
   Max: 10
   AllowedMethods: [
-    'join', # 14
-    'dataframe_info', # 13
     'format_table', # 22
     'slice_by', # 20
-    'remove', # 14
-    'drop', # 12
-    'filters', # 11
     'normalize_element', # 17
-    '[]', # 11
+    'assign_update', # 15
     'parse_range', # 15
+    'join', # 14
+    'remove', # 14
     'split', # 14
+    'dataframe_info', # 13
+    'replace', # 13
+    'drop', # 12
+    'initialize', # 12
+    'aggregate', # 12
+    '[]', # 11
+    'filters', # 11
+    'html_table', # 11
+    'slice', # 11
+    'pick', # 11
   ]
 # Offense count: 1
@@ -197,6 +215,18 @@ Naming/PredicateName:
     - 'lib/red_amber/vector_functions.rb'
     - 'lib/red_amber/vector_selectable.rb'
+# avoid unused variable assignment
+Rubycw/Rubycw:
+  Exclude:
+    - 'test/**/*'
+    - 'bin/example'
+# Offense count: 16
+# This cop supports safe autocorrection (--autocorrect).
+Style/OperatorMethodCall:
+  Exclude:
+    - 'test/test_vector_binary_element_wise.rb'
 # Necessary to test when range.end == -1
 # Offense count: 2
 # This cop supports unsafe autocorrection (--autocorrect-all).
@@ -204,6 +234,10 @@ Style/SlicingWithRange:
   Exclude:
     - 'test/test_data_frame_selectable.rb'
+Style/MixinUsage:
+  Exclude:
+    - 'bin/example'
 # Necessary to Vector < 0 element-wise comparison
 # Offense count: 5
 # This cop supports unsafe autocorrection (--autocorrect-all).

data/.yardopts CHANGED Viewed

@@ -1 +1,3 @@
 --output-dir doc/yard
+--template-path doc/yard-templates
+--use-cache

data/CHANGELOG.md CHANGED Viewed

@@ -1,3 +1,181 @@
+## [0.4.1] - 2023-03-11
+- Breaking change
+  - Remove Vector.aggregate? method (#200)
+- Bug fixes
+  - Return self in DataFrame#drop when dropper is empty (reverts 746ac263) (#193)
+  - Return self in DataFrame#rename when renaming to same name (#193)
+  - Return self in DataFrame#pick when pick itself (#199)
+  - Fix column width for non-ascii elements in DataFrame#to_s (#193)
+    - This change uses String#width.
+  - Fix DataFrame#to_iruby when data is date32 type (#193)
+  - Fix DataFrame#shorthand to show temporal type data simply (#193)
+  - Fix Vector#rank when data is ChunkedArray (#198)
+  - Fix Vector element-wise functions with nil as scalar (#198)
+  - Support :force_order for all methods of join family (#199)
+    - Supports :force_order option to force sorting after join for all #join family.
+    - This will be valuable in some cases such as large dataframes.
+  - Ensure baseframe's schema for SubFrames (#200)
+- New features and improvements
+  - Add Vector#first, #last method (#198)
+    - This method will be used in SubFrames feature.
+  - Add Vector#modulo method (#198)
+    - The divmod function in Arrow C++ is still in draft state.
+      This method was created by combining existing functions
+  - Add Vector#quotient method (#198)
+  - Add aliases #div, #mod, #mul, #pow, #quo and #sub for Vector (#198)
+  - Add Vector#*_checked functions (#198)
+    - These functions will check numeric range overflow.
+  - Add 'tdra' and 'plain' in display mode (#193)
+    - The plain mode and default inspect will show up to 128 rows and 128 columns.
+  - Add String#width method in refinements (#193)
+    - This will be used to update DataFrame#to_s.
+  - Introduce pre-loaded REPL environment (#199)
+    - This commit will add bin/example and it will start irb environment
+      with enabled commonly used datasets such as penguins, diamonds, etc.
+  - Upgrade SubFrames#aggregate to accept block (#200)
+- Refactoring
+  - Use symbolized keys in refinements of Table#keys, #key? (#193)
+    - This allows Tables and DataFrames to be treated in the same manner.
+  - Use key_name.succ in suffix of DataFrame#join (#193)
+    - This makes it simple to get a name candidate.
+  - Use ||= to memorize instance variables (#193)
+  - Refine vector projection to use #variables (#193)
+    - #variables is fastest when picking Vectors.
+  - Refine Vector#is_in to avoid #pack (#198)
+  - Refine Vector#index (#198)
+- Improve in tests/CI
+  - Tests
+    - Update benchmarks to test from older version (#193)
+    - Refine test of Vector function with scalar (#198)
+    - Refine test subframes and test_vector_selectable (#200)
+  - Cops
+  - CI
+- Documentation
+  - Update documents(small fix) (#201)
+- GitHub site
+- Thanks
+## [0.4.0] - 2023-02-25
+- Breaking change
+  - Upgrade dependency to Arrow 11.0.0 (#188)
+- Bug fixes
+  - Add :force_order option for DataFrame#join (#174)
+  - Return error for empty DataFrame in DataFrame#filter (#172)
+  - Accept ChunkedArray in DataFrame#filter (#172)
+  - Fix Vector#replace to accept Arrow::Array as a replacer (#179)
+  - Fix Vector#round_to_multiple to accept Float or Integer (#180)
+  - Change Vector atan2 to a class method (#180)
+  - Fix Vector#shift when boolean Vector (#184)
+  - Fix processing empty SubFrames (#183)
+  - Do not check object id in DataFrame#rename, #drop for self (#188)
+- New features and improvements
+  - Accept a block in DataFrame#filter (#172)
+  - Add Vector.aggregate? method (#175)
+  - Introduce Vector#propagate method (#175)
+  - Add Vector#rank methods (#176)
+  - Add Vector#sample method (#176)
+  - Add Vector#sort method (#176)
+  - Promote DataFrame#shape_str to public (#184)
+  - Introduce Vector#concatenate (#184)
+  - Add #numeric? in refinements of Array (#184)
+  - Add Vector#cumulative_sum_checked and #cumsum (#184)
+  - Add Vector#resolve method (#184)
+  - Add DataFrame#tdra method (#184)
+  - Add #expand as an alias for Vector#propagate (#184)
+  - Add #glimpse as an alias for DataFrame#tdr (#184)
+  - New class SubFrames (#183)
+    - Introduce class SubFrames
+    - Memorize dataframes in SubFrames
+    - Add @frames to memorize sub DataFrames
+    - Accept filters in SubFrames.new
+    - Accept block in SubFrames.new
+    - Add SubFrames.by_filter
+    - Introduce methods creating SubFrames from DataFrame
+    - Introduce SubFrames#each method
+    - Add SubFrames#to_s method
+    - Add SubFrames#concatenate method
+    - Add SubFrames#offset_indices method
+    - SubFrames#aggregate method
+    - Redefine SubFrames#map to return SubFrames
+    - Define SubFrame#map dynamically
+    - Add SubFrames#assign method
+    - Redefine SubFrames#select to return SubFrames
+    - Add SubFrames#reject method
+    - Add SubFrames#filter_map method
+    - Refine DataFrame#indices memorizing @indices
+    - Rename SubFrames#universal_frame as #baseframe
+    - Set Group iteration feature to @api private
+- Refactoring
+  - Generate Vector functions in class method (#177)
+  - Set Constant visibility to private (#179)
+  - Separate test_vector_function (#179)
+  - Relocate methods in DataFrameIndexable (#179)
+  - Rename Array refinements to the same name as Vector (#184)
+- Improve in tests/CI
+  - Tests
+    - Update benchmarks to set 0.3.0 as a reference (#167)
+    - Move test of Vector#logb to proper location (#180)
+  - Cops
+    - Update .rubocop.yml to align with latest cops (#174)
+    - Unify style of MethodCallIndentation as relative to receiver (#184)
+  - CI
+    - Fix setting up Arrow by homebrew in CI (#167)
+    - Fix CI error on homebrew deleting python link (#167)
+    - Set cache-version to get new C extensions in CI (#173)
+      - Thanks to @kou for suggestion.
+- Documentation
+  - Update DataFrame.md about loading csv without headers (#165)
+    - Thanks to kojix2
+  - Update YARD in DataFrame combinable (#168)
+  - Update comment for Ruby 2.7 support in README.md
+  - Update license year
+  - Update README (#172)
+  - Update Vector.md and yardoc in #propagate (#175)
+  - Use customized style sheet for YARD (#179)
+  - Add examples for the doc of #pick and #drop (#179)
+  - Add examples to YARD in DataFrame reshaping methods (#179)
+  - Update documents in DataFrameDisplayable (#179)
+  - Update documents in DataFrameVariableOperation (#179)
+  - Update document for dynamically generated methods (#179)
+  - Unify style in document (#179)
+  - Update documents in DataFrameSelectable (#179)
+  - Update documents of basic Vector methods (#179)
+  - Update document in VectorUpdatable (#179)
+  - Update document of Group (#179)
+  - Update document of DataFrameLoadSave (#180)
+  - Add examples for document of ArrowFunction (#180)
+  - Update document of Vector_unary_aggregation (#180)
+  - Update document of Vector_unary_element_wise (#180)
+  - Update document of Vector_binary_element_wise (#180)
+  - Add documentation to give comparison of dataframes (#169)
+    - Thanks to Benson Muite
+  - Update documents for consistency of method indentation (#189)
+  - Update CHANGELOG (#189)
+  - Update README for 0.4.0 (#189)
+- GitHub site
+- Thanks
+  - kojix2
+  - Benson Muite
 ## [0.3.0] - 2022-12-18
 - Breaking change

data/Gemfile CHANGED Viewed

@@ -7,7 +7,7 @@ gemspec
 group :test do
   gem 'rake'
-  gem 'red-parquet', '~> 10.0.0'
+  gem 'red-parquet', '~> 11.0.0'
   gem 'rover-df', '~> 0.3.0'
   gem 'rubocop'

data/LICENSE CHANGED Viewed

@@ -1,6 +1,6 @@
 The MIT License (MIT)
-Copyright (c) 2022 Hirokazu SUZUKI (heronshoes)
+Copyright (c) 2022-2023 Hirokazu SUZUKI (heronshoes)
 Permission is hereby granted, free of charge, to any person obtaining a copy
 of this software and associated documentation files (the "Software"), to deal

data/README.md CHANGED Viewed

@@ -1,6 +1,6 @@
 # RedAmber
-[![Gem Version](https://badge.fury.io/rb/red_amber.svg)](https://badge.fury.io/rb/red_amber)
+[![Gem Version](https://img.shields.io/gem/v/red_amber?color=brightgreen)](https://rubygems.org/gems/red_amber)
 [![CI](https://github.com/heronshoes/red_amber/actions/workflows/ci.yml/badge.svg)](https://github.com/heronshoes/red_amber/actions/workflows/ci.yml)
 [![Maintainability](https://api.codeclimate.com/v1/badges/b8a745047045d2f49daa/maintainability)](https://codeclimate.com/github/heronshoes/red_amber/maintainability)
 [![Test coverage](https://api.codeclimate.com/v1/badges/b8a745047045d2f49daa/test_coverage)](https://codeclimate.com/github/heronshoes/red_amber/test_coverage)
@@ -10,34 +10,32 @@
 A simple dataframe library for Ruby.
 - Powered by [Red Arrow](https://github.com/apache/arrow/tree/master/ruby/red-arrow)
-[![Gitter Chat](https://badges.gitter.im/red-data-tools/en.svg)](https://gitter.im/red-data-tools/en)
+[![Gitter Chat](https://badges.gitter.im/red-data-tools/en.svg)](https://gitter.im/red-data-tools/en) [![Gem Version](https://img.shields.io/gem/v/red-arrow?color=brightgreen)](https://rubygems.org/gems/red-arrow)
 - Inspired by the dataframe library [Rover-df](https://github.com/ankane/rover)
 ![screenshot from jupyterlab](https://raw.githubusercontent.com/heronshoes/red_amber/main/doc/image/screenshot.png)
 ## Requirements
+### Ruby
 Supported Ruby version is >= 3.0 (since RedAmber 0.3.0).
+- I decided to remove support for Ruby 2.7 without waiting for its EOL. See [Release note for v0.3.0](https://github.com/heronshoes/red_amber/discussions/162) for details.
-- I decided to remove Ruby 2.7 without waiting for EOL because it cannot solve the problem of simultaneous use of Hash and keyword arguments when implementing DataFrame#join.
+### Libraries
 ```ruby
-# Libraries required
-gem 'red-arrow',   '~> 10.0.0' # Requires Apache Arrow (see installation below)
-gem 'red-parquet', '~> 10.0.0' # Optional, if you use IO from/to parquet
+gem 'red-arrow',   '~> 11.0.0' # Requires Apache Arrow (see installation below)
+gem 'red-parquet', '~> 11.0.0' # Optional, if you use IO from/to parquet
 gem 'rover-df',    '~> 0.3.0' # Optional, if you use IO from/to Rover::DataFrame
 ```
 ## Installation
-Install requirements before you install Red Amber.
+Install requirements before you install RedAmber.
-- Apache Arrow (~> 10.0.0)
-- Apache Arrow GLib (~> 10.0.0)
-- Apache Parquet GLib (~> 10.0.0)  # If you use IO from/to parquet
+- Apache Arrow (~> 11.0.0)
+- Apache Arrow GLib (~> 11.0.0)
+- Apache Parquet GLib (~> 11.0.0)  # If you use IO from/to parquet
-  See [Apache Arrow install document](https://arrow.apache.org/install/).
+See [Apache Arrow install document](https://arrow.apache.org/install/).
   - Minimum installation example for the latest Ubuntu:
@@ -58,43 +56,44 @@ Install requirements before you install Red Amber.
       sudo dnf -y install gcc-c++ libarrow-devel libarrow-glib-devel ruby-devel
       ```
-  - On macOS, you can install Apache Arrow C++ library using Homebrew:
+  - On macOS, using Homebrew:
       ```
       brew install apache-arrow
-      ```
-    and GLib (C) package with:
-      ```
       brew install apache-arrow-glib
       ```
 If you prepared Apache Arrow, add these lines to your Gemfile:
 ```ruby
-gem 'red-arrow',   '~> 10.0.0'
+gem 'red-arrow',   '~> 11.0.0'
 gem 'red_amber'
-gem 'red-parquet', '~> 10.0.0' # Optional, if you use IO from/to parquet
+gem 'red-parquet', '~> 11.0.0' # Optional, if you use IO from/to parquet
 gem 'rover-df',    '~> 0.3.0'  # Optional, if you use IO from/to Rover::DataFrame
 gem 'red-datasets-arrow'       # Optional, recommended if you use Red Datasets
 gem 'red-arrow-numo-narray'    # Optional, recommended if you use inputs from Numo::NArray
 ```
-And then execute `bundle install` or install it yourself as `gem install red_amber`.
+And then execute `bundle install` or install them yourself such as `gem install red_amber`.
 ## Docker image and Jupyter Notebook
-[RubyData Docker Stacks](https://github.com/RubyData/docker-stacks) is available as a ready-to-run Docker image containing Jupyter and useful data tools as well as RedAmber (Thanks to @mrkn).
+[RubyData Docker Stacks](https://github.com/RubyData/docker-stacks) is available as a ready-to-run Docker image containing Jupyter and useful data tools as well as RedAmber (Thanks to Kenta Murata).
 Also you can try the contents of this README interactively by [Binder](https://mybinder.org/v2/gh/heronshoes/docker-stacks/RedAmber-binder?filepath=red-amber.ipynb).
 [![Binder](https://mybinder.org/badge_logo.svg)](https://mybinder.org/v2/gh/heronshoes/docker-stacks/RedAmber-binder?filepath=red-amber.ipynb)
+## Comparison of DataFrames
+Comparison of basic features of RedAmber with Python
+[pandas](https://pandas.pydata.org/),
+R [Tidyverse](https://www.tidyverse.org/) and
+Julia [Dataframes](https://dataframes.juliadata.org/stable/) is in [DataFrame_Comparison.md](doc/DataFrame_Comparison.md) (Thanks to Benson Muite).
 ## Data frame in `RedAmber`
 Class `RedAmber::DataFrame` represents a set of data in 2D-shape.
-The entity is a Red Arrow's Table object.
+Its entity is a Red Arrow's Table object.
 ![dataframe model of RedAmber](https://raw.githubusercontent.com/heronshoes/red_amber/main/doc/image/dataframe_model.png)
@@ -116,7 +115,7 @@ then
 require 'datasets-arrow' # to load sample data
 dataset = Datasets::Diamonds.new
-diamonds = DataFrame.new(dataset) # from v0.2.2, should be `dataset.to_arrow` if older.
+diamonds = DataFrame.new(dataset) # before v0.2.3, should be `dataset.to_arrow`
 # =>
 #<RedAmber::DataFrame : 53940 x 10 Vectors, 0x000000000000f668>
@@ -137,7 +136,7 @@ For example, we can compute mean prices per cut for the data larger than 1 carat
 ```ruby
 df = diamonds
-  .slice { carat > 1 }
+  .slice { carat > 1 } # or use #filter instead of #slice
   .group(:cut)
   .mean(:price) # `pick` prior to `group` is not required if `:price` is specified here.
   .sort('-mean(price)')
@@ -175,7 +174,7 @@ df.rename('mean(price)': :mean_price_USD)
 ### Example: starwars dataset
-Next example is `starwars` dataset reading from the downloaded CSV file. Followed by minimum data cleansing.
+Next example is `starwars` dataset reading from the downloaded CSV file. Followed by minimum data cleaning.
 ```ruby
 uri = URI('https://vincentarelbundock.github.io/Rdatasets/csv/dplyr/starwars.csv')
@@ -186,7 +185,7 @@ starwars
   .drop(0) # delete unnecessary index column
   .remove { species == "NA" } # delete unnecessary rows
   .group(:species) { [count(:species), mean(:height, :mass)] }
-  .slice { count > 1 }
+  .slice { count > 1 } # or use #filter instead of slice
 # =>
 #<RedAmber::DataFrame : 8 x 4 Vectors, 0x000000000000f848>
@@ -213,7 +212,7 @@ See [Vector.md](doc/Vector.md) for details.
 ## Jupyter notebook
-[89 Examples of Red Amber](https://github.com/heronshoes/docker-stacks/blob/RedAmber-binder/binder/examples_of_red_amber.ipynb)
+[Examples of Red Amber](https://github.com/heronshoes/docker-stacks/blob/RedAmber-binder/binder/examples_of_red_amber.ipynb)
 ([raw file](https://raw.githubusercontent.com/heronshoes/docker-stacks/RedAmber-binder/binder/examples_of_red_amber.ipynb)) shows more examples in jupyter notebook.
 You can try this notebook on [Binder](https://mybinder.org/v2/gh/heronshoes/docker-stacks/RedAmber-binder?filepath=examples_of_red_amber.ipynb).

data/benchmark/basic.yml CHANGED Viewed

@@ -1,18 +1,18 @@
 loop_count: 3
 contexts:
-  - name: HEAD
-    prelude: |
-      $LOAD_PATH.unshift(File.expand_path('lib'))
-  - name: 0.2.3
+  - name: 0.1.5
     gems:
-      red_amber: 0.2.3
+      red_amber: 0.1.5
   - name: 0.2.0
     gems:
       red_amber: 0.2.0
-  - name: 0.1.5
+  - name: 0.3.0
     gems:
-      red_amber: 0.1.5
+      red_amber: 0.3.0
+  - name: HEAD
+    prelude: |
+      $LOAD_PATH.unshift(File.expand_path('lib'))
 prelude: |
   require 'red_amber'

data/benchmark/combine.yml CHANGED Viewed

@@ -1,12 +1,12 @@
 loop_count: 3
 contexts:
+  - name: 0.3.0
+    gems:
+      red_amber: 0.3.0
   - name: HEAD
     prelude: |
       $LOAD_PATH.unshift(File.expand_path('lib'))
-  - name: 0.2.3
-    gems:
-      red_amber: 0.2.3
 prelude: |
   require 'red_amber'

data/benchmark/dataframe.yml CHANGED Viewed

@@ -1,15 +1,15 @@
 loop_count: 3
 contexts:
-  - name: HEAD
-    prelude: |
-      $LOAD_PATH.unshift(File.expand_path('lib'))
-  - name: 0.2.3
-    gems:
-      red_amber: 0.2.3
   - name: 0.2.0
     gems:
       red_amber: 0.2.0
+  - name: 0.3.0
+    gems:
+      red_amber: 0.3.0
+  - name: HEAD
+    prelude: |
+      $LOAD_PATH.unshift(File.expand_path('lib'))
 prelude: |
   require 'red_amber'
@@ -19,8 +19,14 @@ prelude: |
   starwars = RedAmber::DataFrame.new(Datasets::Rdataset.new('dplyr', 'starwars').to_arrow)
-  uri = URI("https://raw.githubusercontent.com/heronshoes/red_amber/master/test/entity/import_cars.tsv")
-  import_cars = RedAmber::DataFrame.load(uri)
+  import_cars = RedAmber::DataFrame.load(Arrow::Buffer.new(<<~TSV), format: :tsv)
+    Year	Audi	BMW	BMW_MINI	Mercedes-Benz	VW
+    2017	28336	52527	25427	68221	49040
+    2018	26473	50982	25984	67554	51961
+    2019	24222	46814	23813	66553	46794
+    2020	22304	35712	20196	57041	36576
+    2021	22535	35905	18211	51722	35215
+  TSV
   ds = Datasets::Rdataset.new('openintro', 'simpsons_paradox_covid')
   simpsons_paradox_covid = RedAmber::DataFrame.new(ds.to_arrow)
@@ -43,7 +49,7 @@ benchmark:
       .group(:species) { [count(:species), mean(:height, :mass)] }
       .slice { v(:count) > 1 }
-  'D03: Inport cars test': |
+  'D03: Import cars test': |
     import_cars
       .to_long(:Year, name: :Manufacturer, value: :Num_of_imported)
       .to_wide(name: :Manufacturer, value: :Num_of_imported)

data/benchmark/group.yml CHANGED Viewed

@@ -1,15 +1,15 @@
 loop_count: 3
 contexts:
-  - name: HEAD
-    prelude: |
-      $LOAD_PATH.unshift(File.expand_path('lib'))
-  - name: 0.2.3
-    gems:
-      red_amber: 0.2.3
   - name: 0.2.2
     gems:
       red_amber: 0.2.2
+  - name: 0.3.0
+    gems:
+      red_amber: 0.3.0
+  - name: HEAD
+    prelude: |
+      $LOAD_PATH.unshift(File.expand_path('lib'))
 prelude: |
   require 'red_amber'

data/benchmark/reshape.yml CHANGED Viewed

@@ -1,15 +1,15 @@
 loop_count: 3
 contexts:
-  - name: HEAD
-    prelude: |
-      $LOAD_PATH.unshift(File.expand_path('lib'))
-  - name: 0.2.3
-    gems:
-      red_amber: 0.2.3
   - name: 0.2.2
     gems:
       red_amber: 0.2.2
+  - name: 0.3.0
+    gems:
+      red_amber: 0.3.0
+  - name: HEAD
+    prelude: |
+      $LOAD_PATH.unshift(File.expand_path('lib'))
 prelude: |
   require 'red_amber'

data/benchmark/vector.yml CHANGED Viewed

@@ -1,12 +1,15 @@
 loop_count: 10
 contexts:
-  - name: HEAD
-    prelude: |
-      $LOAD_PATH.unshift(File.expand_path('lib'))
   - name: 0.2.0
     gems:
       red_amber: 0.2.0
+  - name: 0.3.0
+    gems:
+      red_amber: 0.3.0
+  - name: HEAD
+    prelude: |
+      $LOAD_PATH.unshift(File.expand_path('lib'))
 prelude: |
   require 'red_amber'