daru 0.1.4.1 → 0.1.5
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/.rubocop.yml +3 -0
- data/.travis.yml +3 -0
- data/CONTRIBUTING.md +27 -3
- data/Guardfile +7 -0
- data/History.md +39 -1
- data/README.md +1 -1
- data/daru.gemspec +9 -2
- data/lib/daru.rb +4 -1
- data/lib/daru/accessors/gsl_wrapper.rb +93 -91
- data/lib/daru/accessors/nmatrix_wrapper.rb +109 -107
- data/lib/daru/category.rb +22 -15
- data/lib/daru/core/group_by.rb +13 -2
- data/lib/daru/core/merge.rb +37 -31
- data/lib/daru/core/query.rb +10 -2
- data/lib/daru/dataframe.rb +95 -34
- data/lib/daru/date_time/index.rb +15 -16
- data/lib/daru/date_time/offsets.rb +14 -11
- data/lib/daru/formatters/table.rb +2 -2
- data/lib/daru/index/categorical_index.rb +201 -0
- data/lib/daru/index/index.rb +289 -0
- data/lib/daru/index/multi_index.rb +266 -0
- data/lib/daru/maths/statistics/vector.rb +13 -9
- data/lib/daru/monkeys.rb +0 -7
- data/lib/daru/plotting/gruff/category.rb +1 -0
- data/lib/daru/plotting/gruff/dataframe.rb +3 -3
- data/lib/daru/plotting/nyaplot/dataframe.rb +1 -1
- data/lib/daru/vector.rb +36 -21
- data/lib/daru/version.rb +1 -1
- data/spec/accessors/array_wrapper_spec.rb +3 -0
- data/spec/accessors/{wrappers_spec.rb → gsl_wrapper_spec.rb} +0 -35
- data/spec/accessors/nmatrix_wrapper_spec.rb +32 -0
- data/spec/{categorical_spec.rb → category_spec.rb} +3 -0
- data/spec/core/group_by_spec.rb +17 -1
- data/spec/core/merge_spec.rb +38 -1
- data/spec/core/query_spec.rb +5 -0
- data/spec/dataframe_spec.rb +230 -57
- data/spec/date_time/offsets_spec.rb +84 -3
- data/spec/formatters/table_formatter_spec.rb +9 -0
- data/spec/index/categorical_index_spec.rb +2 -0
- data/spec/index/index_spec.rb +17 -2
- data/spec/{math → maths}/arithmetic/dataframe_spec.rb +0 -0
- data/spec/{math → maths}/arithmetic/vector_spec.rb +0 -0
- data/spec/{math → maths}/statistics/dataframe_spec.rb +1 -1
- data/spec/{math → maths}/statistics/vector_spec.rb +7 -12
- data/spec/plotting/gruff/category_spec.rb +44 -0
- data/spec/plotting/gruff/dataframe_spec.rb +84 -0
- data/spec/plotting/gruff/vector_spec.rb +70 -0
- data/spec/plotting/nyaplot/category_spec.rb +51 -0
- data/spec/plotting/{dataframe_spec.rb → nyaplot/dataframe_spec.rb} +0 -83
- data/spec/plotting/nyaplot/vector_spec.rb +66 -0
- data/spec/spec_helper.rb +3 -2
- data/spec/vector_spec.rb +68 -1
- metadata +53 -24
- data/lib/daru/index.rb +0 -761
- data/spec/plotting/vector_spec.rb +0 -230
@@ -301,86 +301,3 @@ describe Daru::DataFrame, 'category plotting' do
|
|
301
301
|
it { expect { df.plot(type: :box, categorized: {by: :c, method: :color}) }.to raise_error ArgumentError }
|
302
302
|
end
|
303
303
|
end
|
304
|
-
|
305
|
-
describe Daru::DataFrame, 'plotting dataframe using gruff' do
|
306
|
-
before { Daru.plotting_library = :gruff }
|
307
|
-
let(:df) do
|
308
|
-
Daru::DataFrame.new({
|
309
|
-
a: [1, 3, 5, 2, 5, 0],
|
310
|
-
b: [1, 5, 2, 5, 1, 0],
|
311
|
-
c: [1, 6, 7, 2, 6, 0]
|
312
|
-
}, index: 'a'..'f')
|
313
|
-
end
|
314
|
-
|
315
|
-
context 'bar' do
|
316
|
-
let(:plot) { instance_double 'Gruff::Bar' }
|
317
|
-
before { allow(Gruff::Bar).to receive(:new).and_return(plot) }
|
318
|
-
it 'plots bar graph' do
|
319
|
-
expect(plot).to receive :labels=
|
320
|
-
expect(plot).to receive(:data).exactly(3).times
|
321
|
-
df.plot type: :bar
|
322
|
-
end
|
323
|
-
|
324
|
-
it 'plots bar graph with block' do
|
325
|
-
expect(plot).to receive :labels=
|
326
|
-
expect(plot).to receive(:data).exactly(3).times
|
327
|
-
expect(plot).to receive :title=
|
328
|
-
df.plot(type: :bar) { |p| p.title = 'hello' }
|
329
|
-
end
|
330
|
-
|
331
|
-
it 'plots with specified columns' do
|
332
|
-
expect(plot).to receive :labels=
|
333
|
-
expect(plot).to receive(:data).exactly(2).times
|
334
|
-
df.plot type: :bar, y: [:a, :b]
|
335
|
-
end
|
336
|
-
end
|
337
|
-
|
338
|
-
context 'line' do
|
339
|
-
let(:plot) { instance_double 'Gruff::Line' }
|
340
|
-
before { allow(Gruff::Line).to receive(:new).and_return(plot) }
|
341
|
-
it 'plots line graph' do
|
342
|
-
expect(plot).to receive :labels=
|
343
|
-
expect(plot).to receive(:data).exactly(3).times
|
344
|
-
df.plot type: :line
|
345
|
-
end
|
346
|
-
end
|
347
|
-
|
348
|
-
context 'scatter' do
|
349
|
-
let(:plot) { instance_double 'Gruff::Scatter' }
|
350
|
-
before { allow(Gruff::Scatter).to receive(:new).and_return(plot) }
|
351
|
-
it 'plots scatter graph' do
|
352
|
-
expect(plot).to receive(:data).exactly(3).times
|
353
|
-
df.plot type: :scatter
|
354
|
-
end
|
355
|
-
|
356
|
-
it 'plots with specified columns' do
|
357
|
-
expect(plot).to receive(:data).exactly(1).times
|
358
|
-
df.plot type: :scatter, x: :c, y: :a
|
359
|
-
end
|
360
|
-
end
|
361
|
-
|
362
|
-
context 'invalid type' do
|
363
|
-
it { expect { df.plot type: :lol }.to raise_error ArgumentError }
|
364
|
-
end
|
365
|
-
end
|
366
|
-
|
367
|
-
describe Daru::DataFrame, 'dataframe category plotting with gruff' do
|
368
|
-
before { Daru.plotting_library = :gruff }
|
369
|
-
let(:df) do
|
370
|
-
Daru::DataFrame.new({
|
371
|
-
a: [1, 3, 5, 2, 5, 0],
|
372
|
-
b: [1, 5, 2, 5, 1, 0],
|
373
|
-
c: [:a, :b, :a, :a, :b, :a]
|
374
|
-
}, index: 'a'..'f')
|
375
|
-
end
|
376
|
-
before { df.to_category :c }
|
377
|
-
|
378
|
-
context 'scatter' do
|
379
|
-
let(:plot) { instance_double 'Gruff::Scatter' }
|
380
|
-
before { allow(Gruff::Scatter).to receive(:new).and_return(plot) }
|
381
|
-
it 'plots scatter plot categorized by category vector' do
|
382
|
-
expect(plot).to receive(:data).exactly(2).times
|
383
|
-
df.plot type: :scatter, x: :a, y: :b, categorized: { by: :c }
|
384
|
-
end
|
385
|
-
end
|
386
|
-
end
|
@@ -0,0 +1,66 @@
|
|
1
|
+
require 'spec_helper.rb'
|
2
|
+
|
3
|
+
describe Daru::Vector, 'plotting' do
|
4
|
+
let(:vector) { Daru::Vector.new([11, 22, 33], index: [:a, :b, :c]) }
|
5
|
+
let(:plot) { instance_double('Nyaplot::Plot') }
|
6
|
+
let(:diagram) { instance_double('Nyaplot::Diagram') }
|
7
|
+
|
8
|
+
before do
|
9
|
+
Daru.plotting_library = :nyaplot
|
10
|
+
allow(Nyaplot::Plot).to receive(:new).and_return(plot)
|
11
|
+
end
|
12
|
+
|
13
|
+
it 'plots the vector' do
|
14
|
+
expect(plot).to receive(:add).with(:box, [11, 22, 33]).ordered
|
15
|
+
expect(plot).to receive(:show).ordered
|
16
|
+
|
17
|
+
vector.plot(type: :box)
|
18
|
+
end
|
19
|
+
|
20
|
+
context 'scatter' do
|
21
|
+
it 'is default type' do
|
22
|
+
expect(plot).to receive(:add).with(:scatter, instance_of(Array), instance_of(Array)).ordered
|
23
|
+
expect(plot).to receive(:show).ordered
|
24
|
+
|
25
|
+
vector.plot
|
26
|
+
end
|
27
|
+
|
28
|
+
it 'sets x_axis to 0...size' do
|
29
|
+
expect(plot).to receive(:add).with(:scatter, [0, 1, 2], [11, 22, 33]).ordered
|
30
|
+
expect(plot).to receive(:show).ordered
|
31
|
+
|
32
|
+
vector.plot(type: :scatter)
|
33
|
+
end
|
34
|
+
end
|
35
|
+
|
36
|
+
[:box, :histogram].each do |type|
|
37
|
+
context type.to_s do
|
38
|
+
it 'does not set x axis' do
|
39
|
+
expect(plot).to receive(:add).with(type, [11, 22, 33]).ordered
|
40
|
+
expect(plot).to receive(:show).ordered
|
41
|
+
|
42
|
+
vector.plot(type: type)
|
43
|
+
end
|
44
|
+
end
|
45
|
+
end
|
46
|
+
|
47
|
+
[:bar, :line].each do |type| # FIXME: what other types 2D plot could have?..
|
48
|
+
context type.to_s do
|
49
|
+
it 'sets x axis to index' do
|
50
|
+
expect(plot).to receive(:add).with(type, [:a, :b, :c], [11, 22, 33]).ordered
|
51
|
+
expect(plot).to receive(:show).ordered
|
52
|
+
|
53
|
+
vector.plot(type: type)
|
54
|
+
end
|
55
|
+
end
|
56
|
+
end
|
57
|
+
|
58
|
+
context 'with block provided' do
|
59
|
+
it 'yields plot and diagram' do
|
60
|
+
expect(plot).to receive(:add).with(:box, [11, 22, 33]).ordered.and_return(diagram)
|
61
|
+
expect(plot).to receive(:show).ordered
|
62
|
+
|
63
|
+
expect { |b| vector.plot(type: :box, &b) }.to yield_with_args(plot, diagram)
|
64
|
+
end
|
65
|
+
end
|
66
|
+
end
|
data/spec/spec_helper.rb
CHANGED
@@ -26,8 +26,9 @@ RSpec::Expectations.configuration.warn_about_potential_false_positives = false
|
|
26
26
|
|
27
27
|
require 'simplecov'
|
28
28
|
SimpleCov.start do
|
29
|
-
|
30
|
-
|
29
|
+
add_filter 'vendor'
|
30
|
+
add_filter 'spec'
|
31
|
+
minimum_coverage_by_file 95
|
31
32
|
end
|
32
33
|
|
33
34
|
$LOAD_PATH.unshift(File.join(File.dirname(__FILE__), '..', 'lib'))
|
data/spec/vector_spec.rb
CHANGED
@@ -1,3 +1,5 @@
|
|
1
|
+
require 'spec_helper.rb'
|
2
|
+
|
1
3
|
describe Daru::Vector do
|
2
4
|
ALL_DTYPES.each do |dtype|
|
3
5
|
describe dtype.to_s do
|
@@ -84,6 +86,30 @@ describe Daru::Vector do
|
|
84
86
|
|
85
87
|
end
|
86
88
|
|
89
|
+
context "#reorder!" do
|
90
|
+
let(:vector_with_dtype) do
|
91
|
+
Daru::Vector.new(
|
92
|
+
[1, 2, 3, 4],
|
93
|
+
index: [:a, :b, :c, :d],
|
94
|
+
dtype: dtype)
|
95
|
+
end
|
96
|
+
let(:arranged_vector) do
|
97
|
+
Daru::Vector.new([4,3,2,1], index: [:d, :c, :b, :a], dtype: dtype)
|
98
|
+
end
|
99
|
+
|
100
|
+
before do
|
101
|
+
vector_with_dtype.reorder! [3, 2, 1, 0]
|
102
|
+
end
|
103
|
+
|
104
|
+
it "rearranges with passed order" do
|
105
|
+
expect(vector_with_dtype).to eq arranged_vector
|
106
|
+
end
|
107
|
+
|
108
|
+
it "doesn't change dtype" do
|
109
|
+
expect(vector_with_dtype.data.class).to eq arranged_vector.data.class
|
110
|
+
end
|
111
|
+
end
|
112
|
+
|
87
113
|
context ".new_with_size" do
|
88
114
|
it "creates new vector from only size" do
|
89
115
|
v1 = Daru::Vector.new 10.times.map { nil }, dtype: dtype
|
@@ -1177,10 +1203,25 @@ describe Daru::Vector do
|
|
1177
1203
|
expect(@vector['2012-1-1']).to eq(1)
|
1178
1204
|
end
|
1179
1205
|
|
1206
|
+
it "accepts an array as index" do
|
1207
|
+
@vector.index = [5,4,3,2,1]
|
1208
|
+
|
1209
|
+
expect(@vector.index.class).to eq(Daru::Index)
|
1210
|
+
expect(@vector[5]).to eq(1)
|
1211
|
+
end
|
1212
|
+
|
1213
|
+
it "accepts an range as index" do
|
1214
|
+
@vector.index = 'a'..'e'
|
1215
|
+
|
1216
|
+
expect(@vector.index.class).to eq(Daru::Index)
|
1217
|
+
expect(@vector['a']).to eq(1)
|
1218
|
+
end
|
1219
|
+
|
1180
1220
|
it "raises error for index size != vector size" do
|
1181
1221
|
expect {
|
1182
1222
|
@vector.index = Daru::Index.new([4,2,6])
|
1183
|
-
}.to raise_error
|
1223
|
+
}.to raise_error(ArgumentError, 'Size of supplied index 3 '\
|
1224
|
+
'does not match size of Vector')
|
1184
1225
|
end
|
1185
1226
|
end
|
1186
1227
|
|
@@ -1882,6 +1923,32 @@ describe Daru::Vector do
|
|
1882
1923
|
expect(lag2[lag2.size - 2]).to be_within(0.001).of(16.56)
|
1883
1924
|
end
|
1884
1925
|
end
|
1926
|
+
|
1927
|
+
context "#group_by" do
|
1928
|
+
let(:dv) { Daru::Vector.new [:a, :b, :a, :b, :c] }
|
1929
|
+
|
1930
|
+
context 'vector not specified' do
|
1931
|
+
subject { dv.group_by }
|
1932
|
+
|
1933
|
+
it { is_expected.to be_a Daru::Core::GroupBy }
|
1934
|
+
its(:'groups.size') { is_expected.to eq 3 }
|
1935
|
+
its(:groups) { is_expected.to eq({[:a]=>[0, 2], [:b]=>[1, 3], [:c]=>[4]}) }
|
1936
|
+
end
|
1937
|
+
|
1938
|
+
context 'vector name specified' do
|
1939
|
+
before { dv.name = :hello }
|
1940
|
+
subject { dv.group_by :hello }
|
1941
|
+
|
1942
|
+
it { is_expected.to be_a Daru::Core::GroupBy }
|
1943
|
+
its(:'groups.size') { is_expected.to eq 3 }
|
1944
|
+
its(:groups) { is_expected.to eq({[:a]=>[0, 2], [:b]=>[1, 3], [:c]=>[4]}) }
|
1945
|
+
end
|
1946
|
+
|
1947
|
+
context 'vector name invalid' do
|
1948
|
+
before { dv.name = :hello }
|
1949
|
+
it { expect { dv.group_by :abc }.to raise_error }
|
1950
|
+
end
|
1951
|
+
end
|
1885
1952
|
|
1886
1953
|
context '#method_missing' do
|
1887
1954
|
context 'getting' do
|
metadata
CHANGED
@@ -1,14 +1,14 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: daru
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 0.1.
|
4
|
+
version: 0.1.5
|
5
5
|
platform: ruby
|
6
6
|
authors:
|
7
7
|
- Sameer Deshmukh
|
8
8
|
autorequire:
|
9
9
|
bindir: bin
|
10
10
|
cert_chain: []
|
11
|
-
date:
|
11
|
+
date: 2017-01-31 00:00:00.000000000 Z
|
12
12
|
dependencies:
|
13
13
|
- !ruby/object:Gem::Dependency
|
14
14
|
name: backports
|
@@ -207,19 +207,19 @@ dependencies:
|
|
207
207
|
- !ruby/object:Gem::Version
|
208
208
|
version: '0.7'
|
209
209
|
- !ruby/object:Gem::Dependency
|
210
|
-
name:
|
210
|
+
name: gsl
|
211
211
|
requirement: !ruby/object:Gem::Requirement
|
212
212
|
requirements:
|
213
213
|
- - "~>"
|
214
214
|
- !ruby/object:Gem::Version
|
215
|
-
version:
|
215
|
+
version: 2.1.0.2
|
216
216
|
type: :development
|
217
217
|
prerelease: false
|
218
218
|
version_requirements: !ruby/object:Gem::Requirement
|
219
219
|
requirements:
|
220
220
|
- - "~>"
|
221
221
|
- !ruby/object:Gem::Version
|
222
|
-
version:
|
222
|
+
version: 2.1.0.2
|
223
223
|
- !ruby/object:Gem::Dependency
|
224
224
|
name: dbd-sqlite3
|
225
225
|
requirement: !ruby/object:Gem::Requirement
|
@@ -318,6 +318,20 @@ dependencies:
|
|
318
318
|
- - ">="
|
319
319
|
- !ruby/object:Gem::Version
|
320
320
|
version: '0'
|
321
|
+
- !ruby/object:Gem::Dependency
|
322
|
+
name: gruff
|
323
|
+
requirement: !ruby/object:Gem::Requirement
|
324
|
+
requirements:
|
325
|
+
- - ">="
|
326
|
+
- !ruby/object:Gem::Version
|
327
|
+
version: '0'
|
328
|
+
type: :development
|
329
|
+
prerelease: false
|
330
|
+
version_requirements: !ruby/object:Gem::Requirement
|
331
|
+
requirements:
|
332
|
+
- - ">="
|
333
|
+
- !ruby/object:Gem::Version
|
334
|
+
version: '0'
|
321
335
|
- !ruby/object:Gem::Dependency
|
322
336
|
name: nokogiri
|
323
337
|
requirement: !ruby/object:Gem::Requirement
|
@@ -333,7 +347,7 @@ dependencies:
|
|
333
347
|
- !ruby/object:Gem::Version
|
334
348
|
version: '0'
|
335
349
|
- !ruby/object:Gem::Dependency
|
336
|
-
name:
|
350
|
+
name: guard-rspec
|
337
351
|
requirement: !ruby/object:Gem::Requirement
|
338
352
|
requirements:
|
339
353
|
- - ">="
|
@@ -366,6 +380,7 @@ files:
|
|
366
380
|
- ".travis.yml"
|
367
381
|
- CONTRIBUTING.md
|
368
382
|
- Gemfile
|
383
|
+
- Guardfile
|
369
384
|
- History.md
|
370
385
|
- LICENSE
|
371
386
|
- README.md
|
@@ -415,7 +430,9 @@ files:
|
|
415
430
|
- lib/daru/extensions/rserve.rb
|
416
431
|
- lib/daru/formatters/table.rb
|
417
432
|
- lib/daru/helpers/array.rb
|
418
|
-
- lib/daru/index.rb
|
433
|
+
- lib/daru/index/categorical_index.rb
|
434
|
+
- lib/daru/index/index.rb
|
435
|
+
- lib/daru/index/multi_index.rb
|
419
436
|
- lib/daru/io/io.rb
|
420
437
|
- lib/daru/io/sql_data_source.rb
|
421
438
|
- lib/daru/iruby/helpers.rb
|
@@ -445,8 +462,10 @@ files:
|
|
445
462
|
- profile/joining.rb
|
446
463
|
- profile/sorting.rb
|
447
464
|
- profile/vector_each_with_index.rb
|
448
|
-
- spec/accessors/
|
449
|
-
- spec/
|
465
|
+
- spec/accessors/array_wrapper_spec.rb
|
466
|
+
- spec/accessors/gsl_wrapper_spec.rb
|
467
|
+
- spec/accessors/nmatrix_wrapper_spec.rb
|
468
|
+
- spec/category_spec.rb
|
450
469
|
- spec/core/group_by_spec.rb
|
451
470
|
- spec/core/merge_spec.rb
|
452
471
|
- spec/core/query_spec.rb
|
@@ -477,13 +496,17 @@ files:
|
|
477
496
|
- spec/iruby/helpers_spec.rb
|
478
497
|
- spec/iruby/multi_index_spec.rb
|
479
498
|
- spec/iruby/vector_spec.rb
|
480
|
-
- spec/
|
481
|
-
- spec/
|
482
|
-
- spec/
|
483
|
-
- spec/
|
499
|
+
- spec/maths/arithmetic/dataframe_spec.rb
|
500
|
+
- spec/maths/arithmetic/vector_spec.rb
|
501
|
+
- spec/maths/statistics/dataframe_spec.rb
|
502
|
+
- spec/maths/statistics/vector_spec.rb
|
484
503
|
- spec/monkeys_spec.rb
|
485
|
-
- spec/plotting/
|
486
|
-
- spec/plotting/
|
504
|
+
- spec/plotting/gruff/category_spec.rb
|
505
|
+
- spec/plotting/gruff/dataframe_spec.rb
|
506
|
+
- spec/plotting/gruff/vector_spec.rb
|
507
|
+
- spec/plotting/nyaplot/category_spec.rb
|
508
|
+
- spec/plotting/nyaplot/dataframe_spec.rb
|
509
|
+
- spec/plotting/nyaplot/vector_spec.rb
|
487
510
|
- spec/shared/vector_display_spec.rb
|
488
511
|
- spec/spec_helper.rb
|
489
512
|
- spec/support/database_helper.rb
|
@@ -527,13 +550,15 @@ required_rubygems_version: !ruby/object:Gem::Requirement
|
|
527
550
|
version: '0'
|
528
551
|
requirements: []
|
529
552
|
rubyforge_project:
|
530
|
-
rubygems_version: 2.
|
553
|
+
rubygems_version: 2.6.8
|
531
554
|
signing_key:
|
532
555
|
specification_version: 4
|
533
556
|
summary: Data Analysis in RUby
|
534
557
|
test_files:
|
535
|
-
- spec/accessors/
|
536
|
-
- spec/
|
558
|
+
- spec/accessors/array_wrapper_spec.rb
|
559
|
+
- spec/accessors/gsl_wrapper_spec.rb
|
560
|
+
- spec/accessors/nmatrix_wrapper_spec.rb
|
561
|
+
- spec/category_spec.rb
|
537
562
|
- spec/core/group_by_spec.rb
|
538
563
|
- spec/core/merge_spec.rb
|
539
564
|
- spec/core/query_spec.rb
|
@@ -564,13 +589,17 @@ test_files:
|
|
564
589
|
- spec/iruby/helpers_spec.rb
|
565
590
|
- spec/iruby/multi_index_spec.rb
|
566
591
|
- spec/iruby/vector_spec.rb
|
567
|
-
- spec/
|
568
|
-
- spec/
|
569
|
-
- spec/
|
570
|
-
- spec/
|
592
|
+
- spec/maths/arithmetic/dataframe_spec.rb
|
593
|
+
- spec/maths/arithmetic/vector_spec.rb
|
594
|
+
- spec/maths/statistics/dataframe_spec.rb
|
595
|
+
- spec/maths/statistics/vector_spec.rb
|
571
596
|
- spec/monkeys_spec.rb
|
572
|
-
- spec/plotting/
|
573
|
-
- spec/plotting/
|
597
|
+
- spec/plotting/gruff/category_spec.rb
|
598
|
+
- spec/plotting/gruff/dataframe_spec.rb
|
599
|
+
- spec/plotting/gruff/vector_spec.rb
|
600
|
+
- spec/plotting/nyaplot/category_spec.rb
|
601
|
+
- spec/plotting/nyaplot/dataframe_spec.rb
|
602
|
+
- spec/plotting/nyaplot/vector_spec.rb
|
574
603
|
- spec/shared/vector_display_spec.rb
|
575
604
|
- spec/spec_helper.rb
|
576
605
|
- spec/support/database_helper.rb
|
data/lib/daru/index.rb
DELETED
@@ -1,761 +0,0 @@
|
|
1
|
-
module Daru
|
2
|
-
class Index
|
3
|
-
include Enumerable
|
4
|
-
# It so happens that over riding the .new method in a super class also
|
5
|
-
# tampers with the default .new method for class that inherit from the
|
6
|
-
# super class (Index in this case). Thus we first alias the original
|
7
|
-
# new method (from Object) to __new__ when the Index class is evaluated,
|
8
|
-
# and then we use an inherited hook such that the old new method (from
|
9
|
-
# Object) is once again the default .new for the subclass.
|
10
|
-
# Refer http://blog.sidu.in/2007/12/rubys-new-as-factory.html
|
11
|
-
class << self
|
12
|
-
alias :__new__ :new
|
13
|
-
|
14
|
-
def inherited subclass
|
15
|
-
class << subclass
|
16
|
-
alias :new :__new__
|
17
|
-
end
|
18
|
-
end
|
19
|
-
end
|
20
|
-
|
21
|
-
# We over-ride the .new method so that any sort of Index can be generated
|
22
|
-
# from Daru::Index based on the types of arguments supplied.
|
23
|
-
def self.new *args, &block
|
24
|
-
# FIXME: I'm not sure this clever trick really deserves our attention.
|
25
|
-
# Most of common ruby libraries just avoid it in favor of usual
|
26
|
-
# factor method, like `Index.create`. When `Index.new(...).class != Index`
|
27
|
-
# it just leads to confusion and surprises. - zverok, 2016-05-18
|
28
|
-
source = args.first
|
29
|
-
|
30
|
-
MultiIndex.try_from_tuples(source) ||
|
31
|
-
DateTimeIndex.try_create(source) ||
|
32
|
-
allocate.tap { |i| i.send :initialize, *args, &block }
|
33
|
-
end
|
34
|
-
|
35
|
-
def self.coerce maybe_index
|
36
|
-
maybe_index.is_a?(Index) ? maybe_index : Daru::Index.new(maybe_index)
|
37
|
-
end
|
38
|
-
|
39
|
-
def each(&block)
|
40
|
-
return to_enum(:each) unless block_given?
|
41
|
-
|
42
|
-
@relation_hash.each_key(&block)
|
43
|
-
self
|
44
|
-
end
|
45
|
-
|
46
|
-
def map(&block)
|
47
|
-
to_a.map(&block)
|
48
|
-
end
|
49
|
-
|
50
|
-
attr_reader :relation_hash, :size
|
51
|
-
|
52
|
-
def initialize index
|
53
|
-
index =
|
54
|
-
case index
|
55
|
-
when nil
|
56
|
-
[]
|
57
|
-
when Integer
|
58
|
-
index.times.to_a
|
59
|
-
when Enumerable
|
60
|
-
index.to_a
|
61
|
-
else
|
62
|
-
raise ArgumentError,
|
63
|
-
"Cannot create index from #{index.class} #{index.inspect}"
|
64
|
-
end
|
65
|
-
|
66
|
-
@relation_hash = index.each_with_index.to_h.freeze
|
67
|
-
@keys = @relation_hash.keys
|
68
|
-
@size = @relation_hash.size
|
69
|
-
end
|
70
|
-
|
71
|
-
def ==(other)
|
72
|
-
return false if self.class != other.class || other.size != @size
|
73
|
-
|
74
|
-
@relation_hash.keys == other.to_a &&
|
75
|
-
@relation_hash.values == other.relation_hash.values
|
76
|
-
end
|
77
|
-
|
78
|
-
def [](key, *rest)
|
79
|
-
case
|
80
|
-
when key.is_a?(Range)
|
81
|
-
by_range key
|
82
|
-
when !rest.empty?
|
83
|
-
by_multi_key key, *rest
|
84
|
-
else
|
85
|
-
by_single_key key
|
86
|
-
end
|
87
|
-
end
|
88
|
-
|
89
|
-
# Returns true if all arguments are either a valid category or position
|
90
|
-
# @param [Array<object>] *indexes categories or positions
|
91
|
-
# @return [true, false]
|
92
|
-
# @example
|
93
|
-
# idx.valid? :a, 2
|
94
|
-
# # => true
|
95
|
-
# idx.valid? 3
|
96
|
-
# # => false
|
97
|
-
def valid? *indexes
|
98
|
-
indexes.all? { |i| to_a.include?(i) || (i.is_a?(Numeric) && i < size) }
|
99
|
-
end
|
100
|
-
|
101
|
-
# Returns positions given indexes or positions
|
102
|
-
# @note If the arugent is both a valid index and a valid position,
|
103
|
-
# it will treated as valid index
|
104
|
-
# @param [Array<object>] *indexes indexes or positions
|
105
|
-
# @example
|
106
|
-
# x = Daru::Index.new [:a, :b, :c]
|
107
|
-
# x.pos :a, 1
|
108
|
-
# # => [0, 1]
|
109
|
-
def pos *indexes
|
110
|
-
indexes = preprocess_range(indexes.first) if indexes.first.is_a? Range
|
111
|
-
|
112
|
-
if indexes.size == 1
|
113
|
-
self[indexes.first]
|
114
|
-
else
|
115
|
-
indexes.map { |index| by_single_key index }
|
116
|
-
end
|
117
|
-
end
|
118
|
-
|
119
|
-
def subset *indexes
|
120
|
-
if indexes.first.is_a? Range
|
121
|
-
slice indexes.first.begin, indexes.first.end
|
122
|
-
elsif include? indexes.first
|
123
|
-
# Assume 'indexes' contain indexes not positions
|
124
|
-
Daru::Index.new indexes
|
125
|
-
else
|
126
|
-
# Assume 'indexes' contain positions not indexes
|
127
|
-
Daru::Index.new indexes.map { |k| key k }
|
128
|
-
end
|
129
|
-
end
|
130
|
-
|
131
|
-
# Takes positional values and returns subset of the self
|
132
|
-
# capturing the indexes at mentioned positions
|
133
|
-
# @param [Array<Integer>] positional values
|
134
|
-
# @return [object] index object
|
135
|
-
# @example
|
136
|
-
# idx = Daru::Index.new [:a, :b, :c]
|
137
|
-
# idx.at 0, 1
|
138
|
-
# # => #<Daru::Index(2): {a, b}>
|
139
|
-
def at *positions
|
140
|
-
positions = preprocess_positions(*positions)
|
141
|
-
validate_positions(*positions)
|
142
|
-
if positions.is_a? Integer
|
143
|
-
key(positions)
|
144
|
-
else
|
145
|
-
self.class.new positions.map(&method(:key))
|
146
|
-
end
|
147
|
-
end
|
148
|
-
|
149
|
-
def inspect threshold=20
|
150
|
-
if size <= threshold
|
151
|
-
"#<#{self.class}(#{size}): {#{to_a.join(', ')}}>"
|
152
|
-
else
|
153
|
-
"#<#{self.class}(#{size}): {#{to_a.first(threshold).join(', ')} ... #{to_a.last}}>"
|
154
|
-
end
|
155
|
-
end
|
156
|
-
|
157
|
-
def slice *args
|
158
|
-
start = args[0]
|
159
|
-
en = args[1]
|
160
|
-
|
161
|
-
if start.is_a?(Integer) && en.is_a?(Integer)
|
162
|
-
Index.new @keys[start..en]
|
163
|
-
else
|
164
|
-
start_idx = @relation_hash[start]
|
165
|
-
en_idx = @relation_hash[en]
|
166
|
-
|
167
|
-
Index.new @keys[start_idx..en_idx]
|
168
|
-
end
|
169
|
-
end
|
170
|
-
|
171
|
-
# Produce new index from the set union of two indexes.
|
172
|
-
def |(other)
|
173
|
-
Index.new(to_a | other.to_a)
|
174
|
-
end
|
175
|
-
|
176
|
-
# Produce a new index from the set intersection of two indexes
|
177
|
-
def & other
|
178
|
-
Index.new(to_a & other.to_a)
|
179
|
-
end
|
180
|
-
|
181
|
-
def to_a
|
182
|
-
@relation_hash.keys
|
183
|
-
end
|
184
|
-
|
185
|
-
def key(value)
|
186
|
-
return nil unless value.is_a?(Numeric)
|
187
|
-
@keys[value]
|
188
|
-
end
|
189
|
-
|
190
|
-
def include? index
|
191
|
-
@relation_hash.key? index
|
192
|
-
end
|
193
|
-
|
194
|
-
def empty?
|
195
|
-
@relation_hash.empty?
|
196
|
-
end
|
197
|
-
|
198
|
-
def dup
|
199
|
-
Daru::Index.new @relation_hash.keys
|
200
|
-
end
|
201
|
-
|
202
|
-
def add *indexes
|
203
|
-
Daru::Index.new(to_a + indexes)
|
204
|
-
end
|
205
|
-
|
206
|
-
def _dump(*)
|
207
|
-
Marshal.dump(relation_hash: @relation_hash)
|
208
|
-
end
|
209
|
-
|
210
|
-
def self._load data
|
211
|
-
h = Marshal.load data
|
212
|
-
|
213
|
-
Daru::Index.new(h[:relation_hash].keys)
|
214
|
-
end
|
215
|
-
|
216
|
-
# Provide an Index for sub vector produced
|
217
|
-
#
|
218
|
-
# @param input_indexes [Array] the input by user to index the vector
|
219
|
-
# @return [Object] the Index object for sub vector produced
|
220
|
-
def conform(*)
|
221
|
-
self
|
222
|
-
end
|
223
|
-
|
224
|
-
def reorder(new_order)
|
225
|
-
from = to_a
|
226
|
-
self.class.new(new_order.map { |i| from[i] })
|
227
|
-
end
|
228
|
-
|
229
|
-
private
|
230
|
-
|
231
|
-
def preprocess_range rng
|
232
|
-
start = rng.begin
|
233
|
-
en = rng.end
|
234
|
-
|
235
|
-
if start.is_a?(Integer) && en.is_a?(Integer)
|
236
|
-
@keys[start..en]
|
237
|
-
else
|
238
|
-
start_idx = @relation_hash[start]
|
239
|
-
en_idx = @relation_hash[en]
|
240
|
-
|
241
|
-
@keys[start_idx..en_idx]
|
242
|
-
end
|
243
|
-
end
|
244
|
-
|
245
|
-
def by_range rng
|
246
|
-
slice rng.begin, rng.end
|
247
|
-
end
|
248
|
-
|
249
|
-
def by_multi_key *key
|
250
|
-
if include? key[0]
|
251
|
-
Daru::Index.new key.map { |k| k }
|
252
|
-
else
|
253
|
-
# Assume the user is specifing values for index not keys
|
254
|
-
# Return index object having keys corresponding to values provided
|
255
|
-
Daru::Index.new key.map { |k| key k }
|
256
|
-
end
|
257
|
-
end
|
258
|
-
|
259
|
-
def by_single_key key
|
260
|
-
if @relation_hash.key?(key)
|
261
|
-
@relation_hash[key]
|
262
|
-
elsif key.is_a?(Numeric) && key < size
|
263
|
-
key
|
264
|
-
else
|
265
|
-
raise IndexError, "Specified index #{key.inspect} does not exist"
|
266
|
-
end
|
267
|
-
end
|
268
|
-
|
269
|
-
# Raises IndexError when one of the positions is an invalid position
|
270
|
-
def validate_positions *positions
|
271
|
-
positions = [positions] if positions.is_a? Integer
|
272
|
-
positions.each do |pos|
|
273
|
-
raise IndexError, "#{pos} is not a valid position." if pos >= size
|
274
|
-
end
|
275
|
-
end
|
276
|
-
|
277
|
-
# Preprocess ranges, integers and array in appropriate ways
|
278
|
-
def preprocess_positions *positions
|
279
|
-
if positions.size == 1
|
280
|
-
case positions.first
|
281
|
-
when Integer
|
282
|
-
positions.first
|
283
|
-
when Range
|
284
|
-
size.times.to_a[positions.first]
|
285
|
-
else
|
286
|
-
raise ArgumentError, 'Unkown position type.'
|
287
|
-
end
|
288
|
-
else
|
289
|
-
positions
|
290
|
-
end
|
291
|
-
end
|
292
|
-
end # class Index
|
293
|
-
|
294
|
-
class MultiIndex < Index
|
295
|
-
def each(&block)
|
296
|
-
to_a.each(&block)
|
297
|
-
end
|
298
|
-
|
299
|
-
def map(&block)
|
300
|
-
to_a.map(&block)
|
301
|
-
end
|
302
|
-
|
303
|
-
attr_reader :labels
|
304
|
-
|
305
|
-
def levels
|
306
|
-
@levels.map(&:keys)
|
307
|
-
end
|
308
|
-
|
309
|
-
def initialize opts={}
|
310
|
-
labels = opts[:labels]
|
311
|
-
levels = opts[:levels]
|
312
|
-
raise ArgumentError,
|
313
|
-
'Must specify both labels and levels' unless labels && levels
|
314
|
-
raise ArgumentError,
|
315
|
-
'Labels and levels should be same size' if labels.size != levels.size
|
316
|
-
raise ArgumentError,
|
317
|
-
'Incorrect labels and levels' if incorrect_fields?(labels, levels)
|
318
|
-
|
319
|
-
@labels = labels
|
320
|
-
@levels = levels.map { |e| e.map.with_index.to_h }
|
321
|
-
end
|
322
|
-
|
323
|
-
def incorrect_fields?(_labels, levels)
|
324
|
-
levels[0].size # FIXME: without this exact call some specs are failing
|
325
|
-
|
326
|
-
levels.any? { |e| e.uniq.size != e.size }
|
327
|
-
end
|
328
|
-
|
329
|
-
private :incorrect_fields?
|
330
|
-
|
331
|
-
def self.from_arrays arrays
|
332
|
-
levels = arrays.map { |e| e.uniq.sort_by(&:to_s) }
|
333
|
-
|
334
|
-
labels = arrays.each_with_index.map do |arry, level_index|
|
335
|
-
level = levels[level_index]
|
336
|
-
arry.map { |lvl| level.index(lvl) }
|
337
|
-
end
|
338
|
-
|
339
|
-
MultiIndex.new labels: labels, levels: levels
|
340
|
-
end
|
341
|
-
|
342
|
-
def self.from_tuples tuples
|
343
|
-
from_arrays tuples.transpose
|
344
|
-
end
|
345
|
-
|
346
|
-
def self.try_from_tuples tuples
|
347
|
-
if tuples.respond_to?(:first) && tuples.first.is_a?(Array)
|
348
|
-
from_tuples(tuples)
|
349
|
-
else
|
350
|
-
nil
|
351
|
-
end
|
352
|
-
end
|
353
|
-
|
354
|
-
def [] *key
|
355
|
-
key.flatten!
|
356
|
-
case
|
357
|
-
when key[0].is_a?(Range)
|
358
|
-
retrieve_from_range(key[0])
|
359
|
-
when key[0].is_a?(Integer) && key.size == 1
|
360
|
-
try_retrieve_from_integer(key[0])
|
361
|
-
else
|
362
|
-
begin
|
363
|
-
retrieve_from_tuples key
|
364
|
-
rescue NoMethodError
|
365
|
-
raise IndexError, "Specified index #{key.inspect} do not exist"
|
366
|
-
end
|
367
|
-
end
|
368
|
-
end
|
369
|
-
|
370
|
-
def valid? *indexes
|
371
|
-
# FIXME: This is perhaps not a good method
|
372
|
-
pos(*indexes)
|
373
|
-
return true
|
374
|
-
rescue IndexError
|
375
|
-
return false
|
376
|
-
end
|
377
|
-
|
378
|
-
# Returns positions given indexes or positions
|
379
|
-
# @note If the arugent is both a valid index and a valid position,
|
380
|
-
# it will treated as valid index
|
381
|
-
# @param [Array<object>] *indexes indexes or positions
|
382
|
-
# @example
|
383
|
-
# idx = Daru::MultiIndex.from_tuples [[:a, :one], [:a, :two], [:b, :one], [:b, :two]]
|
384
|
-
# idx.pos :a
|
385
|
-
# # => [0, 1]
|
386
|
-
def pos *indexes
|
387
|
-
if indexes.first.is_a? Integer
|
388
|
-
return indexes.first if indexes.size == 1
|
389
|
-
return indexes
|
390
|
-
end
|
391
|
-
res = self[indexes]
|
392
|
-
return res if res.is_a? Integer
|
393
|
-
res.map { |i| self[i] }
|
394
|
-
end
|
395
|
-
|
396
|
-
def subset *indexes
|
397
|
-
if indexes.first.is_a? Integer
|
398
|
-
MultiIndex.from_tuples(indexes.map { |index| key(index) })
|
399
|
-
else
|
400
|
-
self[indexes].conform indexes
|
401
|
-
end
|
402
|
-
end
|
403
|
-
|
404
|
-
# Takes positional values and returns subset of the self
|
405
|
-
# capturing the indexes at mentioned positions
|
406
|
-
# @param [Array<Integer>] positional values
|
407
|
-
# @return [object] index object
|
408
|
-
# @example
|
409
|
-
# idx = Daru::MultiIndex.from_tuples [[:a, :one], [:a, :two], [:b, :one], [:b, :two]]
|
410
|
-
# idx.at 0, 1
|
411
|
-
# # => #<Daru::MultiIndex(2x2)>
|
412
|
-
# # a one
|
413
|
-
# # two
|
414
|
-
def at *positions
|
415
|
-
positions = preprocess_positions(*positions)
|
416
|
-
validate_positions(*positions)
|
417
|
-
if positions.is_a? Integer
|
418
|
-
key(positions)
|
419
|
-
else
|
420
|
-
Daru::MultiIndex.from_tuples positions.map(&method(:key))
|
421
|
-
end
|
422
|
-
end
|
423
|
-
|
424
|
-
def add *indexes
|
425
|
-
Daru::MultiIndex.from_tuples to_a << indexes
|
426
|
-
end
|
427
|
-
|
428
|
-
def reorder(new_order)
|
429
|
-
from = to_a
|
430
|
-
self.class.from_tuples(new_order.map { |i| from[i] })
|
431
|
-
end
|
432
|
-
|
433
|
-
def try_retrieve_from_integer int
|
434
|
-
@levels[0].key?(int) ? retrieve_from_tuples([int]) : int
|
435
|
-
end
|
436
|
-
|
437
|
-
def retrieve_from_range range
|
438
|
-
MultiIndex.from_tuples(range.map { |index| key(index) })
|
439
|
-
end
|
440
|
-
|
441
|
-
def retrieve_from_tuples key
|
442
|
-
chosen = []
|
443
|
-
|
444
|
-
key.each_with_index do |k, depth|
|
445
|
-
level_index = @levels[depth][k]
|
446
|
-
raise IndexError, "Specified index #{key.inspect} do not exist" if level_index.nil?
|
447
|
-
label = @labels[depth]
|
448
|
-
chosen = find_all_indexes label, level_index, chosen
|
449
|
-
end
|
450
|
-
|
451
|
-
return chosen[0] if chosen.size == 1 && key.size == @levels.size
|
452
|
-
multi_index_from_multiple_selections(chosen)
|
453
|
-
end
|
454
|
-
|
455
|
-
def multi_index_from_multiple_selections chosen
|
456
|
-
MultiIndex.from_tuples(chosen.map { |e| key(e) })
|
457
|
-
end
|
458
|
-
|
459
|
-
def find_all_indexes label, level_index, chosen
|
460
|
-
if chosen.empty?
|
461
|
-
label.each_with_index
|
462
|
-
.select { |lbl, _| lbl == level_index }.map(&:last)
|
463
|
-
else
|
464
|
-
chosen.keep_if { |c| label[c] == level_index }
|
465
|
-
end
|
466
|
-
end
|
467
|
-
|
468
|
-
private :find_all_indexes, :multi_index_from_multiple_selections,
|
469
|
-
:retrieve_from_range, :retrieve_from_tuples
|
470
|
-
|
471
|
-
def key index
|
472
|
-
raise ArgumentError,
|
473
|
-
"Key #{index} is too large" if index >= @labels[0].size
|
474
|
-
|
475
|
-
@labels
|
476
|
-
.each_with_index
|
477
|
-
.map { |label, i| @levels[i].keys[label[index]] }
|
478
|
-
end
|
479
|
-
|
480
|
-
def dup
|
481
|
-
MultiIndex.new levels: levels.dup, labels: labels
|
482
|
-
end
|
483
|
-
|
484
|
-
def drop_left_level by=1
|
485
|
-
MultiIndex.from_arrays to_a.transpose[by..-1]
|
486
|
-
end
|
487
|
-
|
488
|
-
def | other
|
489
|
-
MultiIndex.from_tuples(to_a | other.to_a)
|
490
|
-
end
|
491
|
-
|
492
|
-
def & other
|
493
|
-
MultiIndex.from_tuples(to_a & other.to_a)
|
494
|
-
end
|
495
|
-
|
496
|
-
def empty?
|
497
|
-
@labels.flatten.empty? && @levels.all?(&:empty?)
|
498
|
-
end
|
499
|
-
|
500
|
-
def include? tuple
|
501
|
-
return false unless tuple.is_a? Enumerable
|
502
|
-
tuple.flatten.each_with_index
|
503
|
-
.all? { |tup, i| @levels[i][tup] }
|
504
|
-
end
|
505
|
-
|
506
|
-
def size
|
507
|
-
@labels[0].size
|
508
|
-
end
|
509
|
-
|
510
|
-
def width
|
511
|
-
@levels.size
|
512
|
-
end
|
513
|
-
|
514
|
-
def == other
|
515
|
-
self.class == other.class &&
|
516
|
-
labels == other.labels &&
|
517
|
-
levels == other.levels
|
518
|
-
end
|
519
|
-
|
520
|
-
def to_a
|
521
|
-
(0...size).map { |e| key(e) }
|
522
|
-
end
|
523
|
-
|
524
|
-
def values
|
525
|
-
Array.new(size) { |i| i }
|
526
|
-
end
|
527
|
-
|
528
|
-
def inspect threshold=20
|
529
|
-
"#<Daru::MultiIndex(#{size}x#{width})>\n" +
|
530
|
-
Formatters::Table.format([], row_headers: sparse_tuples, threshold: threshold)
|
531
|
-
end
|
532
|
-
|
533
|
-
def to_html
|
534
|
-
path = File.expand_path('../iruby/templates/multi_index.html.erb', __FILE__)
|
535
|
-
ERB.new(File.read(path).strip).result(binding)
|
536
|
-
end
|
537
|
-
|
538
|
-
# Provide a MultiIndex for sub vector produced
|
539
|
-
#
|
540
|
-
# @param input_indexes [Array] the input by user to index the vector
|
541
|
-
# @return [Object] the MultiIndex object for sub vector produced
|
542
|
-
def conform input_indexes
|
543
|
-
return self if input_indexes[0].is_a? Range
|
544
|
-
drop_left_level input_indexes.size
|
545
|
-
end
|
546
|
-
|
547
|
-
# Return tuples with nils in place of repeating values, like this:
|
548
|
-
#
|
549
|
-
# [:a , :bar, :one]
|
550
|
-
# [nil, nil , :two]
|
551
|
-
# [nil, :foo, :one]
|
552
|
-
#
|
553
|
-
def sparse_tuples
|
554
|
-
tuples = to_a
|
555
|
-
[tuples.first] + each_cons(2).map { |prev, cur|
|
556
|
-
left = cur.zip(prev).drop_while { |c, p| c == p }
|
557
|
-
[nil] * (cur.size - left.size) + left.map(&:first)
|
558
|
-
}
|
559
|
-
end
|
560
|
-
end
|
561
|
-
|
562
|
-
class CategoricalIndex < Index
|
563
|
-
# Create a categorical index object.
|
564
|
-
# @param indexes [Array<object>] array of indexes
|
565
|
-
# @return [Daru::CategoricalIndex] categorical index
|
566
|
-
# @example
|
567
|
-
# Daru::CategoricalIndex.new [:a, 1, :a, 1, :c]
|
568
|
-
# # => #<Daru::CategoricalIndex(5): {a, 1, a, 1, c}>
|
569
|
-
def initialize indexes
|
570
|
-
# Create a hash to map each category to positional indexes
|
571
|
-
categories = indexes.each_with_index.group_by(&:first)
|
572
|
-
@cat_hash = categories.map { |cat, group| [cat, group.map(&:last)] }.to_h
|
573
|
-
|
574
|
-
# Map each category to a unique integer for effective storage in @array
|
575
|
-
map_cat_int = categories.keys.each_with_index.to_h
|
576
|
-
|
577
|
-
# To link every instance to its category,
|
578
|
-
# it stores integer for every instance representing its category
|
579
|
-
@array = map_cat_int.values_at(*indexes)
|
580
|
-
end
|
581
|
-
|
582
|
-
# Duplicates the index object and return it
|
583
|
-
# @return [Daru::CategoricalIndex] duplicated index object
|
584
|
-
def dup
|
585
|
-
# Improve it by intializing index by hash
|
586
|
-
Daru::CategoricalIndex.new to_a
|
587
|
-
end
|
588
|
-
|
589
|
-
# Returns true index or category is valid
|
590
|
-
# @param index [object] the index value to look for
|
591
|
-
# @return [true, false] true if index is included, false otherwise
|
592
|
-
def include? index
|
593
|
-
@cat_hash.include? index
|
594
|
-
end
|
595
|
-
|
596
|
-
# Returns array of categories
|
597
|
-
# @example
|
598
|
-
# x = Daru::CategoricalIndex.new [:a, 1, :a, 1, :c]
|
599
|
-
# x.categories
|
600
|
-
# # => [:a, 1, :c]
|
601
|
-
def categories
|
602
|
-
@cat_hash.keys
|
603
|
-
end
|
604
|
-
|
605
|
-
# Returns positions given categories or positions
|
606
|
-
# @note If the argument does not a valid category it treats it as position
|
607
|
-
# value and return it as it is.
|
608
|
-
# @param [Array<object>] *indexes categories or positions
|
609
|
-
# @example
|
610
|
-
# x = Daru::CategoricalIndex.new [:a, 1, :a, 1, :c]
|
611
|
-
# x.pos :a, 1
|
612
|
-
# # => [0, 1, 2, 3]
|
613
|
-
def pos *indexes
|
614
|
-
positions = indexes.map do |index|
|
615
|
-
if include? index
|
616
|
-
@cat_hash[index]
|
617
|
-
elsif index.is_a?(Numeric) && index < @array.size
|
618
|
-
index
|
619
|
-
else
|
620
|
-
raise IndexError, "#{index.inspect} is neither a valid category"\
|
621
|
-
' nor a valid position'
|
622
|
-
end
|
623
|
-
end
|
624
|
-
|
625
|
-
positions.flatten!
|
626
|
-
positions.size == 1 ? positions.first : positions.sort
|
627
|
-
end
|
628
|
-
|
629
|
-
# Returns index value from position
|
630
|
-
# @param pos [Integer] the position to look for
|
631
|
-
# @return [object] category corresponding to position
|
632
|
-
# @example
|
633
|
-
# idx = Daru::CategoricalIndex.new [:a, :b, :a, :b, :c]
|
634
|
-
# idx.index_from_pos 1
|
635
|
-
# # => :b
|
636
|
-
def index_from_pos pos
|
637
|
-
cat_from_int @array[pos]
|
638
|
-
end
|
639
|
-
|
640
|
-
# Returns enumerator enumerating all index values in the order they occur
|
641
|
-
# @return [Enumerator] all index values
|
642
|
-
# @example
|
643
|
-
# idx = Daru::CategoricalIndex.new [:a, :a, :b]
|
644
|
-
# idx.each.to_a
|
645
|
-
# # => [:a, :a, :b]
|
646
|
-
def each
|
647
|
-
return enum_for(:each) unless block_given?
|
648
|
-
@array.each { |pos| yield cat_from_int pos }
|
649
|
-
self
|
650
|
-
end
|
651
|
-
|
652
|
-
# Compares two index object. Returns true if every instance of category
|
653
|
-
# occur at the same position
|
654
|
-
# @param [Daru::CateogricalIndex] other index object to be checked against
|
655
|
-
# @return [true, false] true if other is similar to self
|
656
|
-
# @example
|
657
|
-
# a = Daru::CategoricalIndex.new [:a, :a, :b]
|
658
|
-
# b = Daru::CategoricalIndex.new [:b, :a, :a]
|
659
|
-
# a == b
|
660
|
-
# # => false
|
661
|
-
def == other
|
662
|
-
self.class == other.class &&
|
663
|
-
size == other.size &&
|
664
|
-
to_h == other.to_h
|
665
|
-
end
|
666
|
-
|
667
|
-
# Returns all the index values
|
668
|
-
# @return [Array] all index values
|
669
|
-
# @example
|
670
|
-
# idx = Daru::CategoricalIndex.new [:a, :b, :a]
|
671
|
-
# idx.to_a
|
672
|
-
def to_a
|
673
|
-
each.to_a
|
674
|
-
end
|
675
|
-
|
676
|
-
# Returns hash table mapping category to positions at which they occur
|
677
|
-
# @return [Hash] hash table mapping category to array of positions
|
678
|
-
# @example
|
679
|
-
# idx = Daru::CategoricalIndex.new [:a, :b, :a]
|
680
|
-
# idx.to_h
|
681
|
-
# # => {:a=>[0, 2], :b=>[1]}
|
682
|
-
def to_h
|
683
|
-
@cat_hash
|
684
|
-
end
|
685
|
-
|
686
|
-
# Returns size of the index object
|
687
|
-
# @return [Integer] total number of instances of all categories
|
688
|
-
# @example
|
689
|
-
# idx = Daru::CategoricalIndex.new [:a, :b, :a]
|
690
|
-
# idx.size
|
691
|
-
# # => 3
|
692
|
-
def size
|
693
|
-
@array.size
|
694
|
-
end
|
695
|
-
|
696
|
-
# Returns true if index object is storing no category
|
697
|
-
# @return [true, false] true if index object is empty
|
698
|
-
# @example
|
699
|
-
# i = Daru::CategoricalIndex.new []
|
700
|
-
# # => #<Daru::CategoricalIndex(0): {}>
|
701
|
-
# i.empty?
|
702
|
-
# # => true
|
703
|
-
def empty?
|
704
|
-
@array.empty?
|
705
|
-
end
|
706
|
-
|
707
|
-
# Return subset given categories or positions
|
708
|
-
# @param [Array<object>] *indexes categories or positions
|
709
|
-
# @return [Daru::CategoricalIndex] subset of the self containing the
|
710
|
-
# mentioned categories or positions
|
711
|
-
# @example
|
712
|
-
# idx = Daru::CategoricalIndex.new [:a, :b, :a, :b, :c]
|
713
|
-
# idx.subset :a, :b
|
714
|
-
# # => #<Daru::CategoricalIndex(4): {a, b, a, b}>
|
715
|
-
def subset *indexes
|
716
|
-
positions = pos(*indexes)
|
717
|
-
new_index = positions.map { |pos| index_from_pos pos }
|
718
|
-
|
719
|
-
Daru::CategoricalIndex.new new_index.flatten
|
720
|
-
end
|
721
|
-
|
722
|
-
# Takes positional values and returns subset of the self
|
723
|
-
# capturing the categories at mentioned positions
|
724
|
-
# @param [Array<Integer>] positional values
|
725
|
-
# @return [object] index object
|
726
|
-
# @example
|
727
|
-
# idx = Daru::CategoricalIndex.new [:a, :b, :a, :b, :c]
|
728
|
-
# idx.at 0, 1
|
729
|
-
# # => #<Daru::CategoricalIndex(2): {a, b}>
|
730
|
-
def at *positions
|
731
|
-
positions = preprocess_positions(*positions)
|
732
|
-
validate_positions(*positions)
|
733
|
-
if positions.is_a? Integer
|
734
|
-
index_from_pos(positions)
|
735
|
-
else
|
736
|
-
Daru::CategoricalIndex.new positions.map(&method(:index_from_pos))
|
737
|
-
end
|
738
|
-
end
|
739
|
-
|
740
|
-
# Add specified index values to the index object
|
741
|
-
# @param [Array<object>] *indexes index values to add
|
742
|
-
# @return [Daru::CategoricalIndex] index object with added values
|
743
|
-
# @example
|
744
|
-
# idx = Daru::CategoricalIndex.new [:a, :b, :a, :b, :c]
|
745
|
-
# idx.add :d
|
746
|
-
# # => #<Daru::CategoricalIndex(6): {a, b, a, b, c, d}>
|
747
|
-
def add *indexes
|
748
|
-
Daru::CategoricalIndex.new(to_a + indexes)
|
749
|
-
end
|
750
|
-
|
751
|
-
private
|
752
|
-
|
753
|
-
def int_from_cat cat
|
754
|
-
@cat_hash.keys.index cat
|
755
|
-
end
|
756
|
-
|
757
|
-
def cat_from_int cat
|
758
|
-
@cat_hash.keys[cat]
|
759
|
-
end
|
760
|
-
end
|
761
|
-
end
|