RubyGems - statsample - Versions diffs - 1.5.0 → 2.0.0 - Mend

statsample 1.5.0 → 2.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (114) hide show

checksums.yaml +4 -4
data/.build.sh +15 -0
data/.gitignore +1 -0
data/.travis.yml +19 -7
data/CONTRIBUTING.md +33 -0
data/History.txt +5 -0
data/README.md +41 -53
data/benchmarks/correlation_matrix_15_variables.rb +6 -5
data/benchmarks/correlation_matrix_5_variables.rb +6 -5
data/benchmarks/correlation_matrix_methods/correlation_matrix.rb +23 -26
data/examples/boxplot.rb +17 -5
data/examples/correlation_matrix.rb +36 -7
data/examples/dataset.rb +25 -5
data/examples/dominance_analysis.rb +8 -7
data/examples/dominance_analysis_bootstrap.rb +16 -11
data/examples/histogram.rb +16 -2
data/examples/icc.rb +5 -6
data/examples/levene.rb +17 -3
data/examples/multiple_regression.rb +6 -3
data/examples/parallel_analysis.rb +11 -6
data/examples/polychoric.rb +26 -13
data/examples/principal_axis.rb +8 -4
data/examples/reliability.rb +10 -10
data/examples/scatterplot.rb +8 -0
data/examples/t_test.rb +7 -0
data/examples/u_test.rb +10 -2
data/examples/vector.rb +9 -6
data/examples/velicer_map_test.rb +12 -8
data/lib/statsample.rb +13 -47
data/lib/statsample/analysis/suite.rb +1 -1
data/lib/statsample/anova/oneway.rb +6 -6
data/lib/statsample/anova/twoway.rb +26 -24
data/lib/statsample/bivariate.rb +78 -61
data/lib/statsample/bivariate/pearson.rb +2 -2
data/lib/statsample/codification.rb +45 -32
data/lib/statsample/converter/csv.rb +15 -53
data/lib/statsample/converter/spss.rb +6 -5
data/lib/statsample/converters.rb +50 -211
data/lib/statsample/crosstab.rb +26 -25
data/lib/statsample/daru.rb +117 -0
data/lib/statsample/dataset.rb +70 -942
data/lib/statsample/dominanceanalysis.rb +16 -17
data/lib/statsample/dominanceanalysis/bootstrap.rb +26 -28
data/lib/statsample/factor/parallelanalysis.rb +17 -19
data/lib/statsample/factor/pca.rb +21 -20
data/lib/statsample/factor/principalaxis.rb +3 -3
data/lib/statsample/graph/boxplot.rb +8 -16
data/lib/statsample/graph/histogram.rb +4 -4
data/lib/statsample/graph/scatterplot.rb +8 -7
data/lib/statsample/histogram.rb +128 -119
data/lib/statsample/matrix.rb +20 -16
data/lib/statsample/multiset.rb +39 -38
data/lib/statsample/regression.rb +3 -3
data/lib/statsample/regression/multiple.rb +8 -10
data/lib/statsample/regression/multiple/alglibengine.rb +96 -89
data/lib/statsample/regression/multiple/baseengine.rb +32 -32
data/lib/statsample/regression/multiple/gslengine.rb +33 -36
data/lib/statsample/regression/multiple/matrixengine.rb +7 -9
data/lib/statsample/regression/multiple/rubyengine.rb +39 -41
data/lib/statsample/reliability.rb +23 -25
data/lib/statsample/reliability/icc.rb +8 -7
data/lib/statsample/reliability/multiscaleanalysis.rb +14 -12
data/lib/statsample/reliability/scaleanalysis.rb +58 -60
data/lib/statsample/reliability/skillscaleanalysis.rb +34 -29
data/lib/statsample/resample.rb +1 -1
data/lib/statsample/shorthand.rb +29 -25
data/lib/statsample/test/kolmogorovsmirnov.rb +5 -3
data/lib/statsample/test/levene.rb +28 -27
data/lib/statsample/test/t.rb +7 -9
data/lib/statsample/test/umannwhitney.rb +28 -28
data/lib/statsample/test/wilcoxonsignedrank.rb +45 -43
data/lib/statsample/vector.rb +70 -1013
data/lib/statsample/version.rb +1 -1
data/statsample.gemspec +12 -16
data/test/helpers_tests.rb +1 -1
data/test/test_analysis.rb +17 -17
data/test/test_anova_contrast.rb +6 -6
data/test/test_anovatwowaywithdataset.rb +8 -8
data/test/test_anovawithvectors.rb +8 -8
data/test/test_awesome_print_bug.rb +1 -1
data/test/test_bartlettsphericity.rb +4 -4
data/test/test_bivariate.rb +48 -43
data/test/test_codification.rb +33 -33
data/test/test_crosstab.rb +9 -9
data/test/test_dataset.rb +28 -458
data/test/test_factor.rb +46 -38
data/test/test_factor_pa.rb +22 -13
data/test/test_ggobi.rb +4 -4
data/test/test_gsl.rb +4 -4
data/test/test_histogram.rb +3 -3
data/test/test_matrix.rb +13 -13
data/test/test_multiset.rb +103 -91
data/test/test_regression.rb +57 -52
data/test/test_reliability.rb +55 -45
data/test/test_reliability_icc.rb +8 -8
data/test/test_reliability_skillscale.rb +26 -24
data/test/test_resample.rb +1 -1
data/test/test_statistics.rb +3 -13
data/test/test_stest.rb +9 -9
data/test/test_stratified.rb +3 -3
data/test/test_test_t.rb +12 -12
data/test/test_umannwhitney.rb +2 -2
data/test/test_vector.rb +76 -613
data/test/test_wilcoxonsignedrank.rb +4 -4
metadata +57 -28
data/lib/statsample/rserve_extension.rb +0 -20
data/lib/statsample/vector/gsl.rb +0 -106
data/test/fixtures/repeated_fields.csv +0 -7
data/test/fixtures/scientific_notation.csv +0 -4
data/test/fixtures/test_csv.csv +0 -7
data/test/fixtures/test_xls.xls +0 -0
data/test/test_csv.rb +0 -63
data/test/test_rserve_extension.rb +0 -42
data/test/test_xls.rb +0 -52

data/test/test_reliability_skillscale.rb CHANGED

@@ -5,30 +5,32 @@ class StatsampleReliabilitySkillScaleTestCase < Minitest::Test
     setup do
       options = %w(a b c d e)
       cases = 20
-      @id = cases.times.map { |v| v }.to_numeric
-      @a = cases.times.map { options[rand(5)] }.to_vector
-      @b = cases.times.map { options[rand(5)] }.to_vector
-      @c = cases.times.map { options[rand(5)] }.to_vector
-      @d = cases.times.map { options[rand(5)] }.to_vector
-      @e = cases.times.map {|i|
-        i == 0 ? options[rand(0)] :
+      @id = Daru::Vector.new(cases.times.map { |v| v })
+      @a = Daru::Vector.new(cases.times.map { options[rand(5)] })
+      @b = Daru::Vector.new(cases.times.map { options[rand(5)] })
+      @c = Daru::Vector.new(cases.times.map { options[rand(5)] })
+      @d = Daru::Vector.new(cases.times.map { options[rand(5)] })
+      @e = Daru::Vector.new(
+        cases.times.map do |i|
+          i == 0 ? options[rand(0)] :
           rand > 0.8 ? nil : options[rand(5)]
-      }.to_vector
-      @ds = { 'id' => @id, 'a' => @a, 'b' => @b, 'c' => @c, 'd' => @d, 'e' => @e }.to_dataset
-      @key = { 'a' => 'a', 'b' => options[rand(5)], 'c' => options[rand(5)], 'd' => options[rand(5)], 'e' => options[rand(5)] }
+        end
+      )
+      @ds = Daru::DataFrame.new({ :id => @id, :a => @a, :b => @b, :c => @c, :d => @d, :e => @e })
+      @key = { :a => 'a', :b => options[rand(5)], :c => options[rand(5)], :d => options[rand(5)], :e => options[rand(5)] }
       @ssa = Statsample::Reliability::SkillScaleAnalysis.new(@ds, @key)
-      @ac = @a.map { |v| v == @key['a'] ? 1 : 0 }.to_numeric
-      @bc = @b.map { |v| v == @key['b'] ? 1 : 0 }.to_numeric
-      @cc = @c.map { |v| v == @key['c'] ? 1 : 0 }.to_numeric
-      @dc = @d.map { |v| v == @key['d'] ? 1 : 0 }.to_numeric
-      @ec = @e.map { |v| v.nil? ? nil : (v == @key['e'] ? 1 : 0) }.to_numeric
+      @ac = Daru::Vector.new(@a.map { |v| v == @key[:a] ? 1 : 0 })
+      @bc = Daru::Vector.new(@b.map { |v| v == @key[:b] ? 1 : 0 })
+      @cc = Daru::Vector.new(@c.map { |v| v == @key[:c] ? 1 : 0 })
+      @dc = Daru::Vector.new(@d.map { |v| v == @key[:d] ? 1 : 0 })
+      @ec = Daru::Vector.new(@e.map { |v| v.nil? ? nil : (v == @key[:e] ? 1 : 0) })
     end
     should 'return proper corrected dataset' do
-      cds = { 'id' => @id, 'a' => @ac, 'b' => @bc, 'c' => @cc, 'd' => @dc, 'e' => @ec }.to_dataset
+      cds = Daru::DataFrame.new({ :id => @id, :a => @ac, :b => @bc, :c => @cc, :d => @dc, :e => @ec })
       assert_equal(cds, @ssa.corrected_dataset)
     end
     should 'return proper corrected minimal dataset' do
-      cdsm = { 'a' => @ac, 'b' => @bc, 'c' => @cc, 'd' => @dc, 'e' => @ec }.to_dataset
+      cdsm = Daru::DataFrame.new({ :a => @ac, :b => @bc, :c => @cc, :d => @dc, :e => @ec })
       assert_equal(cdsm, @ssa.corrected_dataset_minimal)
     end
     should 'return correct vector_sum and vector_sum' do
@@ -37,13 +39,13 @@ class StatsampleReliabilitySkillScaleTestCase < Minitest::Test
       assert_equal(cdsm.vector_mean, @ssa.vector_mean)
     end
     should 'not crash on rare case' do
-      a = Statsample::Vector['c', 'c', 'a', 'a', 'c', 'a', 'b', 'c', 'c', 'b', 'a', 'd', 'a', 'd', 'a', 'a', 'd', 'e', 'c', 'd']
-      b = Statsample::Vector['e', 'b', 'e', 'b', 'c', 'd', 'a', 'e', 'e', 'c', 'b', 'e', 'e', 'b', 'd', 'c', 'e', 'b', 'b', 'd']
-      c = Statsample::Vector['e', 'b', 'e', 'c', 'e', 'c', 'b', 'd', 'e', 'c', 'a', 'a', 'b', 'd', 'e', 'c', 'b', 'a', 'a', 'e']
-      d = Statsample::Vector['a', 'b', 'd', 'd', 'e', 'b', 'e', 'b', 'd', 'c', 'e', 'a', 'c', 'd', 'c', 'c', 'e', 'd', 'd', 'b']
-      e = Statsample::Vector['a', 'b', nil, 'd', 'c', 'c', 'd', nil, 'd', 'd', 'e', 'e', nil, nil, nil, 'd', 'c', nil, 'e', 'd']
-      key = { 'a' => 'a', 'b' => 'e', 'c' => 'd', 'd' => 'c', 'e' => 'd' }
-      ds = Statsample::Dataset.new('a' => a, 'b' => b, 'c' => c, 'd' => d, 'e' => e)
+      a = Daru::Vector.new(['c', 'c', 'a', 'a', 'c', 'a', 'b', 'c', 'c', 'b', 'a', 'd', 'a', 'd', 'a', 'a', 'd', 'e', 'c', 'd'])
+      b = Daru::Vector.new(['e', 'b', 'e', 'b', 'c', 'd', 'a', 'e', 'e', 'c', 'b', 'e', 'e', 'b', 'd', 'c', 'e', 'b', 'b', 'd'])
+      c = Daru::Vector.new(['e', 'b', 'e', 'c', 'e', 'c', 'b', 'd', 'e', 'c', 'a', 'a', 'b', 'd', 'e', 'c', 'b', 'a', 'a', 'e'])
+      d = Daru::Vector.new(['a', 'b', 'd', 'd', 'e', 'b', 'e', 'b', 'd', 'c', 'e', 'a', 'c', 'd', 'c', 'c', 'e', 'd', 'd', 'b'])
+      e = Daru::Vector.new(['a', 'b', nil, 'd', 'c', 'c', 'd', nil, 'd', 'd', 'e', 'e', nil, nil, nil, 'd', 'c', nil, 'e', 'd'])
+      key = { :a => 'a', :b => 'e', :c => 'd', :d => 'c', :e => 'd' }
+      ds = Daru::DataFrame.new({:a => a, :b => b, :c => c, :d => d, :e => e})
       ssa = Statsample::Reliability::SkillScaleAnalysis.new(ds, key)
       assert(ssa.summary)
     end

data/test/test_resample.rb CHANGED

@@ -17,7 +17,7 @@ class StatsampleResampleTestCase < Minitest::Test
       Statsample::Resample.generate(20, 1, 10).count(1)
     }
     assert_equal(400, r.size)
-    v = Statsample::Vector.new(r, :numeric)
+    v = Daru::Vector.new(r)
     a = v.count { |x|  x > 3 }
     assert(a >= 30 && a <= 70)
   end

data/test/test_statistics.rb CHANGED

@@ -32,7 +32,7 @@ class StatsampleStatisicsTestCase < Minitest::Test
   end
   def test_estimation_mean
-    v = ([42] * 23 + [41] * 4 + [36] * 1 + [32] * 1 + [29] * 1 + [27] * 2 + [23] * 1 + [19] * 1 + [16] * 2 + [15] * 2 + [14, 11, 10, 9, 7] + [6] * 3 + [5] * 2 + [4, 3]).to_vector(:numeric)
+    v = Daru::Vector.new([42] * 23 + [41] * 4 + [36] * 1 + [32] * 1 + [29] * 1 + [27] * 2 + [23] * 1 + [19] * 1 + [16] * 2 + [15] * 2 + [14, 11, 10, 9, 7] + [6] * 3 + [5] * 2 + [4, 3])
     assert_equal(50, v.size)
     assert_equal(1471, v.sum)
     # limits=Statsample::SRS.mean_confidence_interval_z(v.mean(), v.sds(), v.size,676,0.80)
@@ -55,19 +55,9 @@ class StatsampleStatisicsTestCase < Minitest::Test
     assert_in_delta(0.46, l[1], 0.01)
   end
-  def test_ml
-    if true
-      # real=[1,1,1,1].to_vector(:numeric)
-      # pred=[0.0001,0.0001,0.0001,0.0001].to_vector(:numeric)
-      # puts  Statsample::Bivariate.maximum_likehood_dichotomic(pred,real)
-    end
-  end
   def test_simple_linear_regression
-    a = [1, 2, 3, 4, 5, 6].to_vector(:numeric)
-    b = [6, 2, 4, 10, 12, 8].to_vector(:numeric)
+    a = Daru::Vector.new([1, 2, 3, 4, 5, 6])
+    b = Daru::Vector.new([6, 2, 4, 10, 12, 8])
     reg = Statsample::Regression::Simple.new_from_vectors(a, b)
     assert_in_delta((reg.ssr + reg.sse).to_f, reg.sst, 0.001)
     assert_in_delta(Statsample::Bivariate.pearson(a, b), reg.r, 0.001)

data/test/test_stest.rb CHANGED

@@ -24,26 +24,26 @@ class StatsampleTestTestCase < Minitest::Test
   end
   def test_u_mannwhitney
-    a = [1, 2, 3, 4, 5, 6].to_numeric
-    b = [0, 5, 7, 9, 10, 11].to_numeric
+    a = Daru::Vector.new([1, 2, 3, 4, 5, 6])
+    b = Daru::Vector.new([0, 5, 7, 9, 10, 11])
     assert_equal(7.5, Statsample::Test.u_mannwhitney(a, b).u)
     assert_equal(7.5, Statsample::Test.u_mannwhitney(b, a).u)
-    a = [1, 7, 8, 9, 10, 11].to_numeric
-    b = [2, 3, 4, 5, 6, 12].to_numeric
+    a = Daru::Vector.new([1, 7, 8, 9, 10, 11])
+    b = Daru::Vector.new([2, 3, 4, 5, 6, 12])
     assert_equal(11, Statsample::Test.u_mannwhitney(a, b).u)
   end
   def test_levene
-    a = [1, 2, 3, 4, 5, 6, 7, 8, 100, 10].to_numeric
-    b = [30, 40, 50, 60, 70, 80, 90, 100, 110, 120].to_numeric
+    a = Daru::Vector.new([1, 2, 3, 4, 5, 6, 7, 8, 100, 10])
+    b = Daru::Vector.new([30, 40, 50, 60, 70, 80, 90, 100, 110, 120])
     levene = Statsample::Test::Levene.new([a, b])
     assert_levene(levene)
   end
   def test_levene_dataset
-    a = [1, 2, 3, 4, 5, 6, 7, 8, 100, 10].to_numeric
-    b = [30, 40, 50, 60, 70, 80, 90, 100, 110, 120].to_numeric
-    ds = { 'a' => a, 'b' => b }.to_dataset
+    a = Daru::Vector.new([1, 2, 3, 4, 5, 6, 7, 8, 100, 10])
+    b = Daru::Vector.new([30, 40, 50, 60, 70, 80, 90, 100, 110, 120])
+    ds = Daru::DataFrame.new({ :a => a, :b => b })
     levene = Statsample::Test::Levene.new(ds)
     assert_levene(levene)
   end

data/test/test_stratified.rb CHANGED

@@ -9,9 +9,9 @@ class StatsampleStratifiedTestCase < Minitest::Test
     a = [10, 20, 30, 40, 50]
     b = [110, 120, 130, 140]
     pop = a + b
-    av = a.to_vector(:numeric)
-    bv = b.to_vector(:numeric)
-    popv = pop.to_vector(:numeric)
+    av   = Daru::Vector.new(a)
+    bv   = Daru::Vector.new(b)
+    popv = Daru::Vector.new(pop)
     assert_equal(popv.mean, Statsample::StratifiedSample.mean(av, bv))
   end
 end

data/test/test_test_t.rb CHANGED

@@ -4,24 +4,24 @@ class StatsampleTestTTestCase < Minitest::Test
   include Math
   context T do
     setup do
-      @a = [30.02, 29.99, 30.11, 29.97, 30.01, 29.99].to_numeric
-      @b = [29.89, 29.93, 29.72, 29.98, 30.02, 29.98].to_numeric
+      @a = Daru::Vector.new([30.02, 29.99, 30.11, 29.97, 30.01, 29.99])
+      @b = Daru::Vector.new([29.89, 29.93, 29.72, 29.98, 30.02, 29.98])
       @x1 = @a.mean
       @x2 = @b.mean
       @s1 = @a.sd
       @s2 = @b.sd
-      @n1 = @a.n
-      @n2 = @b.n
+      @n1 = @a.size
+      @n2 = @b.size
     end
     should 'calculate correctly standard t' do
-      t = Statsample::Test::T.new(@x1, @s1.quo(Math.sqrt(@a.n)), @a.n - 1)
-      assert_equal((@x1).quo(@s1.quo(Math.sqrt(@a.n))), t.t)
-      assert_equal(@a.n - 1, t.df)
+      t = Statsample::Test::T.new(@x1, @s1.quo(Math.sqrt(@a.size)), @a.size - 1)
+      assert_equal((@x1).quo(@s1.quo(Math.sqrt(@a.size))), t.t)
+      assert_equal(@a.size - 1, t.df)
       assert(t.summary.size > 0)
     end
     should 'calculate correctly t for one sample' do
-      t1 = [6, 4, 6, 7, 4, 5, 5, 12, 6, 1].to_numeric
-      t2 = [9, 6, 5, 10, 10, 8, 7, 10, 6, 5].to_numeric
+      t1 = Daru::Vector.new([6, 4, 6, 7, 4, 5, 5, 12, 6, 1])
+      t2 = Daru::Vector.new([9, 6, 5, 10, 10, 8, 7, 10, 6, 5])
       d = t1 - t2
       t = Statsample::Test::T::OneSample.new(d)
       assert_in_delta(-2.631, t.t, 0.001)
@@ -48,14 +48,14 @@ class StatsampleTestTTestCase < Minitest::Test
       assert_in_delta(0.09095, t.probability_not_equal_variance, 0.001)
     end
     should 'be the same using shorthand' do
-      v = 100.times.map { rand(100) }.to_numeric
+      v = Daru::Vector.new(100.times.map { rand(100) })
       assert_equal(Statsample::Test.t_one_sample(v).t, T::OneSample.new(v).t)
     end
     should 'calculate all values for one sample T test' do
       u = @a.mean + (1 - rand * 2)
       tos = T::OneSample.new(@a, u: u)
-      assert_equal((@a.mean - u).quo(@a.sd.quo(sqrt(@a.n))), tos.t)
-      assert_equal(@a.n - 1, tos.df)
+      assert_equal((@a.mean - u).quo(@a.sd.quo(sqrt(@a.size))), tos.t)
+      assert_equal(@a.size - 1, tos.df)
       assert(tos.summary.size > 0)
     end
   end

data/test/test_umannwhitney.rb CHANGED

@@ -4,8 +4,8 @@ class StatsampleUMannWhitneyTestCase < Minitest::Test
   include Statsample::Test
   context Statsample::Test::UMannWhitney do
     setup do
-      @v1 = [1, 2, 3, 4, 7, 8, 9, 10, 14, 15].to_numeric
-      @v2 = [5, 6, 11, 12, 13, 16, 17, 18, 19].to_numeric
+      @v1 = Daru::Vector.new([1, 2, 3, 4, 7, 8, 9, 10, 14, 15])
+      @v2 = Daru::Vector.new([5, 6, 11, 12, 13, 16, 17, 18, 19])
       @u = Statsample::Test::UMannWhitney.new(@v1, @v2)
     end
     should 'have same result using class or Test#u_mannwhitney' do

data/test/test_vector.rb CHANGED

@@ -3,24 +3,11 @@ require(File.expand_path(File.dirname(__FILE__) + '/helpers_tests.rb'))
 class StatsampleTestVector < Minitest::Test
   include Statsample::Shorthand
-  def setup
-    @c = Statsample::Vector.new([5, 5, 5, 5, 5, 6, 6, 7, 8, 9, 10, 1, 2, 3, 4, nil, -99, -99], :object)
-    @c.name = 'Test Vector'
-    @c.missing_values = [-99]
-  end
-  def assert_counting_tokens(b)
-    assert_equal([1, 1, 0, 1, 0, nil], b['a'].to_a)
-    assert_equal([0, 1, 0, 0, 0, nil], b['b'].to_a)
-    assert_equal([0, 0, 1, 0, 0, nil], b['c'].to_a)
-    assert_equal([0, 0, 1, 1, 0, nil], b['d'].to_a)
-    assert_equal([0, 0, 0, 0, 1, nil], b[10].to_a)
-  end
   context Statsample do
     setup do
       @sample = 100
-      @a = @sample.times.map { |i| (i + rand(10)) % 10 == 0 ? nil : rand(100) }.to_numeric
-      @b = @sample.times.map { |i| (i + rand(10)) % 10 == 0 ? nil : rand(100) }.to_numeric
+      @a = Daru::Vector.new(@sample.times.map { |i| (i + rand(10)) % 10 == 0 ? nil : rand(100) })
+      @b = Daru::Vector.new(@sample.times.map { |i| (i + rand(10)) % 10 == 0 ? nil : rand(100) })
       @correct_a = []
       @correct_b = []
       @a.each_with_index do |_v, i|
@@ -29,8 +16,8 @@ class StatsampleTestVector < Minitest::Test
           @correct_b.push(@b[i])
         end
       end
-      @correct_a = @correct_a.to_numeric
-      @correct_b = @correct_b.to_numeric
+      @correct_a = Daru::Vector.new(@correct_a)
+      @correct_b = Daru::Vector.new(@correct_b)
       @common = lambda  do |av, bv|
         assert_equal(@correct_a, av, 'A no es esperado')
@@ -39,649 +26,125 @@ class StatsampleTestVector < Minitest::Test
         assert(!bv.has_missing_data?, 'b tiene datos faltantes')
       end
     end
     should 'return correct only_valid' do
       av, bv = Statsample.only_valid @a, @b
+      av.reset_index!
+      bv.reset_index!
       av2, bv2 = Statsample.only_valid av, bv
       @common.call(av, bv)
       assert_equal(av, av2)
       assert_not_same(av, av2)
       assert_not_same(bv, bv2)
     end
     should 'return correct only_valid_clone' do
       av, bv = Statsample.only_valid_clone @a, @b
+      av.reset_index!
+      bv.reset_index!
       @common.call(av, bv)
       av2, bv2 = Statsample.only_valid_clone av, bv
       assert_equal(av, av2)
       assert_same(av, av2)
       assert_same(bv, bv2)
     end
-  end
-  context Statsample::Vector do
-    setup do
-      @c = Statsample::Vector.new([5, 5, 5, 5, 5, 6, 6, 7, 8, 9, 10, 1, 2, 3, 4, nil, -99, -99], :object)
-      @c.name = 'Test Vector'
-      @c.missing_values = [-99]
-    end
-    should_with_gsl 'be created with GSL::Vector' do
-      gsl = GSL::Vector[1, 2, 3, 4, 5]
-      v = Statsample::Vector.new(gsl)
-      assert_equal([1, 2, 3, 4, 5], v.to_a)
-      refute(v.flawed?)
-    end
-    context 'using matrix operations' do
-      setup do
-        @a = [1, 2, 3, 4, 5].to_numeric
-      end
-      should 'to_matrix returns a matrix with 1 row' do
-        mh = Matrix[[1, 2, 3, 4, 5]]
-        assert_equal(mh, @a.to_matrix)
-      end
-      should 'to_matrix(:vertical) returns a matrix with 1 column' do
-        mv = Matrix.columns([[1, 2, 3, 4, 5]])
-        assert_equal(mv, @a.to_matrix(:vertical))
-      end
-      should 'returns valid submatrixes' do
-        # 3*4 + 2*5 = 22
-        a = [3, 2].to_vector(:numeric)
-        b = [4, 5].to_vector(:numeric)
-        assert_equal(22, (a.to_matrix * b.to_matrix(:vertical))[0, 0])
-      end
+    should 'returns correct vector_cols_matrix' do
+      v1 = Daru::Vector.new(%w(a a a b b b c c))
+      v2 = Daru::Vector.new(%w(1 3 4 5 6 4 3 2))
+      v3 = Daru::Vector.new(%w(1 0 0 0 1 1 1 0))
+      ex = Matrix.rows([%w(a 1 1), %w(a 3 0), %w(a 4 0), %w(b 5 0), %w(b 6 1), %w(b 4 1), %w(c 3 1), %w(c 2 0)])
+      assert_equal(ex, Statsample.vector_cols_matrix(v1, v2, v3))
     end
-    context 'when initializing' do
-      setup do
-        @data = (10.times.map { rand(100) }) + [nil]
-        @original = Statsample::Vector.new(@data, :numeric)
-      end
-      should 'be the sample using []' do
-        second = Statsample::Vector[*@data]
-        assert_equal(@original, second)
-      end
-      should '[] returns same results as R-c()' do
-        reference = [0, 4, 5, 6, 10].to_numeric
-        assert_equal(reference, Statsample::Vector[0, 4, 5, 6, 10])
-        assert_equal(reference, Statsample::Vector[0, 4..6, 10])
-        assert_equal(reference, Statsample::Vector[[0], [4, 5, 6], [10]])
-        assert_equal(reference, Statsample::Vector[[0], [4, [5, [6]]], [10]])
-        assert_equal(reference, Statsample::Vector[[0], [4, 5, 6].to_vector, [10]])
-      end
-      should 'be the same usign #to_vector' do
-        lazy1 = @data.to_vector(:numeric)
-        assert_equal(@original, lazy1)
-      end
-      should 'be the same using #to_numeric' do
-        lazy2 = @data.to_numeric
-        assert_equal(@original, lazy2)
-        assert_equal(:numeric, lazy2.type)
-        assert_equal(@data.find_all { |v| !v.nil? }, lazy2.valid_data)
-      end
-      should 'could use new_numeric with size only' do
-        v1 = 10.times.map { nil }.to_numeric
-        v2 = Statsample::Vector.new_numeric(10)
-        assert_equal(v1, v2)
-      end
-      should 'could use new_numeric with size and value' do
-        a = rand
-        v1 = 10.times.map { a }.to_numeric
-        v2 = Statsample::Vector.new_numeric(10, a)
-        assert_equal(v1, v2)
-      end
-      should 'could use new_numeric with func' do
-        v1 = 10.times.map { |i| i * 2 }.to_numeric
-        v2 = Statsample::Vector.new_numeric(10) { |i| i * 2 }
-        assert_equal(v1, v2)
-      end
-    end
-    context "new types :numeric and :object" do
-      should "set default type of vector to :object" do
-        v = Statsample::Vector.new [1,2,3,4,5]
-        assert_equal(:object, v.type)
-      end
-      should "initialize Vector with :numeric type" do
-        v = Statsample::Vector.new [1,2,3,4,5,nil], :numeric
-        assert_equal(:numeric, v.type)
-        assert_equal([1,2,3,4,5], v.valid_data)
-      end
-      should "show a warning when initializing with :nominal, :numeric or :ordinal" do
-        assert_output(nil,"WARNING: nominal has been deprecated. Use :object instead.\n") do
-          Statsample::Vector.new [1,2,3,4,5,nil,'hello'], :nominal
-        end
-        assert_output(nil,"WARNING: scale has been deprecated. Use :numeric instead.\n") do
-          Statsample::Vector.new [1,2,3,4,nil,5], :scale
-        end
-        assert_output(nil,"WARNING: ordinal has been deprecated. Use :numeric instead.\n") do
-          Statsample::Vector.new [1,2,3,4,5], :ordinal
-        end
+  end
-        assert_output(nil,"WARNING: .new_scale has been deprecated. Use .new_numeric instead.\n") do
-          Statsample::Vector.new_scale 10, 1
+  context Statsample::Vector do
+    context 'when initializing' do
+      should '.new creates a Daru::Vector internally and shows a warning' do
+        assert_output(nil, "WARNING: Statsample::Dataset and Statsample::Vector have been deprecated in favor of Daru::DataFrame and Daru::Vector. Please switch to using that.\n") do
+          data = (10.times.map { rand(100) }) + [nil]
+          original = Statsample::Vector.new(@data, :numeric)
+          assert_equal(true, original.kind_of?(Daru::Vector))
         end
       end
-      should "test that new shorthands work" do
-        numeric = Statsample::Vector.new([1,2,3,4,nil,5], :numeric)
-        assert_equal(numeric, [1,2,3,4,nil,5].to_numeric)
-        assert_equal(numeric, [1,2,3,4,nil,5].to_vector(:numeric))
-        obj = Statsample::Vector.new([1,2,3,4,'one','two'], :object)
-        assert_equal(obj, [1,2,3,4,'one','two'].to_vector(:object))
-      end
-      should "test that old shorthands raise warnings" do
-        assert_output(nil,"WARNING: to_scale has been deprecated. Use to_numeric instead.\n") do
-          [1,2,3,4,nil,5].to_scale
+      should '[] returns same results as R-c()' do
+        assert_output(nil, "WARNING: Statsample::Dataset and Statsample::Vector have been deprecated in favor of Daru::DataFrame and Daru::Vector. Please switch to using that.\n") do
+          assert_equal(true, Statsample::Vector[1,2,3,4,5].kind_of?(Daru::Vector))
         end
       end
-    end
-    context '#split_by_separator' do
-      setup do
-        @a = Statsample::Vector.new(['a', 'a,b', 'c,d', 'a,d', 10, nil], :object)
-        @b = @a.split_by_separator(',')
-      end
-      should 'returns a Hash' do
-        assert_kind_of(Hash, @b)
-      end
-      should 'return a Hash with keys with different values of @a' do
-        expected = ['a', 'b', 'c', 'd', 10]
-        assert_equal(expected, @b.keys)
-      end
+      should "new_numeric/new_scale creates a Daru::Vector internally and shows a warning" do
+        assert_output(nil, "WARNING: Statsample::Dataset and Statsample::Vector have been deprecated in favor of Daru::DataFrame and Daru::Vector. Please switch to using that.\n") do
+          Statsample::Vector.new_scale(4)
+        end
-      should 'returns a Hash, which values are Statsample::Vector' do
-        @b.each_key { |k| assert_instance_of(Statsample::Vector, @b[k]) }
-      end
-      should 'hash values are n times the tokens appears' do
-        assert_counting_tokens(@b)
-      end
-      should '#split_by_separator_freq returns the number of ocurrences of tokens' do
-        assert_equal({ 'a' => 3, 'b' => 1, 'c' => 1, 'd' => 2, 10 => 1 }, @a.split_by_separator_freq)
-      end
-      should 'using a different separator give the same values' do
-        a = Statsample::Vector.new(['a', 'a*b', 'c*d', 'a*d', 10, nil], :object)
-        b = a.split_by_separator('*')
-        assert_counting_tokens(b)
-      end
-    end
-    should 'return correct median_absolute_deviation' do
-      a = [1, 1, 2, 2, 4, 6, 9].to_numeric
-      assert_equal(1, a.median_absolute_deviation)
-    end
-    should 'return correct histogram' do
-      a = 10.times.map { |v| v }.to_numeric
-      hist = a.histogram(2)
-      assert_equal([5, 5], hist.bin)
-      3.times do |i|
-        assert_in_delta(i * 4.5, hist.get_range(i)[0], 1e-9)
+        assert_output(nil, "WARNING: Statsample::Dataset and Statsample::Vector have been deprecated in favor of Daru::DataFrame and Daru::Vector. Please switch to using that.\n") do
+          Statsample::Vector.new_numeric(4)
+        end
       end
     end
-    should 'have a name' do
-      @c.name == 'Test Vector'
-    end
-    should 'without explicit name, returns vector with succesive numbers' do
-      a = 10.times.map { rand(100) }.to_numeric
-      b = 10.times.map { rand(100) }.to_numeric
-      assert_match(/Vector \d+/, a.name)
-      a.name =~ /Vector (\d+)/
-      next_number = Regexp.last_match(1).to_i + 1
-      assert_equal("Vector #{next_number}", b.name)
-    end
-    should 'save to a file and load the same Vector' do
-      outfile = Tempfile.new('vector.vec')
-      @c.save(outfile.path)
-      a = Statsample.load(outfile.path)
-      assert_equal(@c, a)
-    end
-    should '#collect returns an array' do
-      val = @c.collect { |v| v }
-      assert_equal(val, [5, 5, 5, 5, 5, 6, 6, 7, 8, 9, 10, 1, 2, 3, 4, nil, -99, -99])
-    end
+  end
-    should '#recode returns a recoded array' do
-      a = @c.recode { |v| @c.is_valid?(v) ? 0 : 1 }
-      exp = [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1].to_vector
-      assert_equal(exp, a)
-      exp.recode! { |v| v == 0 ? 1 : 0 }
-      exp2 = (([1] * 15) + ([0] * 3)).to_vector
-      assert_equal(exp2, exp)
-    end
-    should '#product returns the * of all values' do
-      a = [1, 2, 3, 4, 5].to_vector(:numeric)
-      assert_equal(120, a.product)
+  context "new types :numeric and :object" do
+    should "numerical data is automatically detected to be of type :numeric" do
+      v = Statsample::Vector.new [1,2,3,4,5,nil]
+      assert_equal(:numeric, v.type)
     end
-    should 'missing values' do
-      @c.missing_values = [10]
-      assert_equal([-99, -99, 1, 2, 3, 4, 5, 5, 5, 5, 5, 6, 6, 7, 8, 9], @c.valid_data.sort)
-      assert_equal([5, 5, 5, 5, 5, 6, 6, 7, 8, 9, nil, 1, 2, 3, 4, nil, -99, -99], @c.data_with_nils)
-      @c.missing_values = [-99]
-      assert_equal(@c.valid_data.sort, [1, 2, 3, 4, 5, 5, 5, 5, 5, 6, 6, 7, 8, 9, 10])
-      assert_equal(@c.data_with_nils, [5, 5, 5, 5, 5, 6, 6, 7, 8, 9, 10, 1, 2, 3, 4, nil, nil, nil])
-      @c.missing_values = []
-      assert_equal(@c.valid_data.sort, [-99, -99, 1, 2, 3, 4, 5, 5, 5, 5, 5, 6, 6, 7, 8, 9, 10])
-      assert_equal(@c.data_with_nils, [5, 5, 5, 5, 5, 6, 6, 7, 8, 9, 10, 1, 2, 3, 4, nil, -99, -99])
-    end
-    should 'correct has_missing_data? with missing data' do
-      a = [1, 2, 3, nil].to_vector
-      assert(a.has_missing_data?)
-    end
-    should 'correct has_missing_data? without missing data' do
-      a = [1, 2, 3, 4, 10].to_vector
-      assert(!a.has_missing_data?)
-    end
-    should 'with explicit missing_values, should respond has_missing_data?' do
-      a = [1, 2, 3, 4, 10].to_vector
-      a.missing_values = [10]
-      assert(a.has_missing_data?)
-    end
-    should 'label correctly fields' do
-      @c.labels = { 5 => 'FIVE' }
-      assert_equal(['FIVE', 'FIVE', 'FIVE', 'FIVE', 'FIVE', 6, 6, 7, 8, 9, 10, 1, 2, 3, 4, nil, -99, -99], @c.vector_labeled.to_a)
-    end
-    should 'verify' do
-      h = @c.verify { |d| !d.nil? and d > 0 }
-      e = { 15 => nil, 16 => -99, 17 => -99 }
-      assert_equal(e, h)
-    end
-    should 'have a summary with name on it' do
-      assert_match(/#{@c.name}/, @c.summary)
+    should "object data automatically detected as :object" do
+      v = Statsample::Vector.new [1,2,3,4,'hello','world']
+      assert_equal(:object, v.type)
     end
-    should 'GSL::Vector based should push correcty' do
-      if Statsample.has_gsl?
-        v = GSL::Vector[1, 2, 3, 4, 5].to_numeric
-        v.push(nil)
-        assert_equal([1, 2, 3, 4, 5, nil], v.to_a)
-        assert(v.flawed?)
-      else
-        skip('Requires GSL')
+    should "initialize Vector with :numeric type" do
+      v = Statsample::Vector.new [1,2,3,4,5,nil], :numeric
+      assert_equal(:numeric, v.type)
+      assert_output(nil, "WARNING: valid_data in Statsample::Vector has been deprecated in favor of only_valid in Daru::Vector. Please use that.\n") do
+        assert_equal([1,2,3,4,5], v.valid_data)
       end
     end
-    should 'split correctly' do
-      a = Statsample::Vector.new(['a', 'a,b', 'c,d', 'a,d', 'd', 10, nil], :object)
-      assert_equal([%w(a), %w(a b), %w(c d), %w(a d), %w(d), [10], nil], a.splitted)
-    end
-    should 'multiply correct for scalar' do
-      a = [1, 2, 3].to_numeric
-      assert_equal([5, 10, 15].to_numeric, a * 5)
-    end
-    should 'multiply correct with other vector' do
-      a = [1, 2, 3].to_numeric
-      b = [2, 4, 6].to_numeric
-      assert_equal([2, 8, 18].to_numeric, a * b)
-    end
-    should 'sum correct for scalar' do
-      a = [1, 2, 3].to_numeric
-      assert_equal([11, 12, 13].to_numeric, a + 10)
-    end
-    should 'raise NoMethodError when method requires numeric and vector is object' do
-      @c.type = :object
-      assert_raise(::NoMethodError) { @c.median }
-    end
-    should 'jacknife correctly with named method' do
-      # First example
-      a = [1, 2, 3, 4].to_numeric
-      ds = a.jacknife(:mean)
-      assert_equal(a.mean, ds[:mean].mean)
-      ds = a.jacknife([:mean, :sd])
-      assert_equal(a.mean, ds[:mean].mean)
-      assert_equal(a.sd, ds[:mean].sd)
-    end
-    should 'jacknife correctly with custom method' do
-      # Second example
-      a = [17.23, 18.71, 13.93, 18.81, 15.78, 11.29, 14.91, 13.39, 18.21, 11.57, 14.28, 10.94, 18.83, 15.52, 13.45, 15.25].to_numeric
-      ds = a.jacknife(log_s2: ->(v) {  Math.log(v.variance) })
-      exp = [1.605, 2.972, 1.151, 3.097, 0.998, 3.308, 0.942, 1.393, 2.416, 2.951, 1.043, 3.806, 3.122, 0.958, 1.362, 0.937].to_numeric
-      assert_similar_vector(exp, ds[:log_s2], 0.001)
-      assert_in_delta(2.00389, ds[:log_s2].mean, 0.00001)
-      assert_in_delta(1.091, ds[:log_s2].variance, 0.001)
-    end
-    should 'jacknife correctly with k>1' do
-      a = rnorm(6)
-      ds = a.jacknife(:mean, 2)
-      mean = a.mean
-      exp = [3 * mean - 2 * (a[2] + a[3] + a[4] + a[5]) / 4, 3 * mean - 2 * (a[0] + a[1] + a[4] + a[5]) / 4, 3 * mean - 2 * (a[0] + a[1] + a[2] + a[3]) / 4].to_numeric
-      assert_similar_vector(exp, ds[:mean], 1e-13)
-    end
-    should 'bootstrap should return a vector with mean=mu and sd=se' do
-      a = rnorm(100)
-      ds = a.bootstrap([:mean, :sd], 200)
-      se = 1 / Math.sqrt(a.size)
-      assert_in_delta(0, ds[:mean].mean, 0.3)
-      assert_in_delta(se, ds[:mean].sd, 0.02)
-    end
-  end
-  def test_object
-    assert_equal(@c[1], 5)
-    assert_equal({ 1 => 1, 2 => 1, 3 => 1, 4 => 1, 5 => 5, 6 => 2, 7 => 1, 8 => 1, 9 => 1, 10 => 1 }, @c.frequencies)
-    assert_equal({ 1 => 1, 2 => 1, 3 => 1, 4 => 1, 5 => 5, 6 => 2, 7 => 1, 8 => 1, 9 => 1, 10 => 1 }, @c._frequencies)
-    assert_equal({ 1 => 1.quo(15), 2 => 1.quo(15), 3 => 1.quo(15), 4 => 1.quo(15), 5 => 5.quo(15), 6 => 2.quo(15), 7 => 1.quo(15), 8 => 1.quo(15), 9 => 1.quo(15), 10 => 1.quo(15) }, @c.proportions)
-    assert_equal(@c.proportion, 1.quo(15))
-    assert_equal(@c.proportion(2), 1.quo(15))
-    assert_equal([1, 2, 3, 4, 5, 6, 7, 8, 9, 10], @c.factors.sort)
-    assert_equal(@c.mode, 5)
-    assert_equal(@c.n_valid, 15)
-  end
-  def test_equality
-    v1 = [1, 2, 3].to_vector
-    v2 = [1, 2, 3].to_vector
-    assert_equal(v1, v2)
-    v1 = [1, 2, 3].to_vector(:object)
-    v2 = [1, 2, 3].to_vector(:numeric)
-    assert_not_equal(v1, v2)
-    v2 = [1, 2, 3]
-    assert_not_equal(v1, v2)
-    v1 = [1, 2, 3].to_vector
-    v2 = [1, 2, 3].to_vector
-    assert_equal(v1, v2)
-    assert_equal(false, v1 == Object.new)
-  end
-  def test_vector_percentil
-    a = [1, 2, 2, 3, 4, 5, 5, 5, 6, 10].to_numeric
-    expected = [10, 25, 25, 40, 50, 70, 70, 70, 90, 100].to_numeric
-    assert_equal(expected, a.vector_percentil)
-    a = [1, nil, nil, 2, 2, 3, 4, nil, nil, 5, 5, 5, 6, 10].to_numeric
-    expected = [10, nil, nil, 25, 25, 40, 50, nil, nil, 70, 70, 70, 90, 100].to_numeric
-    assert_equal(expected, a.vector_percentil)
-  end
-  def test_numeric
-    @c.type = :numeric
-    assert_equal(5, @c.median)
-    assert_equal(4, @c.percentil(25))
-    assert_equal(7, @c.percentil(75))
-    v = [200_000, 200_000, 210_000, 220_000, 230_000, 250_000, 250_000, 250_000, 270_000, 300_000, 450_000, 130_000, 140_000, 140_000, 140_000, 145_000, 148_000, 165_000, 170_000, 180_000, 180_000, 180_000, 180_000, 180_000, 180_000].to_numeric
-    assert_equal(180_000, v.median)
-    a = [7.0, 7.0, 7.0, 7.0, 7.0, 8.0, 8.0, 8.0, 9.0, 9.0, 10.0, 10.0, 10.0, 10.0, 10.0, 12.0, 12.0, 13.0, 14.0, 14.0, 2.0, 3.0, 3.0, 3.0, 3.0, 4.0, 4.0, 4.0, 4.0, 4.0, 5.0, 5.0, 5.0, 5.0, 5.0, 5.0, 5.0, 6.0, 6.0, 6.0].to_numeric
-    assert_equal(4.5, a.percentil(25))
-    assert_equal(6.5, a.percentil(50))
-    assert_equal(9.5, a.percentil(75))
-    assert_equal(3.0, a.percentil(10))
-  end
-  def test_linear_percentil_strategy
-    values = [102, 104, 105, 107, 108, 109, 110, 112, 115, 116].shuffle.to_numeric
-    assert_equal 102, values.percentil(0, :linear)
-    assert_equal 104.75, values.percentil(25, :linear)
-    assert_equal 108.5, values.percentil(50, :linear)
-    assert_equal 112.75, values.percentil(75, :linear)
-    assert_equal 116, values.percentil(100, :linear)
-    values = [102, 104, 105, 107, 108, 109, 110, 112, 115, 116, 118].shuffle.to_numeric
-    assert_equal 102, values.percentil(0, :linear)
-    assert_equal 105, values.percentil(25, :linear)
-    assert_equal 109, values.percentil(50, :linear)
-    assert_equal 115, values.percentil(75, :linear)
-    assert_equal 118, values.percentil(100, :linear)
-  end
-  def test_ranked
-    v1 = [0.8, 1.2, 1.2, 2.3, 18].to_vector(:numeric)
-    expected = [1, 2.5, 2.5, 4, 5].to_vector(:numeric)
-    assert_equal(expected, v1.ranked)
-    v1 = [nil, 0.8, 1.2, 1.2, 2.3, 18, nil].to_vector(:numeric)
-    expected = [nil, 1, 2.5, 2.5, 4, 5, nil].to_vector(:numeric)
-    assert_equal(expected, v1.ranked)
-  end
-  def test_numeric
-    a = Statsample::Vector.new([1, 2, 3, 4, 'STRING'], :numeric)
-    assert_equal(10, a.sum)
-    i = 0
-    factors = a.factors.sort
-    [0, 1, 2, 3, 4].each{|v|
-      assert(v == factors[i])
-      assert(v.class == factors[i].class, "#{v} - #{v.class} != #{factors[i]} - #{factors[i].class}")
-      i += 1
-    }
-  end
-  def test_vector_centered
-    mean = rand
-    samples = 11
-    centered = samples.times.map { |i| i - ((samples / 2).floor).to_i }.to_numeric
-    not_centered = centered.recode { |v| v + mean }
-    obs = not_centered.centered
-    centered.each_with_index do |v, i|
-      assert_in_delta(v, obs[i], 0.0001)
-    end
-  end
-  def test_vector_standarized
-    v1 = [1, 2, 3, 4, nil].to_vector(:numeric)
-    sds = v1.sds
-    expected = [((1 - 2.5).quo(sds)), ((2 - 2.5).quo(sds)), ((3 - 2.5).quo(sds)), ((4 - 2.5).quo(sds)), nil].to_vector(:numeric)
-    vs = v1.vector_standarized
-    assert_equal(expected, vs)
-    assert_equal(0, vs.mean)
-    assert_equal(1, vs.sds)
-  end
-  def test_vector_standarized_with_zero_variance
-    v1 = 100.times.map { |_i| 1 }.to_numeric
-    exp = 100.times.map { nil }.to_numeric
-    assert_equal(exp, v1.standarized)
-  end
-  def test_check_type
-    v = Statsample::Vector.new
-    v.type = :object
-    assert_raise(NoMethodError) { v.check_type(:numeric) }
-    assert(v.check_type(:object).nil?)
-    v.type = :numeric
-    assert(v.check_type(:numeric).nil?)
-    assert(v.check_type(:object).nil?)
+    should "show a warning when initializing with :nominal, :numeric or :ordinal" do
+      assert_output(nil,"WARNING: Statsample::Dataset and Statsample::Vector have been deprecated in favor of Daru::DataFrame and Daru::Vector. Please switch to using that.\nWARNING: nominal has been deprecated.\n") do
+        Statsample::Vector.new [1,2,3,4,5,nil,'hello'], :nominal
+      end
-    v.type = :date
-    assert_raise(NoMethodError) { v.check_type(:numeric) }
-    assert_raise(NoMethodError) { v.check_type(:numeric) }
-    assert_raise(NoMethodError) { v.check_type(:object) }
-end
+      assert_output(nil,"WARNING: Statsample::Dataset and Statsample::Vector have been deprecated in favor of Daru::DataFrame and Daru::Vector. Please switch to using that.\nWARNING: scale has been deprecated.\n") do
+        Statsample::Vector.new [1,2,3,4,nil,5], :scale
+      end
-  def test_add
-    a = Statsample::Vector.new([1, 2, 3, 4, 5], :numeric)
-    b = Statsample::Vector.new([11, 12, 13, 14, 15], :numeric)
-    assert_equal([3, 4, 5, 6, 7], (a + 2).to_a)
-    assert_equal([12, 14, 16, 18, 20], (a + b).to_a)
-    assert_raise ArgumentError do
-      a + @c
-    end
-    assert_raise TypeError do
-      a + 'string'
-    end
-    a = Statsample::Vector.new([nil, 1, 2, 3, 4, 5], :numeric)
-    b = Statsample::Vector.new([11, 12, nil, 13, 14, 15], :numeric)
-    assert_equal([nil, 13, nil, 16, 18, 20], (a + b).to_a)
-    assert_equal([nil, 13, nil, 16, 18, 20], (a + b.to_a).to_a)
-  end
+      assert_output(nil,"WARNING: Statsample::Dataset and Statsample::Vector have been deprecated in favor of Daru::DataFrame and Daru::Vector. Please switch to using that.\nWARNING: ordinal has been deprecated.\n") do
+        Statsample::Vector.new [1,2,3,4,5], :ordinal
+      end
-  def test_minus
-    a = Statsample::Vector.new([1, 2, 3, 4, 5], :numeric)
-    b = Statsample::Vector.new([11, 12, 13, 14, 15], :numeric)
-    assert_equal([-1, 0, 1, 2, 3], (a - 2).to_a)
-    assert_equal([10, 10, 10, 10, 10], (b - a).to_a)
-    assert_raise ArgumentError do
-      a - @c
-    end
-    assert_raise TypeError do
-      a - 'string'
+      assert_output(nil,"WARNING: Statsample::Dataset and Statsample::Vector have been deprecated in favor of Daru::DataFrame and Daru::Vector. Please switch to using that.\n") do
+        Statsample::Vector.new_scale 10, 1
+      end
     end
-    a = Statsample::Vector.new([nil, 1, 2, 3, 4, 5], :numeric)
-    b = Statsample::Vector.new([11, 12, nil, 13, 14, 15], :numeric)
-    assert_equal([nil, 11, nil, 10, 10, 10], (b - a).to_a)
-    assert_equal([nil, 11, nil, 10, 10, 10], (b - a.to_a).to_a)
-  end
-  def test_sum_of_squares
-    a = [1, 2, 3, 4, 5, 6].to_vector(:numeric)
-    assert_equal(17.5, a.sum_of_squared_deviation)
-  end
+    should "show a warning when Statsample::Vector shorthands are used" do
+      numeric = Statsample::Vector.new([1,2,3,4,nil,5], :numeric)
+      assert_equal(numeric, [1,2,3,4,nil,5].to_numeric)
+      assert_equal(numeric, [1,2,3,4,nil,5].to_vector(:numeric))
-  def test_average_deviation
-    a = [1, 2, 3, 4, 5, 6, 7, 8, 9].to_numeric
-    assert_equal(20.quo(9), a.average_deviation_population)
-  end
-  def test_samples
-    srand(1)
-    assert_equal(100, @c.sample_with_replacement(100).size)
-    assert_equal(@c.valid_data.to_a.sort, @c.sample_without_replacement(15).sort)
-    assert_raise ArgumentError do
-      @c.sample_without_replacement(20)
+      obj = Statsample::Vector.new([1,2,3,4,'one','two'], :object)
+      assert_equal(obj, [1,2,3,4,'one','two'].to_vector(:object))
     end
-    @c.type = :numeric
-    srand(1)
-    assert_equal(100, @c.sample_with_replacement(100).size)
-    assert_equal(@c.valid_data.to_a.sort, @c.sample_without_replacement(15).sort)
-  end
-  def test_valid_data
-    a = Statsample::Vector.new([1, 2, 3, 4, 'STRING'])
-    a.missing_values = [-99]
-    a.add(1, false)
-    a.add(2, false)
-    a.add(-99, false)
-    a.set_valid_data
-    exp_valid_data = [1, 2, 3, 4, 'STRING', 1, 2]
-    assert_equal(exp_valid_data, a.valid_data)
-    a.add(20, false)
-    a.add(30, false)
-    assert_equal(exp_valid_data, a.valid_data)
-    a.set_valid_data
-    exp_valid_data_2 = [1, 2, 3, 4, 'STRING', 1, 2, 20, 30]
-    assert_equal(exp_valid_data_2, a.valid_data)
-  end
-  def test_set_value
-    @c[2] = 10
-    expected = [5, 5, 10, 5, 5, 6, 6, 7, 8, 9, 10, 1, 2, 3, 4, nil, -99, -99].to_vector
-    assert_equal(expected.data, @c.data)
-  end
-  def test_gsl
-    if Statsample.has_gsl?
-      a = Statsample::Vector.new([1, 2, 3, 4, 'STRING'], :numeric)
-      assert_equal(2, a.mean)
-      assert_equal(a.variance_sample_ruby, a.variance_sample)
-      assert_equal(a.standard_deviation_sample_ruby, a.sds)
-      assert_equal(a.variance_population_ruby, a.variance_population)
-      assert_equal(a.standard_deviation_population_ruby, a.standard_deviation_population)
-      assert_nothing_raised do
-        a = [].to_vector(:numeric)
+    should "test that old shorthands show deprecation warnings" do
+      assert_output(nil,"WARNING: Statsample::Dataset and Statsample::Vector have been deprecated in favor of Daru::DataFrame and Daru::Vector. Please switch to using that.\n") do
+        [1,2,3,4,nil,5].to_scale
       end
-      a.add(1, false)
-      a.add(2, false)
-      a.set_valid_data
-      assert_equal(3, a.sum)
-      b = [1, 2, nil, 3, 4, 5, nil, 6].to_vector(:numeric)
-      assert_equal(21, b.sum)
-      assert_equal(3.5, b.mean)
-      assert_equal(6, b.gsl.size)
-      c = [10, 20, 30, 40, 50, 100, 1000, 2000, 5000].to_numeric
-      assert_in_delta(c.skew,     c.skew_ruby, 0.0001)
-      assert_in_delta(c.kurtosis, c.kurtosis_ruby, 0.0001)
     end
   end
-  def test_vector_matrix
-    v1 = %w(a a a b b b c c).to_vector
-    v2 = %w(1 3 4 5 6 4 3 2).to_vector
-    v3 = %w(1 0 0 0 1 1 1 0).to_vector
-    ex = Matrix.rows([%w(a 1 1), %w(a 3 0), %w(a 4 0), %w(b 5 0), %w(b 6 1), %w(b 4 1), %w(c 3 1), %w(c 2 0)])
-    assert_equal(ex, Statsample.vector_cols_matrix(v1, v2, v3))
-  end
-  def test_marshalling
-    v1 = (0..100).to_a.collect { |_n| rand(100) }.to_vector(:numeric)
-    v2 = Marshal.load(Marshal.dump(v1))
-    assert_equal(v1, v2)
-  end
-  def test_dup
-    v1 = %w(a a a b b b c c).to_vector
-    v2 = v1.dup
-    assert_equal(v1.data, v2.data)
-    assert_not_same(v1.data, v2.data)
-    assert_equal(v1.type, v2.type)
-    v1.type = :numeric
-    assert_not_equal(v1.type, v2.type)
-    assert_equal(v1.missing_values, v2.missing_values)
-    assert_not_same(v1.missing_values, v2.missing_values)
-    assert_equal(v1.labels, v2.labels)
-    assert_not_same(v1.labels, v2.labels)
-    v3 = v1.dup_empty
-    assert_equal([], v3.data)
-    assert_not_equal(v1.data, v3.data)
-    assert_not_same(v1.data, v3.data)
-    assert_equal(v1.type, v3.type)
-    v1.type = :numeric
-    v3.type = :object
-    assert_not_equal(v1.type, v3.type)
-    assert_equal(v1.missing_values, v3.missing_values)
-    assert_not_same(v1.missing_values, v3.missing_values)
-    assert_equal(v1.labels, v3.labels)
-    assert_not_same(v1.labels, v3.labels)
-  end
-  def test_paired_ties
-    a = [0, 0, 0, 1, 1, 2, 3, 3, 4, 4, 4].to_vector(:numeric)
-    expected = [2, 2, 2, 4.5, 4.5, 6, 7.5, 7.5, 10, 10, 10].to_vector(:numeric)
-    assert_equal(expected, a.ranked)
-  end
-  def test_dichotomize
-    a = [0, 0, 0, 1, 2, 3, nil].to_vector
-    exp = [0, 0, 0, 1, 1, 1, nil].to_numeric
-    assert_equal(exp, a.dichotomize)
-    a = [1, 1, 1, 2, 2, 2, 3].to_vector
-    exp = [0, 0, 0, 1, 1, 1, 1].to_numeric
-    assert_equal(exp, a.dichotomize)
-    a = [0, 0, 0, 1, 2, 3, nil].to_vector
-    exp = [0, 0, 0, 0, 1, 1, nil].to_numeric
-    assert_equal(exp, a.dichotomize(1))
-    a = %w(a a a b c d).to_vector
-    exp = [0, 0, 0, 1, 1, 1].to_numeric
-    assert_equal(exp, a.dichotomize)
-  end
-  def test_can_be_methods
-    a = [0, 0, 0, 1, 2, 3, nil].to_vector
-    assert(a.can_be_numeric?)
-    a = [0, 's', 0, 1, 2, 3, nil].to_vector
-    assert(!a.can_be_numeric?)
-    a.missing_values = ['s']
-    assert(a.can_be_numeric?)
-    a = [Date.new(2009, 10, 10), Date.today, '2009-10-10', '2009-1-1', nil, 'NOW'].to_vector
-    assert(a.can_be_date?)
-    a = [Date.new(2009, 10, 10), Date.today, nil, 'sss'].to_vector
-    assert(!a.can_be_date?)
-  end
-  def test_date_vector
-    a = [Date.new(2009, 10, 10), :NOW, '2009-10-10', '2009-1-1', nil, 'NOW', 'MISSING'].to_vector(:date, missing_values: ['MISSING'])
-    assert(a.type == :date)
-    expected = [Date.new(2009, 10, 10), Date.today, Date.new(2009, 10, 10), Date.new(2009, 1, 1), nil, Date.today, nil]
-    assert_equal(expected, a.date_data_with_nils)
+  should 'return correct histogram' do
+    a = Daru::Vector.new(10.times.map { |v| v })
+    hist = a.histogram(2)
+    assert_equal([5, 5], hist.bin)
+    3.times do |i|
+      assert_in_delta(i * 4.5, hist.get_range(i)[0], 1e-9)
+    end
   end
 end