eps 0.3.7 → 0.4.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/CHANGELOG.md +14 -0
- data/LICENSE.txt +1 -1
- data/README.md +2 -2
- data/lib/eps/data_frame.rb +6 -3
- data/lib/eps/lightgbm.rb +1 -1
- data/lib/eps/linear_regression.rb +5 -28
- data/lib/eps/pmml/loader.rb +1 -1
- data/lib/eps/version.rb +1 -1
- metadata +5 -89
checksums.yaml
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
---
|
2
2
|
SHA256:
|
3
|
-
metadata.gz:
|
4
|
-
data.tar.gz:
|
3
|
+
metadata.gz: ed82418a666490dc6683d0b1258c2dbc7451d86e9421bc5e1581a216e9b48a6f
|
4
|
+
data.tar.gz: d725f5e8f826f6e875aa06811a2d6cbf1fcbffd32073324eb43b32d6e99040eb
|
5
5
|
SHA512:
|
6
|
-
metadata.gz:
|
7
|
-
data.tar.gz:
|
6
|
+
metadata.gz: e3a8e472c998061e3a493ea2b2762a12747bac71d5544ca818bf69f50ac5e4c12cd7a2e0c5a8b767667c92238bbda54e7ef800f740210088fc982bfa84afa7a2
|
7
|
+
data.tar.gz: 2cdb0dda86b60c80a4a7fc4ad0fabafab71e57cfef8cdef349a190da4501e3105c1032b68f64c4196c99df1157da1a068d3bf6831b129b1544f925e371d924da
|
data/CHANGELOG.md
CHANGED
@@ -1,3 +1,17 @@
|
|
1
|
+
## 0.4.0 (2022-09-02)
|
2
|
+
|
3
|
+
- Fixed `stack level too deep` error with many rows
|
4
|
+
- Dropped support for `gsl` gem (use `gslr` instead)
|
5
|
+
- Dropped support for Ruby < 2.7
|
6
|
+
|
7
|
+
## 0.3.9 (2021-10-14)
|
8
|
+
|
9
|
+
- Fixed error with `lessOrEqual` operator
|
10
|
+
|
11
|
+
## 0.3.8 (2021-02-08)
|
12
|
+
|
13
|
+
- Fixed error with categorical and text features
|
14
|
+
|
1
15
|
## 0.3.7 (2020-11-23)
|
2
16
|
|
3
17
|
- Fixed error with LightGBM summary
|
data/LICENSE.txt
CHANGED
data/README.md
CHANGED
@@ -14,7 +14,7 @@ Check out [this post](https://ankane.org/rails-meet-data-science) for more info
|
|
14
14
|
Add this line to your application’s Gemfile:
|
15
15
|
|
16
16
|
```ruby
|
17
|
-
gem
|
17
|
+
gem "eps"
|
18
18
|
```
|
19
19
|
|
20
20
|
On Mac, also install OpenMP:
|
@@ -388,7 +388,7 @@ brew install gsl
|
|
388
388
|
Then, add this line to your application’s Gemfile:
|
389
389
|
|
390
390
|
```ruby
|
391
|
-
gem
|
391
|
+
gem "gslr", group: :development
|
392
392
|
```
|
393
393
|
|
394
394
|
It only needs to be available in environments used to build the model.
|
data/lib/eps/data_frame.rb
CHANGED
@@ -85,6 +85,8 @@ module Eps
|
|
85
85
|
finish -= 1 if rows.exclude_end?
|
86
86
|
rows = Range.new(rows.begin, size - 1) if finish >= size - 1
|
87
87
|
end
|
88
|
+
elsif rows.is_a?(Integer)
|
89
|
+
rows = [rows]
|
88
90
|
end
|
89
91
|
|
90
92
|
if cols
|
@@ -118,10 +120,11 @@ module Eps
|
|
118
120
|
cols.each do |c|
|
119
121
|
raise "Undefined column: #{c}" unless columns.include?(c)
|
120
122
|
|
121
|
-
|
123
|
+
col = columns[c]
|
124
|
+
df.columns[c] = rows.map { |i| col[i] }
|
122
125
|
end
|
123
|
-
df.label =
|
124
|
-
df.weight =
|
126
|
+
df.label = rows.map { |i| label[i] } if label
|
127
|
+
df.weight = rows.map { |i| weight[i] } if weight
|
125
128
|
|
126
129
|
singular ? df.columns[cols[0]] : df
|
127
130
|
end
|
data/lib/eps/lightgbm.rb
CHANGED
@@ -71,7 +71,7 @@ module Eps
|
|
71
71
|
end
|
72
72
|
|
73
73
|
# create datasets
|
74
|
-
categorical_idx =
|
74
|
+
categorical_idx = train_set.columns.keys.map.with_index.select { |k, _| @features[k] == "categorical" }.map(&:last)
|
75
75
|
train_ds = ::LightGBM::Dataset.new(train_set.map_rows(&:to_a), label: train_set.label, weight: train_set.weight, categorical_feature: categorical_idx, params: params)
|
76
76
|
validation_ds = ::LightGBM::Dataset.new(validation_set.map_rows(&:to_a), label: validation_set.label, weight: validation_set.weight, categorical_feature: categorical_idx, params: params, reference: train_ds) if validation_set
|
77
77
|
|
data/lib/eps/linear_regression.rb
CHANGED
@@ -37,8 +37,7 @@ module Eps
|
|
37
37
|
str
|
38
38
|
end
|
39
39
|
|
40
|
-
|
41
|
-
def _train(**options)
|
40
|
+
def _train(intercept: true, gsl: nil)
|
42
41
|
raise "Target must be numeric" if @target_type != "numeric"
|
43
42
|
check_missing_value(@train_set)
|
44
43
|
check_missing_value(@validation_set) if @validation_set
|
@@ -51,26 +50,16 @@ module Eps
|
|
51
50
|
|
52
51
|
x = data.map_rows(&:to_a)
|
53
52
|
|
54
|
-
gsl =
|
55
|
-
if options.key?(:gsl)
|
56
|
-
options[:gsl]
|
57
|
-
elsif defined?(GSL)
|
58
|
-
true
|
59
|
-
elsif defined?(GSLR)
|
60
|
-
:gslr
|
61
|
-
else
|
62
|
-
false
|
63
|
-
end
|
53
|
+
gsl = defined?(GSLR) if gsl.nil?
|
64
54
|
|
65
|
-
|
66
|
-
if intercept && gsl != :gslr
|
55
|
+
if intercept && !gsl
|
67
56
|
data.size.times do |i|
|
68
57
|
x[i].unshift(1)
|
69
58
|
end
|
70
59
|
end
|
71
60
|
|
72
61
|
v3 =
|
73
|
-
if gsl == :gslr
|
62
|
+
if gsl
|
74
63
|
model = GSLR::OLS.new(intercept: intercept)
|
75
64
|
model.fit(x, data.label, weight: data.weight)
|
76
65
|
|
@@ -79,12 +68,6 @@ module Eps
|
|
79
68
|
coefficients = model.coefficients.dup
|
80
69
|
coefficients.unshift(model.intercept) if intercept
|
81
70
|
coefficients
|
82
|
-
elsif gsl
|
83
|
-
x = GSL::Matrix.alloc(*x)
|
84
|
-
y = GSL::Vector.alloc(data.label)
|
85
|
-
w = GSL::Vector.alloc(data.weight) if data.weight
|
86
|
-
c, @covariance, _, _ = w ? GSL::MultiFit.wlinear(x, w, y) : GSL::MultiFit.linear(x, y)
|
87
|
-
c.to_a
|
88
71
|
else
|
89
72
|
x = Matrix.rows(x)
|
90
73
|
y = Matrix.column_vector(data.label)
|
@@ -195,13 +178,7 @@ module Eps
|
|
195
178
|
def p_value
|
196
179
|
@p_value ||= begin
|
197
180
|
Hash[@coefficients.map do |k, _|
|
198
|
-
tp =
|
199
|
-
if @gsl
|
200
|
-
GSL::Cdf.tdist_P(t_value[k].abs, degrees_of_freedom)
|
201
|
-
else
|
202
|
-
Eps::Statistics.tdist_p(t_value[k].abs, degrees_of_freedom)
|
203
|
-
end
|
204
|
-
|
181
|
+
tp = Eps::Statistics.tdist_p(t_value[k].abs, degrees_of_freedom)
|
205
182
|
[k, 2 * (1 - tp)]
|
206
183
|
end]
|
207
184
|
end
|
data/lib/eps/pmml/loader.rb
CHANGED
@@ -222,7 +222,7 @@ module Eps
|
|
222
222
|
else
|
223
223
|
operator = xml_predicate.attribute("operator").value
|
224
224
|
value = xml_predicate.attribute("value").value
|
225
|
-
value = value.to_f if operator == "greaterThan"
|
225
|
+
value = value.to_f if operator == "greaterThan" || operator == "lessOrEqual"
|
226
226
|
field = xml_predicate.attribute("field").value
|
227
227
|
field = derived_fields[field] if derived_fields[field]
|
228
228
|
{
|
data/lib/eps/version.rb
CHANGED
metadata
CHANGED
@@ -1,14 +1,14 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: eps
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 0.3.7
|
4
|
+
version: 0.4.0
|
5
5
|
platform: ruby
|
6
6
|
authors:
|
7
7
|
- Andrew Kane
|
8
8
|
autorequire:
|
9
9
|
bindir: bin
|
10
10
|
cert_chain: []
|
11
|
-
date:
|
11
|
+
date: 2022-09-02 00:00:00.000000000 Z
|
12
12
|
dependencies:
|
13
13
|
- !ruby/object:Gem::Dependency
|
14
14
|
name: lightgbm
|
@@ -38,92 +38,8 @@ dependencies:
|
|
38
38
|
- - ">="
|
39
39
|
- !ruby/object:Gem::Version
|
40
40
|
version: '0'
|
41
|
-
- !ruby/object:Gem::Dependency
|
42
|
-
name: bundler
|
43
|
-
requirement: !ruby/object:Gem::Requirement
|
44
|
-
requirements:
|
45
|
-
- - ">="
|
46
|
-
- !ruby/object:Gem::Version
|
47
|
-
version: '0'
|
48
|
-
type: :development
|
49
|
-
prerelease: false
|
50
|
-
version_requirements: !ruby/object:Gem::Requirement
|
51
|
-
requirements:
|
52
|
-
- - ">="
|
53
|
-
- !ruby/object:Gem::Version
|
54
|
-
version: '0'
|
55
|
-
- !ruby/object:Gem::Dependency
|
56
|
-
name: daru
|
57
|
-
requirement: !ruby/object:Gem::Requirement
|
58
|
-
requirements:
|
59
|
-
- - ">="
|
60
|
-
- !ruby/object:Gem::Version
|
61
|
-
version: '0'
|
62
|
-
type: :development
|
63
|
-
prerelease: false
|
64
|
-
version_requirements: !ruby/object:Gem::Requirement
|
65
|
-
requirements:
|
66
|
-
- - ">="
|
67
|
-
- !ruby/object:Gem::Version
|
68
|
-
version: '0'
|
69
|
-
- !ruby/object:Gem::Dependency
|
70
|
-
name: minitest
|
71
|
-
requirement: !ruby/object:Gem::Requirement
|
72
|
-
requirements:
|
73
|
-
- - ">="
|
74
|
-
- !ruby/object:Gem::Version
|
75
|
-
version: '0'
|
76
|
-
type: :development
|
77
|
-
prerelease: false
|
78
|
-
version_requirements: !ruby/object:Gem::Requirement
|
79
|
-
requirements:
|
80
|
-
- - ">="
|
81
|
-
- !ruby/object:Gem::Version
|
82
|
-
version: '0'
|
83
|
-
- !ruby/object:Gem::Dependency
|
84
|
-
name: numo-narray
|
85
|
-
requirement: !ruby/object:Gem::Requirement
|
86
|
-
requirements:
|
87
|
-
- - ">="
|
88
|
-
- !ruby/object:Gem::Version
|
89
|
-
version: '0'
|
90
|
-
type: :development
|
91
|
-
prerelease: false
|
92
|
-
version_requirements: !ruby/object:Gem::Requirement
|
93
|
-
requirements:
|
94
|
-
- - ">="
|
95
|
-
- !ruby/object:Gem::Version
|
96
|
-
version: '0'
|
97
|
-
- !ruby/object:Gem::Dependency
|
98
|
-
name: rake
|
99
|
-
requirement: !ruby/object:Gem::Requirement
|
100
|
-
requirements:
|
101
|
-
- - ">="
|
102
|
-
- !ruby/object:Gem::Version
|
103
|
-
version: '0'
|
104
|
-
type: :development
|
105
|
-
prerelease: false
|
106
|
-
version_requirements: !ruby/object:Gem::Requirement
|
107
|
-
requirements:
|
108
|
-
- - ">="
|
109
|
-
- !ruby/object:Gem::Version
|
110
|
-
version: '0'
|
111
|
-
- !ruby/object:Gem::Dependency
|
112
|
-
name: rover-df
|
113
|
-
requirement: !ruby/object:Gem::Requirement
|
114
|
-
requirements:
|
115
|
-
- - ">="
|
116
|
-
- !ruby/object:Gem::Version
|
117
|
-
version: '0'
|
118
|
-
type: :development
|
119
|
-
prerelease: false
|
120
|
-
version_requirements: !ruby/object:Gem::Requirement
|
121
|
-
requirements:
|
122
|
-
- - ">="
|
123
|
-
- !ruby/object:Gem::Version
|
124
|
-
version: '0'
|
125
41
|
description:
|
126
|
-
email: andrew@
|
42
|
+
email: andrew@ankane.org
|
127
43
|
executables: []
|
128
44
|
extensions: []
|
129
45
|
extra_rdoc_files: []
|
@@ -164,14 +80,14 @@ required_ruby_version: !ruby/object:Gem::Requirement
|
|
164
80
|
requirements:
|
165
81
|
- - ">="
|
166
82
|
- !ruby/object:Gem::Version
|
167
|
-
version: '2.
|
83
|
+
version: '2.7'
|
168
84
|
required_rubygems_version: !ruby/object:Gem::Requirement
|
169
85
|
requirements:
|
170
86
|
- - ">="
|
171
87
|
- !ruby/object:Gem::Version
|
172
88
|
version: '0'
|
173
89
|
requirements: []
|
174
|
-
rubygems_version: 3.
|
90
|
+
rubygems_version: 3.3.7
|
175
91
|
signing_key:
|
176
92
|
specification_version: 4
|
177
93
|
summary: Machine learning for Ruby. Supports regression (linear regression) and classification
|