classifier 2.1.0 → 2.3.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/README.md +70 -199
- data/exe/classifier +9 -0
- data/ext/classifier/classifier_ext.c +1 -0
- data/ext/classifier/incremental_svd.c +393 -0
- data/ext/classifier/linalg.h +8 -0
- data/lib/classifier/bayes.rb +177 -53
- data/lib/classifier/cli.rb +880 -0
- data/lib/classifier/errors.rb +3 -0
- data/lib/classifier/knn.rb +351 -0
- data/lib/classifier/logistic_regression.rb +593 -0
- data/lib/classifier/lsi/incremental_svd.rb +166 -0
- data/lib/classifier/lsi/summary.rb +25 -5
- data/lib/classifier/lsi.rb +365 -17
- data/lib/classifier/streaming/line_reader.rb +99 -0
- data/lib/classifier/streaming/progress.rb +96 -0
- data/lib/classifier/streaming.rb +122 -0
- data/lib/classifier/tfidf.rb +408 -0
- data/lib/classifier/version.rb +3 -0
- data/lib/classifier.rb +5 -0
- data/sig/classifier.rbs +3 -0
- data/sig/vendor/json.rbs +1 -0
- data/sig/vendor/matrix.rbs +25 -14
- data/sig/vendor/optparse.rbs +19 -0
- data/sig/vendor/streaming.rbs +14 -0
- metadata +39 -6
metadata
CHANGED
|
@@ -1,11 +1,11 @@
|
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
|
2
2
|
name: classifier
|
|
3
3
|
version: !ruby/object:Gem::Version
|
|
4
|
-
version: 2.1.0
|
|
4
|
+
version: 2.3.0
|
|
5
5
|
platform: ruby
|
|
6
6
|
authors:
|
|
7
7
|
- Lucas Carlson
|
|
8
|
-
bindir:
|
|
8
|
+
bindir: exe
|
|
9
9
|
cert_chain: []
|
|
10
10
|
date: 1980-01-02 00:00:00.000000000 Z
|
|
11
11
|
dependencies:
|
|
@@ -121,9 +121,27 @@ dependencies:
|
|
|
121
121
|
- - ">="
|
|
122
122
|
- !ruby/object:Gem::Version
|
|
123
123
|
version: '0'
|
|
124
|
-
|
|
124
|
+
- !ruby/object:Gem::Dependency
|
|
125
|
+
name: webmock
|
|
126
|
+
requirement: !ruby/object:Gem::Requirement
|
|
127
|
+
requirements:
|
|
128
|
+
- - ">="
|
|
129
|
+
- !ruby/object:Gem::Version
|
|
130
|
+
version: '0'
|
|
131
|
+
type: :development
|
|
132
|
+
prerelease: false
|
|
133
|
+
version_requirements: !ruby/object:Gem::Requirement
|
|
134
|
+
requirements:
|
|
135
|
+
- - ">="
|
|
136
|
+
- !ruby/object:Gem::Version
|
|
137
|
+
version: '0'
|
|
138
|
+
description: A Ruby library for text classification featuring Naive Bayes, LSI (Latent
|
|
139
|
+
Semantic Indexing), Logistic Regression, and k-Nearest Neighbors classifiers. Includes
|
|
140
|
+
TF-IDF vectorization, streaming/incremental training, pluggable persistence backends,
|
|
141
|
+
thread safety, and a native C extension for fast LSI operations.
|
|
125
142
|
email: lucas@rufy.com
|
|
126
|
-
executables:
|
|
143
|
+
executables:
|
|
144
|
+
- classifier
|
|
127
145
|
extensions:
|
|
128
146
|
- ext/classifier/extconf.rb
|
|
129
147
|
extra_rdoc_files: []
|
|
@@ -133,31 +151,45 @@ files:
|
|
|
133
151
|
- README.md
|
|
134
152
|
- bin/bayes.rb
|
|
135
153
|
- bin/summarize.rb
|
|
154
|
+
- exe/classifier
|
|
136
155
|
- ext/classifier/classifier_ext.c
|
|
137
156
|
- ext/classifier/extconf.rb
|
|
157
|
+
- ext/classifier/incremental_svd.c
|
|
138
158
|
- ext/classifier/linalg.h
|
|
139
159
|
- ext/classifier/matrix.c
|
|
140
160
|
- ext/classifier/svd.c
|
|
141
161
|
- ext/classifier/vector.c
|
|
142
162
|
- lib/classifier.rb
|
|
143
163
|
- lib/classifier/bayes.rb
|
|
164
|
+
- lib/classifier/cli.rb
|
|
144
165
|
- lib/classifier/errors.rb
|
|
145
166
|
- lib/classifier/extensions/string.rb
|
|
146
167
|
- lib/classifier/extensions/vector.rb
|
|
147
168
|
- lib/classifier/extensions/word_hash.rb
|
|
169
|
+
- lib/classifier/knn.rb
|
|
170
|
+
- lib/classifier/logistic_regression.rb
|
|
148
171
|
- lib/classifier/lsi.rb
|
|
149
172
|
- lib/classifier/lsi/content_node.rb
|
|
173
|
+
- lib/classifier/lsi/incremental_svd.rb
|
|
150
174
|
- lib/classifier/lsi/summary.rb
|
|
151
175
|
- lib/classifier/lsi/word_list.rb
|
|
152
176
|
- lib/classifier/storage.rb
|
|
153
177
|
- lib/classifier/storage/base.rb
|
|
154
178
|
- lib/classifier/storage/file.rb
|
|
155
179
|
- lib/classifier/storage/memory.rb
|
|
180
|
+
- lib/classifier/streaming.rb
|
|
181
|
+
- lib/classifier/streaming/line_reader.rb
|
|
182
|
+
- lib/classifier/streaming/progress.rb
|
|
183
|
+
- lib/classifier/tfidf.rb
|
|
184
|
+
- lib/classifier/version.rb
|
|
185
|
+
- sig/classifier.rbs
|
|
156
186
|
- sig/vendor/fast_stemmer.rbs
|
|
157
187
|
- sig/vendor/gsl.rbs
|
|
158
188
|
- sig/vendor/json.rbs
|
|
159
189
|
- sig/vendor/matrix.rbs
|
|
160
190
|
- sig/vendor/mutex_m.rbs
|
|
191
|
+
- sig/vendor/optparse.rbs
|
|
192
|
+
- sig/vendor/streaming.rbs
|
|
161
193
|
- test/test_helper.rb
|
|
162
194
|
homepage: https://rubyclassifier.com
|
|
163
195
|
licenses:
|
|
@@ -174,7 +206,7 @@ required_ruby_version: !ruby/object:Gem::Requirement
|
|
|
174
206
|
requirements:
|
|
175
207
|
- - ">="
|
|
176
208
|
- !ruby/object:Gem::Version
|
|
177
|
-
version: '
|
|
209
|
+
version: '3.1'
|
|
178
210
|
required_rubygems_version: !ruby/object:Gem::Requirement
|
|
179
211
|
requirements:
|
|
180
212
|
- - ">="
|
|
@@ -183,5 +215,6 @@ required_rubygems_version: !ruby/object:Gem::Requirement
|
|
|
183
215
|
requirements: []
|
|
184
216
|
rubygems_version: 4.0.3
|
|
185
217
|
specification_version: 4
|
|
186
|
-
summary:
|
|
218
|
+
summary: Text classification with Bayesian, LSI, Logistic Regression, kNN, and TF-IDF
|
|
219
|
+
vectorization.
|
|
187
220
|
test_files: []
|