fast_bayes 1.0.1 → 1.1.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/.travis.yml +10 -2
- data/README.md +16 -3
- data/benchmarks/bench.rb +46 -0
- data/bin/setup +1 -2
- data/ext/Makefile +1 -1
- data/ext/fast_bayes/Makefile +6 -6
- data/ext/fast_bayes/bayes.h +35 -24
- data/ext/fast_bayes/extconf.rb +2 -0
- data/ext/fast_bayes/stopwords.h +23 -0
- data/ext/fast_bayes/stopwords/en +174 -0
- data/ext/test/classification_test.cpp +5 -5
- data/ext/test/data/r8-test-all-terms.txt +2189 -0
- data/ext/test/data/r8-train-all-terms.txt +5485 -0
- data/fast_bayes.gemspec +1 -0
- data/lib/fast_bayes.rb +20 -2
- data/lib/fast_bayes/version.rb +1 -1
- metadata +27 -2
data/fast_bayes.gemspec
CHANGED
@@ -23,6 +23,7 @@ Gem::Specification.new do |spec|
|
|
23
23
|
spec.require_paths = ["lib"]
|
24
24
|
|
25
25
|
spec.add_runtime_dependency 'rice', '~> 2.1', '>= 2.1.0'
|
26
|
+
spec.add_runtime_dependency 'fast-stemmer', '~> 1.0', '>= 1.0.0'
|
26
27
|
|
27
28
|
spec.add_development_dependency "bundler", "~> 1.13"
|
28
29
|
spec.add_development_dependency "rake", "~> 10.0"
|
data/lib/fast_bayes.rb
CHANGED
@@ -1,7 +1,25 @@
|
|
1
1
|
require "fast_bayes/version"
|
2
|
+
require 'fast-stemmer'
|
3
|
+
require "fast_bayes/fast_bayes"
|
2
4
|
|
3
5
|
class FastBayes
|
4
6
|
|
5
|
-
|
7
|
+
# Stem all words, this is a lot slower (TODO this fast)
|
8
|
+
def observe_better(data, label)
|
9
|
+
newdata = ""
|
10
|
+
data.split(" ").each do |i|
|
11
|
+
newdata += (i.stem + " ")
|
12
|
+
end
|
13
|
+
observe(newdata, label)
|
14
|
+
end
|
6
15
|
|
7
|
-
|
16
|
+
# Stem all words, this is a lot slower (TODO this fast)
|
17
|
+
def classify_better(data)
|
18
|
+
newdata = ""
|
19
|
+
data.split(" ").each do |i|
|
20
|
+
newdata += (i.stem + " ")
|
21
|
+
end
|
22
|
+
classify(newdata)
|
23
|
+
end
|
24
|
+
|
25
|
+
end
|
data/lib/fast_bayes/version.rb
CHANGED
metadata
CHANGED
@@ -1,14 +1,14 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: fast_bayes
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 1.0.1
|
4
|
+
version: 1.1.0
|
5
5
|
platform: ruby
|
6
6
|
authors:
|
7
7
|
- Chang Rajani
|
8
8
|
autorequire:
|
9
9
|
bindir: exe
|
10
10
|
cert_chain: []
|
11
|
-
date: 2016-12-
|
11
|
+
date: 2016-12-04 00:00:00.000000000 Z
|
12
12
|
dependencies:
|
13
13
|
- !ruby/object:Gem::Dependency
|
14
14
|
name: rice
|
@@ -30,6 +30,26 @@ dependencies:
|
|
30
30
|
- - ">="
|
31
31
|
- !ruby/object:Gem::Version
|
32
32
|
version: 2.1.0
|
33
|
+
- !ruby/object:Gem::Dependency
|
34
|
+
name: fast-stemmer
|
35
|
+
requirement: !ruby/object:Gem::Requirement
|
36
|
+
requirements:
|
37
|
+
- - "~>"
|
38
|
+
- !ruby/object:Gem::Version
|
39
|
+
version: '1.0'
|
40
|
+
- - ">="
|
41
|
+
- !ruby/object:Gem::Version
|
42
|
+
version: 1.0.0
|
43
|
+
type: :runtime
|
44
|
+
prerelease: false
|
45
|
+
version_requirements: !ruby/object:Gem::Requirement
|
46
|
+
requirements:
|
47
|
+
- - "~>"
|
48
|
+
- !ruby/object:Gem::Version
|
49
|
+
version: '1.0'
|
50
|
+
- - ">="
|
51
|
+
- !ruby/object:Gem::Version
|
52
|
+
version: 1.0.0
|
33
53
|
- !ruby/object:Gem::Dependency
|
34
54
|
name: bundler
|
35
55
|
requirement: !ruby/object:Gem::Requirement
|
@@ -108,6 +128,7 @@ files:
|
|
108
128
|
- LICENSE.txt
|
109
129
|
- README.md
|
110
130
|
- Rakefile
|
131
|
+
- benchmarks/bench.rb
|
111
132
|
- bin/console
|
112
133
|
- bin/setup
|
113
134
|
- ext/Makefile
|
@@ -115,11 +136,15 @@ files:
|
|
115
136
|
- ext/fast_bayes/bayes.h
|
116
137
|
- ext/fast_bayes/extconf.rb
|
117
138
|
- ext/fast_bayes/main.cpp
|
139
|
+
- ext/fast_bayes/stopwords.h
|
140
|
+
- ext/fast_bayes/stopwords/en
|
118
141
|
- ext/fast_bayes/wrapper.cpp
|
119
142
|
- ext/test/catch.hpp
|
120
143
|
- ext/test/classification_test.cpp
|
121
144
|
- ext/test/data/20ng-test-all-terms.txt
|
122
145
|
- ext/test/data/20ng-train-all-terms.txt
|
146
|
+
- ext/test/data/r8-test-all-terms.txt
|
147
|
+
- ext/test/data/r8-train-all-terms.txt
|
123
148
|
- ext/test/test_helper.h
|
124
149
|
- fast_bayes.gemspec
|
125
150
|
- lib/fast_bayes.rb
|