luisparravicini-classifier 1.3.7
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- data/LICENSE +429 -0
- data/Manifest +19 -0
- data/README +87 -0
- data/Rakefile +21 -0
- data/VERSION.yml +5 -0
- data/lib/classifier.rb +32 -0
- data/lib/classifier/base.rb +55 -0
- data/lib/classifier/bayes.rb +136 -0
- data/lib/classifier/extensions/vector.rb +109 -0
- data/lib/classifier/extensions/vector_serialize.rb +20 -0
- data/lib/classifier/lsi.rb +337 -0
- data/lib/classifier/lsi/content_node.rb +73 -0
- data/lib/classifier/lsi/summary.rb +31 -0
- data/lib/classifier/lsi/word_list.rb +36 -0
- data/lib/classifier/stopwords.rb +30 -0
- data/lib/classifier/stopwords/en +82 -0
- data/lib/classifier/stopwords/es +339 -0
- data/lib/classifier/stopwords/ru +161 -0
- data/lib/init.rb +1 -0
- data/luisparravicini-classifier.gemspec +76 -0
- data/tasks/test.rake +6 -0
- data/test/base_test.rb +17 -0
- data/test/bayes/bayesian_test.rb +58 -0
- data/test/lsi/lsi_test.rb +167 -0
- data/test/stopwords_test.rb +20 -0
- data/test/test_helper.rb +4 -0
- metadata +104 -0
@@ -0,0 +1,20 @@
|
|
1
|
+
# coding:utf-8
|
2
|
+
require File.dirname(__FILE__) + '/test_helper'
|
3
|
+
class SkipWordsTest < Test::Unit::TestCase
|
4
|
+
def test_en
|
5
|
+
assert_equal 80, Classifier::SkipWords.for('en').size
|
6
|
+
end
|
7
|
+
|
8
|
+
def test_ru
|
9
|
+
assert_equal 159, Classifier::SkipWords.for('ru').size
|
10
|
+
end
|
11
|
+
|
12
|
+
def test_stopword_es
|
13
|
+
list = Classifier::SkipWords.for('es')
|
14
|
+
assert list.include?('más')
|
15
|
+
end
|
16
|
+
|
17
|
+
def test_unknown
|
18
|
+
assert_equal [], Classifier::SkipWords.for('xxyyzz')
|
19
|
+
end
|
20
|
+
end
|
data/test/test_helper.rb
ADDED
metadata
ADDED
@@ -0,0 +1,104 @@
|
|
1
|
+
--- !ruby/object:Gem::Specification
|
2
|
+
name: luisparravicini-classifier
|
3
|
+
version: !ruby/object:Gem::Version
|
4
|
+
version: 1.3.7
|
5
|
+
platform: ruby
|
6
|
+
authors:
|
7
|
+
- Yury Korolev
|
8
|
+
autorequire:
|
9
|
+
bindir: bin
|
10
|
+
cert_chain: []
|
11
|
+
|
12
|
+
date: 2009-12-24 00:00:00 -02:00
|
13
|
+
default_executable:
|
14
|
+
dependencies:
|
15
|
+
- !ruby/object:Gem::Dependency
|
16
|
+
name: activesupport
|
17
|
+
type: :runtime
|
18
|
+
version_requirement:
|
19
|
+
version_requirements: !ruby/object:Gem::Requirement
|
20
|
+
requirements:
|
21
|
+
- - ">="
|
22
|
+
- !ruby/object:Gem::Version
|
23
|
+
version: 2.2.2
|
24
|
+
version:
|
25
|
+
- !ruby/object:Gem::Dependency
|
26
|
+
name: ruby-stemmer
|
27
|
+
type: :runtime
|
28
|
+
version_requirement:
|
29
|
+
version_requirements: !ruby/object:Gem::Requirement
|
30
|
+
requirements:
|
31
|
+
- - ">="
|
32
|
+
- !ruby/object:Gem::Version
|
33
|
+
version: 0.5.1
|
34
|
+
version:
|
35
|
+
description: Bayesian classifier and others.
|
36
|
+
email: yury.korolev@gmail.com
|
37
|
+
executables: []
|
38
|
+
|
39
|
+
extensions: []
|
40
|
+
|
41
|
+
extra_rdoc_files:
|
42
|
+
- LICENSE
|
43
|
+
- README
|
44
|
+
files:
|
45
|
+
- LICENSE
|
46
|
+
- Manifest
|
47
|
+
- README
|
48
|
+
- Rakefile
|
49
|
+
- VERSION.yml
|
50
|
+
- lib/classifier.rb
|
51
|
+
- lib/classifier/base.rb
|
52
|
+
- lib/classifier/bayes.rb
|
53
|
+
- lib/classifier/extensions/vector.rb
|
54
|
+
- lib/classifier/extensions/vector_serialize.rb
|
55
|
+
- lib/classifier/lsi.rb
|
56
|
+
- lib/classifier/lsi/content_node.rb
|
57
|
+
- lib/classifier/lsi/summary.rb
|
58
|
+
- lib/classifier/lsi/word_list.rb
|
59
|
+
- lib/classifier/stopwords.rb
|
60
|
+
- lib/classifier/stopwords/en
|
61
|
+
- lib/classifier/stopwords/es
|
62
|
+
- lib/classifier/stopwords/ru
|
63
|
+
- lib/init.rb
|
64
|
+
- luisparravicini-classifier.gemspec
|
65
|
+
- tasks/test.rake
|
66
|
+
- test/base_test.rb
|
67
|
+
- test/bayes/bayesian_test.rb
|
68
|
+
- test/lsi/lsi_test.rb
|
69
|
+
- test/stopwords_test.rb
|
70
|
+
- test/test_helper.rb
|
71
|
+
has_rdoc: true
|
72
|
+
homepage: http://github.com/yury/classifier
|
73
|
+
licenses: []
|
74
|
+
|
75
|
+
post_install_message:
|
76
|
+
rdoc_options:
|
77
|
+
- --charset=UTF-8
|
78
|
+
require_paths:
|
79
|
+
- lib
|
80
|
+
required_ruby_version: !ruby/object:Gem::Requirement
|
81
|
+
requirements:
|
82
|
+
- - ">="
|
83
|
+
- !ruby/object:Gem::Version
|
84
|
+
version: "0"
|
85
|
+
version:
|
86
|
+
required_rubygems_version: !ruby/object:Gem::Requirement
|
87
|
+
requirements:
|
88
|
+
- - ">="
|
89
|
+
- !ruby/object:Gem::Version
|
90
|
+
version: "0"
|
91
|
+
version:
|
92
|
+
requirements: []
|
93
|
+
|
94
|
+
rubyforge_project:
|
95
|
+
rubygems_version: 1.3.5
|
96
|
+
signing_key:
|
97
|
+
specification_version: 3
|
98
|
+
summary: A general classifier module to allow Bayesian and other types of classifications.
|
99
|
+
test_files:
|
100
|
+
- test/base_test.rb
|
101
|
+
- test/bayes/bayesian_test.rb
|
102
|
+
- test/lsi/lsi_test.rb
|
103
|
+
- test/stopwords_test.rb
|
104
|
+
- test/test_helper.rb
|