luisparravicini-classifier 1.3.7
Sign up to get free protection for your applications and to get access to all the features.
- data/LICENSE +429 -0
- data/Manifest +19 -0
- data/README +87 -0
- data/Rakefile +21 -0
- data/VERSION.yml +5 -0
- data/lib/classifier.rb +32 -0
- data/lib/classifier/base.rb +55 -0
- data/lib/classifier/bayes.rb +136 -0
- data/lib/classifier/extensions/vector.rb +109 -0
- data/lib/classifier/extensions/vector_serialize.rb +20 -0
- data/lib/classifier/lsi.rb +337 -0
- data/lib/classifier/lsi/content_node.rb +73 -0
- data/lib/classifier/lsi/summary.rb +31 -0
- data/lib/classifier/lsi/word_list.rb +36 -0
- data/lib/classifier/stopwords.rb +30 -0
- data/lib/classifier/stopwords/en +82 -0
- data/lib/classifier/stopwords/es +339 -0
- data/lib/classifier/stopwords/ru +161 -0
- data/lib/init.rb +1 -0
- data/luisparravicini-classifier.gemspec +76 -0
- data/tasks/test.rake +6 -0
- data/test/base_test.rb +17 -0
- data/test/bayes/bayesian_test.rb +58 -0
- data/test/lsi/lsi_test.rb +167 -0
- data/test/stopwords_test.rb +20 -0
- data/test/test_helper.rb +4 -0
- metadata +104 -0
@@ -0,0 +1,20 @@
|
|
1
|
+
# coding:utf-8
|
2
|
+
require File.dirname(__FILE__) + '/test_helper'
|
3
|
+
class SkipWordsTest < Test::Unit::TestCase
|
4
|
+
def test_en
|
5
|
+
assert_equal 80, Classifier::SkipWords.for('en').size
|
6
|
+
end
|
7
|
+
|
8
|
+
def test_ru
|
9
|
+
assert_equal 159, Classifier::SkipWords.for('ru').size
|
10
|
+
end
|
11
|
+
|
12
|
+
def test_stopword_es
|
13
|
+
list = Classifier::SkipWords.for('es')
|
14
|
+
assert list.include?('más')
|
15
|
+
end
|
16
|
+
|
17
|
+
def test_unknown
|
18
|
+
assert_equal [], Classifier::SkipWords.for('xxyyzz')
|
19
|
+
end
|
20
|
+
end
|
data/test/test_helper.rb
ADDED
metadata
ADDED
@@ -0,0 +1,104 @@
|
|
1
|
+
--- !ruby/object:Gem::Specification
|
2
|
+
name: luisparravicini-classifier
|
3
|
+
version: !ruby/object:Gem::Version
|
4
|
+
version: 1.3.7
|
5
|
+
platform: ruby
|
6
|
+
authors:
|
7
|
+
- Yury Korolev
|
8
|
+
autorequire:
|
9
|
+
bindir: bin
|
10
|
+
cert_chain: []
|
11
|
+
|
12
|
+
date: 2009-12-24 00:00:00 -02:00
|
13
|
+
default_executable:
|
14
|
+
dependencies:
|
15
|
+
- !ruby/object:Gem::Dependency
|
16
|
+
name: activesupport
|
17
|
+
type: :runtime
|
18
|
+
version_requirement:
|
19
|
+
version_requirements: !ruby/object:Gem::Requirement
|
20
|
+
requirements:
|
21
|
+
- - ">="
|
22
|
+
- !ruby/object:Gem::Version
|
23
|
+
version: 2.2.2
|
24
|
+
version:
|
25
|
+
- !ruby/object:Gem::Dependency
|
26
|
+
name: ruby-stemmer
|
27
|
+
type: :runtime
|
28
|
+
version_requirement:
|
29
|
+
version_requirements: !ruby/object:Gem::Requirement
|
30
|
+
requirements:
|
31
|
+
- - ">="
|
32
|
+
- !ruby/object:Gem::Version
|
33
|
+
version: 0.5.1
|
34
|
+
version:
|
35
|
+
description: Bayesian classifier and others.
|
36
|
+
email: yury.korolev@gmail.com
|
37
|
+
executables: []
|
38
|
+
|
39
|
+
extensions: []
|
40
|
+
|
41
|
+
extra_rdoc_files:
|
42
|
+
- LICENSE
|
43
|
+
- README
|
44
|
+
files:
|
45
|
+
- LICENSE
|
46
|
+
- Manifest
|
47
|
+
- README
|
48
|
+
- Rakefile
|
49
|
+
- VERSION.yml
|
50
|
+
- lib/classifier.rb
|
51
|
+
- lib/classifier/base.rb
|
52
|
+
- lib/classifier/bayes.rb
|
53
|
+
- lib/classifier/extensions/vector.rb
|
54
|
+
- lib/classifier/extensions/vector_serialize.rb
|
55
|
+
- lib/classifier/lsi.rb
|
56
|
+
- lib/classifier/lsi/content_node.rb
|
57
|
+
- lib/classifier/lsi/summary.rb
|
58
|
+
- lib/classifier/lsi/word_list.rb
|
59
|
+
- lib/classifier/stopwords.rb
|
60
|
+
- lib/classifier/stopwords/en
|
61
|
+
- lib/classifier/stopwords/es
|
62
|
+
- lib/classifier/stopwords/ru
|
63
|
+
- lib/init.rb
|
64
|
+
- luisparravicini-classifier.gemspec
|
65
|
+
- tasks/test.rake
|
66
|
+
- test/base_test.rb
|
67
|
+
- test/bayes/bayesian_test.rb
|
68
|
+
- test/lsi/lsi_test.rb
|
69
|
+
- test/stopwords_test.rb
|
70
|
+
- test/test_helper.rb
|
71
|
+
has_rdoc: true
|
72
|
+
homepage: http://github.com/yury/classifier
|
73
|
+
licenses: []
|
74
|
+
|
75
|
+
post_install_message:
|
76
|
+
rdoc_options:
|
77
|
+
- --charset=UTF-8
|
78
|
+
require_paths:
|
79
|
+
- lib
|
80
|
+
required_ruby_version: !ruby/object:Gem::Requirement
|
81
|
+
requirements:
|
82
|
+
- - ">="
|
83
|
+
- !ruby/object:Gem::Version
|
84
|
+
version: "0"
|
85
|
+
version:
|
86
|
+
required_rubygems_version: !ruby/object:Gem::Requirement
|
87
|
+
requirements:
|
88
|
+
- - ">="
|
89
|
+
- !ruby/object:Gem::Version
|
90
|
+
version: "0"
|
91
|
+
version:
|
92
|
+
requirements: []
|
93
|
+
|
94
|
+
rubyforge_project:
|
95
|
+
rubygems_version: 1.3.5
|
96
|
+
signing_key:
|
97
|
+
specification_version: 3
|
98
|
+
summary: A general classifier module to allow Bayesian and other types of classifications.
|
99
|
+
test_files:
|
100
|
+
- test/base_test.rb
|
101
|
+
- test/bayes/bayesian_test.rb
|
102
|
+
- test/lsi/lsi_test.rb
|
103
|
+
- test/stopwords_test.rb
|
104
|
+
- test/test_helper.rb
|