plexus-rmmseg 0.1.6
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +7 -0
- data/.gitignore +1 -0
- data/History.txt +42 -0
- data/Manifest.txt +51 -0
- data/README.txt +74 -0
- data/Rakefile +12 -0
- data/TODO.txt +5 -0
- data/bin/rmmseg +65 -0
- data/data/chars.dic +12638 -0
- data/data/custom.dic +12 -0
- data/data/punctuation.dic +79 -0
- data/data/words.dic +120330 -0
- data/lib/rmmseg.rb +13 -0
- data/lib/rmmseg/algorithm.rb +136 -0
- data/lib/rmmseg/amibguity.rb +4 -0
- data/lib/rmmseg/chunk.rb +41 -0
- data/lib/rmmseg/complex_algorithm.rb +122 -0
- data/lib/rmmseg/config.rb +65 -0
- data/lib/rmmseg/dictionary.rb +80 -0
- data/lib/rmmseg/ferret.rb +109 -0
- data/lib/rmmseg/lawl_rule.rb +12 -0
- data/lib/rmmseg/lsdmfocw_rule.rb +13 -0
- data/lib/rmmseg/mm_rule.rb +13 -0
- data/lib/rmmseg/rule_helper.rb +28 -0
- data/lib/rmmseg/simple_algorithm.rb +37 -0
- data/lib/rmmseg/svwl_rule.rb +12 -0
- data/lib/rmmseg/token.rb +30 -0
- data/lib/rmmseg/version.rb +3 -0
- data/lib/rmmseg/word.rb +38 -0
- data/misc/ferret_example.rb +56 -0
- data/misc/homepage.erb +170 -0
- data/misc/homepage.html +1214 -0
- data/plexus-rmmseg.gemspec +20 -0
- data/spec/chunk_spec.rb +25 -0
- data/spec/complex_algorithm_spec.rb +18 -0
- data/spec/config_spec.rb +12 -0
- data/spec/dictionary_spec.rb +20 -0
- data/spec/lawl_rule_spec.rb +15 -0
- data/spec/lsdmfocw_rule_spec.rb +14 -0
- data/spec/mm_rule_spec.rb +15 -0
- data/spec/simple_algorithm_spec.rb +46 -0
- data/spec/spec_helper.rb +12 -0
- data/spec/svwl_rule_spec.rb +14 -0
- data/spec/word_spec.rb +9 -0
- data/tasks/ann.rake +76 -0
- data/tasks/annotations.rake +22 -0
- data/tasks/doc.rake +48 -0
- data/tasks/gem.rake +110 -0
- data/tasks/homepage.rake +12 -0
- data/tasks/manifest.rake +49 -0
- data/tasks/post_load.rake +26 -0
- data/tasks/rubyforge.rake +57 -0
- data/tasks/setup.rb +227 -0
- data/tasks/spec.rake +54 -0
- data/tasks/svn.rake +44 -0
- data/tasks/test.rake +38 -0
- metadata +121 -0
data/tasks/test.rake
ADDED
@@ -0,0 +1,38 @@
|
|
1
|
+
# $Id$

require 'rake/testtask'

# Test-related Rake tasks: `test:run` always, plus `test:rcov` and
# `test:clobber_rcov` when HAVE_RCOV is truthy.
# PROJ, HAVE_RCOV and RCOV are not defined in this file; they must already
# exist when it is loaded (presumably set up by tasks/setup.rb -- confirm).
namespace :test do

  # Chooses the files to exercise: the single PROJ.test_file when that path
  # is an existing regular file, otherwise the PROJ.tests list.
  select_tests = lambda do
    File.file?(PROJ.test_file) ? [PROJ.test_file] : PROJ.tests
  end

  Rake::TestTask.new(:run) do |t|
    t.libs = PROJ.libs
    t.test_files = select_tests.call
    t.ruby_opts += PROJ.ruby_opts
    t.ruby_opts += PROJ.test_opts
  end

  if HAVE_RCOV
    desc 'Run rcov on the unit tests'
    task :rcov => :clobber_rcov do
      # dup first so appending '-o <dir>' does not mutate PROJ.rcov_opts.
      opts = (PROJ.rcov_opts.dup << '-o' << PROJ.rcov_dir).join(' ')
      files = select_tests.call.join(' ')
      sh "#{RCOV} #{files} #{opts}"
    end

    task :clobber_rcov do
      # Remove the same directory the rcov task writes to (its '-o' argument)
      # rather than a hard-coded 'coverage'. rm_rf does nothing when the
      # directory is absent, so no inline `rescue nil` is needed.
      rm_rf PROJ.rcov_dir
    end
  end

end  # namespace :test

desc 'Alias to test:run'
task :test => 'test:run'

task :clobber => 'test:clobber_rcov' if HAVE_RCOV

# EOF
|
metadata
ADDED
@@ -0,0 +1,121 @@
|
|
1
|
+
--- !ruby/object:Gem::Specification
|
2
|
+
name: plexus-rmmseg
|
3
|
+
version: !ruby/object:Gem::Version
|
4
|
+
version: 0.1.6
|
5
|
+
platform: ruby
|
6
|
+
authors:
|
7
|
+
- pluskid
|
8
|
+
autorequire:
|
9
|
+
bindir: bin
|
10
|
+
cert_chain: []
|
11
|
+
date: 2008-03-16 00:00:00.000000000 Z
|
12
|
+
dependencies: []
|
13
|
+
description: 'RMMSeg is an implementation of MMSEG Chinese word segmentation algorithm.
|
14
|
+
It is based on two variants of maximum matching algorithms. Two algorithms are available
|
15
|
+
for using: * simple algorithm that uses only forward maximum matching. * complex
|
16
|
+
algorithm that uses three-word chunk maximum matching and 3 additional rules to solve
|
17
|
+
ambiguities. For more information about the algorithm, please refer to the following
|
18
|
+
essays: * http://technology.chtsai.org/mmseg/ * http://pluskid.lifegoo.com/?p=261'
|
19
|
+
email: pluskid@gmail.com
|
20
|
+
executables:
|
21
|
+
- rmmseg
|
22
|
+
extensions: []
|
23
|
+
extra_rdoc_files:
|
24
|
+
- History.txt
|
25
|
+
- README.txt
|
26
|
+
- TODO.txt
|
27
|
+
- bin/rmmseg
|
28
|
+
files:
|
29
|
+
- .gitignore
|
30
|
+
- History.txt
|
31
|
+
- Manifest.txt
|
32
|
+
- README.txt
|
33
|
+
- Rakefile
|
34
|
+
- TODO.txt
|
35
|
+
- bin/rmmseg
|
36
|
+
- data/chars.dic
|
37
|
+
- data/custom.dic
|
38
|
+
- data/punctuation.dic
|
39
|
+
- data/words.dic
|
40
|
+
- lib/rmmseg.rb
|
41
|
+
- lib/rmmseg/algorithm.rb
|
42
|
+
- lib/rmmseg/amibguity.rb
|
43
|
+
- lib/rmmseg/chunk.rb
|
44
|
+
- lib/rmmseg/complex_algorithm.rb
|
45
|
+
- lib/rmmseg/config.rb
|
46
|
+
- lib/rmmseg/dictionary.rb
|
47
|
+
- lib/rmmseg/ferret.rb
|
48
|
+
- lib/rmmseg/lawl_rule.rb
|
49
|
+
- lib/rmmseg/lsdmfocw_rule.rb
|
50
|
+
- lib/rmmseg/mm_rule.rb
|
51
|
+
- lib/rmmseg/rule_helper.rb
|
52
|
+
- lib/rmmseg/simple_algorithm.rb
|
53
|
+
- lib/rmmseg/svwl_rule.rb
|
54
|
+
- lib/rmmseg/token.rb
|
55
|
+
- lib/rmmseg/version.rb
|
56
|
+
- lib/rmmseg/word.rb
|
57
|
+
- misc/ferret_example.rb
|
58
|
+
- misc/homepage.erb
|
59
|
+
- misc/homepage.html
|
60
|
+
- plexus-rmmseg.gemspec
|
61
|
+
- spec/chunk_spec.rb
|
62
|
+
- spec/complex_algorithm_spec.rb
|
63
|
+
- spec/config_spec.rb
|
64
|
+
- spec/dictionary_spec.rb
|
65
|
+
- spec/lawl_rule_spec.rb
|
66
|
+
- spec/lsdmfocw_rule_spec.rb
|
67
|
+
- spec/mm_rule_spec.rb
|
68
|
+
- spec/simple_algorithm_spec.rb
|
69
|
+
- spec/spec_helper.rb
|
70
|
+
- spec/svwl_rule_spec.rb
|
71
|
+
- spec/word_spec.rb
|
72
|
+
- tasks/ann.rake
|
73
|
+
- tasks/annotations.rake
|
74
|
+
- tasks/doc.rake
|
75
|
+
- tasks/gem.rake
|
76
|
+
- tasks/homepage.rake
|
77
|
+
- tasks/manifest.rake
|
78
|
+
- tasks/post_load.rake
|
79
|
+
- tasks/rubyforge.rake
|
80
|
+
- tasks/setup.rb
|
81
|
+
- tasks/spec.rake
|
82
|
+
- tasks/svn.rake
|
83
|
+
- tasks/test.rake
|
84
|
+
homepage: http://rmmseg.rubyforge.org
|
85
|
+
licenses:
|
86
|
+
- MIT
|
87
|
+
metadata: {}
|
88
|
+
post_install_message:
|
89
|
+
rdoc_options:
|
90
|
+
- --main
|
91
|
+
- README.txt
|
92
|
+
require_paths:
|
93
|
+
- lib
|
94
|
+
required_ruby_version: !ruby/object:Gem::Requirement
|
95
|
+
requirements:
|
96
|
+
- - '>='
|
97
|
+
- !ruby/object:Gem::Version
|
98
|
+
version: '0'
|
99
|
+
required_rubygems_version: !ruby/object:Gem::Requirement
|
100
|
+
requirements:
|
101
|
+
- - '>='
|
102
|
+
- !ruby/object:Gem::Version
|
103
|
+
version: '0'
|
104
|
+
requirements: []
|
105
|
+
rubyforge_project:
|
106
|
+
rubygems_version: 2.2.1
|
107
|
+
signing_key:
|
108
|
+
specification_version: 4
|
109
|
+
summary: RMMSeg is an implementation of MMSEG Chinese word segmentation algorithm
|
110
|
+
test_files:
|
111
|
+
- spec/chunk_spec.rb
|
112
|
+
- spec/complex_algorithm_spec.rb
|
113
|
+
- spec/config_spec.rb
|
114
|
+
- spec/dictionary_spec.rb
|
115
|
+
- spec/lawl_rule_spec.rb
|
116
|
+
- spec/lsdmfocw_rule_spec.rb
|
117
|
+
- spec/mm_rule_spec.rb
|
118
|
+
- spec/simple_algorithm_spec.rb
|
119
|
+
- spec/spec_helper.rb
|
120
|
+
- spec/svwl_rule_spec.rb
|
121
|
+
- spec/word_spec.rb
|