lingo 1.8.4.2 → 1.8.5
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/ChangeLog +413 -325
- data/README +380 -131
- data/Rakefile +19 -21
- data/de/lingo-abk.txt +15 -17
- data/de/lingo-dic.txt +20210 -20659
- data/de/lingo-mul.txt +5 -13
- data/de/lingo-syn.txt +5 -8
- data/de/test_dic.txt +2 -0
- data/de/test_gen.txt +8 -0
- data/de/{test_mul2.txt → test_mu2.txt} +0 -0
- data/de/{test_singleword.txt → test_sgw.txt} +0 -0
- data/de/user-dic.txt +5 -7
- data/de.lang +64 -49
- data/en/lingo-dic.txt +6398 -6404
- data/en/lingo-irr.txt +2 -3
- data/en/lingo-mul.txt +6 -7
- data/en/lingo-wdn.txt +881 -1762
- data/en/user-dic.txt +2 -5
- data/en.lang +39 -39
- data/lib/lingo/app.rb +10 -6
- data/lib/lingo/attendee/abbreviator.rb +1 -0
- data/lib/lingo/attendee/decomposer.rb +2 -1
- data/lib/lingo/attendee/multi_worder.rb +5 -6
- data/lib/lingo/attendee/stemmer.rb +1 -1
- data/lib/lingo/attendee/synonymer.rb +4 -2
- data/lib/lingo/attendee/text_reader.rb +77 -57
- data/lib/lingo/attendee/text_writer.rb +1 -1
- data/lib/lingo/attendee/tokenizer.rb +101 -50
- data/lib/lingo/attendee/variator.rb +2 -1
- data/lib/lingo/attendee/vector_filter.rb +28 -6
- data/lib/lingo/attendee/word_searcher.rb +2 -1
- data/lib/lingo/attendee.rb +8 -4
- data/lib/lingo/call.rb +7 -3
- data/lib/lingo/cli.rb +8 -16
- data/lib/lingo/config.rb +11 -6
- data/lib/lingo/ctl.rb +54 -3
- data/lib/lingo/database/crypter.rb +8 -14
- data/lib/lingo/database/hash_store.rb +1 -1
- data/lib/lingo/database/{show_progress.rb → progress.rb} +7 -8
- data/lib/lingo/database/source/key_value.rb +6 -5
- data/lib/lingo/database/source/multi_key.rb +5 -2
- data/lib/lingo/database/source/multi_value.rb +6 -4
- data/lib/lingo/database/source/single_word.rb +2 -3
- data/lib/lingo/database/source/word_class.rb +24 -5
- data/lib/lingo/database/source.rb +5 -3
- data/lib/lingo/database.rb +102 -41
- data/lib/lingo/error.rb +24 -2
- data/lib/lingo/language/dictionary.rb +26 -54
- data/lib/lingo/language/grammar.rb +19 -23
- data/lib/lingo/language/lexical.rb +5 -1
- data/lib/lingo/language/lexical_hash.rb +7 -12
- data/lib/lingo/language/token.rb +10 -1
- data/lib/lingo/language/word.rb +35 -23
- data/lib/lingo/language/word_form.rb +5 -4
- data/lib/lingo/{show_progress.rb → progress.rb} +43 -30
- data/lib/lingo/srv/lingosrv.cfg +1 -1
- data/lib/lingo/srv/public/.gitkeep +0 -0
- data/lib/lingo/srv.rb +11 -6
- data/lib/lingo/version.rb +2 -2
- data/lib/lingo/web/lingoweb.cfg +1 -1
- data/lib/lingo/web/views/index.erb +4 -4
- data/lib/lingo/web.rb +4 -6
- data/lib/lingo.rb +4 -12
- data/lingo.cfg +1 -1
- data/lir.cfg +1 -1
- data/ru/lingo-dic.txt +33473 -2113
- data/ru/lingo-mul.txt +8430 -1913
- data/ru/lingo-syn.txt +1634 -0
- data/ru/user-dic.txt +6 -0
- data/ru.lang +49 -47
- data/spec/spec_helper.rb +4 -0
- data/test/attendee/ts_decomposer.rb +2 -2
- data/test/attendee/ts_synonymer.rb +3 -3
- data/test/attendee/ts_tokenizer.rb +215 -2
- data/test/attendee/ts_variator.rb +2 -2
- data/test/attendee/ts_word_searcher.rb +10 -6
- data/test/ref/artikel.seq +2 -2
- data/test/ref/artikel.vec +5 -5
- data/test/ref/artikel.ven +11 -11
- data/test/ref/artikel.ver +11 -11
- data/test/ref/lir.seq +13 -13
- data/test/ref/lir.vec +31 -31
- data/test/test_helper.rb +19 -5
- data/test/ts_database.rb +206 -77
- data/test/ts_language.rb +86 -26
- metadata +93 -49
- data/.rspec +0 -1
- data/de/test_syn2.txt +0 -1
metadata
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: lingo
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 1.8.4.2
|
4
|
+
version: 1.8.5
|
5
5
|
platform: ruby
|
6
6
|
authors:
|
7
7
|
- John Vorhauer
|
@@ -9,112 +9,112 @@ authors:
|
|
9
9
|
autorequire:
|
10
10
|
bindir: bin
|
11
11
|
cert_chain: []
|
12
|
-
date: 2014-
|
12
|
+
date: 2014-10-02 00:00:00.000000000 Z
|
13
13
|
dependencies:
|
14
14
|
- !ruby/object:Gem::Dependency
|
15
|
-
name:
|
15
|
+
name: cyclops
|
16
16
|
requirement: !ruby/object:Gem::Requirement
|
17
17
|
requirements:
|
18
|
+
- - "~>"
|
19
|
+
- !ruby/object:Gem::Version
|
20
|
+
version: '0.0'
|
18
21
|
- - ">="
|
19
22
|
- !ruby/object:Gem::Version
|
20
|
-
version:
|
23
|
+
version: 0.0.4
|
21
24
|
type: :runtime
|
22
25
|
prerelease: false
|
23
26
|
version_requirements: !ruby/object:Gem::Requirement
|
24
27
|
requirements:
|
28
|
+
- - "~>"
|
29
|
+
- !ruby/object:Gem::Version
|
30
|
+
version: '0.0'
|
25
31
|
- - ">="
|
26
32
|
- !ruby/object:Gem::Version
|
27
|
-
version:
|
33
|
+
version: 0.0.4
|
28
34
|
- !ruby/object:Gem::Dependency
|
29
|
-
name:
|
35
|
+
name: nuggets
|
30
36
|
requirement: !ruby/object:Gem::Requirement
|
31
37
|
requirements:
|
32
|
-
- - "
|
33
|
-
- !ruby/object:Gem::Version
|
34
|
-
version: 0.9.2
|
35
|
-
- - "<="
|
38
|
+
- - "~>"
|
36
39
|
- !ruby/object:Gem::Version
|
37
|
-
version: 0
|
40
|
+
version: '1.0'
|
38
41
|
type: :runtime
|
39
42
|
prerelease: false
|
40
43
|
version_requirements: !ruby/object:Gem::Requirement
|
41
44
|
requirements:
|
42
|
-
- - "
|
43
|
-
- !ruby/object:Gem::Version
|
44
|
-
version: 0.9.2
|
45
|
-
- - "<="
|
45
|
+
- - "~>"
|
46
46
|
- !ruby/object:Gem::Version
|
47
|
-
version: 0
|
47
|
+
version: '1.0'
|
48
48
|
- !ruby/object:Gem::Dependency
|
49
|
-
name:
|
49
|
+
name: rubyzip
|
50
50
|
requirement: !ruby/object:Gem::Requirement
|
51
51
|
requirements:
|
52
|
-
- - "
|
52
|
+
- - "~>"
|
53
53
|
- !ruby/object:Gem::Version
|
54
|
-
version: '
|
54
|
+
version: '1.1'
|
55
55
|
type: :runtime
|
56
56
|
prerelease: false
|
57
57
|
version_requirements: !ruby/object:Gem::Requirement
|
58
58
|
requirements:
|
59
|
-
- - "
|
59
|
+
- - "~>"
|
60
60
|
- !ruby/object:Gem::Version
|
61
|
-
version: '
|
61
|
+
version: '1.1'
|
62
62
|
- !ruby/object:Gem::Dependency
|
63
|
-
name: sinatra-
|
63
|
+
name: sinatra-bells
|
64
64
|
requirement: !ruby/object:Gem::Requirement
|
65
65
|
requirements:
|
66
|
-
- - "
|
66
|
+
- - "~>"
|
67
67
|
- !ruby/object:Gem::Version
|
68
|
-
version: '0'
|
68
|
+
version: '0.0'
|
69
69
|
type: :runtime
|
70
70
|
prerelease: false
|
71
71
|
version_requirements: !ruby/object:Gem::Requirement
|
72
72
|
requirements:
|
73
|
-
- - "
|
73
|
+
- - "~>"
|
74
74
|
- !ruby/object:Gem::Version
|
75
|
-
version: '0'
|
75
|
+
version: '0.0'
|
76
76
|
- !ruby/object:Gem::Dependency
|
77
77
|
name: unicode
|
78
78
|
requirement: !ruby/object:Gem::Requirement
|
79
79
|
requirements:
|
80
|
-
- - "
|
80
|
+
- - "~>"
|
81
81
|
- !ruby/object:Gem::Version
|
82
|
-
version: '0'
|
82
|
+
version: '0.4'
|
83
83
|
type: :runtime
|
84
84
|
prerelease: false
|
85
85
|
version_requirements: !ruby/object:Gem::Requirement
|
86
86
|
requirements:
|
87
|
-
- - "
|
87
|
+
- - "~>"
|
88
88
|
- !ruby/object:Gem::Version
|
89
|
-
version: '0'
|
89
|
+
version: '0.4'
|
90
90
|
- !ruby/object:Gem::Dependency
|
91
91
|
name: diff-lcs
|
92
92
|
requirement: !ruby/object:Gem::Requirement
|
93
93
|
requirements:
|
94
|
-
- - "
|
94
|
+
- - "~>"
|
95
95
|
- !ruby/object:Gem::Version
|
96
|
-
version: 1.
|
96
|
+
version: '1.2'
|
97
97
|
type: :development
|
98
98
|
prerelease: false
|
99
99
|
version_requirements: !ruby/object:Gem::Requirement
|
100
100
|
requirements:
|
101
|
-
- - "
|
101
|
+
- - "~>"
|
102
102
|
- !ruby/object:Gem::Version
|
103
|
-
version: 1.
|
103
|
+
version: '1.2'
|
104
104
|
- !ruby/object:Gem::Dependency
|
105
105
|
name: open4
|
106
106
|
requirement: !ruby/object:Gem::Requirement
|
107
107
|
requirements:
|
108
|
-
- - "
|
108
|
+
- - "~>"
|
109
109
|
- !ruby/object:Gem::Version
|
110
|
-
version: '
|
110
|
+
version: '1.3'
|
111
111
|
type: :development
|
112
112
|
prerelease: false
|
113
113
|
version_requirements: !ruby/object:Gem::Requirement
|
114
114
|
requirements:
|
115
|
-
- - "
|
115
|
+
- - "~>"
|
116
116
|
- !ruby/object:Gem::Version
|
117
|
-
version: '
|
117
|
+
version: '1.3'
|
118
118
|
- !ruby/object:Gem::Dependency
|
119
119
|
name: hen
|
120
120
|
requirement: !ruby/object:Gem::Requirement
|
@@ -181,7 +181,6 @@ extra_rdoc_files:
|
|
181
181
|
- COPYING
|
182
182
|
- ChangeLog
|
183
183
|
files:
|
184
|
-
- ".rspec"
|
185
184
|
- COPYING
|
186
185
|
- ChangeLog
|
187
186
|
- README
|
@@ -196,11 +195,11 @@ files:
|
|
196
195
|
- de/lingo-mul.txt
|
197
196
|
- de/lingo-syn.txt
|
198
197
|
- de/test_dic.txt
|
198
|
+
- de/test_gen.txt
|
199
|
+
- de/test_mu2.txt
|
199
200
|
- de/test_mul.txt
|
200
|
-
- de/test_mul2.txt
|
201
|
-
- de/test_singleword.txt
|
201
|
+
- de/test_sgw.txt
|
202
202
|
- de/test_syn.txt
|
203
|
-
- de/test_syn2.txt
|
204
203
|
- de/user-dic.txt
|
205
204
|
- en.lang
|
206
205
|
- en/lingo-dic.txt
|
@@ -241,8 +240,8 @@ files:
|
|
241
240
|
- lib/lingo/database/gdbm_store.rb
|
242
241
|
- lib/lingo/database/hash_store.rb
|
243
242
|
- lib/lingo/database/libcdb_store.rb
|
243
|
+
- lib/lingo/database/progress.rb
|
244
244
|
- lib/lingo/database/sdbm_store.rb
|
245
|
-
- lib/lingo/database/show_progress.rb
|
246
245
|
- lib/lingo/database/source.rb
|
247
246
|
- lib/lingo/database/source/key_value.rb
|
248
247
|
- lib/lingo/database/source/multi_key.rb
|
@@ -260,10 +259,11 @@ files:
|
|
260
259
|
- lib/lingo/language/token.rb
|
261
260
|
- lib/lingo/language/word.rb
|
262
261
|
- lib/lingo/language/word_form.rb
|
263
|
-
- lib/lingo/show_progress.rb
|
262
|
+
- lib/lingo/progress.rb
|
264
263
|
- lib/lingo/srv.rb
|
265
264
|
- lib/lingo/srv/config.ru
|
266
265
|
- lib/lingo/srv/lingosrv.cfg
|
266
|
+
- lib/lingo/srv/public/.gitkeep
|
267
267
|
- lib/lingo/version.rb
|
268
268
|
- lib/lingo/web.rb
|
269
269
|
- lib/lingo/web/config.ru
|
@@ -279,6 +279,7 @@ files:
|
|
279
279
|
- ru/lingo-dic.txt
|
280
280
|
- ru/lingo-mul.txt
|
281
281
|
- ru/lingo-syn.txt
|
282
|
+
- ru/user-dic.txt
|
282
283
|
- spec/spec_helper.rb
|
283
284
|
- test/attendee/ts_abbreviator.rb
|
284
285
|
- test/attendee/ts_decomposer.rb
|
@@ -319,12 +320,55 @@ files:
|
|
319
320
|
- txt/lir.txt
|
320
321
|
homepage: http://lex-lingo.de
|
321
322
|
licenses:
|
322
|
-
- AGPL
|
323
|
+
- AGPL-3.0
|
323
324
|
metadata: {}
|
324
|
-
post_install_message:
|
325
|
+
post_install_message: |2+
|
326
|
+
|
327
|
+
lingo-1.8.5 [2014-10-02]:
|
328
|
+
|
329
|
+
* Dictionary values (projections) are no longer sorted; hence, order of
|
330
|
+
definition affects processing.
|
331
|
+
* Lexicals in Lingo::Language::Word are no longer sorted; in particular,
|
332
|
+
compound parts keep their original order.
|
333
|
+
* Lexicals in Lingo::Language::Word are no longer cleaned from duplicates.
|
334
|
+
* Compiled dictionaries are updated whenever the Lingo version or their
|
335
|
+
configuration changes, not only when the source file's size or modification
|
336
|
+
time changes.
|
337
|
+
* Lingo::Attendee::Synonymer learned <tt>compound-parts</tt> option to also
|
338
|
+
generate synonyms for compound parts when set to +true+.
|
339
|
+
* Lingo::Attendee::TextReader learned better PDF-to-text conversion using the
|
340
|
+
+pdftotext+ command; specify <tt>filter: pdftotext</tt> in the config.
|
341
|
+
* Lingo::Attendee::VectorFilter learned +dict+ option to print words in
|
342
|
+
dictionary format (viz. Lingo::Database::Source::WordClass).
|
343
|
+
* Lingo::Attendee::VectorFilter learned +preamble+ option to print current
|
344
|
+
configuration to the beginning of the log file (<tt>debug: 'true'</tt>);
|
345
|
+
set <tt>preamble: false</tt> to disable.
|
346
|
+
* Multiword dictionaries compiled from base forms can now generate inflected
|
347
|
+
adjectives based on the gender of the head noun; set <tt>inflect: true</tt>
|
348
|
+
in the dictionary config.
|
349
|
+
* Lingo::Database::Source::WordClass supports gender information being encoded
|
350
|
+
in the dictionary as well as shorthand notation for multiple word
|
351
|
+
classes/genders.
|
352
|
+
* Lingo::Database::Source::WordClass supports compounds being encoded in the
|
353
|
+
dictionary (appending <tt>+</tt> to their parts' word classes is
|
354
|
+
recommended).
|
355
|
+
* Lingo::Database::Source removes leading and trailing whitespace from
|
356
|
+
dictionary lines.
|
357
|
+
* Lingo::Database::Crypter uses OpenSSL to encrypt/decrypt dictionaries.
|
358
|
+
Note: Can't decrypt dictionaries encrypted with the old scheme anymore.
|
359
|
+
* Lingo::Attendee::Tokenizer learned subset of MediaWiki syntax.
|
360
|
+
* Eliminated pathological behaviour of the +URLS+ rule in
|
361
|
+
Lingo::Attendee::Tokenizer.
|
362
|
+
* Fixed regression introduced in 1.8.2 where <tt>combine: all</tt> would no
|
363
|
+
longer work in Lingo::Attendee::MultiWorder.
|
364
|
+
* Updated and extended Russian dictionaries. (Yulia Dorokhova, Thomas Müller)
|
365
|
+
* +lingoctl+ no longer overwrites existing files without confirmation.
|
366
|
+
* +lingoctl+ learned +archive+ command.
|
367
|
+
* Dictionary cleanup.
|
368
|
+
|
325
369
|
rdoc_options:
|
326
370
|
- "--title"
|
327
|
-
- lingo Application documentation (v1.8.4.2)
|
371
|
+
- lingo Application documentation (v1.8.5)
|
328
372
|
- "--charset"
|
329
373
|
- UTF-8
|
330
374
|
- "--line-numbers"
|
@@ -337,7 +381,7 @@ required_ruby_version: !ruby/object:Gem::Requirement
|
|
337
381
|
requirements:
|
338
382
|
- - ">="
|
339
383
|
- !ruby/object:Gem::Version
|
340
|
-
version: 1.9.
|
384
|
+
version: 1.9.3
|
341
385
|
required_rubygems_version: !ruby/object:Gem::Requirement
|
342
386
|
requirements:
|
343
387
|
- - ">="
|
@@ -345,7 +389,7 @@ required_rubygems_version: !ruby/object:Gem::Requirement
|
|
345
389
|
version: '0'
|
346
390
|
requirements: []
|
347
391
|
rubyforge_project:
|
348
|
-
rubygems_version: 2.
|
392
|
+
rubygems_version: 2.4.2
|
349
393
|
signing_key:
|
350
394
|
specification_version: 4
|
351
395
|
summary: The full-featured automatic indexing system
|
data/.rspec
DELETED
@@ -1 +0,0 @@
|
|
1
|
-
--colour
|
data/de/test_syn2.txt
DELETED
@@ -1 +0,0 @@
|
|
1
|
-
Albert Einstein;Einstein, Albert;Albert Ainshtain;<Prof> Einstein
|