lingo 1.8.1 → 1.8.2
Sign up to get free protection for your applications and to get access to all the features.
- data/ChangeLog +23 -5
- data/README +1 -1
- data/Rakefile +5 -7
- data/TODO +2 -0
- data/bin/lingo +5 -1
- data/de.lang +1 -1
- data/en/lingo-syn.txt +0 -0
- data/en.lang +2 -1
- data/lib/lingo/attendee/abbreviator.rb +8 -9
- data/lib/lingo/attendee/debugger.rb +5 -4
- data/lib/lingo/attendee/decomposer.rb +8 -3
- data/lib/lingo/attendee/dehyphenizer.rb +19 -63
- data/lib/lingo/attendee/formatter.rb +1 -1
- data/lib/lingo/attendee/multi_worder.rb +67 -155
- data/lib/lingo/attendee/noneword_filter.rb +16 -9
- data/lib/lingo/attendee/object_filter.rb +1 -1
- data/lib/lingo/attendee/sequencer.rb +32 -63
- data/lib/lingo/attendee/stemmer/porter.rb +343 -0
- data/{info/gpl-hdr.txt → lib/lingo/attendee/stemmer.rb} +33 -0
- data/lib/lingo/attendee/synonymer.rb +10 -9
- data/lib/lingo/attendee/text_reader.rb +102 -76
- data/lib/lingo/attendee/text_writer.rb +23 -26
- data/lib/lingo/attendee/tokenizer.rb +13 -27
- data/lib/lingo/attendee/variator.rb +26 -66
- data/lib/lingo/attendee/vector_filter.rb +42 -43
- data/lib/lingo/attendee/word_searcher.rb +6 -7
- data/lib/lingo/attendee.rb +25 -7
- data/lib/lingo/buffered_attendee.rb +36 -10
- data/lib/lingo/cachable.rb +8 -8
- data/lib/lingo/config.rb +5 -6
- data/lib/lingo/ctl.rb +2 -3
- data/lib/lingo/database/crypter.rb +9 -26
- data/lib/lingo/database/gdbm_store.rb +3 -5
- data/lib/lingo/database/libcdb_store.rb +4 -6
- data/lib/lingo/database/sdbm_store.rb +11 -6
- data/lib/lingo/database/show_progress.rb +3 -43
- data/lib/lingo/database/source/key_value.rb +2 -6
- data/lib/lingo/database/source/multi_key.rb +3 -5
- data/lib/lingo/database/source/multi_value.rb +2 -6
- data/lib/lingo/database/source/single_word.rb +4 -6
- data/lib/lingo/database/source/word_class.rb +4 -10
- data/lib/lingo/database/source.rb +20 -18
- data/lib/lingo/database.rb +84 -59
- data/lib/lingo/error.rb +57 -1
- data/lib/lingo/language/dictionary.rb +21 -18
- data/lib/lingo/language/grammar.rb +40 -49
- data/lib/lingo/language/lexical.rb +6 -6
- data/lib/lingo/language/lexical_hash.rb +6 -0
- data/lib/lingo/language/word.rb +32 -15
- data/lib/lingo/language/word_form.rb +1 -1
- data/lib/lingo/language.rb +14 -25
- data/lib/lingo/reportable.rb +12 -10
- data/lib/lingo/show_progress.rb +81 -0
- data/lib/lingo/version.rb +1 -1
- data/lib/lingo.rb +63 -24
- data/lingo-call.cfg +6 -10
- data/lingo.cfg +60 -44
- data/lir.cfg +42 -41
- data/test/attendee/ts_abbreviator.rb +3 -5
- data/test/attendee/ts_decomposer.rb +3 -5
- data/test/attendee/ts_multi_worder.rb +87 -145
- data/test/attendee/ts_noneword_filter.rb +5 -3
- data/test/attendee/ts_object_filter.rb +5 -3
- data/test/attendee/ts_sequencer.rb +3 -5
- data/test/attendee/ts_stemmer.rb +309 -0
- data/test/attendee/ts_synonymer.rb +15 -11
- data/test/attendee/ts_text_reader.rb +12 -15
- data/test/attendee/ts_text_writer.rb +24 -29
- data/test/attendee/ts_tokenizer.rb +9 -7
- data/test/attendee/ts_variator.rb +4 -4
- data/test/attendee/ts_vector_filter.rb +24 -16
- data/test/attendee/ts_word_searcher.rb +20 -36
- data/test/{lir.csv → lir.vec} +0 -0
- data/test/ref/artikel.vec +943 -943
- data/test/ref/artikel.ven +943 -943
- data/test/ref/lir.non +201 -201
- data/test/ref/lir.seq +178 -178
- data/test/ref/lir.syn +49 -49
- data/test/ref/lir.vec +329 -0
- data/test/test_helper.rb +20 -36
- data/test/ts_database.rb +10 -10
- data/test/ts_language.rb +279 -319
- metadata +93 -104
- data/info/Objekte.png +0 -0
- data/info/Typen.png +0 -0
- data/info/database.png +0 -0
- data/info/db_small.png +0 -0
- data/info/download.png +0 -0
- data/info/kerze.png +0 -0
- data/info/language.png +0 -0
- data/info/lingo.png +0 -0
- data/info/logo.png +0 -0
- data/info/meeting.png +0 -0
- data/info/types.png +0 -0
- data/lingo-all.cfg +0 -89
- data/porter/stem.cfg +0 -311
- data/porter/stem.rb +0 -150
- data/test/ref/lir.csv +0 -329
- data/test.cfg +0 -79
@@ -5,7 +5,7 @@ require_relative '../test_helper'
|
|
5
5
|
class TestAttendeeMultiWorder < AttendeeTestCase
|
6
6
|
|
7
7
|
def test_basic
|
8
|
-
|
8
|
+
meet({ 'source' => 'tst-mul' }, [
|
9
9
|
ai('FILE|mul.txt'),
|
10
10
|
# John_F_._Kennedy
|
11
11
|
wd('John|IDF', 'john|e'), wd('F|?'), tk('.|PUNC'), wd('Kennedy|IDF', 'kennedy|e'),
|
@@ -26,8 +26,7 @@ class TestAttendeeMultiWorder < AttendeeTestCase
|
|
26
26
|
# Satzende
|
27
27
|
tk('.|PUNC'),
|
28
28
|
ai('EOF|mul.txt')
|
29
|
-
]
|
30
|
-
@expect = [
|
29
|
+
], [
|
31
30
|
ai('FILE|mul.txt'),
|
32
31
|
# John_F_._Kennedy
|
33
32
|
wd('John F. Kennedy|MUL', 'john f. kennedy|m'),
|
@@ -55,330 +54,273 @@ class TestAttendeeMultiWorder < AttendeeTestCase
|
|
55
54
|
# Satzende
|
56
55
|
tk('.|PUNC'),
|
57
56
|
ai('EOF|mul.txt')
|
58
|
-
]
|
59
|
-
meet({'source'=>'tst-mul'})
|
57
|
+
])
|
60
58
|
end
|
61
59
|
|
62
60
|
def test_multiple_prefix
|
63
|
-
|
61
|
+
meet({ 'source' => 'tst-mul' }, [
|
64
62
|
ai('FILE|mul.txt'),
|
65
63
|
wd('Abelsches|IDF', 'abelsch|a'), wd('Schema|IDF', 'schema|s'), tk('.|PUNC'),
|
66
64
|
ai('EOF|mul.txt')
|
67
|
-
]
|
68
|
-
@expect = [
|
65
|
+
], [
|
69
66
|
ai('FILE|mul.txt'),
|
70
67
|
wd('Abelsches Schema|MUL', 'abelsches schema|m'),
|
71
68
|
wd('Abelsches|IDF', 'abelsch|a'), wd('Schema|IDF', 'schema|s'), tk('.|PUNC'),
|
72
69
|
ai('EOF|mul.txt')
|
73
|
-
]
|
74
|
-
meet({'source'=>'tst-mul'})
|
70
|
+
])
|
75
71
|
|
76
|
-
|
72
|
+
meet({ 'source' => 'tst-mul' }, [
|
77
73
|
ai('FILE|mul.txt'),
|
78
74
|
wd('Tolles|IDF', 'toll|a'), wd('abelsches|IDF', 'abelsch|a'), wd('Schema|IDF', 'schema|s'), tk('.|PUNC'),
|
79
75
|
ai('EOF|mul.txt')
|
80
|
-
]
|
81
|
-
@expect = [
|
76
|
+
], [
|
82
77
|
ai('FILE|mul.txt'),
|
83
78
|
wd('Tolles abelsches Schema|MUL', 'tolles abelsches schema|m'),
|
84
79
|
wd('Tolles|IDF', 'toll|a'), wd('abelsches|IDF', 'abelsch|a'), wd('Schema|IDF', 'schema|s'), tk('.|PUNC'),
|
85
80
|
ai('EOF|mul.txt')
|
86
|
-
]
|
87
|
-
meet({'source'=>'tst-mul'})
|
81
|
+
])
|
88
82
|
|
89
|
-
|
83
|
+
meet({ 'source' => 'tst-mul' }, [
|
90
84
|
ai('FILE|mul.txt'),
|
91
85
|
wd('Super|IDF', 'super|a'), wd('tolles|IDF', 'toll|a'), wd('abelsches|IDF', 'abelsch|a'), wd('Schema|IDF', 'schema|s'), tk('.|PUNC'),
|
92
86
|
ai('EOF|mul.txt')
|
93
|
-
]
|
94
|
-
@expect = [
|
87
|
+
], [
|
95
88
|
ai('FILE|mul.txt'),
|
96
89
|
wd('Super tolles abelsches Schema|MUL', 'super tolles abelsches schema|m'),
|
97
90
|
wd('Super|IDF', 'super|a'), wd('tolles|IDF', 'toll|a'), wd('abelsches|IDF', 'abelsch|a'), wd('Schema|IDF', 'schema|s'), tk('.|PUNC'),
|
98
91
|
ai('EOF|mul.txt')
|
99
|
-
]
|
100
|
-
meet({'source'=>'tst-mul'})
|
92
|
+
])
|
101
93
|
|
102
|
-
|
94
|
+
meet({ 'source' => 'tst-mul' }, [
|
103
95
|
ai('FILE|mul.txt'),
|
104
96
|
wd('Extra|IDF', 'extra|a'), wd('super|IDF', 'super|a'), wd('tolles|IDF', 'toll|a'), wd('abelsches|IDF', 'abelsch|a'), wd('Schema|IDF', 'schema|s'), tk('.|PUNC'),
|
105
97
|
ai('EOF|mul.txt')
|
106
|
-
]
|
107
|
-
@expect = [
|
98
|
+
], [
|
108
99
|
ai('FILE|mul.txt'),
|
109
100
|
wd('Extra super tolles abelsches Schema|MUL', 'extra super tolles abelsches schema|m'),
|
110
101
|
wd('Extra|IDF', 'extra|a'), wd('super|IDF', 'super|a'), wd('tolles|IDF', 'toll|a'), wd('abelsches|IDF', 'abelsch|a'), wd('Schema|IDF', 'schema|s'), tk('.|PUNC'),
|
111
102
|
ai('EOF|mul.txt')
|
112
|
-
]
|
113
|
-
meet({'source'=>'tst-mul'})
|
103
|
+
])
|
114
104
|
end
|
115
105
|
|
116
106
|
def test_multiple_suffix
|
117
|
-
|
107
|
+
meet({ 'source' => 'tst-mul' }, [
|
118
108
|
ai('FILE|mul.txt'),
|
119
109
|
wd('Abelsches|IDF', 'abelsch|a'), wd('Schema|IDF', 'schema|s'), tk('.|PUNC'),
|
120
110
|
ai('EOF|mul.txt')
|
121
|
-
]
|
122
|
-
@expect = [
|
111
|
+
], [
|
123
112
|
ai('FILE|mul.txt'),
|
124
113
|
wd('Abelsches Schema|MUL', 'abelsches schema|m'),
|
125
114
|
wd('Abelsches|IDF', 'abelsch|a'), wd('Schema|IDF', 'schema|s'), tk('.|PUNC'),
|
126
115
|
ai('EOF|mul.txt')
|
127
|
-
]
|
128
|
-
meet({'source'=>'tst-mul'})
|
116
|
+
])
|
129
117
|
|
130
|
-
|
118
|
+
meet({ 'source' => 'tst-mul' }, [
|
131
119
|
ai('FILE|mul.txt'),
|
132
120
|
wd('Abelsches|IDF', 'abelsch|a'), wd('Schema|IDF', 'schema|s'), wd('toll|IDF', 'toll|a'), tk('.|PUNC'),
|
133
121
|
ai('EOF|mul.txt')
|
134
|
-
]
|
135
|
-
@expect = [
|
122
|
+
], [
|
136
123
|
ai('FILE|mul.txt'),
|
137
124
|
wd('Abelsches Schema toll|MUL', 'abelsches schema toll|m'),
|
138
125
|
wd('Abelsches|IDF', 'abelsch|a'), wd('Schema|IDF', 'schema|s'), wd('toll|IDF', 'toll|a'), tk('.|PUNC'),
|
139
126
|
ai('EOF|mul.txt')
|
140
|
-
]
|
141
|
-
meet({'source'=>'tst-mul'})
|
127
|
+
])
|
142
128
|
|
143
|
-
|
129
|
+
meet({ 'source' => 'tst-mul' }, [
|
144
130
|
ai('FILE|mul.txt'),
|
145
131
|
wd('Abelsches|IDF', 'abelsch|a'), wd('Schema|IDF', 'schema|s'), wd('toll|IDF', 'toll|a'), wd('super|IDF', 'super|a'), tk('.|PUNC'),
|
146
132
|
ai('EOF|mul.txt')
|
147
|
-
]
|
148
|
-
@expect = [
|
133
|
+
], [
|
149
134
|
ai('FILE|mul.txt'),
|
150
135
|
wd('Abelsches Schema toll super|MUL', 'abelsches schema toll super|m'),
|
151
136
|
wd('Abelsches|IDF', 'abelsch|a'), wd('Schema|IDF', 'schema|s'), wd('toll|IDF', 'toll|a'), wd('super|IDF', 'super|a'), tk('.|PUNC'),
|
152
137
|
ai('EOF|mul.txt')
|
153
|
-
]
|
154
|
-
meet({'source'=>'tst-mul'})
|
138
|
+
])
|
155
139
|
|
156
|
-
|
140
|
+
meet({ 'source' => 'tst-mul' }, [
|
157
141
|
ai('FILE|mul.txt'),
|
158
142
|
wd('Abelsches|IDF', 'abelsch|a'), wd('Schema|IDF', 'schema|s'), wd('toll|IDF', 'toll|a'), wd('super|IDF', 'super|a'), wd('extra|IDF', 'extra|a'), tk('.|PUNC'),
|
159
143
|
ai('EOF|mul.txt')
|
160
|
-
]
|
161
|
-
@expect = [
|
144
|
+
], [
|
162
145
|
ai('FILE|mul.txt'),
|
163
146
|
wd('Abelsches Schema toll super extra|MUL', 'abelsches schema toll super extra|m'),
|
164
147
|
wd('Abelsches|IDF', 'abelsch|a'), wd('Schema|IDF', 'schema|s'), wd('toll|IDF', 'toll|a'), wd('super|IDF', 'super|a'), wd('extra|IDF', 'extra|a'), tk('.|PUNC'),
|
165
148
|
ai('EOF|mul.txt')
|
166
|
-
]
|
167
|
-
meet({'source'=>'tst-mul'})
|
149
|
+
])
|
168
150
|
end
|
169
151
|
|
170
152
|
def test_ending_count
|
171
|
-
|
153
|
+
meet({ 'source' => 'tst-mul' }, input = [
|
172
154
|
ai('FILE|mul.txt'),
|
173
155
|
wd('John|IDF', 'john|e'), wd('F|?'), tk('.|PUNC'), wd('Kennedy|IDF', 'kennedy|e'),
|
174
156
|
wd('war|IDF', 'war|w'), wd('einmal|IDF', 'einmal|w'), wd('Präsident|IDF', 'präsident|s'), tk('.|PUNC'),
|
175
157
|
ai('EOF|mul.txt')
|
176
|
-
]
|
177
|
-
@expect = [
|
158
|
+
], [
|
178
159
|
ai('FILE|mul.txt'),
|
179
160
|
wd('John F. Kennedy|MUL', 'john f. kennedy|m'),
|
180
161
|
wd('John|IDF', 'john|e'), wd('F|MU?'), wd('Kennedy|IDF', 'kennedy|e'),
|
181
162
|
wd('war|IDF', 'war|w'), wd('einmal|IDF', 'einmal|w'), wd('Präsident|IDF', 'präsident|s'), tk('.|PUNC'),
|
182
163
|
ai('EOF|mul.txt')
|
183
|
-
]
|
184
|
-
meet({'source'=>'tst-mul'})
|
164
|
+
])
|
185
165
|
|
186
|
-
|
187
|
-
|
188
|
-
@expect = [
|
166
|
+
input.delete_at(-3)
|
167
|
+
meet({ 'source' => 'tst-mul' }, input, [
|
189
168
|
ai('FILE|mul.txt'),
|
190
169
|
wd('John F. Kennedy|MUL', 'john f. kennedy|m'),
|
191
170
|
wd('John|IDF', 'john|e'), wd('F|MU?'), wd('Kennedy|IDF', 'kennedy|e'),
|
192
171
|
wd('war|IDF', 'war|w'), wd('einmal|IDF', 'einmal|w'), tk('.|PUNC'),
|
193
172
|
ai('EOF|mul.txt')
|
194
|
-
]
|
195
|
-
meet({'source'=>'tst-mul'})
|
173
|
+
])
|
196
174
|
|
197
|
-
|
198
|
-
|
199
|
-
@expect = [
|
175
|
+
input.delete_at(-3)
|
176
|
+
meet({ 'source' => 'tst-mul' }, input, [
|
200
177
|
ai('FILE|mul.txt'),
|
201
178
|
wd('John F. Kennedy|MUL', 'john f. kennedy|m'),
|
202
179
|
wd('John|IDF', 'john|e'), wd('F|MU?'), wd('Kennedy|IDF', 'kennedy|e'),
|
203
180
|
wd('war|IDF', 'war|w'), tk('.|PUNC'),
|
204
181
|
ai('EOF|mul.txt')
|
205
|
-
]
|
206
|
-
meet({'source'=>'tst-mul'})
|
182
|
+
])
|
207
183
|
|
208
|
-
|
209
|
-
|
210
|
-
@expect = [
|
184
|
+
input.delete_at(-3)
|
185
|
+
meet({ 'source' => 'tst-mul' }, input, [
|
211
186
|
ai('FILE|mul.txt'),
|
212
187
|
wd('John F. Kennedy|MUL', 'john f. kennedy|m'),
|
213
188
|
wd('John|IDF', 'john|e'), wd('F|MU?'), wd('Kennedy|IDF', 'kennedy|e'),
|
214
189
|
tk('.|PUNC'),
|
215
190
|
ai('EOF|mul.txt')
|
216
|
-
]
|
217
|
-
meet({'source'=>'tst-mul'})
|
191
|
+
])
|
218
192
|
end
|
219
193
|
|
220
194
|
def test_two_sources_mode_first
|
221
195
|
# in keinen WB enthalten
|
222
|
-
|
196
|
+
meet({ 'source' => 'tst-mul,tst-mu2', 'mode' => 'first' }, [
|
223
197
|
wd('intelligente|IDF', 'intelligent|a'), wd('Indexierung|IDF', 'indexierung|s'), ai('EOF|mul.txt')
|
224
|
-
]
|
225
|
-
@expect = [
|
198
|
+
], [
|
226
199
|
wd('intelligente|IDF', 'intelligent|a'), wd('Indexierung|IDF', 'indexierung|s'), ai('EOF|mul.txt')
|
227
|
-
]
|
228
|
-
meet({'source'=>'tst-mul,tst-mu2', 'mode'=>'first'})
|
200
|
+
])
|
229
201
|
|
230
202
|
# im ersten WB enthalten
|
231
|
-
|
203
|
+
meet({ 'source' => 'tst-mul,tst-mu2', 'mode' => 'first' }, [
|
232
204
|
wd('abstrakten|IDF', 'abstrakt|a'), wd('Kunst|IDF', 'kunst|s'), ai('EOF|mul.txt')
|
233
|
-
]
|
234
|
-
@expect = [
|
205
|
+
], [
|
235
206
|
wd('abstrakten Kunst|MUL', 'abstrakte kunst|m'),
|
236
207
|
wd('abstrakten|IDF', 'abstrakt|a'), wd('Kunst|IDF', 'kunst|s'), ai('EOF|mul.txt')
|
237
|
-
]
|
238
|
-
meet({'source'=>'tst-mul,tst-mu2', 'mode'=>'first'})
|
208
|
+
])
|
239
209
|
|
240
210
|
# im zweiten WB enthalten
|
241
|
-
|
211
|
+
meet({ 'source' => 'tst-mul,tst-mu2', 'mode' => 'first' }, [
|
242
212
|
wd('traumatischer|IDF', 'traumatisch|a'), wd('Angelegenheit|IDF', 'angelegenheit|s'), ai('EOF|mul.txt')
|
243
|
-
]
|
244
|
-
@expect = [
|
213
|
+
], [
|
245
214
|
wd('traumatischer Angelegenheit|MUL', 'traumatische angelegenheit|m'),
|
246
215
|
wd('traumatischer|IDF', 'traumatisch|a'), wd('Angelegenheit|IDF', 'angelegenheit|s'), ai('EOF|mul.txt')
|
247
|
-
]
|
248
|
-
meet({'source'=>'tst-mul,tst-mu2', 'mode'=>'first'})
|
216
|
+
])
|
249
217
|
|
250
218
|
# in beiden WB enthalten
|
251
|
-
|
219
|
+
meet({ 'source' => 'tst-mul,tst-mu2', 'mode' => 'first' }, [
|
252
220
|
wd('azyklischen|IDF', 'azyklisch|a'), wd('Bewegungen|IDF', 'bewegung|s'), ai('EOF|mul.txt')
|
253
|
-
]
|
254
|
-
@expect = [
|
221
|
+
], [
|
255
222
|
wd('azyklischen Bewegungen|MUL', 'chaotisches movement|m'),
|
256
223
|
wd('azyklischen|IDF', 'azyklisch|a'), wd('Bewegungen|IDF', 'bewegung|s'), ai('EOF|mul.txt')
|
257
|
-
]
|
258
|
-
meet({'source'=>'tst-mul,tst-mu2', 'mode'=>'first'})
|
224
|
+
])
|
259
225
|
end
|
260
226
|
|
261
227
|
def test_two_sources_mode_first_flipped
|
262
228
|
# in keinen WB enthalten
|
263
|
-
|
229
|
+
meet({ 'source' => 'tst-mu2,tst-mul', 'mode' => 'first' }, [
|
264
230
|
wd('intelligente|IDF', 'intelligent|a'), wd('Indexierung|IDF', 'indexierung|s'), ai('EOF|mul.txt')
|
265
|
-
]
|
266
|
-
@expect = [
|
231
|
+
], [
|
267
232
|
wd('intelligente|IDF', 'intelligent|a'), wd('Indexierung|IDF', 'indexierung|s'), ai('EOF|mul.txt')
|
268
|
-
]
|
269
|
-
meet({'source'=>'tst-mu2,tst-mul', 'mode'=>'first'})
|
233
|
+
])
|
270
234
|
|
271
235
|
# im ersten WB enthalten
|
272
|
-
|
236
|
+
meet({ 'source' => 'tst-mu2,tst-mul', 'mode' => 'first' }, [
|
273
237
|
wd('abstrakten|IDF', 'abstrakt|a'), wd('Kunst|IDF', 'kunst|s'), ai('EOF|mul.txt')
|
274
|
-
]
|
275
|
-
@expect = [
|
238
|
+
], [
|
276
239
|
wd('abstrakten Kunst|MUL', 'abstrakte kunst|m'),
|
277
240
|
wd('abstrakten|IDF', 'abstrakt|a'), wd('Kunst|IDF', 'kunst|s'), ai('EOF|mul.txt')
|
278
|
-
]
|
279
|
-
meet({'source'=>'tst-mu2,tst-mul', 'mode'=>'first'})
|
241
|
+
])
|
280
242
|
|
281
243
|
# im zweiten WB enthalten
|
282
|
-
|
244
|
+
meet({ 'source' => 'tst-mu2,tst-mul', 'mode' => 'first' }, [
|
283
245
|
wd('traumatischer|IDF', 'traumatisch|a'), wd('Angelegenheit|IDF', 'angelegenheit|s'), ai('EOF|mul.txt')
|
284
|
-
]
|
285
|
-
@expect = [
|
246
|
+
], [
|
286
247
|
wd('traumatischer Angelegenheit|MUL', 'traumatische angelegenheit|m'),
|
287
248
|
wd('traumatischer|IDF', 'traumatisch|a'), wd('Angelegenheit|IDF', 'angelegenheit|s'), ai('EOF|mul.txt')
|
288
|
-
]
|
289
|
-
meet({'source'=>'tst-mu2,tst-mul', 'mode'=>'first'})
|
249
|
+
])
|
290
250
|
|
291
251
|
# in beiden WB enthalten
|
292
|
-
|
252
|
+
meet({ 'source' => 'tst-mu2,tst-mul', 'mode' => 'first' }, [
|
293
253
|
wd('azyklischen|IDF', 'azyklisch|a'), wd('Bewegungen|IDF', 'bewegung|s'), ai('EOF|mul.txt')
|
294
|
-
]
|
295
|
-
@expect = [
|
254
|
+
], [
|
296
255
|
wd('azyklischen Bewegungen|MUL', 'azyklische bewegung|m'),
|
297
256
|
wd('azyklischen|IDF', 'azyklisch|a'), wd('Bewegungen|IDF', 'bewegung|s'), ai('EOF|mul.txt')
|
298
|
-
]
|
299
|
-
meet({'source'=>'tst-mu2,tst-mul', 'mode'=>'first'})
|
257
|
+
])
|
300
258
|
end
|
301
259
|
|
302
260
|
def test_select_two_sources_mode_all
|
303
261
|
# in keinen WB enthalten
|
304
|
-
|
262
|
+
meet({ 'source' => 'tst-mu2,tst-mul', 'mode' => 'all' }, [
|
305
263
|
wd('intelligente|IDF', 'intelligent|a'), wd('Indexierung|IDF', 'indexierung|s'), ai('EOF|mul.txt')
|
306
|
-
]
|
307
|
-
@expect = [
|
264
|
+
], [
|
308
265
|
wd('intelligente|IDF', 'intelligent|a'), wd('Indexierung|IDF', 'indexierung|s'), ai('EOF|mul.txt')
|
309
|
-
]
|
310
|
-
meet({'source'=>'tst-mu2,tst-mul', 'mode'=>'all'})
|
266
|
+
])
|
311
267
|
|
312
268
|
# im ersten WB enthalten
|
313
|
-
|
269
|
+
meet({ 'source' => 'tst-mu2,tst-mul', 'mode' => 'all' }, [
|
314
270
|
wd('abstrakten|IDF', 'abstrakt|a'), wd('Kunst|IDF', 'kunst|s'), ai('EOF|mul.txt')
|
315
|
-
]
|
316
|
-
@expect = [
|
271
|
+
], [
|
317
272
|
wd('abstrakten Kunst|MUL', 'abstrakte kunst|m'),
|
318
273
|
wd('abstrakten|IDF', 'abstrakt|a'), wd('Kunst|IDF', 'kunst|s'), ai('EOF|mul.txt')
|
319
|
-
]
|
320
|
-
meet({'source'=>'tst-mu2,tst-mul', 'mode'=>'all'})
|
274
|
+
])
|
321
275
|
|
322
276
|
# im zweiten WB enthalten
|
323
|
-
|
277
|
+
meet({ 'source' => 'tst-mu2,tst-mul', 'mode' => 'all' }, [
|
324
278
|
wd('traumatischer|IDF', 'traumatisch|a'), wd('Angelegenheit|IDF', 'angelegenheit|s'), ai('EOF|mul.txt')
|
325
|
-
]
|
326
|
-
@expect = [
|
279
|
+
], [
|
327
280
|
wd('traumatischer Angelegenheit|MUL', 'traumatische angelegenheit|m'),
|
328
281
|
wd('traumatischer|IDF', 'traumatisch|a'), wd('Angelegenheit|IDF', 'angelegenheit|s'), ai('EOF|mul.txt')
|
329
|
-
]
|
330
|
-
meet({'source'=>'tst-mu2,tst-mul', 'mode'=>'all'})
|
282
|
+
])
|
331
283
|
|
332
284
|
# in beiden WB enthalten
|
333
|
-
|
285
|
+
meet({ 'source' => 'tst-mu2,tst-mul', 'mode' => 'all' }, [
|
334
286
|
wd('azyklischen|IDF', 'azyklisch|a'), wd('Bewegungen|IDF', 'bewegung|s'), ai('EOF|mul.txt')
|
335
|
-
]
|
336
|
-
@expect = [
|
287
|
+
], [
|
337
288
|
wd('azyklischen Bewegungen|MUL', 'azyklische bewegung|m', 'chaotisches movement|m'),
|
338
289
|
wd('azyklischen|IDF', 'azyklisch|a'), wd('Bewegungen|IDF', 'bewegung|s'), ai('EOF|mul.txt')
|
339
|
-
]
|
340
|
-
meet({'source'=>'tst-mu2,tst-mul', 'mode'=>'all'})
|
290
|
+
])
|
341
291
|
end
|
342
292
|
|
343
293
|
def test_select_two_sources_mode_def
|
344
294
|
# in keinen WB enthalten
|
345
|
-
|
295
|
+
meet({ 'source' => 'tst-mu2,tst-mul' }, [
|
346
296
|
wd('intelligente|IDF', 'intelligent|a'), wd('Indexierung|IDF', 'indexierung|s'), ai('EOF|mul.txt')
|
347
|
-
]
|
348
|
-
@expect = [
|
297
|
+
], [
|
349
298
|
wd('intelligente|IDF', 'intelligent|a'), wd('Indexierung|IDF', 'indexierung|s'), ai('EOF|mul.txt')
|
350
|
-
]
|
351
|
-
meet({'source'=>'tst-mu2,tst-mul'})
|
299
|
+
])
|
352
300
|
|
353
301
|
# im ersten WB enthalten
|
354
|
-
|
302
|
+
meet({ 'source' => 'tst-mu2,tst-mul' }, [
|
355
303
|
wd('abstrakten|IDF', 'abstrakt|a'), wd('Kunst|IDF', 'kunst|s'), ai('EOF|mul.txt')
|
356
|
-
]
|
357
|
-
@expect = [
|
304
|
+
], [
|
358
305
|
wd('abstrakten Kunst|MUL', 'abstrakte kunst|m'),
|
359
306
|
wd('abstrakten|IDF', 'abstrakt|a'), wd('Kunst|IDF', 'kunst|s'), ai('EOF|mul.txt')
|
360
|
-
]
|
361
|
-
meet({'source'=>'tst-mu2,tst-mul'})
|
307
|
+
])
|
362
308
|
|
363
309
|
# im zweiten WB enthalten
|
364
|
-
|
310
|
+
meet({ 'source' => 'tst-mu2,tst-mul' }, [
|
365
311
|
wd('traumatischer|IDF', 'traumatisch|a'), wd('Angelegenheit|IDF', 'angelegenheit|s'), ai('EOF|mul.txt')
|
366
|
-
]
|
367
|
-
@expect = [
|
312
|
+
], [
|
368
313
|
wd('traumatischer Angelegenheit|MUL', 'traumatische angelegenheit|m'),
|
369
314
|
wd('traumatischer|IDF', 'traumatisch|a'), wd('Angelegenheit|IDF', 'angelegenheit|s'), ai('EOF|mul.txt')
|
370
|
-
]
|
371
|
-
meet({'source'=>'tst-mu2,tst-mul'})
|
315
|
+
])
|
372
316
|
|
373
317
|
# in beiden WB enthalten
|
374
|
-
|
318
|
+
meet({ 'source' => 'tst-mu2,tst-mul' }, [
|
375
319
|
wd('azyklischen|IDF', 'azyklisch|a'), wd('Bewegungen|IDF', 'bewegung|s'), ai('EOF|mul.txt')
|
376
|
-
]
|
377
|
-
@expect = [
|
320
|
+
], [
|
378
321
|
wd('azyklischen Bewegungen|MUL', 'azyklische bewegung|m', 'chaotisches movement|m'),
|
379
322
|
wd('azyklischen|IDF', 'azyklisch|a'), wd('Bewegungen|IDF', 'bewegung|s'), ai('EOF|mul.txt')
|
380
|
-
]
|
381
|
-
meet({'source'=>'tst-mu2,tst-mul'})
|
323
|
+
])
|
382
324
|
end
|
383
325
|
|
384
326
|
end
|
@@ -5,9 +5,11 @@ require_relative '../test_helper'
|
|
5
5
|
class TestAttendeeNonewordFilter < AttendeeTestCase
|
6
6
|
|
7
7
|
def test_basic
|
8
|
-
|
9
|
-
|
10
|
-
|
8
|
+
meet({}, [
|
9
|
+
wd('Eins|IDF'), wd('Zwei|?'), wd('Drei|IDF'), wd('Vier|?'), ai('EOF|')
|
10
|
+
], [
|
11
|
+
'vier', 'zwei', ai('EOF|')
|
12
|
+
])
|
11
13
|
end
|
12
14
|
|
13
15
|
end
|
@@ -5,9 +5,11 @@ require_relative '../test_helper'
|
|
5
5
|
class TestAttendeeObjectFilter < AttendeeTestCase
|
6
6
|
|
7
7
|
def test_basic
|
8
|
-
|
9
|
-
|
10
|
-
|
8
|
+
meet({ 'objects' => 'obj.form =~ /^[A-Z]/' }, [
|
9
|
+
wd('Eins|IDF'), wd('zwei|?'), wd('Drei|IDF'), wd('vier|?'), ai('EOF|')
|
10
|
+
], [
|
11
|
+
wd('Eins|IDF'), wd('Drei|IDF'), ai('EOF|')
|
12
|
+
])
|
11
13
|
end
|
12
14
|
|
13
15
|
end
|
@@ -5,7 +5,7 @@ require_relative '../test_helper'
|
|
5
5
|
class TestAttendeeSequencer < AttendeeTestCase
|
6
6
|
|
7
7
|
def test_basic
|
8
|
-
|
8
|
+
meet({ 'stopper' => 'PUNC,OTHR', 'source' => 'sys-mul' }, [
|
9
9
|
# AS
|
10
10
|
wd('Die|IDF', 'die|w'),
|
11
11
|
wd('helle|IDF', 'hell|a'),
|
@@ -16,8 +16,7 @@ class TestAttendeeSequencer < AttendeeTestCase
|
|
16
16
|
wd('schöne|IDF', 'schön|a'),
|
17
17
|
wd('Sonnenuntergang|KOM', 'sonnenuntergang|k', 'sonne|s+', 'untergang|s+'),
|
18
18
|
ai('EOF|')
|
19
|
-
]
|
20
|
-
@expect = [
|
19
|
+
], [
|
21
20
|
# AS
|
22
21
|
wd('Die|IDF', 'die|w'),
|
23
22
|
wd('sonne, hell|SEQ', 'sonne, hell|q'),
|
@@ -30,8 +29,7 @@ class TestAttendeeSequencer < AttendeeTestCase
|
|
30
29
|
wd('schöne|IDF', 'schön|a'),
|
31
30
|
wd('Sonnenuntergang|KOM', 'sonnenuntergang|k', 'sonne|s+', 'untergang|s+'),
|
32
31
|
ai('EOF|')
|
33
|
-
]
|
34
|
-
meet({'stopper'=>'PUNC,OTHR', 'source'=>'sys-mul'})
|
32
|
+
])
|
35
33
|
end
|
36
34
|
|
37
35
|
end
|