scylla 1.0.0 → 1.0.7
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- data/lib/scylla/classifier.rb +3 -2
- data/lib/scylla/generator.rb +11 -4
- data/lib/scylla/lms/arabic.lm +398 -398
- data/lib/scylla/lms/bulgarian.lm +268 -268
- data/lib/scylla/lms/catalan.lm +400 -400
- data/lib/scylla/lms/chinese.lm +345 -345
- data/lib/scylla/lms/czech.lm +382 -382
- data/lib/scylla/lms/danish.lm +354 -354
- data/lib/scylla/lms/dutch.lm +380 -380
- data/lib/scylla/lms/english.lm +327 -327
- data/lib/scylla/lms/finnish.lm +297 -297
- data/lib/scylla/lms/french.lm +348 -348
- data/lib/scylla/lms/german.lm +386 -386
- data/lib/scylla/lms/greek.lm +352 -352
- data/lib/scylla/lms/hebrew.lm +385 -385
- data/lib/scylla/lms/hindi.lm +400 -400
- data/lib/scylla/lms/icelandic.lm +195 -195
- data/lib/scylla/lms/indonesian.lm +374 -374
- data/lib/scylla/lms/italian.lm +365 -365
- data/lib/scylla/lms/japanese.lm +368 -368
- data/lib/scylla/lms/kannada.lm +299 -299
- data/lib/scylla/lms/korean.lm +335 -335
- data/lib/scylla/lms/marathi.lm +240 -240
- data/lib/scylla/lms/norwegian.lm +348 -348
- data/lib/scylla/lms/persian.lm +337 -337
- data/lib/scylla/lms/polish.lm +399 -399
- data/lib/scylla/lms/portuguese.lm +386 -386
- data/lib/scylla/lms/romanian.lm +255 -255
- data/lib/scylla/lms/russian.lm +400 -400
- data/lib/scylla/lms/slovak.lm +267 -267
- data/lib/scylla/lms/slovenian.lm +243 -243
- data/lib/scylla/lms/spanish.lm +371 -371
- data/lib/scylla/lms/swedish.lm +236 -236
- data/lib/scylla/lms/tagalog.lm +287 -287
- data/lib/scylla/lms/thai.lm +369 -369
- data/lib/scylla/lms/turkish.lm +341 -341
- data/lib/scylla/lms/vietnamese.lm +392 -392
- data/lib/scylla/lms/welsh.lm +275 -275
- data/lib/scylla/loader.rb +1 -1
- metadata +2 -2
data/lib/scylla/lms/french.lm
CHANGED
@@ -1,400 +1,400 @@
|
|
1
|
-
_
|
2
|
-
e
|
3
|
-
s
|
4
|
-
a
|
5
|
-
n
|
6
|
-
t
|
7
|
-
i
|
8
|
-
r
|
9
|
-
l
|
10
|
-
e_
|
11
|
-
u
|
12
|
-
o
|
13
|
-
s_
|
14
|
-
d
|
15
|
-
p
|
16
|
-
_d
|
17
|
-
c
|
18
|
-
_l
|
19
|
-
es
|
20
|
-
m
|
21
|
-
t_
|
22
|
-
é
|
23
|
-
es_
|
24
|
-
de
|
25
|
-
|
26
|
-
|
27
|
-
|
28
|
-
|
29
|
-
_de
|
30
|
-
on
|
31
|
-
nt
|
32
|
-
an
|
33
|
-
n_
|
34
|
-
re
|
35
|
-
la
|
36
|
-
f
|
37
|
-
de_
|
38
|
-
_s
|
39
|
-
a_
|
40
|
-
_le
|
41
|
-
ti
|
42
|
-
_c
|
43
|
-
_a
|
44
|
-
is
|
45
|
-
_la
|
46
|
-
la_
|
47
|
-
|
48
|
-
|
49
|
-
|
50
|
-
|
51
|
-
|
52
|
-
|
53
|
-
ent
|
54
|
-
et
|
55
|
-
_f
|
56
|
-
ar
|
57
|
-
|
58
|
-
u_
|
59
|
-
|
60
|
-
|
61
|
-
|
62
|
-
et_
|
63
|
-
|
64
|
-
it
|
65
|
-
|
66
|
-
|
67
|
-
|
68
|
-
|
69
|
-
|
70
|
-
|
71
|
-
|
72
|
-
_et
|
73
|
-
se
|
74
|
-
ne
|
75
|
-
les
|
76
|
-
er
|
77
|
-
|
78
|
-
|
1
|
+
_ 28636
|
2
|
+
e 10430
|
3
|
+
s 5914
|
4
|
+
a 5472
|
5
|
+
n 5393
|
6
|
+
t 5099
|
7
|
+
i 4932
|
8
|
+
r 4670
|
9
|
+
l 4370
|
10
|
+
e_ 4092
|
11
|
+
u 3743
|
12
|
+
o 3605
|
13
|
+
s_ 3324
|
14
|
+
d 2983
|
15
|
+
p 2365
|
16
|
+
_d 2316
|
17
|
+
c 2240
|
18
|
+
_l 2186
|
19
|
+
es 2042
|
20
|
+
m 1966
|
21
|
+
t_ 1954
|
22
|
+
é 1786
|
23
|
+
es_ 1643
|
24
|
+
de 1560
|
25
|
+
le 1460
|
26
|
+
en 1426
|
27
|
+
_e 1411
|
28
|
+
_p 1353
|
29
|
+
_de 1337
|
30
|
+
on 1239
|
31
|
+
nt 1203
|
32
|
+
an 1102
|
33
|
+
n_ 1076
|
34
|
+
re 992
|
35
|
+
la 939
|
36
|
+
f 939
|
37
|
+
de_ 933
|
38
|
+
_s 865
|
39
|
+
a_ 853
|
40
|
+
_le 833
|
41
|
+
ti 828
|
42
|
+
_c 820
|
43
|
+
_a 809
|
44
|
+
is 802
|
45
|
+
_la 770
|
46
|
+
la_ 745
|
47
|
+
nt_ 741
|
48
|
+
le_ 740
|
49
|
+
g 739
|
50
|
+
ra 735
|
51
|
+
v 685
|
52
|
+
’ 682
|
53
|
+
ent 672
|
54
|
+
et 657
|
55
|
+
_f 646
|
56
|
+
ar 619
|
57
|
+
te 606
|
58
|
+
u_ 605
|
59
|
+
ce 602
|
60
|
+
pa 592
|
61
|
+
r_ 586
|
62
|
+
et_ 580
|
63
|
+
q 579
|
64
|
+
it 576
|
65
|
+
me 569
|
66
|
+
_m 569
|
67
|
+
qu 565
|
68
|
+
in 561
|
69
|
+
ai 560
|
70
|
+
ur 555
|
71
|
+
ns 553
|
72
|
+
_et 550
|
73
|
+
se 548
|
74
|
+
ne 530
|
75
|
+
les 500
|
76
|
+
er 498
|
77
|
+
au 492
|
78
|
+
st 491
|
79
79
|
ue 487
|
80
|
-
b
|
81
|
-
io
|
80
|
+
b 485
|
81
|
+
io 476
|
82
|
+
co 475
|
82
83
|
_pa 471
|
83
|
-
|
84
|
-
|
85
|
-
|
86
|
-
nc 448
|
84
|
+
_en 470
|
85
|
+
ion 456
|
86
|
+
nc 453
|
87
87
|
tr 445
|
88
|
-
ran
|
89
|
-
ri
|
90
|
-
at
|
91
|
-
ou
|
92
|
-
ie
|
93
|
-
_r
|
94
|
-
re_
|
95
|
-
eu
|
96
|
-
|
97
|
-
|
98
|
-
|
88
|
+
ran 444
|
89
|
+
ri 443
|
90
|
+
at 443
|
91
|
+
ou 438
|
92
|
+
ie 435
|
93
|
+
_r 430
|
94
|
+
re_ 427
|
95
|
+
eu 413
|
96
|
+
on_ 408
|
97
|
+
des 406
|
98
|
+
par 406
|
99
99
|
en_ 399
|
100
|
-
|
101
|
-
|
102
|
-
|
103
|
-
|
104
|
-
|
105
|
-
po
|
106
|
-
|
107
|
-
|
108
|
-
|
109
|
-
|
110
|
-
|
111
|
-
|
112
|
-
|
113
|
-
|
114
|
-
|
115
|
-
|
116
|
-
|
117
|
-
|
118
|
-
|
119
|
-
fra
|
120
|
-
or
|
121
|
-
|
122
|
-
so
|
123
|
-
rt
|
124
|
-
oi
|
125
|
-
à_
|
126
|
-
à
|
127
|
-
du
|
128
|
-
ré
|
129
|
-
nce
|
130
|
-
is_
|
131
|
-
_à
|
132
|
-
_à
|
133
|
-
anc
|
134
|
-
x
|
135
|
-
|
136
|
-
|
137
|
-
|
138
|
-
_n
|
139
|
-
|
140
|
-
us
|
141
|
-
|
142
|
-
|
143
|
-
|
144
|
-
|
145
|
-
|
146
|
-
|
147
|
-
|
148
|
-
|
149
|
-
|
150
|
-
|
151
|
-
|
152
|
-
|
153
|
-
|
154
|
-
|
100
|
+
li 397
|
101
|
+
ta 393
|
102
|
+
fr 392
|
103
|
+
ns_ 389
|
104
|
+
al 389
|
105
|
+
po 389
|
106
|
+
ce_ 378
|
107
|
+
l’ 377
|
108
|
+
_l’ 375
|
109
|
+
_t 375
|
110
|
+
em 375
|
111
|
+
ro 375
|
112
|
+
un 373
|
113
|
+
h 372
|
114
|
+
pr 372
|
115
|
+
_fr 368
|
116
|
+
_co 358
|
117
|
+
tio 357
|
118
|
+
ne_ 356
|
119
|
+
fra 351
|
120
|
+
or 350
|
121
|
+
que 346
|
122
|
+
so 341
|
123
|
+
rt 334
|
124
|
+
oi 333
|
125
|
+
à_ 330
|
126
|
+
à 330
|
127
|
+
du 322
|
128
|
+
ré 319
|
129
|
+
nce 318
|
130
|
+
is_ 317
|
131
|
+
_à_ 316
|
132
|
+
_à 316
|
133
|
+
anc 312
|
134
|
+
x 311
|
135
|
+
si 303
|
136
|
+
est 300
|
137
|
+
el 298
|
138
|
+
_n 297
|
139
|
+
_au 296
|
140
|
+
us 293
|
141
|
+
_u 291
|
142
|
+
ll 291
|
143
|
+
om 290
|
144
|
+
ue_ 289
|
145
|
+
é_ 289
|
146
|
+
nd 287
|
147
|
+
pl 286
|
148
|
+
ma 283
|
149
|
+
ui 278
|
150
|
+
è 278
|
151
|
+
_pr 273
|
152
|
+
_un 272
|
153
|
+
ée 267
|
154
|
+
ati 264
|
155
|
+
men 263
|
155
156
|
ir 263
|
156
|
-
|
157
|
-
|
158
|
-
lu
|
159
|
-
|
160
|
-
_so 258
|
157
|
+
_du 263
|
158
|
+
_so 262
|
159
|
+
lu 262
|
160
|
+
du_ 259
|
161
161
|
ont 257
|
162
|
-
|
163
|
-
st_ 250
|
164
|
-
ve 249
|
162
|
+
ve 252
|
165
163
|
mi 249
|
166
|
-
|
167
|
-
|
168
|
-
_qu
|
169
|
-
|
170
|
-
|
171
|
-
|
172
|
-
|
164
|
+
st_ 249
|
165
|
+
rs 247
|
166
|
+
_qu 245
|
167
|
+
_q 245
|
168
|
+
i_ 243
|
169
|
+
és 241
|
170
|
+
ci 241
|
171
|
+
té 237
|
172
|
+
ut 235
|
173
173
|
di 235
|
174
|
-
|
175
|
-
|
176
|
-
|
177
|
-
|
178
|
-
|
179
|
-
|
180
|
-
|
181
|
-
pe
|
182
|
-
|
183
|
-
|
184
|
-
au_
|
185
|
-
|
186
|
-
|
174
|
+
mo 232
|
175
|
+
_o 231
|
176
|
+
ant 230
|
177
|
+
_es 229
|
178
|
+
ss 228
|
179
|
+
_é 226
|
180
|
+
eur 223
|
181
|
+
pe 220
|
182
|
+
ais 215
|
183
|
+
l_ 215
|
184
|
+
au_ 213
|
185
|
+
lle 212
|
186
|
+
con 212
|
187
|
+
_po 211
|
187
188
|
res 209
|
188
|
-
|
189
|
-
|
189
|
+
te_ 209
|
190
|
+
na 205
|
190
191
|
ct 204
|
191
|
-
il
|
192
|
-
|
193
|
-
|
194
|
-
|
195
|
-
|
196
|
-
|
197
|
-
|
198
|
-
|
199
|
-
|
200
|
-
|
201
|
-
|
202
|
-
|
203
|
-
|
204
|
-
|
205
|
-
|
206
|
-
|
207
|
-
|
208
|
-
|
209
|
-
|
192
|
+
il 203
|
193
|
+
da 203
|
194
|
+
ux 200
|
195
|
+
x_ 199
|
196
|
+
iqu 199
|
197
|
+
iq 199
|
198
|
+
nn 199
|
199
|
+
son 198
|
200
|
+
_pl 198
|
201
|
+
y 198
|
202
|
+
d’ 198
|
203
|
+
rs_ 197
|
204
|
+
ol 197
|
205
|
+
ons 194
|
206
|
+
_d’ 193
|
207
|
+
me_ 193
|
208
|
+
_se 192
|
209
|
+
ur_ 192
|
210
|
+
ar_ 192
|
210
211
|
lo 191
|
211
|
-
_i
|
212
|
-
me_ 189
|
213
|
-
_se 187
|
212
|
+
_i 189
|
214
213
|
to 187
|
215
214
|
no 186
|
216
|
-
|
217
|
-
|
218
|
-
eme
|
219
|
-
|
220
|
-
|
221
|
-
|
222
|
-
|
223
|
-
|
224
|
-
|
225
|
-
|
226
|
-
|
227
|
-
pp 172
|
215
|
+
ch 185
|
216
|
+
ux_ 184
|
217
|
+
eme 182
|
218
|
+
_re 179
|
219
|
+
ec 179
|
220
|
+
tre 177
|
221
|
+
us_ 177
|
222
|
+
vi 176
|
223
|
+
ans 175
|
224
|
+
_mo 173
|
225
|
+
ic 173
|
228
226
|
pu 172
|
229
|
-
|
227
|
+
dé 171
|
230
228
|
mp 171
|
231
|
-
|
232
|
-
lus 170
|
229
|
+
lus 171
|
233
230
|
art 170
|
234
|
-
_ma
|
231
|
+
_ma 168
|
232
|
+
un_ 168
|
233
|
+
plu 166
|
235
234
|
ire 166
|
236
|
-
|
237
|
-
ale 166
|
235
|
+
une 166
|
238
236
|
_v 165
|
239
|
-
|
240
|
-
|
241
|
-
|
242
|
-
|
237
|
+
ale 165
|
238
|
+
se_ 164
|
239
|
+
ét 164
|
240
|
+
op 164
|
241
|
+
dan 161
|
243
242
|
gr 161
|
244
|
-
_g
|
245
|
-
|
246
|
-
|
247
|
-
|
248
|
-
|
249
|
-
ac
|
250
|
-
sa
|
251
|
-
j 153
|
243
|
+
_g 160
|
244
|
+
ul 159
|
245
|
+
_ce 157
|
246
|
+
j 154
|
247
|
+
tu 153
|
248
|
+
ac 153
|
249
|
+
sa 153
|
252
250
|
mm 153
|
251
|
+
né 153
|
252
|
+
ts 152
|
253
|
+
fi 151
|
254
|
+
ts_ 151
|
253
255
|
’a 151
|
254
|
-
|
255
|
-
|
256
|
-
|
257
|
-
|
258
|
-
|
259
|
-
|
260
|
-
as
|
261
|
-
|
262
|
-
|
263
|
-
|
264
|
-
|
265
|
-
|
266
|
-
|
267
|
-
|
268
|
-
|
269
|
-
|
270
|
-
|
271
|
-
|
272
|
-
|
273
|
-
|
274
|
-
|
275
|
-
ér 133
|
276
|
-
our 133
|
277
|
-
ç 133
|
278
|
-
ia 133
|
256
|
+
im 150
|
257
|
+
és_ 150
|
258
|
+
it_ 146
|
259
|
+
er_ 144
|
260
|
+
_dé 142
|
261
|
+
_da 142
|
262
|
+
as 141
|
263
|
+
su 139
|
264
|
+
ep 139
|
265
|
+
té_ 138
|
266
|
+
bl 138
|
267
|
+
ge 138
|
268
|
+
our 137
|
269
|
+
_ré 136
|
270
|
+
ell 136
|
271
|
+
ise 136
|
272
|
+
rti 135
|
273
|
+
ç 134
|
274
|
+
ér 134
|
275
|
+
ag 132
|
276
|
+
ia 132
|
279
277
|
_no 131
|
280
|
-
|
281
|
-
|
282
|
-
|
283
|
-
|
284
|
-
|
285
|
-
nça
|
286
|
-
ça
|
287
|
-
|
288
|
-
|
289
|
-
|
290
|
-
|
291
|
-
|
292
|
-
|
293
|
-
|
294
|
-
|
278
|
+
ée_ 131
|
279
|
+
ien 128
|
280
|
+
nç 128
|
281
|
+
ntr 127
|
282
|
+
’e 125
|
283
|
+
nça 125
|
284
|
+
ça 125
|
285
|
+
anç 124
|
286
|
+
ni 124
|
287
|
+
iv 123
|
288
|
+
çai 122
|
289
|
+
ort 122
|
290
|
+
com 121
|
291
|
+
ond 119
|
292
|
+
aux 119
|
295
293
|
rr 117
|
296
|
-
|
297
|
-
|
298
|
-
ui_ 115
|
294
|
+
ui_ 116
|
295
|
+
’_ 115
|
299
296
|
ins 113
|
300
297
|
tra 112
|
301
298
|
_tr 112
|
299
|
+
_pe 111
|
302
300
|
ain 111
|
303
|
-
|
304
|
-
’_ 110
|
301
|
+
iè 110
|
305
302
|
ées 109
|
306
|
-
|
307
|
-
|
308
|
-
|
309
|
-
|
303
|
+
ie_ 109
|
304
|
+
ca 109
|
305
|
+
mb 108
|
306
|
+
d_ 108
|
307
|
+
ig 108
|
308
|
+
ine 108
|
310
309
|
_su 107
|
311
|
-
|
312
|
-
|
313
|
-
ine 106
|
314
|
-
_b 105
|
310
|
+
ses 107
|
311
|
+
qui 107
|
315
312
|
do 105
|
313
|
+
_b 105
|
314
|
+
éc 105
|
315
|
+
br 105
|
316
316
|
_di 104
|
317
|
-
|
318
|
-
|
319
|
-
d_ 104
|
320
|
-
br 104
|
321
|
-
fa 103
|
322
|
-
mme 103
|
317
|
+
nne 104
|
318
|
+
fo 104
|
323
319
|
ect 103
|
324
|
-
|
325
|
-
|
326
|
-
|
327
|
-
ot 101
|
320
|
+
mme 103
|
321
|
+
fa 103
|
322
|
+
ot 103
|
328
323
|
sé 101
|
324
|
+
ap 101
|
325
|
+
uv 100
|
329
326
|
rés 100
|
330
|
-
|
331
|
-
fo 100
|
332
|
-
cu 99
|
333
|
-
uis 99
|
334
|
-
mai 98
|
327
|
+
_te 99
|
335
328
|
_j 98
|
336
|
-
|
337
|
-
|
338
|
-
|
339
|
-
urs
|
329
|
+
ter 98
|
330
|
+
mai 98
|
331
|
+
cu 98
|
332
|
+
urs 97
|
333
|
+
ill 97
|
334
|
+
lit 97
|
335
|
+
l’_ 97
|
336
|
+
oc 96
|
337
|
+
id 96
|
338
|
+
ép 96
|
339
|
+
tan 96
|
340
|
+
uis 96
|
340
341
|
ris 96
|
341
|
-
|
342
|
-
|
343
|
-
|
344
|
-
cti 94
|
342
|
+
gi 96
|
343
|
+
bre 94
|
344
|
+
ité 94
|
345
345
|
air 94
|
346
|
-
|
347
|
-
|
346
|
+
ier 94
|
347
|
+
cti 94
|
348
348
|
ues 93
|
349
|
-
|
350
|
-
|
351
|
-
|
352
|
-
|
353
|
-
|
354
|
-
|
355
|
-
|
356
|
-
pro 90
|
357
|
-
tan 90
|
358
|
-
hi 90
|
349
|
+
nte 93
|
350
|
+
pro 92
|
351
|
+
por 92
|
352
|
+
hi 92
|
353
|
+
iti 91
|
354
|
+
mon 91
|
355
|
+
sp 91
|
359
356
|
_in 90
|
360
|
-
|
361
|
-
|
362
|
-
ouv 89
|
357
|
+
_si 90
|
358
|
+
va 89
|
363
359
|
av 89
|
364
|
-
|
365
|
-
|
366
|
-
_si 88
|
360
|
+
vo 88
|
361
|
+
oir 88
|
367
362
|
pré 88
|
368
|
-
|
369
|
-
tie
|
363
|
+
nom 88
|
364
|
+
tie 88
|
365
|
+
ouv 88
|
366
|
+
onn 87
|
370
367
|
_do 87
|
368
|
+
ist 87
|
369
|
+
nts 86
|
371
370
|
ys 86
|
372
|
-
|
371
|
+
ois 86
|
373
372
|
_an 85
|
373
|
+
ég 85
|
374
|
+
ure 84
|
375
|
+
rop 84
|
374
376
|
mé 84
|
375
|
-
|
377
|
+
nde 84
|
378
|
+
in_ 84
|
376
379
|
_fa 84
|
377
380
|
ers 84
|
378
|
-
|
379
|
-
|
380
|
-
rop 83
|
381
|
-
nts 83
|
381
|
+
pou 83
|
382
|
+
ay 83
|
382
383
|
ga 83
|
383
384
|
tes 83
|
384
|
-
|
385
|
-
|
386
|
-
and
|
385
|
+
èr 82
|
386
|
+
ère 82
|
387
|
+
and 82
|
388
|
+
_ou 82
|
389
|
+
mbr 82
|
390
|
+
rm 81
|
391
|
+
_fo 81
|
392
|
+
pri 81
|
387
393
|
omm 81
|
388
|
-
_to 81
|
389
|
-
ay 81
|
390
394
|
tat 81
|
391
|
-
|
392
|
-
pri 81
|
393
|
-
rm 80
|
394
|
-
pui 80
|
395
|
-
pou 80
|
396
|
-
_ou 80
|
397
|
-
eux 79
|
398
|
-
ial 79
|
395
|
+
_to 81
|
399
396
|
gra 79
|
400
|
-
|
397
|
+
_h 79
|
398
|
+
ha 79
|
399
|
+
nes 79
|
400
|
+
eux 79
|