language_detector 0.1.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- data/README.rdoc +24 -0
- data/Rakefile +18 -0
- data/VERSION +1 -0
- data/lib/language_detector.rb +232 -0
- data/lib/model-fm.yml +52504 -0
- data/lib/model-tc.yml +53985 -0
- data/lib/textcat_ngrams/afrikaans.lm +400 -0
- data/lib/textcat_ngrams/albanian.lm +400 -0
- data/lib/textcat_ngrams/amharic-utf.lm +400 -0
- data/lib/textcat_ngrams/arabic-iso8859_6.lm +400 -0
- data/lib/textcat_ngrams/arabic-windows1256.lm +400 -0
- data/lib/textcat_ngrams/armenian.lm +400 -0
- data/lib/textcat_ngrams/basque.lm +400 -0
- data/lib/textcat_ngrams/belarus-windows1251.lm +400 -0
- data/lib/textcat_ngrams/bosnian.lm +400 -0
- data/lib/textcat_ngrams/breton.lm +400 -0
- data/lib/textcat_ngrams/bulgarian-iso8859_5.lm +400 -0
- data/lib/textcat_ngrams/catalan.lm +400 -0
- data/lib/textcat_ngrams/chinese-big5.lm +400 -0
- data/lib/textcat_ngrams/chinese-gb2312.lm +400 -0
- data/lib/textcat_ngrams/croatian-ascii.lm +400 -0
- data/lib/textcat_ngrams/czech-iso8859_2.lm +400 -0
- data/lib/textcat_ngrams/danish.lm +400 -0
- data/lib/textcat_ngrams/dutch.lm +400 -0
- data/lib/textcat_ngrams/english.lm +400 -0
- data/lib/textcat_ngrams/esperanto.lm +400 -0
- data/lib/textcat_ngrams/estonian.lm +400 -0
- data/lib/textcat_ngrams/finnish.lm +400 -0
- data/lib/textcat_ngrams/french.lm +400 -0
- data/lib/textcat_ngrams/frisian.lm +400 -0
- data/lib/textcat_ngrams/georgian.lm +400 -0
- data/lib/textcat_ngrams/german.lm +400 -0
- data/lib/textcat_ngrams/greek-iso8859-7.lm +400 -0
- data/lib/textcat_ngrams/hebrew-iso8859_8.lm +400 -0
- data/lib/textcat_ngrams/hindi.lm +400 -0
- data/lib/textcat_ngrams/hungarian.lm +400 -0
- data/lib/textcat_ngrams/icelandic.lm +400 -0
- data/lib/textcat_ngrams/indonesian.lm +400 -0
- data/lib/textcat_ngrams/irish.lm +400 -0
- data/lib/textcat_ngrams/italian.lm +400 -0
- data/lib/textcat_ngrams/japanese-euc_jp.lm +400 -0
- data/lib/textcat_ngrams/japanese-shift_jis.lm +400 -0
- data/lib/textcat_ngrams/korean.lm +400 -0
- data/lib/textcat_ngrams/latin.lm +400 -0
- data/lib/textcat_ngrams/latvian.lm +400 -0
- data/lib/textcat_ngrams/lithuanian.lm +400 -0
- data/lib/textcat_ngrams/malay.lm +400 -0
- data/lib/textcat_ngrams/manx.lm +400 -0
- data/lib/textcat_ngrams/marathi.lm +400 -0
- data/lib/textcat_ngrams/mingo.lm +400 -0
- data/lib/textcat_ngrams/nepali.lm +400 -0
- data/lib/textcat_ngrams/norwegian.lm +400 -0
- data/lib/textcat_ngrams/persian.lm +400 -0
- data/lib/textcat_ngrams/polish.lm +400 -0
- data/lib/textcat_ngrams/portuguese.lm +400 -0
- data/lib/textcat_ngrams/quechua.lm +400 -0
- data/lib/textcat_ngrams/romanian.lm +400 -0
- data/lib/textcat_ngrams/rumantsch.lm +400 -0
- data/lib/textcat_ngrams/russian-iso8859_5.lm +400 -0
- data/lib/textcat_ngrams/russian-koi8_r.lm +400 -0
- data/lib/textcat_ngrams/russian-windows1251.lm +400 -0
- data/lib/textcat_ngrams/sanskrit.lm +400 -0
- data/lib/textcat_ngrams/scots.lm +400 -0
- data/lib/textcat_ngrams/scots_gaelic.lm +400 -0
- data/lib/textcat_ngrams/serbian-ascii.lm +400 -0
- data/lib/textcat_ngrams/slovak-ascii.lm +400 -0
- data/lib/textcat_ngrams/slovak-windows1250.lm +400 -0
- data/lib/textcat_ngrams/slovenian-ascii.lm +400 -0
- data/lib/textcat_ngrams/slovenian-iso8859_2.lm +400 -0
- data/lib/textcat_ngrams/spanish.lm +400 -0
- data/lib/textcat_ngrams/swahili.lm +400 -0
- data/lib/textcat_ngrams/swedish.lm +400 -0
- data/lib/textcat_ngrams/tagalog.lm +400 -0
- data/lib/textcat_ngrams/tamil.lm +400 -0
- data/lib/textcat_ngrams/thai.lm +400 -0
- data/lib/textcat_ngrams/turkish.lm +400 -0
- data/lib/textcat_ngrams/ukrainian-koi8_u.lm +400 -0
- data/lib/textcat_ngrams/vietnamese.lm +400 -0
- data/lib/textcat_ngrams/welsh.lm +400 -0
- data/lib/textcat_ngrams/yiddish-utf.lm +400 -0
- data/lib/training_data/ar-utf8.txt +54 -0
- data/lib/training_data/bg-utf8.txt +26 -0
- data/lib/training_data/cs-utf8.txt +48 -0
- data/lib/training_data/da-utf8.txt +159 -0
- data/lib/training_data/de-utf8.txt +569 -0
- data/lib/training_data/el-utf8.txt +48 -0
- data/lib/training_data/en-utf8.txt +81 -0
- data/lib/training_data/es-utf8.txt +185 -0
- data/lib/training_data/et-utf8.txt +50 -0
- data/lib/training_data/fa-utf8.txt +42 -0
- data/lib/training_data/fi-utf8.txt +83 -0
- data/lib/training_data/fr-utf8.txt +191 -0
- data/lib/training_data/fy-utf8.txt +22 -0
- data/lib/training_data/ga-utf8.txt +109 -0
- data/lib/training_data/he-utf8.txt +116 -0
- data/lib/training_data/hi-utf8.txt +49 -0
- data/lib/training_data/hr-utf8.txt +80 -0
- data/lib/training_data/hu-utf8.txt +87 -0
- data/lib/training_data/io-utf8.txt +41 -0
- data/lib/training_data/is-utf8.txt +94 -0
- data/lib/training_data/it-utf8.txt +228 -0
- data/lib/training_data/ja-utf8.txt +200 -0
- data/lib/training_data/ko-utf8.txt +147 -0
- data/lib/training_data/nl-utf8.txt +215 -0
- data/lib/training_data/no-utf8.txt +281 -0
- data/lib/training_data/pl-utf8.txt +120 -0
- data/lib/training_data/pt-utf8.txt +214 -0
- data/lib/training_data/ro-utf8.txt +66 -0
- data/lib/training_data/ru-utf8.txt +310 -0
- data/lib/training_data/sl-utf8.txt +263 -0
- data/lib/training_data/sv-utf8.txt +174 -0
- data/lib/training_data/th-utf8.txt +49 -0
- data/lib/training_data/tk-utf8.txt +101 -0
- data/lib/training_data/todo/af.txt +114 -0
- data/lib/training_data/todo/amharic-utf.txt +95 -0
- data/lib/training_data/todo/arabic-windows1256.txt +157 -0
- data/lib/training_data/todo/armenian.txt +86 -0
- data/lib/training_data/todo/basque.txt +136 -0
- data/lib/training_data/todo/belarus-windows1251.txt +97 -0
- data/lib/training_data/todo/bosnian.txt +97 -0
- data/lib/training_data/todo/breton.txt +159 -0
- data/lib/training_data/todo/bulgarian-iso8859_5.txt +115 -0
- data/lib/training_data/todo/catalan.txt +93 -0
- data/lib/training_data/todo/croatian-ascii.txt +104 -0
- data/lib/training_data/todo/esperanto.txt +95 -0
- data/lib/training_data/todo/estonian.txt +218 -0
- data/lib/training_data/todo/frisian.txt +99 -0
- data/lib/training_data/todo/georgian.txt +86 -0
- data/lib/training_data/todo/greek-iso8859-7.txt +139 -0
- data/lib/training_data/todo/hawaian.txt +108 -0
- data/lib/training_data/todo/hebrew-iso8859_8.txt +79 -0
- data/lib/training_data/todo/hindi.txt +77 -0
- data/lib/training_data/todo/hungarian.txt +102 -0
- data/lib/training_data/todo/icelandic.txt +131 -0
- data/lib/training_data/todo/indonesian.txt +93 -0
- data/lib/training_data/todo/irish.txt +209 -0
- data/lib/training_data/todo/latin.txt +120 -0
- data/lib/training_data/todo/latvian.txt +126 -0
- data/lib/training_data/todo/lithuanian.txt +99 -0
- data/lib/training_data/todo/malay.txt +108 -0
- data/lib/training_data/todo/manx.txt +78 -0
- data/lib/training_data/todo/marathi.txt +100 -0
- data/lib/training_data/todo/mf.txt +100 -0
- data/lib/training_data/todo/middle_frisian.txt +102 -0
- data/lib/training_data/todo/mingo.txt +146 -0
- data/lib/training_data/todo/nepali.txt +131 -0
- data/lib/training_data/todo/persian.txt +73 -0
- data/lib/training_data/todo/quechua.txt +108 -0
- data/lib/training_data/todo/romanian.txt +103 -0
- data/lib/training_data/todo/rumantsch.txt +110 -0
- data/lib/training_data/todo/sanskrit.txt +135 -0
- data/lib/training_data/todo/scots.txt +490 -0
- data/lib/training_data/todo/scots_gaelic.txt +93 -0
- data/lib/training_data/todo/serbian-ascii.txt +121 -0
- data/lib/training_data/todo/slovak-ascii.txt +102 -0
- data/lib/training_data/todo/slovak-windows1250.txt +115 -0
- data/lib/training_data/todo/slovenian-ascii.txt +100 -0
- data/lib/training_data/todo/slovenian-iso8859_2.txt +96 -0
- data/lib/training_data/todo/sq.txt +110 -0
- data/lib/training_data/todo/swahili.txt +120 -0
- data/lib/training_data/todo/tagalog.txt +135 -0
- data/lib/training_data/todo/tamil.txt +123 -0
- data/lib/training_data/todo/turkish.txt +117 -0
- data/lib/training_data/todo/ukrainian-koi8_r.txt +214 -0
- data/lib/training_data/todo/vietnamese.txt +92 -0
- data/lib/training_data/todo/welsh.txt +148 -0
- data/lib/training_data/todo/yiddish-utf.txt +83 -0
- data/lib/training_data/uk-utf8.txt +75 -0
- data/lib/training_data/vi-utf8.txt +47 -0
- data/lib/training_data/zh-utf8.txt +228 -0
- data/test/language_detector_test.rb +78 -0
- metadata +232 -0
@@ -0,0 +1,400 @@
|
|
1
|
+
_ 24504
|
2
|
+
a 8735
|
3
|
+
i 7353
|
4
|
+
s 6064
|
5
|
+
t 5176
|
6
|
+
e 4390
|
7
|
+
r 4339
|
8
|
+
u 4200
|
9
|
+
n 3422
|
10
|
+
� 3055
|
11
|
+
m 2817
|
12
|
+
p 2755
|
13
|
+
k 2703
|
14
|
+
o 2643
|
15
|
+
s_ 2595
|
16
|
+
d 2131
|
17
|
+
l 2035
|
18
|
+
j 1972
|
19
|
+
� 1958
|
20
|
+
ie 1887
|
21
|
+
v 1822
|
22
|
+
as 1530
|
23
|
+
u_ 1396
|
24
|
+
_p 1380
|
25
|
+
b 1357
|
26
|
+
z 1311
|
27
|
+
� 1267
|
28
|
+
a_ 1261
|
29
|
+
as_ 1217
|
30
|
+
. 1065
|
31
|
+
, 1048
|
32
|
+
,_ 1033
|
33
|
+
g 1010
|
34
|
+
ar 970
|
35
|
+
� 965
|
36
|
+
ti 962
|
37
|
+
c 922
|
38
|
+
_a 876
|
39
|
+
ja 838
|
40
|
+
st 828
|
41
|
+
_i 822
|
42
|
+
_v 805
|
43
|
+
pa 792
|
44
|
+
_t 775
|
45
|
+
._ 774
|
46
|
+
um 760
|
47
|
+
_k 749
|
48
|
+
�_ 734
|
49
|
+
_n 728
|
50
|
+
es 712
|
51
|
+
i_ 706
|
52
|
+
at 703
|
53
|
+
is 695
|
54
|
+
_s 680
|
55
|
+
ai 649
|
56
|
+
ta 635
|
57
|
+
an 631
|
58
|
+
ka 621
|
59
|
+
r_ 615
|
60
|
+
�b 586
|
61
|
+
ij 585
|
62
|
+
_u 568
|
63
|
+
_pa 548
|
64
|
+
un 541
|
65
|
+
no 539
|
66
|
+
va 537
|
67
|
+
ma 525
|
68
|
+
ra 522
|
69
|
+
ri 515
|
70
|
+
iz 512
|
71
|
+
in 509
|
72
|
+
vi 508
|
73
|
+
pr 506
|
74
|
+
sa 487
|
75
|
+
ju 486
|
76
|
+
t� 483
|
77
|
+
ik 473
|
78
|
+
n_ 472
|
79
|
+
am 454
|
80
|
+
en 452
|
81
|
+
tie 440
|
82
|
+
na 432
|
83
|
+
�a 430
|
84
|
+
tu 420
|
85
|
+
ija 420
|
86
|
+
ir 419
|
87
|
+
o_ 415
|
88
|
+
m_ 414
|
89
|
+
li 411
|
90
|
+
ci 409
|
91
|
+
ku 404
|
92
|
+
mi 401
|
93
|
+
_no 398
|
94
|
+
ek 398
|
95
|
+
_un 397
|
96
|
+
t_ 395
|
97
|
+
_l 394
|
98
|
+
un_ 393
|
99
|
+
_d 393
|
100
|
+
ot 392
|
101
|
+
_un_ 392
|
102
|
+
ies 391
|
103
|
+
ar_ 388
|
104
|
+
n� 387
|
105
|
+
da 387
|
106
|
+
ei 385
|
107
|
+
em 382
|
108
|
+
_ti 382
|
109
|
+
pi 380
|
110
|
+
al 368
|
111
|
+
ba 356
|
112
|
+
ts 355
|
113
|
+
_iz 353
|
114
|
+
ap 350
|
115
|
+
jas 349
|
116
|
+
ko 346
|
117
|
+
au 345
|
118
|
+
�an 339
|
119
|
+
re 339
|
120
|
+
ni 337
|
121
|
+
k� 328
|
122
|
+
ro 327
|
123
|
+
et 326
|
124
|
+
r� 325
|
125
|
+
ga 323
|
126
|
+
mu 322
|
127
|
+
jas_ 321
|
128
|
+
tr 317
|
129
|
+
_va 312
|
130
|
+
te 310
|
131
|
+
_pr 307
|
132
|
+
sp 298
|
133
|
+
sk 297
|
134
|
+
ne 295
|
135
|
+
�ba 293
|
136
|
+
�s 289
|
137
|
+
ijas 287
|
138
|
+
_ar 283
|
139
|
+
la 283
|
140
|
+
to 282
|
141
|
+
ad 280
|
142
|
+
dz 278
|
143
|
+
�g 277
|
144
|
+
t� 277
|
145
|
+
�j 277
|
146
|
+
_sa 277
|
147
|
+
j� 274
|
148
|
+
_m 273
|
149
|
+
ties 273
|
150
|
+
l� 272
|
151
|
+
ijas_ 269
|
152
|
+
_at 269
|
153
|
+
ed 267
|
154
|
+
_pi 267
|
155
|
+
� 267
|
156
|
+
s, 265
|
157
|
+
s,_ 265
|
158
|
+
�r 261
|
159
|
+
gu 258
|
160
|
+
f 258
|
161
|
+
si 257
|
162
|
+
m� 256
|
163
|
+
nt 254
|
164
|
+
tu_ 254
|
165
|
+
_r 253
|
166
|
+
ru 252
|
167
|
+
�j 251
|
168
|
+
jum 251
|
169
|
+
�s_ 250
|
170
|
+
�t 249
|
171
|
+
iem 248
|
172
|
+
_b 248
|
173
|
+
_vi 245
|
174
|
+
par 244
|
175
|
+
pie 244
|
176
|
+
rt 243
|
177
|
+
v� 242
|
178
|
+
_ne 240
|
179
|
+
�r 240
|
180
|
+
ai_ 239
|
181
|
+
_. 239
|
182
|
+
_j 237
|
183
|
+
us 237
|
184
|
+
_ka 236
|
185
|
+
er 232
|
186
|
+
bas 232
|
187
|
+
_tie 232
|
188
|
+
_par 230
|
189
|
+
di 229
|
190
|
+
� 228
|
191
|
+
ms 228
|
192
|
+
�d 226
|
193
|
+
�bas 224
|
194
|
+
om 220
|
195
|
+
bu 219
|
196
|
+
umu 217
|
197
|
+
iek 216
|
198
|
+
kt 216
|
199
|
+
it 216
|
200
|
+
r� 215
|
201
|
+
_ko 214
|
202
|
+
ana 211
|
203
|
+
�k 211
|
204
|
+
or 210
|
205
|
+
de 210
|
206
|
+
in� 207
|
207
|
+
d� 204
|
208
|
+
ur 203
|
209
|
+
pri 203
|
210
|
+
_c 202
|
211
|
+
ta_ 202
|
212
|
+
bas_ 201
|
213
|
+
es_ 201
|
214
|
+
_pie 200
|
215
|
+
il 200
|
216
|
+
os 199
|
217
|
+
�ana 199
|
218
|
+
id 198
|
219
|
+
L 198
|
220
|
+
_ie 197
|
221
|
+
bi 194
|
222
|
+
ak 194
|
223
|
+
ja_ 194
|
224
|
+
�bas_ 193
|
225
|
+
�t 192
|
226
|
+
�bu 192
|
227
|
+
_g 191
|
228
|
+
� 189
|
229
|
+
ma_ 189
|
230
|
+
ien 188
|
231
|
+
kum 187
|
232
|
+
� 187
|
233
|
+
_ir 186
|
234
|
+
on 186
|
235
|
+
_ties 185
|
236
|
+
z� 185
|
237
|
+
ce 185
|
238
|
+
ied 184
|
239
|
+
ist 183
|
240
|
+
ts_ 183
|
241
|
+
_� 183
|
242
|
+
�_ 182
|
243
|
+
�m 181
|
244
|
+
vie 180
|
245
|
+
_�_ 180
|
246
|
+
cij 180
|
247
|
+
ka_ 179
|
248
|
+
_ap 175
|
249
|
+
s� 174
|
250
|
+
ir_ 174
|
251
|
+
zi 174
|
252
|
+
uma 173
|
253
|
+
�l 172
|
254
|
+
_ir_ 172
|
255
|
+
o� 171
|
256
|
+
_da 169
|
257
|
+
�_ 168
|
258
|
+
ar� 168
|
259
|
+
) 167
|
260
|
+
do 166
|
261
|
+
ve 166
|
262
|
+
( 165
|
263
|
+
ls 165
|
264
|
+
bu_ 164
|
265
|
+
val 164
|
266
|
+
mu_ 164
|
267
|
+
isk 163
|
268
|
+
uz 161
|
269
|
+
av 160
|
270
|
+
par_ 160
|
271
|
+
_v� 159
|
272
|
+
_par_ 158
|
273
|
+
v�r 158
|
274
|
+
_ar_ 157
|
275
|
+
rie 157
|
276
|
+
_uz 157
|
277
|
+
aj 156
|
278
|
+
�bu_ 156
|
279
|
+
oj 155
|
280
|
+
k�_ 155
|
281
|
+
ld 154
|
282
|
+
iet 154
|
283
|
+
iku 154
|
284
|
+
ks 153
|
285
|
+
du 153
|
286
|
+
ep 153
|
287
|
+
ms_ 152
|
288
|
+
ec 152
|
289
|
+
V 151
|
290
|
+
ais 150
|
291
|
+
str 150
|
292
|
+
nie 149
|
293
|
+
am_ 149
|
294
|
+
ums 148
|
295
|
+
_( 147
|
296
|
+
ju_ 146
|
297
|
+
z_ 142
|
298
|
+
ru_ 142
|
299
|
+
�j 142
|
300
|
+
gum 142
|
301
|
+
u,_ 141
|
302
|
+
u, 141
|
303
|
+
i� 141
|
304
|
+
uma_ 141
|
305
|
+
�rt 141
|
306
|
+
�gu 141
|
307
|
+
me 140
|
308
|
+
d� 140
|
309
|
+
�t 140
|
310
|
+
ent 139
|
311
|
+
ikum 138
|
312
|
+
p� 138
|
313
|
+
em_ 138
|
314
|
+
_L 138
|
315
|
+
lie 136
|
316
|
+
sta 136
|
317
|
+
r�_ 136
|
318
|
+
lst 136
|
319
|
+
eik 135
|
320
|
+
se 135
|
321
|
+
s. 134
|
322
|
+
pro 134
|
323
|
+
rs 134
|
324
|
+
s._ 134
|
325
|
+
tik 134
|
326
|
+
l� 134
|
327
|
+
ska 133
|
328
|
+
pap 133
|
329
|
+
kas 133
|
330
|
+
rm 133
|
331
|
+
�ju 133
|
332
|
+
p� 132
|
333
|
+
nu 132
|
334
|
+
T 132
|
335
|
+
p� 131
|
336
|
+
tei 131
|
337
|
+
nas 131
|
338
|
+
_V 131
|
339
|
+
jo 131
|
340
|
+
l�g 131
|
341
|
+
ut 131
|
342
|
+
iem_ 130
|
343
|
+
ras 129
|
344
|
+
pu 129
|
345
|
+
_li 129
|
346
|
+
_ga 128
|
347
|
+
dar 128
|
348
|
+
_k� 128
|
349
|
+
umu_ 127
|
350
|
+
�v 126
|
351
|
+
�gum 126
|
352
|
+
kas_ 126
|
353
|
+
t�b 125
|
354
|
+
vai 125
|
355
|
+
l�gu 125
|
356
|
+
P 125
|
357
|
+
ar�_ 125
|
358
|
+
ev 124
|
359
|
+
lai 124
|
360
|
+
�r 124
|
361
|
+
l�gum 124
|
362
|
+
tv 123
|
363
|
+
a� 123
|
364
|
+
_ar�_ 122
|
365
|
+
_ar� 122
|
366
|
+
_vie 121
|
367
|
+
S 121
|
368
|
+
_T 120
|
369
|
+
�ju 120
|
370
|
+
teik 120
|
371
|
+
cija 119
|
372
|
+
rb 119
|
373
|
+
_� 119
|
374
|
+
j�_ 119
|
375
|
+
nas_ 118
|
376
|
+
t�j 118
|
377
|
+
v�rt 118
|
378
|
+
iec 118
|
379
|
+
_la 117
|
380
|
+
�d 116
|
381
|
+
_vai 116
|
382
|
+
�jum 116
|
383
|
+
vien 116
|
384
|
+
als 116
|
385
|
+
_l� 116
|
386
|
+
ap�r 115
|
387
|
+
rts 115
|
388
|
+
isi 115
|
389
|
+
p�r 115
|
390
|
+
pap� 115
|
391
|
+
pap�r 115
|
392
|
+
ap� 115
|
393
|
+
tsp 115
|
394
|
+
m� 114
|
395
|
+
im 114
|
396
|
+
be 114
|
397
|
+
is_ 114
|
398
|
+
alst 114
|
399
|
+
_ja 114
|
400
|
+
rtspa 113
|
@@ -0,0 +1,400 @@
|
|
1
|
+
_ 23070
|
2
|
+
i 8196
|
3
|
+
a 7763
|
4
|
+
s 5179
|
5
|
+
e 3458
|
6
|
+
o 3425
|
7
|
+
u 3371
|
8
|
+
t 3344
|
9
|
+
r 3240
|
10
|
+
n 3070
|
11
|
+
k 3019
|
12
|
+
l 2060
|
13
|
+
p 1889
|
14
|
+
s_ 1756
|
15
|
+
m 1680
|
16
|
+
d 1640
|
17
|
+
v 1590
|
18
|
+
, 1501
|
19
|
+
,_ 1497
|
20
|
+
� 1400
|
21
|
+
g 1302
|
22
|
+
j 1200
|
23
|
+
o_ 1138
|
24
|
+
. 1128
|
25
|
+
ai 1113
|
26
|
+
� 1075
|
27
|
+
_p 1047
|
28
|
+
_k 1035
|
29
|
+
i_ 990
|
30
|
+
._ 984
|
31
|
+
as 975
|
32
|
+
b 937
|
33
|
+
au 903
|
34
|
+
is 863
|
35
|
+
_n 815
|
36
|
+
ka 811
|
37
|
+
si 804
|
38
|
+
_s 799
|
39
|
+
ia 796
|
40
|
+
� 759
|
41
|
+
ta 735
|
42
|
+
ie 731
|
43
|
+
ti 728
|
44
|
+
y 721
|
45
|
+
_t 711
|
46
|
+
in 697
|
47
|
+
_i 686
|
48
|
+
us 675
|
49
|
+
pa 658
|
50
|
+
ir 640
|
51
|
+
ar 633
|
52
|
+
� 620
|
53
|
+
_a 617
|
54
|
+
r_ 609
|
55
|
+
ne 583
|
56
|
+
a_ 578
|
57
|
+
ri 569
|
58
|
+
_v 558
|
59
|
+
_pa 541
|
60
|
+
al 540
|
61
|
+
ra 531
|
62
|
+
li 522
|
63
|
+
� 509
|
64
|
+
u_ 493
|
65
|
+
vi 490
|
66
|
+
_ka 489
|
67
|
+
da 487
|
68
|
+
_ne 482
|
69
|
+
_j 481
|
70
|
+
en 478
|
71
|
+
�_ 445
|
72
|
+
os 444
|
73
|
+
ki 442
|
74
|
+
� 441
|
75
|
+
an 440
|
76
|
+
ik 434
|
77
|
+
ma 433
|
78
|
+
as_ 430
|
79
|
+
st 420
|
80
|
+
_d 420
|
81
|
+
ai_ 417
|
82
|
+
s,_ 396
|
83
|
+
am 396
|
84
|
+
is_ 396
|
85
|
+
s, 396
|
86
|
+
_ir 390
|
87
|
+
jo 387
|
88
|
+
ir_ 385
|
89
|
+
at 384
|
90
|
+
_ir_ 383
|
91
|
+
i� 381
|
92
|
+
ni 377
|
93
|
+
ga 376
|
94
|
+
_b 367
|
95
|
+
na 366
|
96
|
+
e_ 365
|
97
|
+
to 352
|
98
|
+
pr 337
|
99
|
+
_g 332
|
100
|
+
_m 332
|
101
|
+
� 328
|
102
|
+
� 326
|
103
|
+
io 323
|
104
|
+
ei 323
|
105
|
+
�_ 321
|
106
|
+
su 320
|
107
|
+
�i 320
|
108
|
+
uo 319
|
109
|
+
la 317
|
110
|
+
er 303
|
111
|
+
va 299
|
112
|
+
vo 298
|
113
|
+
�i 293
|
114
|
+
es 291
|
115
|
+
- 290
|
116
|
+
�_ 286
|
117
|
+
-_ 285
|
118
|
+
_vi 284
|
119
|
+
_- 283
|
120
|
+
ko 283
|
121
|
+
_-_ 283
|
122
|
+
iau 281
|
123
|
+
sa 278
|
124
|
+
s. 278
|
125
|
+
iu 276
|
126
|
+
et 274
|
127
|
+
nu 265
|
128
|
+
ja 262
|
129
|
+
�_ 262
|
130
|
+
_ta 262
|
131
|
+
s._ 259
|
132
|
+
el 258
|
133
|
+
�j 258
|
134
|
+
os_ 256
|
135
|
+
im 255
|
136
|
+
it 254
|
137
|
+
_pr 253
|
138
|
+
no 252
|
139
|
+
av 251
|
140
|
+
ur 251
|
141
|
+
_� 248
|
142
|
+
mi 246
|
143
|
+
ve 245
|
144
|
+
ak 245
|
145
|
+
ku 243
|
146
|
+
ek 241
|
147
|
+
tu 241
|
148
|
+
_� 241
|
149
|
+
ad 241
|
150
|
+
� 238
|
151
|
+
_l 238
|
152
|
+
_i� 236
|
153
|
+
us_ 236
|
154
|
+
_su 232
|
155
|
+
oj 231
|
156
|
+
au_ 231
|
157
|
+
ba 224
|
158
|
+
nt 218
|
159
|
+
me 214
|
160
|
+
te 210
|
161
|
+
jo_ 208
|
162
|
+
ro 205
|
163
|
+
�s 204
|
164
|
+
i� 203
|
165
|
+
tai 203
|
166
|
+
_� 201
|
167
|
+
l� 201
|
168
|
+
pas 200
|
169
|
+
ip 198
|
170
|
+
iai 197
|
171
|
+
di 195
|
172
|
+
usi 194
|
173
|
+
vo_ 193
|
174
|
+
kai 190
|
175
|
+
i, 189
|
176
|
+
i,_ 189
|
177
|
+
sk 187
|
178
|
+
_r 186
|
179
|
+
aus 184
|
180
|
+
ap 183
|
181
|
+
gi 182
|
182
|
+
mo 182
|
183
|
+
uk 181
|
184
|
+
t_ 180
|
185
|
+
_da 177
|
186
|
+
be 176
|
187
|
+
ien 176
|
188
|
+
o, 174
|
189
|
+
il 174
|
190
|
+
o,_ 173
|
191
|
+
ti_ 173
|
192
|
+
re 172
|
193
|
+
_nu 171
|
194
|
+
�ia 171
|
195
|
+
_pas 169
|
196
|
+
pri 169
|
197
|
+
�_ 169
|
198
|
+
ok 168
|
199
|
+
d� 166
|
200
|
+
�l 162
|
201
|
+
bu 161
|
202
|
+
�i 160
|
203
|
+
on 160
|
204
|
+
asi 159
|
205
|
+
id 158
|
206
|
+
ul 157
|
207
|
+
ji 157
|
208
|
+
aip 156
|
209
|
+
ia_ 155
|
210
|
+
_sa 154
|
211
|
+
ot 154
|
212
|
+
gal 153
|
213
|
+
nk 153
|
214
|
+
om 152
|
215
|
+
p_ 151
|
216
|
+
_pri 151
|
217
|
+
od 151
|
218
|
+
vis 150
|
219
|
+
_at 150
|
220
|
+
vie 150
|
221
|
+
uv 150
|
222
|
+
ab 150
|
223
|
+
i�_ 149
|
224
|
+
ama 149
|
225
|
+
n� 149
|
226
|
+
A 149
|
227
|
+
sta 148
|
228
|
+
kr 148
|
229
|
+
_A 145
|
230
|
+
ais 144
|
231
|
+
rt 143
|
232
|
+
J 142
|
233
|
+
_J 142
|
234
|
+
�jo 142
|
235
|
+
_�_ 141
|
236
|
+
K 140
|
237
|
+
_K 139
|
238
|
+
pi 139
|
239
|
+
avo 139
|
240
|
+
ng 139
|
241
|
+
mas 138
|
242
|
+
du 138
|
243
|
+
ug 137
|
244
|
+
_ga 137
|
245
|
+
ol 136
|
246
|
+
tik 135
|
247
|
+
ali 135
|
248
|
+
.. 135
|
249
|
+
_vis 135
|
250
|
+
iek 134
|
251
|
+
ini 133
|
252
|
+
kad 133
|
253
|
+
a, 133
|
254
|
+
le 133
|
255
|
+
k� 133
|
256
|
+
T 133
|
257
|
+
t� 132
|
258
|
+
i. 132
|
259
|
+
_T 131
|
260
|
+
d� 131
|
261
|
+
a,_ 131
|
262
|
+
go 131
|
263
|
+
ip_ 131
|
264
|
+
aip_ 131
|
265
|
+
r� 129
|
266
|
+
a� 129
|
267
|
+
d�i 129
|
268
|
+
ke 128
|
269
|
+
k_ 128
|
270
|
+
d_ 127
|
271
|
+
ad_ 127
|
272
|
+
_ti 127
|
273
|
+
_ma 126
|
274
|
+
_va 125
|
275
|
+
i._ 124
|
276
|
+
z 123
|
277
|
+
�k 123
|
278
|
+
iau_ 121
|
279
|
+
m_ 120
|
280
|
+
kar 119
|
281
|
+
um 119
|
282
|
+
t� 119
|
283
|
+
_kad 118
|
284
|
+
u� 117
|
285
|
+
tr 117
|
286
|
+
_kai 117
|
287
|
+
as, 116
|
288
|
+
og 116
|
289
|
+
kad_ 116
|
290
|
+
as,_ 116
|
291
|
+
_ji 116
|
292
|
+
rie 115
|
293
|
+
yt 114
|
294
|
+
_ja 114
|
295
|
+
_ko 114
|
296
|
+
v� 114
|
297
|
+
ys 114
|
298
|
+
jau 113
|
299
|
+
ar_ 113
|
300
|
+
pra 112
|
301
|
+
a� 112
|
302
|
+
ant 112
|
303
|
+
kl 111
|
304
|
+
tas 111
|
305
|
+
gu 111
|
306
|
+
_ku 110
|
307
|
+
si_ 110
|
308
|
+
pe 109
|
309
|
+
eb 109
|
310
|
+
N 109
|
311
|
+
�jo_ 108
|
312
|
+
_kad_ 108
|
313
|
+
se 108
|
314
|
+
_ki 108
|
315
|
+
or 107
|
316
|
+
ly 107
|
317
|
+
lo 107
|
318
|
+
iai_ 107
|
319
|
+
_la 106
|
320
|
+
ts 106
|
321
|
+
�s 106
|
322
|
+
ig 105
|
323
|
+
_N 105
|
324
|
+
ut 105
|
325
|
+
_u 105
|
326
|
+
�s_ 105
|
327
|
+
avo_ 104
|
328
|
+
ie_ 104
|
329
|
+
a. 104
|
330
|
+
kt 104
|
331
|
+
em 103
|
332
|
+
do 103
|
333
|
+
je 102
|
334
|
+
ks 102
|
335
|
+
ats 101
|
336
|
+
_be 101
|
337
|
+
ris 101
|
338
|
+
l_ 101
|
339
|
+
_vie 101
|
340
|
+
tin 101
|
341
|
+
ag 100
|
342
|
+
dam 100
|
343
|
+
_st 100
|
344
|
+
a._ 99
|
345
|
+
_bu 99
|
346
|
+
? 99
|
347
|
+
V 98
|
348
|
+
io_ 98
|
349
|
+
kas 98
|
350
|
+
_jo 98
|
351
|
+
vien 97
|
352
|
+
_gal 97
|
353
|
+
�t 97
|
354
|
+
kia 97
|
355
|
+
lia 96
|
356
|
+
c 96
|
357
|
+
uri 96
|
358
|
+
_V 96
|
359
|
+
?_ 96
|
360
|
+
uvo 95
|
361
|
+
ru 95
|
362
|
+
ty 95
|
363
|
+
ep 94
|
364
|
+
nd 94
|
365
|
+
lai 94
|
366
|
+
_tai 94
|
367
|
+
ju 93
|
368
|
+
man 92
|
369
|
+
o. 92
|
370
|
+
buv 92
|
371
|
+
t� 92
|
372
|
+
_�i 91
|
373
|
+
i�_ 91
|
374
|
+
_i�_ 91
|
375
|
+
i�k 90
|
376
|
+
o._ 90
|
377
|
+
_to 90
|
378
|
+
bi 90
|
379
|
+
up 89
|
380
|
+
po 89
|
381
|
+
rs 89
|
382
|
+
_prie 88
|
383
|
+
�,_ 88
|
384
|
+
aik 88
|
385
|
+
ui 88
|
386
|
+
_tik 88
|
387
|
+
ij 88
|
388
|
+
�, 88
|
389
|
+
pat 88
|
390
|
+
prie 88
|
391
|
+
I 87
|
392
|
+
ies 87
|
393
|
+
tai_ 87
|
394
|
+
n_ 87
|
395
|
+
pasi 87
|
396
|
+
ius 87
|
397
|
+
�t 87
|
398
|
+
eik 86
|
399
|
+
_me 86
|
400
|
+
ina 86
|