language_detector 0.1.0
Sign up to get free protection for your applications and to get access to all the features.
- data/README.rdoc +24 -0
- data/Rakefile +18 -0
- data/VERSION +1 -0
- data/lib/language_detector.rb +232 -0
- data/lib/model-fm.yml +52504 -0
- data/lib/model-tc.yml +53985 -0
- data/lib/textcat_ngrams/afrikaans.lm +400 -0
- data/lib/textcat_ngrams/albanian.lm +400 -0
- data/lib/textcat_ngrams/amharic-utf.lm +400 -0
- data/lib/textcat_ngrams/arabic-iso8859_6.lm +400 -0
- data/lib/textcat_ngrams/arabic-windows1256.lm +400 -0
- data/lib/textcat_ngrams/armenian.lm +400 -0
- data/lib/textcat_ngrams/basque.lm +400 -0
- data/lib/textcat_ngrams/belarus-windows1251.lm +400 -0
- data/lib/textcat_ngrams/bosnian.lm +400 -0
- data/lib/textcat_ngrams/breton.lm +400 -0
- data/lib/textcat_ngrams/bulgarian-iso8859_5.lm +400 -0
- data/lib/textcat_ngrams/catalan.lm +400 -0
- data/lib/textcat_ngrams/chinese-big5.lm +400 -0
- data/lib/textcat_ngrams/chinese-gb2312.lm +400 -0
- data/lib/textcat_ngrams/croatian-ascii.lm +400 -0
- data/lib/textcat_ngrams/czech-iso8859_2.lm +400 -0
- data/lib/textcat_ngrams/danish.lm +400 -0
- data/lib/textcat_ngrams/dutch.lm +400 -0
- data/lib/textcat_ngrams/english.lm +400 -0
- data/lib/textcat_ngrams/esperanto.lm +400 -0
- data/lib/textcat_ngrams/estonian.lm +400 -0
- data/lib/textcat_ngrams/finnish.lm +400 -0
- data/lib/textcat_ngrams/french.lm +400 -0
- data/lib/textcat_ngrams/frisian.lm +400 -0
- data/lib/textcat_ngrams/georgian.lm +400 -0
- data/lib/textcat_ngrams/german.lm +400 -0
- data/lib/textcat_ngrams/greek-iso8859-7.lm +400 -0
- data/lib/textcat_ngrams/hebrew-iso8859_8.lm +400 -0
- data/lib/textcat_ngrams/hindi.lm +400 -0
- data/lib/textcat_ngrams/hungarian.lm +400 -0
- data/lib/textcat_ngrams/icelandic.lm +400 -0
- data/lib/textcat_ngrams/indonesian.lm +400 -0
- data/lib/textcat_ngrams/irish.lm +400 -0
- data/lib/textcat_ngrams/italian.lm +400 -0
- data/lib/textcat_ngrams/japanese-euc_jp.lm +400 -0
- data/lib/textcat_ngrams/japanese-shift_jis.lm +400 -0
- data/lib/textcat_ngrams/korean.lm +400 -0
- data/lib/textcat_ngrams/latin.lm +400 -0
- data/lib/textcat_ngrams/latvian.lm +400 -0
- data/lib/textcat_ngrams/lithuanian.lm +400 -0
- data/lib/textcat_ngrams/malay.lm +400 -0
- data/lib/textcat_ngrams/manx.lm +400 -0
- data/lib/textcat_ngrams/marathi.lm +400 -0
- data/lib/textcat_ngrams/mingo.lm +400 -0
- data/lib/textcat_ngrams/nepali.lm +400 -0
- data/lib/textcat_ngrams/norwegian.lm +400 -0
- data/lib/textcat_ngrams/persian.lm +400 -0
- data/lib/textcat_ngrams/polish.lm +400 -0
- data/lib/textcat_ngrams/portuguese.lm +400 -0
- data/lib/textcat_ngrams/quechua.lm +400 -0
- data/lib/textcat_ngrams/romanian.lm +400 -0
- data/lib/textcat_ngrams/rumantsch.lm +400 -0
- data/lib/textcat_ngrams/russian-iso8859_5.lm +400 -0
- data/lib/textcat_ngrams/russian-koi8_r.lm +400 -0
- data/lib/textcat_ngrams/russian-windows1251.lm +400 -0
- data/lib/textcat_ngrams/sanskrit.lm +400 -0
- data/lib/textcat_ngrams/scots.lm +400 -0
- data/lib/textcat_ngrams/scots_gaelic.lm +400 -0
- data/lib/textcat_ngrams/serbian-ascii.lm +400 -0
- data/lib/textcat_ngrams/slovak-ascii.lm +400 -0
- data/lib/textcat_ngrams/slovak-windows1250.lm +400 -0
- data/lib/textcat_ngrams/slovenian-ascii.lm +400 -0
- data/lib/textcat_ngrams/slovenian-iso8859_2.lm +400 -0
- data/lib/textcat_ngrams/spanish.lm +400 -0
- data/lib/textcat_ngrams/swahili.lm +400 -0
- data/lib/textcat_ngrams/swedish.lm +400 -0
- data/lib/textcat_ngrams/tagalog.lm +400 -0
- data/lib/textcat_ngrams/tamil.lm +400 -0
- data/lib/textcat_ngrams/thai.lm +400 -0
- data/lib/textcat_ngrams/turkish.lm +400 -0
- data/lib/textcat_ngrams/ukrainian-koi8_u.lm +400 -0
- data/lib/textcat_ngrams/vietnamese.lm +400 -0
- data/lib/textcat_ngrams/welsh.lm +400 -0
- data/lib/textcat_ngrams/yiddish-utf.lm +400 -0
- data/lib/training_data/ar-utf8.txt +54 -0
- data/lib/training_data/bg-utf8.txt +26 -0
- data/lib/training_data/cs-utf8.txt +48 -0
- data/lib/training_data/da-utf8.txt +159 -0
- data/lib/training_data/de-utf8.txt +569 -0
- data/lib/training_data/el-utf8.txt +48 -0
- data/lib/training_data/en-utf8.txt +81 -0
- data/lib/training_data/es-utf8.txt +185 -0
- data/lib/training_data/et-utf8.txt +50 -0
- data/lib/training_data/fa-utf8.txt +42 -0
- data/lib/training_data/fi-utf8.txt +83 -0
- data/lib/training_data/fr-utf8.txt +191 -0
- data/lib/training_data/fy-utf8.txt +22 -0
- data/lib/training_data/ga-utf8.txt +109 -0
- data/lib/training_data/he-utf8.txt +116 -0
- data/lib/training_data/hi-utf8.txt +49 -0
- data/lib/training_data/hr-utf8.txt +80 -0
- data/lib/training_data/hu-utf8.txt +87 -0
- data/lib/training_data/io-utf8.txt +41 -0
- data/lib/training_data/is-utf8.txt +94 -0
- data/lib/training_data/it-utf8.txt +228 -0
- data/lib/training_data/ja-utf8.txt +200 -0
- data/lib/training_data/ko-utf8.txt +147 -0
- data/lib/training_data/nl-utf8.txt +215 -0
- data/lib/training_data/no-utf8.txt +281 -0
- data/lib/training_data/pl-utf8.txt +120 -0
- data/lib/training_data/pt-utf8.txt +214 -0
- data/lib/training_data/ro-utf8.txt +66 -0
- data/lib/training_data/ru-utf8.txt +310 -0
- data/lib/training_data/sl-utf8.txt +263 -0
- data/lib/training_data/sv-utf8.txt +174 -0
- data/lib/training_data/th-utf8.txt +49 -0
- data/lib/training_data/tk-utf8.txt +101 -0
- data/lib/training_data/todo/af.txt +114 -0
- data/lib/training_data/todo/amharic-utf.txt +95 -0
- data/lib/training_data/todo/arabic-windows1256.txt +157 -0
- data/lib/training_data/todo/armenian.txt +86 -0
- data/lib/training_data/todo/basque.txt +136 -0
- data/lib/training_data/todo/belarus-windows1251.txt +97 -0
- data/lib/training_data/todo/bosnian.txt +97 -0
- data/lib/training_data/todo/breton.txt +159 -0
- data/lib/training_data/todo/bulgarian-iso8859_5.txt +115 -0
- data/lib/training_data/todo/catalan.txt +93 -0
- data/lib/training_data/todo/croatian-ascii.txt +104 -0
- data/lib/training_data/todo/esperanto.txt +95 -0
- data/lib/training_data/todo/estonian.txt +218 -0
- data/lib/training_data/todo/frisian.txt +99 -0
- data/lib/training_data/todo/georgian.txt +86 -0
- data/lib/training_data/todo/greek-iso8859-7.txt +139 -0
- data/lib/training_data/todo/hawaian.txt +108 -0
- data/lib/training_data/todo/hebrew-iso8859_8.txt +79 -0
- data/lib/training_data/todo/hindi.txt +77 -0
- data/lib/training_data/todo/hungarian.txt +102 -0
- data/lib/training_data/todo/icelandic.txt +131 -0
- data/lib/training_data/todo/indonesian.txt +93 -0
- data/lib/training_data/todo/irish.txt +209 -0
- data/lib/training_data/todo/latin.txt +120 -0
- data/lib/training_data/todo/latvian.txt +126 -0
- data/lib/training_data/todo/lithuanian.txt +99 -0
- data/lib/training_data/todo/malay.txt +108 -0
- data/lib/training_data/todo/manx.txt +78 -0
- data/lib/training_data/todo/marathi.txt +100 -0
- data/lib/training_data/todo/mf.txt +100 -0
- data/lib/training_data/todo/middle_frisian.txt +102 -0
- data/lib/training_data/todo/mingo.txt +146 -0
- data/lib/training_data/todo/nepali.txt +131 -0
- data/lib/training_data/todo/persian.txt +73 -0
- data/lib/training_data/todo/quechua.txt +108 -0
- data/lib/training_data/todo/romanian.txt +103 -0
- data/lib/training_data/todo/rumantsch.txt +110 -0
- data/lib/training_data/todo/sanskrit.txt +135 -0
- data/lib/training_data/todo/scots.txt +490 -0
- data/lib/training_data/todo/scots_gaelic.txt +93 -0
- data/lib/training_data/todo/serbian-ascii.txt +121 -0
- data/lib/training_data/todo/slovak-ascii.txt +102 -0
- data/lib/training_data/todo/slovak-windows1250.txt +115 -0
- data/lib/training_data/todo/slovenian-ascii.txt +100 -0
- data/lib/training_data/todo/slovenian-iso8859_2.txt +96 -0
- data/lib/training_data/todo/sq.txt +110 -0
- data/lib/training_data/todo/swahili.txt +120 -0
- data/lib/training_data/todo/tagalog.txt +135 -0
- data/lib/training_data/todo/tamil.txt +123 -0
- data/lib/training_data/todo/turkish.txt +117 -0
- data/lib/training_data/todo/ukrainian-koi8_r.txt +214 -0
- data/lib/training_data/todo/vietnamese.txt +92 -0
- data/lib/training_data/todo/welsh.txt +148 -0
- data/lib/training_data/todo/yiddish-utf.txt +83 -0
- data/lib/training_data/uk-utf8.txt +75 -0
- data/lib/training_data/vi-utf8.txt +47 -0
- data/lib/training_data/zh-utf8.txt +228 -0
- data/test/language_detector_test.rb +78 -0
- metadata +232 -0
@@ -0,0 +1,400 @@
|
|
1
|
+
_ 24504
|
2
|
+
a 8735
|
3
|
+
i 7353
|
4
|
+
s 6064
|
5
|
+
t 5176
|
6
|
+
e 4390
|
7
|
+
r 4339
|
8
|
+
u 4200
|
9
|
+
n 3422
|
10
|
+
� 3055
|
11
|
+
m 2817
|
12
|
+
p 2755
|
13
|
+
k 2703
|
14
|
+
o 2643
|
15
|
+
s_ 2595
|
16
|
+
d 2131
|
17
|
+
l 2035
|
18
|
+
j 1972
|
19
|
+
� 1958
|
20
|
+
ie 1887
|
21
|
+
v 1822
|
22
|
+
as 1530
|
23
|
+
u_ 1396
|
24
|
+
_p 1380
|
25
|
+
b 1357
|
26
|
+
z 1311
|
27
|
+
� 1267
|
28
|
+
a_ 1261
|
29
|
+
as_ 1217
|
30
|
+
. 1065
|
31
|
+
, 1048
|
32
|
+
,_ 1033
|
33
|
+
g 1010
|
34
|
+
ar 970
|
35
|
+
� 965
|
36
|
+
ti 962
|
37
|
+
c 922
|
38
|
+
_a 876
|
39
|
+
ja 838
|
40
|
+
st 828
|
41
|
+
_i 822
|
42
|
+
_v 805
|
43
|
+
pa 792
|
44
|
+
_t 775
|
45
|
+
._ 774
|
46
|
+
um 760
|
47
|
+
_k 749
|
48
|
+
�_ 734
|
49
|
+
_n 728
|
50
|
+
es 712
|
51
|
+
i_ 706
|
52
|
+
at 703
|
53
|
+
is 695
|
54
|
+
_s 680
|
55
|
+
ai 649
|
56
|
+
ta 635
|
57
|
+
an 631
|
58
|
+
ka 621
|
59
|
+
r_ 615
|
60
|
+
�b 586
|
61
|
+
ij 585
|
62
|
+
_u 568
|
63
|
+
_pa 548
|
64
|
+
un 541
|
65
|
+
no 539
|
66
|
+
va 537
|
67
|
+
ma 525
|
68
|
+
ra 522
|
69
|
+
ri 515
|
70
|
+
iz 512
|
71
|
+
in 509
|
72
|
+
vi 508
|
73
|
+
pr 506
|
74
|
+
sa 487
|
75
|
+
ju 486
|
76
|
+
t� 483
|
77
|
+
ik 473
|
78
|
+
n_ 472
|
79
|
+
am 454
|
80
|
+
en 452
|
81
|
+
tie 440
|
82
|
+
na 432
|
83
|
+
�a 430
|
84
|
+
tu 420
|
85
|
+
ija 420
|
86
|
+
ir 419
|
87
|
+
o_ 415
|
88
|
+
m_ 414
|
89
|
+
li 411
|
90
|
+
ci 409
|
91
|
+
ku 404
|
92
|
+
mi 401
|
93
|
+
_no 398
|
94
|
+
ek 398
|
95
|
+
_un 397
|
96
|
+
t_ 395
|
97
|
+
_l 394
|
98
|
+
un_ 393
|
99
|
+
_d 393
|
100
|
+
ot 392
|
101
|
+
_un_ 392
|
102
|
+
ies 391
|
103
|
+
ar_ 388
|
104
|
+
n� 387
|
105
|
+
da 387
|
106
|
+
ei 385
|
107
|
+
em 382
|
108
|
+
_ti 382
|
109
|
+
pi 380
|
110
|
+
al 368
|
111
|
+
ba 356
|
112
|
+
ts 355
|
113
|
+
_iz 353
|
114
|
+
ap 350
|
115
|
+
jas 349
|
116
|
+
ko 346
|
117
|
+
au 345
|
118
|
+
�an 339
|
119
|
+
re 339
|
120
|
+
ni 337
|
121
|
+
k� 328
|
122
|
+
ro 327
|
123
|
+
et 326
|
124
|
+
r� 325
|
125
|
+
ga 323
|
126
|
+
mu 322
|
127
|
+
jas_ 321
|
128
|
+
tr 317
|
129
|
+
_va 312
|
130
|
+
te 310
|
131
|
+
_pr 307
|
132
|
+
sp 298
|
133
|
+
sk 297
|
134
|
+
ne 295
|
135
|
+
�ba 293
|
136
|
+
�s 289
|
137
|
+
ijas 287
|
138
|
+
_ar 283
|
139
|
+
la 283
|
140
|
+
to 282
|
141
|
+
ad 280
|
142
|
+
dz 278
|
143
|
+
�g 277
|
144
|
+
t� 277
|
145
|
+
�j 277
|
146
|
+
_sa 277
|
147
|
+
j� 274
|
148
|
+
_m 273
|
149
|
+
ties 273
|
150
|
+
l� 272
|
151
|
+
ijas_ 269
|
152
|
+
_at 269
|
153
|
+
ed 267
|
154
|
+
_pi 267
|
155
|
+
� 267
|
156
|
+
s, 265
|
157
|
+
s,_ 265
|
158
|
+
�r 261
|
159
|
+
gu 258
|
160
|
+
f 258
|
161
|
+
si 257
|
162
|
+
m� 256
|
163
|
+
nt 254
|
164
|
+
tu_ 254
|
165
|
+
_r 253
|
166
|
+
ru 252
|
167
|
+
�j 251
|
168
|
+
jum 251
|
169
|
+
�s_ 250
|
170
|
+
�t 249
|
171
|
+
iem 248
|
172
|
+
_b 248
|
173
|
+
_vi 245
|
174
|
+
par 244
|
175
|
+
pie 244
|
176
|
+
rt 243
|
177
|
+
v� 242
|
178
|
+
_ne 240
|
179
|
+
�r 240
|
180
|
+
ai_ 239
|
181
|
+
_. 239
|
182
|
+
_j 237
|
183
|
+
us 237
|
184
|
+
_ka 236
|
185
|
+
er 232
|
186
|
+
bas 232
|
187
|
+
_tie 232
|
188
|
+
_par 230
|
189
|
+
di 229
|
190
|
+
� 228
|
191
|
+
ms 228
|
192
|
+
�d 226
|
193
|
+
�bas 224
|
194
|
+
om 220
|
195
|
+
bu 219
|
196
|
+
umu 217
|
197
|
+
iek 216
|
198
|
+
kt 216
|
199
|
+
it 216
|
200
|
+
r� 215
|
201
|
+
_ko 214
|
202
|
+
ana 211
|
203
|
+
�k 211
|
204
|
+
or 210
|
205
|
+
de 210
|
206
|
+
in� 207
|
207
|
+
d� 204
|
208
|
+
ur 203
|
209
|
+
pri 203
|
210
|
+
_c 202
|
211
|
+
ta_ 202
|
212
|
+
bas_ 201
|
213
|
+
es_ 201
|
214
|
+
_pie 200
|
215
|
+
il 200
|
216
|
+
os 199
|
217
|
+
�ana 199
|
218
|
+
id 198
|
219
|
+
L 198
|
220
|
+
_ie 197
|
221
|
+
bi 194
|
222
|
+
ak 194
|
223
|
+
ja_ 194
|
224
|
+
�bas_ 193
|
225
|
+
�t 192
|
226
|
+
�bu 192
|
227
|
+
_g 191
|
228
|
+
� 189
|
229
|
+
ma_ 189
|
230
|
+
ien 188
|
231
|
+
kum 187
|
232
|
+
� 187
|
233
|
+
_ir 186
|
234
|
+
on 186
|
235
|
+
_ties 185
|
236
|
+
z� 185
|
237
|
+
ce 185
|
238
|
+
ied 184
|
239
|
+
ist 183
|
240
|
+
ts_ 183
|
241
|
+
_� 183
|
242
|
+
�_ 182
|
243
|
+
�m 181
|
244
|
+
vie 180
|
245
|
+
_�_ 180
|
246
|
+
cij 180
|
247
|
+
ka_ 179
|
248
|
+
_ap 175
|
249
|
+
s� 174
|
250
|
+
ir_ 174
|
251
|
+
zi 174
|
252
|
+
uma 173
|
253
|
+
�l 172
|
254
|
+
_ir_ 172
|
255
|
+
o� 171
|
256
|
+
_da 169
|
257
|
+
�_ 168
|
258
|
+
ar� 168
|
259
|
+
) 167
|
260
|
+
do 166
|
261
|
+
ve 166
|
262
|
+
( 165
|
263
|
+
ls 165
|
264
|
+
bu_ 164
|
265
|
+
val 164
|
266
|
+
mu_ 164
|
267
|
+
isk 163
|
268
|
+
uz 161
|
269
|
+
av 160
|
270
|
+
par_ 160
|
271
|
+
_v� 159
|
272
|
+
_par_ 158
|
273
|
+
v�r 158
|
274
|
+
_ar_ 157
|
275
|
+
rie 157
|
276
|
+
_uz 157
|
277
|
+
aj 156
|
278
|
+
�bu_ 156
|
279
|
+
oj 155
|
280
|
+
k�_ 155
|
281
|
+
ld 154
|
282
|
+
iet 154
|
283
|
+
iku 154
|
284
|
+
ks 153
|
285
|
+
du 153
|
286
|
+
ep 153
|
287
|
+
ms_ 152
|
288
|
+
ec 152
|
289
|
+
V 151
|
290
|
+
ais 150
|
291
|
+
str 150
|
292
|
+
nie 149
|
293
|
+
am_ 149
|
294
|
+
ums 148
|
295
|
+
_( 147
|
296
|
+
ju_ 146
|
297
|
+
z_ 142
|
298
|
+
ru_ 142
|
299
|
+
�j 142
|
300
|
+
gum 142
|
301
|
+
u,_ 141
|
302
|
+
u, 141
|
303
|
+
i� 141
|
304
|
+
uma_ 141
|
305
|
+
�rt 141
|
306
|
+
�gu 141
|
307
|
+
me 140
|
308
|
+
d� 140
|
309
|
+
�t 140
|
310
|
+
ent 139
|
311
|
+
ikum 138
|
312
|
+
p� 138
|
313
|
+
em_ 138
|
314
|
+
_L 138
|
315
|
+
lie 136
|
316
|
+
sta 136
|
317
|
+
r�_ 136
|
318
|
+
lst 136
|
319
|
+
eik 135
|
320
|
+
se 135
|
321
|
+
s. 134
|
322
|
+
pro 134
|
323
|
+
rs 134
|
324
|
+
s._ 134
|
325
|
+
tik 134
|
326
|
+
l� 134
|
327
|
+
ska 133
|
328
|
+
pap 133
|
329
|
+
kas 133
|
330
|
+
rm 133
|
331
|
+
�ju 133
|
332
|
+
p� 132
|
333
|
+
nu 132
|
334
|
+
T 132
|
335
|
+
p� 131
|
336
|
+
tei 131
|
337
|
+
nas 131
|
338
|
+
_V 131
|
339
|
+
jo 131
|
340
|
+
l�g 131
|
341
|
+
ut 131
|
342
|
+
iem_ 130
|
343
|
+
ras 129
|
344
|
+
pu 129
|
345
|
+
_li 129
|
346
|
+
_ga 128
|
347
|
+
dar 128
|
348
|
+
_k� 128
|
349
|
+
umu_ 127
|
350
|
+
�v 126
|
351
|
+
�gum 126
|
352
|
+
kas_ 126
|
353
|
+
t�b 125
|
354
|
+
vai 125
|
355
|
+
l�gu 125
|
356
|
+
P 125
|
357
|
+
ar�_ 125
|
358
|
+
ev 124
|
359
|
+
lai 124
|
360
|
+
�r 124
|
361
|
+
l�gum 124
|
362
|
+
tv 123
|
363
|
+
a� 123
|
364
|
+
_ar�_ 122
|
365
|
+
_ar� 122
|
366
|
+
_vie 121
|
367
|
+
S 121
|
368
|
+
_T 120
|
369
|
+
�ju 120
|
370
|
+
teik 120
|
371
|
+
cija 119
|
372
|
+
rb 119
|
373
|
+
_� 119
|
374
|
+
j�_ 119
|
375
|
+
nas_ 118
|
376
|
+
t�j 118
|
377
|
+
v�rt 118
|
378
|
+
iec 118
|
379
|
+
_la 117
|
380
|
+
�d 116
|
381
|
+
_vai 116
|
382
|
+
�jum 116
|
383
|
+
vien 116
|
384
|
+
als 116
|
385
|
+
_l� 116
|
386
|
+
ap�r 115
|
387
|
+
rts 115
|
388
|
+
isi 115
|
389
|
+
p�r 115
|
390
|
+
pap� 115
|
391
|
+
pap�r 115
|
392
|
+
ap� 115
|
393
|
+
tsp 115
|
394
|
+
m� 114
|
395
|
+
im 114
|
396
|
+
be 114
|
397
|
+
is_ 114
|
398
|
+
alst 114
|
399
|
+
_ja 114
|
400
|
+
rtspa 113
|
@@ -0,0 +1,400 @@
|
|
1
|
+
_ 23070
|
2
|
+
i 8196
|
3
|
+
a 7763
|
4
|
+
s 5179
|
5
|
+
e 3458
|
6
|
+
o 3425
|
7
|
+
u 3371
|
8
|
+
t 3344
|
9
|
+
r 3240
|
10
|
+
n 3070
|
11
|
+
k 3019
|
12
|
+
l 2060
|
13
|
+
p 1889
|
14
|
+
s_ 1756
|
15
|
+
m 1680
|
16
|
+
d 1640
|
17
|
+
v 1590
|
18
|
+
, 1501
|
19
|
+
,_ 1497
|
20
|
+
� 1400
|
21
|
+
g 1302
|
22
|
+
j 1200
|
23
|
+
o_ 1138
|
24
|
+
. 1128
|
25
|
+
ai 1113
|
26
|
+
� 1075
|
27
|
+
_p 1047
|
28
|
+
_k 1035
|
29
|
+
i_ 990
|
30
|
+
._ 984
|
31
|
+
as 975
|
32
|
+
b 937
|
33
|
+
au 903
|
34
|
+
is 863
|
35
|
+
_n 815
|
36
|
+
ka 811
|
37
|
+
si 804
|
38
|
+
_s 799
|
39
|
+
ia 796
|
40
|
+
� 759
|
41
|
+
ta 735
|
42
|
+
ie 731
|
43
|
+
ti 728
|
44
|
+
y 721
|
45
|
+
_t 711
|
46
|
+
in 697
|
47
|
+
_i 686
|
48
|
+
us 675
|
49
|
+
pa 658
|
50
|
+
ir 640
|
51
|
+
ar 633
|
52
|
+
� 620
|
53
|
+
_a 617
|
54
|
+
r_ 609
|
55
|
+
ne 583
|
56
|
+
a_ 578
|
57
|
+
ri 569
|
58
|
+
_v 558
|
59
|
+
_pa 541
|
60
|
+
al 540
|
61
|
+
ra 531
|
62
|
+
li 522
|
63
|
+
� 509
|
64
|
+
u_ 493
|
65
|
+
vi 490
|
66
|
+
_ka 489
|
67
|
+
da 487
|
68
|
+
_ne 482
|
69
|
+
_j 481
|
70
|
+
en 478
|
71
|
+
�_ 445
|
72
|
+
os 444
|
73
|
+
ki 442
|
74
|
+
� 441
|
75
|
+
an 440
|
76
|
+
ik 434
|
77
|
+
ma 433
|
78
|
+
as_ 430
|
79
|
+
st 420
|
80
|
+
_d 420
|
81
|
+
ai_ 417
|
82
|
+
s,_ 396
|
83
|
+
am 396
|
84
|
+
is_ 396
|
85
|
+
s, 396
|
86
|
+
_ir 390
|
87
|
+
jo 387
|
88
|
+
ir_ 385
|
89
|
+
at 384
|
90
|
+
_ir_ 383
|
91
|
+
i� 381
|
92
|
+
ni 377
|
93
|
+
ga 376
|
94
|
+
_b 367
|
95
|
+
na 366
|
96
|
+
e_ 365
|
97
|
+
to 352
|
98
|
+
pr 337
|
99
|
+
_g 332
|
100
|
+
_m 332
|
101
|
+
� 328
|
102
|
+
� 326
|
103
|
+
io 323
|
104
|
+
ei 323
|
105
|
+
�_ 321
|
106
|
+
su 320
|
107
|
+
�i 320
|
108
|
+
uo 319
|
109
|
+
la 317
|
110
|
+
er 303
|
111
|
+
va 299
|
112
|
+
vo 298
|
113
|
+
�i 293
|
114
|
+
es 291
|
115
|
+
- 290
|
116
|
+
�_ 286
|
117
|
+
-_ 285
|
118
|
+
_vi 284
|
119
|
+
_- 283
|
120
|
+
ko 283
|
121
|
+
_-_ 283
|
122
|
+
iau 281
|
123
|
+
sa 278
|
124
|
+
s. 278
|
125
|
+
iu 276
|
126
|
+
et 274
|
127
|
+
nu 265
|
128
|
+
ja 262
|
129
|
+
�_ 262
|
130
|
+
_ta 262
|
131
|
+
s._ 259
|
132
|
+
el 258
|
133
|
+
�j 258
|
134
|
+
os_ 256
|
135
|
+
im 255
|
136
|
+
it 254
|
137
|
+
_pr 253
|
138
|
+
no 252
|
139
|
+
av 251
|
140
|
+
ur 251
|
141
|
+
_� 248
|
142
|
+
mi 246
|
143
|
+
ve 245
|
144
|
+
ak 245
|
145
|
+
ku 243
|
146
|
+
ek 241
|
147
|
+
tu 241
|
148
|
+
_� 241
|
149
|
+
ad 241
|
150
|
+
� 238
|
151
|
+
_l 238
|
152
|
+
_i� 236
|
153
|
+
us_ 236
|
154
|
+
_su 232
|
155
|
+
oj 231
|
156
|
+
au_ 231
|
157
|
+
ba 224
|
158
|
+
nt 218
|
159
|
+
me 214
|
160
|
+
te 210
|
161
|
+
jo_ 208
|
162
|
+
ro 205
|
163
|
+
�s 204
|
164
|
+
i� 203
|
165
|
+
tai 203
|
166
|
+
_� 201
|
167
|
+
l� 201
|
168
|
+
pas 200
|
169
|
+
ip 198
|
170
|
+
iai 197
|
171
|
+
di 195
|
172
|
+
usi 194
|
173
|
+
vo_ 193
|
174
|
+
kai 190
|
175
|
+
i, 189
|
176
|
+
i,_ 189
|
177
|
+
sk 187
|
178
|
+
_r 186
|
179
|
+
aus 184
|
180
|
+
ap 183
|
181
|
+
gi 182
|
182
|
+
mo 182
|
183
|
+
uk 181
|
184
|
+
t_ 180
|
185
|
+
_da 177
|
186
|
+
be 176
|
187
|
+
ien 176
|
188
|
+
o, 174
|
189
|
+
il 174
|
190
|
+
o,_ 173
|
191
|
+
ti_ 173
|
192
|
+
re 172
|
193
|
+
_nu 171
|
194
|
+
�ia 171
|
195
|
+
_pas 169
|
196
|
+
pri 169
|
197
|
+
�_ 169
|
198
|
+
ok 168
|
199
|
+
d� 166
|
200
|
+
�l 162
|
201
|
+
bu 161
|
202
|
+
�i 160
|
203
|
+
on 160
|
204
|
+
asi 159
|
205
|
+
id 158
|
206
|
+
ul 157
|
207
|
+
ji 157
|
208
|
+
aip 156
|
209
|
+
ia_ 155
|
210
|
+
_sa 154
|
211
|
+
ot 154
|
212
|
+
gal 153
|
213
|
+
nk 153
|
214
|
+
om 152
|
215
|
+
p_ 151
|
216
|
+
_pri 151
|
217
|
+
od 151
|
218
|
+
vis 150
|
219
|
+
_at 150
|
220
|
+
vie 150
|
221
|
+
uv 150
|
222
|
+
ab 150
|
223
|
+
i�_ 149
|
224
|
+
ama 149
|
225
|
+
n� 149
|
226
|
+
A 149
|
227
|
+
sta 148
|
228
|
+
kr 148
|
229
|
+
_A 145
|
230
|
+
ais 144
|
231
|
+
rt 143
|
232
|
+
J 142
|
233
|
+
_J 142
|
234
|
+
�jo 142
|
235
|
+
_�_ 141
|
236
|
+
K 140
|
237
|
+
_K 139
|
238
|
+
pi 139
|
239
|
+
avo 139
|
240
|
+
ng 139
|
241
|
+
mas 138
|
242
|
+
du 138
|
243
|
+
ug 137
|
244
|
+
_ga 137
|
245
|
+
ol 136
|
246
|
+
tik 135
|
247
|
+
ali 135
|
248
|
+
.. 135
|
249
|
+
_vis 135
|
250
|
+
iek 134
|
251
|
+
ini 133
|
252
|
+
kad 133
|
253
|
+
a, 133
|
254
|
+
le 133
|
255
|
+
k� 133
|
256
|
+
T 133
|
257
|
+
t� 132
|
258
|
+
i. 132
|
259
|
+
_T 131
|
260
|
+
d� 131
|
261
|
+
a,_ 131
|
262
|
+
go 131
|
263
|
+
ip_ 131
|
264
|
+
aip_ 131
|
265
|
+
r� 129
|
266
|
+
a� 129
|
267
|
+
d�i 129
|
268
|
+
ke 128
|
269
|
+
k_ 128
|
270
|
+
d_ 127
|
271
|
+
ad_ 127
|
272
|
+
_ti 127
|
273
|
+
_ma 126
|
274
|
+
_va 125
|
275
|
+
i._ 124
|
276
|
+
z 123
|
277
|
+
�k 123
|
278
|
+
iau_ 121
|
279
|
+
m_ 120
|
280
|
+
kar 119
|
281
|
+
um 119
|
282
|
+
t� 119
|
283
|
+
_kad 118
|
284
|
+
u� 117
|
285
|
+
tr 117
|
286
|
+
_kai 117
|
287
|
+
as, 116
|
288
|
+
og 116
|
289
|
+
kad_ 116
|
290
|
+
as,_ 116
|
291
|
+
_ji 116
|
292
|
+
rie 115
|
293
|
+
yt 114
|
294
|
+
_ja 114
|
295
|
+
_ko 114
|
296
|
+
v� 114
|
297
|
+
ys 114
|
298
|
+
jau 113
|
299
|
+
ar_ 113
|
300
|
+
pra 112
|
301
|
+
a� 112
|
302
|
+
ant 112
|
303
|
+
kl 111
|
304
|
+
tas 111
|
305
|
+
gu 111
|
306
|
+
_ku 110
|
307
|
+
si_ 110
|
308
|
+
pe 109
|
309
|
+
eb 109
|
310
|
+
N 109
|
311
|
+
�jo_ 108
|
312
|
+
_kad_ 108
|
313
|
+
se 108
|
314
|
+
_ki 108
|
315
|
+
or 107
|
316
|
+
ly 107
|
317
|
+
lo 107
|
318
|
+
iai_ 107
|
319
|
+
_la 106
|
320
|
+
ts 106
|
321
|
+
�s 106
|
322
|
+
ig 105
|
323
|
+
_N 105
|
324
|
+
ut 105
|
325
|
+
_u 105
|
326
|
+
�s_ 105
|
327
|
+
avo_ 104
|
328
|
+
ie_ 104
|
329
|
+
a. 104
|
330
|
+
kt 104
|
331
|
+
em 103
|
332
|
+
do 103
|
333
|
+
je 102
|
334
|
+
ks 102
|
335
|
+
ats 101
|
336
|
+
_be 101
|
337
|
+
ris 101
|
338
|
+
l_ 101
|
339
|
+
_vie 101
|
340
|
+
tin 101
|
341
|
+
ag 100
|
342
|
+
dam 100
|
343
|
+
_st 100
|
344
|
+
a._ 99
|
345
|
+
_bu 99
|
346
|
+
? 99
|
347
|
+
V 98
|
348
|
+
io_ 98
|
349
|
+
kas 98
|
350
|
+
_jo 98
|
351
|
+
vien 97
|
352
|
+
_gal 97
|
353
|
+
�t 97
|
354
|
+
kia 97
|
355
|
+
lia 96
|
356
|
+
c 96
|
357
|
+
uri 96
|
358
|
+
_V 96
|
359
|
+
?_ 96
|
360
|
+
uvo 95
|
361
|
+
ru 95
|
362
|
+
ty 95
|
363
|
+
ep 94
|
364
|
+
nd 94
|
365
|
+
lai 94
|
366
|
+
_tai 94
|
367
|
+
ju 93
|
368
|
+
man 92
|
369
|
+
o. 92
|
370
|
+
buv 92
|
371
|
+
t� 92
|
372
|
+
_�i 91
|
373
|
+
i�_ 91
|
374
|
+
_i�_ 91
|
375
|
+
i�k 90
|
376
|
+
o._ 90
|
377
|
+
_to 90
|
378
|
+
bi 90
|
379
|
+
up 89
|
380
|
+
po 89
|
381
|
+
rs 89
|
382
|
+
_prie 88
|
383
|
+
�,_ 88
|
384
|
+
aik 88
|
385
|
+
ui 88
|
386
|
+
_tik 88
|
387
|
+
ij 88
|
388
|
+
�, 88
|
389
|
+
pat 88
|
390
|
+
prie 88
|
391
|
+
I 87
|
392
|
+
ies 87
|
393
|
+
tai_ 87
|
394
|
+
n_ 87
|
395
|
+
pasi 87
|
396
|
+
ius 87
|
397
|
+
�t 87
|
398
|
+
eik 86
|
399
|
+
_me 86
|
400
|
+
ina 86
|