language_detector 0.1.0
Sign up to get free protection for your applications and to get access to all the features.
- data/README.rdoc +24 -0
- data/Rakefile +18 -0
- data/VERSION +1 -0
- data/lib/language_detector.rb +232 -0
- data/lib/model-fm.yml +52504 -0
- data/lib/model-tc.yml +53985 -0
- data/lib/textcat_ngrams/afrikaans.lm +400 -0
- data/lib/textcat_ngrams/albanian.lm +400 -0
- data/lib/textcat_ngrams/amharic-utf.lm +400 -0
- data/lib/textcat_ngrams/arabic-iso8859_6.lm +400 -0
- data/lib/textcat_ngrams/arabic-windows1256.lm +400 -0
- data/lib/textcat_ngrams/armenian.lm +400 -0
- data/lib/textcat_ngrams/basque.lm +400 -0
- data/lib/textcat_ngrams/belarus-windows1251.lm +400 -0
- data/lib/textcat_ngrams/bosnian.lm +400 -0
- data/lib/textcat_ngrams/breton.lm +400 -0
- data/lib/textcat_ngrams/bulgarian-iso8859_5.lm +400 -0
- data/lib/textcat_ngrams/catalan.lm +400 -0
- data/lib/textcat_ngrams/chinese-big5.lm +400 -0
- data/lib/textcat_ngrams/chinese-gb2312.lm +400 -0
- data/lib/textcat_ngrams/croatian-ascii.lm +400 -0
- data/lib/textcat_ngrams/czech-iso8859_2.lm +400 -0
- data/lib/textcat_ngrams/danish.lm +400 -0
- data/lib/textcat_ngrams/dutch.lm +400 -0
- data/lib/textcat_ngrams/english.lm +400 -0
- data/lib/textcat_ngrams/esperanto.lm +400 -0
- data/lib/textcat_ngrams/estonian.lm +400 -0
- data/lib/textcat_ngrams/finnish.lm +400 -0
- data/lib/textcat_ngrams/french.lm +400 -0
- data/lib/textcat_ngrams/frisian.lm +400 -0
- data/lib/textcat_ngrams/georgian.lm +400 -0
- data/lib/textcat_ngrams/german.lm +400 -0
- data/lib/textcat_ngrams/greek-iso8859-7.lm +400 -0
- data/lib/textcat_ngrams/hebrew-iso8859_8.lm +400 -0
- data/lib/textcat_ngrams/hindi.lm +400 -0
- data/lib/textcat_ngrams/hungarian.lm +400 -0
- data/lib/textcat_ngrams/icelandic.lm +400 -0
- data/lib/textcat_ngrams/indonesian.lm +400 -0
- data/lib/textcat_ngrams/irish.lm +400 -0
- data/lib/textcat_ngrams/italian.lm +400 -0
- data/lib/textcat_ngrams/japanese-euc_jp.lm +400 -0
- data/lib/textcat_ngrams/japanese-shift_jis.lm +400 -0
- data/lib/textcat_ngrams/korean.lm +400 -0
- data/lib/textcat_ngrams/latin.lm +400 -0
- data/lib/textcat_ngrams/latvian.lm +400 -0
- data/lib/textcat_ngrams/lithuanian.lm +400 -0
- data/lib/textcat_ngrams/malay.lm +400 -0
- data/lib/textcat_ngrams/manx.lm +400 -0
- data/lib/textcat_ngrams/marathi.lm +400 -0
- data/lib/textcat_ngrams/mingo.lm +400 -0
- data/lib/textcat_ngrams/nepali.lm +400 -0
- data/lib/textcat_ngrams/norwegian.lm +400 -0
- data/lib/textcat_ngrams/persian.lm +400 -0
- data/lib/textcat_ngrams/polish.lm +400 -0
- data/lib/textcat_ngrams/portuguese.lm +400 -0
- data/lib/textcat_ngrams/quechua.lm +400 -0
- data/lib/textcat_ngrams/romanian.lm +400 -0
- data/lib/textcat_ngrams/rumantsch.lm +400 -0
- data/lib/textcat_ngrams/russian-iso8859_5.lm +400 -0
- data/lib/textcat_ngrams/russian-koi8_r.lm +400 -0
- data/lib/textcat_ngrams/russian-windows1251.lm +400 -0
- data/lib/textcat_ngrams/sanskrit.lm +400 -0
- data/lib/textcat_ngrams/scots.lm +400 -0
- data/lib/textcat_ngrams/scots_gaelic.lm +400 -0
- data/lib/textcat_ngrams/serbian-ascii.lm +400 -0
- data/lib/textcat_ngrams/slovak-ascii.lm +400 -0
- data/lib/textcat_ngrams/slovak-windows1250.lm +400 -0
- data/lib/textcat_ngrams/slovenian-ascii.lm +400 -0
- data/lib/textcat_ngrams/slovenian-iso8859_2.lm +400 -0
- data/lib/textcat_ngrams/spanish.lm +400 -0
- data/lib/textcat_ngrams/swahili.lm +400 -0
- data/lib/textcat_ngrams/swedish.lm +400 -0
- data/lib/textcat_ngrams/tagalog.lm +400 -0
- data/lib/textcat_ngrams/tamil.lm +400 -0
- data/lib/textcat_ngrams/thai.lm +400 -0
- data/lib/textcat_ngrams/turkish.lm +400 -0
- data/lib/textcat_ngrams/ukrainian-koi8_u.lm +400 -0
- data/lib/textcat_ngrams/vietnamese.lm +400 -0
- data/lib/textcat_ngrams/welsh.lm +400 -0
- data/lib/textcat_ngrams/yiddish-utf.lm +400 -0
- data/lib/training_data/ar-utf8.txt +54 -0
- data/lib/training_data/bg-utf8.txt +26 -0
- data/lib/training_data/cs-utf8.txt +48 -0
- data/lib/training_data/da-utf8.txt +159 -0
- data/lib/training_data/de-utf8.txt +569 -0
- data/lib/training_data/el-utf8.txt +48 -0
- data/lib/training_data/en-utf8.txt +81 -0
- data/lib/training_data/es-utf8.txt +185 -0
- data/lib/training_data/et-utf8.txt +50 -0
- data/lib/training_data/fa-utf8.txt +42 -0
- data/lib/training_data/fi-utf8.txt +83 -0
- data/lib/training_data/fr-utf8.txt +191 -0
- data/lib/training_data/fy-utf8.txt +22 -0
- data/lib/training_data/ga-utf8.txt +109 -0
- data/lib/training_data/he-utf8.txt +116 -0
- data/lib/training_data/hi-utf8.txt +49 -0
- data/lib/training_data/hr-utf8.txt +80 -0
- data/lib/training_data/hu-utf8.txt +87 -0
- data/lib/training_data/io-utf8.txt +41 -0
- data/lib/training_data/is-utf8.txt +94 -0
- data/lib/training_data/it-utf8.txt +228 -0
- data/lib/training_data/ja-utf8.txt +200 -0
- data/lib/training_data/ko-utf8.txt +147 -0
- data/lib/training_data/nl-utf8.txt +215 -0
- data/lib/training_data/no-utf8.txt +281 -0
- data/lib/training_data/pl-utf8.txt +120 -0
- data/lib/training_data/pt-utf8.txt +214 -0
- data/lib/training_data/ro-utf8.txt +66 -0
- data/lib/training_data/ru-utf8.txt +310 -0
- data/lib/training_data/sl-utf8.txt +263 -0
- data/lib/training_data/sv-utf8.txt +174 -0
- data/lib/training_data/th-utf8.txt +49 -0
- data/lib/training_data/tk-utf8.txt +101 -0
- data/lib/training_data/todo/af.txt +114 -0
- data/lib/training_data/todo/amharic-utf.txt +95 -0
- data/lib/training_data/todo/arabic-windows1256.txt +157 -0
- data/lib/training_data/todo/armenian.txt +86 -0
- data/lib/training_data/todo/basque.txt +136 -0
- data/lib/training_data/todo/belarus-windows1251.txt +97 -0
- data/lib/training_data/todo/bosnian.txt +97 -0
- data/lib/training_data/todo/breton.txt +159 -0
- data/lib/training_data/todo/bulgarian-iso8859_5.txt +115 -0
- data/lib/training_data/todo/catalan.txt +93 -0
- data/lib/training_data/todo/croatian-ascii.txt +104 -0
- data/lib/training_data/todo/esperanto.txt +95 -0
- data/lib/training_data/todo/estonian.txt +218 -0
- data/lib/training_data/todo/frisian.txt +99 -0
- data/lib/training_data/todo/georgian.txt +86 -0
- data/lib/training_data/todo/greek-iso8859-7.txt +139 -0
- data/lib/training_data/todo/hawaian.txt +108 -0
- data/lib/training_data/todo/hebrew-iso8859_8.txt +79 -0
- data/lib/training_data/todo/hindi.txt +77 -0
- data/lib/training_data/todo/hungarian.txt +102 -0
- data/lib/training_data/todo/icelandic.txt +131 -0
- data/lib/training_data/todo/indonesian.txt +93 -0
- data/lib/training_data/todo/irish.txt +209 -0
- data/lib/training_data/todo/latin.txt +120 -0
- data/lib/training_data/todo/latvian.txt +126 -0
- data/lib/training_data/todo/lithuanian.txt +99 -0
- data/lib/training_data/todo/malay.txt +108 -0
- data/lib/training_data/todo/manx.txt +78 -0
- data/lib/training_data/todo/marathi.txt +100 -0
- data/lib/training_data/todo/mf.txt +100 -0
- data/lib/training_data/todo/middle_frisian.txt +102 -0
- data/lib/training_data/todo/mingo.txt +146 -0
- data/lib/training_data/todo/nepali.txt +131 -0
- data/lib/training_data/todo/persian.txt +73 -0
- data/lib/training_data/todo/quechua.txt +108 -0
- data/lib/training_data/todo/romanian.txt +103 -0
- data/lib/training_data/todo/rumantsch.txt +110 -0
- data/lib/training_data/todo/sanskrit.txt +135 -0
- data/lib/training_data/todo/scots.txt +490 -0
- data/lib/training_data/todo/scots_gaelic.txt +93 -0
- data/lib/training_data/todo/serbian-ascii.txt +121 -0
- data/lib/training_data/todo/slovak-ascii.txt +102 -0
- data/lib/training_data/todo/slovak-windows1250.txt +115 -0
- data/lib/training_data/todo/slovenian-ascii.txt +100 -0
- data/lib/training_data/todo/slovenian-iso8859_2.txt +96 -0
- data/lib/training_data/todo/sq.txt +110 -0
- data/lib/training_data/todo/swahili.txt +120 -0
- data/lib/training_data/todo/tagalog.txt +135 -0
- data/lib/training_data/todo/tamil.txt +123 -0
- data/lib/training_data/todo/turkish.txt +117 -0
- data/lib/training_data/todo/ukrainian-koi8_r.txt +214 -0
- data/lib/training_data/todo/vietnamese.txt +92 -0
- data/lib/training_data/todo/welsh.txt +148 -0
- data/lib/training_data/todo/yiddish-utf.txt +83 -0
- data/lib/training_data/uk-utf8.txt +75 -0
- data/lib/training_data/vi-utf8.txt +47 -0
- data/lib/training_data/zh-utf8.txt +228 -0
- data/test/language_detector_test.rb +78 -0
- metadata +232 -0
@@ -0,0 +1,400 @@
|
|
1
|
+
_ 6290
|
2
|
+
� 5252
|
3
|
+
� 4377
|
4
|
+
� 3920
|
5
|
+
� 3050
|
6
|
+
� 2984
|
7
|
+
� 2657
|
8
|
+
� 2522
|
9
|
+
� 2454
|
10
|
+
� 2369
|
11
|
+
� 2304
|
12
|
+
� 2158
|
13
|
+
� 1981
|
14
|
+
� 1908
|
15
|
+
� 1693
|
16
|
+
� 1543
|
17
|
+
� 1443
|
18
|
+
� 1422
|
19
|
+
� 1398
|
20
|
+
� 1398
|
21
|
+
� 1301
|
22
|
+
� 1245
|
23
|
+
� 1239
|
24
|
+
� 1210
|
25
|
+
� 1181
|
26
|
+
� 1081
|
27
|
+
� 1045
|
28
|
+
� 978
|
29
|
+
�� 951
|
30
|
+
� 907
|
31
|
+
� 892
|
32
|
+
�� 829
|
33
|
+
� 795
|
34
|
+
�� 735
|
35
|
+
� 722
|
36
|
+
��� 710
|
37
|
+
� 691
|
38
|
+
�� 688
|
39
|
+
� 668
|
40
|
+
ͧ 595
|
41
|
+
. 588
|
42
|
+
� 553
|
43
|
+
� 543
|
44
|
+
�� 532
|
45
|
+
�� 528
|
46
|
+
�� 522
|
47
|
+
�� 522
|
48
|
+
�� 477
|
49
|
+
� 452
|
50
|
+
��� 451
|
51
|
+
�� 443
|
52
|
+
�� 441
|
53
|
+
� 422
|
54
|
+
ҧ 419
|
55
|
+
�� 414
|
56
|
+
� 388
|
57
|
+
�_ 378
|
58
|
+
�� 367
|
59
|
+
�� 360
|
60
|
+
� 354
|
61
|
+
Ѻ 349
|
62
|
+
�_ 347
|
63
|
+
�� 345
|
64
|
+
��� 340
|
65
|
+
�� 337
|
66
|
+
�� 337
|
67
|
+
�� 336
|
68
|
+
��� 336
|
69
|
+
� 334
|
70
|
+
ҹ 333
|
71
|
+
�� 332
|
72
|
+
�� 328
|
73
|
+
�� 325
|
74
|
+
� 322
|
75
|
+
_� 320
|
76
|
+
� 314
|
77
|
+
� 313
|
78
|
+
�� 299
|
79
|
+
ѧ 297
|
80
|
+
ҡ 297
|
81
|
+
�� 296
|
82
|
+
�� 295
|
83
|
+
Ѱ 293
|
84
|
+
�Ѱ 293
|
85
|
+
�� 290
|
86
|
+
� 289
|
87
|
+
��� 288
|
88
|
+
� 285
|
89
|
+
� 280
|
90
|
+
� 273
|
91
|
+
� 268
|
92
|
+
��� 268
|
93
|
+
� 266
|
94
|
+
�� 263
|
95
|
+
ѹ 263
|
96
|
+
� 263
|
97
|
+
�� 256
|
98
|
+
�� 254
|
99
|
+
�� 253
|
100
|
+
�� 252
|
101
|
+
��� 251
|
102
|
+
�� 251
|
103
|
+
� 248
|
104
|
+
� 248
|
105
|
+
�� 248
|
106
|
+
�� 248
|
107
|
+
�� 247
|
108
|
+
�� 247
|
109
|
+
�� 247
|
110
|
+
�� 247
|
111
|
+
͡ 245
|
112
|
+
�� 245
|
113
|
+
�� 244
|
114
|
+
� 244
|
115
|
+
�� 243
|
116
|
+
�� 241
|
117
|
+
_� 240
|
118
|
+
�� 238
|
119
|
+
� 237
|
120
|
+
_� 236
|
121
|
+
�� 234
|
122
|
+
� 227
|
123
|
+
�� 225
|
124
|
+
� 221
|
125
|
+
� 216
|
126
|
+
¡ 214
|
127
|
+
ä 213
|
128
|
+
�� 211
|
129
|
+
�� 211
|
130
|
+
�� 211
|
131
|
+
�� 210
|
132
|
+
Թ 209
|
133
|
+
�� 206
|
134
|
+
�� 202
|
135
|
+
�� 202
|
136
|
+
˹ 201
|
137
|
+
�� 201
|
138
|
+
_� 200
|
139
|
+
�� 197
|
140
|
+
�� 196
|
141
|
+
�_ 193
|
142
|
+
�� 191
|
143
|
+
�� 191
|
144
|
+
�� 188
|
145
|
+
�� 188
|
146
|
+
�� 186
|
147
|
+
�ͧ 184
|
148
|
+
�� 184
|
149
|
+
��� 183
|
150
|
+
�� 183
|
151
|
+
�� 181
|
152
|
+
�� 180
|
153
|
+
�� 179
|
154
|
+
��� 178
|
155
|
+
�ҧ 177
|
156
|
+
��_ 176
|
157
|
+
�ä 176
|
158
|
+
_� 176
|
159
|
+
���� 174
|
160
|
+
�� 174
|
161
|
+
��� 174
|
162
|
+
��� 174
|
163
|
+
Ѵ 172
|
164
|
+
Դ 172
|
165
|
+
���_ 171
|
166
|
+
��� 167
|
167
|
+
�� 167
|
168
|
+
167
|
169
|
+
ҵ 167
|
170
|
+
��� 167
|
171
|
+
��ä 166
|
172
|
+
�� 166
|
173
|
+
�� 165
|
174
|
+
�� 165
|
175
|
+
� 163
|
176
|
+
�� 162
|
177
|
+
�� 161
|
178
|
+
�� 161
|
179
|
+
�_ 161
|
180
|
+
�_ 154
|
181
|
+
�� 154
|
182
|
+
�� 154
|
183
|
+
�ͧ 151
|
184
|
+
���� 151
|
185
|
+
��� 151
|
186
|
+
� 150
|
187
|
+
ѡ 150
|
188
|
+
�_ 148
|
189
|
+
��� 147
|
190
|
+
�� 146
|
191
|
+
�� 146
|
192
|
+
�� 146
|
193
|
+
�_ 146
|
194
|
+
� 145
|
195
|
+
�� 140
|
196
|
+
� 139
|
197
|
+
�ҡ 139
|
198
|
+
�� 138
|
199
|
+
�� 138
|
200
|
+
�� 137
|
201
|
+
�� 136
|
202
|
+
�� 135
|
203
|
+
�Ѻ 134
|
204
|
+
�¡ 133
|
205
|
+
_� 132
|
206
|
+
�� 132
|
207
|
+
�� 132
|
208
|
+
�� 131
|
209
|
+
� 130
|
210
|
+
�� 129
|
211
|
+
ҵ� 129
|
212
|
+
_� 128
|
213
|
+
�� 128
|
214
|
+
��� 128
|
215
|
+
�Ѻ 128
|
216
|
+
ա 128
|
217
|
+
�� 127
|
218
|
+
�� 127
|
219
|
+
�� 126
|
220
|
+
_�� 126
|
221
|
+
�ҵ� 126
|
222
|
+
�� 126
|
223
|
+
�ҵ 126
|
224
|
+
�� 126
|
225
|
+
�� 126
|
226
|
+
_�� 125
|
227
|
+
�� 124
|
228
|
+
�� 124
|
229
|
+
���� 124
|
230
|
+
��� 124
|
231
|
+
�� 123
|
232
|
+
Ҥ 122
|
233
|
+
� 122
|
234
|
+
� 122
|
235
|
+
�� 121
|
236
|
+
�� 121
|
237
|
+
�� 120
|
238
|
+
��� 120
|
239
|
+
ҷ 119
|
240
|
+
��� 119
|
241
|
+
��� 118
|
242
|
+
�� 118
|
243
|
+
�� 117
|
244
|
+
ǹ 117
|
245
|
+
�� 117
|
246
|
+
���� 117
|
247
|
+
���� 117
|
248
|
+
��� 117
|
249
|
+
����� 117
|
250
|
+
�� 116
|
251
|
+
�� 116
|
252
|
+
_��� 116
|
253
|
+
��� 116
|
254
|
+
��� 115
|
255
|
+
�� 115
|
256
|
+
�Ѱ�� 115
|
257
|
+
�� 115
|
258
|
+
� 115
|
259
|
+
Ѱ� 115
|
260
|
+
�. 115
|
261
|
+
Ѱ��� 115
|
262
|
+
�Ѱ� 115
|
263
|
+
���� 115
|
264
|
+
Ѱ�� 115
|
265
|
+
����� 115
|
266
|
+
�� 115
|
267
|
+
_��� 113
|
268
|
+
�� 113
|
269
|
+
�� 113
|
270
|
+
�� 112
|
271
|
+
� 112
|
272
|
+
_� 112
|
273
|
+
��� 111
|
274
|
+
Ի 111
|
275
|
+
��� 111
|
276
|
+
�� 111
|
277
|
+
�� 110
|
278
|
+
_� 110
|
279
|
+
�� 110
|
280
|
+
_� 110
|
281
|
+
Ҩ 109
|
282
|
+
��� 108
|
283
|
+
��¡ 108
|
284
|
+
_� 107
|
285
|
+
ѭ 107
|
286
|
+
�ҹ 107
|
287
|
+
�� 106
|
288
|
+
��� 106
|
289
|
+
_� 106
|
290
|
+
���� 105
|
291
|
+
�� 105
|
292
|
+
Ե 105
|
293
|
+
�� 105
|
294
|
+
�� 103
|
295
|
+
�� 102
|
296
|
+
�_ 102
|
297
|
+
��� 102
|
298
|
+
�� 102
|
299
|
+
�� 102
|
300
|
+
�� 101
|
301
|
+
� 100
|
302
|
+
��� 100
|
303
|
+
�� 100
|
304
|
+
_� 99
|
305
|
+
�� 99
|
306
|
+
��ͧ 99
|
307
|
+
�� 99
|
308
|
+
�_ 98
|
309
|
+
Ъ 98
|
310
|
+
�� 98
|
311
|
+
���� 98
|
312
|
+
¡� 97
|
313
|
+
�� 97
|
314
|
+
�_ 97
|
315
|
+
�� 97
|
316
|
+
Ҫ 97
|
317
|
+
�_ 96
|
318
|
+
�� 96
|
319
|
+
Ѱ� 94
|
320
|
+
Ҿ 94
|
321
|
+
�Ѱ� 94
|
322
|
+
�� 94
|
323
|
+
�� 94
|
324
|
+
�� 93
|
325
|
+
�� 93
|
326
|
+
�� 93
|
327
|
+
��� 92
|
328
|
+
��� 92
|
329
|
+
�. 92
|
330
|
+
Ѱ�� 92
|
331
|
+
�ѹ 92
|
332
|
+
Ѱ��� 92
|
333
|
+
�� 92
|
334
|
+
�Ѱ�� 92
|
335
|
+
��� 92
|
336
|
+
���� 92
|
337
|
+
֧ 92
|
338
|
+
.� 91
|
339
|
+
��� 91
|
340
|
+
á 91
|
341
|
+
_�� 90
|
342
|
+
��� 90
|
343
|
+
��. 90
|
344
|
+
�� 90
|
345
|
+
���� 90
|
346
|
+
��� 90
|
347
|
+
��� 89
|
348
|
+
.�. 89
|
349
|
+
��ҧ 89
|
350
|
+
��_ 89
|
351
|
+
���ҧ 89
|
352
|
+
�ѧ 89
|
353
|
+
�� 89
|
354
|
+
��� 88
|
355
|
+
ͺ 88
|
356
|
+
_� 88
|
357
|
+
�.� 87
|
358
|
+
�ͧ 87
|
359
|
+
�Ъ 87
|
360
|
+
�� 87
|
361
|
+
�� 87
|
362
|
+
�ѧ 87
|
363
|
+
��.�. 87
|
364
|
+
�.�. 87
|
365
|
+
���_ 87
|
366
|
+
� 87
|
367
|
+
�� 87
|
368
|
+
��� 87
|
369
|
+
�� 87
|
370
|
+
��.� 87
|
371
|
+
��Ъ 87
|
372
|
+
�� 87
|
373
|
+
' 86
|
374
|
+
�� 86
|
375
|
+
�� 86
|
376
|
+
��� 86
|
377
|
+
_��. 86
|
378
|
+
�ҧ 86
|
379
|
+
�� 85
|
380
|
+
�� 85
|
381
|
+
§ 85
|
382
|
+
._ 85
|
383
|
+
��� 85
|
384
|
+
�� 85
|
385
|
+
�� 84
|
386
|
+
�� 84
|
387
|
+
��� 84
|
388
|
+
��Ѱ 84
|
389
|
+
�� 84
|
390
|
+
�� 84
|
391
|
+
��� 84
|
392
|
+
_��.� 84
|
393
|
+
�� 83
|
394
|
+
�� 83
|
395
|
+
��� 83
|
396
|
+
���� 83
|
397
|
+
ѵ 82
|
398
|
+
���� 82
|
399
|
+
�� 82
|
400
|
+
�_ 82
|
@@ -0,0 +1,400 @@
|
|
1
|
+
_ 23226
|
2
|
+
i 8957
|
3
|
+
a 7675
|
4
|
+
e 6219
|
5
|
+
n 5169
|
6
|
+
& 4950
|
7
|
+
; 4950
|
8
|
+
l 4674
|
9
|
+
r 4464
|
10
|
+
&i 3206
|
11
|
+
&i; 3206
|
12
|
+
i; 3206
|
13
|
+
s 3206
|
14
|
+
k 3009
|
15
|
+
d 2977
|
16
|
+
t 2442
|
17
|
+
m 2010
|
18
|
+
y 2001
|
19
|
+
u 1885
|
20
|
+
n_ 1725
|
21
|
+
g 1584
|
22
|
+
o 1567
|
23
|
+
b 1470
|
24
|
+
e_ 1426
|
25
|
+
� 1353
|
26
|
+
ar 1273
|
27
|
+
la 1236
|
28
|
+
a_ 1209
|
29
|
+
i_ 1169
|
30
|
+
in 1124
|
31
|
+
_b 1101
|
32
|
+
an 1097
|
33
|
+
er 1073
|
34
|
+
le 1058
|
35
|
+
s; 1036
|
36
|
+
&s; 1036
|
37
|
+
&s 1036
|
38
|
+
;_ 1018
|
39
|
+
de 936
|
40
|
+
;n 918
|
41
|
+
&i;n 917
|
42
|
+
i;n 917
|
43
|
+
,_ 872
|
44
|
+
_, 872
|
45
|
+
_,_ 872
|
46
|
+
, 872
|
47
|
+
i;_ 863
|
48
|
+
&i;_ 863
|
49
|
+
_k 816
|
50
|
+
en 769
|
51
|
+
r_ 762
|
52
|
+
_y 759
|
53
|
+
da 759
|
54
|
+
il 759
|
55
|
+
k_ 750
|
56
|
+
z 739
|
57
|
+
nd 725
|
58
|
+
&g; 708
|
59
|
+
g; 708
|
60
|
+
&g 708
|
61
|
+
ra 697
|
62
|
+
_a 692
|
63
|
+
_d 692
|
64
|
+
_s 676
|
65
|
+
' 673
|
66
|
+
_i 644
|
67
|
+
._ 641
|
68
|
+
. 641
|
69
|
+
_. 637
|
70
|
+
_._ 637
|
71
|
+
c 637
|
72
|
+
ka 635
|
73
|
+
v 632
|
74
|
+
;& 624
|
75
|
+
h 615
|
76
|
+
_g 597
|
77
|
+
ri 596
|
78
|
+
� 596
|
79
|
+
lar 583
|
80
|
+
li 580
|
81
|
+
ma 559
|
82
|
+
ya 555
|
83
|
+
ler 553
|
84
|
+
p 547
|
85
|
+
re 529
|
86
|
+
al 529
|
87
|
+
� 527
|
88
|
+
_t 520
|
89
|
+
ir 508
|
90
|
+
ak 502
|
91
|
+
bi 500
|
92
|
+
;l 480
|
93
|
+
in_ 478
|
94
|
+
di 477
|
95
|
+
r& 468
|
96
|
+
el 453
|
97
|
+
et 449
|
98
|
+
ek 445
|
99
|
+
n& 439
|
100
|
+
_o 439
|
101
|
+
ol 437
|
102
|
+
da_ 434
|
103
|
+
n&i 433
|
104
|
+
n&i; 433
|
105
|
+
ni 429
|
106
|
+
ti 428
|
107
|
+
de_ 425
|
108
|
+
an_ 422
|
109
|
+
eri 421
|
110
|
+
r&i 417
|
111
|
+
r&i; 417
|
112
|
+
s& 413
|
113
|
+
s&i 413
|
114
|
+
s&i; 413
|
115
|
+
ar& 412
|
116
|
+
me 407
|
117
|
+
te 405
|
118
|
+
a& 404
|
119
|
+
i& 390
|
120
|
+
ay 387
|
121
|
+
ne 380
|
122
|
+
_bi 373
|
123
|
+
_ka 368
|
124
|
+
ar&i; 367
|
125
|
+
ar&i 367
|
126
|
+
u_ 363
|
127
|
+
as 363
|
128
|
+
_e 362
|
129
|
+
ta 359
|
130
|
+
&i;l 352
|
131
|
+
i;l 352
|
132
|
+
nda 350
|
133
|
+
ki 347
|
134
|
+
na 346
|
135
|
+
si 343
|
136
|
+
_v 337
|
137
|
+
;&i; 334
|
138
|
+
;&i 334
|
139
|
+
ve 334
|
140
|
+
ara 333
|
141
|
+
en_ 332
|
142
|
+
;i 331
|
143
|
+
on 328
|
144
|
+
un 326
|
145
|
+
l&i; 322
|
146
|
+
l& 322
|
147
|
+
l&i 322
|
148
|
+
leri 322
|
149
|
+
ba 318
|
150
|
+
_m 318
|
151
|
+
ik 315
|
152
|
+
mi 315
|
153
|
+
f 306
|
154
|
+
lar& 302
|
155
|
+
lar&i 302
|
156
|
+
sa 298
|
157
|
+
_h 297
|
158
|
+
ld 296
|
159
|
+
&i;& 290
|
160
|
+
i;& 290
|
161
|
+
_ve 288
|
162
|
+
l_ 287
|
163
|
+
ge 286
|
164
|
+
is 285
|
165
|
+
ed 285
|
166
|
+
i&s; 284
|
167
|
+
i&s 284
|
168
|
+
;r 282
|
169
|
+
_ya 279
|
170
|
+
_ol 279
|
171
|
+
d&i; 278
|
172
|
+
d& 278
|
173
|
+
d&i 278
|
174
|
+
nl 277
|
175
|
+
kl 275
|
176
|
+
;k 274
|
177
|
+
&i;n_ 271
|
178
|
+
;n_ 271
|
179
|
+
i;n_ 271
|
180
|
+
ile 270
|
181
|
+
or 269
|
182
|
+
iy 267
|
183
|
+
a&s 264
|
184
|
+
a&s; 264
|
185
|
+
y&i; 262
|
186
|
+
ad 262
|
187
|
+
y& 262
|
188
|
+
y&i 262
|
189
|
+
ye 259
|
190
|
+
ha 258
|
191
|
+
es 258
|
192
|
+
t& 257
|
193
|
+
t&i 257
|
194
|
+
t&i; 257
|
195
|
+
ini 253
|
196
|
+
;nd 253
|
197
|
+
i;nd 253
|
198
|
+
�r 253
|
199
|
+
&i;nd 253
|
200
|
+
se 248
|
201
|
+
_ge 248
|
202
|
+
i;nda 248
|
203
|
+
;nda 248
|
204
|
+
;n&i; 247
|
205
|
+
i;n& 247
|
206
|
+
;n& 247
|
207
|
+
&i;n& 247
|
208
|
+
i;n&i 247
|
209
|
+
;n&i 247
|
210
|
+
bu 245
|
211
|
+
_' 245
|
212
|
+
_ba 244
|
213
|
+
as&i 242
|
214
|
+
as&i; 242
|
215
|
+
_de 242
|
216
|
+
as& 242
|
217
|
+
at 240
|
218
|
+
am 240
|
219
|
+
nda_ 239
|
220
|
+
ar_ 231
|
221
|
+
ve_ 230
|
222
|
+
rin 230
|
223
|
+
_ve_ 228
|
224
|
+
_bu 227
|
225
|
+
im 227
|
226
|
+
&i;r 226
|
227
|
+
i;r 226
|
228
|
+
ur 221
|
229
|
+
g;&i 220
|
230
|
+
g;& 220
|
231
|
+
&g;& 220
|
232
|
+
yo 220
|
233
|
+
&g;&i 220
|
234
|
+
g;&i; 220
|
235
|
+
ul 215
|
236
|
+
ak_ 215
|
237
|
+
ke 213
|
238
|
+
nu 213
|
239
|
+
erin 211
|
240
|
+
g;i 208
|
241
|
+
&g;i 208
|
242
|
+
lan 207
|
243
|
+
bir 205
|
244
|
+
r&i;n 205
|
245
|
+
nde 202
|
246
|
+
rl 202
|
247
|
+
n&i;_ 201
|
248
|
+
ko 201
|
249
|
+
ca 200
|
250
|
+
m_ 197
|
251
|
+
rd 196
|
252
|
+
t_ 194
|
253
|
+
er_ 194
|
254
|
+
st 193
|
255
|
+
em 193
|
256
|
+
_sa 190
|
257
|
+
lm 189
|
258
|
+
rt 188
|
259
|
+
_� 187
|
260
|
+
i;k 187
|
261
|
+
�n 187
|
262
|
+
ola 187
|
263
|
+
&i;k 187
|
264
|
+
lerin 185
|
265
|
+
ce 185
|
266
|
+
'_ 185
|
267
|
+
;m 183
|
268
|
+
az 183
|
269
|
+
rk 182
|
270
|
+
y� 182
|
271
|
+
;la 181
|
272
|
+
_bir 181
|
273
|
+
ir_ 180
|
274
|
+
n&i;n 180
|
275
|
+
ru 180
|
276
|
+
lu 180
|
277
|
+
;nda_ 178
|
278
|
+
e& 177
|
279
|
+
_� 176
|
280
|
+
_ha 175
|
281
|
+
_ko 173
|
282
|
+
esi 171
|
283
|
+
_� 170
|
284
|
+
ap 170
|
285
|
+
ni_ 168
|
286
|
+
t� 167
|
287
|
+
den 164
|
288
|
+
ind 161
|
289
|
+
di_ 161
|
290
|
+
be 161
|
291
|
+
s&i;n 160
|
292
|
+
nin 159
|
293
|
+
�z 158
|
294
|
+
ri_ 155
|
295
|
+
y&i;l 155
|
296
|
+
_p 154
|
297
|
+
nin_ 153
|
298
|
+
&s;_ 152
|
299
|
+
_y& 152
|
300
|
+
edi 152
|
301
|
+
s;_ 152
|
302
|
+
_y&i; 152
|
303
|
+
_y&i 152
|
304
|
+
yl 151
|
305
|
+
le_ 151
|
306
|
+
inde 150
|
307
|
+
eti 150
|
308
|
+
ala 150
|
309
|
+
&i;&s 149
|
310
|
+
ele 149
|
311
|
+
i;&s; 149
|
312
|
+
;&s; 149
|
313
|
+
;&s 149
|
314
|
+
i;&s 149
|
315
|
+
ek_ 148
|
316
|
+
ere 148
|
317
|
+
�i 147
|
318
|
+
du 145
|
319
|
+
�n 145
|
320
|
+
z_ 144
|
321
|
+
na_ 144
|
322
|
+
eri_ 143
|
323
|
+
ec 142
|
324
|
+
g� 142
|
325
|
+
i;&g; 141
|
326
|
+
s&i;_ 141
|
327
|
+
bir_ 141
|
328
|
+
&i;&g 141
|
329
|
+
i;&g 141
|
330
|
+
ah 141
|
331
|
+
;&g; 141
|
332
|
+
;&g 141
|
333
|
+
_g� 140
|
334
|
+
lar_ 140
|
335
|
+
eli 140
|
336
|
+
a&g; 140
|
337
|
+
a&g 140
|
338
|
+
dan 140
|
339
|
+
ac 140
|
340
|
+
i� 140
|
341
|
+
an& 140
|
342
|
+
u& 139
|
343
|
+
;&g;& 138
|
344
|
+
_y� 138
|
345
|
+
an&i 138
|
346
|
+
an&i; 138
|
347
|
+
pa 138
|
348
|
+
it 137
|
349
|
+
_ola 137
|
350
|
+
_bir_ 136
|
351
|
+
;t 135
|
352
|
+
�r 135
|
353
|
+
ne_ 135
|
354
|
+
ini_ 134
|
355
|
+
lma 134
|
356
|
+
kan 133
|
357
|
+
ab 132
|
358
|
+
to 131
|
359
|
+
ba& 131
|
360
|
+
kar 130
|
361
|
+
r&i;_ 130
|
362
|
+
_ar 129
|
363
|
+
ili 129
|
364
|
+
li_ 129
|
365
|
+
ki_ 128
|
366
|
+
bu_ 127
|
367
|
+
anl 127
|
368
|
+
d� 127
|
369
|
+
ler_ 126
|
370
|
+
_ba& 126
|
371
|
+
kon 126
|
372
|
+
ll 125
|
373
|
+
tl 125
|
374
|
+
ine 125
|
375
|
+
e&g; 124
|
376
|
+
e&g 124
|
377
|
+
_il 124
|
378
|
+
_bu_ 124
|
379
|
+
re_ 124
|
380
|
+
bil 123
|
381
|
+
&s;i 123
|
382
|
+
;&i;n 123
|
383
|
+
s;i 123
|
384
|
+
ede 123
|
385
|
+
zd 123
|
386
|
+
'' 122
|
387
|
+
_da 122
|
388
|
+
_'' 122
|
389
|
+
_t� 122
|
390
|
+
ret 122
|
391
|
+
_-_ 121
|
392
|
+
_''_ 121
|
393
|
+
mas 121
|
394
|
+
''_ 121
|
395
|
+
- 121
|
396
|
+
dan_ 121
|
397
|
+
leri_ 121
|
398
|
+
;u 121
|
399
|
+
_- 121
|
400
|
+
ev 121
|