language_detector 0.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (172) hide show
  1. data/README.rdoc +24 -0
  2. data/Rakefile +18 -0
  3. data/VERSION +1 -0
  4. data/lib/language_detector.rb +232 -0
  5. data/lib/model-fm.yml +52504 -0
  6. data/lib/model-tc.yml +53985 -0
  7. data/lib/textcat_ngrams/afrikaans.lm +400 -0
  8. data/lib/textcat_ngrams/albanian.lm +400 -0
  9. data/lib/textcat_ngrams/amharic-utf.lm +400 -0
  10. data/lib/textcat_ngrams/arabic-iso8859_6.lm +400 -0
  11. data/lib/textcat_ngrams/arabic-windows1256.lm +400 -0
  12. data/lib/textcat_ngrams/armenian.lm +400 -0
  13. data/lib/textcat_ngrams/basque.lm +400 -0
  14. data/lib/textcat_ngrams/belarus-windows1251.lm +400 -0
  15. data/lib/textcat_ngrams/bosnian.lm +400 -0
  16. data/lib/textcat_ngrams/breton.lm +400 -0
  17. data/lib/textcat_ngrams/bulgarian-iso8859_5.lm +400 -0
  18. data/lib/textcat_ngrams/catalan.lm +400 -0
  19. data/lib/textcat_ngrams/chinese-big5.lm +400 -0
  20. data/lib/textcat_ngrams/chinese-gb2312.lm +400 -0
  21. data/lib/textcat_ngrams/croatian-ascii.lm +400 -0
  22. data/lib/textcat_ngrams/czech-iso8859_2.lm +400 -0
  23. data/lib/textcat_ngrams/danish.lm +400 -0
  24. data/lib/textcat_ngrams/dutch.lm +400 -0
  25. data/lib/textcat_ngrams/english.lm +400 -0
  26. data/lib/textcat_ngrams/esperanto.lm +400 -0
  27. data/lib/textcat_ngrams/estonian.lm +400 -0
  28. data/lib/textcat_ngrams/finnish.lm +400 -0
  29. data/lib/textcat_ngrams/french.lm +400 -0
  30. data/lib/textcat_ngrams/frisian.lm +400 -0
  31. data/lib/textcat_ngrams/georgian.lm +400 -0
  32. data/lib/textcat_ngrams/german.lm +400 -0
  33. data/lib/textcat_ngrams/greek-iso8859-7.lm +400 -0
  34. data/lib/textcat_ngrams/hebrew-iso8859_8.lm +400 -0
  35. data/lib/textcat_ngrams/hindi.lm +400 -0
  36. data/lib/textcat_ngrams/hungarian.lm +400 -0
  37. data/lib/textcat_ngrams/icelandic.lm +400 -0
  38. data/lib/textcat_ngrams/indonesian.lm +400 -0
  39. data/lib/textcat_ngrams/irish.lm +400 -0
  40. data/lib/textcat_ngrams/italian.lm +400 -0
  41. data/lib/textcat_ngrams/japanese-euc_jp.lm +400 -0
  42. data/lib/textcat_ngrams/japanese-shift_jis.lm +400 -0
  43. data/lib/textcat_ngrams/korean.lm +400 -0
  44. data/lib/textcat_ngrams/latin.lm +400 -0
  45. data/lib/textcat_ngrams/latvian.lm +400 -0
  46. data/lib/textcat_ngrams/lithuanian.lm +400 -0
  47. data/lib/textcat_ngrams/malay.lm +400 -0
  48. data/lib/textcat_ngrams/manx.lm +400 -0
  49. data/lib/textcat_ngrams/marathi.lm +400 -0
  50. data/lib/textcat_ngrams/mingo.lm +400 -0
  51. data/lib/textcat_ngrams/nepali.lm +400 -0
  52. data/lib/textcat_ngrams/norwegian.lm +400 -0
  53. data/lib/textcat_ngrams/persian.lm +400 -0
  54. data/lib/textcat_ngrams/polish.lm +400 -0
  55. data/lib/textcat_ngrams/portuguese.lm +400 -0
  56. data/lib/textcat_ngrams/quechua.lm +400 -0
  57. data/lib/textcat_ngrams/romanian.lm +400 -0
  58. data/lib/textcat_ngrams/rumantsch.lm +400 -0
  59. data/lib/textcat_ngrams/russian-iso8859_5.lm +400 -0
  60. data/lib/textcat_ngrams/russian-koi8_r.lm +400 -0
  61. data/lib/textcat_ngrams/russian-windows1251.lm +400 -0
  62. data/lib/textcat_ngrams/sanskrit.lm +400 -0
  63. data/lib/textcat_ngrams/scots.lm +400 -0
  64. data/lib/textcat_ngrams/scots_gaelic.lm +400 -0
  65. data/lib/textcat_ngrams/serbian-ascii.lm +400 -0
  66. data/lib/textcat_ngrams/slovak-ascii.lm +400 -0
  67. data/lib/textcat_ngrams/slovak-windows1250.lm +400 -0
  68. data/lib/textcat_ngrams/slovenian-ascii.lm +400 -0
  69. data/lib/textcat_ngrams/slovenian-iso8859_2.lm +400 -0
  70. data/lib/textcat_ngrams/spanish.lm +400 -0
  71. data/lib/textcat_ngrams/swahili.lm +400 -0
  72. data/lib/textcat_ngrams/swedish.lm +400 -0
  73. data/lib/textcat_ngrams/tagalog.lm +400 -0
  74. data/lib/textcat_ngrams/tamil.lm +400 -0
  75. data/lib/textcat_ngrams/thai.lm +400 -0
  76. data/lib/textcat_ngrams/turkish.lm +400 -0
  77. data/lib/textcat_ngrams/ukrainian-koi8_u.lm +400 -0
  78. data/lib/textcat_ngrams/vietnamese.lm +400 -0
  79. data/lib/textcat_ngrams/welsh.lm +400 -0
  80. data/lib/textcat_ngrams/yiddish-utf.lm +400 -0
  81. data/lib/training_data/ar-utf8.txt +54 -0
  82. data/lib/training_data/bg-utf8.txt +26 -0
  83. data/lib/training_data/cs-utf8.txt +48 -0
  84. data/lib/training_data/da-utf8.txt +159 -0
  85. data/lib/training_data/de-utf8.txt +569 -0
  86. data/lib/training_data/el-utf8.txt +48 -0
  87. data/lib/training_data/en-utf8.txt +81 -0
  88. data/lib/training_data/es-utf8.txt +185 -0
  89. data/lib/training_data/et-utf8.txt +50 -0
  90. data/lib/training_data/fa-utf8.txt +42 -0
  91. data/lib/training_data/fi-utf8.txt +83 -0
  92. data/lib/training_data/fr-utf8.txt +191 -0
  93. data/lib/training_data/fy-utf8.txt +22 -0
  94. data/lib/training_data/ga-utf8.txt +109 -0
  95. data/lib/training_data/he-utf8.txt +116 -0
  96. data/lib/training_data/hi-utf8.txt +49 -0
  97. data/lib/training_data/hr-utf8.txt +80 -0
  98. data/lib/training_data/hu-utf8.txt +87 -0
  99. data/lib/training_data/io-utf8.txt +41 -0
  100. data/lib/training_data/is-utf8.txt +94 -0
  101. data/lib/training_data/it-utf8.txt +228 -0
  102. data/lib/training_data/ja-utf8.txt +200 -0
  103. data/lib/training_data/ko-utf8.txt +147 -0
  104. data/lib/training_data/nl-utf8.txt +215 -0
  105. data/lib/training_data/no-utf8.txt +281 -0
  106. data/lib/training_data/pl-utf8.txt +120 -0
  107. data/lib/training_data/pt-utf8.txt +214 -0
  108. data/lib/training_data/ro-utf8.txt +66 -0
  109. data/lib/training_data/ru-utf8.txt +310 -0
  110. data/lib/training_data/sl-utf8.txt +263 -0
  111. data/lib/training_data/sv-utf8.txt +174 -0
  112. data/lib/training_data/th-utf8.txt +49 -0
  113. data/lib/training_data/tk-utf8.txt +101 -0
  114. data/lib/training_data/todo/af.txt +114 -0
  115. data/lib/training_data/todo/amharic-utf.txt +95 -0
  116. data/lib/training_data/todo/arabic-windows1256.txt +157 -0
  117. data/lib/training_data/todo/armenian.txt +86 -0
  118. data/lib/training_data/todo/basque.txt +136 -0
  119. data/lib/training_data/todo/belarus-windows1251.txt +97 -0
  120. data/lib/training_data/todo/bosnian.txt +97 -0
  121. data/lib/training_data/todo/breton.txt +159 -0
  122. data/lib/training_data/todo/bulgarian-iso8859_5.txt +115 -0
  123. data/lib/training_data/todo/catalan.txt +93 -0
  124. data/lib/training_data/todo/croatian-ascii.txt +104 -0
  125. data/lib/training_data/todo/esperanto.txt +95 -0
  126. data/lib/training_data/todo/estonian.txt +218 -0
  127. data/lib/training_data/todo/frisian.txt +99 -0
  128. data/lib/training_data/todo/georgian.txt +86 -0
  129. data/lib/training_data/todo/greek-iso8859-7.txt +139 -0
  130. data/lib/training_data/todo/hawaian.txt +108 -0
  131. data/lib/training_data/todo/hebrew-iso8859_8.txt +79 -0
  132. data/lib/training_data/todo/hindi.txt +77 -0
  133. data/lib/training_data/todo/hungarian.txt +102 -0
  134. data/lib/training_data/todo/icelandic.txt +131 -0
  135. data/lib/training_data/todo/indonesian.txt +93 -0
  136. data/lib/training_data/todo/irish.txt +209 -0
  137. data/lib/training_data/todo/latin.txt +120 -0
  138. data/lib/training_data/todo/latvian.txt +126 -0
  139. data/lib/training_data/todo/lithuanian.txt +99 -0
  140. data/lib/training_data/todo/malay.txt +108 -0
  141. data/lib/training_data/todo/manx.txt +78 -0
  142. data/lib/training_data/todo/marathi.txt +100 -0
  143. data/lib/training_data/todo/mf.txt +100 -0
  144. data/lib/training_data/todo/middle_frisian.txt +102 -0
  145. data/lib/training_data/todo/mingo.txt +146 -0
  146. data/lib/training_data/todo/nepali.txt +131 -0
  147. data/lib/training_data/todo/persian.txt +73 -0
  148. data/lib/training_data/todo/quechua.txt +108 -0
  149. data/lib/training_data/todo/romanian.txt +103 -0
  150. data/lib/training_data/todo/rumantsch.txt +110 -0
  151. data/lib/training_data/todo/sanskrit.txt +135 -0
  152. data/lib/training_data/todo/scots.txt +490 -0
  153. data/lib/training_data/todo/scots_gaelic.txt +93 -0
  154. data/lib/training_data/todo/serbian-ascii.txt +121 -0
  155. data/lib/training_data/todo/slovak-ascii.txt +102 -0
  156. data/lib/training_data/todo/slovak-windows1250.txt +115 -0
  157. data/lib/training_data/todo/slovenian-ascii.txt +100 -0
  158. data/lib/training_data/todo/slovenian-iso8859_2.txt +96 -0
  159. data/lib/training_data/todo/sq.txt +110 -0
  160. data/lib/training_data/todo/swahili.txt +120 -0
  161. data/lib/training_data/todo/tagalog.txt +135 -0
  162. data/lib/training_data/todo/tamil.txt +123 -0
  163. data/lib/training_data/todo/turkish.txt +117 -0
  164. data/lib/training_data/todo/ukrainian-koi8_r.txt +214 -0
  165. data/lib/training_data/todo/vietnamese.txt +92 -0
  166. data/lib/training_data/todo/welsh.txt +148 -0
  167. data/lib/training_data/todo/yiddish-utf.txt +83 -0
  168. data/lib/training_data/uk-utf8.txt +75 -0
  169. data/lib/training_data/vi-utf8.txt +47 -0
  170. data/lib/training_data/zh-utf8.txt +228 -0
  171. data/test/language_detector_test.rb +78 -0
  172. metadata +232 -0
@@ -0,0 +1,400 @@
1
+ _ 20326
2
+ e 6617
3
+ t 4843
4
+ o 3834
5
+ n 3653
6
+ i 3602
7
+ a 3433
8
+ s 2945
9
+ r 2921
10
+ h 2507
11
+ e_ 2000
12
+ d 1816
13
+ _t 1785
14
+ c 1639
15
+ l 1635
16
+ th 1535
17
+ he 1351
18
+ _th 1333
19
+ u 1309
20
+ f 1253
21
+ m 1175
22
+ p 1151
23
+ _a 1145
24
+ the 1142
25
+ _the 1060
26
+ s_ 978
27
+ er 968
28
+ _o 967
29
+ he_ 928
30
+ d_ 888
31
+ t_ 885
32
+ the_ 844
33
+ _the_ 843
34
+ on 842
35
+ in 817
36
+ y 783
37
+ n_ 773
38
+ b 761
39
+ re 754
40
+ , 734
41
+ ,_ 732
42
+ an 732
43
+ g 728
44
+ w 718
45
+ _i 707
46
+ en 676
47
+ f_ 599
48
+ y_ 595
49
+ of 594
50
+ _of 592
51
+ es 589
52
+ ti 587
53
+ v 580
54
+ _of_ 575
55
+ of_ 575
56
+ nd 568
57
+ at 549
58
+ r_ 540
59
+ _w 534
60
+ it 522
61
+ ed 496
62
+ _p 494
63
+ nt 485
64
+ _c 462
65
+ o_ 457
66
+ io 450
67
+ _an 439
68
+ te 432
69
+ or 425
70
+ _b 418
71
+ nd_ 407
72
+ to 406
73
+ st 402
74
+ is 401
75
+ _s 396
76
+ _in 389
77
+ ion 385
78
+ and 385
79
+ de 384
80
+ ve 382
81
+ ha 375
82
+ ar 366
83
+ _m 361
84
+ and_ 360
85
+ _and 360
86
+ _and_ 358
87
+ se 353
88
+ _to 347
89
+ me 346
90
+ to_ 344
91
+ ed_ 339
92
+ . 330
93
+ be 329
94
+ _f 329
95
+ ._ 329
96
+ _to_ 320
97
+ co 317
98
+ ic 316
99
+ ns 308
100
+ al 307
101
+ le 304
102
+ ou 304
103
+ ce 293
104
+ ent 279
105
+ l_ 278
106
+ _co 277
107
+ tio 275
108
+ on_ 274
109
+ _d 274
110
+ tion 268
111
+ ri 266
112
+ _e 264
113
+ ng 253
114
+ hi 251
115
+ er_ 249
116
+ ea 246
117
+ as 245
118
+ _be 242
119
+ pe 242
120
+ h_ 234
121
+ _r 232
122
+ ec 227
123
+ ch 223
124
+ ro 222
125
+ ct 220
126
+ _h 219
127
+ pr 217
128
+ in_ 217
129
+ ne 214
130
+ ll 214
131
+ rt 213
132
+ s,_ 210
133
+ s, 210
134
+ li 209
135
+ ra 208
136
+ T 207
137
+ wh 204
138
+ a_ 203
139
+ ac 201
140
+ _wh 199
141
+ _n 196
142
+ ts 196
143
+ di 196
144
+ es_ 195
145
+ si 194
146
+ re_ 193
147
+ at_ 192
148
+ nc 192
149
+ ie 190
150
+ _a_ 188
151
+ _in_ 185
152
+ ing 184
153
+ us 182
154
+ _re 182
155
+ g_ 179
156
+ ng_ 178
157
+ op 178
158
+ con 177
159
+ tha 175
160
+ _l 174
161
+ _tha 174
162
+ ver 173
163
+ ma 173
164
+ ion_ 171
165
+ _con 171
166
+ ci 170
167
+ ons 170
168
+ _it 170
169
+ po 169
170
+ ere 168
171
+ is_ 167
172
+ ta 167
173
+ la 166
174
+ _pr 165
175
+ fo 164
176
+ ho 164
177
+ ir 162
178
+ ss 161
179
+ men 160
180
+ be_ 160
181
+ un 159
182
+ ty 159
183
+ _be_ 158
184
+ ing_ 157
185
+ om 156
186
+ ot 156
187
+ hat 155
188
+ ly 155
189
+ _g 155
190
+ em 153
191
+ _T 151
192
+ rs 150
193
+ mo 148
194
+ ch_ 148
195
+ wi 147
196
+ we 147
197
+ ad 147
198
+ ts_ 145
199
+ res 143
200
+ _wi 143
201
+ I 143
202
+ hat_ 142
203
+ ei 141
204
+ ly_ 141
205
+ ni 140
206
+ os 140
207
+ ca 139
208
+ ur 139
209
+ A 138
210
+ ut 138
211
+ that 138
212
+ _that 137
213
+ ati 137
214
+ _fo 137
215
+ st_ 137
216
+ il 136
217
+ or_ 136
218
+ for 136
219
+ pa 136
220
+ ul 135
221
+ ate 135
222
+ ter 134
223
+ it_ 134
224
+ nt_ 133
225
+ that_ 132
226
+ _ha 129
227
+ al_ 128
228
+ el 128
229
+ as_ 127
230
+ ll_ 127
231
+ _ma 125
232
+ no 124
233
+ ment 124
234
+ an_ 124
235
+ tion_ 122
236
+ su 122
237
+ bl 122
238
+ _de 122
239
+ nce 120
240
+ pl 120
241
+ fe 119
242
+ tr 118
243
+ so 118
244
+ int 115
245
+ ov 114
246
+ e, 114
247
+ e,_ 114
248
+ _u 113
249
+ ent_ 113
250
+ Th 113
251
+ her 113
252
+ j 112
253
+ atio 112
254
+ ation 112
255
+ _Th 111
256
+ le_ 110
257
+ ai 110
258
+ _it_ 110
259
+ _on 110
260
+ _for 109
261
+ ect 109
262
+ k 109
263
+ hic 108
264
+ est 108
265
+ der 107
266
+ tu 107
267
+ na 106
268
+ _by_ 106
269
+ by_ 106
270
+ E 106
271
+ by 106
272
+ _by 106
273
+ ve_ 106
274
+ _di 106
275
+ en_ 104
276
+ vi 104
277
+ m_ 103
278
+ _whi 102
279
+ iv 102
280
+ whi 102
281
+ ns_ 102
282
+ _A 101
283
+ ich 100
284
+ ge 100
285
+ pro 99
286
+ ess 99
287
+ _whic 99
288
+ ers 99
289
+ hich 99
290
+ ce_ 99
291
+ which 99
292
+ whic 99
293
+ all 98
294
+ ove 98
295
+ _is 98
296
+ ich_ 97
297
+ ee 97
298
+ hich_ 97
299
+ n,_ 96
300
+ n, 96
301
+ im 95
302
+ ir_ 94
303
+ hei 94
304
+ ions 94
305
+ sti 94
306
+ se_ 94
307
+ per 93
308
+ The 93
309
+ _pa 93
310
+ heir 93
311
+ id 93
312
+ eir 93
313
+ eir_ 93
314
+ ig 93
315
+ heir_ 93
316
+ _no 93
317
+ ev 93
318
+ era 92
319
+ _int 92
320
+ ted 91
321
+ _The 91
322
+ ies 91
323
+ art 91
324
+ thei 90
325
+ _ar 90
326
+ _thei 90
327
+ their 90
328
+ _pro 90
329
+ et 89
330
+ _pe 88
331
+ _mo 88
332
+ ther 88
333
+ x 87
334
+ gh 87
335
+ S 87
336
+ _is_ 87
337
+ ol 87
338
+ ty_ 87
339
+ _I 86
340
+ nde 86
341
+ am 86
342
+ rn 86
343
+ nte 86
344
+ mp 85
345
+ _su 84
346
+ _we 84
347
+ par 84
348
+ _v 84
349
+ pu 82
350
+ his 82
351
+ ow 82
352
+ mi 82
353
+ go 81
354
+ N 81
355
+ ue 81
356
+ ple 81
357
+ ep 80
358
+ ab 80
359
+ ;_ 80
360
+ ; 80
361
+ ex 80
362
+ ain 80
363
+ over 80
364
+ _un 79
365
+ q 79
366
+ qu 79
367
+ pp 79
368
+ ith 79
369
+ ry 79
370
+ _as 79
371
+ ber 79
372
+ ub 78
373
+ av 78
374
+ uc 78
375
+ s._ 77
376
+ s. 77
377
+ enc 77
378
+ are 77
379
+ iti 77
380
+ gr 76
381
+ his_ 76
382
+ ua 76
383
+ part 76
384
+ ff 75
385
+ eve 75
386
+ O 75
387
+ rea 74
388
+ ous 74
389
+ ia 74
390
+ The_ 73
391
+ ag 73
392
+ mb 73
393
+ _go 73
394
+ fa 72
395
+ on,_ 72
396
+ ern 72
397
+ t,_ 72
398
+ on, 72
399
+ t, 72
400
+ _me 71
@@ -0,0 +1,400 @@
1
+ _ 57050
2
+ a 16035
3
+ i 12706
4
+ e 12227
5
+ o 12102
6
+ n 10393
7
+ s 8344
8
+ l 7707
9
+ r 7492
10
+ t 7134
11
+ k 5376
12
+ u 4558
13
+ j 3946
14
+ a_ 3875
15
+ m 3783
16
+ d 3710
17
+ p 3693
18
+ la 2840
19
+ s_ 2769
20
+ e_ 2751
21
+ . 2706
22
+ _l 2635
23
+ _k 2619
24
+ v 2531
25
+ n_ 2504
26
+ o_ 2444
27
+ i_ 2333
28
+ ._ 2278
29
+ on 2238
30
+ , 2193
31
+ ,_ 2182
32
+ _la 2100
33
+ en 2080
34
+ j_ 2050
35
+ as 2028
36
+ la_ 2012
37
+ ta 1956
38
+ _la_ 1907
39
+ an 1882
40
+ _p 1850
41
+ g 1831
42
+ _e 1791
43
+ _d 1778
44
+ is 1737
45
+ aj 1658
46
+ st 1635
47
+ _s 1575
48
+ c 1526
49
+ de 1517
50
+ oj 1498
51
+ er 1476
52
+ ti 1456
53
+ f 1443
54
+ _a 1442
55
+ b 1427
56
+ ro 1379
57
+ _m 1351
58
+ ra 1341
59
+ nt 1293
60
+ ka 1270
61
+ ri 1258
62
+ al 1249
63
+ as_ 1248
64
+ aj_ 1213
65
+ to 1209
66
+ _de 1203
67
+ _t 1200
68
+ te 1179
69
+ _n 1176
70
+ is_ 1171
71
+ in 1151
72
+ ko 1145
73
+ or 1114
74
+ es 1083
75
+ re 1034
76
+ ia 1029
77
+ li 1022
78
+ de_ 1016
79
+ _de_ 979
80
+ ar 974
81
+ _v 966
82
+ vi 942
83
+ lo 932
84
+ x 928
85
+ io 917
86
+ ne 855
87
+ no 848
88
+ ni 843
89
+ mi 835
90
+ ma 819
91
+ _ka 816
92
+ el 815
93
+ pr 771
94
+ z 744
95
+ un 734
96
+ l_ 732
97
+ po 730
98
+ _f 725
99
+ � 724
100
+ est 691
101
+ na 687
102
+ ki 679
103
+ kaj 676
104
+ si 665
105
+ u_ 663
106
+ kaj_ 660
107
+ " 654
108
+ tas 651
109
+ le 650
110
+ oj_ 648
111
+ _i 643
112
+ tr 642
113
+ _pr 630
114
+ _es 628
115
+ jn 626
116
+ pe 618
117
+ _kaj 616
118
+ ig 616
119
+ _kaj_ 611
120
+ do 608
121
+ sta 606
122
+ on_ 602
123
+ ek 602
124
+ ci 597
125
+ r_ 595
126
+ � 594
127
+ _r 593
128
+ il 592
129
+ _est 587
130
+ di 586
131
+ am 586
132
+ _mi 582
133
+ a� 578
134
+ _vi 577
135
+ mo 575
136
+ ant 565
137
+ _ne 562
138
+ en_ 561
139
+ o. 559
140
+ � 543
141
+ iu 538
142
+ o, 529
143
+ ur 527
144
+ o._ 527
145
+ om 525
146
+ o,_ 524
147
+ at 521
148
+ va 521
149
+ - 519
150
+ _en 518
151
+ : 513
152
+ :_ 512
153
+ _ti 500
154
+ M 496
155
+ h 488
156
+ nd 484
157
+ me 484
158
+ _al 481
159
+ _ko 479
160
+ ve 478
161
+ ie 478
162
+ _ki 473
163
+ it 473
164
+ L 466
165
+ _b 465
166
+ se 462
167
+ em 452
168
+ ol 450
169
+ nta 449
170
+ tu 448
171
+ ik 444
172
+ ov 443
173
+ da 443
174
+ _M 440
175
+ _po 439
176
+ tas_ 438
177
+ ne_ 437
178
+ et 437
179
+ _ma 436
180
+ _en_ 435
181
+ su 429
182
+ pl 426
183
+ _L 425
184
+ pa 420
185
+ _o 417
186
+ vo 408
187
+ an_ 407
188
+ ro_ 406
189
+ sti 406
190
+ nu 399
191
+ kon 396
192
+ stas 391
193
+ m_ 391
194
+ ir 388
195
+ n. 386
196
+ fa 386
197
+ jn_ 382
198
+ ku 382
199
+ os 376
200
+ ke 375
201
+ n, 375
202
+ esta 374
203
+ n,_ 372
204
+ _su 362
205
+ ta_ 362
206
+ stas_ 359
207
+ xi 359
208
+ Mi 358
209
+ _ne_ 356
210
+ al_ 355
211
+ nk 353
212
+ so 353
213
+ n._ 352
214
+ id 349
215
+ _g 348
216
+ estas 347
217
+ ga 346
218
+ _h 345
219
+ per 345
220
+ _Mi 340
221
+ ok 339
222
+ K 339
223
+ mp 337
224
+ _esta 337
225
+ s,_ 335
226
+ s, 335
227
+ _se 333
228
+ anta 332
229
+ ul 326
230
+ ran 325
231
+ _" 323
232
+ �_ 322
233
+ te_ 320
234
+ ak 320
235
+ a�_ 320
236
+ ed 320
237
+ rt 319
238
+ ojn 318
239
+ gi 318
240
+ _� 317
241
+ tis 316
242
+ gx 316
243
+ mal 316
244
+ ia_ 315
245
+ ks 310
246
+ _al_ 310
247
+ mi_ 309
248
+ S 309
249
+ lu 309
250
+ ns 308
251
+ kt 305
252
+ io_ 302
253
+ ent 300
254
+ ? 300
255
+ _K 300
256
+ ec 300
257
+ el_ 299
258
+ _- 299
259
+ li_ 299
260
+ E 298
261
+ � 298
262
+ _li 297
263
+ fo 296
264
+ ter 296
265
+ _re 296
266
+ A 295
267
+ nto 294
268
+ vi_ 292
269
+ La 292
270
+ _mal 290
271
+ nte 288
272
+ sp 287
273
+ sa 287
274
+ _mi_ 279
275
+ ut 278
276
+ op 278
277
+ _ke 277
278
+ bo 277
279
+ ajn 276
280
+ un_ 276
281
+ T 274
282
+ to_ 272
283
+ -_ 272
284
+ bl 272
285
+ _an 271
286
+ _La 271
287
+ �i 269
288
+ _S 268
289
+ _pl 267
290
+ _fa 266
291
+ ni_ 266
292
+ La_ 265
293
+ _E 264
294
+ N 263
295
+ tis_ 263
296
+ _tr 263
297
+ ' 262
298
+ ! 262
299
+ _-_ 262
300
+ pro 261
301
+ iu_ 261
302
+ i� 261
303
+ nc 260
304
+ _si 259
305
+ du 257
306
+ _kon 256
307
+ ru 255
308
+ _vi_ 254
309
+ _j 253
310
+ ce 251
311
+ ke_ 249
312
+ ap 248
313
+ us 247
314
+ be 247
315
+ im 247
316
+ B 246
317
+ _ku 246
318
+ _La_ 246
319
+ tra 245
320
+ ad 245
321
+ uj 245
322
+ ac 245
323
+ ita 243
324
+ pre 242
325
+ _pro 242
326
+ co 241
327
+ rm 241
328
+ _ni 238
329
+ _pe 236
330
+ ?_ 234
331
+ on. 234
332
+ toj 234
333
+ "_ 234
334
+ j. 234
335
+ _ke_ 233
336
+ s. 232
337
+ _A 231
338
+ av 230
339
+ ri_ 230
340
+ _el 229
341
+ por 229
342
+ ` 224
343
+ ev 224
344
+ las 223
345
+ P 223
346
+ j._ 221
347
+ eni 220
348
+ _T 220
349
+ _B 219
350
+ j,_ 218
351
+ j, 218
352
+ era 217
353
+ _in 216
354
+ on._ 216
355
+ cx 216
356
+ _N 215
357
+ ion 215
358
+ ab 215
359
+ .. 214
360
+ ) 213
361
+ fi 213
362
+ or_ 212
363
+ pri 212
364
+ s._ 212
365
+ _por 210
366
+ ez 210
367
+ in_ 210
368
+ am_ 209
369
+ on,_ 209
370
+ ll 209
371
+ �i 209
372
+ on, 209
373
+ _ve 208
374
+ ris 208
375
+ esti 208
376
+ !_ 207
377
+ men 206
378
+ vas 205
379
+ iel 204
380
+ taj 203
381
+ _c 201
382
+ aro 201
383
+ ank 200
384
+ _pri 200
385
+ jo 200
386
+ ja 200
387
+ ont 200
388
+ lt 199
389
+ _P 199
390
+ igi 199
391
+ _pa 197
392
+ oj. 197
393
+ ( 196
394
+ au 195
395
+ oro 195
396
+ ng 195
397
+ _( 194
398
+ sto 194
399
+ ast 194
400
+ ag 193