language_detector 0.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (172) hide show
  1. data/README.rdoc +24 -0
  2. data/Rakefile +18 -0
  3. data/VERSION +1 -0
  4. data/lib/language_detector.rb +232 -0
  5. data/lib/model-fm.yml +52504 -0
  6. data/lib/model-tc.yml +53985 -0
  7. data/lib/textcat_ngrams/afrikaans.lm +400 -0
  8. data/lib/textcat_ngrams/albanian.lm +400 -0
  9. data/lib/textcat_ngrams/amharic-utf.lm +400 -0
  10. data/lib/textcat_ngrams/arabic-iso8859_6.lm +400 -0
  11. data/lib/textcat_ngrams/arabic-windows1256.lm +400 -0
  12. data/lib/textcat_ngrams/armenian.lm +400 -0
  13. data/lib/textcat_ngrams/basque.lm +400 -0
  14. data/lib/textcat_ngrams/belarus-windows1251.lm +400 -0
  15. data/lib/textcat_ngrams/bosnian.lm +400 -0
  16. data/lib/textcat_ngrams/breton.lm +400 -0
  17. data/lib/textcat_ngrams/bulgarian-iso8859_5.lm +400 -0
  18. data/lib/textcat_ngrams/catalan.lm +400 -0
  19. data/lib/textcat_ngrams/chinese-big5.lm +400 -0
  20. data/lib/textcat_ngrams/chinese-gb2312.lm +400 -0
  21. data/lib/textcat_ngrams/croatian-ascii.lm +400 -0
  22. data/lib/textcat_ngrams/czech-iso8859_2.lm +400 -0
  23. data/lib/textcat_ngrams/danish.lm +400 -0
  24. data/lib/textcat_ngrams/dutch.lm +400 -0
  25. data/lib/textcat_ngrams/english.lm +400 -0
  26. data/lib/textcat_ngrams/esperanto.lm +400 -0
  27. data/lib/textcat_ngrams/estonian.lm +400 -0
  28. data/lib/textcat_ngrams/finnish.lm +400 -0
  29. data/lib/textcat_ngrams/french.lm +400 -0
  30. data/lib/textcat_ngrams/frisian.lm +400 -0
  31. data/lib/textcat_ngrams/georgian.lm +400 -0
  32. data/lib/textcat_ngrams/german.lm +400 -0
  33. data/lib/textcat_ngrams/greek-iso8859-7.lm +400 -0
  34. data/lib/textcat_ngrams/hebrew-iso8859_8.lm +400 -0
  35. data/lib/textcat_ngrams/hindi.lm +400 -0
  36. data/lib/textcat_ngrams/hungarian.lm +400 -0
  37. data/lib/textcat_ngrams/icelandic.lm +400 -0
  38. data/lib/textcat_ngrams/indonesian.lm +400 -0
  39. data/lib/textcat_ngrams/irish.lm +400 -0
  40. data/lib/textcat_ngrams/italian.lm +400 -0
  41. data/lib/textcat_ngrams/japanese-euc_jp.lm +400 -0
  42. data/lib/textcat_ngrams/japanese-shift_jis.lm +400 -0
  43. data/lib/textcat_ngrams/korean.lm +400 -0
  44. data/lib/textcat_ngrams/latin.lm +400 -0
  45. data/lib/textcat_ngrams/latvian.lm +400 -0
  46. data/lib/textcat_ngrams/lithuanian.lm +400 -0
  47. data/lib/textcat_ngrams/malay.lm +400 -0
  48. data/lib/textcat_ngrams/manx.lm +400 -0
  49. data/lib/textcat_ngrams/marathi.lm +400 -0
  50. data/lib/textcat_ngrams/mingo.lm +400 -0
  51. data/lib/textcat_ngrams/nepali.lm +400 -0
  52. data/lib/textcat_ngrams/norwegian.lm +400 -0
  53. data/lib/textcat_ngrams/persian.lm +400 -0
  54. data/lib/textcat_ngrams/polish.lm +400 -0
  55. data/lib/textcat_ngrams/portuguese.lm +400 -0
  56. data/lib/textcat_ngrams/quechua.lm +400 -0
  57. data/lib/textcat_ngrams/romanian.lm +400 -0
  58. data/lib/textcat_ngrams/rumantsch.lm +400 -0
  59. data/lib/textcat_ngrams/russian-iso8859_5.lm +400 -0
  60. data/lib/textcat_ngrams/russian-koi8_r.lm +400 -0
  61. data/lib/textcat_ngrams/russian-windows1251.lm +400 -0
  62. data/lib/textcat_ngrams/sanskrit.lm +400 -0
  63. data/lib/textcat_ngrams/scots.lm +400 -0
  64. data/lib/textcat_ngrams/scots_gaelic.lm +400 -0
  65. data/lib/textcat_ngrams/serbian-ascii.lm +400 -0
  66. data/lib/textcat_ngrams/slovak-ascii.lm +400 -0
  67. data/lib/textcat_ngrams/slovak-windows1250.lm +400 -0
  68. data/lib/textcat_ngrams/slovenian-ascii.lm +400 -0
  69. data/lib/textcat_ngrams/slovenian-iso8859_2.lm +400 -0
  70. data/lib/textcat_ngrams/spanish.lm +400 -0
  71. data/lib/textcat_ngrams/swahili.lm +400 -0
  72. data/lib/textcat_ngrams/swedish.lm +400 -0
  73. data/lib/textcat_ngrams/tagalog.lm +400 -0
  74. data/lib/textcat_ngrams/tamil.lm +400 -0
  75. data/lib/textcat_ngrams/thai.lm +400 -0
  76. data/lib/textcat_ngrams/turkish.lm +400 -0
  77. data/lib/textcat_ngrams/ukrainian-koi8_u.lm +400 -0
  78. data/lib/textcat_ngrams/vietnamese.lm +400 -0
  79. data/lib/textcat_ngrams/welsh.lm +400 -0
  80. data/lib/textcat_ngrams/yiddish-utf.lm +400 -0
  81. data/lib/training_data/ar-utf8.txt +54 -0
  82. data/lib/training_data/bg-utf8.txt +26 -0
  83. data/lib/training_data/cs-utf8.txt +48 -0
  84. data/lib/training_data/da-utf8.txt +159 -0
  85. data/lib/training_data/de-utf8.txt +569 -0
  86. data/lib/training_data/el-utf8.txt +48 -0
  87. data/lib/training_data/en-utf8.txt +81 -0
  88. data/lib/training_data/es-utf8.txt +185 -0
  89. data/lib/training_data/et-utf8.txt +50 -0
  90. data/lib/training_data/fa-utf8.txt +42 -0
  91. data/lib/training_data/fi-utf8.txt +83 -0
  92. data/lib/training_data/fr-utf8.txt +191 -0
  93. data/lib/training_data/fy-utf8.txt +22 -0
  94. data/lib/training_data/ga-utf8.txt +109 -0
  95. data/lib/training_data/he-utf8.txt +116 -0
  96. data/lib/training_data/hi-utf8.txt +49 -0
  97. data/lib/training_data/hr-utf8.txt +80 -0
  98. data/lib/training_data/hu-utf8.txt +87 -0
  99. data/lib/training_data/io-utf8.txt +41 -0
  100. data/lib/training_data/is-utf8.txt +94 -0
  101. data/lib/training_data/it-utf8.txt +228 -0
  102. data/lib/training_data/ja-utf8.txt +200 -0
  103. data/lib/training_data/ko-utf8.txt +147 -0
  104. data/lib/training_data/nl-utf8.txt +215 -0
  105. data/lib/training_data/no-utf8.txt +281 -0
  106. data/lib/training_data/pl-utf8.txt +120 -0
  107. data/lib/training_data/pt-utf8.txt +214 -0
  108. data/lib/training_data/ro-utf8.txt +66 -0
  109. data/lib/training_data/ru-utf8.txt +310 -0
  110. data/lib/training_data/sl-utf8.txt +263 -0
  111. data/lib/training_data/sv-utf8.txt +174 -0
  112. data/lib/training_data/th-utf8.txt +49 -0
  113. data/lib/training_data/tk-utf8.txt +101 -0
  114. data/lib/training_data/todo/af.txt +114 -0
  115. data/lib/training_data/todo/amharic-utf.txt +95 -0
  116. data/lib/training_data/todo/arabic-windows1256.txt +157 -0
  117. data/lib/training_data/todo/armenian.txt +86 -0
  118. data/lib/training_data/todo/basque.txt +136 -0
  119. data/lib/training_data/todo/belarus-windows1251.txt +97 -0
  120. data/lib/training_data/todo/bosnian.txt +97 -0
  121. data/lib/training_data/todo/breton.txt +159 -0
  122. data/lib/training_data/todo/bulgarian-iso8859_5.txt +115 -0
  123. data/lib/training_data/todo/catalan.txt +93 -0
  124. data/lib/training_data/todo/croatian-ascii.txt +104 -0
  125. data/lib/training_data/todo/esperanto.txt +95 -0
  126. data/lib/training_data/todo/estonian.txt +218 -0
  127. data/lib/training_data/todo/frisian.txt +99 -0
  128. data/lib/training_data/todo/georgian.txt +86 -0
  129. data/lib/training_data/todo/greek-iso8859-7.txt +139 -0
  130. data/lib/training_data/todo/hawaian.txt +108 -0
  131. data/lib/training_data/todo/hebrew-iso8859_8.txt +79 -0
  132. data/lib/training_data/todo/hindi.txt +77 -0
  133. data/lib/training_data/todo/hungarian.txt +102 -0
  134. data/lib/training_data/todo/icelandic.txt +131 -0
  135. data/lib/training_data/todo/indonesian.txt +93 -0
  136. data/lib/training_data/todo/irish.txt +209 -0
  137. data/lib/training_data/todo/latin.txt +120 -0
  138. data/lib/training_data/todo/latvian.txt +126 -0
  139. data/lib/training_data/todo/lithuanian.txt +99 -0
  140. data/lib/training_data/todo/malay.txt +108 -0
  141. data/lib/training_data/todo/manx.txt +78 -0
  142. data/lib/training_data/todo/marathi.txt +100 -0
  143. data/lib/training_data/todo/mf.txt +100 -0
  144. data/lib/training_data/todo/middle_frisian.txt +102 -0
  145. data/lib/training_data/todo/mingo.txt +146 -0
  146. data/lib/training_data/todo/nepali.txt +131 -0
  147. data/lib/training_data/todo/persian.txt +73 -0
  148. data/lib/training_data/todo/quechua.txt +108 -0
  149. data/lib/training_data/todo/romanian.txt +103 -0
  150. data/lib/training_data/todo/rumantsch.txt +110 -0
  151. data/lib/training_data/todo/sanskrit.txt +135 -0
  152. data/lib/training_data/todo/scots.txt +490 -0
  153. data/lib/training_data/todo/scots_gaelic.txt +93 -0
  154. data/lib/training_data/todo/serbian-ascii.txt +121 -0
  155. data/lib/training_data/todo/slovak-ascii.txt +102 -0
  156. data/lib/training_data/todo/slovak-windows1250.txt +115 -0
  157. data/lib/training_data/todo/slovenian-ascii.txt +100 -0
  158. data/lib/training_data/todo/slovenian-iso8859_2.txt +96 -0
  159. data/lib/training_data/todo/sq.txt +110 -0
  160. data/lib/training_data/todo/swahili.txt +120 -0
  161. data/lib/training_data/todo/tagalog.txt +135 -0
  162. data/lib/training_data/todo/tamil.txt +123 -0
  163. data/lib/training_data/todo/turkish.txt +117 -0
  164. data/lib/training_data/todo/ukrainian-koi8_r.txt +214 -0
  165. data/lib/training_data/todo/vietnamese.txt +92 -0
  166. data/lib/training_data/todo/welsh.txt +148 -0
  167. data/lib/training_data/todo/yiddish-utf.txt +83 -0
  168. data/lib/training_data/uk-utf8.txt +75 -0
  169. data/lib/training_data/vi-utf8.txt +47 -0
  170. data/lib/training_data/zh-utf8.txt +228 -0
  171. data/test/language_detector_test.rb +78 -0
  172. metadata +232 -0
@@ -0,0 +1,400 @@
1
+ _ 16483
2
+ a 9342
3
+ i 5293
4
+ a_ 4071
5
+ u 2730
6
+ k 2609
7
+ n 2351
8
+ w 2076
9
+ m 1928
10
+ e 1866
11
+ h 1800
12
+ o 1775
13
+ wa 1743
14
+ l 1486
15
+ s 1419
16
+ i_ 1401
17
+ t 1399
18
+ _k 1306
19
+ y 1100
20
+ _w 969
21
+ li 945
22
+ wa_ 911
23
+ z 891
24
+ _wa 890
25
+ ka 834
26
+ ku 799
27
+ r 770
28
+ b 733
29
+ an 727
30
+ ma 723
31
+ o_ 711
32
+ _m 707
33
+ na 698
34
+ ya 675
35
+ ha 672
36
+ g 602
37
+ al 580
38
+ d 570
39
+ at 560
40
+ am 554
41
+ _n 549
42
+ _ku 549
43
+ ik 543
44
+ _h 515
45
+ ya_ 514
46
+ A 494
47
+ is 487
48
+ _y 485
49
+ hi 474
50
+ na_ 471
51
+ _ya 471
52
+ ta 468
53
+ sh 456
54
+ ali 449
55
+ j 426
56
+ u_ 423
57
+ ki 418
58
+ e_ 402
59
+ p 401
60
+ ti 401
61
+ _wa_ 399
62
+ f 392
63
+ _ya_ 390
64
+ ba 390
65
+ ri 385
66
+ ng 385
67
+ il 380
68
+ c 358
69
+ hu 356
70
+ _na 356
71
+ ni 355
72
+ za 354
73
+ zi 351
74
+ ia 344
75
+ _na_ 343
76
+ _a 336
77
+ in 327
78
+ _ma 326
79
+ ch 322
80
+ mb 317
81
+ ika 314
82
+ . 311
83
+ ._ 309
84
+ _ka 307
85
+ as 306
86
+ ak 306
87
+ ati 301
88
+ , 300
89
+ ka_ 296
90
+ ,_ 294
91
+ _u 292
92
+ kw 286
93
+ ili 278
94
+ K 274
95
+ en 271
96
+ si 266
97
+ _kw 262
98
+ la 261
99
+ ni_ 261
100
+ ma_ 261
101
+ _s 258
102
+ kwa 258
103
+ ar 256
104
+ ut 245
105
+ za_ 245
106
+ nd 242
107
+ mba 241
108
+ _kwa 239
109
+ _z 234
110
+ li_ 233
111
+ un 233
112
+ ny 230
113
+ it 229
114
+ se 229
115
+ yo 227
116
+ ia_ 222
117
+ M 221
118
+ sa 221
119
+ kat 217
120
+ _K 214
121
+ _i 213
122
+ ika_ 213
123
+ ana 212
124
+ ish 212
125
+ kati 206
126
+ _ha 204
127
+ on 201
128
+ ai 200
129
+ I 198
130
+ aa 196
131
+ um 195
132
+ im 190
133
+ v 188
134
+ mu 187
135
+ amb 187
136
+ sha 185
137
+ em 183
138
+ fa 181
139
+ zi_ 180
140
+ di 179
141
+ mi 178
142
+ _M 178
143
+ us 176
144
+ _ki 176
145
+ ha_ 175
146
+ iw 172
147
+ ama 172
148
+ _kat 168
149
+ _kati 168
150
+ _hi 166
151
+ _l 166
152
+ ra 166
153
+ kwa_ 165
154
+ la_ 164
155
+ W 164
156
+ ja 163
157
+ U 163
158
+ N 163
159
+ amba 161
160
+ ao 161
161
+ _za 160
162
+ ji 160
163
+ B 157
164
+ iwa 155
165
+ tik 155
166
+ wal 155
167
+ le 155
168
+ tika 154
169
+ ge 153
170
+ lis 153
171
+ tu 152
172
+ atika 152
173
+ to 152
174
+ atik 152
175
+ uw 152
176
+ _kwa_ 151
177
+ A_ 151
178
+ ke 150
179
+ S 147
180
+ tika_ 145
181
+ aj 145
182
+ we 144
183
+ cha 144
184
+ bi 141
185
+ az 140
186
+ er 139
187
+ ek 138
188
+ katik 138
189
+ ez 138
190
+ uwa 137
191
+ kut 135
192
+ _al 134
193
+ _B 134
194
+ ad 134
195
+ mu_ 133
196
+ _ali 133
197
+ rik 132
198
+ _W 131
199
+ ba_ 131
200
+ kuw 131
201
+ me 130
202
+ ali_ 128
203
+ kuwa 128
204
+ ema 127
205
+ wan 127
206
+ bu 126
207
+ sem 126
208
+ _A 125
209
+ ir 125
210
+ ata 125
211
+ iz 124
212
+ _hu 124
213
+ ay 124
214
+ ul 124
215
+ af 123
216
+ iki 122
217
+ ema_ 121
218
+ da 120
219
+ ti_ 120
220
+ sema 119
221
+ aka 118
222
+ sema_ 118
223
+ te 118
224
+ uz 117
225
+ yo_ 117
226
+ _v 117
227
+ io 116
228
+ iy 115
229
+ uta 115
230
+ ani 115
231
+ _wal 115
232
+ he 115
233
+ if 114
234
+ _la 114
235
+ ab 114
236
+ go 112
237
+ _za_ 111
238
+ ama_ 111
239
+ sa_ 111
240
+ pa 110
241
+ _t 110
242
+ zo 110
243
+ nge 110
244
+ wam 109
245
+ wali 108
246
+ ua 107
247
+ ur 106
248
+ _c 106
249
+ ise 105
250
+ _ch 105
251
+ isem 105
252
+ ho 105
253
+ ye 104
254
+ iyo 104
255
+ E 104
256
+ el 104
257
+ mo 103
258
+ ung 103
259
+ eri 103
260
+ _wali 103
261
+ _b 102
262
+ mba_ 102
263
+ ari 101
264
+ ita 101
265
+ isema 100
266
+ ot 99
267
+ _la_ 99
268
+ uk 99
269
+ ao_ 99
270
+ di_ 99
271
+ sha_ 99
272
+ ini 99
273
+ kuwa_ 98
274
+ uwa_ 98
275
+ ana_ 98
276
+ lise 98
277
+ lisem 98
278
+ uli 97
279
+ shi 97
280
+ ga 96
281
+ iwa_ 96
282
+ fu 96
283
+ T 96
284
+ R 95
285
+ _il 95
286
+ wak 94
287
+ aw 94
288
+ isha 94
289
+ ri_ 93
290
+ _am 93
291
+ ara 92
292
+ _cha 92
293
+ aji 92
294
+ _ili 91
295
+ ifa 91
296
+ O 90
297
+ _p 90
298
+ uh 90
299
+ iri 90
300
+ chi 90
301
+ asi 89
302
+ po 89
303
+ a. 89
304
+ ong 89
305
+ azi 88
306
+ _j 88
307
+ _kut 88
308
+ eny 88
309
+ nc 88
310
+ a._ 88
311
+ ko 87
312
+ uu 87
313
+ id 87
314
+ w_ 87
315
+ no 87
316
+ P 86
317
+ ah 86
318
+ ina 86
319
+ rika 86
320
+ _Bw 85
321
+ H 85
322
+ gu 85
323
+ uo 85
324
+ Bw_ 85
325
+ _Bw_ 85
326
+ _se 85
327
+ Bw 85
328
+ ib 84
329
+ _S 84
330
+ kam 84
331
+ hi_ 84
332
+ nya 84
333
+ si_ 83
334
+ a, 82
335
+ no_ 81
336
+ pi 81
337
+ ok 81
338
+ i. 81
339
+ ip 81
340
+ kwam 81
341
+ i._ 81
342
+ amba_ 80
343
+ dh 80
344
+ end 80
345
+ ani_ 80
346
+ a,_ 79
347
+ wamb 79
348
+ kwamb 79
349
+ _sh 79
350
+ eza 79
351
+ nz 79
352
+ wi 79
353
+ _kwam 79
354
+ wamba 79
355
+ alis 78
356
+ _kuw 78
357
+ ngo 78
358
+ ap 77
359
+ _N 77
360
+ any 77
361
+ ili_ 77
362
+ C 77
363
+ WA 76
364
+ vy 76
365
+ wana 76
366
+ _hiy 75
367
+ Wa 75
368
+ hiyo 75
369
+ nch 75
370
+ _hiyo 75
371
+ de 75
372
+ _kuwa 75
373
+ ing 75
374
+ hiy 75
375
+ vi 75
376
+ isha_ 74
377
+ es 74
378
+ atu 74
379
+ _Wa 74
380
+ nchi 74
381
+ aki 74
382
+ lim 73
383
+ da_ 73
384
+ ini_ 73
385
+ ash 73
386
+ ala 73
387
+ i, 73
388
+ ano 73
389
+ i,_ 72
390
+ _kam 71
391
+ _wan 71
392
+ ano_ 71
393
+ mw 71
394
+ nde 71
395
+ ji_ 71
396
+ ion 70
397
+ _amb 70
398
+ ndi 70
399
+ _Ka 70
400
+ eza_ 70
@@ -0,0 +1,400 @@
1
+ _ 33494
2
+ e 8992
3
+ n 7900
4
+ t 7859
5
+ a 7781
6
+ r 7251
7
+ s 6435
8
+ i 5649
9
+ l 4541
10
+ d 4079
11
+ o 3724
12
+ m 3203
13
+ k 3058
14
+ g 2478
15
+ en 2403
16
+ n_ 2389
17
+ t_ 2073
18
+ de 1939
19
+ r_ 1910
20
+ v 1890
21
+ h 1789
22
+ u 1782
23
+ _s 1768
24
+ � 1724
25
+ er 1709
26
+ f 1597
27
+ en_ 1537
28
+ a_ 1526
29
+ an 1357
30
+ p 1320
31
+ et 1317
32
+ � 1278
33
+ � 1261
34
+ st 1236
35
+ ar 1226
36
+ c 1191
37
+ _d 1158
38
+ e_ 1116
39
+ in 1045
40
+ _f 1027
41
+ te 1000
42
+ b 997
43
+ _a 978
44
+ s_ 974
45
+ ra 958
46
+ . 956
47
+ tt 935
48
+ _i 898
49
+ _m 890
50
+ ._ 886
51
+ ll 870
52
+ ta 844
53
+ _o 842
54
+ _e 839
55
+ nd 820
56
+ ti 804
57
+ sk 798
58
+ re 779
59
+ at 769
60
+ _de 754
61
+ om 743
62
+ m_ 739
63
+ �r 720
64
+ , 697
65
+ ,_ 695
66
+ ng 686
67
+ li 673
68
+ ka 666
69
+ oc 662
70
+ _h 654
71
+ on 652
72
+ et_ 647
73
+ ch 645
74
+ ns 643
75
+ is 642
76
+ er_ 630
77
+ �r 625
78
+ _v 614
79
+ _t 614
80
+ ni 611
81
+ i_ 609
82
+ _oc 592
83
+ tt_ 587
84
+ na 586
85
+ y 586
86
+ la 579
87
+ _b 579
88
+ h_ 577
89
+ kt 575
90
+ ch_ 568
91
+ ig 564
92
+ f� 563
93
+ och 555
94
+ or 555
95
+ _och 554
96
+ och_ 554
97
+ _och_ 553
98
+ me 548
99
+ den 548
100
+ om_ 535
101
+ _i_ 531
102
+ d_ 530
103
+ j 529
104
+ ik 520
105
+ de_ 520
106
+ f�r 518
107
+ ge 498
108
+ ad 497
109
+ _k 491
110
+ _f� 487
111
+ ri 484
112
+ el 482
113
+ il 481
114
+ so 480
115
+ al 474
116
+ g_ 469
117
+ le 464
118
+ an_ 461
119
+ _f�r 447
120
+ si 437
121
+ ar_ 437
122
+ att 435
123
+ _p 434
124
+ es 420
125
+ ing 413
126
+ se 407
127
+ to 404
128
+ _u 403
129
+ _en 403
130
+ and 398
131
+ den_ 395
132
+ nde 393
133
+ nn 393
134
+ _l 391
135
+ �_ 391
136
+ D 385
137
+ �n 383
138
+ nt 382
139
+ l_ 381
140
+ tr 378
141
+ _D 372
142
+ va 370
143
+ am 369
144
+ sa 367
145
+ _so 365
146
+ ga 364
147
+ _en_ 361
148
+ �r_ 358
149
+ ck 357
150
+ av 354
151
+ v_ 351
152
+ ed 347
153
+ ma 346
154
+ da 346
155
+ som 346
156
+ rs 344
157
+ som_ 344
158
+ ve 342
159
+ ter 341
160
+ att_ 341
161
+ ha 338
162
+ ne 337
163
+ ut 335
164
+ as 332
165
+ ska 329
166
+ _at 327
167
+ _att 326
168
+ _som 324
169
+ _att_ 324
170
+ _som_ 323
171
+ vi 322
172
+ ikt 317
173
+ _av 316
174
+ det 316
175
+ _den 315
176
+ he 315
177
+ ss 314
178
+ un 307
179
+ ke 304
180
+ _g 303
181
+ us 302
182
+ di 302
183
+ _st 300
184
+ rn 297
185
+ _me 296
186
+ _� 295
187
+ ade 294
188
+ " 290
189
+ _ha 290
190
+ av_ 289
191
+ ill 288
192
+ _n 286
193
+ _in 279
194
+ io 275
195
+ _r 275
196
+ der 275
197
+ it 274
198
+ _av_ 274
199
+ sta 274
200
+ gen 272
201
+ isk 270
202
+ _ti 269
203
+ id 265
204
+ na_ 265
205
+ ns_ 264
206
+ ko 262
207
+ _den_ 261
208
+ ag 258
209
+ det_ 257
210
+ lig 257
211
+ era 256
212
+ ll_ 255
213
+ _det 252
214
+ _�r 251
215
+ be 249
216
+ _�r_ 248
217
+ ra_ 247
218
+ ion 244
219
+ - 241
220
+ pr 240
221
+ oni 233
222
+ til 231
223
+ ten 228
224
+ _si 225
225
+ k_ 222
226
+ p� 222
227
+ fr 221
228
+ ro 219
229
+ till 219
230
+ iv 216
231
+ ls 216
232
+ ande 215
233
+ �r_ 214
234
+ _det_ 213
235
+ �l 212
236
+ _p� 211
237
+ ts 210
238
+ ens 209
239
+ med 209
240
+ mm 208
241
+ rt 208
242
+ _till 208
243
+ _til 208
244
+ _va 207
245
+ _fr 205
246
+ _sk 205
247
+ var 205
248
+ nin 204
249
+ ning 203
250
+ ol 201
251
+ ka_ 200
252
+ lle 198
253
+ ett 198
254
+ rd 197
255
+ em 196
256
+ p�_ 195
257
+ x 195
258
+ rk 194
259
+ _ut 194
260
+ ste 194
261
+ ds 193
262
+ _vi 192
263
+ �r 192
264
+ S 192
265
+ nde_ 191
266
+ are 191
267
+ ver 190
268
+ _p�_ 190
269
+ nis 189
270
+ kr 189
271
+ _med 188
272
+ all 188
273
+ �n 187
274
+ nge 185
275
+ mo 184
276
+ os 183
277
+ ld 182
278
+ ade_ 181
279
+ _S 181
280
+ ed_ 180
281
+ r� 176
282
+ De 175
283
+ _- 175
284
+ kan 174
285
+ ta_ 173
286
+ ng_ 172
287
+ v� 171
288
+ f�r_ 170
289
+ ill_ 170
290
+ han 170
291
+ _De 170
292
+ pp 169
293
+ lt 169
294
+ sam 168
295
+ nte 167
296
+ ans 167
297
+ ton 166
298
+ ur 165
299
+ mi 165
300
+ ess 165
301
+ kl 164
302
+ ig_ 164
303
+ ks 164
304
+ as_ 163
305
+ und 163
306
+ men 162
307
+ med_ 161
308
+ _med_ 161
309
+ ak 161
310
+ Di 160
311
+ ot 159
312
+ rna 159
313
+ ul 159
314
+ _var 159
315
+ te_ 158
316
+ gen_ 158
317
+ het 157
318
+ kto 157
319
+ str 156
320
+ _Di 155
321
+ tad 155
322
+ lan 154
323
+ ga_ 154
324
+ iska 154
325
+ fa 154
326
+ fi 154
327
+ s� 154
328
+ Dikt 153
329
+ Dik 153
330
+ pe 153
331
+ ska_ 152
332
+ ja 152
333
+ H 151
334
+ res 151
335
+ ku 151
336
+ iu 150
337
+ ande_ 150
338
+ till_ 150
339
+ t. 150
340
+ ern 150
341
+ rm 149
342
+ _Dikt 149
343
+ _Dik 149
344
+ ie 149
345
+ bl 148
346
+ -_ 147
347
+ od 147
348
+ _H 147
349
+ n. 147
350
+ ist 147
351
+ _di 146
352
+ ius 146
353
+ _" 145
354
+ la_ 145
355
+ sl 145
356
+ man 145
357
+ ren 145
358
+ _f�r_ 145
359
+ toni 144
360
+ kton 144
361
+ n._ 144
362
+ ktoni 144
363
+ ikton 144
364
+ I 144
365
+ ikto 144
366
+ nius 143
367
+ ten_ 143
368
+ onius 143
369
+ oniu 143
370
+ toniu 143
371
+ ing_ 143
372
+ Dikto 143
373
+ niu 143
374
+ _ko 143
375
+ ic 142
376
+ _sa 142
377
+ _han 142
378
+ ett_ 142
379
+ sm 141
380
+ ba 141
381
+ M 141
382
+ gr 140
383
+ l� 140
384
+ ex 138
385
+ t._ 138
386
+ sp 137
387
+ lla 137
388
+ _et 137
389
+ _M 137
390
+ dr 137
391
+ r� 136
392
+ rad 136
393
+ ek 136
394
+ _be 135
395
+ tar 135
396
+ _-_ 135
397
+ _om 134
398
+ rl 134
399
+ E 134
400
+ m� 133