language_detector 0.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (172) hide show
  1. data/README.rdoc +24 -0
  2. data/Rakefile +18 -0
  3. data/VERSION +1 -0
  4. data/lib/language_detector.rb +232 -0
  5. data/lib/model-fm.yml +52504 -0
  6. data/lib/model-tc.yml +53985 -0
  7. data/lib/textcat_ngrams/afrikaans.lm +400 -0
  8. data/lib/textcat_ngrams/albanian.lm +400 -0
  9. data/lib/textcat_ngrams/amharic-utf.lm +400 -0
  10. data/lib/textcat_ngrams/arabic-iso8859_6.lm +400 -0
  11. data/lib/textcat_ngrams/arabic-windows1256.lm +400 -0
  12. data/lib/textcat_ngrams/armenian.lm +400 -0
  13. data/lib/textcat_ngrams/basque.lm +400 -0
  14. data/lib/textcat_ngrams/belarus-windows1251.lm +400 -0
  15. data/lib/textcat_ngrams/bosnian.lm +400 -0
  16. data/lib/textcat_ngrams/breton.lm +400 -0
  17. data/lib/textcat_ngrams/bulgarian-iso8859_5.lm +400 -0
  18. data/lib/textcat_ngrams/catalan.lm +400 -0
  19. data/lib/textcat_ngrams/chinese-big5.lm +400 -0
  20. data/lib/textcat_ngrams/chinese-gb2312.lm +400 -0
  21. data/lib/textcat_ngrams/croatian-ascii.lm +400 -0
  22. data/lib/textcat_ngrams/czech-iso8859_2.lm +400 -0
  23. data/lib/textcat_ngrams/danish.lm +400 -0
  24. data/lib/textcat_ngrams/dutch.lm +400 -0
  25. data/lib/textcat_ngrams/english.lm +400 -0
  26. data/lib/textcat_ngrams/esperanto.lm +400 -0
  27. data/lib/textcat_ngrams/estonian.lm +400 -0
  28. data/lib/textcat_ngrams/finnish.lm +400 -0
  29. data/lib/textcat_ngrams/french.lm +400 -0
  30. data/lib/textcat_ngrams/frisian.lm +400 -0
  31. data/lib/textcat_ngrams/georgian.lm +400 -0
  32. data/lib/textcat_ngrams/german.lm +400 -0
  33. data/lib/textcat_ngrams/greek-iso8859-7.lm +400 -0
  34. data/lib/textcat_ngrams/hebrew-iso8859_8.lm +400 -0
  35. data/lib/textcat_ngrams/hindi.lm +400 -0
  36. data/lib/textcat_ngrams/hungarian.lm +400 -0
  37. data/lib/textcat_ngrams/icelandic.lm +400 -0
  38. data/lib/textcat_ngrams/indonesian.lm +400 -0
  39. data/lib/textcat_ngrams/irish.lm +400 -0
  40. data/lib/textcat_ngrams/italian.lm +400 -0
  41. data/lib/textcat_ngrams/japanese-euc_jp.lm +400 -0
  42. data/lib/textcat_ngrams/japanese-shift_jis.lm +400 -0
  43. data/lib/textcat_ngrams/korean.lm +400 -0
  44. data/lib/textcat_ngrams/latin.lm +400 -0
  45. data/lib/textcat_ngrams/latvian.lm +400 -0
  46. data/lib/textcat_ngrams/lithuanian.lm +400 -0
  47. data/lib/textcat_ngrams/malay.lm +400 -0
  48. data/lib/textcat_ngrams/manx.lm +400 -0
  49. data/lib/textcat_ngrams/marathi.lm +400 -0
  50. data/lib/textcat_ngrams/mingo.lm +400 -0
  51. data/lib/textcat_ngrams/nepali.lm +400 -0
  52. data/lib/textcat_ngrams/norwegian.lm +400 -0
  53. data/lib/textcat_ngrams/persian.lm +400 -0
  54. data/lib/textcat_ngrams/polish.lm +400 -0
  55. data/lib/textcat_ngrams/portuguese.lm +400 -0
  56. data/lib/textcat_ngrams/quechua.lm +400 -0
  57. data/lib/textcat_ngrams/romanian.lm +400 -0
  58. data/lib/textcat_ngrams/rumantsch.lm +400 -0
  59. data/lib/textcat_ngrams/russian-iso8859_5.lm +400 -0
  60. data/lib/textcat_ngrams/russian-koi8_r.lm +400 -0
  61. data/lib/textcat_ngrams/russian-windows1251.lm +400 -0
  62. data/lib/textcat_ngrams/sanskrit.lm +400 -0
  63. data/lib/textcat_ngrams/scots.lm +400 -0
  64. data/lib/textcat_ngrams/scots_gaelic.lm +400 -0
  65. data/lib/textcat_ngrams/serbian-ascii.lm +400 -0
  66. data/lib/textcat_ngrams/slovak-ascii.lm +400 -0
  67. data/lib/textcat_ngrams/slovak-windows1250.lm +400 -0
  68. data/lib/textcat_ngrams/slovenian-ascii.lm +400 -0
  69. data/lib/textcat_ngrams/slovenian-iso8859_2.lm +400 -0
  70. data/lib/textcat_ngrams/spanish.lm +400 -0
  71. data/lib/textcat_ngrams/swahili.lm +400 -0
  72. data/lib/textcat_ngrams/swedish.lm +400 -0
  73. data/lib/textcat_ngrams/tagalog.lm +400 -0
  74. data/lib/textcat_ngrams/tamil.lm +400 -0
  75. data/lib/textcat_ngrams/thai.lm +400 -0
  76. data/lib/textcat_ngrams/turkish.lm +400 -0
  77. data/lib/textcat_ngrams/ukrainian-koi8_u.lm +400 -0
  78. data/lib/textcat_ngrams/vietnamese.lm +400 -0
  79. data/lib/textcat_ngrams/welsh.lm +400 -0
  80. data/lib/textcat_ngrams/yiddish-utf.lm +400 -0
  81. data/lib/training_data/ar-utf8.txt +54 -0
  82. data/lib/training_data/bg-utf8.txt +26 -0
  83. data/lib/training_data/cs-utf8.txt +48 -0
  84. data/lib/training_data/da-utf8.txt +159 -0
  85. data/lib/training_data/de-utf8.txt +569 -0
  86. data/lib/training_data/el-utf8.txt +48 -0
  87. data/lib/training_data/en-utf8.txt +81 -0
  88. data/lib/training_data/es-utf8.txt +185 -0
  89. data/lib/training_data/et-utf8.txt +50 -0
  90. data/lib/training_data/fa-utf8.txt +42 -0
  91. data/lib/training_data/fi-utf8.txt +83 -0
  92. data/lib/training_data/fr-utf8.txt +191 -0
  93. data/lib/training_data/fy-utf8.txt +22 -0
  94. data/lib/training_data/ga-utf8.txt +109 -0
  95. data/lib/training_data/he-utf8.txt +116 -0
  96. data/lib/training_data/hi-utf8.txt +49 -0
  97. data/lib/training_data/hr-utf8.txt +80 -0
  98. data/lib/training_data/hu-utf8.txt +87 -0
  99. data/lib/training_data/io-utf8.txt +41 -0
  100. data/lib/training_data/is-utf8.txt +94 -0
  101. data/lib/training_data/it-utf8.txt +228 -0
  102. data/lib/training_data/ja-utf8.txt +200 -0
  103. data/lib/training_data/ko-utf8.txt +147 -0
  104. data/lib/training_data/nl-utf8.txt +215 -0
  105. data/lib/training_data/no-utf8.txt +281 -0
  106. data/lib/training_data/pl-utf8.txt +120 -0
  107. data/lib/training_data/pt-utf8.txt +214 -0
  108. data/lib/training_data/ro-utf8.txt +66 -0
  109. data/lib/training_data/ru-utf8.txt +310 -0
  110. data/lib/training_data/sl-utf8.txt +263 -0
  111. data/lib/training_data/sv-utf8.txt +174 -0
  112. data/lib/training_data/th-utf8.txt +49 -0
  113. data/lib/training_data/tk-utf8.txt +101 -0
  114. data/lib/training_data/todo/af.txt +114 -0
  115. data/lib/training_data/todo/amharic-utf.txt +95 -0
  116. data/lib/training_data/todo/arabic-windows1256.txt +157 -0
  117. data/lib/training_data/todo/armenian.txt +86 -0
  118. data/lib/training_data/todo/basque.txt +136 -0
  119. data/lib/training_data/todo/belarus-windows1251.txt +97 -0
  120. data/lib/training_data/todo/bosnian.txt +97 -0
  121. data/lib/training_data/todo/breton.txt +159 -0
  122. data/lib/training_data/todo/bulgarian-iso8859_5.txt +115 -0
  123. data/lib/training_data/todo/catalan.txt +93 -0
  124. data/lib/training_data/todo/croatian-ascii.txt +104 -0
  125. data/lib/training_data/todo/esperanto.txt +95 -0
  126. data/lib/training_data/todo/estonian.txt +218 -0
  127. data/lib/training_data/todo/frisian.txt +99 -0
  128. data/lib/training_data/todo/georgian.txt +86 -0
  129. data/lib/training_data/todo/greek-iso8859-7.txt +139 -0
  130. data/lib/training_data/todo/hawaian.txt +108 -0
  131. data/lib/training_data/todo/hebrew-iso8859_8.txt +79 -0
  132. data/lib/training_data/todo/hindi.txt +77 -0
  133. data/lib/training_data/todo/hungarian.txt +102 -0
  134. data/lib/training_data/todo/icelandic.txt +131 -0
  135. data/lib/training_data/todo/indonesian.txt +93 -0
  136. data/lib/training_data/todo/irish.txt +209 -0
  137. data/lib/training_data/todo/latin.txt +120 -0
  138. data/lib/training_data/todo/latvian.txt +126 -0
  139. data/lib/training_data/todo/lithuanian.txt +99 -0
  140. data/lib/training_data/todo/malay.txt +108 -0
  141. data/lib/training_data/todo/manx.txt +78 -0
  142. data/lib/training_data/todo/marathi.txt +100 -0
  143. data/lib/training_data/todo/mf.txt +100 -0
  144. data/lib/training_data/todo/middle_frisian.txt +102 -0
  145. data/lib/training_data/todo/mingo.txt +146 -0
  146. data/lib/training_data/todo/nepali.txt +131 -0
  147. data/lib/training_data/todo/persian.txt +73 -0
  148. data/lib/training_data/todo/quechua.txt +108 -0
  149. data/lib/training_data/todo/romanian.txt +103 -0
  150. data/lib/training_data/todo/rumantsch.txt +110 -0
  151. data/lib/training_data/todo/sanskrit.txt +135 -0
  152. data/lib/training_data/todo/scots.txt +490 -0
  153. data/lib/training_data/todo/scots_gaelic.txt +93 -0
  154. data/lib/training_data/todo/serbian-ascii.txt +121 -0
  155. data/lib/training_data/todo/slovak-ascii.txt +102 -0
  156. data/lib/training_data/todo/slovak-windows1250.txt +115 -0
  157. data/lib/training_data/todo/slovenian-ascii.txt +100 -0
  158. data/lib/training_data/todo/slovenian-iso8859_2.txt +96 -0
  159. data/lib/training_data/todo/sq.txt +110 -0
  160. data/lib/training_data/todo/swahili.txt +120 -0
  161. data/lib/training_data/todo/tagalog.txt +135 -0
  162. data/lib/training_data/todo/tamil.txt +123 -0
  163. data/lib/training_data/todo/turkish.txt +117 -0
  164. data/lib/training_data/todo/ukrainian-koi8_r.txt +214 -0
  165. data/lib/training_data/todo/vietnamese.txt +92 -0
  166. data/lib/training_data/todo/welsh.txt +148 -0
  167. data/lib/training_data/todo/yiddish-utf.txt +83 -0
  168. data/lib/training_data/uk-utf8.txt +75 -0
  169. data/lib/training_data/vi-utf8.txt +47 -0
  170. data/lib/training_data/zh-utf8.txt +228 -0
  171. data/test/language_detector_test.rb +78 -0
  172. metadata +232 -0
@@ -0,0 +1,400 @@
1
+ _ 7044
2
+ f 2698
3
+ ] 1196
4
+ g 933
5
+ s 815
6
+ l 781
7
+ / 698
8
+ ; 662
9
+ k 645
10
+ d 635
11
+ ]_ 630
12
+ f_ 611
13
+ sf 549
14
+ f] 541
15
+ n 526
16
+ t 460
17
+ o 412
18
+ j 399
19
+ f]_ 374
20
+ L 365
21
+ _; 364
22
+ x 356
23
+ _k 353
24
+ { 337
25
+ b 323
26
+ u 321
27
+ ' 303
28
+ df 299
29
+ sf] 290
30
+ _l 283
31
+ sf]_ 265
32
+ g] 245
33
+ G 232
34
+ e 231
35
+ | 227
36
+ a 222
37
+ /_ 222
38
+ L_ 211
39
+ _g 210
40
+ c 207
41
+ df_ 207
42
+ {_ 207
43
+ _c 201
44
+ g_ 201
45
+ kf 184
46
+ f/ 177
47
+ _u 171
48
+ /f 168
49
+ P 163
50
+ _/ 162
51
+ k| 161
52
+ _s 161
53
+ } 159
54
+ + 158
55
+ h 151
56
+ fn 150
57
+ n] 145
58
+ of 141
59
+ tf 140
60
+ : 136
61
+ p 136
62
+ t_ 134
63
+ . 133
64
+ _k| 133
65
+ ._ 133
66
+ _e 131
67
+ _d 131
68
+ _f 129
69
+ _._ 127
70
+ _. 127
71
+ n]_ 123
72
+ ;f 119
73
+ lj 118
74
+ O 118
75
+ ? 118
76
+ q 118
77
+ nf 118
78
+ y 116
79
+ _a 113
80
+ m 111
81
+ Ps 110
82
+ r 110
83
+ fg 106
84
+ w 105
85
+ sf_ 103
86
+ lg 102
87
+ g]_ 100
88
+ gf 94
89
+ _g] 91
90
+ Psf 90
91
+ x? 89
92
+ fd 88
93
+ fO 88
94
+ _lj 85
95
+ ]s 85
96
+ z 85
97
+ s_ 84
98
+ _p 82
99
+ _sf 80
100
+ D 79
101
+ kl 78
102
+ _;f 78
103
+ f/_ 77
104
+ cf 77
105
+ }_ 76
106
+ Psf] 76
107
+ jf 76
108
+ , 75
109
+ fl 75
110
+ \ 75
111
+ _x 74
112
+ kfn 74
113
+ f{ 74
114
+ _/f 74
115
+ ]k 73
116
+ of] 73
117
+ ,_ 72
118
+ v 72
119
+ lt 72
120
+ _cf 72
121
+ _b 71
122
+ O{ 70
123
+ i 69
124
+ xf 68
125
+ ]kf 68
126
+ _/_ 68
127
+ Psf]_ 68
128
+ _h 67
129
+ g]kfn 67
130
+ g]k 67
131
+ d_ 67
132
+ g]kf 67
133
+ O{_ 67
134
+ ]kfn 67
135
+ _g]k 66
136
+ g' 66
137
+ _g]kf 66
138
+ o_ 64
139
+ " 64
140
+ ;b 63
141
+ Gq 63
142
+ f+ 63
143
+ n_ 63
144
+ fk 62
145
+ sf/ 62
146
+ /L 62
147
+ _kl 62
148
+ I 61
149
+ T 61
150
+ /s 61
151
+ If 61
152
+ dG 60
153
+ _j 60
154
+ ]sf 60
155
+ ;_ 59
156
+ u_ 59
157
+ yf 59
158
+ dGq 58
159
+ fO{ 58
160
+ af 57
161
+ eP 57
162
+ fs 57
163
+ fO{_ 57
164
+ fj 56
165
+ f; 56
166
+ qL 56
167
+ l/ 55
168
+ \_ 55
169
+ ;D 54
170
+ dGqL 54
171
+ GqL 54
172
+ ;+ 53
173
+ g\ 53
174
+ /sf 52
175
+ nfO 51
176
+ _kf 51
177
+ ug 51
178
+ pg 51
179
+ :t 51
180
+ fp 50
181
+ _ug 50
182
+ u/ 50
183
+ lg_ 49
184
+ ePs 49
185
+ fdf 48
186
+ cl 48
187
+ nfO{_ 48
188
+ nfO{ 48
189
+ ;/ 48
190
+ _cl 47
191
+ F 47
192
+ '/ 47
193
+ g\_ 47
194
+ _r 47
195
+ fo 47
196
+ _eP 47
197
+ ]{ 46
198
+ Z 46
199
+ /L_ 46
200
+ _f_ 45
201
+ ePsf 45
202
+ gd 45
203
+ _;D 45
204
+ if 45
205
+ Gb 44
206
+ lb 44
207
+ Q 44
208
+ _n 44
209
+ fsf 44
210
+ ]sf] 43
211
+ +; 43
212
+ nL 43
213
+ lx 43
214
+ _t 43
215
+ _: 42
216
+ +;b 42
217
+ _o 42
218
+ fdf_ 42
219
+ bf 42
220
+ hf 42
221
+ _lg 42
222
+ ePsf] 41
223
+ j_ 41
224
+ ln 41
225
+ ef 41
226
+ /] 41
227
+ _df 41
228
+ To 40
229
+ klg_ 40
230
+ _klg_ 40
231
+ ]sf]_ 40
232
+ klg 40
233
+ _klg 40
234
+ _u/ 40
235
+ f{_ 40
236
+ _ePs 40
237
+ 'g 40
238
+ Gg 39
239
+ :y 39
240
+ _g\ 39
241
+ f} 39
242
+ kf_ 39
243
+ :tf 38
244
+ ]{_ 38
245
+ fpg 38
246
+ b' 38
247
+ hg 38
248
+ g]{ 38
249
+ jZ 38
250
+ _;+ 37
251
+ gs 37
252
+ wf 37
253
+ o{ 37
254
+ GqL_ 37
255
+ l_ 37
256
+ qL_ 37
257
+ dGqL_ 37
258
+ gf_ 37
259
+ ]; 37
260
+ _ePsf 36
261
+ x' 36
262
+ ?_ 36
263
+ ! 36
264
+ fx 35
265
+ u| 34
266
+ ;d 34
267
+ _lb 34
268
+ fn_ 34
269
+ _P 34
270
+ fg_ 34
271
+ = 34
272
+ bn 34
273
+ Zj 34
274
+ o; 34
275
+ g]{_ 34
276
+ _g\_ 34
277
+ kIf 33
278
+ dl 33
279
+ kI 33
280
+ ljZj 33
281
+ jZj 33
282
+ rf 33
283
+ +u 33
284
+ ]d 33
285
+ ljZ 33
286
+ nL_ 32
287
+ f+; 32
288
+ fnL 32
289
+ gL 32
290
+ ;/sf 32
291
+ tf_ 32
292
+ wfg 32
293
+ _;/ 32
294
+ Qm 32
295
+ fb 32
296
+ f;_ 32
297
+ ld 32
298
+ ;/sf/ 32
299
+ /sf/ 32
300
+ _x' 32
301
+ ;/s 32
302
+ ;f+ 32
303
+ _;f+ 32
304
+ fu 32
305
+ x?_ 32
306
+ ;f+; 31
307
+ _k|:t 31
308
+ s' 31
309
+ _kI 31
310
+ _k|: 31
311
+ of]_ 31
312
+ _kIf 31
313
+ _;f+; 31
314
+ ]l 31
315
+ k|: 31
316
+ bg 31
317
+ _;/s 31
318
+ |: 31
319
+ f+;b 31
320
+ _;/sf 31
321
+ |:t 31
322
+ |] 31
323
+ k|:t 31
324
+ m_ 31
325
+ ;f+;b 31
326
+ Jo 30
327
+ k|wf 30
328
+ |w 30
329
+ |wf 30
330
+ k|w 30
331
+ km 30
332
+ J 30
333
+ k|wfg 30
334
+ |wfg 30
335
+ ]t 30
336
+ @ 30
337
+ ;f] 30
338
+ b_ 29
339
+ > 29
340
+ kfn_ 29
341
+ fn] 29
342
+ gsf 29
343
+ sf+ 29
344
+ Zjf 29
345
+ ]kfn_ 29
346
+ jif 29
347
+ ji 29
348
+ jf; 29
349
+ _k|w 29
350
+ fgd 29
351
+ _k|wf 29
352
+ Zjf; 29
353
+ ljZjf 28
354
+ jZjf; 28
355
+ ]n 28
356
+ _z 28
357
+ _s' 28
358
+ _dG 28
359
+ |]; 28
360
+ _;d 28
361
+ jZjf 28
362
+ u|] 27
363
+ gdGq 27
364
+ gdG 27
365
+ ?n 27
366
+ x'g 27
367
+ |wfgd 27
368
+ wfgd 27
369
+ gdGqL 27
370
+ +u|] 27
371
+ f+u 27
372
+ fgdG 27
373
+ u|]; 27
374
+ +u|]; 27
375
+ wfgdG 27
376
+ dfg 27
377
+ a} 27
378
+ _dGq 27
379
+ f+u| 27
380
+ fgdGq 27
381
+ sf+u| 27
382
+ _sf+u 27
383
+ f+u|] 27
384
+ +u| 27
385
+ sf+u 27
386
+ _sf+ 27
387
+ x?n 27
388
+ S 26
389
+ _To 26
390
+ ]kfnL 26
391
+ _! 26
392
+ _T 26
393
+ ul 26
394
+ /f] 26
395
+ fsf] 26
396
+ af_ 26
397
+ ;s 26
398
+ kfnL 26
399
+ |:tf 26
400
+ k|:tf 26
@@ -0,0 +1,400 @@
1
+ _ 22970
2
+ e 6833
3
+ n 4206
4
+ r 3516
5
+ t 3112
6
+ a 2587
7
+ s 2440
8
+ i 2112
9
+ l 1901
10
+ o 1900
11
+ n_ 1875
12
+ r_ 1761
13
+ k 1713
14
+ g 1630
15
+ en 1615
16
+ m 1508
17
+ e_ 1450
18
+ d 1444
19
+ er 1436
20
+ h 1306
21
+ t_ 1300
22
+ _h 1180
23
+ _s 1148
24
+ er_ 1105
25
+ v 982
26
+ en_ 976
27
+ an 919
28
+ . 901
29
+ ._ 791
30
+ _. 781
31
+ et 770
32
+ g_ 762
33
+ _._ 726
34
+ � 725
35
+ u 719
36
+ f 709
37
+ p 702
38
+ ha 682
39
+ _ha 672
40
+ de 657
41
+ te 651
42
+ _e 621
43
+ et_ 614
44
+ re 581
45
+ ne 565
46
+ _o 554
47
+ an_ 544
48
+ ke 534
49
+ _, 522
50
+ ,_ 522
51
+ , 522
52
+ _,_ 522
53
+ _f 519
54
+ _m 515
55
+ or 503
56
+ _d 483
57
+ _i 480
58
+ �_ 479
59
+ se 476
60
+ m_ 469
61
+ nn 454
62
+ b 449
63
+ me 441
64
+ � 434
65
+ _a 413
66
+ st 404
67
+ _t 398
68
+ og 380
69
+ _v 377
70
+ _og 366
71
+ ar 364
72
+ el 364
73
+ le 361
74
+ i_ 356
75
+ om 353
76
+ og_ 351
77
+ _og_ 351
78
+ li 350
79
+ _k 346
80
+ _de 339
81
+ ge 339
82
+ han 337
83
+ y 333
84
+ _han 332
85
+ ve 330
86
+ kk 323
87
+ in 311
88
+ _b 307
89
+ fo 301
90
+ j 301
91
+ il 298
92
+ _H 291
93
+ H 291
94
+ han_ 288
95
+ _han_ 288
96
+ for 287
97
+ ik 281
98
+ l_ 278
99
+ kke 277
100
+ tt 276
101
+ ti 270
102
+ ne_ 270
103
+ d_ 269
104
+ ed 269
105
+ om_ 268
106
+ nne 266
107
+ _me 264
108
+ ng 257
109
+ _er 257
110
+ _fo 256
111
+ eg 256
112
+ _se 256
113
+ _g 256
114
+ un 255
115
+ ig 255
116
+ sk 253
117
+ _er_ 252
118
+ _p 252
119
+ _for 250
120
+ ke_ 249
121
+ _n 238
122
+ _l 233
123
+ al 232
124
+ �r 222
125
+ s_ 221
126
+ ar_ 215
127
+ at 214
128
+ _en 211
129
+ he 211
130
+ pe 209
131
+ _i_ 208
132
+ am 200
133
+ es 200
134
+ si 200
135
+ enn 197
136
+ det 195
137
+ or_ 193
138
+ vi 190
139
+ ns 189
140
+ ikk 188
141
+ det_ 185
142
+ so 185
143
+ un_ 183
144
+ il_ 181
145
+ nd 181
146
+ te_ 181
147
+ "_ 180
148
+ " 180
149
+ _"_ 180
150
+ _" 180
151
+ em 179
152
+ _ti 176
153
+ kke_ 176
154
+ lig 174
155
+ ten 174
156
+ Ha 173
157
+ _Ha 173
158
+ re_ 172
159
+ ikke 168
160
+ je 165
161
+ Han 165
162
+ ter 165
163
+ _Han 165
164
+ eg_ 164
165
+ p� 164
166
+ _p� 163
167
+ _si 163
168
+ _� 163
169
+ _Han_ 162
170
+ Han_ 162
171
+ p�_ 162
172
+ _p�_ 161
173
+ til 160
174
+ som 160
175
+ _so 159
176
+ den 159
177
+ _det 157
178
+ ed_ 155
179
+ ll 155
180
+ _ik 155
181
+ rt 155
182
+ som_ 153
183
+ ra 152
184
+ a_ 152
185
+ har 152
186
+ nt 152
187
+ de_ 152
188
+ tr 151
189
+ v_ 151
190
+ _har 151
191
+ ka 151
192
+ ig_ 150
193
+ _som 150
194
+ for_ 150
195
+ _som_ 150
196
+ _en_ 149
197
+ hu 149
198
+ _ikk 148
199
+ _ham 148
200
+ ham 148
201
+ ste 148
202
+ _det_ 148
203
+ _ikke 148
204
+ enne 148
205
+ ikke_ 148
206
+ har_ 147
207
+ nge 147
208
+ D 147
209
+ _har_ 147
210
+ _D 147
211
+ am_ 147
212
+ ere 147
213
+ ham_ 146
214
+ _ham_ 146
215
+ it 145
216
+ _he 144
217
+ _til 144
218
+ av 143
219
+ va 140
220
+ men 140
221
+ �r 140
222
+ _ve 140
223
+ _hu 139
224
+ ta 139
225
+ pen 137
226
+ sp 137
227
+ _st 135
228
+ tte 135
229
+ la 135
230
+ _E 133
231
+ E 133
232
+ den_ 130
233
+ is 130
234
+ til_ 128
235
+ _r 128
236
+ tt_ 128
237
+ �r_ 127
238
+ k_ 124
239
+ _�_ 124
240
+ ri 124
241
+ _til_ 124
242
+ at_ 123
243
+ ene 123
244
+ seg 123
245
+ _av 123
246
+ med 122
247
+ _vi 122
248
+ _seg 122
249
+ seg_ 121
250
+ _seg_ 121
251
+ _for_ 120
252
+ nne_ 120
253
+ ut 120
254
+ _u 119
255
+ mm 119
256
+ mme 119
257
+ De 118
258
+ _De 118
259
+ _at 118
260
+ _hun 117
261
+ hun 117
262
+ ko 117
263
+ be 116
264
+ _at_ 115
265
+ ter_ 115
266
+ pen_ 114
267
+ ker 113
268
+ hun_ 113
269
+ _hun_ 113
270
+ on 111
271
+ lig_ 111
272
+ .. 110
273
+ hen 107
274
+ _med 107
275
+ rs 106
276
+ ser 106
277
+ med_ 105
278
+ _men 104
279
+ _hen 104
280
+ _sk 104
281
+ _med_ 104
282
+ ak 103
283
+ ans 103
284
+ ker_ 102
285
+ av_ 101
286
+ _ka 101
287
+ no 100
288
+ ver 100
289
+ ler 99
290
+ J 99
291
+ spe 99
292
+ ten_ 99
293
+ _J 99
294
+ ene_ 98
295
+ ld 98
296
+ hv 98
297
+ _av_ 98
298
+ ger 97
299
+ ni 96
300
+ gen 96
301
+ ie 95
302
+ ser_ 94
303
+ _et 94
304
+ spen 94
305
+ _hv 94
306
+ men_ 93
307
+ Espe 92
308
+ Es 92
309
+ _Esp 92
310
+ _Es 92
311
+ _Espe 92
312
+ Esp 92
313
+ _al 92
314
+ Espen 92
315
+ lle 89
316
+ rem 89
317
+ id 89
318
+ f� 89
319
+ ei 88
320
+ inn 88
321
+ rd 88
322
+ enne_ 88
323
+ _henn 87
324
+ henne 87
325
+ henn 87
326
+ kt 86
327
+ spen_ 86
328
+ _om 86
329
+ ler_ 86
330
+ da 86
331
+ ett 86
332
+ itt 86
333
+ bl 85
334
+ to 85
335
+ _Je 84
336
+ ger_ 84
337
+ Je 84
338
+ � 84
339
+ ma 83
340
+ ing 83
341
+ �r 83
342
+ ns_ 83
343
+ eli 82
344
+ ang 82
345
+ _be 82
346
+ s� 82
347
+ _den 82
348
+ pp 81
349
+ rk 81
350
+ dr 81
351
+ oe 81
352
+ ss 81
353
+ _f� 80
354
+ ek 80
355
+ le_ 79
356
+ _no 79
357
+ kj 78
358
+ elig 78
359
+ nes 78
360
+ nn_ 77
361
+ nk 77
362
+ fr 77
363
+ sl 77
364
+ my 77
365
+ kan 77
366
+ s�_ 76
367
+ as 76
368
+ _om_ 76
369
+ _kan 75
370
+ _ko 75
371
+ _bl 73
372
+ Hu 73
373
+ nen 73
374
+ _Hu 73
375
+ eng 73
376
+ gj 73
377
+ rt_ 72
378
+ ge_ 72
379
+ ba 72
380
+ lv 71
381
+ rer 71
382
+ nde 71
383
+ ls 70
384
+ lo 70
385
+ ga 70
386
+ _noe 70
387
+ ro 70
388
+ _den_ 70
389
+ _ut 70
390
+ noe 70
391
+ Hun 69
392
+ Hun_ 69
393
+ _in 69
394
+ _Hun 69
395
+ _Hun_ 69
396
+ ren 68
397
+ �re 68
398
+ �r_ 68
399
+ sen 68
400
+ sa 67