langdetect-ruby 0.1.1 → 0.2.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (48) hide show
  1. checksums.yaml +4 -4
  2. data/README.md +24 -13
  3. data/langdetect-ruby.gemspec +1 -1
  4. data/lib/lingua_ruby/configuration.rb +4 -1
  5. data/lib/lingua_ruby/detector.rb +59 -1
  6. data/lib/lingua_ruby/profile_loader.rb +26 -6
  7. data/lib/lingua_ruby/profiles/am.json +193 -0
  8. data/lib/lingua_ruby/profiles/bg.json +290 -0
  9. data/lib/lingua_ruby/profiles/bn.json +211 -0
  10. data/lib/lingua_ruby/profiles/cs.json +302 -0
  11. data/lib/lingua_ruby/profiles/da.json +302 -0
  12. data/lib/lingua_ruby/profiles/de.json +302 -0
  13. data/lib/lingua_ruby/profiles/el.json +302 -0
  14. data/lib/lingua_ruby/profiles/es.json +302 -0
  15. data/lib/lingua_ruby/profiles/et.json +289 -0
  16. data/lib/lingua_ruby/profiles/fa.json +234 -0
  17. data/lib/lingua_ruby/profiles/fi.json +284 -0
  18. data/lib/lingua_ruby/profiles/fr.json +302 -0
  19. data/lib/lingua_ruby/profiles/ha.json +302 -0
  20. data/lib/lingua_ruby/profiles/hi.json +255 -0
  21. data/lib/lingua_ruby/profiles/hr.json +302 -0
  22. data/lib/lingua_ruby/profiles/hu.json +302 -0
  23. data/lib/lingua_ruby/profiles/it.json +302 -0
  24. data/lib/lingua_ruby/profiles/lt.json +294 -0
  25. data/lib/lingua_ruby/profiles/lv.json +302 -0
  26. data/lib/lingua_ruby/profiles/my.json +200 -0
  27. data/lib/lingua_ruby/profiles/no.json +297 -0
  28. data/lib/lingua_ruby/profiles/pl.json +302 -0
  29. data/lib/lingua_ruby/profiles/pt.json +302 -0
  30. data/lib/lingua_ruby/profiles/ro.json +302 -0
  31. data/lib/lingua_ruby/profiles/ru.json +297 -0
  32. data/lib/lingua_ruby/profiles/sk.json +302 -0
  33. data/lib/lingua_ruby/profiles/sv.json +302 -0
  34. data/lib/lingua_ruby/profiles/sw.json +268 -0
  35. data/lib/lingua_ruby/profiles/ta.json +235 -0
  36. data/lib/lingua_ruby/profiles/te.json +254 -0
  37. data/lib/lingua_ruby/profiles/th.json +251 -0
  38. data/lib/lingua_ruby/profiles/tl.json +302 -0
  39. data/lib/lingua_ruby/profiles/tr.json +302 -0
  40. data/lib/lingua_ruby/profiles/uk.json +302 -0
  41. data/lib/lingua_ruby/profiles/ur.json +232 -0
  42. data/lib/lingua_ruby/profiles/vi.json +277 -0
  43. data/lib/lingua_ruby/profiles/yo.json +245 -0
  44. data/lib/lingua_ruby/profiles/zu.json +302 -0
  45. data/lib/lingua_ruby/result.rb +13 -26
  46. data/lib/lingua_ruby/version.rb +1 -1
  47. data/lib/lingua_ruby.rb +4 -0
  48. metadata +41 -2
@@ -0,0 +1,302 @@
1
+ {
2
+ "e": 0,
3
+ "t": 1,
4
+ "n": 2,
5
+ "i": 3,
6
+ "d": 4,
7
+ "s": 5,
8
+ "u": 6,
9
+ "a": 7,
10
+ "r": 8,
11
+ "h": 9,
12
+ "c": 10,
13
+ "l": 11,
14
+ "ch": 12,
15
+ "n ": 13,
16
+ "e ": 14,
17
+ "nd": 15,
18
+ " d": 16,
19
+ "d ": 17,
20
+ "sch": 18,
21
+ "t ": 19,
22
+ "st": 20,
23
+ "de": 21,
24
+ "sc": 22,
25
+ "p": 23,
26
+ "an": 24,
27
+ " i": 25,
28
+ "nd ": 26,
29
+ "ts": 27,
30
+ "eu": 28,
31
+ "in": 29,
32
+ "che": 30,
33
+ "en": 31,
34
+ "r ": 32,
35
+ "lan": 33,
36
+ "and": 34,
37
+ "d i": 35,
38
+ " is": 36,
39
+ "ist": 37,
40
+ "st ": 38,
41
+ "in ": 39,
42
+ "he": 40,
43
+ "ie": 41,
44
+ "is": 42,
45
+ "deu": 43,
46
+ "la": 44,
47
+ "tsc": 45,
48
+ "ut": 46,
49
+ "uts": 47,
50
+ "b": 48,
51
+ "eut": 49,
52
+ "k": 50,
53
+ "un": 51,
54
+ " b": 52,
55
+ " s": 53,
56
+ "ein": 54,
57
+ "es": 55,
58
+ "er": 56,
59
+ "hla": 57,
60
+ "chl": 58,
61
+ "o": 59,
62
+ "en ": 60,
63
+ "hl": 61,
64
+ "ei": 62,
65
+ " de": 63,
66
+ "ie ": 64,
67
+ "die": 65,
68
+ "te": 66,
69
+ " di": 67,
70
+ "le": 68,
71
+ "ur": 69,
72
+ "und": 70,
73
+ "di": 71,
74
+ " u": 72,
75
+ "hen": 73,
76
+ "ek": 74,
77
+ " f": 75,
78
+ "hi": 76,
79
+ "ur ": 77,
80
+ "tur": 78,
81
+ "tu": 79,
82
+ "chi": 80,
83
+ "r s": 81,
84
+ " ge": 82,
85
+ "ges": 83,
86
+ "n m": 84,
87
+ " be": 85,
88
+ "t d": 86,
89
+ "spr": 87,
90
+ "ele": 88,
91
+ "sta": 89,
92
+ "he ": 90,
93
+ " ei": 91,
94
+ "t e": 92,
95
+ " un": 93,
96
+ "ge": 94,
97
+ " g": 95,
98
+ "ro": 96,
99
+ "be": 97,
100
+ " e": 98,
101
+ " v": 99,
102
+ "li": 100,
103
+ "f": 101,
104
+ " m": 102,
105
+ "el": 103,
106
+ "ra": 104,
107
+ "ta": 105,
108
+ "g": 106,
109
+ "pr": 107,
110
+ "sp": 108,
111
+ "v": 109,
112
+ "m": 110,
113
+ "it": 111,
114
+ "dt ": 112,
115
+ "nds": 113,
116
+ "ds ": 114,
117
+ "s u": 115,
118
+ "ale": 116,
119
+ "ral": 117,
120
+ "t b": 118,
121
+ "era": 119,
122
+ "bek": 120,
123
+ "eka": 121,
124
+ "kan": 122,
125
+ "ann": 123,
126
+ "nnt": 124,
127
+ "der": 125,
128
+ "nt ": 126,
129
+ "hte": 127,
130
+ "w": 128,
131
+ "aat": 129,
132
+ "esp": 130,
133
+ "pro": 131,
134
+ "roc": 132,
135
+ "och": 133,
136
+ "n b": 134,
137
+ "ber": 135,
138
+ "erl": 136,
139
+ "rli": 137,
140
+ "lin": 138,
141
+ "n i": 139,
142
+ "taa": 140,
143
+ "e h": 141,
144
+ " ha": 142,
145
+ "hau": 143,
146
+ "aup": 144,
147
+ "upt": 145,
148
+ "pts": 146,
149
+ "tst": 147,
150
+ " st": 148,
151
+ "tad": 149,
152
+ "er ": 150,
153
+ "ler": 151,
154
+ "adt": 152,
155
+ "te ": 153,
156
+ "e k": 154,
157
+ " ku": 155,
158
+ "kul": 156,
159
+ "sre": 157,
160
+ "ult": 158,
161
+ "ltu": 159,
162
+ "esr": 160,
163
+ "des": 161,
164
+ "r u": 162,
165
+ "d a": 163,
166
+ "nde": 164,
167
+ " ar": 165,
168
+ "arc": 166,
169
+ "bun": 167,
170
+ "rch": 168,
171
+ "hit": 169,
172
+ "ite": 170,
173
+ "tek": 171,
174
+ "ekt": 172,
175
+ " bu": 173,
176
+ "e b": 174,
177
+ "r d": 175,
178
+ "ktu": 176,
179
+ "t f": 177,
180
+ " fü": 178,
181
+ "öde": 179,
182
+ "föd": 180,
183
+ " fö": 181,
184
+ "n f": 182,
185
+ "k d": 183,
186
+ "ik ": 184,
187
+ "lik": 185,
188
+ "bli": 186,
189
+ "ubl": 187,
190
+ "pub": 188,
191
+ "epu": 189,
192
+ "für": 190,
193
+ "ür ": 191,
194
+ "rep": 192,
195
+ " se": 193,
196
+ "sei": 194,
197
+ "ine": 195,
198
+ "ne ": 196,
199
+ "e g": 197,
200
+ "esc": 198,
201
+ "hic": 199,
202
+ "ich": 200,
203
+ "cht": 201,
204
+ "ad": 202,
205
+ "dt": 203,
206
+ "ds": 204,
207
+ "s ": 205,
208
+ "ka": 206,
209
+ "nn": 207,
210
+ "nt": 208,
211
+ "fü": 209,
212
+ "ür": 210,
213
+ "se": 211,
214
+ "ne": 212,
215
+ "ic": 213,
216
+ "ht": 214,
217
+ " k": 215,
218
+ "ku": 216,
219
+ "ul": 217,
220
+ "lt": 218,
221
+ " a": 219,
222
+ "ar": 220,
223
+ "rc": 221,
224
+ "kt": 222,
225
+ "bu": 223,
226
+ "sr": 224,
227
+ "re": 225,
228
+ "ep": 226,
229
+ "ü": 227,
230
+ "ö": 228,
231
+ " l": 229,
232
+ "mi": 230,
233
+ "tt": 231,
234
+ "op": 232,
235
+ "pa": 233,
236
+ "a ": 234,
237
+ "ac": 235,
238
+ " w": 236,
239
+ "wi": 237,
240
+ "ir": 238,
241
+ "rd": 239,
242
+ "vo": 240,
243
+ "on": 241,
244
+ "vi": 242,
245
+ "me": 243,
246
+ "ns": 244,
247
+ "oc": 245,
248
+ "rl": 246,
249
+ " h": 247,
250
+ "ha": 248,
251
+ "au": 249,
252
+ "up": 250,
253
+ "pt": 251,
254
+ "e d": 252,
255
+ "e s": 253,
256
+ " sp": 254,
257
+ "pra": 255,
258
+ "rac": 256,
259
+ "ach": 257,
260
+ "e w": 258,
261
+ " wi": 259,
262
+ "wir": 260,
263
+ "ird": 261,
264
+ "rd ": 262,
265
+ "d v": 263,
266
+ " vo": 264,
267
+ "von": 265,
268
+ "on ": 266,
269
+ "n v": 267,
270
+ " vi": 268,
271
+ "vie": 269,
272
+ "iel": 270,
273
+ "len": 271,
274
+ " me": 272,
275
+ "men": 273,
276
+ "ens": 274,
277
+ "nsc": 275,
278
+ "n g": 276,
279
+ "pu": 277,
280
+ "ub": 278,
281
+ "bl": 279,
282
+ "ik": 280,
283
+ "k ": 281,
284
+ "fö": 282,
285
+ "öd": 283,
286
+ "al": 284,
287
+ "aa": 285,
288
+ "at": 286,
289
+ "n l": 287,
290
+ " la": 288,
291
+ " in": 289,
292
+ " mi": 290,
293
+ "mit": 291,
294
+ "itt": 292,
295
+ "tte": 293,
296
+ "tel": 294,
297
+ "leu": 295,
298
+ "eur": 296,
299
+ "uro": 297,
300
+ "rop": 298,
301
+ "opa": 299
302
+ }
@@ -0,0 +1,302 @@
1
+ {
2
+ "α": 0,
3
+ "ι": 1,
4
+ "ε": 2,
5
+ "ν": 3,
6
+ "τ": 4,
7
+ "α ": 5,
8
+ "λ": 6,
9
+ "ο": 7,
10
+ "σ": 8,
11
+ " ε": 9,
12
+ "ρ": 10,
13
+ "η": 11,
14
+ "να": 12,
15
+ "αι": 13,
16
+ "ι ": 14,
17
+ "ί": 15,
18
+ "αι ": 16,
19
+ "κ": 17,
20
+ "η ": 18,
21
+ "ς": 19,
22
+ "ς ": 20,
23
+ "π": 21,
24
+ "μ": 22,
25
+ "ώ": 23,
26
+ " τ": 24,
27
+ " γ": 25,
28
+ "το": 26,
29
+ " μ": 27,
30
+ " εί": 28,
31
+ "είν": 29,
32
+ "ναι": 30,
33
+ "ίνα": 31,
34
+ "ίν": 32,
35
+ "εί": 33,
36
+ "ή": 34,
37
+ "υ": 35,
38
+ "γ": 36,
39
+ "ά": 37,
40
+ "ι μ": 38,
41
+ "χ": 39,
42
+ "ό": 40,
43
+ "ια ": 41,
44
+ "ου": 42,
45
+ "στ": 43,
46
+ " η": 44,
47
+ " η ": 45,
48
+ "ια": 46,
49
+ " α": 47,
50
+ "ή ": 48,
51
+ " κ": 49,
52
+ "ελ": 50,
53
+ "λλ": 51,
54
+ " ελ": 52,
55
+ " π": 53,
56
+ "ελλ": 54,
57
+ "ες ": 55,
58
+ "η ε": 56,
59
+ " το": 57,
60
+ "ου ": 58,
61
+ "υ ": 59,
62
+ "ες": 60,
63
+ "τε": 61,
64
+ "αρ": 62,
65
+ "κα": 63,
66
+ "ία": 64,
67
+ "α τ": 65,
68
+ "γλώ": 66,
69
+ " γλ": 67,
70
+ "ή γ": 68,
71
+ "λώσ": 69,
72
+ "ώσσ": 70,
73
+ "σα ": 71,
74
+ "κή ": 72,
75
+ "ική": 73,
76
+ "ία ": 74,
77
+ " κα": 75,
78
+ "και": 76,
79
+ "ι ε": 77,
80
+ "μια": 78,
81
+ " μι": 79,
82
+ "δ": 80,
83
+ "α ε": 81,
84
+ "άδα": 82,
85
+ "λάδ": 83,
86
+ "λλά": 84,
87
+ "σσ": 85,
88
+ "σα": 86,
89
+ "τι": 87,
90
+ "ώσ": 88,
91
+ "τη": 89,
92
+ "λώ": 90,
93
+ "ολ": 91,
94
+ "ικ": 92,
95
+ "γλ": 93,
96
+ "κή": 94,
97
+ "ύ": 95,
98
+ "μι": 96,
99
+ "θ": 97,
100
+ "ω": 98,
101
+ "λά": 99,
102
+ "άδ": 100,
103
+ "δα": 101,
104
+ "α κ": 102,
105
+ "θεν": 103,
106
+ "ρία": 104,
107
+ "ρθε": 105,
108
+ "σσα": 106,
109
+ "αρθ": 107,
110
+ " μί": 108,
111
+ "μία": 109,
112
+ "παρ": 110,
113
+ " πα": 111,
114
+ "ν π": 112,
115
+ "ον ": 113,
116
+ "τον": 114,
117
+ "για": 115,
118
+ " γι": 116,
119
+ "α α": 117,
120
+ "τή ": 118,
121
+ "στή": 119,
122
+ "ωστ": 120,
123
+ "νωσ": 121,
124
+ "γνω": 122,
125
+ "ώνα": 123,
126
+ "α έ": 124,
127
+ " έχ": 125,
128
+ "έχε": 126,
129
+ "χει": 127,
130
+ "ει ": 128,
131
+ "α π": 129,
132
+ " πο": 130,
133
+ "πολ": 131,
134
+ "νών": 132,
135
+ "ενώ": 133,
136
+ "ολύ": 134,
137
+ "λύ ": 135,
138
+ "ύ μ": 136,
139
+ " μα": 137,
140
+ "μακ": 138,
141
+ "ακρ": 139,
142
+ "κρά": 140,
143
+ "ρά ": 141,
144
+ "ά ι": 142,
145
+ " ισ": 143,
146
+ "ιστ": 144,
147
+ "στο": 145,
148
+ "τορ": 146,
149
+ "ορί": 147,
150
+ "κόσ": 148,
151
+ "όσμ": 149,
152
+ "σμο": 150,
153
+ "μου": 151,
154
+ "υ η": 152,
155
+ "η α": 153,
156
+ " αθ": 154,
157
+ "αθή": 155,
158
+ "θήν": 156,
159
+ "ήνα": 157,
160
+ "να ": 158,
161
+ "ι η": 159,
162
+ "ας ": 160,
163
+ "η π": 161,
164
+ "δας": 162,
165
+ "ς ε": 163,
166
+ "ης ": 164,
167
+ " πρ": 165,
168
+ "πρω": 166,
169
+ "ρωτ": 167,
170
+ "ωτε": 168,
171
+ "τεύ": 169,
172
+ "εύο": 170,
173
+ "ύου": 171,
174
+ "ουσ": 172,
175
+ "υσα": 173,
176
+ "της": 174,
177
+ " τη": 175,
178
+ " απ": 176,
179
+ "από": 177,
180
+ "πό ": 178,
181
+ "ό τ": 179,
182
+ " τι": 180,
183
+ "τις": 181,
184
+ "ις ": 182,
185
+ "ς α": 183,
186
+ " αρ": 184,
187
+ "αρχ": 185,
188
+ "ρχα": 186,
189
+ "χαι": 187,
190
+ "αιό": 188,
191
+ "ιότ": 189,
192
+ "ότε": 190,
193
+ "τερ": 191,
194
+ "ερε": 192,
195
+ "ρες": 193,
196
+ " γν": 194,
197
+ "ς γ": 195,
198
+ "σσε": 196,
199
+ "σες": 197,
200
+ "ς τ": 198,
201
+ "ι γ": 199,
202
+ "του": 200,
203
+ "ς κ": 201,
204
+ "υ κ": 202,
205
+ " κό": 203,
206
+ " χ": 204,
207
+ "ακ": 205,
208
+ "κρ": 206,
209
+ "ρά": 207,
210
+ "ά ": 208,
211
+ " ι": 209,
212
+ "ισ": 210,
213
+ "ορ": 211,
214
+ "ρί": 212,
215
+ "μί": 213,
216
+ "απ": 214,
217
+ "πό": 215,
218
+ "ό ": 216,
219
+ "έ": 217,
220
+ "ις": 218,
221
+ "ρχ": 219,
222
+ "χα": 220,
223
+ "ιό": 221,
224
+ "ότ": 222,
225
+ "ερ": 223,
226
+ "ρε": 224,
227
+ "σε": 225,
228
+ "κό": 226,
229
+ "όσ": 227,
230
+ "σμ": 228,
231
+ "μο": 229,
232
+ "αθ": 230,
233
+ "θή": 231,
234
+ "ήν": 232,
235
+ "χώ": 233,
236
+ "ώρ": 234,
237
+ "ρα": 235,
238
+ " σ": 236,
239
+ " ν": 237,
240
+ "νο": 238,
241
+ "οτ": 239,
242
+ "ιο": 240,
243
+ "οα": 241,
244
+ "αν": 242,
245
+ "ατ": 243,
246
+ "λι": 244,
247
+ "ευ": 245,
248
+ "υρ": 246,
249
+ "ρώ": 247,
250
+ "ώπ": 248,
251
+ "πη": 249,
252
+ "λη": 250,
253
+ "ην": 251,
254
+ "νι": 252,
255
+ " έ": 253,
256
+ "έχ": 254,
257
+ "χε": 255,
258
+ "ει": 256,
259
+ "πο": 257,
260
+ "λύ": 258,
261
+ "ύ ": 259,
262
+ "μα": 260,
263
+ " στ": 261,
264
+ "στη": 262,
265
+ "τη ": 263,
266
+ "η ν": 264,
267
+ " νο": 265,
268
+ "νοτ": 266,
269
+ "οτι": 267,
270
+ "τιο": 268,
271
+ "ιοα": 269,
272
+ "οαν": 270,
273
+ "ανα": 271,
274
+ "νατ": 272,
275
+ "ατο": 273,
276
+ "τολ": 274,
277
+ "ολι": 275,
278
+ "λικ": 276,
279
+ "ή ε": 277,
280
+ " ευ": 278,
281
+ "ευρ": 279,
282
+ "υρώ": 280,
283
+ "ρώπ": 281,
284
+ "ώπη": 282,
285
+ "πη ": 283,
286
+ "η η": 284,
287
+ "λλη": 285,
288
+ "λην": 286,
289
+ "ηνι": 287,
290
+ "νικ": 288,
291
+ "πρ": 289,
292
+ "ρω": 290,
293
+ "ωτ": 291,
294
+ "εύ": 292,
295
+ "ύο": 293,
296
+ "υσ": 294,
297
+ "ης": 295,
298
+ "ας": 296,
299
+ "γν": 297,
300
+ "νω": 298,
301
+ "ωσ": 299
302
+ }