langdetect-ruby 0.1.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -0,0 +1,402 @@
1
+ {
2
+ "a": 0,
3
+ "n": 1,
4
+ "e": 2,
5
+ "i": 3,
6
+ "d": 4,
7
+ "an": 5,
8
+ "u": 6,
9
+ "r": 7,
10
+ "a ": 8,
11
+ "s": 9,
12
+ "m": 10,
13
+ "g": 11,
14
+ " d": 12,
15
+ "k": 13,
16
+ "t": 14,
17
+ "n ": 15,
18
+ "an ": 16,
19
+ "b": 17,
20
+ "i ": 18,
21
+ "p": 19,
22
+ "l": 20,
23
+ "da": 21,
24
+ "ng": 22,
25
+ "ga": 23,
26
+ "er": 24,
27
+ "sa": 25,
28
+ "ra": 26,
29
+ "h": 27,
30
+ "ar": 28,
31
+ "me": 29,
32
+ "ang": 30,
33
+ "ne": 31,
34
+ "in": 32,
35
+ "be": 33,
36
+ " m": 34,
37
+ "ya": 35,
38
+ " p": 36,
39
+ "ah": 37,
40
+ "la": 38,
41
+ " me": 39,
42
+ "y": 40,
43
+ "ia": 41,
44
+ " s": 42,
45
+ " b": 43,
46
+ " da": 44,
47
+ "en": 45,
48
+ "es": 46,
49
+ "di": 47,
50
+ "du": 48,
51
+ "ng ": 49,
52
+ "g ": 50,
53
+ "at": 51,
54
+ "am": 52,
55
+ "o": 53,
56
+ "ia ": 54,
57
+ "si": 55,
58
+ "al": 56,
59
+ "h ": 57,
60
+ "ba": 58,
61
+ " k": 59,
62
+ "ke": 60,
63
+ " i": 61,
64
+ "ua": 62,
65
+ "em": 63,
66
+ "nd": 64,
67
+ "ah ": 65,
68
+ "ri": 66,
69
+ "pa": 67,
70
+ " in": 68,
71
+ "ara": 69,
72
+ "ra ": 70,
73
+ "ka": 71,
74
+ " ke": 72,
75
+ "ni": 73,
76
+ "un": 74,
77
+ " du": 75,
78
+ "yan": 76,
79
+ "ik": 77,
80
+ "a d": 78,
81
+ " ya": 79,
82
+ "ag": 80,
83
+ "pe": 81,
84
+ " sa": 82,
85
+ " y": 83,
86
+ "aga": 84,
87
+ " pe": 85,
88
+ " n": 86,
89
+ "ad": 87,
90
+ " a": 88,
91
+ "ta": 89,
92
+ "on": 90,
93
+ "ala": 91,
94
+ "do": 92,
95
+ " t": 93,
96
+ " ne": 94,
97
+ "neg": 95,
98
+ "ega": 96,
99
+ "gar": 97,
100
+ " di": 98,
101
+ "ha": 99,
102
+ "eg": 100,
103
+ "tu": 101,
104
+ "sia": 102,
105
+ "li": 103,
106
+ "nt": 104,
107
+ "esi": 105,
108
+ "j": 106,
109
+ " be": 107,
110
+ "nes": 108,
111
+ "dan": 109,
112
+ "one": 110,
113
+ "don": 111,
114
+ "ndo": 112,
115
+ "ind": 113,
116
+ "ada": 114,
117
+ "lah": 115,
118
+ "ban": 116,
119
+ "era": 117,
120
+ "nga": 118,
121
+ "n d": 119,
122
+ "ari": 120,
123
+ "ri ": 121,
124
+ "ua ": 122,
125
+ "atu": 123,
126
+ "nta": 124,
127
+ "a i": 125,
128
+ "mer": 126,
129
+ "kan": 127,
130
+ "uni": 128,
131
+ "at ": 129,
132
+ " ba": 130,
133
+ "sa ": 131,
134
+ "i d": 132,
135
+ "di ": 133,
136
+ "mem": 134,
137
+ "ber": 135,
138
+ "erb": 136,
139
+ "ter": 137,
140
+ " te": 138,
141
+ "aya": 139,
142
+ "uan": 140,
143
+ "na": 141,
144
+ "mi": 142,
145
+ "de": 143,
146
+ "rb": 144,
147
+ "uk": 145,
148
+ "t ": 146,
149
+ "ay": 147,
150
+ "k ": 148,
151
+ "te": 149,
152
+ "as": 150,
153
+ "dun": 151,
154
+ "ru": 152,
155
+ "up": 153,
156
+ "aha": 154,
157
+ "esa": 155,
158
+ "rbe": 156,
159
+ "mp": 157,
160
+ "ula": 158,
161
+ "pul": 159,
162
+ "ini": 160,
163
+ "ni ": 161,
164
+ "m ": 162,
165
+ "am ": 163,
166
+ "gan": 164,
167
+ " j": 165,
168
+ "eng": 166,
169
+ "den": 167,
170
+ " de": 168,
171
+ "a s": 169,
172
+ "ud": 170,
173
+ "eb": 171,
174
+ "a b": 172,
175
+ "dua": 173,
176
+ " r": 174,
177
+ "ak": 175,
178
+ "a m": 176,
179
+ "eru": 177,
180
+ "upa": 178,
181
+ "sat": 179,
182
+ "a p": 180,
183
+ "n p": 181,
184
+ "nia": 182,
185
+ "mpa": 183,
186
+ "ama": 184,
187
+ "ai ": 185,
188
+ " se": 186,
189
+ "i m": 187,
190
+ "gam": 188,
191
+ "au": 189,
192
+ "emi": 190,
193
+ "mil": 191,
194
+ "ya ": 192,
195
+ "pu": 193,
196
+ "ul": 194,
197
+ "ili": 195,
198
+ "ma": 196,
199
+ "ki": 197,
200
+ "u ": 198,
201
+ "dal": 199,
202
+ "se": 200,
203
+ " ad": 201,
204
+ "ki ": 202,
205
+ "ai": 203,
206
+ "pem": 204,
207
+ "iki": 205,
208
+ "lik": 206,
209
+ "il": 207,
210
+ "tia": 208,
211
+ "rag": 209,
212
+ "et": 210,
213
+ "i s": 211,
214
+ "le": 212,
215
+ "us ": 213,
216
+ "ika": 214,
217
+ " ju": 215,
218
+ "gsa": 216,
219
+ "ngs": 217,
220
+ "n a": 218,
221
+ "da ": 219,
222
+ "eda": 220,
223
+ "g s": 221,
224
+ "pen": 222,
225
+ "end": 223,
226
+ "bed": 224,
227
+ "uk ": 225,
228
+ "adi": 226,
229
+ "kay": 227,
230
+ "dar": 228,
231
+ "n b": 229,
232
+ "a r": 230,
233
+ "dat": 231,
234
+ "man": 232,
235
+ "dik": 233,
236
+ "m p": 234,
237
+ "lam": 235,
238
+ "una": 236,
239
+ "gun": 237,
240
+ "g d": 238,
241
+ "i y": 239,
242
+ "eme": 240,
243
+ "i n": 241,
244
+ "g m": 242,
245
+ "eri": 243,
246
+ "rin": 244,
247
+ "eka": 245,
248
+ "int": 246,
249
+ "tah": 247,
250
+ "asa": 248,
251
+ "n k": 249,
252
+ "has": 250,
253
+ "emb": 251,
254
+ "bah": 252,
255
+ "t d": 253,
256
+ "har": 254,
257
+ "r ": 255,
258
+ "mel": 256,
259
+ "si ": 257,
260
+ "asi": 258,
261
+ "h s": 259,
262
+ "n n": 260,
263
+ "aka": 261,
264
+ "rup": 262,
265
+ "i k": 263,
266
+ "ben": 264,
267
+ "is": 265,
268
+ "ed": 266,
269
+ "nj": 267,
270
+ "ja": 268,
271
+ " u": 269,
272
+ "i a": 270,
273
+ "k d": 271,
274
+ "bag": 272,
275
+ "gai": 273,
276
+ "us": 274,
277
+ "s ": 275,
278
+ "a y": 276,
279
+ " un": 277,
280
+ "bu": 278,
281
+ "a a": 279,
282
+ "ar ": 280,
283
+ "sar": 281,
284
+ "bes": 282,
285
+ "eh": 283,
286
+ "n t": 284,
287
+ "id": 285,
288
+ "lau": 286,
289
+ "gu": 287,
290
+ "a k": 288,
291
+ "n i": 289,
292
+ "men": 290,
293
+ "gs": 291,
294
+ "nja": 292,
295
+ "sam": 293,
296
+ "ek": 294,
297
+ "tua": 295,
298
+ "ti": 296,
299
+ "enj": 297,
300
+ "el": 298,
301
+ "ju": 299,
302
+ "nya": 300,
303
+ "ny": 301,
304
+ "nya ": 302,
305
+ "meny": 303,
306
+ "eny": 304,
307
+ "peny": 305,
308
+ "kep": 306,
309
+ "epa": 307,
310
+ "pad": 308,
311
+ "pada": 309,
312
+ " pad": 310,
313
+ "itu": 311,
314
+ " itu": 312,
315
+ "yang": 313,
316
+ " yan": 314,
317
+ "denga": 315,
318
+ "dengan": 316,
319
+ "ngan": 317,
320
+ " den": 318,
321
+ "juga": 319,
322
+ " jug": 320,
323
+ "uga ": 321,
324
+ "seb": 322,
325
+ "seba": 323,
326
+ "bagai": 324,
327
+ "agai": 325,
328
+ "telah": 326,
329
+ "elah": 327,
330
+ "tela": 328,
331
+ " tel": 329,
332
+ "untu": 330,
333
+ "ntuk": 331,
334
+ "tuk ": 332,
335
+ " unt": 333,
336
+ "ora": 334,
337
+ "orang": 335,
338
+ "rang": 336,
339
+ " ora": 337,
340
+ "dap": 338,
341
+ "apat": 339,
342
+ "dpat": 340,
343
+ "suda": 341,
344
+ "udah": 342,
345
+ " sud": 343,
346
+ "haru": 344,
347
+ "arus": 345,
348
+ " har": 346,
349
+ "aka ": 347,
350
+ "mere": 348,
351
+ "erek": 349,
352
+ "reka": 350,
353
+ " mer": 351,
354
+ "maka": 352,
355
+ " mak": 353,
356
+ "tida": 354,
357
+ "idak": 355,
358
+ "dak ": 356,
359
+ " tid": 357,
360
+ "seh": 358,
361
+ "sehi": 359,
362
+ "hing": 360,
363
+ "ingg": 361,
364
+ " seh": 362,
365
+ "aka": 363,
366
+ "masi": 364,
367
+ "asih": 365,
368
+ " mas": 366,
369
+ "kare": 367,
370
+ "aren": 368,
371
+ "rena": 369,
372
+ " kar": 370,
373
+ "dari": 371,
374
+ " dar": 372,
375
+ "ari ": 373,
376
+ "oleh": 374,
377
+ "leh ": 375,
378
+ " ole": 376,
379
+ "sela": 377,
380
+ "elam": 378,
381
+ " sel": 379,
382
+ "perl": 380,
383
+ "erlu": 381,
384
+ " per": 382,
385
+ "bisa": 383,
386
+ "isa ": 384,
387
+ " bis": 385,
388
+ "sang": 386,
389
+ "anga": 387,
390
+ "ngat": 388,
391
+ " san": 389,
392
+ "meng": 390,
393
+ "eng ": 391,
394
+ "ngg": 392,
395
+ "pern": 393,
396
+ "erna": 394,
397
+ "rnah": 395,
398
+ " per": 396,
399
+ "seka": 397,
400
+ "ekar": 398,
401
+ " sek": 399
402
+ }
@@ -0,0 +1,302 @@
1
+ {
2
+ "の": 0,
3
+ "で": 1,
4
+ "日": 2,
5
+ "本": 3,
6
+ "は": 4,
7
+ "す": 5,
8
+ "日本": 6,
9
+ "す ": 7,
10
+ "す 日": 8,
11
+ " 日本": 9,
12
+ "日本の": 10,
13
+ "本の": 11,
14
+ " 日": 12,
15
+ "です": 13,
16
+ "て": 14,
17
+ "世界": 15,
18
+ "に": 16,
19
+ "です ": 17,
20
+ "り": 18,
21
+ "界": 19,
22
+ "世": 20,
23
+ "り ": 21,
24
+ "都": 22,
25
+ "東": 23,
26
+ "ア": 24,
27
+ "は日本": 25,
28
+ "ら": 26,
29
+ "れ": 27,
30
+ "特": 28,
31
+ "であり": 29,
32
+ "あり ": 30,
33
+ "本は": 31,
34
+ "ていま": 32,
35
+ "います": 33,
36
+ "ます ": 34,
37
+ "文化は": 35,
38
+ "化は": 36,
39
+ "文化": 37,
40
+ "は日": 38,
41
+ "ます": 39,
42
+ "いま": 40,
43
+ "てい": 41,
44
+ "であ": 42,
45
+ "あり": 43,
46
+ "一": 44,
47
+ "化": 45,
48
+ "し": 46,
49
+ "と": 47,
50
+ "日本は": 48,
51
+ "が": 49,
52
+ "語": 50,
53
+ "文": 51,
54
+ "れて": 52,
55
+ "用": 53,
56
+ "あ": 54,
57
+ "い": 55,
58
+ "ま": 56,
59
+ "に有": 57,
60
+ "特に": 58,
61
+ "本の文": 59,
62
+ "の文化": 60,
63
+ "してい": 61,
64
+ "用して": 62,
65
+ "使用し": 63,
66
+ "が使用": 64,
67
+ "人が使": 65,
68
+ "万人が": 66,
69
+ "アジア": 67,
70
+ "は特": 68,
71
+ "化は伝": 69,
72
+ "らは": 70,
73
+ "ぷら": 71,
74
+ "天ぷ": 72,
75
+ "は伝統": 73,
76
+ "や天": 74,
77
+ "司や": 75,
78
+ "東ア": 76,
79
+ "伝統と": 77,
80
+ "統と現": 78,
81
+ "と現代": 79,
82
+ "現代が": 80,
83
+ "代が融": 81,
84
+ "が融合": 82,
85
+ "ジアに": 83,
86
+ "アに位": 84,
87
+ "に位置": 85,
88
+ "東アジ": 86,
89
+ "は東ア": 87,
90
+ "本は東": 88,
91
+ "位置す": 89,
92
+ "置する": 90,
93
+ "する島": 91,
94
+ "る島国": 92,
95
+ "島国で": 93,
96
+ "国です": 94,
97
+ "日本語": 95,
98
+ "本語は": 96,
99
+ "語は日": 97,
100
+ "名で": 98,
101
+ "名です": 99,
102
+ "有名": 100,
103
+ "本の公": 101,
104
+ "の公用": 102,
105
+ "公用語": 103,
106
+ "用語で": 104,
107
+ "語であ": 105,
108
+ "り 約": 106,
109
+ " 約一": 107,
110
+ "約一億": 108,
111
+ "一億二": 109,
112
+ "億二千": 110,
113
+ "二千万": 111,
114
+ "千万人": 112,
115
+ "らは特": 113,
116
+ "食文化": 114,
117
+ "の食文": 115,
118
+ "本の食": 116,
119
+ "れてい": 117,
120
+ "られて": 118,
121
+ "知られ": 119,
122
+ "に知ら": 120,
123
+ "的に知": 121,
124
+ "界的に": 122,
125
+ "世界的": 123,
126
+ "で世界": 124,
127
+ "業で世": 125,
128
+ "造業で": 126,
129
+ "製造業": 127,
130
+ "と製造": 128,
131
+ "新と製": 129,
132
+ "革新と": 130,
133
+ "術革新": 131,
134
+ "ぷらは": 132,
135
+ "天ぷら": 133,
136
+ "や天ぷ": 134,
137
+ "司や天": 135,
138
+ "寿司や": 136,
139
+ " 寿司": 137,
140
+ "り 寿": 138,
141
+ "おり ": 139,
142
+ "ており": 140,
143
+ "れてお": 141,
144
+ "されて": 142,
145
+ "愛され": 143,
146
+ "で愛さ": 144,
147
+ "中で愛": 145,
148
+ "界中で": 146,
149
+ "世界中": 147,
150
+ "は世界": 148,
151
+ "化は世": 149,
152
+ "技術革": 150,
153
+ "の首都": 151,
154
+ "本の首": 152,
155
+ "京は日": 153,
156
+ "特に有": 154,
157
+ "に有名": 155,
158
+ "有名で": 156,
159
+ "東京は": 157,
160
+ " 東京": 158,
161
+ "す 東": 159,
162
+ "のです": 160,
163
+ "もので": 161,
164
+ "のもの": 162,
165
+ "特のも": 163,
166
+ "独特の": 164,
167
+ "た独特": 165,
168
+ "した独": 166,
169
+ "合した": 167,
170
+ "融合し": 168,
171
+ "は技術": 169,
172
+ "本は技": 170,
173
+ "つです": 171,
174
+ "一つで": 172,
175
+ "の一つ": 173,
176
+ "圏の一": 174,
177
+ "市圏の": 175,
178
+ "都市圏": 176,
179
+ "は特に": 177,
180
+ "の都市": 178,
181
+ "大の都": 179,
182
+ "最大の": 180,
183
+ "界最大": 181,
184
+ "世界最": 182,
185
+ " 世界": 183,
186
+ "り 世": 184,
187
+ "都であ": 185,
188
+ "首都で": 186,
189
+ "は東": 187,
190
+ "名": 188,
191
+ "有": 189,
192
+ "ぷ": 190,
193
+ "天": 191,
194
+ "や": 192,
195
+ "司": 193,
196
+ "寿": 194,
197
+ "お": 195,
198
+ "さ": 196,
199
+ "愛": 197,
200
+ "中": 198,
201
+ "食": 199,
202
+ "知": 200,
203
+ "的": 201,
204
+ "業": 202,
205
+ "代": 203,
206
+ "約一": 204,
207
+ " 約": 205,
208
+ "語で": 206,
209
+ "用語": 207,
210
+ "公用": 208,
211
+ "の公": 209,
212
+ "語は": 210,
213
+ "本語": 211,
214
+ "国で": 212,
215
+ "島国": 213,
216
+ "る島": 214,
217
+ "する": 215,
218
+ "置す": 216,
219
+ "位置": 217,
220
+ "に位": 218,
221
+ "アに": 219,
222
+ "ジア": 220,
223
+ "アジ": 221,
224
+ "現": 222,
225
+ "統": 223,
226
+ "伝": 224,
227
+ "使": 225,
228
+ "人": 226,
229
+ "万": 227,
230
+ "千": 228,
231
+ "二": 229,
232
+ "億": 230,
233
+ "約": 231,
234
+ "公": 232,
235
+ "国": 233,
236
+ "島": 234,
237
+ "る": 235,
238
+ "置": 236,
239
+ "位": 237,
240
+ "ジ": 238,
241
+ "造": 239,
242
+ "製": 240,
243
+ "新": 241,
244
+ "革": 242,
245
+ "術": 243,
246
+ "技": 244,
247
+ "つ": 245,
248
+ "圏": 246,
249
+ "市": 247,
250
+ "大": 248,
251
+ "最": 249,
252
+ "首": 250,
253
+ "京": 251,
254
+ "も": 252,
255
+ "独": 253,
256
+ "た": 254,
257
+ "合": 255,
258
+ "融": 256,
259
+ "業で": 257,
260
+ "造業": 258,
261
+ "製造": 259,
262
+ "と製": 260,
263
+ "新と": 261,
264
+ "革新": 262,
265
+ "術革": 263,
266
+ "技術": 264,
267
+ "は技": 265,
268
+ "つで": 266,
269
+ "一つ": 267,
270
+ "の一": 268,
271
+ "圏の": 269,
272
+ "市圏": 270,
273
+ "都市": 271,
274
+ "の都": 272,
275
+ "大の": 273,
276
+ "が融": 274,
277
+ "寿司": 275,
278
+ " 寿": 276,
279
+ "おり": 277,
280
+ "てお": 278,
281
+ "され": 279,
282
+ "愛さ": 280,
283
+ "で愛": 281,
284
+ "中で": 282,
285
+ "界中": 283,
286
+ "は世": 284,
287
+ "食文": 285,
288
+ "の食": 286,
289
+ "られ": 287,
290
+ "知ら": 288,
291
+ "に知": 289,
292
+ "的に": 290,
293
+ "界的": 291,
294
+ "で世": 292,
295
+ "代が": 293,
296
+ "現代": 294,
297
+ "と現": 295,
298
+ "統と": 296,
299
+ "伝統": 297,
300
+ "は伝": 298,
301
+ "の文": 299
302
+ }