iso-639 0.2.10 → 0.3.1

Sign up to get free protection for your applications and to get access to all the features.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA256:
3
- metadata.gz: da2f2ce60e4acc74618b01f7c2f22e12fd8c86b7a7b6e5e254ae0667cc6c2b7b
4
- data.tar.gz: f5d18fadc8b2aa67847f49f00dfb0354de15ef00c9ec98fafe9721ceb87dec62
3
+ metadata.gz: 814587429390abbe6fb28f55a2ee74b07d65c17e845b369f33a9dab981daef11
4
+ data.tar.gz: aeab1e9162ec0eb34614bbfddd50edf57447ec5905110a2240011119241016af
5
5
  SHA512:
6
- metadata.gz: 5b16c4ae94be5045d5f0334c971cd26f80d81bac61a74339f39e9101e312dad234956136504550b1257a3ac06c9bb708844016c52ac8c33fb3ab9da1c4b97c22
7
- data.tar.gz: 381eb1d06c4eadbeea18ce22fbd71aa3b1a81ed7f7200016e551b7e814570622bbd1bf92194f9150c470eece0e5780f637898963b432ecd79cbeb4e2b4ec88d2
6
+ metadata.gz: 5dce38567522e0a329821cc433518c8a7f20b680c5fe22d3fec488e7cdc007f0bb4e8c6a58153ef07a53a85b8c897d531db591d2fb045363981688a481ad482f
7
+ data.tar.gz: 24cd30d637416bb970c3df0c1595aa0879c60f8329d7ed7f0c467f81ced221d5b88f9af1405007e996b7434433bd0cc14267d09a9d20331f1849a00e4cc30462
data/iso-639.gemspec CHANGED
@@ -2,13 +2,13 @@
2
2
 
3
3
  Gem::Specification.new do |s|
4
4
  s.name = 'iso-639'
5
- s.version = '0.2.10'
5
+ s.version = '0.3.1'
6
6
  s.licenses = ['MIT']
7
7
  s.summary = 'ISO 639-1 and ISO 639-2 language code entries and convenience methods'
8
8
  s.description = 'ISO 639-1 and ISO 639-2 language code entries and convenience methods'
9
9
  s.authors = ['William Melody']
10
10
  s.email = 'hi@williammelody.com'
11
- s.date = '2020-03-01'
11
+ s.date = '2020-03-02'
12
12
  s.extra_rdoc_files = [
13
13
  'LICENSE',
14
14
  'README.md'
@@ -21,6 +21,7 @@ Gem::Specification.new do |s|
21
21
  'README.md',
22
22
  'Rakefile',
23
23
  'iso-639.gemspec',
24
+ 'lib/data/ISO-639-2_utf-8.txt',
24
25
  'lib/iso-639.rb',
25
26
  'test/helper.rb',
26
27
  'test/test_iso_639.rb'
@@ -32,4 +33,5 @@ Gem::Specification.new do |s|
32
33
  s.add_development_dependency('rdoc', '~> 6', '>= 0')
33
34
  s.add_development_dependency('rubocop', '~> 0', '>= 0.49.0')
34
35
  s.add_development_dependency('test-unit', '~> 3', '>= 0')
36
+ s.required_ruby_version = '>= 2.3'
35
37
  end
@@ -0,0 +1,487 @@
1
+ aar||aa|Afar|afar
2
+ abk||ab|Abkhazian|abkhaze
3
+ ace|||Achinese|aceh
4
+ ach|||Acoli|acoli
5
+ ada|||Adangme|adangme
6
+ ady|||Adyghe; Adygei|adyghé
7
+ afa|||Afro-Asiatic languages|afro-asiatiques, langues
8
+ afh|||Afrihili|afrihili
9
+ afr||af|Afrikaans|afrikaans
10
+ ain|||Ainu|aïnou
11
+ aka||ak|Akan|akan
12
+ akk|||Akkadian|akkadien
13
+ alb|sqi|sq|Albanian|albanais
14
+ ale|||Aleut|aléoute
15
+ alg|||Algonquian languages|algonquines, langues
16
+ alt|||Southern Altai|altai du Sud
17
+ amh||am|Amharic|amharique
18
+ ang|||English, Old (ca.450-1100)|anglo-saxon (ca.450-1100)
19
+ anp|||Angika|angika
20
+ apa|||Apache languages|apaches, langues
21
+ ara||ar|Arabic|arabe
22
+ arc|||Official Aramaic (700-300 BCE); Imperial Aramaic (700-300 BCE)|araméen d'empire (700-300 BCE)
23
+ arg||an|Aragonese|aragonais
24
+ arm|hye|hy|Armenian|arménien
25
+ arn|||Mapudungun; Mapuche|mapudungun; mapuche; mapuce
26
+ arp|||Arapaho|arapaho
27
+ art|||Artificial languages|artificielles, langues
28
+ arw|||Arawak|arawak
29
+ asm||as|Assamese|assamais
30
+ ast|||Asturian; Bable; Leonese; Asturleonese|asturien; bable; léonais; asturoléonais
31
+ ath|||Athapascan languages|athapascanes, langues
32
+ aus|||Australian languages|australiennes, langues
33
+ ava||av|Avaric|avar
34
+ ave||ae|Avestan|avestique
35
+ awa|||Awadhi|awadhi
36
+ aym||ay|Aymara|aymara
37
+ aze||az|Azerbaijani|azéri
38
+ bad|||Banda languages|banda, langues
39
+ bai|||Bamileke languages|bamiléké, langues
40
+ bak||ba|Bashkir|bachkir
41
+ bal|||Baluchi|baloutchi
42
+ bam||bm|Bambara|bambara
43
+ ban|||Balinese|balinais
44
+ baq|eus|eu|Basque|basque
45
+ bas|||Basa|basa
46
+ bat|||Baltic languages|baltes, langues
47
+ bej|||Beja; Bedawiyet|bedja
48
+ bel||be|Belarusian|biélorusse
49
+ bem|||Bemba|bemba
50
+ ben||bn|Bengali|bengali
51
+ ber|||Berber languages|berbères, langues
52
+ bho|||Bhojpuri|bhojpuri
53
+ bih||bh|Bihari languages|langues biharis
54
+ bik|||Bikol|bikol
55
+ bin|||Bini; Edo|bini; edo
56
+ bis||bi|Bislama|bichlamar
57
+ bla|||Siksika|blackfoot
58
+ bnt|||Bantu languages|bantou, langues
59
+ bos||bs|Bosnian|bosniaque
60
+ bra|||Braj|braj
61
+ bre||br|Breton|breton
62
+ btk|||Batak languages|batak, langues
63
+ bua|||Buriat|bouriate
64
+ bug|||Buginese|bugi
65
+ bul||bg|Bulgarian|bulgare
66
+ bur|mya|my|Burmese|birman
67
+ byn|||Blin; Bilin|blin; bilen
68
+ cad|||Caddo|caddo
69
+ cai|||Central American Indian languages|amérindiennes de L'Amérique centrale, langues
70
+ car|||Galibi Carib|karib; galibi; carib
71
+ cat||ca|Catalan; Valencian|catalan; valencien
72
+ cau|||Caucasian languages|caucasiennes, langues
73
+ ceb|||Cebuano|cebuano
74
+ cel|||Celtic languages|celtiques, langues; celtes, langues
75
+ cha||ch|Chamorro|chamorro
76
+ chb|||Chibcha|chibcha
77
+ che||ce|Chechen|tchétchène
78
+ chg|||Chagatai|djaghataï
79
+ chi|zho|zh|Chinese|chinois
80
+ chk|||Chuukese|chuuk
81
+ chm|||Mari|mari
82
+ chn|||Chinook jargon|chinook, jargon
83
+ cho|||Choctaw|choctaw
84
+ chp|||Chipewyan; Dene Suline|chipewyan
85
+ chr|||Cherokee|cherokee
86
+ chu||cu|Church Slavic; Old Slavonic; Church Slavonic; Old Bulgarian; Old Church Slavonic|slavon d'église; vieux slave; slavon liturgique; vieux bulgare
87
+ chv||cv|Chuvash|tchouvache
88
+ chy|||Cheyenne|cheyenne
89
+ cmc|||Chamic languages|chames, langues
90
+ cnr|||Montenegrin|monténégrin
91
+ cop|||Coptic|copte
92
+ cor||kw|Cornish|cornique
93
+ cos||co|Corsican|corse
94
+ cpe|||Creoles and pidgins, English based|créoles et pidgins basés sur l'anglais
95
+ cpf|||Creoles and pidgins, French-based|créoles et pidgins basés sur le français
96
+ cpp|||Creoles and pidgins, Portuguese-based|créoles et pidgins basés sur le portugais
97
+ cre||cr|Cree|cree
98
+ crh|||Crimean Tatar; Crimean Turkish|tatar de Crimé
99
+ crp|||Creoles and pidgins|créoles et pidgins
100
+ csb|||Kashubian|kachoube
101
+ cus|||Cushitic languages|couchitiques, langues
102
+ cze|ces|cs|Czech|tchèque
103
+ dak|||Dakota|dakota
104
+ dan||da|Danish|danois
105
+ dar|||Dargwa|dargwa
106
+ day|||Land Dayak languages|dayak, langues
107
+ del|||Delaware|delaware
108
+ den|||Slave (Athapascan)|esclave (athapascan)
109
+ dgr|||Dogrib|dogrib
110
+ din|||Dinka|dinka
111
+ div||dv|Divehi; Dhivehi; Maldivian|maldivien
112
+ doi|||Dogri|dogri
113
+ dra|||Dravidian languages|dravidiennes, langues
114
+ dsb|||Lower Sorbian|bas-sorabe
115
+ dua|||Duala|douala
116
+ dum|||Dutch, Middle (ca.1050-1350)|néerlandais moyen (ca. 1050-1350)
117
+ dut|nld|nl|Dutch; Flemish|néerlandais; flamand
118
+ dyu|||Dyula|dioula
119
+ dzo||dz|Dzongkha|dzongkha
120
+ efi|||Efik|efik
121
+ egy|||Egyptian (Ancient)|égyptien
122
+ eka|||Ekajuk|ekajuk
123
+ elx|||Elamite|élamite
124
+ eng||en|English|anglais
125
+ enm|||English, Middle (1100-1500)|anglais moyen (1100-1500)
126
+ epo||eo|Esperanto|espéranto
127
+ est||et|Estonian|estonien
128
+ ewe||ee|Ewe|éwé
129
+ ewo|||Ewondo|éwondo
130
+ fan|||Fang|fang
131
+ fao||fo|Faroese|féroïen
132
+ fat|||Fanti|fanti
133
+ fij||fj|Fijian|fidjien
134
+ fil|||Filipino; Pilipino|filipino; pilipino
135
+ fin||fi|Finnish|finnois
136
+ fiu|||Finno-Ugrian languages|finno-ougriennes, langues
137
+ fon|||Fon|fon
138
+ fre|fra|fr|French|français
139
+ frm|||French, Middle (ca.1400-1600)|français moyen (1400-1600)
140
+ fro|||French, Old (842-ca.1400)|français ancien (842-ca.1400)
141
+ frr|||Northern Frisian|frison septentrional
142
+ frs|||Eastern Frisian|frison oriental
143
+ fry||fy|Western Frisian|frison occidental
144
+ ful||ff|Fulah|peul
145
+ fur|||Friulian|frioulan
146
+ gaa|||Ga|ga
147
+ gay|||Gayo|gayo
148
+ gba|||Gbaya|gbaya
149
+ gem|||Germanic languages|germaniques, langues
150
+ geo|kat|ka|Georgian|géorgien
151
+ ger|deu|de|German|allemand
152
+ gez|||Geez|guèze
153
+ gil|||Gilbertese|kiribati
154
+ gla||gd|Gaelic; Scottish Gaelic|gaélique; gaélique écossais
155
+ gle||ga|Irish|irlandais
156
+ glg||gl|Galician|galicien
157
+ glv||gv|Manx|manx; mannois
158
+ gmh|||German, Middle High (ca.1050-1500)|allemand, moyen haut (ca. 1050-1500)
159
+ goh|||German, Old High (ca.750-1050)|allemand, vieux haut (ca. 750-1050)
160
+ gon|||Gondi|gond
161
+ gor|||Gorontalo|gorontalo
162
+ got|||Gothic|gothique
163
+ grb|||Grebo|grebo
164
+ grc|||Greek, Ancient (to 1453)|grec ancien (jusqu'à 1453)
165
+ gre|ell|el|Greek, Modern (1453-)|grec moderne (après 1453)
166
+ grn||gn|Guarani|guarani
167
+ gsw|||Swiss German; Alemannic; Alsatian|suisse alémanique; alémanique; alsacien
168
+ guj||gu|Gujarati|goudjrati
169
+ gwi|||Gwich'in|gwich'in
170
+ hai|||Haida|haida
171
+ hat||ht|Haitian; Haitian Creole|haïtien; créole haïtien
172
+ hau||ha|Hausa|haoussa
173
+ haw|||Hawaiian|hawaïen
174
+ heb||he|Hebrew|hébreu
175
+ her||hz|Herero|herero
176
+ hil|||Hiligaynon|hiligaynon
177
+ him|||Himachali languages; Western Pahari languages|langues himachalis; langues paharis occidentales
178
+ hin||hi|Hindi|hindi
179
+ hit|||Hittite|hittite
180
+ hmn|||Hmong; Mong|hmong
181
+ hmo||ho|Hiri Motu|hiri motu
182
+ hrv||hr|Croatian|croate
183
+ hsb|||Upper Sorbian|haut-sorabe
184
+ hun||hu|Hungarian|hongrois
185
+ hup|||Hupa|hupa
186
+ iba|||Iban|iban
187
+ ibo||ig|Igbo|igbo
188
+ ice|isl|is|Icelandic|islandais
189
+ ido||io|Ido|ido
190
+ iii||ii|Sichuan Yi; Nuosu|yi de Sichuan
191
+ ijo|||Ijo languages|ijo, langues
192
+ iku||iu|Inuktitut|inuktitut
193
+ ile||ie|Interlingue; Occidental|interlingue
194
+ ilo|||Iloko|ilocano
195
+ ina||ia|Interlingua (International Auxiliary Language Association)|interlingua (langue auxiliaire internationale)
196
+ inc|||Indic languages|indo-aryennes, langues
197
+ ind||id|Indonesian|indonésien
198
+ ine|||Indo-European languages|indo-européennes, langues
199
+ inh|||Ingush|ingouche
200
+ ipk||ik|Inupiaq|inupiaq
201
+ ira|||Iranian languages|iraniennes, langues
202
+ iro|||Iroquoian languages|iroquoises, langues
203
+ ita||it|Italian|italien
204
+ jav||jv|Javanese|javanais
205
+ jbo|||Lojban|lojban
206
+ jpn||ja|Japanese|japonais
207
+ jpr|||Judeo-Persian|judéo-persan
208
+ jrb|||Judeo-Arabic|judéo-arabe
209
+ kaa|||Kara-Kalpak|karakalpak
210
+ kab|||Kabyle|kabyle
211
+ kac|||Kachin; Jingpho|kachin; jingpho
212
+ kal||kl|Kalaallisut; Greenlandic|groenlandais
213
+ kam|||Kamba|kamba
214
+ kan||kn|Kannada|kannada
215
+ kar|||Karen languages|karen, langues
216
+ kas||ks|Kashmiri|kashmiri
217
+ kau||kr|Kanuri|kanouri
218
+ kaw|||Kawi|kawi
219
+ kaz||kk|Kazakh|kazakh
220
+ kbd|||Kabardian|kabardien
221
+ kha|||Khasi|khasi
222
+ khi|||Khoisan languages|khoïsan, langues
223
+ khm||km|Central Khmer|khmer central
224
+ kho|||Khotanese; Sakan|khotanais; sakan
225
+ kik||ki|Kikuyu; Gikuyu|kikuyu
226
+ kin||rw|Kinyarwanda|rwanda
227
+ kir||ky|Kirghiz; Kyrgyz|kirghiz
228
+ kmb|||Kimbundu|kimbundu
229
+ kok|||Konkani|konkani
230
+ kom||kv|Komi|kom
231
+ kon||kg|Kongo|kongo
232
+ kor||ko|Korean|coréen
233
+ kos|||Kosraean|kosrae
234
+ kpe|||Kpelle|kpellé
235
+ krc|||Karachay-Balkar|karatchai balkar
236
+ krl|||Karelian|carélien
237
+ kro|||Kru languages|krou, langues
238
+ kru|||Kurukh|kurukh
239
+ kua||kj|Kuanyama; Kwanyama|kuanyama; kwanyama
240
+ kum|||Kumyk|koumyk
241
+ kur||ku|Kurdish|kurde
242
+ kut|||Kutenai|kutenai
243
+ lad|||Ladino|judéo-espagnol
244
+ lah|||Lahnda|lahnda
245
+ lam|||Lamba|lamba
246
+ lao||lo|Lao|lao
247
+ lat||la|Latin|latin
248
+ lav||lv|Latvian|letton
249
+ lez|||Lezghian|lezghien
250
+ lim||li|Limburgan; Limburger; Limburgish|limbourgeois
251
+ lin||ln|Lingala|lingala
252
+ lit||lt|Lithuanian|lituanien
253
+ lol|||Mongo|mongo
254
+ loz|||Lozi|lozi
255
+ ltz||lb|Luxembourgish; Letzeburgesch|luxembourgeois
256
+ lua|||Luba-Lulua|luba-lulua
257
+ lub||lu|Luba-Katanga|luba-katanga
258
+ lug||lg|Ganda|ganda
259
+ lui|||Luiseno|luiseno
260
+ lun|||Lunda|lunda
261
+ luo|||Luo (Kenya and Tanzania)|luo (Kenya et Tanzanie)
262
+ lus|||Lushai|lushai
263
+ mac|mkd|mk|Macedonian|macédonien
264
+ mad|||Madurese|madourais
265
+ mag|||Magahi|magahi
266
+ mah||mh|Marshallese|marshall
267
+ mai|||Maithili|maithili
268
+ mak|||Makasar|makassar
269
+ mal||ml|Malayalam|malayalam
270
+ man|||Mandingo|mandingue
271
+ mao|mri|mi|Maori|maori
272
+ map|||Austronesian languages|austronésiennes, langues
273
+ mar||mr|Marathi|marathe
274
+ mas|||Masai|massaï
275
+ may|msa|ms|Malay|malais
276
+ mdf|||Moksha|moksa
277
+ mdr|||Mandar|mandar
278
+ men|||Mende|mendé
279
+ mga|||Irish, Middle (900-1200)|irlandais moyen (900-1200)
280
+ mic|||Mi'kmaq; Micmac|mi'kmaq; micmac
281
+ min|||Minangkabau|minangkabau
282
+ mis|||Uncoded languages|langues non codées
283
+ mkh|||Mon-Khmer languages|môn-khmer, langues
284
+ mlg||mg|Malagasy|malgache
285
+ mlt||mt|Maltese|maltais
286
+ mnc|||Manchu|mandchou
287
+ mni|||Manipuri|manipuri
288
+ mno|||Manobo languages|manobo, langues
289
+ moh|||Mohawk|mohawk
290
+ mon||mn|Mongolian|mongol
291
+ mos|||Mossi|moré
292
+ mul|||Multiple languages|multilingue
293
+ mun|||Munda languages|mounda, langues
294
+ mus|||Creek|muskogee
295
+ mwl|||Mirandese|mirandais
296
+ mwr|||Marwari|marvari
297
+ myn|||Mayan languages|maya, langues
298
+ myv|||Erzya|erza
299
+ nah|||Nahuatl languages|nahuatl, langues
300
+ nai|||North American Indian languages|nord-amérindiennes, langues
301
+ nap|||Neapolitan|napolitain
302
+ nau||na|Nauru|nauruan
303
+ nav||nv|Navajo; Navaho|navaho
304
+ nbl||nr|Ndebele, South; South Ndebele|ndébélé du Sud
305
+ nde||nd|Ndebele, North; North Ndebele|ndébélé du Nord
306
+ ndo||ng|Ndonga|ndonga
307
+ nds|||Low German; Low Saxon; German, Low; Saxon, Low|bas allemand; bas saxon; allemand, bas; saxon, bas
308
+ nep||ne|Nepali|népalais
309
+ new|||Nepal Bhasa; Newari|nepal bhasa; newari
310
+ nia|||Nias|nias
311
+ nic|||Niger-Kordofanian languages|nigéro-kordofaniennes, langues
312
+ niu|||Niuean|niué
313
+ nno||nn|Norwegian Nynorsk; Nynorsk, Norwegian|norvégien nynorsk; nynorsk, norvégien
314
+ nob||nb|Bokmål, Norwegian; Norwegian Bokmål|norvégien bokmål
315
+ nog|||Nogai|nogaï; nogay
316
+ non|||Norse, Old|norrois, vieux
317
+ nor||no|Norwegian|norvégien
318
+ nqo|||N'Ko|n'ko
319
+ nso|||Pedi; Sepedi; Northern Sotho|pedi; sepedi; sotho du Nord
320
+ nub|||Nubian languages|nubiennes, langues
321
+ nwc|||Classical Newari; Old Newari; Classical Nepal Bhasa|newari classique
322
+ nya||ny|Chichewa; Chewa; Nyanja|chichewa; chewa; nyanja
323
+ nym|||Nyamwezi|nyamwezi
324
+ nyn|||Nyankole|nyankolé
325
+ nyo|||Nyoro|nyoro
326
+ nzi|||Nzima|nzema
327
+ oci||oc|Occitan (post 1500)|occitan (après 1500)
328
+ oji||oj|Ojibwa|ojibwa
329
+ ori||or|Oriya|oriya
330
+ orm||om|Oromo|galla
331
+ osa|||Osage|osage
332
+ oss||os|Ossetian; Ossetic|ossète
333
+ ota|||Turkish, Ottoman (1500-1928)|turc ottoman (1500-1928)
334
+ oto|||Otomian languages|otomi, langues
335
+ paa|||Papuan languages|papoues, langues
336
+ pag|||Pangasinan|pangasinan
337
+ pal|||Pahlavi|pahlavi
338
+ pam|||Pampanga; Kapampangan|pampangan
339
+ pan||pa|Panjabi; Punjabi|pendjabi
340
+ pap|||Papiamento|papiamento
341
+ pau|||Palauan|palau
342
+ peo|||Persian, Old (ca.600-400 B.C.)|perse, vieux (ca. 600-400 av. J.-C.)
343
+ per|fas|fa|Persian|persan
344
+ phi|||Philippine languages|philippines, langues
345
+ phn|||Phoenician|phénicien
346
+ pli||pi|Pali|pali
347
+ pol||pl|Polish|polonais
348
+ pon|||Pohnpeian|pohnpei
349
+ por||pt|Portuguese|portugais
350
+ pra|||Prakrit languages|prâkrit, langues
351
+ pro|||Provençal, Old (to 1500); Occitan, Old (to 1500)|provençal ancien (jusqu'à 1500); occitan ancien (jusqu'à 1500)
352
+ pus||ps|Pushto; Pashto|pachto
353
+ qaa-qtz|||Reserved for local use|réservée à l'usage local
354
+ que||qu|Quechua|quechua
355
+ raj|||Rajasthani|rajasthani
356
+ rap|||Rapanui|rapanui
357
+ rar|||Rarotongan; Cook Islands Maori|rarotonga; maori des îles Cook
358
+ roa|||Romance languages|romanes, langues
359
+ roh||rm|Romansh|romanche
360
+ rom|||Romany|tsigane
361
+ rum|ron|ro|Romanian; Moldavian; Moldovan|roumain; moldave
362
+ run||rn|Rundi|rundi
363
+ rup|||Aromanian; Arumanian; Macedo-Romanian|aroumain; macédo-roumain
364
+ rus||ru|Russian|russe
365
+ sad|||Sandawe|sandawe
366
+ sag||sg|Sango|sango
367
+ sah|||Yakut|iakoute
368
+ sai|||South American Indian languages|sud-amérindiennes, langues
369
+ sal|||Salishan languages|salishennes, langues
370
+ sam|||Samaritan Aramaic|samaritain
371
+ san||sa|Sanskrit|sanskrit
372
+ sas|||Sasak|sasak
373
+ sat|||Santali|santal
374
+ scn|||Sicilian|sicilien
375
+ sco|||Scots|écossais
376
+ sel|||Selkup|selkoupe
377
+ sem|||Semitic languages|sémitiques, langues
378
+ sga|||Irish, Old (to 900)|irlandais ancien (jusqu'à 900)
379
+ sgn|||Sign Languages|langues des signes
380
+ shn|||Shan|chan
381
+ sid|||Sidamo|sidamo
382
+ sin||si|Sinhala; Sinhalese|singhalais
383
+ sio|||Siouan languages|sioux, langues
384
+ sit|||Sino-Tibetan languages|sino-tibétaines, langues
385
+ sla|||Slavic languages|slaves, langues
386
+ slo|slk|sk|Slovak|slovaque
387
+ slv||sl|Slovenian|slovène
388
+ sma|||Southern Sami|sami du Sud
389
+ sme||se|Northern Sami|sami du Nord
390
+ smi|||Sami languages|sames, langues
391
+ smj|||Lule Sami|sami de Lule
392
+ smn|||Inari Sami|sami d'Inari
393
+ smo||sm|Samoan|samoan
394
+ sms|||Skolt Sami|sami skolt
395
+ sna||sn|Shona|shona
396
+ snd||sd|Sindhi|sindhi
397
+ snk|||Soninke|soninké
398
+ sog|||Sogdian|sogdien
399
+ som||so|Somali|somali
400
+ son|||Songhai languages|songhai, langues
401
+ sot||st|Sotho, Southern|sotho du Sud
402
+ spa||es|Spanish; Castilian|espagnol; castillan
403
+ srd||sc|Sardinian|sarde
404
+ srn|||Sranan Tongo|sranan tongo
405
+ srp||sr|Serbian|serbe
406
+ srr|||Serer|sérère
407
+ ssa|||Nilo-Saharan languages|nilo-sahariennes, langues
408
+ ssw||ss|Swati|swati
409
+ suk|||Sukuma|sukuma
410
+ sun||su|Sundanese|soundanais
411
+ sus|||Susu|soussou
412
+ sux|||Sumerian|sumérien
413
+ swa||sw|Swahili|swahili
414
+ swe||sv|Swedish|suédois
415
+ syc|||Classical Syriac|syriaque classique
416
+ syr|||Syriac|syriaque
417
+ tah||ty|Tahitian|tahitien
418
+ tai|||Tai languages|tai, langues
419
+ tam||ta|Tamil|tamoul
420
+ tat||tt|Tatar|tatar
421
+ tel||te|Telugu|télougou
422
+ tem|||Timne|temne
423
+ ter|||Tereno|tereno
424
+ tet|||Tetum|tetum
425
+ tgk||tg|Tajik|tadjik
426
+ tgl||tl|Tagalog|tagalog
427
+ tha||th|Thai|thaï
428
+ tib|bod|bo|Tibetan|tibétain
429
+ tig|||Tigre|tigré
430
+ tir||ti|Tigrinya|tigrigna
431
+ tiv|||Tiv|tiv
432
+ tkl|||Tokelau|tokelau
433
+ tlh|||Klingon; tlhIngan-Hol|klingon
434
+ tli|||Tlingit|tlingit
435
+ tmh|||Tamashek|tamacheq
436
+ tog|||Tonga (Nyasa)|tonga (Nyasa)
437
+ ton||to|Tonga (Tonga Islands)|tongan (Îles Tonga)
438
+ tpi|||Tok Pisin|tok pisin
439
+ tsi|||Tsimshian|tsimshian
440
+ tsn||tn|Tswana|tswana
441
+ tso||ts|Tsonga|tsonga
442
+ tuk||tk|Turkmen|turkmène
443
+ tum|||Tumbuka|tumbuka
444
+ tup|||Tupi languages|tupi, langues
445
+ tur||tr|Turkish|turc
446
+ tut|||Altaic languages|altaïques, langues
447
+ tvl|||Tuvalu|tuvalu
448
+ twi||tw|Twi|twi
449
+ tyv|||Tuvinian|touva
450
+ udm|||Udmurt|oudmourte
451
+ uga|||Ugaritic|ougaritique
452
+ uig||ug|Uighur; Uyghur|ouïgour
453
+ ukr||uk|Ukrainian|ukrainien
454
+ umb|||Umbundu|umbundu
455
+ und|||Undetermined|indéterminée
456
+ urd||ur|Urdu|ourdou
457
+ uzb||uz|Uzbek|ouszbek
458
+ vai|||Vai|vaï
459
+ ven||ve|Venda|venda
460
+ vie||vi|Vietnamese|vietnamien
461
+ vol||vo|Volapük|volapük
462
+ vot|||Votic|vote
463
+ wak|||Wakashan languages|wakashanes, langues
464
+ wal|||Wolaitta; Wolaytta|wolaitta; wolaytta
465
+ war|||Waray|waray
466
+ was|||Washo|washo
467
+ wel|cym|cy|Welsh|gallois
468
+ wen|||Sorbian languages|sorabes, langues
469
+ wln||wa|Walloon|wallon
470
+ wol||wo|Wolof|wolof
471
+ xal|||Kalmyk; Oirat|kalmouk; oïrat
472
+ xho||xh|Xhosa|xhosa
473
+ yao|||Yao|yao
474
+ yap|||Yapese|yapois
475
+ yid||yi|Yiddish|yiddish
476
+ yor||yo|Yoruba|yoruba
477
+ ypk|||Yupik languages|yupik, langues
478
+ zap|||Zapotec|zapotèque
479
+ zbl|||Blissymbols; Blissymbolics; Bliss|symboles Bliss; Bliss
480
+ zen|||Zenaga|zenaga
481
+ zgh|||Standard Moroccan Tamazight|amazighe standard marocain
482
+ zha||za|Zhuang; Chuang|zhuang; chuang
483
+ znd|||Zande languages|zandé, langues
484
+ zul||zu|Zulu|zoulou
485
+ zun|||Zuni|zuni
486
+ zxx|||No linguistic content; Not applicable|pas de contenu linguistique; non applicable
487
+ zza|||Zaza; Dimili; Dimli; Kirdki; Kirmanjki; Zazaki|zaza; dimili; dimli; kirdki; kirmanjki; zazaki
data/lib/iso-639.rb CHANGED
@@ -1,520 +1,31 @@
1
1
  # frozen_string_literal: true
2
2
 
3
- # http://www.loc.gov/standards/iso639-2/ascii_8bits.html
3
+ require 'csv'
4
4
 
5
5
  class ISO_639 < Array
6
- # Redefine `[]` to freeze all strings and arrays.
7
- #
8
- # Ruby 2.3+ uses the `frozen_string_literal` magic comment to freeze all
9
- # strings, while previous versions require the `#map` approach.
10
- def self.[](a3_bib, a3_term, a2, english_name, french_name)
11
- if a3_bib.frozen? # then Ruby 2.3+
12
- super(a3_bib, a3_term, a2, english_name, french_name).freeze
13
- else
14
- super(
15
- a3_bib.freeze,
16
- a3_term.freeze,
17
- a2.freeze,
18
- english_name.freeze,
19
- french_name.freeze
20
- ).freeze
21
- end
22
- end
23
-
24
- # The ISO 639-2 dataset as an array of entries. Each entry is an array with
25
- # the following format:
6
+ # Load the ISO 639-2 dataset as an array of entries. Each entry is an array
7
+ # with the following format:
26
8
  # * [0]: an alpha-3 (bibliographic) code
27
9
  # * [1]: an alpha-3 (terminologic) code (when given)
28
10
  # * [2]: an alpha-2 code (when given)
29
11
  # * [3]: an English name
30
12
  # * [4]: a French name of a language
31
- ISO_639_2 = [
32
- self["aar", "", "aa", "Afar", "afar"],
33
- self["abk", "", "ab", "Abkhazian", "abkhaze"],
34
- self["ace", "", "", "Achinese", "aceh"],
35
- self["ach", "", "", "Acoli", "acoli"],
36
- self["ada", "", "", "Adangme", "adangme"],
37
- self["ady", "", "", "Adyghe; Adygei", "adyghé"],
38
- self["afa", "", "", "Afro-Asiatic languages", "afro-asiatiques, langues"],
39
- self["afh", "", "", "Afrihili", "afrihili"],
40
- self["afr", "", "af", "Afrikaans", "afrikaans"],
41
- self["ain", "", "", "Ainu", "aïnou"],
42
- self["aka", "", "ak", "Akan", "akan"],
43
- self["akk", "", "", "Akkadian", "akkadien"],
44
- self["alb", "sqi", "sq", "Albanian", "albanais"],
45
- self["ale", "", "", "Aleut", "aléoute"],
46
- self["alg", "", "", "Algonquian languages", "algonquines, langues"],
47
- self["alt", "", "", "Southern Altai", "altai du Sud"],
48
- self["amh", "", "am", "Amharic", "amharique"],
49
- self["ang", "", "", "English, Old (ca.450-1100)", "anglo-saxon (ca.450-1100)"],
50
- self["anp", "", "", "Angika", "angika"],
51
- self["apa", "", "", "Apache languages", "apaches, langues"],
52
- self["ara", "", "ar", "Arabic", "arabe"],
53
- self["arc", "", "", "Official Aramaic (700-300 BCE); Imperial Aramaic (700-300 BCE)", "araméen d'empire (700-300 BCE)"],
54
- self["arg", "", "an", "Aragonese", "aragonais"],
55
- self["arm", "hye", "hy", "Armenian", "arménien"],
56
- self["arn", "", "", "Mapudungun; Mapuche", "mapudungun; mapuche; mapuce"],
57
- self["arp", "", "", "Arapaho", "arapaho"],
58
- self["art", "", "", "Artificial languages", "artificielles, langues"],
59
- self["arw", "", "", "Arawak", "arawak"],
60
- self["asm", "", "as", "Assamese", "assamais"],
61
- self["ast", "", "", "Asturian; Bable; Leonese; Asturleonese", "asturien; bable; léonais; asturoléonais"],
62
- self["ath", "", "", "Athapascan languages", "athapascanes, langues"],
63
- self["aus", "", "", "Australian languages", "australiennes, langues"],
64
- self["ava", "", "av", "Avaric", "avar"],
65
- self["ave", "", "ae", "Avestan", "avestique"],
66
- self["awa", "", "", "Awadhi", "awadhi"],
67
- self["aym", "", "ay", "Aymara", "aymara"],
68
- self["aze", "", "az", "Azerbaijani", "azéri"],
69
- self["bad", "", "", "Banda languages", "banda, langues"],
70
- self["bai", "", "", "Bamileke languages", "bamiléké, langues"],
71
- self["bak", "", "ba", "Bashkir", "bachkir"],
72
- self["bal", "", "", "Baluchi", "baloutchi"],
73
- self["bam", "", "bm", "Bambara", "bambara"],
74
- self["ban", "", "", "Balinese", "balinais"],
75
- self["baq", "eus", "eu", "Basque", "basque"],
76
- self["bas", "", "", "Basa", "basa"],
77
- self["bat", "", "", "Baltic languages", "baltes, langues"],
78
- self["bej", "", "", "Beja; Bedawiyet", "bedja"],
79
- self["bel", "", "be", "Belarusian", "biélorusse"],
80
- self["bem", "", "", "Bemba", "bemba"],
81
- self["ben", "", "bn", "Bengali", "bengali"],
82
- self["ber", "", "", "Berber languages", "berbères, langues"],
83
- self["bho", "", "", "Bhojpuri", "bhojpuri"],
84
- self["bih", "", "bh", "Bihari languages", "langues biharis"],
85
- self["bik", "", "", "Bikol", "bikol"],
86
- self["bin", "", "", "Bini; Edo", "bini; edo"],
87
- self["bis", "", "bi", "Bislama", "bichlamar"],
88
- self["bla", "", "", "Siksika", "blackfoot"],
89
- self["bnt", "", "", "Bantu (Other)", "bantoues, autres langues"],
90
- self["bos", "", "bs", "Bosnian", "bosniaque"],
91
- self["bra", "", "", "Braj", "braj"],
92
- self["bre", "", "br", "Breton", "breton"],
93
- self["btk", "", "", "Batak languages", "batak, langues"],
94
- self["bua", "", "", "Buriat", "bouriate"],
95
- self["bug", "", "", "Buginese", "bugi"],
96
- self["bul", "", "bg", "Bulgarian", "bulgare"],
97
- self["bur", "mya", "my", "Burmese", "birman"],
98
- self["byn", "", "", "Blin; Bilin", "blin; bilen"],
99
- self["cad", "", "", "Caddo", "caddo"],
100
- self["cai", "", "", "Central American Indian languages", "amérindiennes de L'Amérique centrale, langues"],
101
- self["car", "", "", "Galibi Carib", "karib; galibi; carib"],
102
- self["cat", "", "ca", "Catalan; Valencian", "catalan; valencien"],
103
- self["cau", "", "", "Caucasian languages", "caucasiennes, langues"],
104
- self["ceb", "", "", "Cebuano", "cebuano"],
105
- self["cel", "", "", "Celtic languages", "celtiques, langues; celtes, langues"],
106
- self["cha", "", "ch", "Chamorro", "chamorro"],
107
- self["chb", "", "", "Chibcha", "chibcha"],
108
- self["che", "", "ce", "Chechen", "tchétchène"],
109
- self["chg", "", "", "Chagatai", "djaghataï"],
110
- self["chi", "zho", "zh", "Chinese", "chinois"],
111
- self["chk", "", "", "Chuukese", "chuuk"],
112
- self["chm", "", "", "Mari", "mari"],
113
- self["chn", "", "", "Chinook jargon", "chinook, jargon"],
114
- self["cho", "", "", "Choctaw", "choctaw"],
115
- self["chp", "", "", "Chipewyan; Dene Suline", "chipewyan"],
116
- self["chr", "", "", "Cherokee", "cherokee"],
117
- self["chu", "", "cu", "Church Slavic; Old Slavonic; Church Slavonic; Old Bulgarian; Old Church Slavonic", "slavon d'église; vieux slave; slavon liturgique; vieux bulgare"],
118
- self["chv", "", "cv", "Chuvash", "tchouvache"],
119
- self["chy", "", "", "Cheyenne", "cheyenne"],
120
- self["cmc", "", "", "Chamic languages", "chames, langues"],
121
- self["cop", "", "", "Coptic", "copte"],
122
- self["cor", "", "kw", "Cornish", "cornique"],
123
- self["cos", "", "co", "Corsican", "corse"],
124
- self["cpe", "", "", "Creoles and pidgins, English based", "créoles et pidgins basés sur l'anglais"],
125
- self["cpf", "", "", "Creoles and pidgins, French-based ", "créoles et pidgins basés sur le français"],
126
- self["cpp", "", "", "Creoles and pidgins, Portuguese-based ", "créoles et pidgins basés sur le portugais"],
127
- self["cre", "", "cr", "Cree", "cree"],
128
- self["crh", "", "", "Crimean Tatar; Crimean Turkish", "tatar de Crimé"],
129
- self["crp", "", "", "Creoles and pidgins ", "créoles et pidgins"],
130
- self["csb", "", "", "Kashubian", "kachoube"],
131
- self["cus", "", "", "Cushitic languages", "couchitiques, langues"],
132
- self["cze", "ces", "cs", "Czech", "tchèque"],
133
- self["dak", "", "", "Dakota", "dakota"],
134
- self["dan", "", "da", "Danish", "danois"],
135
- self["dar", "", "", "Dargwa", "dargwa"],
136
- self["day", "", "", "Land Dayak languages", "dayak, langues"],
137
- self["del", "", "", "Delaware", "delaware"],
138
- self["den", "", "", "Slave (Athapascan)", "esclave (athapascan)"],
139
- self["dgr", "", "", "Dogrib", "dogrib"],
140
- self["din", "", "", "Dinka", "dinka"],
141
- self["div", "", "dv", "Divehi; Dhivehi; Maldivian", "maldivien"],
142
- self["doi", "", "", "Dogri", "dogri"],
143
- self["dra", "", "", "Dravidian languages", "dravidiennes, langues"],
144
- self["dsb", "", "", "Lower Sorbian", "bas-sorabe"],
145
- self["dua", "", "", "Duala", "douala"],
146
- self["dum", "", "", "Dutch, Middle (ca.1050-1350)", "néerlandais moyen (ca. 1050-1350)"],
147
- self["dut", "nld", "nl", "Dutch; Flemish", "néerlandais; flamand"],
148
- self["dyu", "", "", "Dyula", "dioula"],
149
- self["dzo", "", "dz", "Dzongkha", "dzongkha"],
150
- self["efi", "", "", "Efik", "efik"],
151
- self["egy", "", "", "Egyptian (Ancient)", "égyptien"],
152
- self["eka", "", "", "Ekajuk", "ekajuk"],
153
- self["elx", "", "", "Elamite", "élamite"],
154
- self["eng", "", "en", "English", "anglais"],
155
- self["enm", "", "", "English, Middle (1100-1500)", "anglais moyen (1100-1500)"],
156
- self["epo", "", "eo", "Esperanto", "espéranto"],
157
- self["est", "", "et", "Estonian", "estonien"],
158
- self["ewe", "", "ee", "Ewe", "éwé"],
159
- self["ewo", "", "", "Ewondo", "éwondo"],
160
- self["fan", "", "", "Fang", "fang"],
161
- self["fao", "", "fo", "Faroese", "féroïen"],
162
- self["fat", "", "", "Fanti", "fanti"],
163
- self["fij", "", "fj", "Fijian", "fidjien"],
164
- self["fil", "", "", "Filipino; Pilipino", "filipino; pilipino"],
165
- self["fin", "", "fi", "Finnish", "finnois"],
166
- self["fiu", "", "", "Finno-Ugrian languages", "finno-ougriennes, langues"],
167
- self["fon", "", "", "Fon", "fon"],
168
- self["fre", "fra", "fr", "French", "français"],
169
- self["frm", "", "", "French, Middle (ca.1400-1600)", "français moyen (1400-1600)"],
170
- self["fro", "", "", "French, Old (842-ca.1400)", "français ancien (842-ca.1400)"],
171
- self["frr", "", "", "Northern Frisian", "frison septentrional"],
172
- self["frs", "", "", "Eastern Frisian", "frison oriental"],
173
- self["fry", "", "fy", "Western Frisian", "frison occidental"],
174
- self["ful", "", "ff", "Fulah", "peul"],
175
- self["fur", "", "", "Friulian", "frioulan"],
176
- self["gaa", "", "", "Ga", "ga"],
177
- self["gay", "", "", "Gayo", "gayo"],
178
- self["gba", "", "", "Gbaya", "gbaya"],
179
- self["gem", "", "", "Germanic languages", "germaniques, langues"],
180
- self["geo", "kat", "ka", "Georgian", "géorgien"],
181
- self["ger", "deu", "de", "German", "allemand"],
182
- self["gez", "", "", "Geez", "guèze"],
183
- self["gil", "", "", "Gilbertese", "kiribati"],
184
- self["gla", "", "gd", "Gaelic; Scottish Gaelic", "gaélique; gaélique écossais"],
185
- self["gle", "", "ga", "Irish", "irlandais"],
186
- self["glg", "", "gl", "Galician", "galicien"],
187
- self["glv", "", "gv", "Manx", "manx; mannois"],
188
- self["gmh", "", "", "German, Middle High (ca.1050-1500)", "allemand, moyen haut (ca. 1050-1500)"],
189
- self["goh", "", "", "German, Old High (ca.750-1050)", "allemand, vieux haut (ca. 750-1050)"],
190
- self["gon", "", "", "Gondi", "gond"],
191
- self["gor", "", "", "Gorontalo", "gorontalo"],
192
- self["got", "", "", "Gothic", "gothique"],
193
- self["grb", "", "", "Grebo", "grebo"],
194
- self["grc", "", "", "Greek, Ancient (to 1453)", "grec ancien (jusqu'à 1453)"],
195
- self["gre", "ell", "el", "Greek, Modern (1453-)", "grec moderne (après 1453)"],
196
- self["grn", "", "gn", "Guarani", "guarani"],
197
- self["gsw", "", "", "Swiss German; Alemannic; Alsatian", "suisse alémanique; alémanique; alsacien"],
198
- self["guj", "", "gu", "Gujarati", "goudjrati"],
199
- self["gwi", "", "", "Gwich'in", "gwich'in"],
200
- self["hai", "", "", "Haida", "haida"],
201
- self["hat", "", "ht", "Haitian; Haitian Creole", "haïtien; créole haïtien"],
202
- self["hau", "", "ha", "Hausa", "haoussa"],
203
- self["haw", "", "", "Hawaiian", "hawaïen"],
204
- self["heb", "", "he", "Hebrew", "hébreu"],
205
- self["her", "", "hz", "Herero", "herero"],
206
- self["hil", "", "", "Hiligaynon", "hiligaynon"],
207
- self["him", "", "", "Himachali languages; Western Pahari languages", "langues himachalis; langues paharis occidentales"],
208
- self["hin", "", "hi", "Hindi", "hindi"],
209
- self["hit", "", "", "Hittite", "hittite"],
210
- self["hmn", "", "", "Hmong", "hmong"],
211
- self["hmo", "", "ho", "Hiri Motu", "hiri motu"],
212
- self["hrv", "", "hr", "Croatian", "croate"],
213
- self["hsb", "", "", "Upper Sorbian", "haut-sorabe"],
214
- self["hun", "", "hu", "Hungarian", "hongrois"],
215
- self["hup", "", "", "Hupa", "hupa"],
216
- self["iba", "", "", "Iban", "iban"],
217
- self["ibo", "", "ig", "Igbo", "igbo"],
218
- self["ice", "isl", "is", "Icelandic", "islandais"],
219
- self["ido", "", "io", "Ido", "ido"],
220
- self["iii", "", "ii", "Sichuan Yi; Nuosu", "yi de Sichuan"],
221
- self["ijo", "", "", "Ijo languages", "ijo, langues"],
222
- self["iku", "", "iu", "Inuktitut", "inuktitut"],
223
- self["ile", "", "ie", "Interlingue; Occidental", "interlingue"],
224
- self["ilo", "", "", "Iloko", "ilocano"],
225
- self["ina", "", "ia", "Interlingua (International Auxiliary Language Association)", "interlingua (langue auxiliaire internationale)"],
226
- self["inc", "", "", "Indic languages", "indo-aryennes, langues"],
227
- self["ind", "", "id", "Indonesian", "indonésien"],
228
- self["ine", "", "", "Indo-European languages", "indo-européennes, langues"],
229
- self["inh", "", "", "Ingush", "ingouche"],
230
- self["ipk", "", "ik", "Inupiaq", "inupiaq"],
231
- self["ira", "", "", "Iranian languages", "iraniennes, langues"],
232
- self["iro", "", "", "Iroquoian languages", "iroquoises, langues"],
233
- self["ita", "", "it", "Italian", "italien"],
234
- self["jav", "", "jv", "Javanese", "javanais"],
235
- self["jbo", "", "", "Lojban", "lojban"],
236
- self["jpn", "", "ja", "Japanese", "japonais"],
237
- self["jpr", "", "", "Judeo-Persian", "judéo-persan"],
238
- self["jrb", "", "", "Judeo-Arabic", "judéo-arabe"],
239
- self["kaa", "", "", "Kara-Kalpak", "karakalpak"],
240
- self["kab", "", "", "Kabyle", "kabyle"],
241
- self["kac", "", "", "Kachin; Jingpho", "kachin; jingpho"],
242
- self["kal", "", "kl", "Kalaallisut; Greenlandic", "groenlandais"],
243
- self["kam", "", "", "Kamba", "kamba"],
244
- self["kan", "", "kn", "Kannada", "kannada"],
245
- self["kar", "", "", "Karen languages", "karen, langues"],
246
- self["kas", "", "ks", "Kashmiri", "kashmiri"],
247
- self["kau", "", "kr", "Kanuri", "kanouri"],
248
- self["kaw", "", "", "Kawi", "kawi"],
249
- self["kaz", "", "kk", "Kazakh", "kazakh"],
250
- self["kbd", "", "", "Kabardian", "kabardien"],
251
- self["kha", "", "", "Khasi", "khasi"],
252
- self["khi", "", "", "Khoisan languages", "khoïsan, langues"],
253
- self["khm", "", "km", "Central Khmer", "khmer central"],
254
- self["kho", "", "", "Khotanese; Sakan", "khotanais; sakan"],
255
- self["kik", "", "ki", "Kikuyu; Gikuyu", "kikuyu"],
256
- self["kin", "", "rw", "Kinyarwanda", "rwanda"],
257
- self["kir", "", "ky", "Kirghiz; Kyrgyz", "kirghiz"],
258
- self["kmb", "", "", "Kimbundu", "kimbundu"],
259
- self["kok", "", "", "Konkani", "konkani"],
260
- self["kom", "", "kv", "Komi", "kom"],
261
- self["kon", "", "kg", "Kongo", "kongo"],
262
- self["kor", "", "ko", "Korean", "coréen"],
263
- self["kos", "", "", "Kosraean", "kosrae"],
264
- self["kpe", "", "", "Kpelle", "kpellé"],
265
- self["krc", "", "", "Karachay-Balkar", "karatchai balkar"],
266
- self["krl", "", "", "Karelian", "carélien"],
267
- self["kro", "", "", "Kru languages", "krou, langues"],
268
- self["kru", "", "", "Kurukh", "kurukh"],
269
- self["kua", "", "kj", "Kuanyama; Kwanyama", "kuanyama; kwanyama"],
270
- self["kum", "", "", "Kumyk", "koumyk"],
271
- self["kur", "", "ku", "Kurdish", "kurde"],
272
- self["kut", "", "", "Kutenai", "kutenai"],
273
- self["lad", "", "", "Ladino", "judéo-espagnol"],
274
- self["lah", "", "", "Lahnda", "lahnda"],
275
- self["lam", "", "", "Lamba", "lamba"],
276
- self["lao", "", "lo", "Lao", "lao"],
277
- self["lat", "", "la", "Latin", "latin"],
278
- self["lav", "", "lv", "Latvian", "letton"],
279
- self["lez", "", "", "Lezghian", "lezghien"],
280
- self["lim", "", "li", "Limburgan; Limburger; Limburgish", "limbourgeois"],
281
- self["lin", "", "ln", "Lingala", "lingala"],
282
- self["lit", "", "lt", "Lithuanian", "lituanien"],
283
- self["lol", "", "", "Mongo", "mongo"],
284
- self["loz", "", "", "Lozi", "lozi"],
285
- self["ltz", "", "lb", "Luxembourgish; Letzeburgesch", "luxembourgeois"],
286
- self["lua", "", "", "Luba-Lulua", "luba-lulua"],
287
- self["lub", "", "lu", "Luba-Katanga", "luba-katanga"],
288
- self["lug", "", "lg", "Ganda", "ganda"],
289
- self["lui", "", "", "Luiseno", "luiseno"],
290
- self["lun", "", "", "Lunda", "lunda"],
291
- self["luo", "", "", "Luo (Kenya and Tanzania)", "luo (Kenya et Tanzanie)"],
292
- self["lus", "", "", "Lushai", "lushai"],
293
- self["mac", "mkd", "mk", "Macedonian", "macédonien"],
294
- self["mad", "", "", "Madurese", "madourais"],
295
- self["mag", "", "", "Magahi", "magahi"],
296
- self["mah", "", "mh", "Marshallese", "marshall"],
297
- self["mai", "", "", "Maithili", "maithili"],
298
- self["mak", "", "", "Makasar", "makassar"],
299
- self["mal", "", "ml", "Malayalam", "malayalam"],
300
- self["man", "", "", "Mandingo", "mandingue"],
301
- self["mao", "mri", "mi", "Maori", "maori"],
302
- self["map", "", "", "Austronesian languages", "austronésiennes, langues"],
303
- self["mar", "", "mr", "Marathi", "marathe"],
304
- self["mas", "", "", "Masai", "massaï"],
305
- self["may", "msa", "ms", "Malay", "malais"],
306
- self["mdf", "", "", "Moksha", "moksa"],
307
- self["mdr", "", "", "Mandar", "mandar"],
308
- self["men", "", "", "Mende", "mendé"],
309
- self["mga", "", "", "Irish, Middle (900-1200)", "irlandais moyen (900-1200)"],
310
- self["mic", "", "", "Mi'kmaq; Micmac", "mi'kmaq; micmac"],
311
- self["min", "", "", "Minangkabau", "minangkabau"],
312
- self["mis", "", "", "Uncoded languages", "langues non codées"],
313
- self["mkh", "", "", "Mon-Khmer languages", "môn-khmer, langues"],
314
- self["mlg", "", "mg", "Malagasy", "malgache"],
315
- self["mlt", "", "mt", "Maltese", "maltais"],
316
- self["mnc", "", "", "Manchu", "mandchou"],
317
- self["mni", "", "", "Manipuri", "manipuri"],
318
- self["mno", "", "", "Manobo languages", "manobo, langues"],
319
- self["moh", "", "", "Mohawk", "mohawk"],
320
- self["mon", "", "mn", "Mongolian", "mongol"],
321
- self["mos", "", "", "Mossi", "moré"],
322
- self["mul", "", "", "Multiple languages", "multilingue"],
323
- self["mun", "", "", "Munda languages", "mounda, langues"],
324
- self["mus", "", "", "Creek", "muskogee"],
325
- self["mwl", "", "", "Mirandese", "mirandais"],
326
- self["mwr", "", "", "Marwari", "marvari"],
327
- self["myn", "", "", "Mayan languages", "maya, langues"],
328
- self["myv", "", "", "Erzya", "erza"],
329
- self["nah", "", "", "Nahuatl languages", "nahuatl, langues"],
330
- self["nai", "", "", "North American Indian languages", "nord-amérindiennes, langues"],
331
- self["nap", "", "", "Neapolitan", "napolitain"],
332
- self["nau", "", "na", "Nauru", "nauruan"],
333
- self["nav", "", "nv", "Navajo; Navaho", "navaho"],
334
- self["nbl", "", "nr", "Ndebele, South; South Ndebele", "ndébélé du Sud"],
335
- self["nde", "", "nd", "Ndebele, North; North Ndebele", "ndébélé du Nord"],
336
- self["ndo", "", "ng", "Ndonga", "ndonga"],
337
- self["nds", "", "", "Low German; Low Saxon; German, Low; Saxon, Low", "bas allemand; bas saxon; allemand, bas; saxon, bas"],
338
- self["nep", "", "ne", "Nepali", "népalais"],
339
- self["new", "", "", "Nepal Bhasa; Newari", "nepal bhasa; newari"],
340
- self["nia", "", "", "Nias", "nias"],
341
- self["nic", "", "", "Niger-Kordofanian languages", "nigéro-kordofaniennes, langues"],
342
- self["niu", "", "", "Niuean", "niué"],
343
- self["nno", "", "nn", "Norwegian Nynorsk; Nynorsk, Norwegian", "norvégien nynorsk; nynorsk, norvégien"],
344
- self["nob", "", "nb", "Bokmål, Norwegian; Norwegian Bokmål", "norvégien bokmål"],
345
- self["nog", "", "", "Nogai", "nogaï; nogay"],
346
- self["non", "", "", "Norse, Old", "norrois, vieux"],
347
- self["nor", "", "no", "Norwegian", "norvégien"],
348
- self["nqo", "", "", "N'Ko", "n'ko"],
349
- self["nso", "", "", "Pedi; Sepedi; Northern Sotho", "pedi; sepedi; sotho du Nord"],
350
- self["nub", "", "", "Nubian languages", "nubiennes, langues"],
351
- self["nwc", "", "", "Classical Newari; Old Newari; Classical Nepal Bhasa", "newari classique"],
352
- self["nya", "", "ny", "Chichewa; Chewa; Nyanja", "chichewa; chewa; nyanja"],
353
- self["nym", "", "", "Nyamwezi", "nyamwezi"],
354
- self["nyn", "", "", "Nyankole", "nyankolé"],
355
- self["nyo", "", "", "Nyoro", "nyoro"],
356
- self["nzi", "", "", "Nzima", "nzema"],
357
- self["oci", "", "oc", "Occitan (post 1500); Provençal", "occitan (après 1500); provençal"],
358
- self["oji", "", "oj", "Ojibwa", "ojibwa"],
359
- self["ori", "", "or", "Oriya", "oriya"],
360
- self["orm", "", "om", "Oromo", "galla"],
361
- self["osa", "", "", "Osage", "osage"],
362
- self["oss", "", "os", "Ossetian; Ossetic", "ossète"],
363
- self["ota", "", "", "Turkish, Ottoman (1500-1928)", "turc ottoman (1500-1928)"],
364
- self["oto", "", "", "Otomian languages", "otomi, langues"],
365
- self["paa", "", "", "Papuan languages", "papoues, langues"],
366
- self["pag", "", "", "Pangasinan", "pangasinan"],
367
- self["pal", "", "", "Pahlavi", "pahlavi"],
368
- self["pam", "", "", "Pampanga; Kapampangan", "pampangan"],
369
- self["pan", "", "pa", "Panjabi; Punjabi", "pendjabi"],
370
- self["pap", "", "", "Papiamento", "papiamento"],
371
- self["pau", "", "", "Palauan", "palau"],
372
- self["peo", "", "", "Persian, Old (ca.600-400 B.C.)", "perse, vieux (ca. 600-400 av. J.-C.)"],
373
- self["per", "fas", "fa", "Persian", "persan"],
374
- self["phi", "", "", "Philippine languages", "philippines, langues"],
375
- self["phn", "", "", "Phoenician", "phénicien"],
376
- self["pli", "", "pi", "Pali", "pali"],
377
- self["pol", "", "pl", "Polish", "polonais"],
378
- self["pon", "", "", "Pohnpeian", "pohnpei"],
379
- self["por", "", "pt", "Portuguese", "portugais"],
380
- self["pra", "", "", "Prakrit languages", "prâkrit, langues"],
381
- self["pro", "", "", "Provençal, Old (to 1500)", "provençal ancien (jusqu'à 1500)"],
382
- self["pus", "", "ps", "Pushto; Pashto", "pachto"],
383
- self["qaa-qtz", "", "", "Reserved for local use", "réservée à l'usage local"],
384
- self["que", "", "qu", "Quechua", "quechua"],
385
- self["raj", "", "", "Rajasthani", "rajasthani"],
386
- self["rap", "", "", "Rapanui", "rapanui"],
387
- self["rar", "", "", "Rarotongan; Cook Islands Maori", "rarotonga; maori des îles Cook"],
388
- self["roa", "", "", "Romance languages", "romanes, langues"],
389
- self["roh", "", "rm", "Romansh", "romanche"],
390
- self["rom", "", "", "Romany", "tsigane"],
391
- self["rum", "ron", "ro", "Romanian; Moldavian; Moldovan", "roumain; moldave"],
392
- self["run", "", "rn", "Rundi", "rundi"],
393
- self["rup", "", "", "Aromanian; Arumanian; Macedo-Romanian", "aroumain; macédo-roumain"],
394
- self["rus", "", "ru", "Russian", "russe"],
395
- self["sad", "", "", "Sandawe", "sandawe"],
396
- self["sag", "", "sg", "Sango", "sango"],
397
- self["sah", "", "", "Yakut", "iakoute"],
398
- self["sai", "", "", "South American Indian (Other)", "indiennes d'Amérique du Sud, autres langues"],
399
- self["sal", "", "", "Salishan languages", "salishennes, langues"],
400
- self["sam", "", "", "Samaritan Aramaic", "samaritain"],
401
- self["san", "", "sa", "Sanskrit", "sanskrit"],
402
- self["sas", "", "", "Sasak", "sasak"],
403
- self["sat", "", "", "Santali", "santal"],
404
- self["scn", "", "", "Sicilian", "sicilien"],
405
- self["sco", "", "", "Scots", "écossais"],
406
- self["sel", "", "", "Selkup", "selkoupe"],
407
- self["sem", "", "", "Semitic languages", "sémitiques, langues"],
408
- self["sga", "", "", "Irish, Old (to 900)", "irlandais ancien (jusqu'à 900)"],
409
- self["sgn", "", "", "Sign Languages", "langues des signes"],
410
- self["shn", "", "", "Shan", "chan"],
411
- self["sid", "", "", "Sidamo", "sidamo"],
412
- self["sin", "", "si", "Sinhala; Sinhalese", "singhalais"],
413
- self["sio", "", "", "Siouan languages", "sioux, langues"],
414
- self["sit", "", "", "Sino-Tibetan languages", "sino-tibétaines, langues"],
415
- self["sla", "", "", "Slavic languages", "slaves, langues"],
416
- self["slo", "slk", "sk", "Slovak", "slovaque"],
417
- self["slv", "", "sl", "Slovenian", "slovène"],
418
- self["sma", "", "", "Southern Sami", "sami du Sud"],
419
- self["sme", "", "se", "Northern Sami", "sami du Nord"],
420
- self["smi", "", "", "Sami languages", "sames, langues"],
421
- self["smj", "", "", "Lule Sami", "sami de Lule"],
422
- self["smn", "", "", "Inari Sami", "sami d'Inari"],
423
- self["smo", "", "sm", "Samoan", "samoan"],
424
- self["sms", "", "", "Skolt Sami", "sami skolt"],
425
- self["sna", "", "sn", "Shona", "shona"],
426
- self["snd", "", "sd", "Sindhi", "sindhi"],
427
- self["snk", "", "", "Soninke", "soninké"],
428
- self["sog", "", "", "Sogdian", "sogdien"],
429
- self["som", "", "so", "Somali", "somali"],
430
- self["son", "", "", "Songhai languages", "songhai, langues"],
431
- self["sot", "", "st", "Sotho, Southern", "sotho du Sud"],
432
- self["spa", "", "es", "Spanish; Castilian", "espagnol; castillan"],
433
- self["srd", "", "sc", "Sardinian", "sarde"],
434
- self["srn", "", "", "Sranan Tongo", "sranan tongo"],
435
- self["srp", "", "sr", "Serbian", "serbe"],
436
- self["srr", "", "", "Serer", "sérère"],
437
- self["ssa", "", "", "Nilo-Saharan languages", "nilo-sahariennes, langues"],
438
- self["ssw", "", "ss", "Swati", "swati"],
439
- self["suk", "", "", "Sukuma", "sukuma"],
440
- self["sun", "", "su", "Sundanese", "soundanais"],
441
- self["sus", "", "", "Susu", "soussou"],
442
- self["sux", "", "", "Sumerian", "sumérien"],
443
- self["swa", "", "sw", "Swahili", "swahili"],
444
- self["swe", "", "sv", "Swedish", "suédois"],
445
- self["syc", "", "", "Classical Syriac", "syriaque classique"],
446
- self["syr", "", "", "Syriac", "syriaque"],
447
- self["tah", "", "ty", "Tahitian", "tahitien"],
448
- self["tai", "", "", "Tai languages", "tai, langues"],
449
- self["tam", "", "ta", "Tamil", "tamoul"],
450
- self["tat", "", "tt", "Tatar", "tatar"],
451
- self["tel", "", "te", "Telugu", "télougou"],
452
- self["tem", "", "", "Timne", "temne"],
453
- self["ter", "", "", "Tereno", "tereno"],
454
- self["tet", "", "", "Tetum", "tetum"],
455
- self["tgk", "", "tg", "Tajik", "tadjik"],
456
- self["tgl", "", "tl", "Tagalog", "tagalog"],
457
- self["tha", "", "th", "Thai", "thaï"],
458
- self["tib", "bod", "bo", "Tibetan", "tibétain"],
459
- self["tig", "", "", "Tigre", "tigré"],
460
- self["tir", "", "ti", "Tigrinya", "tigrigna"],
461
- self["tiv", "", "", "Tiv", "tiv"],
462
- self["tkl", "", "", "Tokelau", "tokelau"],
463
- self["tlh", "", "", "Klingon; tlhIngan-Hol", "klingon"],
464
- self["tli", "", "", "Tlingit", "tlingit"],
465
- self["tmh", "", "", "Tamashek", "tamacheq"],
466
- self["tog", "", "", "Tonga (Nyasa)", "tonga (Nyasa)"],
467
- self["ton", "", "to", "Tonga (Tonga Islands)", "tongan (Îles Tonga)"],
468
- self["tpi", "", "", "Tok Pisin", "tok pisin"],
469
- self["tsi", "", "", "Tsimshian", "tsimshian"],
470
- self["tsn", "", "tn", "Tswana", "tswana"],
471
- self["tso", "", "ts", "Tsonga", "tsonga"],
472
- self["tuk", "", "tk", "Turkmen", "turkmène"],
473
- self["tum", "", "", "Tumbuka", "tumbuka"],
474
- self["tup", "", "", "Tupi languages", "tupi, langues"],
475
- self["tur", "", "tr", "Turkish", "turc"],
476
- self["tut", "", "", "Altaic languages", "altaïques, langues"],
477
- self["tvl", "", "", "Tuvalu", "tuvalu"],
478
- self["twi", "", "tw", "Twi", "twi"],
479
- self["tyv", "", "", "Tuvinian", "touva"],
480
- self["udm", "", "", "Udmurt", "oudmourte"],
481
- self["uga", "", "", "Ugaritic", "ougaritique"],
482
- self["uig", "", "ug", "Uighur; Uyghur", "ouïgour"],
483
- self["ukr", "", "uk", "Ukrainian", "ukrainien"],
484
- self["umb", "", "", "Umbundu", "umbundu"],
485
- self["und", "", "", "Undetermined", "indéterminée"],
486
- self["urd", "", "ur", "Urdu", "ourdou"],
487
- self["uzb", "", "uz", "Uzbek", "ouszbek"],
488
- self["vai", "", "", "Vai", "vaï"],
489
- self["ven", "", "ve", "Venda", "venda"],
490
- self["vie", "", "vi", "Vietnamese", "vietnamien"],
491
- self["vol", "", "vo", "Volapük", "volapük"],
492
- self["vot", "", "", "Votic", "vote"],
493
- self["wak", "", "", "Wakashan languages", "wakashanes, langues"],
494
- self["wal", "", "", "Walamo", "walamo"],
495
- self["war", "", "", "Waray", "waray"],
496
- self["was", "", "", "Washo", "washo"],
497
- self["wel", "cym", "cy", "Welsh", "gallois"],
498
- self["wen", "", "", "Sorbian languages", "sorabes, langues"],
499
- self["wln", "", "wa", "Walloon", "wallon"],
500
- self["wol", "", "wo", "Wolof", "wolof"],
501
- self["xal", "", "", "Kalmyk; Oirat", "kalmouk; oïrat"],
502
- self["xho", "", "xh", "Xhosa", "xhosa"],
503
- self["yao", "", "", "Yao", "yao"],
504
- self["yap", "", "", "Yapese", "yapois"],
505
- self["yid", "", "yi", "Yiddish", "yiddish"],
506
- self["yor", "", "yo", "Yoruba", "yoruba"],
507
- self["ypk", "", "", "Yupik languages", "yupik, langues"],
508
- self["zap", "", "", "Zapotec", "zapotèque"],
509
- self["zbl", "", "", "Blissymbols; Blissymbolics; Bliss", "symboles Bliss; Bliss"],
510
- self["zen", "", "", "Zenaga", "zenaga"],
511
- self["zha", "", "za", "Zhuang; Chuang", "zhuang; chuang"],
512
- self["znd", "", "", "Zande languages", "zandé, langues"],
513
- self["zul", "", "zu", "Zulu", "zoulou"],
514
- self["zun", "", "", "Zuni", "zuni"],
515
- self["zxx", "", "", "No linguistic content; Not applicable", "pas de contenu linguistique; non applicable"],
516
- self["zza", "", "", "Zaza; Dimili; Dimli; Kirdki; Kirmanjki; Zazaki", "zaza; dimili; dimli; kirdki; kirmanjki; zazaki"]
517
- ].freeze
13
+ #
14
+ # Dataset Source:
15
+ # https://www.loc.gov/standards/iso639-2/ascii_8bits.html
16
+ # https://www.loc.gov/standards/iso639-2/ISO-639-2_utf-8.txt
17
+ ISO_639_2 = lambda do
18
+ dataset = []
19
+ CSV.foreach(
20
+ File.join(File.dirname(__FILE__), 'data', 'ISO-639-2_utf-8.txt'),
21
+ **{ col_sep: "|",
22
+ converters: ->(v) { v || '' },
23
+ encoding: 'bom|utf-8' }
24
+ ).each do |row|
25
+ dataset << self[*row].freeze
26
+ end
27
+ return dataset
28
+ end.call.freeze
518
29
 
519
30
  # An inverted index generated from the ISO_639_2 data. Used for searching
520
31
  # all words and codes in all fields.
data/test/test_iso_639.rb CHANGED
@@ -4,7 +4,7 @@ require 'helper'
4
4
 
5
5
  describe ISO_639 do
6
6
  it 'should have full code list in ISO_639_2' do
7
- assert_equal 485, ISO_639::ISO_639_2.length
7
+ assert_equal 487, ISO_639::ISO_639_2.length
8
8
  end
9
9
 
10
10
  it 'should have shorter code list in ISO_639_1' do
metadata CHANGED
@@ -1,14 +1,14 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: iso-639
3
3
  version: !ruby/object:Gem::Version
4
- version: 0.2.10
4
+ version: 0.3.1
5
5
  platform: ruby
6
6
  authors:
7
7
  - William Melody
8
8
  autorequire:
9
9
  bindir: bin
10
10
  cert_chain: []
11
- date: 2020-03-01 00:00:00.000000000 Z
11
+ date: 2020-03-02 00:00:00.000000000 Z
12
12
  dependencies:
13
13
  - !ruby/object:Gem::Dependency
14
14
  name: minitest
@@ -125,6 +125,7 @@ files:
125
125
  - README.md
126
126
  - Rakefile
127
127
  - iso-639.gemspec
128
+ - lib/data/ISO-639-2_utf-8.txt
128
129
  - lib/iso-639.rb
129
130
  - test/helper.rb
130
131
  - test/test_iso_639.rb
@@ -140,7 +141,7 @@ required_ruby_version: !ruby/object:Gem::Requirement
140
141
  requirements:
141
142
  - - ">="
142
143
  - !ruby/object:Gem::Version
143
- version: '0'
144
+ version: '2.3'
144
145
  required_rubygems_version: !ruby/object:Gem::Requirement
145
146
  requirements:
146
147
  - - ">="