iso-639 0.2.10 → 0.3.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA256:
3
- metadata.gz: da2f2ce60e4acc74618b01f7c2f22e12fd8c86b7a7b6e5e254ae0667cc6c2b7b
4
- data.tar.gz: f5d18fadc8b2aa67847f49f00dfb0354de15ef00c9ec98fafe9721ceb87dec62
3
+ metadata.gz: 814587429390abbe6fb28f55a2ee74b07d65c17e845b369f33a9dab981daef11
4
+ data.tar.gz: aeab1e9162ec0eb34614bbfddd50edf57447ec5905110a2240011119241016af
5
5
  SHA512:
6
- metadata.gz: 5b16c4ae94be5045d5f0334c971cd26f80d81bac61a74339f39e9101e312dad234956136504550b1257a3ac06c9bb708844016c52ac8c33fb3ab9da1c4b97c22
7
- data.tar.gz: 381eb1d06c4eadbeea18ce22fbd71aa3b1a81ed7f7200016e551b7e814570622bbd1bf92194f9150c470eece0e5780f637898963b432ecd79cbeb4e2b4ec88d2
6
+ metadata.gz: 5dce38567522e0a329821cc433518c8a7f20b680c5fe22d3fec488e7cdc007f0bb4e8c6a58153ef07a53a85b8c897d531db591d2fb045363981688a481ad482f
7
+ data.tar.gz: 24cd30d637416bb970c3df0c1595aa0879c60f8329d7ed7f0c467f81ced221d5b88f9af1405007e996b7434433bd0cc14267d09a9d20331f1849a00e4cc30462
data/iso-639.gemspec CHANGED
@@ -2,13 +2,13 @@
2
2
 
3
3
  Gem::Specification.new do |s|
4
4
  s.name = 'iso-639'
5
- s.version = '0.2.10'
5
+ s.version = '0.3.1'
6
6
  s.licenses = ['MIT']
7
7
  s.summary = 'ISO 639-1 and ISO 639-2 language code entries and convenience methods'
8
8
  s.description = 'ISO 639-1 and ISO 639-2 language code entries and convenience methods'
9
9
  s.authors = ['William Melody']
10
10
  s.email = 'hi@williammelody.com'
11
- s.date = '2020-03-01'
11
+ s.date = '2020-03-02'
12
12
  s.extra_rdoc_files = [
13
13
  'LICENSE',
14
14
  'README.md'
@@ -21,6 +21,7 @@ Gem::Specification.new do |s|
21
21
  'README.md',
22
22
  'Rakefile',
23
23
  'iso-639.gemspec',
24
+ 'lib/data/ISO-639-2_utf-8.txt',
24
25
  'lib/iso-639.rb',
25
26
  'test/helper.rb',
26
27
  'test/test_iso_639.rb'
@@ -32,4 +33,5 @@ Gem::Specification.new do |s|
32
33
  s.add_development_dependency('rdoc', '~> 6', '>= 0')
33
34
  s.add_development_dependency('rubocop', '~> 0', '>= 0.49.0')
34
35
  s.add_development_dependency('test-unit', '~> 3', '>= 0')
36
+ s.required_ruby_version = '>= 2.3'
35
37
  end
@@ -0,0 +1,487 @@
1
+ aar||aa|Afar|afar
2
+ abk||ab|Abkhazian|abkhaze
3
+ ace|||Achinese|aceh
4
+ ach|||Acoli|acoli
5
+ ada|||Adangme|adangme
6
+ ady|||Adyghe; Adygei|adyghé
7
+ afa|||Afro-Asiatic languages|afro-asiatiques, langues
8
+ afh|||Afrihili|afrihili
9
+ afr||af|Afrikaans|afrikaans
10
+ ain|||Ainu|aïnou
11
+ aka||ak|Akan|akan
12
+ akk|||Akkadian|akkadien
13
+ alb|sqi|sq|Albanian|albanais
14
+ ale|||Aleut|aléoute
15
+ alg|||Algonquian languages|algonquines, langues
16
+ alt|||Southern Altai|altai du Sud
17
+ amh||am|Amharic|amharique
18
+ ang|||English, Old (ca.450-1100)|anglo-saxon (ca.450-1100)
19
+ anp|||Angika|angika
20
+ apa|||Apache languages|apaches, langues
21
+ ara||ar|Arabic|arabe
22
+ arc|||Official Aramaic (700-300 BCE); Imperial Aramaic (700-300 BCE)|araméen d'empire (700-300 BCE)
23
+ arg||an|Aragonese|aragonais
24
+ arm|hye|hy|Armenian|arménien
25
+ arn|||Mapudungun; Mapuche|mapudungun; mapuche; mapuce
26
+ arp|||Arapaho|arapaho
27
+ art|||Artificial languages|artificielles, langues
28
+ arw|||Arawak|arawak
29
+ asm||as|Assamese|assamais
30
+ ast|||Asturian; Bable; Leonese; Asturleonese|asturien; bable; léonais; asturoléonais
31
+ ath|||Athapascan languages|athapascanes, langues
32
+ aus|||Australian languages|australiennes, langues
33
+ ava||av|Avaric|avar
34
+ ave||ae|Avestan|avestique
35
+ awa|||Awadhi|awadhi
36
+ aym||ay|Aymara|aymara
37
+ aze||az|Azerbaijani|azéri
38
+ bad|||Banda languages|banda, langues
39
+ bai|||Bamileke languages|bamiléké, langues
40
+ bak||ba|Bashkir|bachkir
41
+ bal|||Baluchi|baloutchi
42
+ bam||bm|Bambara|bambara
43
+ ban|||Balinese|balinais
44
+ baq|eus|eu|Basque|basque
45
+ bas|||Basa|basa
46
+ bat|||Baltic languages|baltes, langues
47
+ bej|||Beja; Bedawiyet|bedja
48
+ bel||be|Belarusian|biélorusse
49
+ bem|||Bemba|bemba
50
+ ben||bn|Bengali|bengali
51
+ ber|||Berber languages|berbères, langues
52
+ bho|||Bhojpuri|bhojpuri
53
+ bih||bh|Bihari languages|langues biharis
54
+ bik|||Bikol|bikol
55
+ bin|||Bini; Edo|bini; edo
56
+ bis||bi|Bislama|bichlamar
57
+ bla|||Siksika|blackfoot
58
+ bnt|||Bantu languages|bantou, langues
59
+ bos||bs|Bosnian|bosniaque
60
+ bra|||Braj|braj
61
+ bre||br|Breton|breton
62
+ btk|||Batak languages|batak, langues
63
+ bua|||Buriat|bouriate
64
+ bug|||Buginese|bugi
65
+ bul||bg|Bulgarian|bulgare
66
+ bur|mya|my|Burmese|birman
67
+ byn|||Blin; Bilin|blin; bilen
68
+ cad|||Caddo|caddo
69
+ cai|||Central American Indian languages|amérindiennes de L'Amérique centrale, langues
70
+ car|||Galibi Carib|karib; galibi; carib
71
+ cat||ca|Catalan; Valencian|catalan; valencien
72
+ cau|||Caucasian languages|caucasiennes, langues
73
+ ceb|||Cebuano|cebuano
74
+ cel|||Celtic languages|celtiques, langues; celtes, langues
75
+ cha||ch|Chamorro|chamorro
76
+ chb|||Chibcha|chibcha
77
+ che||ce|Chechen|tchétchène
78
+ chg|||Chagatai|djaghataï
79
+ chi|zho|zh|Chinese|chinois
80
+ chk|||Chuukese|chuuk
81
+ chm|||Mari|mari
82
+ chn|||Chinook jargon|chinook, jargon
83
+ cho|||Choctaw|choctaw
84
+ chp|||Chipewyan; Dene Suline|chipewyan
85
+ chr|||Cherokee|cherokee
86
+ chu||cu|Church Slavic; Old Slavonic; Church Slavonic; Old Bulgarian; Old Church Slavonic|slavon d'église; vieux slave; slavon liturgique; vieux bulgare
87
+ chv||cv|Chuvash|tchouvache
88
+ chy|||Cheyenne|cheyenne
89
+ cmc|||Chamic languages|chames, langues
90
+ cnr|||Montenegrin|monténégrin
91
+ cop|||Coptic|copte
92
+ cor||kw|Cornish|cornique
93
+ cos||co|Corsican|corse
94
+ cpe|||Creoles and pidgins, English based|créoles et pidgins basés sur l'anglais
95
+ cpf|||Creoles and pidgins, French-based|créoles et pidgins basés sur le français
96
+ cpp|||Creoles and pidgins, Portuguese-based|créoles et pidgins basés sur le portugais
97
+ cre||cr|Cree|cree
98
+ crh|||Crimean Tatar; Crimean Turkish|tatar de Crimé
99
+ crp|||Creoles and pidgins|créoles et pidgins
100
+ csb|||Kashubian|kachoube
101
+ cus|||Cushitic languages|couchitiques, langues
102
+ cze|ces|cs|Czech|tchèque
103
+ dak|||Dakota|dakota
104
+ dan||da|Danish|danois
105
+ dar|||Dargwa|dargwa
106
+ day|||Land Dayak languages|dayak, langues
107
+ del|||Delaware|delaware
108
+ den|||Slave (Athapascan)|esclave (athapascan)
109
+ dgr|||Dogrib|dogrib
110
+ din|||Dinka|dinka
111
+ div||dv|Divehi; Dhivehi; Maldivian|maldivien
112
+ doi|||Dogri|dogri
113
+ dra|||Dravidian languages|dravidiennes, langues
114
+ dsb|||Lower Sorbian|bas-sorabe
115
+ dua|||Duala|douala
116
+ dum|||Dutch, Middle (ca.1050-1350)|néerlandais moyen (ca. 1050-1350)
117
+ dut|nld|nl|Dutch; Flemish|néerlandais; flamand
118
+ dyu|||Dyula|dioula
119
+ dzo||dz|Dzongkha|dzongkha
120
+ efi|||Efik|efik
121
+ egy|||Egyptian (Ancient)|égyptien
122
+ eka|||Ekajuk|ekajuk
123
+ elx|||Elamite|élamite
124
+ eng||en|English|anglais
125
+ enm|||English, Middle (1100-1500)|anglais moyen (1100-1500)
126
+ epo||eo|Esperanto|espéranto
127
+ est||et|Estonian|estonien
128
+ ewe||ee|Ewe|éwé
129
+ ewo|||Ewondo|éwondo
130
+ fan|||Fang|fang
131
+ fao||fo|Faroese|féroïen
132
+ fat|||Fanti|fanti
133
+ fij||fj|Fijian|fidjien
134
+ fil|||Filipino; Pilipino|filipino; pilipino
135
+ fin||fi|Finnish|finnois
136
+ fiu|||Finno-Ugrian languages|finno-ougriennes, langues
137
+ fon|||Fon|fon
138
+ fre|fra|fr|French|français
139
+ frm|||French, Middle (ca.1400-1600)|français moyen (1400-1600)
140
+ fro|||French, Old (842-ca.1400)|français ancien (842-ca.1400)
141
+ frr|||Northern Frisian|frison septentrional
142
+ frs|||Eastern Frisian|frison oriental
143
+ fry||fy|Western Frisian|frison occidental
144
+ ful||ff|Fulah|peul
145
+ fur|||Friulian|frioulan
146
+ gaa|||Ga|ga
147
+ gay|||Gayo|gayo
148
+ gba|||Gbaya|gbaya
149
+ gem|||Germanic languages|germaniques, langues
150
+ geo|kat|ka|Georgian|géorgien
151
+ ger|deu|de|German|allemand
152
+ gez|||Geez|guèze
153
+ gil|||Gilbertese|kiribati
154
+ gla||gd|Gaelic; Scottish Gaelic|gaélique; gaélique écossais
155
+ gle||ga|Irish|irlandais
156
+ glg||gl|Galician|galicien
157
+ glv||gv|Manx|manx; mannois
158
+ gmh|||German, Middle High (ca.1050-1500)|allemand, moyen haut (ca. 1050-1500)
159
+ goh|||German, Old High (ca.750-1050)|allemand, vieux haut (ca. 750-1050)
160
+ gon|||Gondi|gond
161
+ gor|||Gorontalo|gorontalo
162
+ got|||Gothic|gothique
163
+ grb|||Grebo|grebo
164
+ grc|||Greek, Ancient (to 1453)|grec ancien (jusqu'à 1453)
165
+ gre|ell|el|Greek, Modern (1453-)|grec moderne (après 1453)
166
+ grn||gn|Guarani|guarani
167
+ gsw|||Swiss German; Alemannic; Alsatian|suisse alémanique; alémanique; alsacien
168
+ guj||gu|Gujarati|goudjrati
169
+ gwi|||Gwich'in|gwich'in
170
+ hai|||Haida|haida
171
+ hat||ht|Haitian; Haitian Creole|haïtien; créole haïtien
172
+ hau||ha|Hausa|haoussa
173
+ haw|||Hawaiian|hawaïen
174
+ heb||he|Hebrew|hébreu
175
+ her||hz|Herero|herero
176
+ hil|||Hiligaynon|hiligaynon
177
+ him|||Himachali languages; Western Pahari languages|langues himachalis; langues paharis occidentales
178
+ hin||hi|Hindi|hindi
179
+ hit|||Hittite|hittite
180
+ hmn|||Hmong; Mong|hmong
181
+ hmo||ho|Hiri Motu|hiri motu
182
+ hrv||hr|Croatian|croate
183
+ hsb|||Upper Sorbian|haut-sorabe
184
+ hun||hu|Hungarian|hongrois
185
+ hup|||Hupa|hupa
186
+ iba|||Iban|iban
187
+ ibo||ig|Igbo|igbo
188
+ ice|isl|is|Icelandic|islandais
189
+ ido||io|Ido|ido
190
+ iii||ii|Sichuan Yi; Nuosu|yi de Sichuan
191
+ ijo|||Ijo languages|ijo, langues
192
+ iku||iu|Inuktitut|inuktitut
193
+ ile||ie|Interlingue; Occidental|interlingue
194
+ ilo|||Iloko|ilocano
195
+ ina||ia|Interlingua (International Auxiliary Language Association)|interlingua (langue auxiliaire internationale)
196
+ inc|||Indic languages|indo-aryennes, langues
197
+ ind||id|Indonesian|indonésien
198
+ ine|||Indo-European languages|indo-européennes, langues
199
+ inh|||Ingush|ingouche
200
+ ipk||ik|Inupiaq|inupiaq
201
+ ira|||Iranian languages|iraniennes, langues
202
+ iro|||Iroquoian languages|iroquoises, langues
203
+ ita||it|Italian|italien
204
+ jav||jv|Javanese|javanais
205
+ jbo|||Lojban|lojban
206
+ jpn||ja|Japanese|japonais
207
+ jpr|||Judeo-Persian|judéo-persan
208
+ jrb|||Judeo-Arabic|judéo-arabe
209
+ kaa|||Kara-Kalpak|karakalpak
210
+ kab|||Kabyle|kabyle
211
+ kac|||Kachin; Jingpho|kachin; jingpho
212
+ kal||kl|Kalaallisut; Greenlandic|groenlandais
213
+ kam|||Kamba|kamba
214
+ kan||kn|Kannada|kannada
215
+ kar|||Karen languages|karen, langues
216
+ kas||ks|Kashmiri|kashmiri
217
+ kau||kr|Kanuri|kanouri
218
+ kaw|||Kawi|kawi
219
+ kaz||kk|Kazakh|kazakh
220
+ kbd|||Kabardian|kabardien
221
+ kha|||Khasi|khasi
222
+ khi|||Khoisan languages|khoïsan, langues
223
+ khm||km|Central Khmer|khmer central
224
+ kho|||Khotanese; Sakan|khotanais; sakan
225
+ kik||ki|Kikuyu; Gikuyu|kikuyu
226
+ kin||rw|Kinyarwanda|rwanda
227
+ kir||ky|Kirghiz; Kyrgyz|kirghiz
228
+ kmb|||Kimbundu|kimbundu
229
+ kok|||Konkani|konkani
230
+ kom||kv|Komi|kom
231
+ kon||kg|Kongo|kongo
232
+ kor||ko|Korean|coréen
233
+ kos|||Kosraean|kosrae
234
+ kpe|||Kpelle|kpellé
235
+ krc|||Karachay-Balkar|karatchai balkar
236
+ krl|||Karelian|carélien
237
+ kro|||Kru languages|krou, langues
238
+ kru|||Kurukh|kurukh
239
+ kua||kj|Kuanyama; Kwanyama|kuanyama; kwanyama
240
+ kum|||Kumyk|koumyk
241
+ kur||ku|Kurdish|kurde
242
+ kut|||Kutenai|kutenai
243
+ lad|||Ladino|judéo-espagnol
244
+ lah|||Lahnda|lahnda
245
+ lam|||Lamba|lamba
246
+ lao||lo|Lao|lao
247
+ lat||la|Latin|latin
248
+ lav||lv|Latvian|letton
249
+ lez|||Lezghian|lezghien
250
+ lim||li|Limburgan; Limburger; Limburgish|limbourgeois
251
+ lin||ln|Lingala|lingala
252
+ lit||lt|Lithuanian|lituanien
253
+ lol|||Mongo|mongo
254
+ loz|||Lozi|lozi
255
+ ltz||lb|Luxembourgish; Letzeburgesch|luxembourgeois
256
+ lua|||Luba-Lulua|luba-lulua
257
+ lub||lu|Luba-Katanga|luba-katanga
258
+ lug||lg|Ganda|ganda
259
+ lui|||Luiseno|luiseno
260
+ lun|||Lunda|lunda
261
+ luo|||Luo (Kenya and Tanzania)|luo (Kenya et Tanzanie)
262
+ lus|||Lushai|lushai
263
+ mac|mkd|mk|Macedonian|macédonien
264
+ mad|||Madurese|madourais
265
+ mag|||Magahi|magahi
266
+ mah||mh|Marshallese|marshall
267
+ mai|||Maithili|maithili
268
+ mak|||Makasar|makassar
269
+ mal||ml|Malayalam|malayalam
270
+ man|||Mandingo|mandingue
271
+ mao|mri|mi|Maori|maori
272
+ map|||Austronesian languages|austronésiennes, langues
273
+ mar||mr|Marathi|marathe
274
+ mas|||Masai|massaï
275
+ may|msa|ms|Malay|malais
276
+ mdf|||Moksha|moksa
277
+ mdr|||Mandar|mandar
278
+ men|||Mende|mendé
279
+ mga|||Irish, Middle (900-1200)|irlandais moyen (900-1200)
280
+ mic|||Mi'kmaq; Micmac|mi'kmaq; micmac
281
+ min|||Minangkabau|minangkabau
282
+ mis|||Uncoded languages|langues non codées
283
+ mkh|||Mon-Khmer languages|môn-khmer, langues
284
+ mlg||mg|Malagasy|malgache
285
+ mlt||mt|Maltese|maltais
286
+ mnc|||Manchu|mandchou
287
+ mni|||Manipuri|manipuri
288
+ mno|||Manobo languages|manobo, langues
289
+ moh|||Mohawk|mohawk
290
+ mon||mn|Mongolian|mongol
291
+ mos|||Mossi|moré
292
+ mul|||Multiple languages|multilingue
293
+ mun|||Munda languages|mounda, langues
294
+ mus|||Creek|muskogee
295
+ mwl|||Mirandese|mirandais
296
+ mwr|||Marwari|marvari
297
+ myn|||Mayan languages|maya, langues
298
+ myv|||Erzya|erza
299
+ nah|||Nahuatl languages|nahuatl, langues
300
+ nai|||North American Indian languages|nord-amérindiennes, langues
301
+ nap|||Neapolitan|napolitain
302
+ nau||na|Nauru|nauruan
303
+ nav||nv|Navajo; Navaho|navaho
304
+ nbl||nr|Ndebele, South; South Ndebele|ndébélé du Sud
305
+ nde||nd|Ndebele, North; North Ndebele|ndébélé du Nord
306
+ ndo||ng|Ndonga|ndonga
307
+ nds|||Low German; Low Saxon; German, Low; Saxon, Low|bas allemand; bas saxon; allemand, bas; saxon, bas
308
+ nep||ne|Nepali|népalais
309
+ new|||Nepal Bhasa; Newari|nepal bhasa; newari
310
+ nia|||Nias|nias
311
+ nic|||Niger-Kordofanian languages|nigéro-kordofaniennes, langues
312
+ niu|||Niuean|niué
313
+ nno||nn|Norwegian Nynorsk; Nynorsk, Norwegian|norvégien nynorsk; nynorsk, norvégien
314
+ nob||nb|Bokmål, Norwegian; Norwegian Bokmål|norvégien bokmål
315
+ nog|||Nogai|nogaï; nogay
316
+ non|||Norse, Old|norrois, vieux
317
+ nor||no|Norwegian|norvégien
318
+ nqo|||N'Ko|n'ko
319
+ nso|||Pedi; Sepedi; Northern Sotho|pedi; sepedi; sotho du Nord
320
+ nub|||Nubian languages|nubiennes, langues
321
+ nwc|||Classical Newari; Old Newari; Classical Nepal Bhasa|newari classique
322
+ nya||ny|Chichewa; Chewa; Nyanja|chichewa; chewa; nyanja
323
+ nym|||Nyamwezi|nyamwezi
324
+ nyn|||Nyankole|nyankolé
325
+ nyo|||Nyoro|nyoro
326
+ nzi|||Nzima|nzema
327
+ oci||oc|Occitan (post 1500)|occitan (après 1500)
328
+ oji||oj|Ojibwa|ojibwa
329
+ ori||or|Oriya|oriya
330
+ orm||om|Oromo|galla
331
+ osa|||Osage|osage
332
+ oss||os|Ossetian; Ossetic|ossète
333
+ ota|||Turkish, Ottoman (1500-1928)|turc ottoman (1500-1928)
334
+ oto|||Otomian languages|otomi, langues
335
+ paa|||Papuan languages|papoues, langues
336
+ pag|||Pangasinan|pangasinan
337
+ pal|||Pahlavi|pahlavi
338
+ pam|||Pampanga; Kapampangan|pampangan
339
+ pan||pa|Panjabi; Punjabi|pendjabi
340
+ pap|||Papiamento|papiamento
341
+ pau|||Palauan|palau
342
+ peo|||Persian, Old (ca.600-400 B.C.)|perse, vieux (ca. 600-400 av. J.-C.)
343
+ per|fas|fa|Persian|persan
344
+ phi|||Philippine languages|philippines, langues
345
+ phn|||Phoenician|phénicien
346
+ pli||pi|Pali|pali
347
+ pol||pl|Polish|polonais
348
+ pon|||Pohnpeian|pohnpei
349
+ por||pt|Portuguese|portugais
350
+ pra|||Prakrit languages|prâkrit, langues
351
+ pro|||Provençal, Old (to 1500); Occitan, Old (to 1500)|provençal ancien (jusqu'à 1500); occitan ancien (jusqu'à 1500)
352
+ pus||ps|Pushto; Pashto|pachto
353
+ qaa-qtz|||Reserved for local use|réservée à l'usage local
354
+ que||qu|Quechua|quechua
355
+ raj|||Rajasthani|rajasthani
356
+ rap|||Rapanui|rapanui
357
+ rar|||Rarotongan; Cook Islands Maori|rarotonga; maori des îles Cook
358
+ roa|||Romance languages|romanes, langues
359
+ roh||rm|Romansh|romanche
360
+ rom|||Romany|tsigane
361
+ rum|ron|ro|Romanian; Moldavian; Moldovan|roumain; moldave
362
+ run||rn|Rundi|rundi
363
+ rup|||Aromanian; Arumanian; Macedo-Romanian|aroumain; macédo-roumain
364
+ rus||ru|Russian|russe
365
+ sad|||Sandawe|sandawe
366
+ sag||sg|Sango|sango
367
+ sah|||Yakut|iakoute
368
+ sai|||South American Indian languages|sud-amérindiennes, langues
369
+ sal|||Salishan languages|salishennes, langues
370
+ sam|||Samaritan Aramaic|samaritain
371
+ san||sa|Sanskrit|sanskrit
372
+ sas|||Sasak|sasak
373
+ sat|||Santali|santal
374
+ scn|||Sicilian|sicilien
375
+ sco|||Scots|écossais
376
+ sel|||Selkup|selkoupe
377
+ sem|||Semitic languages|sémitiques, langues
378
+ sga|||Irish, Old (to 900)|irlandais ancien (jusqu'à 900)
379
+ sgn|||Sign Languages|langues des signes
380
+ shn|||Shan|chan
381
+ sid|||Sidamo|sidamo
382
+ sin||si|Sinhala; Sinhalese|singhalais
383
+ sio|||Siouan languages|sioux, langues
384
+ sit|||Sino-Tibetan languages|sino-tibétaines, langues
385
+ sla|||Slavic languages|slaves, langues
386
+ slo|slk|sk|Slovak|slovaque
387
+ slv||sl|Slovenian|slovène
388
+ sma|||Southern Sami|sami du Sud
389
+ sme||se|Northern Sami|sami du Nord
390
+ smi|||Sami languages|sames, langues
391
+ smj|||Lule Sami|sami de Lule
392
+ smn|||Inari Sami|sami d'Inari
393
+ smo||sm|Samoan|samoan
394
+ sms|||Skolt Sami|sami skolt
395
+ sna||sn|Shona|shona
396
+ snd||sd|Sindhi|sindhi
397
+ snk|||Soninke|soninké
398
+ sog|||Sogdian|sogdien
399
+ som||so|Somali|somali
400
+ son|||Songhai languages|songhai, langues
401
+ sot||st|Sotho, Southern|sotho du Sud
402
+ spa||es|Spanish; Castilian|espagnol; castillan
403
+ srd||sc|Sardinian|sarde
404
+ srn|||Sranan Tongo|sranan tongo
405
+ srp||sr|Serbian|serbe
406
+ srr|||Serer|sérère
407
+ ssa|||Nilo-Saharan languages|nilo-sahariennes, langues
408
+ ssw||ss|Swati|swati
409
+ suk|||Sukuma|sukuma
410
+ sun||su|Sundanese|soundanais
411
+ sus|||Susu|soussou
412
+ sux|||Sumerian|sumérien
413
+ swa||sw|Swahili|swahili
414
+ swe||sv|Swedish|suédois
415
+ syc|||Classical Syriac|syriaque classique
416
+ syr|||Syriac|syriaque
417
+ tah||ty|Tahitian|tahitien
418
+ tai|||Tai languages|tai, langues
419
+ tam||ta|Tamil|tamoul
420
+ tat||tt|Tatar|tatar
421
+ tel||te|Telugu|télougou
422
+ tem|||Timne|temne
423
+ ter|||Tereno|tereno
424
+ tet|||Tetum|tetum
425
+ tgk||tg|Tajik|tadjik
426
+ tgl||tl|Tagalog|tagalog
427
+ tha||th|Thai|thaï
428
+ tib|bod|bo|Tibetan|tibétain
429
+ tig|||Tigre|tigré
430
+ tir||ti|Tigrinya|tigrigna
431
+ tiv|||Tiv|tiv
432
+ tkl|||Tokelau|tokelau
433
+ tlh|||Klingon; tlhIngan-Hol|klingon
434
+ tli|||Tlingit|tlingit
435
+ tmh|||Tamashek|tamacheq
436
+ tog|||Tonga (Nyasa)|tonga (Nyasa)
437
+ ton||to|Tonga (Tonga Islands)|tongan (Îles Tonga)
438
+ tpi|||Tok Pisin|tok pisin
439
+ tsi|||Tsimshian|tsimshian
440
+ tsn||tn|Tswana|tswana
441
+ tso||ts|Tsonga|tsonga
442
+ tuk||tk|Turkmen|turkmène
443
+ tum|||Tumbuka|tumbuka
444
+ tup|||Tupi languages|tupi, langues
445
+ tur||tr|Turkish|turc
446
+ tut|||Altaic languages|altaïques, langues
447
+ tvl|||Tuvalu|tuvalu
448
+ twi||tw|Twi|twi
449
+ tyv|||Tuvinian|touva
450
+ udm|||Udmurt|oudmourte
451
+ uga|||Ugaritic|ougaritique
452
+ uig||ug|Uighur; Uyghur|ouïgour
453
+ ukr||uk|Ukrainian|ukrainien
454
+ umb|||Umbundu|umbundu
455
+ und|||Undetermined|indéterminée
456
+ urd||ur|Urdu|ourdou
457
+ uzb||uz|Uzbek|ouszbek
458
+ vai|||Vai|vaï
459
+ ven||ve|Venda|venda
460
+ vie||vi|Vietnamese|vietnamien
461
+ vol||vo|Volapük|volapük
462
+ vot|||Votic|vote
463
+ wak|||Wakashan languages|wakashanes, langues
464
+ wal|||Wolaitta; Wolaytta|wolaitta; wolaytta
465
+ war|||Waray|waray
466
+ was|||Washo|washo
467
+ wel|cym|cy|Welsh|gallois
468
+ wen|||Sorbian languages|sorabes, langues
469
+ wln||wa|Walloon|wallon
470
+ wol||wo|Wolof|wolof
471
+ xal|||Kalmyk; Oirat|kalmouk; oïrat
472
+ xho||xh|Xhosa|xhosa
473
+ yao|||Yao|yao
474
+ yap|||Yapese|yapois
475
+ yid||yi|Yiddish|yiddish
476
+ yor||yo|Yoruba|yoruba
477
+ ypk|||Yupik languages|yupik, langues
478
+ zap|||Zapotec|zapotèque
479
+ zbl|||Blissymbols; Blissymbolics; Bliss|symboles Bliss; Bliss
480
+ zen|||Zenaga|zenaga
481
+ zgh|||Standard Moroccan Tamazight|amazighe standard marocain
482
+ zha||za|Zhuang; Chuang|zhuang; chuang
483
+ znd|||Zande languages|zandé, langues
484
+ zul||zu|Zulu|zoulou
485
+ zun|||Zuni|zuni
486
+ zxx|||No linguistic content; Not applicable|pas de contenu linguistique; non applicable
487
+ zza|||Zaza; Dimili; Dimli; Kirdki; Kirmanjki; Zazaki|zaza; dimili; dimli; kirdki; kirmanjki; zazaki
data/lib/iso-639.rb CHANGED
@@ -1,520 +1,31 @@
1
1
  # frozen_string_literal: true
2
2
 
3
- # http://www.loc.gov/standards/iso639-2/ascii_8bits.html
3
+ require 'csv'
4
4
 
5
5
  class ISO_639 < Array
6
- # Redefine `[]` to freeze all strings and arrays.
7
- #
8
- # Ruby 2.3+ uses the `frozen_string_literal` magic comment to freeze all
9
- # strings, while previous versions require the `#map` approach.
10
- def self.[](a3_bib, a3_term, a2, english_name, french_name)
11
- if a3_bib.frozen? # then Ruby 2.3+
12
- super(a3_bib, a3_term, a2, english_name, french_name).freeze
13
- else
14
- super(
15
- a3_bib.freeze,
16
- a3_term.freeze,
17
- a2.freeze,
18
- english_name.freeze,
19
- french_name.freeze
20
- ).freeze
21
- end
22
- end
23
-
24
- # The ISO 639-2 dataset as an array of entries. Each entry is an array with
25
- # the following format:
6
+ # Load the ISO 639-2 dataset as an array of entries. Each entry is an array
7
+ # with the following format:
26
8
  # * [0]: an alpha-3 (bibliographic) code
27
9
  # * [1]: an alpha-3 (terminologic) code (when given)
28
10
  # * [2]: an alpha-2 code (when given)
29
11
  # * [3]: an English name
30
12
  # * [4]: a French name of a language
31
- ISO_639_2 = [
32
- self["aar", "", "aa", "Afar", "afar"],
33
- self["abk", "", "ab", "Abkhazian", "abkhaze"],
34
- self["ace", "", "", "Achinese", "aceh"],
35
- self["ach", "", "", "Acoli", "acoli"],
36
- self["ada", "", "", "Adangme", "adangme"],
37
- self["ady", "", "", "Adyghe; Adygei", "adyghé"],
38
- self["afa", "", "", "Afro-Asiatic languages", "afro-asiatiques, langues"],
39
- self["afh", "", "", "Afrihili", "afrihili"],
40
- self["afr", "", "af", "Afrikaans", "afrikaans"],
41
- self["ain", "", "", "Ainu", "aïnou"],
42
- self["aka", "", "ak", "Akan", "akan"],
43
- self["akk", "", "", "Akkadian", "akkadien"],
44
- self["alb", "sqi", "sq", "Albanian", "albanais"],
45
- self["ale", "", "", "Aleut", "aléoute"],
46
- self["alg", "", "", "Algonquian languages", "algonquines, langues"],
47
- self["alt", "", "", "Southern Altai", "altai du Sud"],
48
- self["amh", "", "am", "Amharic", "amharique"],
49
- self["ang", "", "", "English, Old (ca.450-1100)", "anglo-saxon (ca.450-1100)"],
50
- self["anp", "", "", "Angika", "angika"],
51
- self["apa", "", "", "Apache languages", "apaches, langues"],
52
- self["ara", "", "ar", "Arabic", "arabe"],
53
- self["arc", "", "", "Official Aramaic (700-300 BCE); Imperial Aramaic (700-300 BCE)", "araméen d'empire (700-300 BCE)"],
54
- self["arg", "", "an", "Aragonese", "aragonais"],
55
- self["arm", "hye", "hy", "Armenian", "arménien"],
56
- self["arn", "", "", "Mapudungun; Mapuche", "mapudungun; mapuche; mapuce"],
57
- self["arp", "", "", "Arapaho", "arapaho"],
58
- self["art", "", "", "Artificial languages", "artificielles, langues"],
59
- self["arw", "", "", "Arawak", "arawak"],
60
- self["asm", "", "as", "Assamese", "assamais"],
61
- self["ast", "", "", "Asturian; Bable; Leonese; Asturleonese", "asturien; bable; léonais; asturoléonais"],
62
- self["ath", "", "", "Athapascan languages", "athapascanes, langues"],
63
- self["aus", "", "", "Australian languages", "australiennes, langues"],
64
- self["ava", "", "av", "Avaric", "avar"],
65
- self["ave", "", "ae", "Avestan", "avestique"],
66
- self["awa", "", "", "Awadhi", "awadhi"],
67
- self["aym", "", "ay", "Aymara", "aymara"],
68
- self["aze", "", "az", "Azerbaijani", "azéri"],
69
- self["bad", "", "", "Banda languages", "banda, langues"],
70
- self["bai", "", "", "Bamileke languages", "bamiléké, langues"],
71
- self["bak", "", "ba", "Bashkir", "bachkir"],
72
- self["bal", "", "", "Baluchi", "baloutchi"],
73
- self["bam", "", "bm", "Bambara", "bambara"],
74
- self["ban", "", "", "Balinese", "balinais"],
75
- self["baq", "eus", "eu", "Basque", "basque"],
76
- self["bas", "", "", "Basa", "basa"],
77
- self["bat", "", "", "Baltic languages", "baltes, langues"],
78
- self["bej", "", "", "Beja; Bedawiyet", "bedja"],
79
- self["bel", "", "be", "Belarusian", "biélorusse"],
80
- self["bem", "", "", "Bemba", "bemba"],
81
- self["ben", "", "bn", "Bengali", "bengali"],
82
- self["ber", "", "", "Berber languages", "berbères, langues"],
83
- self["bho", "", "", "Bhojpuri", "bhojpuri"],
84
- self["bih", "", "bh", "Bihari languages", "langues biharis"],
85
- self["bik", "", "", "Bikol", "bikol"],
86
- self["bin", "", "", "Bini; Edo", "bini; edo"],
87
- self["bis", "", "bi", "Bislama", "bichlamar"],
88
- self["bla", "", "", "Siksika", "blackfoot"],
89
- self["bnt", "", "", "Bantu (Other)", "bantoues, autres langues"],
90
- self["bos", "", "bs", "Bosnian", "bosniaque"],
91
- self["bra", "", "", "Braj", "braj"],
92
- self["bre", "", "br", "Breton", "breton"],
93
- self["btk", "", "", "Batak languages", "batak, langues"],
94
- self["bua", "", "", "Buriat", "bouriate"],
95
- self["bug", "", "", "Buginese", "bugi"],
96
- self["bul", "", "bg", "Bulgarian", "bulgare"],
97
- self["bur", "mya", "my", "Burmese", "birman"],
98
- self["byn", "", "", "Blin; Bilin", "blin; bilen"],
99
- self["cad", "", "", "Caddo", "caddo"],
100
- self["cai", "", "", "Central American Indian languages", "amérindiennes de L'Amérique centrale, langues"],
101
- self["car", "", "", "Galibi Carib", "karib; galibi; carib"],
102
- self["cat", "", "ca", "Catalan; Valencian", "catalan; valencien"],
103
- self["cau", "", "", "Caucasian languages", "caucasiennes, langues"],
104
- self["ceb", "", "", "Cebuano", "cebuano"],
105
- self["cel", "", "", "Celtic languages", "celtiques, langues; celtes, langues"],
106
- self["cha", "", "ch", "Chamorro", "chamorro"],
107
- self["chb", "", "", "Chibcha", "chibcha"],
108
- self["che", "", "ce", "Chechen", "tchétchène"],
109
- self["chg", "", "", "Chagatai", "djaghataï"],
110
- self["chi", "zho", "zh", "Chinese", "chinois"],
111
- self["chk", "", "", "Chuukese", "chuuk"],
112
- self["chm", "", "", "Mari", "mari"],
113
- self["chn", "", "", "Chinook jargon", "chinook, jargon"],
114
- self["cho", "", "", "Choctaw", "choctaw"],
115
- self["chp", "", "", "Chipewyan; Dene Suline", "chipewyan"],
116
- self["chr", "", "", "Cherokee", "cherokee"],
117
- self["chu", "", "cu", "Church Slavic; Old Slavonic; Church Slavonic; Old Bulgarian; Old Church Slavonic", "slavon d'église; vieux slave; slavon liturgique; vieux bulgare"],
118
- self["chv", "", "cv", "Chuvash", "tchouvache"],
119
- self["chy", "", "", "Cheyenne", "cheyenne"],
120
- self["cmc", "", "", "Chamic languages", "chames, langues"],
121
- self["cop", "", "", "Coptic", "copte"],
122
- self["cor", "", "kw", "Cornish", "cornique"],
123
- self["cos", "", "co", "Corsican", "corse"],
124
- self["cpe", "", "", "Creoles and pidgins, English based", "créoles et pidgins basés sur l'anglais"],
125
- self["cpf", "", "", "Creoles and pidgins, French-based ", "créoles et pidgins basés sur le français"],
126
- self["cpp", "", "", "Creoles and pidgins, Portuguese-based ", "créoles et pidgins basés sur le portugais"],
127
- self["cre", "", "cr", "Cree", "cree"],
128
- self["crh", "", "", "Crimean Tatar; Crimean Turkish", "tatar de Crimé"],
129
- self["crp", "", "", "Creoles and pidgins ", "créoles et pidgins"],
130
- self["csb", "", "", "Kashubian", "kachoube"],
131
- self["cus", "", "", "Cushitic languages", "couchitiques, langues"],
132
- self["cze", "ces", "cs", "Czech", "tchèque"],
133
- self["dak", "", "", "Dakota", "dakota"],
134
- self["dan", "", "da", "Danish", "danois"],
135
- self["dar", "", "", "Dargwa", "dargwa"],
136
- self["day", "", "", "Land Dayak languages", "dayak, langues"],
137
- self["del", "", "", "Delaware", "delaware"],
138
- self["den", "", "", "Slave (Athapascan)", "esclave (athapascan)"],
139
- self["dgr", "", "", "Dogrib", "dogrib"],
140
- self["din", "", "", "Dinka", "dinka"],
141
- self["div", "", "dv", "Divehi; Dhivehi; Maldivian", "maldivien"],
142
- self["doi", "", "", "Dogri", "dogri"],
143
- self["dra", "", "", "Dravidian languages", "dravidiennes, langues"],
144
- self["dsb", "", "", "Lower Sorbian", "bas-sorabe"],
145
- self["dua", "", "", "Duala", "douala"],
146
- self["dum", "", "", "Dutch, Middle (ca.1050-1350)", "néerlandais moyen (ca. 1050-1350)"],
147
- self["dut", "nld", "nl", "Dutch; Flemish", "néerlandais; flamand"],
148
- self["dyu", "", "", "Dyula", "dioula"],
149
- self["dzo", "", "dz", "Dzongkha", "dzongkha"],
150
- self["efi", "", "", "Efik", "efik"],
151
- self["egy", "", "", "Egyptian (Ancient)", "égyptien"],
152
- self["eka", "", "", "Ekajuk", "ekajuk"],
153
- self["elx", "", "", "Elamite", "élamite"],
154
- self["eng", "", "en", "English", "anglais"],
155
- self["enm", "", "", "English, Middle (1100-1500)", "anglais moyen (1100-1500)"],
156
- self["epo", "", "eo", "Esperanto", "espéranto"],
157
- self["est", "", "et", "Estonian", "estonien"],
158
- self["ewe", "", "ee", "Ewe", "éwé"],
159
- self["ewo", "", "", "Ewondo", "éwondo"],
160
- self["fan", "", "", "Fang", "fang"],
161
- self["fao", "", "fo", "Faroese", "féroïen"],
162
- self["fat", "", "", "Fanti", "fanti"],
163
- self["fij", "", "fj", "Fijian", "fidjien"],
164
- self["fil", "", "", "Filipino; Pilipino", "filipino; pilipino"],
165
- self["fin", "", "fi", "Finnish", "finnois"],
166
- self["fiu", "", "", "Finno-Ugrian languages", "finno-ougriennes, langues"],
167
- self["fon", "", "", "Fon", "fon"],
168
- self["fre", "fra", "fr", "French", "français"],
169
- self["frm", "", "", "French, Middle (ca.1400-1600)", "français moyen (1400-1600)"],
170
- self["fro", "", "", "French, Old (842-ca.1400)", "français ancien (842-ca.1400)"],
171
- self["frr", "", "", "Northern Frisian", "frison septentrional"],
172
- self["frs", "", "", "Eastern Frisian", "frison oriental"],
173
- self["fry", "", "fy", "Western Frisian", "frison occidental"],
174
- self["ful", "", "ff", "Fulah", "peul"],
175
- self["fur", "", "", "Friulian", "frioulan"],
176
- self["gaa", "", "", "Ga", "ga"],
177
- self["gay", "", "", "Gayo", "gayo"],
178
- self["gba", "", "", "Gbaya", "gbaya"],
179
- self["gem", "", "", "Germanic languages", "germaniques, langues"],
180
- self["geo", "kat", "ka", "Georgian", "géorgien"],
181
- self["ger", "deu", "de", "German", "allemand"],
182
- self["gez", "", "", "Geez", "guèze"],
183
- self["gil", "", "", "Gilbertese", "kiribati"],
184
- self["gla", "", "gd", "Gaelic; Scottish Gaelic", "gaélique; gaélique écossais"],
185
- self["gle", "", "ga", "Irish", "irlandais"],
186
- self["glg", "", "gl", "Galician", "galicien"],
187
- self["glv", "", "gv", "Manx", "manx; mannois"],
188
- self["gmh", "", "", "German, Middle High (ca.1050-1500)", "allemand, moyen haut (ca. 1050-1500)"],
189
- self["goh", "", "", "German, Old High (ca.750-1050)", "allemand, vieux haut (ca. 750-1050)"],
190
- self["gon", "", "", "Gondi", "gond"],
191
- self["gor", "", "", "Gorontalo", "gorontalo"],
192
- self["got", "", "", "Gothic", "gothique"],
193
- self["grb", "", "", "Grebo", "grebo"],
194
- self["grc", "", "", "Greek, Ancient (to 1453)", "grec ancien (jusqu'à 1453)"],
195
- self["gre", "ell", "el", "Greek, Modern (1453-)", "grec moderne (après 1453)"],
196
- self["grn", "", "gn", "Guarani", "guarani"],
197
- self["gsw", "", "", "Swiss German; Alemannic; Alsatian", "suisse alémanique; alémanique; alsacien"],
198
- self["guj", "", "gu", "Gujarati", "goudjrati"],
199
- self["gwi", "", "", "Gwich'in", "gwich'in"],
200
- self["hai", "", "", "Haida", "haida"],
201
- self["hat", "", "ht", "Haitian; Haitian Creole", "haïtien; créole haïtien"],
202
- self["hau", "", "ha", "Hausa", "haoussa"],
203
- self["haw", "", "", "Hawaiian", "hawaïen"],
204
- self["heb", "", "he", "Hebrew", "hébreu"],
205
- self["her", "", "hz", "Herero", "herero"],
206
- self["hil", "", "", "Hiligaynon", "hiligaynon"],
207
- self["him", "", "", "Himachali languages; Western Pahari languages", "langues himachalis; langues paharis occidentales"],
208
- self["hin", "", "hi", "Hindi", "hindi"],
209
- self["hit", "", "", "Hittite", "hittite"],
210
- self["hmn", "", "", "Hmong", "hmong"],
211
- self["hmo", "", "ho", "Hiri Motu", "hiri motu"],
212
- self["hrv", "", "hr", "Croatian", "croate"],
213
- self["hsb", "", "", "Upper Sorbian", "haut-sorabe"],
214
- self["hun", "", "hu", "Hungarian", "hongrois"],
215
- self["hup", "", "", "Hupa", "hupa"],
216
- self["iba", "", "", "Iban", "iban"],
217
- self["ibo", "", "ig", "Igbo", "igbo"],
218
- self["ice", "isl", "is", "Icelandic", "islandais"],
219
- self["ido", "", "io", "Ido", "ido"],
220
- self["iii", "", "ii", "Sichuan Yi; Nuosu", "yi de Sichuan"],
221
- self["ijo", "", "", "Ijo languages", "ijo, langues"],
222
- self["iku", "", "iu", "Inuktitut", "inuktitut"],
223
- self["ile", "", "ie", "Interlingue; Occidental", "interlingue"],
224
- self["ilo", "", "", "Iloko", "ilocano"],
225
- self["ina", "", "ia", "Interlingua (International Auxiliary Language Association)", "interlingua (langue auxiliaire internationale)"],
226
- self["inc", "", "", "Indic languages", "indo-aryennes, langues"],
227
- self["ind", "", "id", "Indonesian", "indonésien"],
228
- self["ine", "", "", "Indo-European languages", "indo-européennes, langues"],
229
- self["inh", "", "", "Ingush", "ingouche"],
230
- self["ipk", "", "ik", "Inupiaq", "inupiaq"],
231
- self["ira", "", "", "Iranian languages", "iraniennes, langues"],
232
- self["iro", "", "", "Iroquoian languages", "iroquoises, langues"],
233
- self["ita", "", "it", "Italian", "italien"],
234
- self["jav", "", "jv", "Javanese", "javanais"],
235
- self["jbo", "", "", "Lojban", "lojban"],
236
- self["jpn", "", "ja", "Japanese", "japonais"],
237
- self["jpr", "", "", "Judeo-Persian", "judéo-persan"],
238
- self["jrb", "", "", "Judeo-Arabic", "judéo-arabe"],
239
- self["kaa", "", "", "Kara-Kalpak", "karakalpak"],
240
- self["kab", "", "", "Kabyle", "kabyle"],
241
- self["kac", "", "", "Kachin; Jingpho", "kachin; jingpho"],
242
- self["kal", "", "kl", "Kalaallisut; Greenlandic", "groenlandais"],
243
- self["kam", "", "", "Kamba", "kamba"],
244
- self["kan", "", "kn", "Kannada", "kannada"],
245
- self["kar", "", "", "Karen languages", "karen, langues"],
246
- self["kas", "", "ks", "Kashmiri", "kashmiri"],
247
- self["kau", "", "kr", "Kanuri", "kanouri"],
248
- self["kaw", "", "", "Kawi", "kawi"],
249
- self["kaz", "", "kk", "Kazakh", "kazakh"],
250
- self["kbd", "", "", "Kabardian", "kabardien"],
251
- self["kha", "", "", "Khasi", "khasi"],
252
- self["khi", "", "", "Khoisan languages", "khoïsan, langues"],
253
- self["khm", "", "km", "Central Khmer", "khmer central"],
254
- self["kho", "", "", "Khotanese; Sakan", "khotanais; sakan"],
255
- self["kik", "", "ki", "Kikuyu; Gikuyu", "kikuyu"],
256
- self["kin", "", "rw", "Kinyarwanda", "rwanda"],
257
- self["kir", "", "ky", "Kirghiz; Kyrgyz", "kirghiz"],
258
- self["kmb", "", "", "Kimbundu", "kimbundu"],
259
- self["kok", "", "", "Konkani", "konkani"],
260
- self["kom", "", "kv", "Komi", "kom"],
261
- self["kon", "", "kg", "Kongo", "kongo"],
262
- self["kor", "", "ko", "Korean", "coréen"],
263
- self["kos", "", "", "Kosraean", "kosrae"],
264
- self["kpe", "", "", "Kpelle", "kpellé"],
265
- self["krc", "", "", "Karachay-Balkar", "karatchai balkar"],
266
- self["krl", "", "", "Karelian", "carélien"],
267
- self["kro", "", "", "Kru languages", "krou, langues"],
268
- self["kru", "", "", "Kurukh", "kurukh"],
269
- self["kua", "", "kj", "Kuanyama; Kwanyama", "kuanyama; kwanyama"],
270
- self["kum", "", "", "Kumyk", "koumyk"],
271
- self["kur", "", "ku", "Kurdish", "kurde"],
272
- self["kut", "", "", "Kutenai", "kutenai"],
273
- self["lad", "", "", "Ladino", "judéo-espagnol"],
274
- self["lah", "", "", "Lahnda", "lahnda"],
275
- self["lam", "", "", "Lamba", "lamba"],
276
- self["lao", "", "lo", "Lao", "lao"],
277
- self["lat", "", "la", "Latin", "latin"],
278
- self["lav", "", "lv", "Latvian", "letton"],
279
- self["lez", "", "", "Lezghian", "lezghien"],
280
- self["lim", "", "li", "Limburgan; Limburger; Limburgish", "limbourgeois"],
281
- self["lin", "", "ln", "Lingala", "lingala"],
282
- self["lit", "", "lt", "Lithuanian", "lituanien"],
283
- self["lol", "", "", "Mongo", "mongo"],
284
- self["loz", "", "", "Lozi", "lozi"],
285
- self["ltz", "", "lb", "Luxembourgish; Letzeburgesch", "luxembourgeois"],
286
- self["lua", "", "", "Luba-Lulua", "luba-lulua"],
287
- self["lub", "", "lu", "Luba-Katanga", "luba-katanga"],
288
- self["lug", "", "lg", "Ganda", "ganda"],
289
- self["lui", "", "", "Luiseno", "luiseno"],
290
- self["lun", "", "", "Lunda", "lunda"],
291
- self["luo", "", "", "Luo (Kenya and Tanzania)", "luo (Kenya et Tanzanie)"],
292
- self["lus", "", "", "Lushai", "lushai"],
293
- self["mac", "mkd", "mk", "Macedonian", "macédonien"],
294
- self["mad", "", "", "Madurese", "madourais"],
295
- self["mag", "", "", "Magahi", "magahi"],
296
- self["mah", "", "mh", "Marshallese", "marshall"],
297
- self["mai", "", "", "Maithili", "maithili"],
298
- self["mak", "", "", "Makasar", "makassar"],
299
- self["mal", "", "ml", "Malayalam", "malayalam"],
300
- self["man", "", "", "Mandingo", "mandingue"],
301
- self["mao", "mri", "mi", "Maori", "maori"],
302
- self["map", "", "", "Austronesian languages", "austronésiennes, langues"],
303
- self["mar", "", "mr", "Marathi", "marathe"],
304
- self["mas", "", "", "Masai", "massaï"],
305
- self["may", "msa", "ms", "Malay", "malais"],
306
- self["mdf", "", "", "Moksha", "moksa"],
307
- self["mdr", "", "", "Mandar", "mandar"],
308
- self["men", "", "", "Mende", "mendé"],
309
- self["mga", "", "", "Irish, Middle (900-1200)", "irlandais moyen (900-1200)"],
310
- self["mic", "", "", "Mi'kmaq; Micmac", "mi'kmaq; micmac"],
311
- self["min", "", "", "Minangkabau", "minangkabau"],
312
- self["mis", "", "", "Uncoded languages", "langues non codées"],
313
- self["mkh", "", "", "Mon-Khmer languages", "môn-khmer, langues"],
314
- self["mlg", "", "mg", "Malagasy", "malgache"],
315
- self["mlt", "", "mt", "Maltese", "maltais"],
316
- self["mnc", "", "", "Manchu", "mandchou"],
317
- self["mni", "", "", "Manipuri", "manipuri"],
318
- self["mno", "", "", "Manobo languages", "manobo, langues"],
319
- self["moh", "", "", "Mohawk", "mohawk"],
320
- self["mon", "", "mn", "Mongolian", "mongol"],
321
- self["mos", "", "", "Mossi", "moré"],
322
- self["mul", "", "", "Multiple languages", "multilingue"],
323
- self["mun", "", "", "Munda languages", "mounda, langues"],
324
- self["mus", "", "", "Creek", "muskogee"],
325
- self["mwl", "", "", "Mirandese", "mirandais"],
326
- self["mwr", "", "", "Marwari", "marvari"],
327
- self["myn", "", "", "Mayan languages", "maya, langues"],
328
- self["myv", "", "", "Erzya", "erza"],
329
- self["nah", "", "", "Nahuatl languages", "nahuatl, langues"],
330
- self["nai", "", "", "North American Indian languages", "nord-amérindiennes, langues"],
331
- self["nap", "", "", "Neapolitan", "napolitain"],
332
- self["nau", "", "na", "Nauru", "nauruan"],
333
- self["nav", "", "nv", "Navajo; Navaho", "navaho"],
334
- self["nbl", "", "nr", "Ndebele, South; South Ndebele", "ndébélé du Sud"],
335
- self["nde", "", "nd", "Ndebele, North; North Ndebele", "ndébélé du Nord"],
336
- self["ndo", "", "ng", "Ndonga", "ndonga"],
337
- self["nds", "", "", "Low German; Low Saxon; German, Low; Saxon, Low", "bas allemand; bas saxon; allemand, bas; saxon, bas"],
338
- self["nep", "", "ne", "Nepali", "népalais"],
339
- self["new", "", "", "Nepal Bhasa; Newari", "nepal bhasa; newari"],
340
- self["nia", "", "", "Nias", "nias"],
341
- self["nic", "", "", "Niger-Kordofanian languages", "nigéro-kordofaniennes, langues"],
342
- self["niu", "", "", "Niuean", "niué"],
343
- self["nno", "", "nn", "Norwegian Nynorsk; Nynorsk, Norwegian", "norvégien nynorsk; nynorsk, norvégien"],
344
- self["nob", "", "nb", "Bokmål, Norwegian; Norwegian Bokmål", "norvégien bokmål"],
345
- self["nog", "", "", "Nogai", "nogaï; nogay"],
346
- self["non", "", "", "Norse, Old", "norrois, vieux"],
347
- self["nor", "", "no", "Norwegian", "norvégien"],
348
- self["nqo", "", "", "N'Ko", "n'ko"],
349
- self["nso", "", "", "Pedi; Sepedi; Northern Sotho", "pedi; sepedi; sotho du Nord"],
350
- self["nub", "", "", "Nubian languages", "nubiennes, langues"],
351
- self["nwc", "", "", "Classical Newari; Old Newari; Classical Nepal Bhasa", "newari classique"],
352
- self["nya", "", "ny", "Chichewa; Chewa; Nyanja", "chichewa; chewa; nyanja"],
353
- self["nym", "", "", "Nyamwezi", "nyamwezi"],
354
- self["nyn", "", "", "Nyankole", "nyankolé"],
355
- self["nyo", "", "", "Nyoro", "nyoro"],
356
- self["nzi", "", "", "Nzima", "nzema"],
357
- self["oci", "", "oc", "Occitan (post 1500); Provençal", "occitan (après 1500); provençal"],
358
- self["oji", "", "oj", "Ojibwa", "ojibwa"],
359
- self["ori", "", "or", "Oriya", "oriya"],
360
- self["orm", "", "om", "Oromo", "galla"],
361
- self["osa", "", "", "Osage", "osage"],
362
- self["oss", "", "os", "Ossetian; Ossetic", "ossète"],
363
- self["ota", "", "", "Turkish, Ottoman (1500-1928)", "turc ottoman (1500-1928)"],
364
- self["oto", "", "", "Otomian languages", "otomi, langues"],
365
- self["paa", "", "", "Papuan languages", "papoues, langues"],
366
- self["pag", "", "", "Pangasinan", "pangasinan"],
367
- self["pal", "", "", "Pahlavi", "pahlavi"],
368
- self["pam", "", "", "Pampanga; Kapampangan", "pampangan"],
369
- self["pan", "", "pa", "Panjabi; Punjabi", "pendjabi"],
370
- self["pap", "", "", "Papiamento", "papiamento"],
371
- self["pau", "", "", "Palauan", "palau"],
372
- self["peo", "", "", "Persian, Old (ca.600-400 B.C.)", "perse, vieux (ca. 600-400 av. J.-C.)"],
373
- self["per", "fas", "fa", "Persian", "persan"],
374
- self["phi", "", "", "Philippine languages", "philippines, langues"],
375
- self["phn", "", "", "Phoenician", "phénicien"],
376
- self["pli", "", "pi", "Pali", "pali"],
377
- self["pol", "", "pl", "Polish", "polonais"],
378
- self["pon", "", "", "Pohnpeian", "pohnpei"],
379
- self["por", "", "pt", "Portuguese", "portugais"],
380
- self["pra", "", "", "Prakrit languages", "prâkrit, langues"],
381
- self["pro", "", "", "Provençal, Old (to 1500)", "provençal ancien (jusqu'à 1500)"],
382
- self["pus", "", "ps", "Pushto; Pashto", "pachto"],
383
- self["qaa-qtz", "", "", "Reserved for local use", "réservée à l'usage local"],
384
- self["que", "", "qu", "Quechua", "quechua"],
385
- self["raj", "", "", "Rajasthani", "rajasthani"],
386
- self["rap", "", "", "Rapanui", "rapanui"],
387
- self["rar", "", "", "Rarotongan; Cook Islands Maori", "rarotonga; maori des îles Cook"],
388
- self["roa", "", "", "Romance languages", "romanes, langues"],
389
- self["roh", "", "rm", "Romansh", "romanche"],
390
- self["rom", "", "", "Romany", "tsigane"],
391
- self["rum", "ron", "ro", "Romanian; Moldavian; Moldovan", "roumain; moldave"],
392
- self["run", "", "rn", "Rundi", "rundi"],
393
- self["rup", "", "", "Aromanian; Arumanian; Macedo-Romanian", "aroumain; macédo-roumain"],
394
- self["rus", "", "ru", "Russian", "russe"],
395
- self["sad", "", "", "Sandawe", "sandawe"],
396
- self["sag", "", "sg", "Sango", "sango"],
397
- self["sah", "", "", "Yakut", "iakoute"],
398
- self["sai", "", "", "South American Indian (Other)", "indiennes d'Amérique du Sud, autres langues"],
399
- self["sal", "", "", "Salishan languages", "salishennes, langues"],
400
- self["sam", "", "", "Samaritan Aramaic", "samaritain"],
401
- self["san", "", "sa", "Sanskrit", "sanskrit"],
402
- self["sas", "", "", "Sasak", "sasak"],
403
- self["sat", "", "", "Santali", "santal"],
404
- self["scn", "", "", "Sicilian", "sicilien"],
405
- self["sco", "", "", "Scots", "écossais"],
406
- self["sel", "", "", "Selkup", "selkoupe"],
407
- self["sem", "", "", "Semitic languages", "sémitiques, langues"],
408
- self["sga", "", "", "Irish, Old (to 900)", "irlandais ancien (jusqu'à 900)"],
409
- self["sgn", "", "", "Sign Languages", "langues des signes"],
410
- self["shn", "", "", "Shan", "chan"],
411
- self["sid", "", "", "Sidamo", "sidamo"],
412
- self["sin", "", "si", "Sinhala; Sinhalese", "singhalais"],
413
- self["sio", "", "", "Siouan languages", "sioux, langues"],
414
- self["sit", "", "", "Sino-Tibetan languages", "sino-tibétaines, langues"],
415
- self["sla", "", "", "Slavic languages", "slaves, langues"],
416
- self["slo", "slk", "sk", "Slovak", "slovaque"],
417
- self["slv", "", "sl", "Slovenian", "slovène"],
418
- self["sma", "", "", "Southern Sami", "sami du Sud"],
419
- self["sme", "", "se", "Northern Sami", "sami du Nord"],
420
- self["smi", "", "", "Sami languages", "sames, langues"],
421
- self["smj", "", "", "Lule Sami", "sami de Lule"],
422
- self["smn", "", "", "Inari Sami", "sami d'Inari"],
423
- self["smo", "", "sm", "Samoan", "samoan"],
424
- self["sms", "", "", "Skolt Sami", "sami skolt"],
425
- self["sna", "", "sn", "Shona", "shona"],
426
- self["snd", "", "sd", "Sindhi", "sindhi"],
427
- self["snk", "", "", "Soninke", "soninké"],
428
- self["sog", "", "", "Sogdian", "sogdien"],
429
- self["som", "", "so", "Somali", "somali"],
430
- self["son", "", "", "Songhai languages", "songhai, langues"],
431
- self["sot", "", "st", "Sotho, Southern", "sotho du Sud"],
432
- self["spa", "", "es", "Spanish; Castilian", "espagnol; castillan"],
433
- self["srd", "", "sc", "Sardinian", "sarde"],
434
- self["srn", "", "", "Sranan Tongo", "sranan tongo"],
435
- self["srp", "", "sr", "Serbian", "serbe"],
436
- self["srr", "", "", "Serer", "sérère"],
437
- self["ssa", "", "", "Nilo-Saharan languages", "nilo-sahariennes, langues"],
438
- self["ssw", "", "ss", "Swati", "swati"],
439
- self["suk", "", "", "Sukuma", "sukuma"],
440
- self["sun", "", "su", "Sundanese", "soundanais"],
441
- self["sus", "", "", "Susu", "soussou"],
442
- self["sux", "", "", "Sumerian", "sumérien"],
443
- self["swa", "", "sw", "Swahili", "swahili"],
444
- self["swe", "", "sv", "Swedish", "suédois"],
445
- self["syc", "", "", "Classical Syriac", "syriaque classique"],
446
- self["syr", "", "", "Syriac", "syriaque"],
447
- self["tah", "", "ty", "Tahitian", "tahitien"],
448
- self["tai", "", "", "Tai languages", "tai, langues"],
449
- self["tam", "", "ta", "Tamil", "tamoul"],
450
- self["tat", "", "tt", "Tatar", "tatar"],
451
- self["tel", "", "te", "Telugu", "télougou"],
452
- self["tem", "", "", "Timne", "temne"],
453
- self["ter", "", "", "Tereno", "tereno"],
454
- self["tet", "", "", "Tetum", "tetum"],
455
- self["tgk", "", "tg", "Tajik", "tadjik"],
456
- self["tgl", "", "tl", "Tagalog", "tagalog"],
457
- self["tha", "", "th", "Thai", "thaï"],
458
- self["tib", "bod", "bo", "Tibetan", "tibétain"],
459
- self["tig", "", "", "Tigre", "tigré"],
460
- self["tir", "", "ti", "Tigrinya", "tigrigna"],
461
- self["tiv", "", "", "Tiv", "tiv"],
462
- self["tkl", "", "", "Tokelau", "tokelau"],
463
- self["tlh", "", "", "Klingon; tlhIngan-Hol", "klingon"],
464
- self["tli", "", "", "Tlingit", "tlingit"],
465
- self["tmh", "", "", "Tamashek", "tamacheq"],
466
- self["tog", "", "", "Tonga (Nyasa)", "tonga (Nyasa)"],
467
- self["ton", "", "to", "Tonga (Tonga Islands)", "tongan (Îles Tonga)"],
468
- self["tpi", "", "", "Tok Pisin", "tok pisin"],
469
- self["tsi", "", "", "Tsimshian", "tsimshian"],
470
- self["tsn", "", "tn", "Tswana", "tswana"],
471
- self["tso", "", "ts", "Tsonga", "tsonga"],
472
- self["tuk", "", "tk", "Turkmen", "turkmène"],
473
- self["tum", "", "", "Tumbuka", "tumbuka"],
474
- self["tup", "", "", "Tupi languages", "tupi, langues"],
475
- self["tur", "", "tr", "Turkish", "turc"],
476
- self["tut", "", "", "Altaic languages", "altaïques, langues"],
477
- self["tvl", "", "", "Tuvalu", "tuvalu"],
478
- self["twi", "", "tw", "Twi", "twi"],
479
- self["tyv", "", "", "Tuvinian", "touva"],
480
- self["udm", "", "", "Udmurt", "oudmourte"],
481
- self["uga", "", "", "Ugaritic", "ougaritique"],
482
- self["uig", "", "ug", "Uighur; Uyghur", "ouïgour"],
483
- self["ukr", "", "uk", "Ukrainian", "ukrainien"],
484
- self["umb", "", "", "Umbundu", "umbundu"],
485
- self["und", "", "", "Undetermined", "indéterminée"],
486
- self["urd", "", "ur", "Urdu", "ourdou"],
487
- self["uzb", "", "uz", "Uzbek", "ouszbek"],
488
- self["vai", "", "", "Vai", "vaï"],
489
- self["ven", "", "ve", "Venda", "venda"],
490
- self["vie", "", "vi", "Vietnamese", "vietnamien"],
491
- self["vol", "", "vo", "Volapük", "volapük"],
492
- self["vot", "", "", "Votic", "vote"],
493
- self["wak", "", "", "Wakashan languages", "wakashanes, langues"],
494
- self["wal", "", "", "Walamo", "walamo"],
495
- self["war", "", "", "Waray", "waray"],
496
- self["was", "", "", "Washo", "washo"],
497
- self["wel", "cym", "cy", "Welsh", "gallois"],
498
- self["wen", "", "", "Sorbian languages", "sorabes, langues"],
499
- self["wln", "", "wa", "Walloon", "wallon"],
500
- self["wol", "", "wo", "Wolof", "wolof"],
501
- self["xal", "", "", "Kalmyk; Oirat", "kalmouk; oïrat"],
502
- self["xho", "", "xh", "Xhosa", "xhosa"],
503
- self["yao", "", "", "Yao", "yao"],
504
- self["yap", "", "", "Yapese", "yapois"],
505
- self["yid", "", "yi", "Yiddish", "yiddish"],
506
- self["yor", "", "yo", "Yoruba", "yoruba"],
507
- self["ypk", "", "", "Yupik languages", "yupik, langues"],
508
- self["zap", "", "", "Zapotec", "zapotèque"],
509
- self["zbl", "", "", "Blissymbols; Blissymbolics; Bliss", "symboles Bliss; Bliss"],
510
- self["zen", "", "", "Zenaga", "zenaga"],
511
- self["zha", "", "za", "Zhuang; Chuang", "zhuang; chuang"],
512
- self["znd", "", "", "Zande languages", "zandé, langues"],
513
- self["zul", "", "zu", "Zulu", "zoulou"],
514
- self["zun", "", "", "Zuni", "zuni"],
515
- self["zxx", "", "", "No linguistic content; Not applicable", "pas de contenu linguistique; non applicable"],
516
- self["zza", "", "", "Zaza; Dimili; Dimli; Kirdki; Kirmanjki; Zazaki", "zaza; dimili; dimli; kirdki; kirmanjki; zazaki"]
517
- ].freeze
13
+ #
14
+ # Dataset Source:
15
+ # https://www.loc.gov/standards/iso639-2/ascii_8bits.html
16
+ # https://www.loc.gov/standards/iso639-2/ISO-639-2_utf-8.txt
17
+ ISO_639_2 = lambda do
18
+ dataset = []
19
+ CSV.foreach(
20
+ File.join(File.dirname(__FILE__), 'data', 'ISO-639-2_utf-8.txt'),
21
+ **{ col_sep: "|",
22
+ converters: ->(v) { v || '' },
23
+ encoding: 'bom|utf-8' }
24
+ ).each do |row|
25
+ dataset << self[*row].freeze
26
+ end
27
+ return dataset
28
+ end.call.freeze
518
29
 
519
30
  # An inverted index generated from the ISO_639_2 data. Used for searching
520
31
  # all words and codes in all fields.
data/test/test_iso_639.rb CHANGED
@@ -4,7 +4,7 @@ require 'helper'
4
4
 
5
5
  describe ISO_639 do
6
6
  it 'should have full code list in ISO_639_2' do
7
- assert_equal 485, ISO_639::ISO_639_2.length
7
+ assert_equal 487, ISO_639::ISO_639_2.length
8
8
  end
9
9
 
10
10
  it 'should have shorter code list in ISO_639_1' do
metadata CHANGED
@@ -1,14 +1,14 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: iso-639
3
3
  version: !ruby/object:Gem::Version
4
- version: 0.2.10
4
+ version: 0.3.1
5
5
  platform: ruby
6
6
  authors:
7
7
  - William Melody
8
8
  autorequire:
9
9
  bindir: bin
10
10
  cert_chain: []
11
- date: 2020-03-01 00:00:00.000000000 Z
11
+ date: 2020-03-02 00:00:00.000000000 Z
12
12
  dependencies:
13
13
  - !ruby/object:Gem::Dependency
14
14
  name: minitest
@@ -125,6 +125,7 @@ files:
125
125
  - README.md
126
126
  - Rakefile
127
127
  - iso-639.gemspec
128
+ - lib/data/ISO-639-2_utf-8.txt
128
129
  - lib/iso-639.rb
129
130
  - test/helper.rb
130
131
  - test/test_iso_639.rb
@@ -140,7 +141,7 @@ required_ruby_version: !ruby/object:Gem::Requirement
140
141
  requirements:
141
142
  - - ">="
142
143
  - !ruby/object:Gem::Version
143
- version: '0'
144
+ version: '2.3'
144
145
  required_rubygems_version: !ruby/object:Gem::Requirement
145
146
  requirements:
146
147
  - - ">="