interscript 0.1.1 → 0.1.6

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (170) hide show
  1. checksums.yaml +4 -4
  2. data/README.adoc +250 -17
  3. data/bin/interscript +38 -17
  4. data/bin/setup +8 -0
  5. data/lib/__pycache__/g2pwrapper.cpython-38.pyc +0 -0
  6. data/lib/g2pwrapper.py +34 -0
  7. data/lib/interscript-opal.rb +2 -0
  8. data/lib/interscript.rb +138 -20
  9. data/lib/interscript/command.rb +28 -0
  10. data/lib/interscript/fs.rb +71 -0
  11. data/lib/interscript/mapping.rb +142 -0
  12. data/lib/interscript/opal.rb +27 -0
  13. data/lib/interscript/opal/maps.js.erb +10 -0
  14. data/lib/interscript/opal_map_translate.rb +12 -0
  15. data/lib/interscript/version.rb +1 -1
  16. data/lib/model-7 +0 -0
  17. data/lib/tha-pt-b-7 +0 -0
  18. data/maps/acadsin-zho-Hani-Latn-2002.yaml +38912 -0
  19. data/maps/alalc-amh-Ethi-Latn-1997.yaml +509 -0
  20. data/maps/alalc-amh-Ethi-Latn-2011.yaml +138 -0
  21. data/maps/alalc-ara-Arab-Latn-1997.yaml +1283 -0
  22. data/maps/alalc-asm-Deva-Latn-1997.yaml +159 -0
  23. data/maps/alalc-aze-Cyrl-Latn-1997.yaml +141 -0
  24. data/maps/alalc-bel-Cyrl-Latn-1997.yaml +125 -0
  25. data/maps/alalc-ben-Beng-Latn-2017.yaml +130 -0
  26. data/maps/alalc-bul-Cyrl-Latn-1997.yaml +94 -0
  27. data/maps/alalc-ell-Grek-Latn-1997.yaml +624 -0
  28. data/maps/alalc-ell-Grek-Latn-2010.yaml +627 -0
  29. data/maps/alalc-hin-Deva-Latn-2020.yaml +159 -0
  30. data/maps/alalc-kat-Geok-Latn-1997.yaml +111 -0
  31. data/maps/alalc-kat-Geor-Latn-1997.yaml +146 -0
  32. data/maps/alalc-kor-Hang-Latn-1997.yaml +94 -0
  33. data/maps/alalc-mar-Deva-Latn-1997.yaml +170 -0
  34. data/maps/alalc-mkd-Cyrl-Latn-1997.yaml +114 -0
  35. data/maps/alalc-mkd-Cyrl-Latn-2013.yaml +103 -0
  36. data/maps/alalc-pan-Deva-Latn-1997.yaml +237 -0
  37. data/maps/alalc-rus-Cyrl-Latn-1997.yaml +221 -0
  38. data/maps/alalc-rus-Cyrl-Latn-2012.yaml +162 -0
  39. data/maps/alalc-srp-Cyrl-Latn-1997.yaml +114 -0
  40. data/maps/alalc-srp-Cyrl-Latn-2013.yaml +135 -0
  41. data/maps/alalc-ukr-Cyrl-Latn-1997.yaml +141 -0
  42. data/maps/alalc-ukr-Cyrl-Latn-2011.yaml +16 -0
  43. data/maps/apcbg-bul-Cyrl-Latn-1995.yaml +283 -0
  44. data/maps/bas-rus-Cyrl-Latn-2017-bss.yaml +174 -0
  45. data/maps/bas-rus-Cyrl-Latn-2017-oss.yaml +169 -0
  46. data/maps/bgn-jpn-Hrkt-Latn-1962.yaml +292 -0
  47. data/maps/bgn-kor-Hang-Latn-1943.yaml +31 -0
  48. data/maps/bgn-kor-Kore-Latn-1943.yaml +31 -0
  49. data/maps/bgna-bul-Cyrl-Latn-2006.yaml +208 -0
  50. data/maps/bgna-bul-Cyrl-Latn-2009.yaml +208 -0
  51. data/maps/bgnpcgn-amh-Ethi-Latn-1967.yaml +528 -0
  52. data/maps/bgnpcgn-ara-Arab-Latn-1956.yaml +592 -0
  53. data/maps/bgnpcgn-arm-Armn-Latn-1981.yaml +108 -0
  54. data/maps/bgnpcgn-aze-Cyrl-Latn-1993.yaml +104 -0
  55. data/maps/bgnpcgn-bak-Cyrl-Latn-2007.yaml +184 -0
  56. data/maps/bgnpcgn-bel-Cyrl-Latn-1979.yaml +285 -0
  57. data/maps/bgnpcgn-bul-Cyrl-Latn-1952.yaml +115 -0
  58. data/maps/bgnpcgn-bul-Cyrl-Latn-2013.yaml +38 -0
  59. data/maps/bgnpcgn-ell-Grek-Latn-1962.yaml +701 -0
  60. data/maps/bgnpcgn-ell-Grek-Latn-1996.yaml +19 -0
  61. data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.yaml +257 -0
  62. data/maps/bgnpcgn-kat-Geor-Latn-1981.yaml +127 -0
  63. data/maps/bgnpcgn-kat-Geor-Latn-2009.yaml +42 -0
  64. data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.yaml +253 -0
  65. data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.yaml +48 -0
  66. data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.yaml +48 -0
  67. data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.yaml +159 -0
  68. data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.yaml +190 -0
  69. data/maps/bgnpcgn-nep-Deva-Latn-2011.yaml +200 -0
  70. data/maps/bgnpcgn-per-Arab-Latn-1956.yaml +92 -0
  71. data/maps/bgnpcgn-rus-Cyrl-Latn-1947.yaml +314 -0
  72. data/maps/bgnpcgn-srp-Cyrl-Latn-2005.yaml +166 -0
  73. data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.yaml +162 -0
  74. data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.yaml +208 -0
  75. data/maps/bgnpcgn-zho-Hans-Latn-1979.yaml +7456 -0
  76. data/maps/bis-asm-Beng-Latn-13194-1991.yaml +159 -0
  77. data/maps/bis-ben-Beng-Latn-13194-1991.yaml +156 -0
  78. data/maps/bis-dev-Deva-Latn-13194-1991.yaml +184 -0
  79. data/maps/bis-gjr-Gujr-Latn-13194-1991.yaml +166 -0
  80. data/maps/bis-knd-Knda-Latn-13194-1991.yaml +173 -0
  81. data/maps/bis-mlm-Mlym-Latn-13194-1991.yaml +176 -0
  82. data/maps/bis-ori-Orya-Latn-13194-1991.yaml +160 -0
  83. data/maps/bis-pnj-Guru-Latn-13194-1991.yaml +175 -0
  84. data/maps/bis-tel-Telu-Latn-13194-1991.yaml +170 -0
  85. data/maps/bis-tml-Taml-Latn-13194-1991.yaml +155 -0
  86. data/maps/by-bel-Cyrl-Latn-1998.yaml +168 -0
  87. data/maps/by-bel-Cyrl-Latn-2007.yaml +115 -0
  88. data/maps/dos-nep-Deva-Latn-1997.yaml +33 -0
  89. data/maps/elot-ell-Grek-Latn-743-1982-tl.yaml +684 -0
  90. data/maps/elot-ell-Grek-Latn-743-1982-ts.yaml +680 -0
  91. data/maps/elot-ell-Grek-Latn-743-2001-tl.yaml +19 -0
  92. data/maps/elot-ell-Grek-Latn-743-2001-ts.yaml +31 -0
  93. data/maps/ggg-kat-Geor-Latn-2002.yaml +88 -0
  94. data/maps/gki-bel-Cyrl-Latn-1992.yaml +33 -0
  95. data/maps/gki-bel-Cyrl-Latn-2000.yaml +201 -0
  96. data/maps/gost-rus-Cyrl-Latn-16876-71-1983.yaml +186 -0
  97. data/maps/hk-yue-Hani-Latn-1888.yaml +38497 -0
  98. data/maps/icao-bel-Cyrl-Latn-9303.yaml +136 -0
  99. data/maps/icao-bul-Cyrl-Latn-9303.yaml +118 -0
  100. data/maps/icao-heb-Hebr-Latn-9303.yaml +151 -0
  101. data/maps/icao-mkd-Cyrl-Latn-9303.yaml +117 -0
  102. data/maps/icao-per-Arab-Latn-9303.yaml +103 -0
  103. data/maps/icao-rus-Cyrl-Latn-9303.yaml +117 -0
  104. data/maps/icao-srp-Cyrl-Latn-9303.yaml +117 -0
  105. data/maps/icao-ukr-Cyrl-Latn-9303.yaml +119 -0
  106. data/maps/iso-ara-Arab-Latn-233-1984.yaml +323 -0
  107. data/maps/iso-ell-Grek-Latn-843-1997-t1.yaml +609 -0
  108. data/maps/iso-ell-Grek-Latn-843-1997-t2.yaml +40 -0
  109. data/maps/iso-jpn-Hrkt-Latn-3602-1989.yaml +62 -0
  110. data/maps/iso-rus-Cyrl-Latn-9-1995.yaml +271 -0
  111. data/maps/iso-tha-Thai-Latn-11940-1998.yaml +109 -0
  112. data/maps/kp-kor-Hang-Latn-2002.yaml +901 -0
  113. data/maps/lshk-yue-Hani-Latn-jyutping-1993.yaml +44820 -0
  114. data/maps/mext-jpn-Hrkt-Latn-1954.yaml +411 -0
  115. data/maps/moct-kor-Hang-Latn-2000.yaml +803 -0
  116. data/maps/mofa-jpn-Hrkt-Latn-1989.yaml +541 -0
  117. data/maps/mvd-bel-Cyrl-Latn-2008.yaml +225 -0
  118. data/maps/mvd-bel-Cyrl-Latn-2010.yaml +63 -0
  119. data/maps/mvd-rus-Cyrl-Latn-2008.yaml +109 -0
  120. data/maps/mvd-rus-Cyrl-Latn-2010.yaml +37 -0
  121. data/maps/nil-kor-Hang-Hang-jamo.yaml +11193 -0
  122. data/maps/odni-aze-Cyrl-Latn-2015.yaml +144 -0
  123. data/maps/odni-bel-Cyrl-Latn-2015.yaml +148 -0
  124. data/maps/odni-bul-Cyrl-Latn-2015.yaml +96 -0
  125. data/maps/odni-hin-Deva-Latn-2015.yaml +258 -0
  126. data/maps/odni-kat-Geor-Latn-2015.yaml +87 -0
  127. data/maps/odni-kaz-Cyrl-Latn-2015.yaml +148 -0
  128. data/maps/odni-kir-Cyrl-Latn-2015.yaml +136 -0
  129. data/maps/odni-mkd-Cyrl-Latn-2015.yaml +122 -0
  130. data/maps/odni-rus-Cyrl-Latn-2015.yaml +77 -0
  131. data/maps/odni-srp-Cyrl-Latn-2015.yaml +129 -0
  132. data/maps/odni-tat-Cyrl-Latn-2015.yaml +142 -0
  133. data/maps/odni-tgk-Cyrl-Latn-2015.yaml +148 -0
  134. data/maps/odni-uig-Cyrl-Latn-2015.yaml +138 -0
  135. data/maps/odni-ukr-Cyrl-Latn-2015.yaml +157 -0
  136. data/maps/odni-urd-Arab-Latn-2015.yaml +221 -0
  137. data/maps/odni-uzb-Cyrl-Latn-2015.yaml +166 -0
  138. data/maps/royin-tha-Thai-Latn-1939-generic.yaml +90 -0
  139. data/maps/royin-tha-Thai-Latn-1968.yaml +179 -0
  140. data/maps/royin-tha-Thai-Latn-1999-chained.yaml +180 -0
  141. data/maps/royin-tha-Thai-Latn-1999.yaml +76 -0
  142. data/maps/sac-zho-Hans-Latn-1979.yaml +24759 -0
  143. data/maps/ses-ara-Arab-Latn-1930.yaml +279 -0
  144. data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.yaml +222 -0
  145. data/maps/ua-ukr-Cyrl-Latn-1996.yaml +193 -0
  146. data/maps/un-ara-Arab-Latn-1971.yaml +139 -0
  147. data/maps/un-ara-Arab-Latn-1972.yaml +159 -0
  148. data/maps/un-ara-Arab-Latn-2017.yaml +420 -0
  149. data/maps/un-bel-Cyrl-Latn-2007.yaml +114 -0
  150. data/maps/un-ben-Beng-Latn-2016.yaml +534 -0
  151. data/maps/un-ell-Grek-Latn-1987-tl.yaml +31 -0
  152. data/maps/un-ell-Grek-Latn-1987-ts.yaml +19 -0
  153. data/maps/un-ell-Grek-Latn-phonetic-1987.yaml +780 -0
  154. data/maps/un-mon-Mong-Latn-2013.yaml +99 -0
  155. data/maps/un-nep-Deva-Latn-1972.yaml +163 -0
  156. data/maps/un-rus-Cyrl-Latn-1987.yaml +166 -0
  157. data/maps/un-ukr-Cyrl-Latn-1998.yaml +30 -0
  158. data/maps/ungegn-amh-Ethi-Latn-2016.yaml +575 -0
  159. data/maps/var-jpn-Hrkt-Latn-hepburn-1886.yaml +406 -0
  160. data/maps/var-jpn-Hrkt-Latn-hepburn-1954.yaml +386 -0
  161. data/maps/var-kor-Hang-Latn-mr-1939.yaml +1054 -0
  162. data/maps/var-kor-Kore-Hang-2013.yaml +59754 -0
  163. data/maps/var-kor-Kore-Latn-mr-1939.yaml +36 -0
  164. data/maps/var-tha-Thai-Thai-phonemic.yaml +59 -0
  165. data/maps/var-tha-Thai-Zsym-ipa.yaml +301 -0
  166. data/maps/var-zho-Hani-Latn-1979.yaml +38908 -0
  167. data/spec/interscript/mapping_spec.rb +42 -0
  168. data/spec/interscript_spec.rb +26 -0
  169. data/spec/spec_helper.rb +3 -0
  170. metadata +298 -18
@@ -0,0 +1,159 @@
1
+ ---
2
+ authority_id: alalc
3
+ id: 2020
4
+ language: hin
5
+ source_script: Deva
6
+ destination_script: Latn
7
+ name: Hindi Romanization, 2020
8
+ url: https://www.loc.gov/catdir/cpso/romanization/hindi.pdf
9
+ creation_date: 2020
10
+ description: |
11
+ ALA-LC Romanization table for Hindi
12
+
13
+ notes:
14
+
15
+ - Only the vowel forms that appear at the beginning of a syllable are listed; the forms used for
16
+ vowels following a consonant can be found in grammars; no distinction between the two is
17
+ made in transliteration.
18
+
19
+ - |
20
+ The vowel a is implicit after all consonants and consonant clusters and is supplied in
21
+ transliteration, with the following exceptions:
22
+
23
+ a) when another vowel is indicated by its appropriate sign; and
24
+ b) when the absence of any vowel is indicated by the subscript sign ( ◌् ) called halanta or
25
+ virāma.
26
+
27
+ - |
28
+ Exception: Anusvāra is transliterated by:
29
+
30
+ a) ṅ before gutturals,
31
+ b) ñ before palatals,
32
+ c) ṇ before cerebrals,
33
+ d) n before dentals, and
34
+ e) m before labials.
35
+
36
+ - Anunāsika before guttural, palatal, cerebral, and dental occlusives is transliterated n̐. Before
37
+ labials, sibilants, semivowels, aspirates, vowels, and in final position it is transliterated m̐.
38
+
39
+ - When doubled, avagraha is transliterated by two apostrophes ( ’’ ).
40
+
41
+ tests:
42
+ - source: "हम"
43
+ expected: "hama"
44
+ - source: "मीन"
45
+ expected: "maīna"
46
+ - source: "औसत"
47
+ expected: "ăusata"
48
+ - source: "माँऽऽऽ!"
49
+ expected: "maān̐’’’!"
50
+ - source: "माँ"
51
+ expected: "maām̐"
52
+
53
+
54
+
55
+ map:
56
+
57
+ rules:
58
+ # note[4]
59
+ - pattern: (?<=)\u0901(?=\b)
60
+ result: "m̐"
61
+
62
+ characters:
63
+
64
+ # I. Vowels and Diphthongs (see Note 1)
65
+
66
+ 'अ': 'a'
67
+ 'आ': 'ā'
68
+ 'इ': 'i'
69
+ 'ई': 'ī'
70
+ 'उ': 'u'
71
+ 'ऊ': 'ū'
72
+ 'ऋ': 'ṛ'
73
+ 'ॠ': 'ṝ'
74
+ 'ऌ': 'ḹ'
75
+ 'ॳ': 'ĕ'
76
+ 'ए': 'e'
77
+ 'ॲ': 'ê'
78
+ 'अै': 'ai'
79
+ 'ऐ': 'ai'
80
+ 'ऒ': 'ŏ'
81
+ 'ओ': 'o'
82
+ 'ऑ': 'ô'
83
+ 'औ': 'ău'
84
+
85
+ # II. Consonants (see Note 2)
86
+ # Gutturals
87
+ 'क': 'ka'
88
+ 'ख': 'kha'
89
+ 'ग': 'ga'
90
+ 'घ': 'gha'
91
+ 'ङ': 'ṅa'
92
+
93
+ # Palatals
94
+ 'च': 'ca'
95
+ 'छ': 'cha'
96
+ 'ज': 'ja'
97
+ 'झ': 'jha'
98
+ 'ञ': 'ña'
99
+
100
+ # Cerebrals
101
+ 'ट': 'ṭa'
102
+ 'ठ': 'ṭha'
103
+ 'ड': 'ḍa'
104
+ 'ड़': 'ṛa'
105
+ 'ढ': 'ḍha'
106
+ 'ढ़': 'ṛha'
107
+ 'ण': 'ṇa'
108
+
109
+ # Dentals
110
+ 'त': 'ta'
111
+ 'थ': 'tha'
112
+ 'द': 'da'
113
+ 'ध': 'dha'
114
+ 'न': 'na'
115
+
116
+ # Labials
117
+ 'प': 'pa'
118
+ 'फ': 'pha'
119
+ 'ब': 'ba'
120
+ 'भ': 'bha'
121
+ 'म': 'ma'
122
+
123
+ # Semivowels
124
+ 'य': 'ya'
125
+ 'र': 'ra'
126
+ 'ल': 'la'
127
+ 'व': 'ba'
128
+
129
+ # Sibilants
130
+ 'श': 'śa'
131
+ 'ष': 'sha'
132
+ 'स': 'sa'
133
+
134
+ # Aspirate
135
+ 'ह': 'ha'
136
+
137
+ # Anusvāra
138
+ 'ं': 'ṃ'
139
+
140
+ # Visarga
141
+ 'ः ': 'ḥ'
142
+
143
+ # Anunāsika
144
+ 'ँ': 'n̐' # ँ : n̐, m̐
145
+
146
+ # Avagraha
147
+ 'ऽ': '’' # (apostrophe)
148
+
149
+ # Medials # Needed for connecting consonants
150
+ 'ा': "ā"
151
+ 'ि': "i"
152
+ 'ी': "ī"
153
+ 'ु': "u"
154
+ 'ू': "ū"
155
+ 'ृ': "ṛi"
156
+ 'ॄ': "rī"
157
+ 'े': "e"
158
+ 'ॊ': "o"
159
+ 'ौ': "au"
@@ -0,0 +1,111 @@
1
+ ---
2
+ authority_id: alalc
3
+ id: 1997
4
+ language: kat
5
+ source_script: Geok
6
+ destination_script: Latn
7
+ name: ALA-LC Georgian System (1997)
8
+ url: https://www.loc.gov/catdir/cpso/romanization/georgian.pdf
9
+ creation_date: 1997
10
+ confirmation_date: 1997
11
+ description: |
12
+ Values are shown for the Khutsuri alphabet.
13
+
14
+ notes:
15
+
16
+ tests:
17
+
18
+ - source: ႼႨႢႬႨ
19
+ expected: CIGNI
20
+
21
+ - source: ⴜⴈⴂⴌⴈ
22
+ expected: cigni
23
+
24
+ - source: ႱႭႪႭႫႭႬ
25
+ expected: SOLOMON
26
+
27
+ - source: ⴑⴍⴊⴍⴋⴍⴌ
28
+ expected: solomon
29
+
30
+ - source: ႠႡႰႠჀႠႫ
31
+ expected: ABRAHAM
32
+
33
+ map:
34
+ characters:
35
+ '\u10a0' : 'A' # Ⴀ
36
+ '\u10a1' : 'B' # Ⴁ
37
+ '\u10a2' : 'G' # Ⴂ
38
+ '\u10a3' : 'D' # Ⴃ
39
+ '\u10a4' : 'E' # Ⴄ
40
+ '\u10a5' : 'V' # Ⴅ
41
+ '\u10a6' : 'Z' # Ⴆ
42
+ '\u10a7' : 'Tʻ' # Ⴇ
43
+ '\u10a8' : 'I' # Ⴈ
44
+ '\u10a9' : 'K' # Ⴉ
45
+ '\u10aa' : 'L' # Ⴊ
46
+ '\u10ab' : 'M' # Ⴋ
47
+ '\u10ac' : 'N' # Ⴌ
48
+ '\u10ad' : 'O' # Ⴍ
49
+ '\u10ae' : 'P' # Ⴎ
50
+ '\u10af' : 'Ž' # Ⴏ
51
+ '\u10b0' : 'R' # Ⴐ
52
+ '\u10b1' : 'S' # Ⴑ
53
+ '\u10b2' : 'T' # Ⴒ
54
+ '\u10b3' : 'U' # Ⴓ
55
+ '\u10b4' : 'Pʻ' # Ⴔ
56
+ '\u10b5' : 'Kʻ' # Ⴕ
57
+ '\u10b6' : 'Ġ' # Ⴖ
58
+ '\u10b7' : 'Q' # Ⴗ
59
+ '\u10b8' : 'Š' # Ⴘ
60
+ '\u10b9' : 'Čʻ' # Ⴙ
61
+ '\u10ba' : 'Cʻ' # Ⴚ
62
+ '\u10bb' : 'Ż' # Ⴛ
63
+ '\u10bc' : 'C' # Ⴜ
64
+ '\u10bd' : 'Č' # Ⴝ
65
+ '\u10be' : 'X' # Ⴞ
66
+ '\u10bf' : 'J' # Ⴟ
67
+ '\u10c0' : 'H' # Ⴠ
68
+ '\u10c1' : 'Ē' # Ⴡ
69
+ '\u10c2' : 'Y' # Ⴢ
70
+ '\u10c3' : 'W' # Ⴣ
71
+ '\u10c4' : 'X̣' # Ⴤ
72
+ '\u10c5' : 'Ō' # Ⴥ
73
+
74
+ '\u2d00' : 'a' # ⴀ
75
+ '\u2d01' : 'b' # ⴁ
76
+ '\u2d02' : 'g' # ⴂ
77
+ '\u2d03' : 'd' # ⴃ
78
+ '\u2d04' : 'e' # ⴄ
79
+ '\u2d05' : 'v' # ⴅ
80
+ '\u2d06' : 'z' # ⴆ
81
+ '\u2d07' : 'tʻ' # ⴇ
82
+ '\u2d08' : 'i' # ⴈ
83
+ '\u2d09' : 'k' # ⴉ
84
+ '\u2d0a' : 'l' # ⴊ
85
+ '\u2d0b' : 'm' # ⴋ
86
+ '\u2d0c' : 'n' # ⴌ
87
+ '\u2d0d' : 'o' # ⴍ
88
+ '\u2d0e' : 'p' # ⴎ
89
+ '\u2d0f' : 'ž' # ⴏ
90
+ '\u2d10' : 'r' # ⴐ
91
+ '\u2d11' : 's' # ⴑ
92
+ '\u2d12' : 't' # ⴒ
93
+ '\u2d13' : 'u' # ⴓ
94
+ '\u2d14' : 'pʻ' # ⴔ
95
+ '\u2d15' : 'kʻ' # ⴕ
96
+ '\u2d16' : 'ġ' # ⴖ
97
+ '\u2d17' : 'q' # ⴗ
98
+ '\u2d18' : 'š' # ⴘ
99
+ '\u2d19' : 'čʻ' # ⴙ
100
+ '\u2d1a' : 'cʻ' # ⴚ
101
+ '\u2d1b' : 'ż' # ⴛ
102
+ '\u2d1c' : 'c' # ⴜ
103
+ '\u2d1d' : 'č' # ⴝ
104
+ '\u2d1e' : 'x' # ⴞ
105
+ '\u2d1f' : 'j' # ⴟ
106
+ '\u2d20' : 'h' # ⴠ
107
+ '\u2d21' : 'ē' # ⴡ
108
+ '\u2d22' : 'y' # ⴢ
109
+ '\u2d23' : 'w' # ⴣ
110
+ '\u2d24' : 'x̣' # ⴤ
111
+ '\u2d25' : 'ō' # ⴥ
@@ -0,0 +1,146 @@
1
+ ---
2
+ authority_id: alalc
3
+ id: 1997
4
+ language: kat
5
+ source_script: Geor
6
+ destination_script: Latn
7
+ name: ALA-LC Georgian System (1997)
8
+ url: https://www.loc.gov/catdir/cpso/romanization/georgian.pdf
9
+ creation_date: 1997
10
+ confirmation_date: 1997
11
+ description: |
12
+ Values are shown for the older Khutsuri and the modern Mkhedruli alphabets.
13
+ There are no upper case letters in Mkhedruli.
14
+
15
+ notes:
16
+
17
+ tests:
18
+
19
+ - source: ხაოფსე
20
+ expected: xaopʻse
21
+
22
+ - source: ჭლოუ
23
+ expected: člou
24
+
25
+ - source: ჩოხულდი
26
+ expected: čʻoxuldi
27
+
28
+ - source: ქვემო ლინდა
29
+ expected: kʻvemo linda
30
+
31
+ - source: ტამკვაჩ იგვავერა
32
+ expected: tamkvačʻ igvavera
33
+
34
+ - source: სვანეთი
35
+ expected: svanetʻi
36
+
37
+ - source: საცხვარისი
38
+ expected: sacʻxvarisi
39
+
40
+ - source: მუხრან-თელეთი
41
+ expected: muxran-tʻeletʻi
42
+
43
+ - source: მუცდი
44
+ expected: mucʻdi
45
+
46
+ - source: ლეჩხუმი
47
+ expected: lečʻxumi
48
+
49
+ - source: ვერხნაია მწარა
50
+ expected: verxnaia mcara
51
+
52
+ - source: ეგრისის ქედი
53
+ expected: egrisis kʻedi
54
+
55
+ - source: დოჩარიფშა
56
+ expected: dočʻaripʻša
57
+
58
+ - source: ბოლოკო
59
+ expected: boloko
60
+
61
+ - source: აჭანდარა
62
+ expected: ačandara
63
+
64
+ - source: აუალიცა
65
+ expected: aualicʻa
66
+
67
+ - source: აკალამრა
68
+ expected: akalamra
69
+
70
+ - source: ლასილი
71
+ expected: lasili
72
+
73
+ - source: გუბაზეული
74
+ expected: gubazeuli
75
+
76
+ - source: ბაყაყი
77
+ expected: baqaqi
78
+
79
+ - source: ძროხა
80
+ expected: żroxa
81
+
82
+ - source: ჰაერი
83
+ expected: haeri
84
+
85
+ - source: ჟოლო
86
+ expected: žolo
87
+
88
+ - source: ჯართი
89
+ expected: jartʻi
90
+
91
+ - source: ღრმაღელე
92
+ expected: ġrmaġele
93
+
94
+ map:
95
+ characters:
96
+ '\u10d0' : 'a' # ა
97
+ '\u10d1' : 'b' # ბ
98
+ '\u10d2' : 'g' # გ
99
+ '\u10d3' : 'd' # დ
100
+ '\u10d4' : 'e' # ე
101
+ '\u10d5' : 'v' # ვ
102
+ '\u10d6' : 'z' # ზ
103
+
104
+ '\u10f1' : 'ē' # ჱ
105
+
106
+ '\u10d7' : 'tʻ' # თ
107
+ '\u10d8' : 'i' # ი
108
+ '\u10d9' : 'k' # კ
109
+ '\u10da' : 'l' # ლ
110
+ '\u10db' : 'm' # მ
111
+ '\u10dc' : 'n' # ნ
112
+
113
+ '\u10f2' : 'y' # ჲ
114
+
115
+ '\u10dd' : 'o' # ო
116
+ '\u10de' : 'p' # პ
117
+ '\u10df' : 'ž' # ჟ
118
+ '\u10e0' : 'r' # რ
119
+ '\u10e1' : 's' # ს
120
+ '\u10e2' : 't' # ტ
121
+
122
+ '\u10f3' : 'w' # ჳ
123
+
124
+ '\u10e3' : 'u' # უ
125
+ '\u10e4' : 'pʻ' # ფ
126
+ '\u10e5' : 'kʻ' # ქ
127
+ '\u10e6' : 'ġ' # ღ
128
+ '\u10e7' : 'q' # ყ
129
+ '\u10e8' : 'š' # შ
130
+ '\u10e9' : 'čʻ' # ჩ
131
+ '\u10ea' : 'cʻ' # ც
132
+ '\u10eb' : 'ż' # ძ
133
+ '\u10ec' : 'c' # წ
134
+ '\u10ed' : 'č' # ჭ
135
+ '\u10ee' : 'x' # ხ
136
+
137
+ '\u10f4' : 'x̣' # ჴ
138
+
139
+ '\u10ef' : 'j' # ჯ
140
+ '\u10f0' : 'h' # ჰ
141
+
142
+ '\u10f5' : 'ō' # ჵ
143
+
144
+ '\u10f6' : 'f' # ჶ
145
+ '\u10f7' : 'ĕ' # ჷ
146
+ '\u10f8' : 'ʻ' # ჸ
@@ -0,0 +1,94 @@
1
+ ---
2
+ authority_id: alalc
3
+ id: 1997
4
+ language: kor
5
+ source_script: Hang
6
+ destination_script: Latn
7
+ name: ALA-LC Romanization Table -- Korean (1997)
8
+ url: http://catdir.loc.gov/catdir/cpso/romanization/korean.pdf
9
+ creation_date: 1997
10
+ adoption_date:
11
+ description:
12
+ "1. General Practice
13
+ The Library of Congress will continue to follow the McCune-Reischauer system
14
+ to romanize Korean with the exceptions noted in this document. See:
15
+ Romanization of the Korean Language: Based upon its Phonetic Structure by
16
+ G.M. McCune and E.O. Reischauer ([S.l.: s.n., 1939?]), reprinted from the
17
+ Transactions of the Korea Branch of the Royal Asiatic Society. Full text of the
18
+ original document is available online from the National Library of Australia Web
19
+ site: http://www.nla.gov.au/librariesaustralia/cjk/download/ras_1939.pdf"
20
+
21
+ notes:
22
+
23
+
24
+ tests:
25
+ - source: 은하-리
26
+ expected: "Ŭnha-ri"
27
+ - source: 은중-리
28
+ expected: "Ŭnjung-ni"
29
+ - source: 은장-령
30
+ expected: "Ŭnjang-nyŏng"
31
+ - source: 은혜-동
32
+ expected: "Ŭnhye-dong"
33
+ - source: 은호-리
34
+ expected: "Ŭnho-ri"
35
+ - source: 은행정
36
+ expected: "Ŭnhaengjŏng"
37
+ - source: 은행-동
38
+ expected: "Ŭnhaeng-dong"
39
+ - source: 은행-촌
40
+ expected: "Ŭnhaeng-ch’on"
41
+ - source: 원수
42
+ expected: "Wŏnsu"
43
+ - source: 원소리-고개
44
+ expected: "Wŏnsori-gogae"
45
+ - source: 원소참
46
+ expected: "Wŏnsoch’am"
47
+ - source: 원소-리
48
+ expected: "Wŏnso-ri"
49
+ - source: 원신-리
50
+ expected: "Wŏnsil-li"
51
+ - source: 난곡
52
+ expected: "Nan’gok"
53
+ - source: 난산-리
54
+ expected: "Nansal-li"
55
+ - source: 난직
56
+ expected: "Nanjik"
57
+ - source: 영곡
58
+ expected: "Yŏnggok"
59
+ - source: 윗두밀
60
+ expected: "Wittumil"
61
+ - source: 윗도심이
62
+ expected: "Wittosimi"
63
+ - source: 둔지
64
+ expected: "Tunji"
65
+ - source: 서승
66
+ expected: "Sŏsŭng"
67
+ # - source: 신촌
68
+ # expected: "Sinch’on"
69
+ - source: 비암덕
70
+ expected: "Piamdŏk"
71
+ - source: 바위안
72
+ expected: "Pawian"
73
+ - source: 오송평
74
+ expected: "Osongp’yŏng"
75
+ - source: 그물목
76
+ expected: "Kŭmulmok"
77
+ - source: 구원정
78
+ expected: "Kuwŏnjŏng"
79
+ - source: 일하
80
+ expected: "Irha"
81
+ - source: 황우
82
+ expected: "Hwangu"
83
+ - source: 자작보
84
+ expected: "Chajakpo"
85
+ # - source: 비파1-동
86
+ # expected: "Pip’a Il-tong"
87
+ - source: 문암 오-동
88
+ expected: "Munam O-dong"
89
+
90
+ map:
91
+ character_separator: ""
92
+ word_separator: " "
93
+ title_case: True
94
+ inherit: "var-kor-Hang-Latn-mr-1939"