interscript 0.1.1 → 0.1.6
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/README.adoc +250 -17
- data/bin/interscript +38 -17
- data/bin/setup +8 -0
- data/lib/__pycache__/g2pwrapper.cpython-38.pyc +0 -0
- data/lib/g2pwrapper.py +34 -0
- data/lib/interscript-opal.rb +2 -0
- data/lib/interscript.rb +138 -20
- data/lib/interscript/command.rb +28 -0
- data/lib/interscript/fs.rb +71 -0
- data/lib/interscript/mapping.rb +142 -0
- data/lib/interscript/opal.rb +27 -0
- data/lib/interscript/opal/maps.js.erb +10 -0
- data/lib/interscript/opal_map_translate.rb +12 -0
- data/lib/interscript/version.rb +1 -1
- data/lib/model-7 +0 -0
- data/lib/tha-pt-b-7 +0 -0
- data/maps/acadsin-zho-Hani-Latn-2002.yaml +38912 -0
- data/maps/alalc-amh-Ethi-Latn-1997.yaml +509 -0
- data/maps/alalc-amh-Ethi-Latn-2011.yaml +138 -0
- data/maps/alalc-ara-Arab-Latn-1997.yaml +1283 -0
- data/maps/alalc-asm-Deva-Latn-1997.yaml +159 -0
- data/maps/alalc-aze-Cyrl-Latn-1997.yaml +141 -0
- data/maps/alalc-bel-Cyrl-Latn-1997.yaml +125 -0
- data/maps/alalc-ben-Beng-Latn-2017.yaml +130 -0
- data/maps/alalc-bul-Cyrl-Latn-1997.yaml +94 -0
- data/maps/alalc-ell-Grek-Latn-1997.yaml +624 -0
- data/maps/alalc-ell-Grek-Latn-2010.yaml +627 -0
- data/maps/alalc-hin-Deva-Latn-2020.yaml +159 -0
- data/maps/alalc-kat-Geok-Latn-1997.yaml +111 -0
- data/maps/alalc-kat-Geor-Latn-1997.yaml +146 -0
- data/maps/alalc-kor-Hang-Latn-1997.yaml +94 -0
- data/maps/alalc-mar-Deva-Latn-1997.yaml +170 -0
- data/maps/alalc-mkd-Cyrl-Latn-1997.yaml +114 -0
- data/maps/alalc-mkd-Cyrl-Latn-2013.yaml +103 -0
- data/maps/alalc-pan-Deva-Latn-1997.yaml +237 -0
- data/maps/alalc-rus-Cyrl-Latn-1997.yaml +221 -0
- data/maps/alalc-rus-Cyrl-Latn-2012.yaml +162 -0
- data/maps/alalc-srp-Cyrl-Latn-1997.yaml +114 -0
- data/maps/alalc-srp-Cyrl-Latn-2013.yaml +135 -0
- data/maps/alalc-ukr-Cyrl-Latn-1997.yaml +141 -0
- data/maps/alalc-ukr-Cyrl-Latn-2011.yaml +16 -0
- data/maps/apcbg-bul-Cyrl-Latn-1995.yaml +283 -0
- data/maps/bas-rus-Cyrl-Latn-2017-bss.yaml +174 -0
- data/maps/bas-rus-Cyrl-Latn-2017-oss.yaml +169 -0
- data/maps/bgn-jpn-Hrkt-Latn-1962.yaml +292 -0
- data/maps/bgn-kor-Hang-Latn-1943.yaml +31 -0
- data/maps/bgn-kor-Kore-Latn-1943.yaml +31 -0
- data/maps/bgna-bul-Cyrl-Latn-2006.yaml +208 -0
- data/maps/bgna-bul-Cyrl-Latn-2009.yaml +208 -0
- data/maps/bgnpcgn-amh-Ethi-Latn-1967.yaml +528 -0
- data/maps/bgnpcgn-ara-Arab-Latn-1956.yaml +592 -0
- data/maps/bgnpcgn-arm-Armn-Latn-1981.yaml +108 -0
- data/maps/bgnpcgn-aze-Cyrl-Latn-1993.yaml +104 -0
- data/maps/bgnpcgn-bak-Cyrl-Latn-2007.yaml +184 -0
- data/maps/bgnpcgn-bel-Cyrl-Latn-1979.yaml +285 -0
- data/maps/bgnpcgn-bul-Cyrl-Latn-1952.yaml +115 -0
- data/maps/bgnpcgn-bul-Cyrl-Latn-2013.yaml +38 -0
- data/maps/bgnpcgn-ell-Grek-Latn-1962.yaml +701 -0
- data/maps/bgnpcgn-ell-Grek-Latn-1996.yaml +19 -0
- data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.yaml +257 -0
- data/maps/bgnpcgn-kat-Geor-Latn-1981.yaml +127 -0
- data/maps/bgnpcgn-kat-Geor-Latn-2009.yaml +42 -0
- data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.yaml +253 -0
- data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.yaml +48 -0
- data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.yaml +48 -0
- data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.yaml +159 -0
- data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.yaml +190 -0
- data/maps/bgnpcgn-nep-Deva-Latn-2011.yaml +200 -0
- data/maps/bgnpcgn-per-Arab-Latn-1956.yaml +92 -0
- data/maps/bgnpcgn-rus-Cyrl-Latn-1947.yaml +314 -0
- data/maps/bgnpcgn-srp-Cyrl-Latn-2005.yaml +166 -0
- data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.yaml +162 -0
- data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.yaml +208 -0
- data/maps/bgnpcgn-zho-Hans-Latn-1979.yaml +7456 -0
- data/maps/bis-asm-Beng-Latn-13194-1991.yaml +159 -0
- data/maps/bis-ben-Beng-Latn-13194-1991.yaml +156 -0
- data/maps/bis-dev-Deva-Latn-13194-1991.yaml +184 -0
- data/maps/bis-gjr-Gujr-Latn-13194-1991.yaml +166 -0
- data/maps/bis-knd-Knda-Latn-13194-1991.yaml +173 -0
- data/maps/bis-mlm-Mlym-Latn-13194-1991.yaml +176 -0
- data/maps/bis-ori-Orya-Latn-13194-1991.yaml +160 -0
- data/maps/bis-pnj-Guru-Latn-13194-1991.yaml +175 -0
- data/maps/bis-tel-Telu-Latn-13194-1991.yaml +170 -0
- data/maps/bis-tml-Taml-Latn-13194-1991.yaml +155 -0
- data/maps/by-bel-Cyrl-Latn-1998.yaml +168 -0
- data/maps/by-bel-Cyrl-Latn-2007.yaml +115 -0
- data/maps/dos-nep-Deva-Latn-1997.yaml +33 -0
- data/maps/elot-ell-Grek-Latn-743-1982-tl.yaml +684 -0
- data/maps/elot-ell-Grek-Latn-743-1982-ts.yaml +680 -0
- data/maps/elot-ell-Grek-Latn-743-2001-tl.yaml +19 -0
- data/maps/elot-ell-Grek-Latn-743-2001-ts.yaml +31 -0
- data/maps/ggg-kat-Geor-Latn-2002.yaml +88 -0
- data/maps/gki-bel-Cyrl-Latn-1992.yaml +33 -0
- data/maps/gki-bel-Cyrl-Latn-2000.yaml +201 -0
- data/maps/gost-rus-Cyrl-Latn-16876-71-1983.yaml +186 -0
- data/maps/hk-yue-Hani-Latn-1888.yaml +38497 -0
- data/maps/icao-bel-Cyrl-Latn-9303.yaml +136 -0
- data/maps/icao-bul-Cyrl-Latn-9303.yaml +118 -0
- data/maps/icao-heb-Hebr-Latn-9303.yaml +151 -0
- data/maps/icao-mkd-Cyrl-Latn-9303.yaml +117 -0
- data/maps/icao-per-Arab-Latn-9303.yaml +103 -0
- data/maps/icao-rus-Cyrl-Latn-9303.yaml +117 -0
- data/maps/icao-srp-Cyrl-Latn-9303.yaml +117 -0
- data/maps/icao-ukr-Cyrl-Latn-9303.yaml +119 -0
- data/maps/iso-ara-Arab-Latn-233-1984.yaml +323 -0
- data/maps/iso-ell-Grek-Latn-843-1997-t1.yaml +609 -0
- data/maps/iso-ell-Grek-Latn-843-1997-t2.yaml +40 -0
- data/maps/iso-jpn-Hrkt-Latn-3602-1989.yaml +62 -0
- data/maps/iso-rus-Cyrl-Latn-9-1995.yaml +271 -0
- data/maps/iso-tha-Thai-Latn-11940-1998.yaml +109 -0
- data/maps/kp-kor-Hang-Latn-2002.yaml +901 -0
- data/maps/lshk-yue-Hani-Latn-jyutping-1993.yaml +44820 -0
- data/maps/mext-jpn-Hrkt-Latn-1954.yaml +411 -0
- data/maps/moct-kor-Hang-Latn-2000.yaml +803 -0
- data/maps/mofa-jpn-Hrkt-Latn-1989.yaml +541 -0
- data/maps/mvd-bel-Cyrl-Latn-2008.yaml +225 -0
- data/maps/mvd-bel-Cyrl-Latn-2010.yaml +63 -0
- data/maps/mvd-rus-Cyrl-Latn-2008.yaml +109 -0
- data/maps/mvd-rus-Cyrl-Latn-2010.yaml +37 -0
- data/maps/nil-kor-Hang-Hang-jamo.yaml +11193 -0
- data/maps/odni-aze-Cyrl-Latn-2015.yaml +144 -0
- data/maps/odni-bel-Cyrl-Latn-2015.yaml +148 -0
- data/maps/odni-bul-Cyrl-Latn-2015.yaml +96 -0
- data/maps/odni-hin-Deva-Latn-2015.yaml +258 -0
- data/maps/odni-kat-Geor-Latn-2015.yaml +87 -0
- data/maps/odni-kaz-Cyrl-Latn-2015.yaml +148 -0
- data/maps/odni-kir-Cyrl-Latn-2015.yaml +136 -0
- data/maps/odni-mkd-Cyrl-Latn-2015.yaml +122 -0
- data/maps/odni-rus-Cyrl-Latn-2015.yaml +77 -0
- data/maps/odni-srp-Cyrl-Latn-2015.yaml +129 -0
- data/maps/odni-tat-Cyrl-Latn-2015.yaml +142 -0
- data/maps/odni-tgk-Cyrl-Latn-2015.yaml +148 -0
- data/maps/odni-uig-Cyrl-Latn-2015.yaml +138 -0
- data/maps/odni-ukr-Cyrl-Latn-2015.yaml +157 -0
- data/maps/odni-urd-Arab-Latn-2015.yaml +221 -0
- data/maps/odni-uzb-Cyrl-Latn-2015.yaml +166 -0
- data/maps/royin-tha-Thai-Latn-1939-generic.yaml +90 -0
- data/maps/royin-tha-Thai-Latn-1968.yaml +179 -0
- data/maps/royin-tha-Thai-Latn-1999-chained.yaml +180 -0
- data/maps/royin-tha-Thai-Latn-1999.yaml +76 -0
- data/maps/sac-zho-Hans-Latn-1979.yaml +24759 -0
- data/maps/ses-ara-Arab-Latn-1930.yaml +279 -0
- data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.yaml +222 -0
- data/maps/ua-ukr-Cyrl-Latn-1996.yaml +193 -0
- data/maps/un-ara-Arab-Latn-1971.yaml +139 -0
- data/maps/un-ara-Arab-Latn-1972.yaml +159 -0
- data/maps/un-ara-Arab-Latn-2017.yaml +420 -0
- data/maps/un-bel-Cyrl-Latn-2007.yaml +114 -0
- data/maps/un-ben-Beng-Latn-2016.yaml +534 -0
- data/maps/un-ell-Grek-Latn-1987-tl.yaml +31 -0
- data/maps/un-ell-Grek-Latn-1987-ts.yaml +19 -0
- data/maps/un-ell-Grek-Latn-phonetic-1987.yaml +780 -0
- data/maps/un-mon-Mong-Latn-2013.yaml +99 -0
- data/maps/un-nep-Deva-Latn-1972.yaml +163 -0
- data/maps/un-rus-Cyrl-Latn-1987.yaml +166 -0
- data/maps/un-ukr-Cyrl-Latn-1998.yaml +30 -0
- data/maps/ungegn-amh-Ethi-Latn-2016.yaml +575 -0
- data/maps/var-jpn-Hrkt-Latn-hepburn-1886.yaml +406 -0
- data/maps/var-jpn-Hrkt-Latn-hepburn-1954.yaml +386 -0
- data/maps/var-kor-Hang-Latn-mr-1939.yaml +1054 -0
- data/maps/var-kor-Kore-Hang-2013.yaml +59754 -0
- data/maps/var-kor-Kore-Latn-mr-1939.yaml +36 -0
- data/maps/var-tha-Thai-Thai-phonemic.yaml +59 -0
- data/maps/var-tha-Thai-Zsym-ipa.yaml +301 -0
- data/maps/var-zho-Hani-Latn-1979.yaml +38908 -0
- data/spec/interscript/mapping_spec.rb +42 -0
- data/spec/interscript_spec.rb +26 -0
- data/spec/spec_helper.rb +3 -0
- metadata +298 -18
|
@@ -0,0 +1,159 @@
|
|
|
1
|
+
---
|
|
2
|
+
authority_id: alalc
|
|
3
|
+
id: 2020
|
|
4
|
+
language: hin
|
|
5
|
+
source_script: Deva
|
|
6
|
+
destination_script: Latn
|
|
7
|
+
name: Hindi Romanization, 2020
|
|
8
|
+
url: https://www.loc.gov/catdir/cpso/romanization/hindi.pdf
|
|
9
|
+
creation_date: 2020
|
|
10
|
+
description: |
|
|
11
|
+
ALA-LC Romanization table for Hindi
|
|
12
|
+
|
|
13
|
+
notes:
|
|
14
|
+
|
|
15
|
+
- Only the vowel forms that appear at the beginning of a syllable are listed; the forms used for
|
|
16
|
+
vowels following a consonant can be found in grammars; no distinction between the two is
|
|
17
|
+
made in transliteration.
|
|
18
|
+
|
|
19
|
+
- |
|
|
20
|
+
The vowel a is implicit after all consonants and consonant clusters and is supplied in
|
|
21
|
+
transliteration, with the following exceptions:
|
|
22
|
+
|
|
23
|
+
a) when another vowel is indicated by its appropriate sign; and
|
|
24
|
+
b) when the absence of any vowel is indicated by the subscript sign ( ◌् ) called halanta or
|
|
25
|
+
virāma.
|
|
26
|
+
|
|
27
|
+
- |
|
|
28
|
+
Exception: Anusvāra is transliterated by:
|
|
29
|
+
|
|
30
|
+
a) ṅ before gutturals,
|
|
31
|
+
b) ñ before palatals,
|
|
32
|
+
c) ṇ before cerebrals,
|
|
33
|
+
d) n before dentals, and
|
|
34
|
+
e) m before labials.
|
|
35
|
+
|
|
36
|
+
- Anunāsika before guttural, palatal, cerebral, and dental occlusives is transliterated n̐. Before
|
|
37
|
+
labials, sibilants, semivowels, aspirates, vowels, and in final position it is transliterated m̐.
|
|
38
|
+
|
|
39
|
+
- When doubled, avagraha is transliterated by two apostrophes ( ’’ ).
|
|
40
|
+
|
|
41
|
+
tests:
|
|
42
|
+
- source: "हम"
|
|
43
|
+
expected: "hama"
|
|
44
|
+
- source: "मीन"
|
|
45
|
+
expected: "maīna"
|
|
46
|
+
- source: "औसत"
|
|
47
|
+
expected: "ăusata"
|
|
48
|
+
- source: "माँऽऽऽ!"
|
|
49
|
+
expected: "maān̐’’’!"
|
|
50
|
+
- source: "माँ"
|
|
51
|
+
expected: "maām̐"
|
|
52
|
+
|
|
53
|
+
|
|
54
|
+
|
|
55
|
+
map:
|
|
56
|
+
|
|
57
|
+
rules:
|
|
58
|
+
# note[4]
|
|
59
|
+
- pattern: (?<=)\u0901(?=\b)
|
|
60
|
+
result: "m̐"
|
|
61
|
+
|
|
62
|
+
characters:
|
|
63
|
+
|
|
64
|
+
# I. Vowels and Diphthongs (see Note 1)
|
|
65
|
+
|
|
66
|
+
'अ': 'a'
|
|
67
|
+
'आ': 'ā'
|
|
68
|
+
'इ': 'i'
|
|
69
|
+
'ई': 'ī'
|
|
70
|
+
'उ': 'u'
|
|
71
|
+
'ऊ': 'ū'
|
|
72
|
+
'ऋ': 'ṛ'
|
|
73
|
+
'ॠ': 'ṝ'
|
|
74
|
+
'ऌ': 'ḹ'
|
|
75
|
+
'ॳ': 'ĕ'
|
|
76
|
+
'ए': 'e'
|
|
77
|
+
'ॲ': 'ê'
|
|
78
|
+
'अै': 'ai'
|
|
79
|
+
'ऐ': 'ai'
|
|
80
|
+
'ऒ': 'ŏ'
|
|
81
|
+
'ओ': 'o'
|
|
82
|
+
'ऑ': 'ô'
|
|
83
|
+
'औ': 'ău'
|
|
84
|
+
|
|
85
|
+
# II. Consonants (see Note 2)
|
|
86
|
+
# Gutturals
|
|
87
|
+
'क': 'ka'
|
|
88
|
+
'ख': 'kha'
|
|
89
|
+
'ग': 'ga'
|
|
90
|
+
'घ': 'gha'
|
|
91
|
+
'ङ': 'ṅa'
|
|
92
|
+
|
|
93
|
+
# Palatals
|
|
94
|
+
'च': 'ca'
|
|
95
|
+
'छ': 'cha'
|
|
96
|
+
'ज': 'ja'
|
|
97
|
+
'झ': 'jha'
|
|
98
|
+
'ञ': 'ña'
|
|
99
|
+
|
|
100
|
+
# Cerebrals
|
|
101
|
+
'ट': 'ṭa'
|
|
102
|
+
'ठ': 'ṭha'
|
|
103
|
+
'ड': 'ḍa'
|
|
104
|
+
'ड़': 'ṛa'
|
|
105
|
+
'ढ': 'ḍha'
|
|
106
|
+
'ढ़': 'ṛha'
|
|
107
|
+
'ण': 'ṇa'
|
|
108
|
+
|
|
109
|
+
# Dentals
|
|
110
|
+
'त': 'ta'
|
|
111
|
+
'थ': 'tha'
|
|
112
|
+
'द': 'da'
|
|
113
|
+
'ध': 'dha'
|
|
114
|
+
'न': 'na'
|
|
115
|
+
|
|
116
|
+
# Labials
|
|
117
|
+
'प': 'pa'
|
|
118
|
+
'फ': 'pha'
|
|
119
|
+
'ब': 'ba'
|
|
120
|
+
'भ': 'bha'
|
|
121
|
+
'म': 'ma'
|
|
122
|
+
|
|
123
|
+
# Semivowels
|
|
124
|
+
'य': 'ya'
|
|
125
|
+
'र': 'ra'
|
|
126
|
+
'ल': 'la'
|
|
127
|
+
'व': 'va'
|
|
128
|
+
|
|
129
|
+
# Sibilants
|
|
130
|
+
'श': 'śa'
|
|
131
|
+
'ष': 'sha'
|
|
132
|
+
'स': 'sa'
|
|
133
|
+
|
|
134
|
+
# Aspirate
|
|
135
|
+
'ह': 'ha'
|
|
136
|
+
|
|
137
|
+
# Anusvāra
|
|
138
|
+
'ं': 'ṃ'
|
|
139
|
+
|
|
140
|
+
# Visarga
|
|
141
|
+
'ः': 'ḥ'
|
|
142
|
+
|
|
143
|
+
# Anunāsika
|
|
144
|
+
'ँ': 'n̐' # ँ : n̐, m̐
|
|
145
|
+
|
|
146
|
+
# Avagraha
|
|
147
|
+
'ऽ': '’' # (apostrophe)
|
|
148
|
+
|
|
149
|
+
# Medials # Needed for connecting consonants
|
|
150
|
+
'ा': "ā"
|
|
151
|
+
'ि': "i"
|
|
152
|
+
'ी': "ī"
|
|
153
|
+
'ु': "u"
|
|
154
|
+
'ू': "ū"
|
|
155
|
+
'ृ': "ṛi"
|
|
156
|
+
'ॄ': "rī"
|
|
157
|
+
'े': "e"
|
|
158
|
+
'ॊ': "o"
|
|
159
|
+
'ौ': "au"
|
|
@@ -0,0 +1,111 @@
|
|
|
1
|
+
---
|
|
2
|
+
authority_id: alalc
|
|
3
|
+
id: 1997
|
|
4
|
+
language: kat
|
|
5
|
+
source_script: Geok
|
|
6
|
+
destination_script: Latn
|
|
7
|
+
name: ALA-LC Georgian System (1997)
|
|
8
|
+
url: https://www.loc.gov/catdir/cpso/romanization/georgian.pdf
|
|
9
|
+
creation_date: 1997
|
|
10
|
+
confirmation_date: 1997
|
|
11
|
+
description: |
|
|
12
|
+
Values are shown for the Khutsuri alphabet.
|
|
13
|
+
|
|
14
|
+
notes:
|
|
15
|
+
|
|
16
|
+
tests:
|
|
17
|
+
|
|
18
|
+
- source: ႼႨႢႬႨ
|
|
19
|
+
expected: CIGNI
|
|
20
|
+
|
|
21
|
+
- source: ⴜⴈⴂⴌⴈ
|
|
22
|
+
expected: cigni
|
|
23
|
+
|
|
24
|
+
- source: ႱႭႪႭႫႭႬ
|
|
25
|
+
expected: SOLOMON
|
|
26
|
+
|
|
27
|
+
- source: ⴑⴍⴊⴍⴋⴍⴌ
|
|
28
|
+
expected: solomon
|
|
29
|
+
|
|
30
|
+
- source: ႠႡႰႠჀႠႫ
|
|
31
|
+
expected: ABRAHAM
|
|
32
|
+
|
|
33
|
+
map:
|
|
34
|
+
characters:
|
|
35
|
+
'\u10a0' : 'A' # Ⴀ
|
|
36
|
+
'\u10a1' : 'B' # Ⴁ
|
|
37
|
+
'\u10a2' : 'G' # Ⴂ
|
|
38
|
+
'\u10a3' : 'D' # Ⴃ
|
|
39
|
+
'\u10a4' : 'E' # Ⴄ
|
|
40
|
+
'\u10a5' : 'V' # Ⴅ
|
|
41
|
+
'\u10a6' : 'Z' # Ⴆ
|
|
42
|
+
'\u10a7' : 'Tʻ' # Ⴇ
|
|
43
|
+
'\u10a8' : 'I' # Ⴈ
|
|
44
|
+
'\u10a9' : 'K' # Ⴉ
|
|
45
|
+
'\u10aa' : 'L' # Ⴊ
|
|
46
|
+
'\u10ab' : 'M' # Ⴋ
|
|
47
|
+
'\u10ac' : 'N' # Ⴌ
|
|
48
|
+
'\u10ad' : 'O' # Ⴍ
|
|
49
|
+
'\u10ae' : 'P' # Ⴎ
|
|
50
|
+
'\u10af' : 'Ž' # Ⴏ
|
|
51
|
+
'\u10b0' : 'R' # Ⴐ
|
|
52
|
+
'\u10b1' : 'S' # Ⴑ
|
|
53
|
+
'\u10b2' : 'T' # Ⴒ
|
|
54
|
+
'\u10b3' : 'U' # Ⴓ
|
|
55
|
+
'\u10b4' : 'Pʻ' # Ⴔ
|
|
56
|
+
'\u10b5' : 'Kʻ' # Ⴕ
|
|
57
|
+
'\u10b6' : 'Ġ' # Ⴖ
|
|
58
|
+
'\u10b7' : 'Q' # Ⴗ
|
|
59
|
+
'\u10b8' : 'Š' # Ⴘ
|
|
60
|
+
'\u10b9' : 'Čʻ' # Ⴙ
|
|
61
|
+
'\u10ba' : 'Cʻ' # Ⴚ
|
|
62
|
+
'\u10bb' : 'Ż' # Ⴛ
|
|
63
|
+
'\u10bc' : 'C' # Ⴜ
|
|
64
|
+
'\u10bd' : 'Č' # Ⴝ
|
|
65
|
+
'\u10be' : 'X' # Ⴞ
|
|
66
|
+
'\u10bf' : 'J' # Ⴟ
|
|
67
|
+
'\u10c0' : 'H' # Ⴠ
|
|
68
|
+
'\u10c1' : 'Ē' # Ⴡ
|
|
69
|
+
'\u10c2' : 'Y' # Ⴢ
|
|
70
|
+
'\u10c3' : 'W' # Ⴣ
|
|
71
|
+
'\u10c4' : 'X̣' # Ⴤ
|
|
72
|
+
'\u10c5' : 'Ō' # Ⴥ
|
|
73
|
+
|
|
74
|
+
'\u2d00' : 'a' # ⴀ
|
|
75
|
+
'\u2d01' : 'b' # ⴁ
|
|
76
|
+
'\u2d02' : 'g' # ⴂ
|
|
77
|
+
'\u2d03' : 'd' # ⴃ
|
|
78
|
+
'\u2d04' : 'e' # ⴄ
|
|
79
|
+
'\u2d05' : 'v' # ⴅ
|
|
80
|
+
'\u2d06' : 'z' # ⴆ
|
|
81
|
+
'\u2d07' : 'tʻ' # ⴇ
|
|
82
|
+
'\u2d08' : 'i' # ⴈ
|
|
83
|
+
'\u2d09' : 'k' # ⴉ
|
|
84
|
+
'\u2d0a' : 'l' # ⴊ
|
|
85
|
+
'\u2d0b' : 'm' # ⴋ
|
|
86
|
+
'\u2d0c' : 'n' # ⴌ
|
|
87
|
+
'\u2d0d' : 'o' # ⴍ
|
|
88
|
+
'\u2d0e' : 'p' # ⴎ
|
|
89
|
+
'\u2d0f' : 'ž' # ⴏ
|
|
90
|
+
'\u2d10' : 'r' # ⴐ
|
|
91
|
+
'\u2d11' : 's' # ⴑ
|
|
92
|
+
'\u2d12' : 't' # ⴒ
|
|
93
|
+
'\u2d13' : 'u' # ⴓ
|
|
94
|
+
'\u2d14' : 'pʻ' # ⴔ
|
|
95
|
+
'\u2d15' : 'kʻ' # ⴕ
|
|
96
|
+
'\u2d16' : 'ġ' # ⴖ
|
|
97
|
+
'\u2d17' : 'q' # ⴗ
|
|
98
|
+
'\u2d18' : 'š' # ⴘ
|
|
99
|
+
'\u2d19' : 'čʻ' # ⴙ
|
|
100
|
+
'\u2d1a' : 'cʻ' # ⴚ
|
|
101
|
+
'\u2d1b' : 'ż' # ⴛ
|
|
102
|
+
'\u2d1c' : 'c' # ⴜ
|
|
103
|
+
'\u2d1d' : 'č' # ⴝ
|
|
104
|
+
'\u2d1e' : 'x' # ⴞ
|
|
105
|
+
'\u2d1f' : 'j' # ⴟ
|
|
106
|
+
'\u2d20' : 'h' # ⴠ
|
|
107
|
+
'\u2d21' : 'ē' # ⴡ
|
|
108
|
+
'\u2d22' : 'y' # ⴢ
|
|
109
|
+
'\u2d23' : 'w' # ⴣ
|
|
110
|
+
'\u2d24' : 'x̣' # ⴤ
|
|
111
|
+
'\u2d25' : 'ō' # ⴥ
|
|
@@ -0,0 +1,146 @@
|
|
|
1
|
+
---
|
|
2
|
+
authority_id: alalc
|
|
3
|
+
id: 1997
|
|
4
|
+
language: kat
|
|
5
|
+
source_script: Geor
|
|
6
|
+
destination_script: Latn
|
|
7
|
+
name: ALA-LC Georgian System (1997)
|
|
8
|
+
url: https://www.loc.gov/catdir/cpso/romanization/georgian.pdf
|
|
9
|
+
creation_date: 1997
|
|
10
|
+
confirmation_date: 1997
|
|
11
|
+
description: |
|
|
12
|
+
Values are shown for the older Khutsuri and the modern Mkhedruli alphabets.
|
|
13
|
+
There are no upper case letters in Mkhedruli.
|
|
14
|
+
|
|
15
|
+
notes:
|
|
16
|
+
|
|
17
|
+
tests:
|
|
18
|
+
|
|
19
|
+
- source: ხაოფსე
|
|
20
|
+
expected: xaopʻse
|
|
21
|
+
|
|
22
|
+
- source: ჭლოუ
|
|
23
|
+
expected: člou
|
|
24
|
+
|
|
25
|
+
- source: ჩოხულდი
|
|
26
|
+
expected: čʻoxuldi
|
|
27
|
+
|
|
28
|
+
- source: ქვემო ლინდა
|
|
29
|
+
expected: kʻvemo linda
|
|
30
|
+
|
|
31
|
+
- source: ტამკვაჩ იგვავერა
|
|
32
|
+
expected: tamkvačʻ igvavera
|
|
33
|
+
|
|
34
|
+
- source: სვანეთი
|
|
35
|
+
expected: svanetʻi
|
|
36
|
+
|
|
37
|
+
- source: საცხვარისი
|
|
38
|
+
expected: sacʻxvarisi
|
|
39
|
+
|
|
40
|
+
- source: მუხრან-თელეთი
|
|
41
|
+
expected: muxran-tʻeletʻi
|
|
42
|
+
|
|
43
|
+
- source: მუცდი
|
|
44
|
+
expected: mucʻdi
|
|
45
|
+
|
|
46
|
+
- source: ლეჩხუმი
|
|
47
|
+
expected: lečʻxumi
|
|
48
|
+
|
|
49
|
+
- source: ვერხნაია მწარა
|
|
50
|
+
expected: verxnaia mcara
|
|
51
|
+
|
|
52
|
+
- source: ეგრისის ქედი
|
|
53
|
+
expected: egrisis kʻedi
|
|
54
|
+
|
|
55
|
+
- source: დოჩარიფშა
|
|
56
|
+
expected: dočʻaripʻša
|
|
57
|
+
|
|
58
|
+
- source: ბოლოკო
|
|
59
|
+
expected: boloko
|
|
60
|
+
|
|
61
|
+
- source: აჭანდარა
|
|
62
|
+
expected: ačandara
|
|
63
|
+
|
|
64
|
+
- source: აუალიცა
|
|
65
|
+
expected: aualicʻa
|
|
66
|
+
|
|
67
|
+
- source: აკალამრა
|
|
68
|
+
expected: akalamra
|
|
69
|
+
|
|
70
|
+
- source: ლასილი
|
|
71
|
+
expected: lasili
|
|
72
|
+
|
|
73
|
+
- source: გუბაზეული
|
|
74
|
+
expected: gubazeuli
|
|
75
|
+
|
|
76
|
+
- source: ბაყაყი
|
|
77
|
+
expected: baqaqi
|
|
78
|
+
|
|
79
|
+
- source: ძროხა
|
|
80
|
+
expected: żroxa
|
|
81
|
+
|
|
82
|
+
- source: ჰაერი
|
|
83
|
+
expected: haeri
|
|
84
|
+
|
|
85
|
+
- source: ჟოლო
|
|
86
|
+
expected: žolo
|
|
87
|
+
|
|
88
|
+
- source: ჯართი
|
|
89
|
+
expected: jartʻi
|
|
90
|
+
|
|
91
|
+
- source: ღრმაღელე
|
|
92
|
+
expected: ġrmaġele
|
|
93
|
+
|
|
94
|
+
map:
|
|
95
|
+
characters:
|
|
96
|
+
'\u10d0' : 'a' # ა
|
|
97
|
+
'\u10d1' : 'b' # ბ
|
|
98
|
+
'\u10d2' : 'g' # გ
|
|
99
|
+
'\u10d3' : 'd' # დ
|
|
100
|
+
'\u10d4' : 'e' # ე
|
|
101
|
+
'\u10d5' : 'v' # ვ
|
|
102
|
+
'\u10d6' : 'z' # ზ
|
|
103
|
+
|
|
104
|
+
'\u10f1' : 'ē' # ჱ
|
|
105
|
+
|
|
106
|
+
'\u10d7' : 'tʻ' # თ
|
|
107
|
+
'\u10d8' : 'i' # ი
|
|
108
|
+
'\u10d9' : 'k' # კ
|
|
109
|
+
'\u10da' : 'l' # ლ
|
|
110
|
+
'\u10db' : 'm' # მ
|
|
111
|
+
'\u10dc' : 'n' # ნ
|
|
112
|
+
|
|
113
|
+
'\u10f2' : 'y' # ჲ
|
|
114
|
+
|
|
115
|
+
'\u10dd' : 'o' # ო
|
|
116
|
+
'\u10de' : 'p' # პ
|
|
117
|
+
'\u10df' : 'ž' # ჟ
|
|
118
|
+
'\u10e0' : 'r' # რ
|
|
119
|
+
'\u10e1' : 's' # ს
|
|
120
|
+
'\u10e2' : 't' # ტ
|
|
121
|
+
|
|
122
|
+
'\u10f3' : 'w' # ჳ
|
|
123
|
+
|
|
124
|
+
'\u10e3' : 'u' # უ
|
|
125
|
+
'\u10e4' : 'pʻ' # ფ
|
|
126
|
+
'\u10e5' : 'kʻ' # ქ
|
|
127
|
+
'\u10e6' : 'ġ' # ღ
|
|
128
|
+
'\u10e7' : 'q' # ყ
|
|
129
|
+
'\u10e8' : 'š' # შ
|
|
130
|
+
'\u10e9' : 'čʻ' # ჩ
|
|
131
|
+
'\u10ea' : 'cʻ' # ც
|
|
132
|
+
'\u10eb' : 'ż' # ძ
|
|
133
|
+
'\u10ec' : 'c' # წ
|
|
134
|
+
'\u10ed' : 'č' # ჭ
|
|
135
|
+
'\u10ee' : 'x' # ხ
|
|
136
|
+
|
|
137
|
+
'\u10f4' : 'x̣' # ჴ
|
|
138
|
+
|
|
139
|
+
'\u10ef' : 'j' # ჯ
|
|
140
|
+
'\u10f0' : 'h' # ჰ
|
|
141
|
+
|
|
142
|
+
'\u10f5' : 'ō' # ჵ
|
|
143
|
+
|
|
144
|
+
'\u10f6' : 'f' # ჶ
|
|
145
|
+
'\u10f7' : 'ĕ' # ჷ
|
|
146
|
+
'\u10f8' : 'ʻ' # ჸ
|
|
@@ -0,0 +1,94 @@
|
|
|
1
|
+
---
|
|
2
|
+
authority_id: alalc
|
|
3
|
+
id: 1997
|
|
4
|
+
language: kor
|
|
5
|
+
source_script: Hang
|
|
6
|
+
destination_script: Latn
|
|
7
|
+
name: ALA-LC Romanization Table -- Korean (1997)
|
|
8
|
+
url: http://catdir.loc.gov/catdir/cpso/romanization/korean.pdf
|
|
9
|
+
creation_date: 1997
|
|
10
|
+
adoption_date:
|
|
11
|
+
description:
|
|
12
|
+
"1. General Practice
|
|
13
|
+
The Library of Congress will continue to follow the McCune-Reischauer system
|
|
14
|
+
to romanize Korean with the exceptions noted in this document. See:
|
|
15
|
+
Romanization of the Korean Language: Based upon its Phonetic Structure by
|
|
16
|
+
G.M. McCune and E.O. Reischauer ([S.l.: s.n., 1939?]), reprinted from the
|
|
17
|
+
Transactions of the Korea Branch of the Royal Asiatic Society. Full text of the
|
|
18
|
+
original document is available online from the National Library of Australia Web
|
|
19
|
+
site: http://www.nla.gov.au/librariesaustralia/cjk/download/ras_1939.pdf"
|
|
20
|
+
|
|
21
|
+
notes:
|
|
22
|
+
|
|
23
|
+
|
|
24
|
+
tests:
|
|
25
|
+
- source: 은하-리
|
|
26
|
+
expected: "Ŭnha-ri"
|
|
27
|
+
- source: 은중-리
|
|
28
|
+
expected: "Ŭnjung-ni"
|
|
29
|
+
- source: 은장-령
|
|
30
|
+
expected: "Ŭnjang-nyŏng"
|
|
31
|
+
- source: 은혜-동
|
|
32
|
+
expected: "Ŭnhye-dong"
|
|
33
|
+
- source: 은호-리
|
|
34
|
+
expected: "Ŭnho-ri"
|
|
35
|
+
- source: 은행정
|
|
36
|
+
expected: "Ŭnhaengjŏng"
|
|
37
|
+
- source: 은행-동
|
|
38
|
+
expected: "Ŭnhaeng-dong"
|
|
39
|
+
- source: 은행-촌
|
|
40
|
+
expected: "Ŭnhaeng-ch’on"
|
|
41
|
+
- source: 원수
|
|
42
|
+
expected: "Wŏnsu"
|
|
43
|
+
- source: 원소리-고개
|
|
44
|
+
expected: "Wŏnsori-gogae"
|
|
45
|
+
- source: 원소참
|
|
46
|
+
expected: "Wŏnsoch’am"
|
|
47
|
+
- source: 원소-리
|
|
48
|
+
expected: "Wŏnso-ri"
|
|
49
|
+
- source: 원신-리
|
|
50
|
+
expected: "Wŏnsil-li"
|
|
51
|
+
- source: 난곡
|
|
52
|
+
expected: "Nan’gok"
|
|
53
|
+
- source: 난산-리
|
|
54
|
+
expected: "Nansal-li"
|
|
55
|
+
- source: 난직
|
|
56
|
+
expected: "Nanjik"
|
|
57
|
+
- source: 영곡
|
|
58
|
+
expected: "Yŏnggok"
|
|
59
|
+
- source: 윗두밀
|
|
60
|
+
expected: "Wittumil"
|
|
61
|
+
- source: 윗도심이
|
|
62
|
+
expected: "Wittosimi"
|
|
63
|
+
- source: 둔지
|
|
64
|
+
expected: "Tunji"
|
|
65
|
+
- source: 서승
|
|
66
|
+
expected: "Sŏsŭng"
|
|
67
|
+
# - source: 신촌
|
|
68
|
+
# expected: "Sinch’on"
|
|
69
|
+
- source: 비암덕
|
|
70
|
+
expected: "Piamdŏk"
|
|
71
|
+
- source: 바위안
|
|
72
|
+
expected: "Pawian"
|
|
73
|
+
- source: 오송평
|
|
74
|
+
expected: "Osongp’yŏng"
|
|
75
|
+
- source: 그물목
|
|
76
|
+
expected: "Kŭmulmok"
|
|
77
|
+
- source: 구원정
|
|
78
|
+
expected: "Kuwŏnjŏng"
|
|
79
|
+
- source: 일하
|
|
80
|
+
expected: "Irha"
|
|
81
|
+
- source: 황우
|
|
82
|
+
expected: "Hwangu"
|
|
83
|
+
- source: 자작보
|
|
84
|
+
expected: "Chajakpo"
|
|
85
|
+
# - source: 비파1-동
|
|
86
|
+
# expected: "Pip’a Il-tong"
|
|
87
|
+
- source: 문암 오-동
|
|
88
|
+
expected: "Munam O-dong"
|
|
89
|
+
|
|
90
|
+
map:
|
|
91
|
+
character_separator: ""
|
|
92
|
+
word_separator: " "
|
|
93
|
+
title_case: True
|
|
94
|
+
inherit: "var-kor-Hang-Latn-mr-1939"
|