interscript 0.1.1 → 0.1.6

Sign up to get free protection for your applications and to get access to all the features.
Files changed (170) hide show
  1. checksums.yaml +4 -4
  2. data/README.adoc +250 -17
  3. data/bin/interscript +38 -17
  4. data/bin/setup +8 -0
  5. data/lib/__pycache__/g2pwrapper.cpython-38.pyc +0 -0
  6. data/lib/g2pwrapper.py +34 -0
  7. data/lib/interscript-opal.rb +2 -0
  8. data/lib/interscript.rb +138 -20
  9. data/lib/interscript/command.rb +28 -0
  10. data/lib/interscript/fs.rb +71 -0
  11. data/lib/interscript/mapping.rb +142 -0
  12. data/lib/interscript/opal.rb +27 -0
  13. data/lib/interscript/opal/maps.js.erb +10 -0
  14. data/lib/interscript/opal_map_translate.rb +12 -0
  15. data/lib/interscript/version.rb +1 -1
  16. data/lib/model-7 +0 -0
  17. data/lib/tha-pt-b-7 +0 -0
  18. data/maps/acadsin-zho-Hani-Latn-2002.yaml +38912 -0
  19. data/maps/alalc-amh-Ethi-Latn-1997.yaml +509 -0
  20. data/maps/alalc-amh-Ethi-Latn-2011.yaml +138 -0
  21. data/maps/alalc-ara-Arab-Latn-1997.yaml +1283 -0
  22. data/maps/alalc-asm-Deva-Latn-1997.yaml +159 -0
  23. data/maps/alalc-aze-Cyrl-Latn-1997.yaml +141 -0
  24. data/maps/alalc-bel-Cyrl-Latn-1997.yaml +125 -0
  25. data/maps/alalc-ben-Beng-Latn-2017.yaml +130 -0
  26. data/maps/alalc-bul-Cyrl-Latn-1997.yaml +94 -0
  27. data/maps/alalc-ell-Grek-Latn-1997.yaml +624 -0
  28. data/maps/alalc-ell-Grek-Latn-2010.yaml +627 -0
  29. data/maps/alalc-hin-Deva-Latn-2020.yaml +159 -0
  30. data/maps/alalc-kat-Geok-Latn-1997.yaml +111 -0
  31. data/maps/alalc-kat-Geor-Latn-1997.yaml +146 -0
  32. data/maps/alalc-kor-Hang-Latn-1997.yaml +94 -0
  33. data/maps/alalc-mar-Deva-Latn-1997.yaml +170 -0
  34. data/maps/alalc-mkd-Cyrl-Latn-1997.yaml +114 -0
  35. data/maps/alalc-mkd-Cyrl-Latn-2013.yaml +103 -0
  36. data/maps/alalc-pan-Deva-Latn-1997.yaml +237 -0
  37. data/maps/alalc-rus-Cyrl-Latn-1997.yaml +221 -0
  38. data/maps/alalc-rus-Cyrl-Latn-2012.yaml +162 -0
  39. data/maps/alalc-srp-Cyrl-Latn-1997.yaml +114 -0
  40. data/maps/alalc-srp-Cyrl-Latn-2013.yaml +135 -0
  41. data/maps/alalc-ukr-Cyrl-Latn-1997.yaml +141 -0
  42. data/maps/alalc-ukr-Cyrl-Latn-2011.yaml +16 -0
  43. data/maps/apcbg-bul-Cyrl-Latn-1995.yaml +283 -0
  44. data/maps/bas-rus-Cyrl-Latn-2017-bss.yaml +174 -0
  45. data/maps/bas-rus-Cyrl-Latn-2017-oss.yaml +169 -0
  46. data/maps/bgn-jpn-Hrkt-Latn-1962.yaml +292 -0
  47. data/maps/bgn-kor-Hang-Latn-1943.yaml +31 -0
  48. data/maps/bgn-kor-Kore-Latn-1943.yaml +31 -0
  49. data/maps/bgna-bul-Cyrl-Latn-2006.yaml +208 -0
  50. data/maps/bgna-bul-Cyrl-Latn-2009.yaml +208 -0
  51. data/maps/bgnpcgn-amh-Ethi-Latn-1967.yaml +528 -0
  52. data/maps/bgnpcgn-ara-Arab-Latn-1956.yaml +592 -0
  53. data/maps/bgnpcgn-arm-Armn-Latn-1981.yaml +108 -0
  54. data/maps/bgnpcgn-aze-Cyrl-Latn-1993.yaml +104 -0
  55. data/maps/bgnpcgn-bak-Cyrl-Latn-2007.yaml +184 -0
  56. data/maps/bgnpcgn-bel-Cyrl-Latn-1979.yaml +285 -0
  57. data/maps/bgnpcgn-bul-Cyrl-Latn-1952.yaml +115 -0
  58. data/maps/bgnpcgn-bul-Cyrl-Latn-2013.yaml +38 -0
  59. data/maps/bgnpcgn-ell-Grek-Latn-1962.yaml +701 -0
  60. data/maps/bgnpcgn-ell-Grek-Latn-1996.yaml +19 -0
  61. data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.yaml +257 -0
  62. data/maps/bgnpcgn-kat-Geor-Latn-1981.yaml +127 -0
  63. data/maps/bgnpcgn-kat-Geor-Latn-2009.yaml +42 -0
  64. data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.yaml +253 -0
  65. data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.yaml +48 -0
  66. data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.yaml +48 -0
  67. data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.yaml +159 -0
  68. data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.yaml +190 -0
  69. data/maps/bgnpcgn-nep-Deva-Latn-2011.yaml +200 -0
  70. data/maps/bgnpcgn-per-Arab-Latn-1956.yaml +92 -0
  71. data/maps/bgnpcgn-rus-Cyrl-Latn-1947.yaml +314 -0
  72. data/maps/bgnpcgn-srp-Cyrl-Latn-2005.yaml +166 -0
  73. data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.yaml +162 -0
  74. data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.yaml +208 -0
  75. data/maps/bgnpcgn-zho-Hans-Latn-1979.yaml +7456 -0
  76. data/maps/bis-asm-Beng-Latn-13194-1991.yaml +159 -0
  77. data/maps/bis-ben-Beng-Latn-13194-1991.yaml +156 -0
  78. data/maps/bis-dev-Deva-Latn-13194-1991.yaml +184 -0
  79. data/maps/bis-gjr-Gujr-Latn-13194-1991.yaml +166 -0
  80. data/maps/bis-knd-Knda-Latn-13194-1991.yaml +173 -0
  81. data/maps/bis-mlm-Mlym-Latn-13194-1991.yaml +176 -0
  82. data/maps/bis-ori-Orya-Latn-13194-1991.yaml +160 -0
  83. data/maps/bis-pnj-Guru-Latn-13194-1991.yaml +175 -0
  84. data/maps/bis-tel-Telu-Latn-13194-1991.yaml +170 -0
  85. data/maps/bis-tml-Taml-Latn-13194-1991.yaml +155 -0
  86. data/maps/by-bel-Cyrl-Latn-1998.yaml +168 -0
  87. data/maps/by-bel-Cyrl-Latn-2007.yaml +115 -0
  88. data/maps/dos-nep-Deva-Latn-1997.yaml +33 -0
  89. data/maps/elot-ell-Grek-Latn-743-1982-tl.yaml +684 -0
  90. data/maps/elot-ell-Grek-Latn-743-1982-ts.yaml +680 -0
  91. data/maps/elot-ell-Grek-Latn-743-2001-tl.yaml +19 -0
  92. data/maps/elot-ell-Grek-Latn-743-2001-ts.yaml +31 -0
  93. data/maps/ggg-kat-Geor-Latn-2002.yaml +88 -0
  94. data/maps/gki-bel-Cyrl-Latn-1992.yaml +33 -0
  95. data/maps/gki-bel-Cyrl-Latn-2000.yaml +201 -0
  96. data/maps/gost-rus-Cyrl-Latn-16876-71-1983.yaml +186 -0
  97. data/maps/hk-yue-Hani-Latn-1888.yaml +38497 -0
  98. data/maps/icao-bel-Cyrl-Latn-9303.yaml +136 -0
  99. data/maps/icao-bul-Cyrl-Latn-9303.yaml +118 -0
  100. data/maps/icao-heb-Hebr-Latn-9303.yaml +151 -0
  101. data/maps/icao-mkd-Cyrl-Latn-9303.yaml +117 -0
  102. data/maps/icao-per-Arab-Latn-9303.yaml +103 -0
  103. data/maps/icao-rus-Cyrl-Latn-9303.yaml +117 -0
  104. data/maps/icao-srp-Cyrl-Latn-9303.yaml +117 -0
  105. data/maps/icao-ukr-Cyrl-Latn-9303.yaml +119 -0
  106. data/maps/iso-ara-Arab-Latn-233-1984.yaml +323 -0
  107. data/maps/iso-ell-Grek-Latn-843-1997-t1.yaml +609 -0
  108. data/maps/iso-ell-Grek-Latn-843-1997-t2.yaml +40 -0
  109. data/maps/iso-jpn-Hrkt-Latn-3602-1989.yaml +62 -0
  110. data/maps/iso-rus-Cyrl-Latn-9-1995.yaml +271 -0
  111. data/maps/iso-tha-Thai-Latn-11940-1998.yaml +109 -0
  112. data/maps/kp-kor-Hang-Latn-2002.yaml +901 -0
  113. data/maps/lshk-yue-Hani-Latn-jyutping-1993.yaml +44820 -0
  114. data/maps/mext-jpn-Hrkt-Latn-1954.yaml +411 -0
  115. data/maps/moct-kor-Hang-Latn-2000.yaml +803 -0
  116. data/maps/mofa-jpn-Hrkt-Latn-1989.yaml +541 -0
  117. data/maps/mvd-bel-Cyrl-Latn-2008.yaml +225 -0
  118. data/maps/mvd-bel-Cyrl-Latn-2010.yaml +63 -0
  119. data/maps/mvd-rus-Cyrl-Latn-2008.yaml +109 -0
  120. data/maps/mvd-rus-Cyrl-Latn-2010.yaml +37 -0
  121. data/maps/nil-kor-Hang-Hang-jamo.yaml +11193 -0
  122. data/maps/odni-aze-Cyrl-Latn-2015.yaml +144 -0
  123. data/maps/odni-bel-Cyrl-Latn-2015.yaml +148 -0
  124. data/maps/odni-bul-Cyrl-Latn-2015.yaml +96 -0
  125. data/maps/odni-hin-Deva-Latn-2015.yaml +258 -0
  126. data/maps/odni-kat-Geor-Latn-2015.yaml +87 -0
  127. data/maps/odni-kaz-Cyrl-Latn-2015.yaml +148 -0
  128. data/maps/odni-kir-Cyrl-Latn-2015.yaml +136 -0
  129. data/maps/odni-mkd-Cyrl-Latn-2015.yaml +122 -0
  130. data/maps/odni-rus-Cyrl-Latn-2015.yaml +77 -0
  131. data/maps/odni-srp-Cyrl-Latn-2015.yaml +129 -0
  132. data/maps/odni-tat-Cyrl-Latn-2015.yaml +142 -0
  133. data/maps/odni-tgk-Cyrl-Latn-2015.yaml +148 -0
  134. data/maps/odni-uig-Cyrl-Latn-2015.yaml +138 -0
  135. data/maps/odni-ukr-Cyrl-Latn-2015.yaml +157 -0
  136. data/maps/odni-urd-Arab-Latn-2015.yaml +221 -0
  137. data/maps/odni-uzb-Cyrl-Latn-2015.yaml +166 -0
  138. data/maps/royin-tha-Thai-Latn-1939-generic.yaml +90 -0
  139. data/maps/royin-tha-Thai-Latn-1968.yaml +179 -0
  140. data/maps/royin-tha-Thai-Latn-1999-chained.yaml +180 -0
  141. data/maps/royin-tha-Thai-Latn-1999.yaml +76 -0
  142. data/maps/sac-zho-Hans-Latn-1979.yaml +24759 -0
  143. data/maps/ses-ara-Arab-Latn-1930.yaml +279 -0
  144. data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.yaml +222 -0
  145. data/maps/ua-ukr-Cyrl-Latn-1996.yaml +193 -0
  146. data/maps/un-ara-Arab-Latn-1971.yaml +139 -0
  147. data/maps/un-ara-Arab-Latn-1972.yaml +159 -0
  148. data/maps/un-ara-Arab-Latn-2017.yaml +420 -0
  149. data/maps/un-bel-Cyrl-Latn-2007.yaml +114 -0
  150. data/maps/un-ben-Beng-Latn-2016.yaml +534 -0
  151. data/maps/un-ell-Grek-Latn-1987-tl.yaml +31 -0
  152. data/maps/un-ell-Grek-Latn-1987-ts.yaml +19 -0
  153. data/maps/un-ell-Grek-Latn-phonetic-1987.yaml +780 -0
  154. data/maps/un-mon-Mong-Latn-2013.yaml +99 -0
  155. data/maps/un-nep-Deva-Latn-1972.yaml +163 -0
  156. data/maps/un-rus-Cyrl-Latn-1987.yaml +166 -0
  157. data/maps/un-ukr-Cyrl-Latn-1998.yaml +30 -0
  158. data/maps/ungegn-amh-Ethi-Latn-2016.yaml +575 -0
  159. data/maps/var-jpn-Hrkt-Latn-hepburn-1886.yaml +406 -0
  160. data/maps/var-jpn-Hrkt-Latn-hepburn-1954.yaml +386 -0
  161. data/maps/var-kor-Hang-Latn-mr-1939.yaml +1054 -0
  162. data/maps/var-kor-Kore-Hang-2013.yaml +59754 -0
  163. data/maps/var-kor-Kore-Latn-mr-1939.yaml +36 -0
  164. data/maps/var-tha-Thai-Thai-phonemic.yaml +59 -0
  165. data/maps/var-tha-Thai-Zsym-ipa.yaml +301 -0
  166. data/maps/var-zho-Hani-Latn-1979.yaml +38908 -0
  167. data/spec/interscript/mapping_spec.rb +42 -0
  168. data/spec/interscript_spec.rb +26 -0
  169. data/spec/spec_helper.rb +3 -0
  170. metadata +298 -18
@@ -0,0 +1,155 @@
1
+ ---
2
+ authority_id: bis
3
+ id: 1991
4
+ language: tml
5
+ source_script: Taml
6
+ destination_script: Latn
7
+ name: Indian script code for information interchange - ISCII - Tamil Romanization
8
+ #url:
9
+ creation_date: 1991
10
+ description: |
11
+ IS 13194 (1991): Indian script code for information
12
+ interchange - ISCII [LITD 20: Indian Language Technologies
13
+ and Products]
14
+
15
+ notes:
16
+ - |
17
+ Exception: Anusvāra is transliterated by:
18
+
19
+ a) ṅ before gutturals,
20
+ b) ñ before palatals,
21
+ c) ṇ before cerebrals,
22
+ d) n before dentals, and
23
+ e) m before labials.
24
+
25
+ tests:
26
+ - source: "இளைஞர்களின் உறுதியான மனநிலையை பிரதிபலிக்கிறது: நீட் தேர்வில் 85-90 சதவீத மாணவர்கள் பங்கேற்பு - ரமேஷ் பொக்ரியால்"
27
+ expected: "iḷaiñrkḷiṉ uṟutiyāṉ mṉnilaiyai pirtiplikkiṟtu: nīṭ tērvil 85-90 ctvīt māṇvrkḷ pṅkēṟpu - rmēṣ pokriyāl"
28
+ - source: "நாடாளுமன்றத்தில் 4 மசோதாக்களை எதிர்க்க காங்கிரஸ் முடிவு - ஜெயராம் ரமேஷ்"
29
+ expected: "nāṭāḷumṉṟttil 4 mcōtākkḷai etirkk kāṅkirs muṭivu - jeyrām rmēṣ"
30
+ - source: "கர்நாடகாவில் மேலும் 9,894 பேருக்கு கொரோனா தொற்று உறுதி"
31
+ expected: "krnāṭkāvil mēlum 9,894 pērukku korōṉā toṟṟu uṟuti"
32
+ - source: "ஐதராபாத்துக்கு கைகொடுக்குமா அதிரடி?"
33
+ expected: "aitrāpāttukku kaikoṭukkumā atirṭi?"
34
+ - source: "அமெரிக்க ஓபன் டென்னிஸ்: இறுதிப்போட்டியில் டொமினிக்-ஸ்வெரேவ்"
35
+ expected: "amerikk ŏpṉ ṭeṉṉis: iṟutippōṭṭiyil ṭomiṉik-sverēv"
36
+ - source: "ஐ.பி.எல். கிரிக்கெட்டில் களம் இறங்கும் அமெரிக்க வீரர்"
37
+ expected: "ai.pi.el. kirikkeṭṭil kḷm iṟṅkum amerikk vīrr"
38
+ - source: "அமெரிக்க ஓபன் டென்னிஸ்; நவோமி ஒசாகா சாம்பியன் பட்டம் வென்றார்"
39
+ expected: "amerikk ŏpṉ ṭeṉṉis; nvōmi ocākā cāmpiyṉ pṭṭm veṉṟār"
40
+ - source: "புதிய கல்விக்கொள்கைக்கு எதிர்ப்பு: முன்னாள் துணைவேந்தர்கள் 20 பேர் பிரதமருக்கு கடிதம்"
41
+ expected: "putiy klvikkoḷkaikku etirppu: muṉṉāḷ tuṇaivēntrkḷ 20 pēr pirtmrukku kṭitm"
42
+ - source: "இந்த ஆண்டு ஐ.பி.எல். கோப்பையை எந்த அணி வெல்லும்? - கெவின் பீட்டர்சன் கணிப்பு"
43
+ expected: "int āṇṭu ai.pi.el. kōppaiyai ent aṇi vellum? - keviṉ pīṭṭrcṉ kṇippu"
44
+ - source: "இந்திய எண்ணெய் கப்பலில் தீ: விபத்து குறித்த எச்சரிக்கையை கப்பல் அதிகாரிகள் புறக்கணித்தனர் - இலங்கை கோர்ட்டு தகவல்"
45
+ expected: "intiy eṇṇey kpplil tī: vipttu kuṟitt eccrikkaiyai kppl atikārikḷ puṟkkṇittṉr - ilṅkai kōrṭṭu tkvl"
46
+
47
+ map:
48
+
49
+ rules:
50
+ # Anusvāra (U+0B82) is rendered as the nasal matching the class of the following consonant (see notes)
51
+ - pattern: \u0B82(?=[கங])
52
+ result: ṅ
53
+ - pattern: \u0B82(?=[சஜஞ])
54
+ result: ñ
55
+ - pattern: \u0B82(?=[டண])
56
+ result: ṇ
57
+ - pattern: \u0B82(?=[தநன])
58
+ result: n
59
+ - pattern: \u0B82(?=[பம])
60
+ result: m
61
+
62
+ characters:
63
+ 'அ': 'a'
64
+ 'ஆ': 'ā'
65
+ 'இ': 'i'
66
+ 'ஈ': 'ī'
67
+ 'உ': 'u'
68
+ 'ஊ': 'ū'
69
+
70
+ 'எ': 'e'
71
+ 'ஏ': 'ē'
72
+ 'ஐ': 'ai'
73
+
74
+ 'ஒ': 'o'
75
+ 'ஓ': 'ŏ'
76
+ 'ஔ': 'au'
77
+
78
+ # II. Consonants (see Note 2)
79
+ # Gutturals
80
+ 'க': 'k'
81
+ 'ங': 'ṅ'
82
+
83
+ # Palatals
84
+ 'ச': 'c'
85
+ 'ஜ': 'j'
86
+ 'ஞ': 'ñ'
87
+
88
+ # Cerebrals
89
+ 'ட': 'ṭ'
90
+ 'ண': 'ṇ'
91
+
92
+ # Dentals
93
+ 'த': 't'
94
+ 'ந': 'n'
95
+ 'ன': 'ṉ'
96
+
97
+ # Labials
98
+ 'ப': 'p'
99
+ 'ம': 'm'
100
+
101
+ # Semivowels
102
+ 'ய': 'y'
103
+ 'ர': 'r'
104
+ 'ற': 'ṟ'
105
+ 'ல': 'l'
106
+ 'ள': 'ḷ'
107
+ 'ழ': 'ẕ'
108
+
109
+
110
+ # Sibilants
111
+ 'வ': 'v'
112
+ 'ஶ': 'ś'
113
+ 'ஷ': 'ṣ'
114
+ 'ஸ': 's'
115
+
116
+
117
+ # Aspirate
118
+ 'ஹ': 'h'
119
+
120
+
121
+ # Bisarga
122
+ 'ஃ': 'ḥ'
123
+
124
+ # Anusvāra
125
+ 'ஂ': 'ṃ'
126
+
127
+ # Medials # Needed for connecting consonants
128
+
129
+ 'ா': 'ā'
130
+ 'ி': 'i'
131
+ 'ீ': 'ī'
132
+ 'ு': 'u'
133
+ 'ூ': 'ū'
134
+
135
+ 'ൃ': "ṛ"
136
+ 'ൄ': "ṝ"
137
+
138
+
139
+ 'ெ': "e"
140
+ 'ே': "ē"
141
+ 'ை': "ai"
142
+ 'ொ': 'o'
143
+ 'ோ': 'ō'
144
+ 'ௌ': 'au'
145
+
146
+
147
+ 'ൺ': 'n'
148
+ 'ൻ': 'ṇ'
149
+
150
+ '्': ''
151
+ '്': ''
152
+ '்': ''
153
+ 'ൗ': ''
154
+ "‍": '' # no need for zero width joiner
155
+ "‌": '' # no need for zero width non-joiner
@@ -0,0 +1,168 @@
1
+ ---
2
+ authority_id: by
3
+ id: 1998
4
+ language: bel
5
+ source_script: Cyrl
6
+ destination_script: Latn
7
+ name: National System of Geographic Names Transmission into Roman Alphabet in Belarus
8
+ url: https://unstats.un.org/unsd/geoinfo/UNGEGN/docs/20th-gegn-docs/20th_gegn_WP34.pdf
9
+ creation_date: 1998
10
+ description: |
11
+ The national system of romanization for Belarusian was approved by the State Committee on Land Resources,
12
+ Geodesy and Cartography, Republic of Belarus, on 20 March, 1998. This scheme was also supported by
13
+ the Y. Kolas Institute of Linguistics and the Republic Committee on Toponymy at the Belarusian Academy of Sciences.
14
+ While the system is still based on GOST 1983, it takes more precisely into account the peculiarities of
15
+ the Belarusian orthography. The system is reversible though there may exist some ambiguous consonant combinations.
16
+
17
+ tests: # the same as in by-bel-Cyrl-Latn-2007
18
+ - source: Аршанскi
19
+ expected: Aršanski
20
+ - source: Бешанковічы
21
+ expected: Biešankovičy
22
+ - source: Віцебск
23
+ expected: Viciebsk
24
+ - source: Гомель
25
+ expected: Homieĺ
26
+ - source: Гаўя
27
+ expected: Haŭja
28
+ - source: Добруш
29
+ expected: Dobruš
30
+ - source: Ельск
31
+ expected: Jeĺsk
32
+ - source: Бабаедава
33
+ expected: Babajedava
34
+ - source: Венцавічы
35
+ expected: Viencavičy
36
+ - source: Ёды
37
+ expected: Jody
38
+ - source: Вераб'ёвічы
39
+ expected: Vierabjovičy
40
+ - source: Мёры
41
+ expected: Miory
42
+ - source: Зэльва
43
+ expected: Zeĺva
44
+ - source: Iванава
45
+ expected: Ivanava
46
+ - source: Iўе
47
+ expected: Iŭje
48
+ - source: Лагойск
49
+ expected: Lahojsk
50
+ - source: Круглае
51
+ expected: Kruhlaje
52
+ - source: Лошыца
53
+ expected: Lošyca
54
+ - source: Любань
55
+ expected: Liubań
56
+ - source: Магілёў
57
+ expected: Mahilioŭ
58
+ - source: Нясвіж
59
+ expected: Niasviž
60
+ - source: Орша
61
+ expected: Orša
62
+ - source: Паставы
63
+ expected: Pastavy
64
+ - source: Рагачоў
65
+ expected: Rahačoŭ
66
+ - source: Смаргонь
67
+ expected: Smarhoń
68
+ - source: Талачын
69
+ expected: Talačyn
70
+ - source: Узда
71
+ expected: Uzda
72
+ - source: Шаркаўшчына
73
+ expected: Šarkaŭščyna
74
+ - source: Фаніпаль
75
+ expected: Fanipaĺ
76
+ - source: Хоцімск
77
+ expected: Chocimsk
78
+ - source: Цёмны Лес
79
+ expected: Ciomny Lies
80
+ - source: Чавусы
81
+ expected: Čavusy
82
+ - source: Шумілiна
83
+ expected: Šumilina
84
+ - source: Чыгірынка
85
+ expected: Čyhirynka
86
+ - source: Чэрвень
87
+ expected: Červień
88
+ - source: Друць
89
+ expected: Druć
90
+ - source: Чачэрск
91
+ expected: Čačersk
92
+ - source: Юхнаўка
93
+ expected: Juchnaŭka
94
+ - source: Гаюціна
95
+ expected: Hajucina
96
+ - source: Цюрлі
97
+ expected: Ciurli
98
+ - source: Любонічы
99
+ expected: Liuboničy
100
+ - source: Ямнае
101
+ expected: Jamnaje
102
+ - source: Баяры
103
+ expected: Bajary
104
+ - source: Валяр'яны
105
+ expected: Valiarjany
106
+ - source: Вязынка
107
+ expected: Viazynka
108
+
109
+ map:
110
+ inherit: gost-rus-Cyrl-Latn-16876-71-1983
111
+
112
+ rules:
113
+ - pattern: (?<=[БбВвГгДдЖжЗзЙйКкЛлМмНнПпРрСсТтФфХхЦцЧчШш])\u0415 # Е after consonants
114
+ result: IE
115
+ - pattern: (?<=[БбВвГгДдЖжЗзЙйКкЛлМмНнПпРрСсТтФфХхЦцЧчШш])\u0435 # е after consonants
116
+ result: ie
117
+ - pattern: (?<=[БбВвГгДдЖжЗзЙйКкЛлМмНнПпРрСсТтФфХхЦцЧчШш])\u0401 # Ё after consonants
118
+ result: IO
119
+ - pattern: (?<=[БбВвГгДдЖжЗзЙйКкЛлМмНнПпРрСсТтФфХхЦцЧчШш])\u0451 # ё after consonants
120
+ result: io
121
+ - pattern: (?<=[БбВвГгДдЖжЗзЙйКкЛлМмНнПпРрСсТтФфХхЦцЧчШш])\u042E # Ю after consonants
122
+ result: IU
123
+ - pattern: (?<=[БбВвГгДдЖжЗзЙйКкЛлМмНнПпРрСсТтФфХхЦцЧчШш])\u044E # ю after consonants
124
+ result: iu
125
+ - pattern: (?<=[БбВвГгДдЖжЗзЙйКкЛлМмНнПпРрСсТтФфХхЦцЧчШш])\u042F # Я after consonants
126
+ result: IA
127
+ - pattern: (?<=[БбВвГгДдЖжЗзЙйКкЛлМмНнПпРрСсТтФфХхЦцЧчШш])\u044F # я after consonants
128
+ result: ia
129
+ - pattern: \u0417\u042C # ЗЬ
130
+ result: "\u0179"
131
+ - pattern: \u0437\u044C # зь
132
+ result: "\u017A"
133
+ - pattern: \u041B\u042C # ЛЬ
134
+ result: "\u0139"
135
+ - pattern: \u043B\u044C # ль
136
+ result: "\u013A"
137
+ - pattern: \u0421\u042C # СЬ
138
+ result: "\u015A"
139
+ - pattern: \u0441\u044C # сь
140
+ result: "\u015B"
141
+ - pattern: \u0426\u042C # ЦЬ
142
+ result: "\u0106"
143
+ - pattern: \u0446\u044C # ць
144
+ result: "\u0107"
145
+ - pattern: \u041D\u042C # НЬ
146
+ result: "\u0143"
147
+ - pattern: \u043D\u044C # нь
148
+ result: "\u0144"
149
+ characters:
150
+ '\u0406' : 'I' # І
151
+ '\u0413' : 'H' # Г
152
+ '\u0415' : 'Je' # Е
153
+ '\u0401' : 'Jo' # Ё
154
+ '\u040E' : 'Ŭ' # Ў
155
+ '\u0425' : 'Ch' # Х
156
+ '\u042C' : '' # Ь
157
+ '\u042D' : 'E' # Э
158
+
159
+ '\u0433' : 'h' # г
160
+ '\u0456' : 'i' # і
161
+ '\u0435' : 'je' # е
162
+ '\u0451' : 'jo' # ё
163
+ '\u045E' : 'ŭ' # ў
164
+ '\u0445' : 'ch' # х
165
+ '\u044C' : '' # ь
166
+ '\u044D' : 'e' # э
167
+
168
+ '\u0027' : '' # '
@@ -0,0 +1,115 @@
1
+ ---
2
+ authority_id: by
3
+ id: 2007
4
+ language: bel
5
+ source_script: Cyrl
6
+ destination_script: Latn
7
+ name: REGULATORY LEGAL ACTS OF THE NATIONAL BANK, NATIONAL ACADEMY OF SCIENCES OF BELARUS, MINISTRIES, OTHER REPUBLICAN GOVERNMENT BODIES 8/16668
8
+ url: http://www.pravo.by/pdf/2007-159/2007-159(027-028).pdf
9
+ creation_date: 2007
10
+ description: |
11
+ RESOLUTION OF THE STATE COMMITTEE
12
+ ON PROPERTY OF THE REPUBLIC OF BELARUS June 11, 2007 No. 38
13
+
14
+ 8/16668 (06/18/2007) On amendments and additions to the Instructions
15
+ for the transliteration of geographical names of the
16
+ Republic of Belarus in letters of the Latin alphabet
17
+
18
+ Based on the Regulation on the State Property Committee of the Republic of Belarus,
19
+ approved by the Decree of the Council of Ministers of the Republic of Belarus dated July 29, 2006
20
+ No. 958 "Issues of the State Committee on Property of the Republic of Belarus"
21
+
22
+ tests:
23
+ - source: Аршанскi
24
+ expected: Aršanski
25
+ - source: Бешанковічы
26
+ expected: Biešankovičy
27
+ - source: Віцебск
28
+ expected: Viciebsk
29
+ - source: Гомель
30
+ expected: Homieĺ
31
+ - source: Гаўя
32
+ expected: Haŭja
33
+ - source: Добруш
34
+ expected: Dobruš
35
+ - source: Ельск
36
+ expected: Jeĺsk
37
+ - source: Бабаедава
38
+ expected: Babajedava
39
+ - source: Венцавічы
40
+ expected: Viencavičy
41
+ - source: Ёды
42
+ expected: Jody
43
+ - source: Вераб'ёвічы
44
+ expected: Vierabjovičy
45
+ - source: Мёры
46
+ expected: Miory
47
+ - source: Зэльва
48
+ expected: Zeĺva
49
+ - source: Iванава
50
+ expected: Ivanava
51
+ - source: Iўе
52
+ expected: Iŭje
53
+ - source: Лагойск
54
+ expected: Lahojsk
55
+ - source: Круглае
56
+ expected: Kruhlaje
57
+ - source: Лошыца
58
+ expected: Lošyca
59
+ - source: Любань
60
+ expected: Liubań
61
+ - source: Магілёў
62
+ expected: Mahilioŭ
63
+ - source: Нясвіж
64
+ expected: Niasviž
65
+ - source: Орша
66
+ expected: Orša
67
+ - source: Паставы
68
+ expected: Pastavy
69
+ - source: Рагачоў
70
+ expected: Rahačoŭ
71
+ - source: Смаргонь
72
+ expected: Smarhoń
73
+ - source: Талачын
74
+ expected: Talačyn
75
+ - source: Узда
76
+ expected: Uzda
77
+ - source: Шаркаўшчына
78
+ expected: Šarkaŭščyna
79
+ - source: Фаніпаль
80
+ expected: Fanipaĺ
81
+ - source: Хоцімск
82
+ expected: Chocimsk
83
+ - source: Цёмны Лес
84
+ expected: Ciomny Lies
85
+ - source: Чавусы
86
+ expected: Čavusy
87
+ - source: Шумілiна
88
+ expected: Šumilina
89
+ - source: Чыгірынка
90
+ expected: Čyhirynka
91
+ - source: Чэрвень
92
+ expected: Červień
93
+ - source: Друць
94
+ expected: Druć
95
+ - source: Чачэрск
96
+ expected: Čačersk
97
+ - source: Юхнаўка
98
+ expected: Juchnaŭka
99
+ - source: Гаюціна
100
+ expected: Hajucina
101
+ - source: Цюрлі
102
+ expected: Ciurli
103
+ - source: Любонічы
104
+ expected: Liuboničy
105
+ - source: Ямнае
106
+ expected: Jamnaje
107
+ - source: Баяры
108
+ expected: Bajary
109
+ - source: Валяр'яны
110
+ expected: Valiarjany
111
+ - source: Вязынка
112
+ expected: Viazynka
113
+
114
+ map:
115
+ inherit: by-bel-Cyrl-Latn-1998
@@ -0,0 +1,33 @@
1
+ ---
2
+ authority_id: dos
3
+ id: 1997
4
+ language: nep
5
+ source_script: Deva
6
+ destination_script: Latn
7
+ name: Nepali Romanization, 1997
8
+ url: http://nationalgeoportal.gov.np/old/pdf/translation2.pdf
9
+ creation_date: 1997
10
+ description: |
11
+ Survey Department, Ministry of Land Management, Cooperatives and Poverty Alleviation, Government of Nepal.
12
+
13
+ notes:
14
+ - |
15
+ ं (anusvara) is rendered by
16
+ ṅ before क, ख, ग, and घ
17
+ ñ before च, छ, ज, and झ
18
+ ṇ before ट, ठ, ड, and ढ
19
+ n before त, थ, द, and ध
20
+ ṁ before य, र, ल, व, श, ष, स
21
+
22
+ tests:
23
+ - source: "दुःख"
24
+ expected: "duhkh"
25
+
26
+ map:
27
+
28
+ inherit: "bgnpcgn-nep-Deva-Latn-2011"
29
+
30
+ characters:
31
+
32
+ # Bisarga
33
+ 'ः': 'h'