interscript 0.1.7 → 2.1.0b1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (314) hide show
  1. checksums.yaml +4 -4
  2. data/.gitignore +11 -0
  3. data/.rspec +3 -0
  4. data/Gemfile +29 -0
  5. data/LICENSE.adoc +31 -0
  6. data/README.md +3 -0
  7. data/Rakefile +116 -0
  8. data/bin/console +14 -0
  9. data/bin/interscript +5 -0
  10. data/bin/maps_analyze_staging +168 -0
  11. data/bin/maps_debug_compilers +58 -0
  12. data/bin/maps_debug_ordering +88 -0
  13. data/bin/maps_debug_ruby_compile +24 -0
  14. data/bin/maps_debug_step_by_step +44 -0
  15. data/bin/maps_optimize_order +112 -0
  16. data/bin/maps_v1_analyze_regexps +45 -0
  17. data/bin/maps_v1_to_v2 +426 -0
  18. data/bin/setup +8 -0
  19. data/exe/interscript +6 -0
  20. data/interscript.gemspec +31 -0
  21. data/lib/interscript.rb +83 -133
  22. data/lib/interscript/command.rb +5 -5
  23. data/lib/interscript/compiler.rb +22 -0
  24. data/lib/interscript/compiler/javascript.rb +292 -0
  25. data/lib/interscript/compiler/ruby.rb +262 -0
  26. data/lib/interscript/dsl.rb +68 -0
  27. data/lib/interscript/dsl/aliases.rb +23 -0
  28. data/lib/interscript/dsl/document.rb +46 -0
  29. data/lib/interscript/dsl/group.rb +45 -0
  30. data/lib/interscript/dsl/group/parallel.rb +6 -0
  31. data/lib/interscript/dsl/items.rb +89 -0
  32. data/lib/interscript/dsl/metadata.rb +68 -0
  33. data/lib/interscript/dsl/stage.rb +6 -0
  34. data/lib/interscript/dsl/symbol_mm.rb +11 -0
  35. data/lib/interscript/dsl/tests.rb +12 -0
  36. data/lib/interscript/interpreter.rb +251 -0
  37. data/lib/interscript/node.rb +25 -0
  38. data/lib/interscript/node/alias_def.rb +15 -0
  39. data/lib/interscript/node/dependency.rb +13 -0
  40. data/lib/interscript/node/document.rb +45 -0
  41. data/lib/interscript/node/group.rb +34 -0
  42. data/lib/interscript/node/group/parallel.rb +9 -0
  43. data/lib/interscript/node/group/sequential.rb +2 -0
  44. data/lib/interscript/node/item.rb +52 -0
  45. data/lib/interscript/node/item/alias.rb +42 -0
  46. data/lib/interscript/node/item/any.rb +76 -0
  47. data/lib/interscript/node/item/capture.rb +50 -0
  48. data/lib/interscript/node/item/group.rb +51 -0
  49. data/lib/interscript/node/item/repeat.rb +40 -0
  50. data/lib/interscript/node/item/stage.rb +23 -0
  51. data/lib/interscript/node/item/string.rb +51 -0
  52. data/lib/interscript/node/metadata.rb +18 -0
  53. data/lib/interscript/node/rule.rb +6 -0
  54. data/lib/interscript/node/rule/funcall.rb +18 -0
  55. data/lib/interscript/node/rule/run.rb +15 -0
  56. data/lib/interscript/node/rule/sub.rb +68 -0
  57. data/lib/interscript/node/stage.rb +19 -0
  58. data/lib/interscript/node/tests.rb +15 -0
  59. data/lib/interscript/stdlib.rb +211 -0
  60. data/lib/interscript/utils/regexp_converter.rb +283 -0
  61. data/lib/interscript/version.rb +1 -1
  62. data/lib/interscript/visualize.rb +61 -0
  63. data/lib/interscript/visualize/group.html.erb +59 -0
  64. data/lib/interscript/visualize/json.rb +57 -0
  65. data/lib/interscript/visualize/map.html.erb +46 -0
  66. data/lib/interscript/visualize/nodes.rb +89 -0
  67. data/requirements.txt +1 -0
  68. metadata +78 -416
  69. data/README.adoc +0 -298
  70. data/lib/g2pwrapper.py +0 -34
  71. data/lib/interscript/fs.rb +0 -69
  72. data/lib/interscript/mapping.rb +0 -142
  73. data/lib/interscript/opal.rb +0 -57
  74. data/lib/interscript/opal/entrypoint.rb +0 -12
  75. data/lib/interscript/opal/map_translate.rb +0 -7
  76. data/lib/interscript/opal/maps.js.erb +0 -10
  77. data/lib/model-7 +0 -0
  78. data/lib/tha-pt-b-7 +0 -0
  79. data/maps/acadsin-zho-Hani-Latn-2002.yaml +0 -38916
  80. data/maps/alalc-amh-Ethi-Latn-1997.yaml +0 -513
  81. data/maps/alalc-amh-Ethi-Latn-2011.yaml +0 -138
  82. data/maps/alalc-ara-Arab-Latn-1997.yaml +0 -1287
  83. data/maps/alalc-asm-Deva-Latn-1997.yaml +0 -165
  84. data/maps/alalc-asm-Deva-Latn-2012.yaml +0 -40
  85. data/maps/alalc-aze-Cyrl-Latn-1997.yaml +0 -145
  86. data/maps/alalc-bel-Cyrl-Latn-1997.yaml +0 -129
  87. data/maps/alalc-ben-Beng-Latn-2017.yaml +0 -130
  88. data/maps/alalc-bul-Cyrl-Latn-1997.yaml +0 -98
  89. data/maps/alalc-ell-Grek-Latn-1997.yaml +0 -628
  90. data/maps/alalc-ell-Grek-Latn-2010.yaml +0 -626
  91. data/maps/alalc-guj-Gujr-Latn-1997.yaml +0 -266
  92. data/maps/alalc-guj-Gujr-Latn-2011.yaml +0 -64
  93. data/maps/alalc-hin-Deva-Latn-1997.yaml +0 -211
  94. data/maps/alalc-hin-Deva-Latn-2011.yaml +0 -47
  95. data/maps/alalc-kat-Geok-Latn-1997.yaml +0 -111
  96. data/maps/alalc-kat-Geor-Latn-1997.yaml +0 -150
  97. data/maps/alalc-kor-Hang-Latn-1997.yaml +0 -98
  98. data/maps/alalc-mal-Mlym-Latn-1997.yaml +0 -303
  99. data/maps/alalc-mal-Mlym-Latn-2012.yaml +0 -73
  100. data/maps/alalc-mar-Deva-Latn-1997.yaml +0 -189
  101. data/maps/alalc-mar-Deva-Latn-2011.yaml +0 -45
  102. data/maps/alalc-mkd-Cyrl-Latn-1997.yaml +0 -114
  103. data/maps/alalc-mkd-Cyrl-Latn-2013.yaml +0 -103
  104. data/maps/alalc-mon-Cyrl-Latn-1997.yaml +0 -220
  105. data/maps/alalc-pan-Guru-Latn-1997.yaml +0 -256
  106. data/maps/alalc-pan-Guru-Latn-2011.yaml +0 -78
  107. data/maps/alalc-per-Arab-Latn-1997.yaml +0 -375
  108. data/maps/alalc-pli-Deva-Latn-2012.yaml +0 -144
  109. data/maps/alalc-pra-Deva-Latn-2012.yaml +0 -47
  110. data/maps/alalc-rus-Cyrl-Latn-1997.yaml +0 -225
  111. data/maps/alalc-rus-Cyrl-Latn-2012.yaml +0 -162
  112. data/maps/alalc-san-Deva-Latn-2012.yaml +0 -172
  113. data/maps/alalc-sin-Sinh-Latn-1997.yaml +0 -292
  114. data/maps/alalc-sin-Sinh-Latn-2011.yaml +0 -71
  115. data/maps/alalc-srp-Cyrl-Latn-1997.yaml +0 -118
  116. data/maps/alalc-srp-Cyrl-Latn-2013.yaml +0 -135
  117. data/maps/alalc-tam-Taml-Latn-1997.yaml +0 -62
  118. data/maps/alalc-tam-Taml-Latn-2011.yaml +0 -58
  119. data/maps/alalc-ukr-Cyrl-Latn-1997.yaml +0 -145
  120. data/maps/alalc-ukr-Cyrl-Latn-2011.yaml +0 -16
  121. data/maps/apcbg-bul-Cyrl-Latn-1995.yaml +0 -283
  122. data/maps/bas-rus-Cyrl-Latn-2017-bss.yaml +0 -174
  123. data/maps/bas-rus-Cyrl-Latn-2017-oss.yaml +0 -169
  124. data/maps/bgn-jpn-Hrkt-Latn-1962.yaml +0 -292
  125. data/maps/bgn-kor-Hang-Latn-1943.yaml +0 -35
  126. data/maps/bgn-kor-Kore-Latn-1943.yaml +0 -31
  127. data/maps/bgna-bul-Cyrl-Latn-2006.yaml +0 -208
  128. data/maps/bgna-bul-Cyrl-Latn-2009.yaml +0 -208
  129. data/maps/bgnpcgn-amh-Ethi-Latn-1967.yaml +0 -532
  130. data/maps/bgnpcgn-ara-Arab-Latn-1956.yaml +0 -596
  131. data/maps/bgnpcgn-arm-Armn-Latn-1981.yaml +0 -108
  132. data/maps/bgnpcgn-aze-Cyrl-Latn-1993.yaml +0 -104
  133. data/maps/bgnpcgn-bak-Cyrl-Latn-2007.yaml +0 -188
  134. data/maps/bgnpcgn-bel-Cyrl-Latn-1979.yaml +0 -289
  135. data/maps/bgnpcgn-bul-Cyrl-Latn-1952.yaml +0 -119
  136. data/maps/bgnpcgn-bul-Cyrl-Latn-2013.yaml +0 -42
  137. data/maps/bgnpcgn-che-Cyrl-Latn-2008.yaml +0 -184
  138. data/maps/bgnpcgn-ell-Grek-Latn-1962.yaml +0 -705
  139. data/maps/bgnpcgn-ell-Grek-Latn-1996.yaml +0 -23
  140. data/maps/bgnpcgn-fas-Arab-Latn-1956.yaml +0 -96
  141. data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.yaml +0 -257
  142. data/maps/bgnpcgn-kat-Geor-Latn-1981.yaml +0 -131
  143. data/maps/bgnpcgn-kat-Geor-Latn-2009.yaml +0 -42
  144. data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.yaml +0 -253
  145. data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.yaml +0 -48
  146. data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.yaml +0 -48
  147. data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.yaml +0 -163
  148. data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.yaml +0 -190
  149. data/maps/bgnpcgn-mon-Cyrl-Latn-1964.yaml +0 -223
  150. data/maps/bgnpcgn-nep-Deva-Latn-2011.yaml +0 -230
  151. data/maps/bgnpcgn-per-Arab-Latn-1958.yaml +0 -336
  152. data/maps/bgnpcgn-prs-Arab-Latn-2007.yaml +0 -639
  153. data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.yaml +0 -459
  154. data/maps/bgnpcgn-rue-Cyrl-Latn-2016.yaml +0 -168
  155. data/maps/bgnpcgn-rus-Cyrl-Latn-1947.yaml +0 -318
  156. data/maps/bgnpcgn-srp-Cyrl-Latn-2005.yaml +0 -170
  157. data/maps/bgnpcgn-tat-Cyrl-Latn-2007.yaml +0 -220
  158. data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.yaml +0 -240
  159. data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.yaml +0 -166
  160. data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.yaml +0 -119
  161. data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.yaml +0 -127
  162. data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.yaml +0 -82
  163. data/maps/bgnpcgn-zho-Hans-Latn-1979.yaml +0 -7456
  164. data/maps/bis-asm-Beng-Latn-13194-1991.yaml +0 -159
  165. data/maps/bis-ben-Beng-Latn-13194-1991.yaml +0 -156
  166. data/maps/bis-dev-Deva-Latn-13194-1991.yaml +0 -184
  167. data/maps/bis-guj-Gujr-Latn-13194-1991.yaml +0 -181
  168. data/maps/bis-knd-Knda-Latn-13194-1991.yaml +0 -173
  169. data/maps/bis-mlm-Mlym-Latn-13194-1991.yaml +0 -176
  170. data/maps/bis-ori-Orya-Latn-13194-1991.yaml +0 -160
  171. data/maps/bis-pnj-Guru-Latn-13194-1991.yaml +0 -175
  172. data/maps/bis-tel-Telu-Latn-13194-1991.yaml +0 -170
  173. data/maps/bis-tml-Taml-Latn-13194-1991.yaml +0 -155
  174. data/maps/by-bel-Cyrl-Latn-1998.yaml +0 -172
  175. data/maps/by-bel-Cyrl-Latn-2007.yaml +0 -115
  176. data/maps/din-grc-Grek-Latn-31634-2011-t1.yaml +0 -899
  177. data/maps/din-hin-Deva-Latn-33904-2018.yaml +0 -100
  178. data/maps/din-kat-Geor-Latn-32707-2010.yaml +0 -145
  179. data/maps/din-mar-Deva-Latn-33904-2018.yaml +0 -84
  180. data/maps/din-nep-Deva-Latn-33904-2018.yaml +0 -119
  181. data/maps/din-pli-Deva-Latn-33904-2018.yaml +0 -75
  182. data/maps/din-pra-Deva-Latn-33904-2018.yaml +0 -63
  183. data/maps/din-san-Deva-Latn-33904-2018.yaml +0 -338
  184. data/maps/din-tam-Taml-Latn-33903-2016.yaml +0 -213
  185. data/maps/dos-nep-Deva-Latn-1997.yaml +0 -47
  186. data/maps/elot-ell-Grek-Latn-743-1982-tl.yaml +0 -684
  187. data/maps/elot-ell-Grek-Latn-743-1982-ts.yaml +0 -680
  188. data/maps/elot-ell-Grek-Latn-743-2001-tl.yaml +0 -19
  189. data/maps/elot-ell-Grek-Latn-743-2001-ts.yaml +0 -31
  190. data/maps/ggg-kat-Geor-Latn-2002.yaml +0 -92
  191. data/maps/gki-bel-Cyrl-Latn-1992.yaml +0 -33
  192. data/maps/gki-bel-Cyrl-Latn-2000.yaml +0 -201
  193. data/maps/gost-rus-Cyrl-Latn-16876-71-1983.yaml +0 -190
  194. data/maps/gost-rus-Cyrl-Latn-7.79-2000-2002.yaml +0 -157
  195. data/maps/hk-yue-Hani-Latn-1888.yaml +0 -38497
  196. data/maps/icao-bel-Cyrl-Latn-9303.yaml +0 -136
  197. data/maps/icao-bul-Cyrl-Latn-9303.yaml +0 -118
  198. data/maps/icao-fas-Arab-Latn-9303.yaml +0 -103
  199. data/maps/icao-heb-Hebr-Latn-9303.yaml +0 -151
  200. data/maps/icao-mkd-Cyrl-Latn-9303.yaml +0 -117
  201. data/maps/icao-rus-Cyrl-Latn-9303.yaml +0 -117
  202. data/maps/icao-srp-Cyrl-Latn-9303.yaml +0 -117
  203. data/maps/icao-ukr-Cyrl-Latn-9303.yaml +0 -119
  204. data/maps/iso-ara-Arab-Latn-233-1984.yaml +0 -323
  205. data/maps/iso-asm-Beng-Latn-15919-2001.yaml +0 -75
  206. data/maps/iso-ben-Beng-Latn-15919-2001.yaml +0 -175
  207. data/maps/iso-ell-Grek-Latn-843-1997-t1.yaml +0 -613
  208. data/maps/iso-ell-Grek-Latn-843-1997-t2.yaml +0 -44
  209. data/maps/iso-guj-Gujr-Latn-15919-2001.yaml +0 -220
  210. data/maps/iso-hin-Deva-Latn-15919-2001.yaml +0 -87
  211. data/maps/iso-inc-Deva-Latn-15919-2001.yaml +0 -61
  212. data/maps/iso-jpn-Hrkt-Latn-3602-1989.yaml +0 -66
  213. data/maps/iso-kan-Knda-Latn-15919-2001.yaml +0 -220
  214. data/maps/iso-kat-Geor-Latn-9984-1996.yaml +0 -145
  215. data/maps/iso-kor-Hang-Latn-1996-method1.yaml +0 -240
  216. data/maps/iso-kor-Hang-Latn-1996-method2.yaml +0 -226
  217. data/maps/iso-mal-Mlym-Latn-15919-2001.yaml +0 -281
  218. data/maps/iso-mar-Deva-Latn-15919-2001.yaml +0 -75
  219. data/maps/iso-nep-Deva-Latn-15919-2001.yaml +0 -87
  220. data/maps/iso-ori-Orya-Latn-15919-2001.yaml +0 -193
  221. data/maps/iso-pan-Guru-Latn-15919-2001.yaml +0 -222
  222. data/maps/iso-pli-Beng-Latn-15919-2001.yaml +0 -73
  223. data/maps/iso-pli-Deva-Latn-15919-2001.yaml +0 -74
  224. data/maps/iso-pli-Sinh-Latn-15919-2001.yaml +0 -219
  225. data/maps/iso-pli-Thai-Latn-15919-2001.yaml +0 -55
  226. data/maps/iso-pra-Deva-Latn-15919-2001.yaml +0 -59
  227. data/maps/iso-prs-Arab-Latn-233-3-1999.yaml +0 -366
  228. data/maps/iso-rus-Cyrl-Latn-9-1995.yaml +0 -271
  229. data/maps/iso-san-Deva-Latn-15919-2001.yaml +0 -220
  230. data/maps/iso-tam-Taml-Latn-15919-2001.yaml +0 -159
  231. data/maps/iso-tel-Telu-Latn-15919-2001.yaml +0 -220
  232. data/maps/iso-tha-Thai-Latn-11940-1998.yaml +0 -109
  233. data/maps/kp-kor-Hang-Latn-2002.yaml +0 -909
  234. data/maps/lshk-yue-Hani-Latn-jyutping-1993.yaml +0 -44820
  235. data/maps/mext-jpn-Hrkt-Latn-1954.yaml +0 -411
  236. data/maps/mns-mon-Cyrl-Latn-5217-2012.yaml +0 -163
  237. data/maps/mns-mon-Latn-Cyrl-5217-2012.yaml +0 -200
  238. data/maps/moct-kor-Hang-Latn-2000.yaml +0 -807
  239. data/maps/mofa-jpn-Hrkt-Latn-1989.yaml +0 -541
  240. data/maps/mvd-bel-Cyrl-Latn-2008.yaml +0 -225
  241. data/maps/mvd-bel-Cyrl-Latn-2010.yaml +0 -63
  242. data/maps/mvd-rus-Cyrl-Latn-2008.yaml +0 -109
  243. data/maps/mvd-rus-Cyrl-Latn-2010.yaml +0 -37
  244. data/maps/odni-ara-Arab-Latn-2015.yaml +0 -425
  245. data/maps/odni-aze-Cyrl-Latn-2015.yaml +0 -144
  246. data/maps/odni-bel-Cyrl-Latn-2015.yaml +0 -148
  247. data/maps/odni-bul-Cyrl-Latn-2015.yaml +0 -96
  248. data/maps/odni-che-Cyrl-Latn-2015.yaml +0 -169
  249. data/maps/odni-fas-Arab-Latn-2015.yaml +0 -406
  250. data/maps/odni-hin-Deva-Latn-2015.yaml +0 -258
  251. data/maps/odni-kat-Geor-Latn-2015.yaml +0 -87
  252. data/maps/odni-kaz-Cyrl-Latn-2015.yaml +0 -148
  253. data/maps/odni-kir-Cyrl-Latn-2015.yaml +0 -136
  254. data/maps/odni-kor-Hang-Latn-2015.yaml +0 -375
  255. data/maps/odni-mkd-Cyrl-Latn-2015.yaml +0 -122
  256. data/maps/odni-per-Arab-Latn-2015.yaml +0 -228
  257. data/maps/odni-rus-Cyrl-Latn-2015.yaml +0 -77
  258. data/maps/odni-srp-Cyrl-Latn-2015.yaml +0 -129
  259. data/maps/odni-tat-Cyrl-Latn-2015.yaml +0 -142
  260. data/maps/odni-tgk-Cyrl-Latn-2015.yaml +0 -148
  261. data/maps/odni-uig-Cyrl-Latn-2015.yaml +0 -138
  262. data/maps/odni-ukr-Cyrl-Latn-2015.yaml +0 -157
  263. data/maps/odni-urd-Arab-Latn-2015.yaml +0 -221
  264. data/maps/odni-uzb-Cyrl-Latn-2015.yaml +0 -166
  265. data/maps/royin-tha-Thai-Latn-1939-generic.yaml +0 -90
  266. data/maps/royin-tha-Thai-Latn-1968.yaml +0 -183
  267. data/maps/royin-tha-Thai-Latn-1999-chained.yaml +0 -180
  268. data/maps/royin-tha-Thai-Latn-1999.yaml +0 -80
  269. data/maps/sac-zho-Hans-Latn-1979.yaml +0 -24763
  270. data/maps/sasm-mon-Mong-Latn-general-1978.yaml +0 -389
  271. data/maps/sasm-mon-Mong-Latn-phonetic-1978.yaml +0 -354
  272. data/maps/ses-ara-Arab-Latn-1930.yaml +0 -283
  273. data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.yaml +0 -222
  274. data/maps/ua-ukr-Cyrl-Latn-1996.yaml +0 -197
  275. data/maps/ua-ukr-Cyrl-Latn-2007.yaml +0 -75
  276. data/maps/ua-ukr-Cyrl-Latn-2010.yaml +0 -192
  277. data/maps/un-amh-Ethi-Latn-2016.yaml +0 -602
  278. data/maps/un-ara-Arab-Latn-1971.yaml +0 -139
  279. data/maps/un-ara-Arab-Latn-1972.yaml +0 -159
  280. data/maps/un-ara-Arab-Latn-2017.yaml +0 -420
  281. data/maps/un-bel-Cyrl-Latn-2007.yaml +0 -114
  282. data/maps/un-ben-Beng-Latn-2016.yaml +0 -534
  283. data/maps/un-ell-Grek-Latn-1987-phonetic.yaml +0 -780
  284. data/maps/un-ell-Grek-Latn-1987-tl.yaml +0 -31
  285. data/maps/un-ell-Grek-Latn-1987-ts.yaml +0 -19
  286. data/maps/un-hin-Deva-Latn-2016.yaml +0 -222
  287. data/maps/un-mar-Deva-Latn-2016.yaml +0 -91
  288. data/maps/un-mon-Mong-Latn-general-2013.yaml +0 -264
  289. data/maps/un-mon-Mong-Latn-phonetic-2013.yaml +0 -264
  290. data/maps/un-nep-Deva-Latn-1972.yaml +0 -350
  291. data/maps/un-nep-Deva-Latn-2013.yaml +0 -74
  292. data/maps/un-rus-Cyrl-Latn-1987.yaml +0 -166
  293. data/maps/un-ukr-Cyrl-Latn-1998.yaml +0 -53
  294. data/maps/un-ukr-Cyrl-Latn-2012.yaml +0 -162
  295. data/maps/var-hin-Deva-Latn-hunterian-1872.yaml +0 -221
  296. data/maps/var-jpn-Hrkt-Latn-hepburn-1886.yaml +0 -406
  297. data/maps/var-jpn-Hrkt-Latn-hepburn-1954.yaml +0 -386
  298. data/maps/var-kor-Hang-Hang-jamo.yaml +0 -11193
  299. data/maps/var-kor-Hang-Latn-mr-1939.yaml +0 -1054
  300. data/maps/var-kor-Kore-Hang-2013.yaml +0 -59754
  301. data/maps/var-kor-Kore-Latn-mr-1939.yaml +0 -36
  302. data/maps/var-mar-Deva-Latn-hunterian-1872.yaml +0 -43
  303. data/maps/var-mon-Mong-Latn-1930.yaml +0 -102
  304. data/maps/var-mon-Mong-Latn-lessing.yaml +0 -272
  305. data/maps/var-mon-Mong-Latn-vpmc.yaml +0 -274
  306. data/maps/var-pra-Deva-Latn-iast-1912.yaml +0 -30
  307. data/maps/var-san-Deva-Latn-iast-1912.yaml +0 -149
  308. data/maps/var-tha-Thai-Thai-phonemic.yaml +0 -59
  309. data/maps/var-tha-Thai-Zsym-ipa.yaml +0 -301
  310. data/maps/var-zho-Hani-Latn-wd-1979.yaml +0 -38912
  311. data/spec/interscript/filenames_spec.rb +0 -384
  312. data/spec/interscript/mapping_spec.rb +0 -42
  313. data/spec/interscript_spec.rb +0 -29
  314. data/spec/spec_helper.rb +0 -3
@@ -1,190 +0,0 @@
1
- ---
2
- authority_id: bgnpcgn
3
- id: 2013
4
- language: iso-639-2:mkd
5
- source_script: Cyrl
6
- destination_script: Latn
7
- name: Macedonian Romanization, BGN/PCGN 2013 System
8
- url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/811514/ROMANIZATION_OF_MACEDONIAN.pdf
9
- creation_date: 2013
10
- description: |
11
- Macedonian was officially established as a written language in Yugoslavia during
12
- World War II and is now the official language of North Macedonia.
13
- This romanization system replaces the BGN/PCGN 1981 agreement and adheres
14
- to the most widely-accepted standardization of Macedonian orthography.
15
-
16
- notes:
17
- - The Macedonian Cyrillic lowercase italic Д may sometimes be seen as g.
18
- There is no specific Unicode encoding for this variant form so a comparable character
19
- has been used here for illustrative purposes.
20
- - The Macedonian Cyrillic lowercase italic Ѓ may sometimes be seen as ī.
21
- There is no specific Unicode encoding for this variant form so a comparable character
22
- has been used here for illustrative purposes.
23
- - The Macedonian Cyrillic lowercase italic П may sometimes be seen as ū.
24
- There is no specific Unicode encoding for this variant form so a comparable character
25
- has been used here for illustrative purposes.
26
- - The Macedonian Cyrillic lowercase italic Т may sometimes be seen as w̄.
27
- There is no specific Unicode encoding for this variant form so a comparable character
28
- has been used here for illustrative purposes.
29
- - |
30
- An inventory of letter-diacritic combinations, with their Unicode encoding,
31
- in addition to the unmodified letters of the basic Roman script is:
32
- | Ǵ (U+01F4) | ǵ (U+01F5) |
33
- | Ž (U+017D) | ž (U+017E) |
34
- | Dz (U+01F2)* | dz (U+01F3)* |
35
- | Lj (U+01C8)* | lj (U+01C9)* |
36
- | Nj (U+01CB)* | nj (U+01CC)* |
37
- | Ḱ (U+1E30) | ḱ (U+1E31) |
38
- | Č (U+010C) | č (U+010D) |
39
- | Dž (U+01C5)* | dž (U+01C6)* |
40
- | Š (U+0160) | š (U+0161) |
41
- * Note that these characters can also be reproduced with individual letters (e.g. l+j).
42
- - The Romanization column shows only lowercase forms but, when romanizing,
43
- uppercase and lowercase Roman letters as appropriate should be used.
44
-
45
- tests:
46
- - source: Ѓенови Ливаѓе
47
- expected: Ǵenovi Livaǵe
48
- - source: ЛУЃЕ луѓе
49
- expected: LUǴE luǵe
50
- - source: ЅВЕЗДА ѕвезда Ѕвезда
51
- expected: DZVEZDA dzvezda Dzvezda
52
- - source: Јабежица
53
- expected: Jabežica
54
- - source: Љиќен и Бард
55
- expected: Ljiḱen i Bard
56
- - source: Ќамилов Чукар
57
- expected: Ḱamilov Čukar
58
- - source: Џавидин Кајнак
59
- expected: Džavidin Kajnak
60
- - source: Џамалџи
61
- expected: Džamaldži
62
- - source: Џибра Гури и Зи
63
- expected: Džibra Guri i Zi
64
- - source: Абазова Куќарица
65
- expected: Abazova Kuḱarica
66
- - source: Баба Анѓина Маала
67
- expected: Baba Anǵina Maala
68
- - source: Ваљановец
69
- expected: Valjanovec
70
- - source: Галал Једи Дереш
71
- expected: Galal Jedi Dereš
72
- - source: Дванаесет Клајнци
73
- expected: Dvanaeset Klajnci
74
- - source: Електродистрибуција Струга
75
- expected: Elektrodistribucija Struga
76
- - source: Железничка Станица Рајко Жинзифов
77
- expected: Železnička Stanica Rajko Žinzifov
78
- - source: Заедничко Речиште
79
- expected: Zaedničko Rečište
80
- - source: Испраена Плоча
81
- expected: Ispraena Ploča
82
- - source: Казнено-Поправна Установа Идризово
83
- expected: Kazneno-Popravna Ustanova Idrizovo
84
- - source: Лази и Зејнелит
85
- expected: Lazi i Zejnelit
86
- - source: Мавровско Езеро
87
- expected: Mavrovsko Ezero
88
- - source: Национален Парк Галичица
89
- expected: Nacionalen Park Galičica
90
- - source: Одморалиште Свети Стефан
91
- expected: Odmoralište Sveti Stefan
92
- - source: Планинарски Дом Караџица
93
- expected: Planinarski Dom Karadžica
94
- - source: Раса е Лисењит
95
- expected: Rasa e Lisenjit
96
- - source: Скочивирска Клисура
97
- expected: Skočivirska Klisura
98
- - source: Термо-електроцентрала Неготино
99
- expected: Termo-elektrocentrala Negotino
100
- - source: Узуновско Бресје
101
- expected: Uzunovsko Bresje
102
- - source: Фабрика Југохром
103
- expected: Fabrika Jugohrom
104
- - source: Хидроелектрана Сапунџица
105
- expected: Hidroelektrana Sapundžica
106
- - source: Цветковско Рамниште
107
- expected: Cvetkovsko Ramnište
108
- - source: Чалтанова Пештера
109
- expected: Čaltanova Peštera
110
- - source: Шкемби Вишнејц
111
- expected: Škembi Višnejc
112
-
113
- map:
114
- postrules:
115
- # DZ
116
- - pattern: "((?<=[[:upper:]])Dz(?=[[:upper:]])?|(?<=[[:upper:]])?Dz(?=[[:upper:]]))"
117
- result: "DZ"
118
- #LJ
119
- - pattern: "((?<=[[:upper:]])Lj(?=[[:upper:]])?|(?<=[[:upper:]])?Lj(?=[[:upper:]]))"
120
- result: "LJ"
121
- #NJ
122
- - pattern: "((?<=[[:upper:]])Nj(?=[[:upper:]])?|(?<=[[:upper:]])?Nj(?=[[:upper:]]))"
123
- result: "NJ"
124
- #DŽ
125
- - pattern: "((?<=[[:upper:]])Dž(?=[[:upper:]])?|(?<=[[:upper:]])?Dž(?=[[:upper:]]))"
126
- result: "DŽ"
127
-
128
- characters:
129
- "\u0410": "A"
130
- "\u0411": "B"
131
- "\u0412": "V"
132
- "\u0413": "G"
133
- "\u0414": "D"
134
- "\u0403": "\u01F4" # Ǵ
135
- "\u0415": "E"
136
- "\u0416": "\u005a\u030c" # Ž
137
- "\u0417": "Z"
138
- "\u0405": "Dz"
139
- "\u0418": "I"
140
- "\u0408": "J"
141
- "\u041A": "K"
142
- "\u041B": "L"
143
- "\u0409": "Lj"
144
- "\u041C": "M"
145
- "\u041D": "N"
146
- "\u040A": "Nj"
147
- "\u041E": "O"
148
- "\u041F": "P"
149
- "\u0420": "R"
150
- "\u0421": "S"
151
- "\u0422": "T"
152
- "\u040C": "\u004b\u0301" # Ḱ
153
- "\u0423": "U"
154
- "\u0424": "F"
155
- "\u0425": "H"
156
- "\u0426": "C"
157
- "\u0427": "\u0043\u030c" # Č
158
- "\u040F": "D\u007a\u030c" # Dž
159
- "\u0428": "\u0053\u030c" # Š
160
- "\u0430": "a"
161
- "\u0431": "b"
162
- "\u0432": "v"
163
- "\u0433": "g"
164
- "\u0434": "d"
165
- "\u0453": "\u01F5" # ǵ
166
- "\u0435": "e"
167
- "\u0436": "\u007a\u030c" # ž
168
- "\u0437": "z"
169
- "\u0455": "dz"
170
- "\u0438": "i"
171
- "\u0458": "j"
172
- "\u043A": "k"
173
- "\u043B": "l"
174
- "\u0459": "lj"
175
- "\u043C": "m"
176
- "\u043D": "n"
177
- "\u045A": "nj"
178
- "\u043E": "o"
179
- "\u043F": "p"
180
- "\u0440": "r"
181
- "\u0441": "s"
182
- "\u0442": "t"
183
- "\u045C": "\u1E31" # ḱ
184
- "\u0443": "u"
185
- "\u0444": "f"
186
- "\u0445": "h"
187
- "\u0446": "c"
188
- "\u0447": "\u0063\u030c" # č
189
- "\u045F": "d\u007a\u030c" # dž
190
- "\u0448": "\u0073\u030c" # š
@@ -1,223 +0,0 @@
1
- ---
2
- authority_id: bgnpcgn
3
- id: 1964
4
- language: iso-639-2:mon
5
- source_script: Cyrl
6
- destination_script: Latn
7
- name: BGN/PCGN 1964 System
8
- alias:
9
- ogc11122:
10
- code: mon_Cyrl2Latn_BGN_1964
11
- description: Mongolian US Board on Geographic Names(BGN)/Permanent Committee on Geographical Names for British Official Use(PCGN) 1964 System
12
- url: https://github.com/interscript/interscript/files/5180767/BGN_Romanization_Guide_1964_mongolian_1964.pdf
13
- creation_date:
14
- confirmation_date:
15
- description: |
16
- This system was originated by the PCGN in 1957 and adopted as a
17
- BGN/PCGN System in 1964. It is intended for use in the romanization of
18
- geographic names in the "Mongolian People's Republic" but not to romanize
19
- Mongolian names in adjacent parts of China and the U.S.S.R.
20
-
21
- notes: |
22
- - b occurs initially and after л, м, and б.
23
- - v occurs medially in Mongolian words and initially in foreign words.
24
- - y occurs only as the second element of diphthongs.
25
- - k, p, f, and shch occur in foreign words only.
26
- - "\u2019" occurs only in Russian words.
27
- - ï occurs only in suffixes to words containing back vowels (a, o, and u).
28
- - In monosyllables yu or yü depending on pronunciation; in polysyllables yu when followed by a, o, or u, but yü when followed by i, e, ö, or ü.
29
-
30
- tests:
31
- - source: Эрдэнэт Сум
32
- expected: Erdenet Sum
33
- - source: Эрдэнэт
34
- expected: Erdenet
35
- - source: Эрдэнэ
36
- expected: Erdene
37
- - source: Шивээговь Сум
38
- expected: Shiveegovĭ Sum
39
- - source: Шивээговь
40
- expected: Shiveegovĭ
41
- - source: Шарынгол Сум
42
- expected: Sharïngol Sum
43
- - source: Шарынгол
44
- expected: Sharïngol
45
- - source: Цагааннуур
46
- expected: Tsagaannuur
47
- - source: Хонгор Сум
48
- expected: Hongor Sum
49
- - source: Хонгор
50
- expected: Hongor
51
- - source: Хайлаастай
52
- expected: Haylaastay
53
- - source: Түнэл Сум
54
- expected: Tünel Sum
55
- - source: Түнэл
56
- expected: Tünel
57
- - source: Сүхбаатар
58
- expected: Sühbaatar
59
- - source: Сүмбэр Сум
60
- expected: Sümber Sum
61
- - source: Сүмбэр
62
- expected: Sümber
63
- - source: Сайншанд Сум
64
- expected: Saynshand Sum
65
- - source: Сайншанд
66
- expected: Saynshand
67
- - source: Орхон Сум
68
- expected: Orhon Sum
69
- - source: Орхон
70
- expected: Orhon
71
- - source: Нарст
72
- expected: Narst
73
- - source: Мөрөн Сум
74
- expected: Mörön Sum
75
- - source: Мөрөн
76
- expected: Mörön
77
- - source: Зүүнхөвөө
78
- expected: Dzüünhövöö
79
- - source: Жаргалант Сум
80
- expected: Jargalant Sum
81
- - source: Жаргалант
82
- expected: Jargalant
83
- - source: Дархан Сум
84
- expected: Darhan Sum
85
- - source: Даланзадгад Сум
86
- expected: Dalandzadgad Sum
87
- - source: Даланзадгад
88
- expected: Dalandzadgad
89
- - source: Давст Сум
90
- expected: Davst Sum
91
- - source: Давст
92
- expected: Davst
93
- - source: Говьсүмбэр Сум
94
- expected: Govĭsümber Sum
95
- - source: Говь
96
- expected: Govĭ
97
- - source: Буга
98
- expected: Buga
99
- - source: Бор-Өндөр Сум
100
- expected: Bor-Öndör Sum
101
- - source: Бор-Өндөр
102
- expected: Bor-Öndör
103
- - source: Баянхонгор
104
- expected: Bayanhongor
105
- - source: Баянтал
106
- expected: Bayantal
107
- - source: Баяндэлгэр Сум
108
- expected: Bayandelger Sum
109
- - source: Баяндэлгэр
110
- expected: Bayandelger
111
- - source: Баян-Өндөр Сум
112
- expected: Bayan-Öndör Sum
113
- - source: Баруун-Урт Сум
114
- expected: Baruun-Urt Sum
115
- - source: Баруун-Урт
116
- expected: Baruun-Urt
117
- - source: Архуст
118
- expected: Arhust
119
- - source: Арвайхээр Сум
120
- expected: Arvayheer Sum
121
- - source: Арвайхээр
122
- expected: Arvayheer
123
- - source: Есөнбулаг Сум
124
- expected: Yösönbulag Sum
125
- - source: Ерөө Сум
126
- expected: Yöröö Sum
127
- - source: Есөнзүйл Сум
128
- expected: Yösöndzüyl Sum
129
- - source: Ноён Сум
130
- expected: Noyon Sum
131
- - source: Родник Балянгийн-Булак
132
- expected: Rodnik Balyangiyn-Bulak
133
- - source: Замын-Үүд Сум
134
- expected: Dzamïn-Üüd Sum
135
- - source: Адаацаг Сум
136
- expected: Adaatsag Sum
137
- - source: Чандмань Сум
138
- expected: Chandmanĭ Sum
139
- - source: Хяргас Сум
140
- expected: Hyargas Sum
141
-
142
- map:
143
- rules:
144
- - pattern: \u042e(?=[АаОоУу]) # Ю before а, о, or у
145
- result: "Yu"
146
- - pattern: \u044e(?=[АаОоУу]) # ю before а, о, or у
147
- result: "yu"
148
- - pattern: \u042e(?=[ИиЭэӨөҮү]) # Ю before и, э, ө, or ү
149
- result: "Yü"
150
- - pattern: \u044e(?=[ИиЭэӨөҮү]) # ю before и, э, ө, or ү
151
- result: "yü"
152
-
153
- characters:
154
- "А": "A" # \u0410
155
- "Б": "B" # \u0411
156
- "В": "V" # \u0412
157
- "Г": "G" # \u0413
158
- "Д": "D" # \u0414
159
- "Е": "Yö" # \u0415
160
- "Ё": "Yo" # \u0401
161
- "Ж": "J" # \u0416
162
- "З": "Dz" # \u0417
163
- "И": "I" # \u0418
164
- "Й": "Y" # \u0419
165
- "К": "K" # \u041a
166
- "Л": "L" # \u041b
167
- "М": "M" # \u041c
168
- "Н": "N" # \u041d
169
- "О": "O" # \u041e
170
- "Ө": "Ö" # \u04e8
171
- "П": "P" # \u041f
172
- "Р": "R" # \u0420
173
- "С": "S" # \u0421
174
- "Т": "T" # \u0422
175
- "У": "U" # \u0423
176
- "Ү": "Ü" # \u04ae
177
- "Ф": "F" # \u0424
178
- "Х": "H" # \u0425
179
- "Ц": "Ts" # \u0426
180
- "Ч": "Ch" # \u0427
181
- "Ш": "Sh" # \u0428
182
- "Щ": "Shch" # \u0429
183
- "Ъ": "\u2019" # \u042a
184
- "Ы": "Ï" # \u042b
185
- "Ь": "Ĭ" # \u042c
186
- "Э": "E" # \u042d
187
- "Ю": "Yu" # \u042e
188
- "Я": "Ya" # \u042f
189
- "а": "a" # \u0430
190
- "б": "b" # \u0431
191
- "в": "v" # \u0432
192
- "г": "g" # \u0433
193
- "д": "d" # \u0434
194
- "е": "yö" # \u0435
195
- "ё": "yo" # \u0451
196
- "ж": "j" # \u0436
197
- "з": "dz" # \u0437
198
- "и": "i" # \u0438
199
- "й": "y" # \u0439
200
- "к": "k" # \u043a
201
- "л": "l" # \u043b
202
- "м": "m" # \u043c
203
- "н": "n" # \u043d
204
- "о": "o" # \u043e
205
- "ө": "ö" # \u04e9
206
- "п": "p" # \u043f
207
- "р": "r" # \u0440
208
- "с": "s" # \u0441
209
- "т": "t" # \u0442
210
- "у": "u" # \u0443
211
- "ү": "ü" # \u04af
212
- "ф": "f" # \u0444
213
- "х": "h" # \u0445
214
- "ц": "ts" # \u0446
215
- "ч": "ch" # \u0447
216
- "ш": "sh" # \u0448
217
- "щ": "shch" # \u0449
218
- "ъ": "\u2019" # \u044a
219
- "ы": "ï" # \u044b
220
- "ь": "ĭ" # \u044c
221
- "э": "e" # \u044d
222
- "ю": "yu" # \u044e
223
- "я": "ya" # \u044f
@@ -1,230 +0,0 @@
1
- ---
2
- authority_id: bgnpcgn
3
- id: 2020
4
- language: iso-639-2:nep
5
- source_script: Deva
6
- destination_script: Latn
7
- name: Nepali Romanization, 2020
8
- url: https://geonames.nga.mil/gns/html/Romanization/ROMANIZATION%20OF%20NEPALI.pdf
9
- creation_date: 1964
10
- description: |
11
- BGN/PCGN 2011 Agreement Romanization of Nepali
12
- The BGN and the PCGN have adopted the Nepal Survey Department (NSD) system for the
13
- romanization of Nepali names. This system, below, should be applied to Nepali names for which Roman‐
14
- script spellings in materials produced by the government of Nepal are not available.
15
-
16
- notes:
17
-
18
- - Only the isolated forms of the characters are given in the consonant table. See any grammar of Nepali
19
- (or other language using the Devanagari alphabet) for variant forms used in conjunct characters.
20
- - The consonant characters ड and ढ sometimes appear to represent ṛ (cerebral r), e.g., पहाड → pahāṛ
21
- instead of pahāḍ. At one time they were written with dots below, i.e., as ड़ and ढ़, though this is no
22
- longer normal practice in Nepali. The romanizations ṛ and ṛh, respectively, are optional for
23
- documentary purposes if such dots appear in Nepali writing.
24
- - व can be romanized as either v or w. This character is primarily
25
- romanized as v in consonant initial, medial, and final position; however, initial, medial, and final w
26
- romanizations can occur. The w romanization is a special case which is believed to be dependent on
27
- dialect, pronunciation, or stress.
28
- - |
29
- An inventory of letter‐diacritic combinations, with their Unicode encoding, in addition to the unmodified letters of the basic Roman script is:
30
- Ṅ (U+1E44) ṅ (U+1E45)
30
- Ñ (U+00D1) ñ (U+00F1)
31
- Ṭ (U+1E6C) ṭ (U+1E6D)
32
- Ḍ (U+1E0C) ḍ (U+1E0D)
33
- Ṇ (U+1E46) ṇ (U+1E47)
34
- Ṣ (U+1E62) ṣ (U+1E63)
35
- Ā (U+0100) ā (U+0101)
36
- Ī (U+012A) ī (U+012B)
37
- Ū (U+016A) ū (U+016B)
38
- Ṛ (U+1E5A) ṛ (U+1E5B)
40
-
41
- - The Romanization column shows only lowercase forms but, when romanizing, uppercase and lowercase
42
- Roman letters as appropriate should be used.
43
-
44
- - |
45
- ं (anusvara) is rendered by
46
- ṅ before क, ख, ग, and घ
47
- ñ before च, छ, ज, and झ
48
- ṇ before ट, ठ, ड, and ढ
49
- n before त, थ, द, and ध
50
- ṁ before य, र, ल, व, श, ष, स and ह
51
-
52
- tests:
53
- - source: "लेखन"
54
- expected: "lekhn"
55
- - source: "मुद्रा"
56
- expected: "mudarā"
57
- - source: "प्रशंसा"
58
- expected: "parshṃsā" # note 5 rule checking
59
- - source: "अंक"
60
- expected: "aṅk" # note 5 rule checking
61
- - source: "नेकपाले स्थगित स्थायी कमिटीको बैठक भदौ गते बोलाउने भएको"
62
- expected: "nekpāle sathgit sathāyī kmiṭīko baiṭhk bhdau gte bolāune bheko"
63
- - source: "न घर रह्यो, न परिवार"
64
- expected: "n ghr rhayo, n privār"
65
- - source: "ढोरपाटनमा भुजीखोला बाढीपहिरोले अभिभावक गुमाएका बालबालिकाको बिचल्ली"
66
- expected: "ḍhorpāṭnmā bhujīkholā bāḍhīphirole abhibhāvk gumāekā bālbālikāko bichlalī"
67
- - source: "सुस्मिताका काका हेमबहादुर र काकीलाई पनि पहिरोले बगायो"
68
- expected: "susamitākā kākā hembhādur r kākīlāī pni phirole bgāyo"
69
- - source: "संविधान जारी भएसँगै सार्वजनिक प्रशासनमा नयाँ उत्साह आउने अपेक्षा थियो"
70
- expected: "sṃvidhān jārī bhes~gai sāravjnik parshāsnmā nyā~ utasāh āune apekṣā thiyo"
71
- - source: "देशमा कोरोना संक्रमित र मृतकको संख्या हरेक दिन बढ्दो छ"
72
- expected: "deshmā koronā sṅkarmit r mṛitkko sṅkhayā hrek din bḍhado chh"
73
- - source: "गाउँपालिकाका अध्यक्ष टिका गुरुङका अनुसार विष्णुदासलाई राजुले सुत्नका लागि बेलुका साथी लगेका थिए"
74
- expected: "gāu~pālikākā adhaykṣ ṭikā guruṅkā anusār viṣaṇudāslāī rājule sutankā lāgi belukā sāthī lgekā thie"
75
- - source: "यो आयोजना गाउँपालिकाको केन्द्र तेल्लोकमा पर्छ"
76
- expected: "yo āyojnā gāu~pālikāko kenadar telalokmā prachh"
77
- - source: "सुस्मिताका काका हेमबहादुर र काकीलाई पनि पहिरोले बगायो"
78
- expected: "susamitākā kākā hembhādur r kākīlāī pni phirole bgāyo"
79
- - source: "चैत पहिलो साता घर आएका उनी लकडाउन भएपछि यतै रोकिए"
80
- expected: "chait philo sātā ghr āekā unī lkḍāun bhepchhi ytai rokie"
81
- - source: "काम गर्न जानेको हकमा रोजगारदाता कम्पनीको पत्रसँगै वडा र जिल्ला प्रशासनको सिफारिस अनिवार्य गरिएको छ"
82
- expected: "kām gran jāneko hkmā rojgārdātā kmapnīko ptrs~gai vḍā r jilalā parshāsnko siphāris anivāray grieko chh"
83
- - source: "दुःख"
84
- expected: "duḥkh"
85
- - source: "निकुञ्जको स्थानीय पोस्टका कर्मचारी पनि त्यहीँ थिए"
86
- expected: "nikuñajko sathānīy posaṭkā kramchārī pni tayhī~ thie"
87
- - source: "युद्धकालको मनोविज्ञान"
88
- expected: "yudadhkālko mnovijñān"
89
- - source: "जर्मन वायुसेवाको आक्रमणमा दुई लाख पचास हजार मानिसको ज्यान जानसक्ने र करिब ३० देखि ४० लाख मान्छे विस्थापित हुने अनुमान बेलायत सरकारको थियो"
90
- expected: "jramn vāyusevāko ākarmṇmā duī lākh pchās hjār mānisko jayān jānskane r krib 30 dekhi 40 lākh mānachhe visathāpit hune anumān belāyt srkārko thiyo"
91
- - source: "युद्ध"
92
- expected: "yudadh"
93
- - source: "कोरोनासँग जम्काभेट"
94
- expected: "koronās~g jmakābheṭ"
95
- - source: "संक्रमित"
96
- expected: "sṅkarmit"
97
- - source: "स्वयम्"
98
- expected: "savyma"
99
- - source: "संख्या"
100
- expected: "sṅkhayā"
101
- - source: "गौरीटारस्थित रंगशाला"
102
- expected: "gaurīṭārsathit rṅgshālā"
103
-
104
- map:
105
-
106
- rules:
107
- # note[5]
108
- - pattern: \u0902(?=[कखगघ]) # ं before क, ख, ग, and घ
109
- result: ṅ
110
- - pattern: \u0902(?=[चछजझ]) # ं before च, छ, ज, and झ
111
- result: ñ
112
- - pattern: \u0902(?=[टठडढ]) # ं before ट, ठ, ड, and ढ
113
- result: ṇ
114
- - pattern: \u0902(?=[तथदध]) # ं before त, थ, द, and ध
115
- result: n
116
-
117
- characters:
118
-
119
- # Vowels and Diphthongs
120
-
121
- 'अ': 'a'
122
- 'आ': 'ā'
123
- 'इ': 'i'
124
- 'ई': 'ī'
125
- 'उ': 'u'
126
- 'ऊ': 'ū'
127
- 'ऋ': 'ṛi'
128
- 'ॠ': 'rī'
129
- 'ए': 'e'
130
- 'ऐ': 'ai'
131
- 'ओ': 'o'
132
- 'औ': 'au'
133
-
134
- # Medials # Needed for connecting consonants
135
-
136
- 'ा': "ā"
137
- 'ि': "i"
138
- 'ी': "ī"
139
- 'ु': "u"
140
- 'ू': "ū"
141
- 'ृ': "ṛi"
142
- 'ॄ': "rī"
143
- 'े': "e"
144
- 'ै': "ai"
145
- 'ो': "o"
146
- 'ौ': "au"
147
-
148
-
149
- # Consonants (see Note 1)
150
-
151
- # Gutturals
152
- 'क': 'k'
153
- 'ख': 'kh'
154
- 'ग': 'g'
155
- 'घ': 'gh'
156
- 'ङ': 'ṅ'
157
-
158
- # Palatals
159
- 'च': 'ch'
160
- 'छ': 'chh'
161
- 'ज': 'j'
162
- 'झ': 'jh'
163
- 'ञ': 'ñ'
164
-
165
- # Cerebrals
166
- 'ट': 'ṭ'
167
- 'ठ': 'ṭh'
168
- 'ड': 'ḍ'
169
- 'ढ': 'ḍh'
170
- 'ण': 'ṇ'
171
-
172
- # Dentals
173
- 'त': 't'
174
- 'थ': 'th'
175
- 'द': 'd'
176
- 'ध': 'dh'
177
- 'न': 'n'
178
-
179
- # Labials
180
- 'प': 'p'
181
- 'फ': 'ph'
182
- 'ब': 'b'
183
- 'भ': 'bh'
184
- 'म': 'm'
185
-
186
- # Semivowels
187
- 'य': 'y'
188
- 'र': 'r'
189
- 'ल': 'l'
190
- 'व': 'v' # or w [Note#3]
191
-
192
- # Sibilants
193
- 'श': 'sh'
194
- 'ष': 'ṣ'
195
- 'स': 's'
196
- 'क्ष': 'kṣ'
197
- 'त्र': 'tr'
198
- 'ज्ञ' : 'jñ'
199
-
200
- # Aspirate
201
- 'ह': 'h'
202
-
203
- # Anusvāra
204
- 'ं': 'ṃ'
205
-
206
- # Bisarga
207
- 'ः': 'ḥ'
208
-
209
- # Anunāsika
210
- 'ँ': '~'
211
-
212
- 'ॅ': 'r'
213
-
214
- # halanta
215
- '्': 'a'
216
-
217
- # Abagraha
218
- 'ऽ': '’' # (apostrophe)
219
-
220
- # Numerals / सङ्ख्या
221
- '०': '0'
222
- '१': '1'
223
- '२': '2'
224
- '३': '3'
225
- '४': '4'
226
- '५': '5'
227
- '६': '6'
228
- '७': '7'
229
- '८': '8'
230
- '९': '9'