interscript 0.1.7 → 0.1.9

Sign up to get free protection for your applications and to get access to all the features.
Files changed (82) hide show
  1. checksums.yaml +4 -4
  2. data/README.adoc +1 -3
  3. data/aliases.json +1 -0
  4. data/lib/interscript.rb +8 -3
  5. data/lib/interscript/fs.rb +27 -0
  6. data/lib/interscript/mapping.rb +3 -1
  7. data/lib/interscript/opal.rb +142 -3
  8. data/lib/interscript/opal/entrypoint.rb +8 -0
  9. data/lib/interscript/opal/exports.rb +11 -0
  10. data/lib/interscript/opal/maps.js.erb +2 -4
  11. data/lib/interscript/version.rb +1 -1
  12. data/maps/alalc-ara-Arab-Latn-1997.yaml +5 -5
  13. data/maps/alalc-asm-Deva-Latn-1997.yaml +104 -10
  14. data/maps/alalc-asm-Deva-Latn-2012.yaml +18 -3
  15. data/maps/alalc-aze-Arab-Latn-1997.yaml +376 -0
  16. data/maps/alalc-ben-Beng-Latn-1997.yaml +291 -0
  17. data/maps/alalc-div-Thaa-Latn-1997.yaml +211 -0
  18. data/maps/alalc-hin-Deva-Latn-1997.yaml +102 -10
  19. data/maps/alalc-hin-Deva-Latn-2011.yaml +19 -1
  20. data/maps/alalc-kan-Kana-Latn-1997.yaml +274 -0
  21. data/maps/alalc-kan-Kana-Latn-2011.yaml +63 -0
  22. data/maps/alalc-ori-Orya-Latn-1997.yaml +284 -0
  23. data/maps/alalc-ori-Orya-Latn-2011.yaml +67 -0
  24. data/maps/alalc-pra-Deva-Latn-2012.yaml +2 -2
  25. data/maps/alalc-san-Deva-Latn-2012.yaml +78 -9
  26. data/maps/alalc-tel-Telu-Latn-1997.yaml +284 -0
  27. data/maps/alalc-tel-Telu-Latn-2011.yaml +64 -0
  28. data/maps/az-aze-Cyrl-Latn-1939.yaml +105 -0
  29. data/maps/az-aze-Cyrl-Latn-1958.yaml +45 -0
  30. data/maps/bgnpcgn-ara-Arab-Latn-1956.yaml +3 -1
  31. data/maps/bgnpcgn-aze-Cyrl-Latn-1993.yaml +111 -104
  32. data/maps/bgnpcgn-bal-Arab-Latn-2008.yaml +329 -0
  33. data/maps/bgnpcgn-bul-Cyrl-Latn-1952.yaml +1 -1
  34. data/maps/bgnpcgn-div-Thaa-Latn-1988.yaml +75 -0
  35. data/maps/bgnpcgn-far-Latn-Latn-1964.yaml +28 -0
  36. data/maps/bgnpcgn-isl-Latn-Latn-1964.yaml +37 -0
  37. data/maps/bgnpcgn-kaz-Cyrl-Latn-1979.yaml +247 -0
  38. data/maps/bgnpcgn-kir-Cyrl-Latn-1979.yaml +218 -0
  39. data/maps/bgnpcgn-kur-Arab-Latn-2007.yaml +249 -0
  40. data/maps/bgnpcgn-per-Arab-Latn-1958.yaml +2 -0
  41. data/maps/bgnpcgn-prs-Arab-Latn-2007.yaml +87 -53
  42. data/maps/bgnpcgn-pus-Arab-Latn-1968.yaml +377 -0
  43. data/maps/bgnpcgn-srp-Cyrl-Latn-1962.yaml +73 -0
  44. data/maps/bgnpcgn-urd-Arab-Latn-2007.yaml +459 -0
  45. data/maps/{bis-knd-Knda-Latn-13194-1991.yaml → bis-kan-Kana-Latn-13194-1991.yaml} +2 -2
  46. data/maps/bis-ori-Orya-Latn-13194-1991.yaml +17 -2
  47. data/maps/iso-ara-Arab-Latn-233-1984.yaml +1 -1
  48. data/maps/{iso-kan-Knda-Latn-15919-2001.yaml → iso-kan-Kana-Latn-15919-2001.yaml} +1 -1
  49. data/maps/{mns-mon-Cyrl-Latn-5217-2012.yaml → masm-mon-Cyrl-Latn-5217-2012.yaml} +2 -2
  50. data/maps/{mns-mon-Latn-Cyrl-5217-2012.yaml → masm-mon-Latn-Cyrl-5217-2012.yaml} +1 -1
  51. data/maps/mv-div-Thaa-Latn-1987.yaml +200 -0
  52. data/maps/odni-ara-Arab-Latn-2004.yaml +137 -0
  53. data/maps/odni-ara-Arab-Latn-2015.yaml +20 -130
  54. data/maps/odni-bul-Cyrl-Latn-2005.yaml +90 -0
  55. data/maps/odni-fas-Arab-Latn-2004.yaml +276 -0
  56. data/maps/odni-hin-Deva-Latn-2004.yaml +182 -0
  57. data/maps/odni-mkd-Cyrl-Latn-2005.yaml +21 -0
  58. data/maps/odni-prs-Arab-Latn-2004.yaml +123 -0
  59. data/maps/{odni-per-Arab-Latn-2015.yaml → odni-prs-Arab-Latn-2015.yaml} +0 -0
  60. data/maps/odni-srp-Cyrl-Latn-2005.yaml +36 -0
  61. data/maps/odni-tuk-Cyrl-Latn-2015.yaml +170 -0
  62. data/maps/odni-ukr-Cyrl-Latn-2015.yaml +4 -0
  63. data/maps/un-ara-Arab-Latn-2017.yaml +1 -1
  64. data/maps/un-asm-Beng-Latn-1972.yaml +223 -0
  65. data/maps/un-guj-Gujr-Latn-1972.yaml +229 -0
  66. data/maps/un-hin-Deva-Latn-2016.yaml +104 -10
  67. data/maps/un-kan-Kana-Latn-2016.yaml +254 -0
  68. data/maps/un-mal-Mlym-Latn-1972.yaml +251 -0
  69. data/maps/un-mar-Deva-Latn-2016.yaml +24 -13
  70. data/maps/un-nep-Deva-Latn-1972.yaml +40 -121
  71. data/maps/un-ori-Orya-Latn-1972.yaml +247 -0
  72. data/maps/un-pan-Guru-Latn-1972.yaml +402 -0
  73. data/maps/un-prs-Arab-Latn-1967.yaml +236 -0
  74. data/maps/un-tam-Taml-Latn-1972.yaml +194 -0
  75. data/maps/un-tel-Telu-Latn-1972.yaml +270 -0
  76. data/maps/un-urd-Arab-Latn-1972.yaml +405 -0
  77. data/maps/var-amh-Ethi-Latn-eae-2003.yaml +466 -0
  78. data/maps/var-gez-Ethi-Latn-eae-2003.yaml +76 -0
  79. data/spec/interscript/filenames_spec.rb +6 -369
  80. data/spec/interscript_spec.rb +10 -2
  81. metadata +50 -7
  82. data/lib/interscript/opal/map_translate.rb +0 -7
@@ -0,0 +1,251 @@
1
+ ---
2
+ authority_id: un
3
+ id: 1972
4
+ language: iso-639-2:mal
5
+ source_script: Mlym
6
+ destination_script: Latn
7
+ name: REPORT ON THE CURRENT STATUS OF UNITED NATIONS ROMANIZATION SYSTEMS FOR GEOGRAPHICAL NAMES --Malayalam Romanization Version 4.0
8
+ url: https://www.eki.ee/wgrs/rom1_ml.htm
9
+ creation_date: 1972
10
+ confirmation_date: 2016
11
+ description: |
12
+ The United Nations recommended system was approved in 1972 (II/11) and amended in 1977 (III/12),
13
+ based on a report prepared by D. N. Sharma. The tables and their corrections were published in
14
+ volume II of the conference reports.
15
+
16
+ There is no evidence of the use of the system either in India or in international cartographic products.
17
+
18
+ Malayalam (Malayāḷam) uses an alphasyllabic script whereby each character represents a syllable rather
19
+ than one sound. Vowels and diphthongs are marked in two ways: as independent characters (used syllable-initially)
20
+ and in an abbreviated form, to denote vowels after consonants. The romanization table is unambiguous but now
21
+ outdated because since the 1970s a new orthography has been introduced and the use of many character
22
+ combinations and ligatures has been simplified. Nevertheless the user of the romanization table would have to
23
+ recognize many ligatures not given in the original table. The system is mostly reversible but there exist some
24
+ ambiguities in the romanization of vowels (independent vs. abbreviated characters) and
25
+ consonants (ligatures vs. character sequences), particularly in the case of older orthography.
26
+
27
+
28
+ notes:
29
+ - |
30
+ ടു For traditional script forms ഖു khu, മു mu, etc., exceptionally കു ku (ക്കു kku, ങ്കു ṅku), ഗു gu, ഛു chhu, ജു ju, ണു ṇu, തു tu, നു nu (ന്നു nnu), ഭു bhu, രു ru, ശു shu, ഹു hu
31
+ - |
32
+ ടൂ For traditional script forms ഖൂ khū, മൂ mū, etc., exceptionally കൂ kū, ഗൂ gū, ഛൂ chhū, ജൂ jū, ണൂ ṇū, തൂ tū, നൂ nū, ഭൂ bhū, രൂ rū, ശൂ shū, ഹൂ hū
33
+ - |
34
+ ടൃ Traditionally written in conjunction with the consonant character: കൃ kṛ .
35
+ - |
36
+ ടൗ In the older spelling: ൌ.
37
+ - |
38
+ ട്‌ Indicates absence of the inherent short [a] vowel, e.g. ക്‌ k , സ്‌ s. Special, so-called chillu-forms of consonants with that symbol: ണ്‍ ṇ, ന്‍ n, ര്‍ r, ല്‍ l, ള്‍ ḷ.
39
+ - |
40
+ റ Special ligature: റ്റ ṭ̈.
41
+
42
+ tests:
43
+ - source: "ചൈനയ്ക്കെതിരെ ലഡാക്കിൽ സദാസജ്ജം; യുഎസിൽനിന്ന് ൭൨,൫൦൦ സിഗ്–൧൬ റൈഫിൾ"
44
+ expected: "chainaykkĕtirĕ laḍākkil sadāsajjaṃ; yuĕsilninn 72,500 sig–16 ṟaiphiḷ"
45
+ - source: "സർഗഭൂമിക’യ്ക്കില്ല; ലളിതച്ചേച്ചി അങ്ങനെ പറഞ്ഞിട്ടുണ്ടാവില്ല: ആർഎൽവി രാമകൃഷ്ണൻ"
46
+ expected: "sargabhūmika’ykkilla; laḷitachchechchi aṅṅanĕ paṟaññiṭṭuṇṭāvilla: ārĕlvi rāmakṛṣhṇan"
47
+ - source: "സ്വർണക്കടത്ത്‌: ഫൈസൽ ഫരീദും റബിന്‍സും ദുബായിൽ അറസ്റ്റിലായെന്ന്‌ എന്‍ഐഎ"
48
+ expected: "svarṇakkaṭatt: phaisal pharīduṃ ṟabinsuṃ dubāyil aṟasṟṟilāyĕnn ĕnaiĕ"
49
+ - source: "വരുമോ ചൈനയുടെ വാക്സീൻ?; ആഗോള ഉപയോഗത്തിന് ഡബ്ല്യുഎച്ച്ഒയുമായി ചർച്ച"
50
+ expected: "varumo chainayuṭĕ vāksīn?; āgoḷa upayogattin ḍablyuĕchchŏyumāyi charchcha"
51
+ - source: "കുട്ടികളുടെ മാനസിക പിരിമുറുക്കം മാറ്റാൻ പരിശീലനം; ക്ലാസുമായി പോക്സോ പ്രതി"
52
+ expected: "kuṭṭikaḷuṭĕ mānasika pirimuṟukkaṃ māṟṟān parishīlanaṃ; klāsumāyi pokso prati"
53
+ - source: "ആദ്യം അമിത് ഷാ, ഇപ്പോൾ മോദി; ബിജെപിയെ പുണരാൻ ജഗൻ; ആന്ധ്രയിലെ കരുനീക്കങ്ങൾ"
54
+ expected: "ādyaṃ amit ṣhā, ippoḷ modi; bijĕpiyĕ puṇarān jagan; āndhrayilĕ karunīkkaṅṅaḷ"
55
+ - source: "ലഹരിമരുന്ന് കേസ്: ബിനീഷ് കോടിയേരിയെ ഇഡി 6 മണിക്കൂർ ചോദ്യം ചെയ്തു"
56
+ expected: "laharimarunn kes: binīṣh koṭiyeriyĕ iḍi 6 maṇikkūr chodyaṃ chĕytu"
57
+ - source: "ഈന്തപ്പഴം വിതരണം ചെയ്തത് ശിവശങ്കര്‍ പറഞ്ഞതു പ്രകാരം: ടി.വി അനുപമയുടെ മൊഴി"
58
+ expected: "īntappaḻaṃ vitaraṇaṃ chĕytat shivashaṅkar paṟaññatu prakāraṃ: ṭi.vi anupamayuṭĕ mŏḻi"
59
+ - source: "൫൦൦൦ മണിക്കൂർ കാത്തിരിക്കാൻ തയാറെന്ന് രാഹുൽ: ഒടുവിൽ വഴങ്ങി ഹരിയാന"
60
+ expected: "5000 maṇikkūr kāttirikkān tayāṟĕnn rāhul: ŏṭuvil vaḻaṅṅi hariyāna"
61
+ - source: "കാരണം ഷോര്‍ട്ട്‌സര്‍ക്യൂട്ടല്ല; കത്തിയത് ഫയല്‍ മാത്രം, സാനിറ്റൈസര്‍ ഉള്‍പ്പെടെ കത്തിയില്ല"
62
+ expected: "kāraṇaṃ ṣhorṭṭsarkyūṭṭalla; kattiyat phayal mātraṃ, sāniṟṟaisar uḷppĕṭĕ kattiyilla"
63
+ - source: "വിമൺ സയൻറിസ്റ്റ്സ് സ്കീം"
64
+ expected: "vimaṇ sayanṟisṟṟs skīṃ"
65
+
66
+ map:
67
+
68
+ rules:
69
+ - pattern: ([ക]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
70
+ result: 'k'
71
+ - pattern: ([ഖ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
72
+ result: 'kh'
73
+ - pattern: ([ഗ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
74
+ result: 'g'
75
+ - pattern: ([ഘ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
76
+ result: 'gh'
77
+ - pattern: ([ങ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
78
+ result: 'ṅ'
79
+ - pattern: ([ച]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
80
+ result: 'ch'
81
+ - pattern: ([ഛ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
82
+ result: 'chh'
83
+ - pattern: ([ജ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
84
+ result: 'j'
85
+ - pattern: ([ഝ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
86
+ result: 'jh'
87
+ - pattern: ([ഞ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
88
+ result: 'ñ'
89
+ - pattern: ([ട]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
90
+ result: 'ṭ'
91
+ - pattern: ([ഠ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
92
+ result: 'ṭh'
93
+ - pattern: ([ഡ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
94
+ result: 'ḍ'
95
+ - pattern: ([ഢ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
96
+ result: 'ḍh'
97
+ - pattern: ([ണ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
98
+ result: 'ṇ'
99
+ - pattern: ([ത]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
100
+ result: 't'
101
+ - pattern: ([ഥ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
102
+ result: 'th'
103
+ - pattern: ([ദ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
104
+ result: 'd'
105
+ - pattern: ([ധ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
106
+ result: 'dh'
107
+ - pattern: ([ന]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
108
+ result: 'n'
109
+ - pattern: ([പ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
110
+ result: 'p'
111
+ - pattern: ([ഫ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
112
+ result: 'ph'
113
+ - pattern: ([ബ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
114
+ result: 'b'
115
+ - pattern: ([ഭ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
116
+ result: 'bh'
117
+ - pattern: ([മ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
118
+ result: 'm'
119
+ - pattern: ([യ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
120
+ result: 'y'
121
+ - pattern: ([ര]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
122
+ result: 'r'
123
+ - pattern: ([ല]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
124
+ result: 'l'
125
+ - pattern: ([വ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
126
+ result: 'v'
127
+ - pattern: ([ശ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
128
+ result: 'sh'
129
+ - pattern: ([ഷ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
130
+ result: 'ṣh'
131
+ - pattern: ([സ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
132
+ result: 's'
133
+ - pattern: ([ഹ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
134
+ result: 'h'
135
+ - pattern: ([ള]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
136
+ result: 'ḷ'
137
+ - pattern: ([ഴ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
138
+ result: 'ḻ'
139
+ - pattern: ([റ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
140
+ result: 'ṟ'
141
+ - pattern: ([ക്ഷ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
142
+ result: 'kṣh'
143
+
144
+ characters:
145
+ # I. Independent vowel characters
146
+ 'അ': 'a'
147
+ 'ആ': 'ā'
148
+ 'ഇ': 'i'
149
+ 'ഈ': 'ī'
150
+ 'ഉ': 'u'
151
+ 'ഊ': 'ū'
152
+ 'ഋ': "ṛ"
153
+ 'എ': 'ĕ'
154
+ 'ഏ': 'e'
155
+ 'ഐ': 'ai'
156
+ 'ഒ': 'ŏ'
157
+ 'ഓ': 'o'
158
+ 'ഔ': 'au'
159
+
160
+ # II. Abbreviated vowel characters
161
+ 'ാ': 'ā'
162
+ 'ി': 'i'
163
+ 'ീ': 'ī'
164
+ 'ു': 'u'
165
+ 'ൂ': 'ū'
166
+ 'ൃ': "ṛ"
167
+ 'െ': "ĕ"
168
+ 'േ': "e"
169
+ 'ൈ': "ai"
170
+ 'ൊ': 'ŏ'
171
+ 'ോ': 'o'
172
+ 'ൌ': 'au'
173
+
174
+ #III. Other symbols
175
+ 'ഃ': 'ḥ'
176
+ 'ം': 'ṃ'
177
+ '്': ''
178
+
179
+ #IV. Consonant characters
180
+ 'ക': 'ka'
181
+ 'ഖ': 'kha'
182
+ 'ഗ': 'ga'
183
+ 'ഘ': 'gha'
184
+ 'ങ': 'ṅa'
185
+ 'ച': 'cha'
186
+ 'ഛ': 'chha'
187
+ 'ജ': 'ja'
188
+ 'ഝ': 'jha'
189
+ 'ഞ': 'ña'
190
+ 'ട': 'ṭa'
191
+ 'ഠ': 'ṭha'
192
+ 'ഡ': 'ḍa'
193
+ 'ഢ': 'ḍha'
194
+ 'ണ': 'ṇa'
195
+ 'ത': 'ta'
196
+ 'ഥ': 'tha'
197
+ 'ദ': 'da'
198
+ 'ധ': 'dha'
199
+ 'ന': 'na'
200
+ 'പ': 'pa'
201
+ 'ഫ': 'pha'
202
+ 'ബ': 'ba'
203
+ 'ഭ': 'bha'
204
+ 'മ': 'ma'
205
+ 'യ': 'ya'
206
+ 'ര': 'ra'
207
+ 'ല': 'la'
208
+ 'വ': 'va'
209
+ 'ശ': 'sha'
210
+ 'ഷ': 'ṣha'
211
+ 'സ': 'sa'
212
+ 'ഹ': 'ha'
213
+ 'ക്ഷ': 'kṣha'
214
+ 'ള': 'ḷa'
215
+ 'ഴ': 'ḻa'
216
+ 'റ': 'ṟa'
217
+ 'റ്റ': 'ṭ̈'
218
+
219
+
220
+ '्': ''
221
+ '़': ''
222
+ 'ൗ': ''
223
+ "‍": '' # no need for zero width joiner
224
+ "‌": '' # no need for zero width non-joiner
225
+
226
+
227
+ # numbers
228
+ '൦': '0'
229
+ '൧': '1'
230
+ '൨': '2'
231
+ '൩': '3'
232
+ '൪': '4'
233
+ '൫': '5'
234
+ '൬': '6'
235
+ '൭': '7'
236
+ '൮': '8'
237
+ '൯': '9'
238
+ '൰': '10'
239
+ '൱': '100'
240
+ '൲': '1000'
241
+
242
+
243
+ # chillu-forms of consonants note 5
244
+ 'ൿ': 'k'
245
+ 'ൺ': 'ṇ'
246
+ 'ൻ': 'n'
247
+ 'ൽ': 'l'
248
+ 'ൾ': 'ḷ'
249
+ 'ർ': 'r'
250
+ 'സ്': 's'
251
+
@@ -31,33 +31,44 @@ notes:
31
31
  - |
32
32
  The following independent characters are sometimes used: अि i, अी ī, अु u, अू ū, अे e, अै ai.
33
33
 
34
+ ######################################## Additional Note ############################################################
35
+ # It is recommended that the vowel अ (a) always be romanized except when it ends a #
36
+ # name. The scheme cannot yet detect names. From analysing language patterns and the examples, #
37
+ # we found that when a word ends with a consonant it should be transliterated without the inherent vowel. #
38
+ # So we apply this rule: when a word ends with a consonant, the trailing 'a' is removed. #
39
+ #####################################################################################################################
40
+
34
41
  tests:
42
+ - source: "महाराष्ट्र"
43
+ expected: "mahārāṣhṭr"
44
+ - source: "मुंबई"
45
+ expected: "muṁbaī"
35
46
  - source: "परिपक्क"
36
- expected: "paraipakka"
47
+ expected: "paripakk"
37
48
  - source: "ठाणे - जिल्ह्यात बुधवारी एक हजार रुग्णांची वाढ, तर जणांच्या मृत्यूची नोंद"
38
- expected: "ṭhaāṇae - jailhayaāta baudhavaāraī eka hajaāra raugṇaāṁchaī vaāḍha, tara jaṇaāṁchyaā maṛtyaūchaī naoṁda"
49
+ expected: "ṭhāṇe - jilhyāt budhavārī ek hajār rugṇāṁchī vāḍh, tar jaṇāṁchyā mṛtyūchī noṁd"
39
50
  - source: "एकता कपूर पुन्हा अडकली वादात, वेबसीरिजमधल्या 'त्या' सीनमुळे जमावाची घरावर दगडफेक"
40
- expected: "ekataā kapaūra paunhaā aḍakalaī vaādaāta, vaebasaīraijamadhalyaā 'tyaā' saīnamauḷae jamaāvaāchaī gharaāvara dagaḍaphaeka"
51
+ expected: "ekatā kapūr punhā aḍakalī vādāt, vebasīrijamadhalyā 'tyā' sīnamuḷae jamāvāchī gharāvar dagaḍaphek"
41
52
  - source: "जाणून घ्या, बीएमसीच्या अधिकाऱ्यांनी कंगना राणौतच्या ऑफिसमधले नक्की काय- काय तोडलं"
42
- expected: "jaāṇaūna ghyaā, baīemasaīchyaā adhaikaāryaāṁnaī kaṁganaā raāṇaautachyaā ôphaisamadhalae nakkaī kaāya- kaāya taoḍalaṁ"
53
+ expected: "jāṇūn ghyā, bīemasīchyā adhikāryāṁnī kaṁganā rāṇautachyā ôphisamadhale nakkī kāy- kāy toḍalaṁ"
43
54
  - source: "कंगना मुंबईत दाखल होण्यापूर्वी 'मातोश्री'वरून फर्मान सुटले; प्रवक्त्यांना सक्त आदेश"
44
- expected: "kaṁganaā mauṁbaīta daākhala haoṇyaāpaūrvaī 'maātaoshraī'varaūna pharmaāna sauṭalae; pravaktyaāṁnaā sakta ādaesha"
55
+ expected: "kaṁganā muṁbaīt dākhal hoṇyāpūrvī 'mātoshrī'varūn pharmān suṭale; pravaktyāṁnā sakt ādesh"
45
56
  - source: "मराठा आरक्षणास तात्पुरती स्थगिती; सर्वोच्च न्यायालयाचा निर्णय"
46
- expected: "maraāṭhaā ārakṣhaṇaāsa taātpaurataī sthagaitaī; sarvaochcha nyaāyaālayaāchaā nairṇaya"
57
+ expected: "marāṭhā ārakṣhaṇās tātpuratī sthagitī; sarvochch nyāyālayāchā nirṇay"
47
58
  - source: "भारताच्या तिन्ही लशींचा पहिला टप्पा यशस्वी, वाचा कधी येणार बाजारात"
48
- expected: "bhaārataāchyaā tainhaī lashaīṁchaā pahailaā ṭappaā yashasvaī, vaāchaā kadhaī yaeṇaāra baājaāraāta"
59
+ expected: "bhāratāchyā tinhī lashīṁchā pahilā ṭappā yashasvī, vāchā kadhī yeṇār bājārāt"
49
60
  - source: "रुग्णवाढीमुळे खाटांची चणचण"
50
- expected: "raugṇavaāḍhaīmauḷae khaāṭaāṁchaī chaṇachaṇa"
61
+ expected: "rugṇavāḍhīmuḷae khāṭāṁchī chaṇachaṇ"
51
62
  - source: "पीएम स्वनिधी कर्ज योजनेला मुंबईतून अल्प प्रतिसाद"
52
- expected: "paīema svanaidhaī karja yaojanaelaā mauṁbaītaūna alpa prataisaāda"
63
+ expected: "pīem svanidhī karj yojanelā muṁbaītūn alp pratisād"
53
64
  - source: "सांताक्रूझ-चेंबूर लिंक रोडवरील उन्नत मार्गाला स्थगिती"
54
- expected: "saāṁtaākraūjha-chaeṁbaūra laiṁka raoḍavaraīla unnata maārgaālaā sthagaitaī"
65
+ expected: "sāṁtākrūjh-cheṁbūr liṁk roḍavarīl unnat mārgālā sthagitī"
55
66
  - source: "संपादक अर्णब गोस्वामी यांच्याविरूद्ध खडक पोलिस ठाण्यात तक्रार"
56
- expected: "saṁpaādaka arṇaba gaosvaāmaī yaāṁchyaāvairaūddha khaḍaka paolaisa ṭhaāṇyaāta takraāra"
67
+ expected: "saṁpādak arṇab gosvāmī yāṁchyāvirūddh khaḍak polis ṭhāṇyāt takrār"
57
68
  - source: "करणाऱ्या मुलांना अनुक्रमे प्ले ग्रूप"
58
- expected: "karaṇaāryaā maulaāṁnaā anaukramae plae graūpa"
69
+ expected: "karaṇāryā mulāṁnā anukrame ple grūp"
59
70
  - source: "राज्यातील शाळा दिवाळीपर्यंत बंद, मंत्र्यांच्या बैठकीत निर्णय, शिक्षकांची जबाबदारी वाढली"
60
- expected: "raājyaātaīla shaāḷaā daivaāḷaīparyaṁta baṁda, maṁtryaāṁchyaā baaiṭhakaīta nairṇaya, shaikṣhakaāṁchaī jabaābadaāraī vaāḍhalaī"
71
+ expected: "rājyātīl shāḷaā divāḷaīparyaṁt baṁd, maṁtryāṁchyā baiṭhakīt nirṇay, shikṣhakāṁchī jabābadārī vāḍhalī"
61
72
 
62
73
  map:
63
74
  inherit: "un-hin-Deva-Latn-2016"
@@ -86,169 +86,88 @@ tests:
86
86
  map:
87
87
 
88
88
  rules:
89
- - pattern: ([क]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
89
+ - pattern: (([क]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d]))|(([क])(?=\b))
90
90
  result: 'k'
91
- - pattern: ([ख]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
91
+ - pattern: (([ख]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d]))|(([ख])(?=\b))
92
92
  result: 'kh'
93
- - pattern: ([ग]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
93
+ - pattern: (([ग]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d]))|(([ग])(?=\b))
94
94
  result: 'g'
95
- - pattern: ([घ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
95
+ - pattern: (([घ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d]))|(([घ])(?=\b))
96
96
  result: 'gh'
97
- - pattern: ([ङ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
97
+ - pattern: (([ङ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d]))|(([ङ])(?=\b))
98
98
  result: 'ṅ'
99
- - pattern: ([च]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
99
+ - pattern: (([च]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d]))|(([च])(?=\b))
100
100
  result: 'ch'
101
- - pattern: ([छ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
101
+ - pattern: (([छ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d]))|(([छ])(?=\b))
102
102
  result: 'chh'
103
- - pattern: ([ज]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
103
+ - pattern: (([ज]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d]))|(([ज])(?=\b))
104
104
  result: 'j'
105
- - pattern: ([झ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
105
+ - pattern: (([झ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d]))|(([झ])(?=\b))
106
106
  result: 'jh'
107
- - pattern: ([ञ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
107
+ - pattern: (([ञ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d]))|(([ञ])(?=\b))
108
108
  result: 'ñ'
109
- - pattern: ([ट]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
109
+ - pattern: (([ट]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d]))|(([ट])(?=\b))
110
110
  result: 'ṭ'
111
- - pattern: ([ठ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
111
+ - pattern: (([ठ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d]))|(([ठ])(?=\b))
112
112
  result: 'ṭh'
113
- - pattern: ([ड]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
113
+ - pattern: (([ड]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d]))|(([ड])(?=\b))
114
114
  result: 'ḍ'
115
- - pattern: ([ढ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
115
+ - pattern: (([ढ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d]))|(([ढ])(?=\b))
116
116
  result: 'ḍh'
117
- - pattern: ([ण]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
117
+ - pattern: (([ण]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d]))|(([ण])(?=\b))
118
118
  result: 'ṇ'
119
- - pattern: ([त]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
119
+ - pattern: (([त]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d]))|(([त])(?=\b))
120
120
  result: 't'
121
- - pattern: ([थ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
121
+ - pattern: (([थ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d]))|(([थ])(?=\b))
122
122
  result: 'th'
123
- - pattern: ([द]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
123
+ - pattern: (([द]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d]))|(([द])(?=\b))
124
124
  result: 'd'
125
- - pattern: ([ध]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
125
+ - pattern: (([ध]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d]))|(([ध])(?=\b))
126
126
  result: 'dh'
127
- - pattern: ([न]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
127
+ - pattern: (([न]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d]))|(([न])(?=\b))
128
128
  result: 'n'
129
- - pattern: ([प]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
129
+ - pattern: (([प]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d]))|(([प])(?=\b))
130
130
  result: 'p'
131
- - pattern: ([फ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
131
+ - pattern: (([फ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d]))|(([फ])(?=\b))
132
132
  result: 'ph'
133
- - pattern: ([ब]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
133
+ - pattern: (([ब]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d]))|(([ब])(?=\b))
134
134
  result: 'b'
135
- - pattern: ([भ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
135
+ - pattern: (([भ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d]))|(([भ])(?=\b))
136
136
  result: 'bh'
137
- - pattern: ([म]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
137
+ - pattern: (([म]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d]))|(([म])(?=\b))
138
138
  result: 'm'
139
- - pattern: ([य]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
139
+ - pattern: (([य]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d]))|(([य])(?=\b))
140
140
  result: 'y'
141
- - pattern: ([र]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
141
+ - pattern: (([र]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d]))|(([र])(?=\b))
142
142
  result: 'r'
143
- - pattern: ([ल]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
143
+ - pattern: (([ल]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d]))|(([ल])(?=\b))
144
144
  result: 'l'
145
- - pattern: ([व]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
145
+ - pattern: (([व]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d]))|(([व])(?=\b))
146
146
  result: 'v'
147
- - pattern: ([श]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
147
+ - pattern: (([श]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d]))|(([श])(?=\b))
148
148
  result: 'sh'
149
- - pattern: ([ष]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
149
+ - pattern: (([ष]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d]))|(([ष])(?=\b))
150
150
  result: 'ṣh'
151
- - pattern: ([स]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
151
+ - pattern: (([स]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d]))|(([स])(?=\b))
152
152
  result: 's'
153
- - pattern: ([क़]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
153
+ - pattern: (([क़]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d]))|(([क़])(?=\b))
154
154
  result: 'q'
155
- - pattern: ([ख़]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
155
+ - pattern: (([ख़]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d]))|(([ख़])(?=\b))
156
156
  result: 'ḳh'
157
- - pattern: ([ग़]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
157
+ - pattern: (([ग़]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d]))|(([ग़])(?=\b))
158
158
  result: 'g'
159
- - pattern: ([ज़]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
159
+ - pattern: (([ज़]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d]))|(([ज़])(?=\b))
160
160
  result: 'z'
161
- - pattern: ([ड़]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
161
+ - pattern: (([ड़]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d]))|(([ड़])(?=\b))
162
162
  result: 'ṙ'
163
- - pattern: ([ढ़]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
163
+ - pattern: (([ढ़]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d]))|(([ढ़])(?=\b))
164
164
  result: 'ṙh'
165
- - pattern: ([फ़]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
165
+ - pattern: (([फ़]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d]))|(([फ़])(?=\b))
166
166
  result: 'f'
167
- - pattern: ([ह]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
167
+ - pattern: (([ह]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d]))|(([ह])(?=\b))
168
168
  result: 'h'
169
169
 
170
170
 
171
- - pattern: ([क])(?=\b)
172
- result: 'k'
173
- - pattern: ([ख])(?=\b)
174
- result: 'kh'
175
- - pattern: ([ग])(?=\b)
176
- result: 'g'
177
- - pattern: ([घ])(?=\b)
178
- result: 'gh'
179
- - pattern: ([ङ])(?=\b)
180
- result: 'ṅ'
181
- - pattern: ([च])(?=\b)
182
- result: 'ch'
183
- - pattern: ([छ])(?=\b)
184
- result: 'chh'
185
- - pattern: ([ज])(?=\b)
186
- result: 'j'
187
- - pattern: ([झ])(?=\b)
188
- result: 'jh'
189
- - pattern: ([ञ])(?=\b)
190
- result: 'ñ'
191
- - pattern: ([ट])(?=\b)
192
- result: 'ṭ'
193
- - pattern: ([ठ])(?=\b)
194
- result: 'ṭh'
195
- - pattern: ([ड])(?=\b)
196
- result: 'ḍ'
197
- - pattern: ([ढ])(?=\b)
198
- result: 'ḍh'
199
- - pattern: ([ण])(?=\b)
200
- result: 'ṇ'
201
- - pattern: ([त])(?=\b)
202
- result: 't'
203
- - pattern: ([थ])(?=\b)
204
- result: 'th'
205
- - pattern: ([द])(?=\b)
206
- result: 'd'
207
- - pattern: ([ध])(?=\b)
208
- result: 'dh'
209
- - pattern: ([न])(?=\b)
210
- result: 'n'
211
- - pattern: ([प])(?=\b)
212
- result: 'p'
213
- - pattern: ([फ])(?=\b)
214
- result: 'ph'
215
- - pattern: ([ब])(?=\b)
216
- result: 'b'
217
- - pattern: ([भ])(?=\b)
218
- result: 'bh'
219
- - pattern: ([म])(?=\b)
220
- result: 'm'
221
- - pattern: ([य])(?=\b)
222
- result: 'y'
223
- - pattern: ([र])(?=\b)
224
- result: 'r'
225
- - pattern: ([ल])(?=\b)
226
- result: 'l'
227
- - pattern: ([व])(?=\b)
228
- result: 'v'
229
- - pattern: ([श])(?=\b)
230
- result: 'sh'
231
- - pattern: ([ष])(?=\b)
232
- result: 'ṣh'
233
- - pattern: ([स])(?=\b)
234
- result: 's'
235
- - pattern: ([क़])(?=\b)
236
- result: 'q'
237
- - pattern: ([ख़])(?=\b)
238
- result: 'ḳh'
239
- - pattern: ([ग़])(?=\b)
240
- result: 'g'
241
- - pattern: ([ज़])(?=\b)
242
- result: 'z'
243
- - pattern: ([ड़])(?=\b)
244
- result: 'ṙ'
245
- - pattern: ([ढ़])(?=\b)
246
- result: 'ṙh'
247
- - pattern: ([फ़])(?=\b)
248
- result: 'f'
249
- - pattern: ([ह])(?=\b)
250
- result: 'h'
251
-
252
171
  characters:
253
172
 
254
173
  # Vowels and Diphthongs