interscript 0.1.7 → 0.1.9

Sign up to get free protection for your applications and to get access to all the features.
Files changed (82) hide show
  1. checksums.yaml +4 -4
  2. data/README.adoc +1 -3
  3. data/aliases.json +1 -0
  4. data/lib/interscript.rb +8 -3
  5. data/lib/interscript/fs.rb +27 -0
  6. data/lib/interscript/mapping.rb +3 -1
  7. data/lib/interscript/opal.rb +142 -3
  8. data/lib/interscript/opal/entrypoint.rb +8 -0
  9. data/lib/interscript/opal/exports.rb +11 -0
  10. data/lib/interscript/opal/maps.js.erb +2 -4
  11. data/lib/interscript/version.rb +1 -1
  12. data/maps/alalc-ara-Arab-Latn-1997.yaml +5 -5
  13. data/maps/alalc-asm-Deva-Latn-1997.yaml +104 -10
  14. data/maps/alalc-asm-Deva-Latn-2012.yaml +18 -3
  15. data/maps/alalc-aze-Arab-Latn-1997.yaml +376 -0
  16. data/maps/alalc-ben-Beng-Latn-1997.yaml +291 -0
  17. data/maps/alalc-div-Thaa-Latn-1997.yaml +211 -0
  18. data/maps/alalc-hin-Deva-Latn-1997.yaml +102 -10
  19. data/maps/alalc-hin-Deva-Latn-2011.yaml +19 -1
  20. data/maps/alalc-kan-Kana-Latn-1997.yaml +274 -0
  21. data/maps/alalc-kan-Kana-Latn-2011.yaml +63 -0
  22. data/maps/alalc-ori-Orya-Latn-1997.yaml +284 -0
  23. data/maps/alalc-ori-Orya-Latn-2011.yaml +67 -0
  24. data/maps/alalc-pra-Deva-Latn-2012.yaml +2 -2
  25. data/maps/alalc-san-Deva-Latn-2012.yaml +78 -9
  26. data/maps/alalc-tel-Telu-Latn-1997.yaml +284 -0
  27. data/maps/alalc-tel-Telu-Latn-2011.yaml +64 -0
  28. data/maps/az-aze-Cyrl-Latn-1939.yaml +105 -0
  29. data/maps/az-aze-Cyrl-Latn-1958.yaml +45 -0
  30. data/maps/bgnpcgn-ara-Arab-Latn-1956.yaml +3 -1
  31. data/maps/bgnpcgn-aze-Cyrl-Latn-1993.yaml +111 -104
  32. data/maps/bgnpcgn-bal-Arab-Latn-2008.yaml +329 -0
  33. data/maps/bgnpcgn-bul-Cyrl-Latn-1952.yaml +1 -1
  34. data/maps/bgnpcgn-div-Thaa-Latn-1988.yaml +75 -0
  35. data/maps/bgnpcgn-far-Latn-Latn-1964.yaml +28 -0
  36. data/maps/bgnpcgn-isl-Latn-Latn-1964.yaml +37 -0
  37. data/maps/bgnpcgn-kaz-Cyrl-Latn-1979.yaml +247 -0
  38. data/maps/bgnpcgn-kir-Cyrl-Latn-1979.yaml +218 -0
  39. data/maps/bgnpcgn-kur-Arab-Latn-2007.yaml +249 -0
  40. data/maps/bgnpcgn-per-Arab-Latn-1958.yaml +2 -0
  41. data/maps/bgnpcgn-prs-Arab-Latn-2007.yaml +87 -53
  42. data/maps/bgnpcgn-pus-Arab-Latn-1968.yaml +377 -0
  43. data/maps/bgnpcgn-srp-Cyrl-Latn-1962.yaml +73 -0
  44. data/maps/bgnpcgn-urd-Arab-Latn-2007.yaml +459 -0
  45. data/maps/{bis-knd-Knda-Latn-13194-1991.yaml → bis-kan-Kana-Latn-13194-1991.yaml} +2 -2
  46. data/maps/bis-ori-Orya-Latn-13194-1991.yaml +17 -2
  47. data/maps/iso-ara-Arab-Latn-233-1984.yaml +1 -1
  48. data/maps/{iso-kan-Knda-Latn-15919-2001.yaml → iso-kan-Kana-Latn-15919-2001.yaml} +1 -1
  49. data/maps/{mns-mon-Cyrl-Latn-5217-2012.yaml → masm-mon-Cyrl-Latn-5217-2012.yaml} +2 -2
  50. data/maps/{mns-mon-Latn-Cyrl-5217-2012.yaml → masm-mon-Latn-Cyrl-5217-2012.yaml} +1 -1
  51. data/maps/mv-div-Thaa-Latn-1987.yaml +200 -0
  52. data/maps/odni-ara-Arab-Latn-2004.yaml +137 -0
  53. data/maps/odni-ara-Arab-Latn-2015.yaml +20 -130
  54. data/maps/odni-bul-Cyrl-Latn-2005.yaml +90 -0
  55. data/maps/odni-fas-Arab-Latn-2004.yaml +276 -0
  56. data/maps/odni-hin-Deva-Latn-2004.yaml +182 -0
  57. data/maps/odni-mkd-Cyrl-Latn-2005.yaml +21 -0
  58. data/maps/odni-prs-Arab-Latn-2004.yaml +123 -0
  59. data/maps/{odni-per-Arab-Latn-2015.yaml → odni-prs-Arab-Latn-2015.yaml} +0 -0
  60. data/maps/odni-srp-Cyrl-Latn-2005.yaml +36 -0
  61. data/maps/odni-tuk-Cyrl-Latn-2015.yaml +170 -0
  62. data/maps/odni-ukr-Cyrl-Latn-2015.yaml +4 -0
  63. data/maps/un-ara-Arab-Latn-2017.yaml +1 -1
  64. data/maps/un-asm-Beng-Latn-1972.yaml +223 -0
  65. data/maps/un-guj-Gujr-Latn-1972.yaml +229 -0
  66. data/maps/un-hin-Deva-Latn-2016.yaml +104 -10
  67. data/maps/un-kan-Kana-Latn-2016.yaml +254 -0
  68. data/maps/un-mal-Mlym-Latn-1972.yaml +251 -0
  69. data/maps/un-mar-Deva-Latn-2016.yaml +24 -13
  70. data/maps/un-nep-Deva-Latn-1972.yaml +40 -121
  71. data/maps/un-ori-Orya-Latn-1972.yaml +247 -0
  72. data/maps/un-pan-Guru-Latn-1972.yaml +402 -0
  73. data/maps/un-prs-Arab-Latn-1967.yaml +236 -0
  74. data/maps/un-tam-Taml-Latn-1972.yaml +194 -0
  75. data/maps/un-tel-Telu-Latn-1972.yaml +270 -0
  76. data/maps/un-urd-Arab-Latn-1972.yaml +405 -0
  77. data/maps/var-amh-Ethi-Latn-eae-2003.yaml +466 -0
  78. data/maps/var-gez-Ethi-Latn-eae-2003.yaml +76 -0
  79. data/spec/interscript/filenames_spec.rb +6 -369
  80. data/spec/interscript_spec.rb +10 -2
  81. metadata +50 -7
  82. data/lib/interscript/opal/map_translate.rb +0 -7
@@ -0,0 +1,63 @@
1
+ ---
2
+ authority_id: alalc
3
+ id: 2011
4
+ language: iso-639-2:kan
5
+ source_script: Kana
6
+ destination_script: Latn
7
+ name: Kannada Romanization, 2011
8
+ url: http://catdir.loc.gov/catdir/cpso/romanization/kannada.pdf
9
+ creation_date: 2011
10
+ description: |
11
+ ALA-LC Romanization table for Kannada
12
+
13
+ notes:
14
+
15
+ - Only the vowel forms that appear at the beginning of a syllable are listed; the forms used for
16
+ vowels following a consonant can be found in grammars; no distinction between the two is
17
+ made in transliteration.
18
+
19
+ - |
20
+ The vowel a is implicit after all consonants and consonant clusters and is supplied in
21
+ transliteration, with the following exceptions:
22
+
23
+ a) when another vowel is indicated by its appropriate sign; and
24
+ b) when the absence of any vowel is indicated by the superscript sign (◌್).
25
+
26
+ - |
27
+ Exception: Anusvāra is transliterated by:
28
+
29
+ a) ṅ before gutturals,
30
+ b) ñ before palatals,
31
+ c) ṇ before cerebrals,
32
+ d) n before dentals, and
33
+ e) m before labials.
34
+
35
+
36
+ tests:
37
+ - source: "ಕರ್ಣಾಟಕ"
38
+ expected: "karṇāṭaka"
39
+ - source: "ಬೆಂಗಳೂರು"
40
+ expected: "beṅgaḷūru"
41
+ - source: "ಭಾರತದಲ್ಲಿ ಗಾಳಿ ಕಲುಷಿತವಾಗಿದೆ: ಹವಾಮಾನ ಬದಲಾವಣೆ ಸಮರ್ಥನೆಗೆ ಭಾರತವನ್ನು ಟೀಕಿಸಿದ ಟ್ರಂಪ್"
42
+ expected: "bhāratadalli gāḷi kaluṣitavāgide: havāmāna badalāvaṇe samarthanege bhāratavannu ṭīkisida ṭraṃp"
43
+ - source: "ಅಮೆರಿಕ ಅಧ್ಯಕ್ಷೀಯ ಚುನಾವಣೆ ಅಂತಿಮ ಚರ್ಚೆ: ಭಾರತದ ವಿರುದ್ಧ ಟ್ರಂಪ್ ಆರೋಪವೇನು?!"
44
+ expected: "amerika adhyakṣīya cunāvaṇe aṃtima carce: bhāratada viruddha ṭraṃp ārōpavēnu?!"
45
+ - source: "ಹೇಗಿದೆ ಅಮೆರಿಕನ್‌ ಚುನಾವಣ ಕಣ?"
46
+ expected: "hēgide amerikan cunāvaṇa kaṇa?"
47
+ - source: "ಫ್ರೀಜರ್ ನಲ್ಲಿಟ್ಟ ನೂಡಲ್ಸ್ ತಿಂದು ಒಂದೇ ಕುಟುಂಬದ ೯ ಮಂದಿ ಸಾವು: ೩ ಮಕ್ಕಳು ಅಪಾಯದಿಂದ ಪಾರು"
48
+ expected: "phrījar nalliṭṭa nūḍals tiṃdu oṃdē kuṭuṃbada 9 maṃdi sāvu: 3 makkaḷu apāyadinda pāru"
49
+ - source: "ಉಡುಪಿಯಲ್ಲಿ ಪ್ರಪ್ರಥಮ ಬಾರಿಗೆ ಪ್ರಾರಂಭವಾಗಿರುವ ದೇಶಿ ಉತ್ಪನ್ನಗಳ ಮಳಿಗೆ"
50
+ expected: "uḍupiyalli praprathama bārige prāraṃbhavāgiruva dēśi utpannagaḷa maḷige"
51
+ - source: "ಚಿಕ್ಕಮಗಳೂರು : ಪುಷ್ಪ ಸಮರ್ಪಣೆ ವೇಳೆ ಮಗಳನ್ನ ನೆನೆದು ಕಣ್ಣೀರಿಟ್ಟ ಮೃತ ಪೇದೆ ತಾಯಿ"
52
+ expected: "cikkamagaḷūru : puṣpa samarpaṇe vēḷe magaḷanna nenedu kaṇṇīriṭṭa mṛta pēde tāyi"
53
+ - source: "ಸಮಂಗಳೂರು: ಡ್ರಗ್ಸ್ ಜಾಗೃತಿ ಬರಹದಿಂದ ಗಮನಸೆಳೆಯುತ್ತಿದೆ ಸಿಟಿ ಬಸ್"
54
+ expected: "samaṅgaḷūru: ḍrags jāgṛti barahadinda gamanaseḷeyuttide siṭi bas"
55
+ - source: "ಪುರಸಭೆ, ಪಪಂ ಅಧ್ಯಕ್ಷ-ಉಪಾಧ್ಯಕ್ಷ ಚುನಾವಣೆಗೆ ಹೈಕೋರ್ಟ್‌ ಅಸ್ತು"
56
+ expected: "purasabhe, papaṃ adhyakṣa-upādhyakṣa cunāvaṇege haikōrṭ astu"
57
+ - source: "ಅಮೆರಿಕ ಅಧ್ಯಕ್ಷೀಯ ಚುನಾವಣೆ ಅಂತಿಮ ಚರ್ಚೆ: ಭಾರತದ ವಿರುದ್ಧ ಟ್ರಂಪ್ ಆರೋಪವೇನು?"
58
+ expected: "amerika adhyakṣīya cunāvaṇe aṃtima carce: bhāratada viruddha ṭraṃp ārōpavēnu?"
59
+ - source: "ಮನೆ ಕುಸಿದು ತಂದೆ ಮತ್ತು ಮಗ ಸಾವು, ಇನ್ನಿಬ್ಬರಿಗೆ ಗಾಯ: ಸ್ಥಳಕ್ಕೆ ಶಾಸಕರ ಭೇಟಿ"
60
+ expected: "mane kusidu taṃde mattu maga sāvu, innibbarige gāya: sthaḷakke śāsakara bhēṭi"
61
+
62
+ map:
63
+ inherit: 'alalc-kan-Kana-Latn-1997'
@@ -0,0 +1,284 @@
1
+ ---
2
+ authority_id: alalc
3
+ id: 1997
4
+ language: iso-639-2:ori
5
+ source_script: Orya
6
+ destination_script: Latn
7
+ name: Oriya Romanization, 1997
8
+ alias:
9
+ ogc11122:
10
+ code: ori_Orya2Latn_ALA_1997
11
+ description: Oriya ALA-Library of Congress 1997 System
12
+ url: http://catdir.loc.gov/catdir/cpso/romanization/oriya.pdf
13
+ creation_date: 1997
14
+ description: |
15
+ ALA-LC Romanization table for Oriya
16
+
17
+ notes:
18
+ - |
19
+ Only the vowel forms that appear at the beginning of a syllable are listed; the forms used for vowels following a
20
+ consonant can be found in grammars; no distinction between the two is made in transliteration.
21
+ - |
22
+ The vowel a is implicit after all consonants and consonant clusters and is supplied in
23
+ transliteration, with the following exceptions:
24
+ a) when another vowel is indicated by its appropriate sign; and
25
+ b) when the absence of any vowel is indicated by the subscript sign ( ୍ ) called hasanta.
26
+ - |
27
+ ବ is used both as a labial and as a semivowel. When it occurs as the second consonant of a
28
+ consonant cluster, it is transliterated va. When ବ is doubled, it is transliterated bba.
29
+ - |
30
+ Exception: Anusvāra is transliterated by:
31
+ a) ṅ before gutturals,
32
+ b) ñ before palatals,
33
+ c) ṇ before cerebrals,
34
+ d) n before dentals, and
35
+ e) m before labials.
36
+ - |
37
+ Candrabindu before guttural, palatal, cerebral, and dental occlusives is transliterated n̐.
38
+ Before labials, sibilants, semivowels, the aspirate, vowels, and in final position it is
39
+ transliterated m̐.
40
+ - When doubled, abagraha is transliterated by two apostrophes ( ’’ ).
41
+ tests:
42
+ - source: "ର୍କ"
43
+ expected: "rka"
44
+ - source: "ଓଡ଼ିଆ"
45
+ expected: "oṙiā"
46
+ - source: "ଓଡ଼ିଶା"
47
+ expected: "oṙiśā"
48
+ - source: "ଭୁବନେଶ୍ୱର"
49
+ expected: "bhubaneśwara"
50
+ - source: "ଆଇପିଏଲ୍‌-୧୩: ରୟାଲ ଚ୍ୟାଲେଞ୍ଜର୍ସ ବାଙ୍ଗାଲୋରକୁ ୫ ଓ୍ୱିକେଟରେ ପରାସ୍ତ କଲା ମୁମ୍ବାଇ ଇଣ୍ଡିଆନ୍ସ"
51
+ expected: "āipiel-13: raẏāla cẏāleñjarsa bāṅgāloraku 5 obikeṭare parāsta kalā mumbāi iṇḍiānsa"
52
+ - source: "ଓଡ଼ିଶା ସିଭିଲ ସର୍ଭିସେସ୍‌ ମେନ୍‌ ପରୀକ୍ଷା ଡିସେମ୍ବରରେ, ଜାଣନ୍ତୁ କେଉଁ ବିଷୟର ପରୀକ୍ଷା କେବେ"
53
+ expected: "oṙiśā sibhila sarbhises men parīkshā ḍisembarare, jāṇantu keum̐ bishaẏara parīkshā kebe"
54
+ - source: "ଗଞ୍ଜାମରେ କୋଭିଡ଼ ମୃତ୍ୟୁ ୨୨୮ରେ ପହଞ୍ଚିଲା"
55
+ expected: "gañjāmare keābhiṙa mṛtẏu 228re pahañcilā"
56
+ - source: "ଭାରତ ମହାସାଗର ଦ୍ବୀପରାଷ୍ଟ୍ର ଶ୍ରୀଲଙ୍କା ଓ ମାଳଦ୍ବୀପରେ ପମ୍ପିଓଙ୍କ ଚୀନ୍‌ବିରୋଧୀ ଅଭିଯାନ"
57
+ expected: "bhārata mahāsāgara dbīparāshṭra śrīlaṅkā o māḷadbīpare pampioṅka cīnbireādhī abhiyāna"
58
+ - source: "କଟକ ସହରରୁ ଆଜି ୩୯ କରୋନା ପଜିଟିଭ୍‌ ଚିହ୍ନଟ, ସ୍ଥାନୀୟ ଅଂଚଳରୁ ୨୪ ଜଣ ଆକ୍ରାନ୍ତ"
59
+ expected: "kaṭaka sahararu āji 39 karonā pajiṭibh cihnaṭa, sthānīẏa aṃcaḷaru 24 jaṇa ākrānta"
60
+ - source: "ବିଧାୟକ ସୌମ୍ୟରଂଜନଙ୍କ ମାରାଥନ ପ୍ରଚାର: ‘ଦ୍ୱିତୀୟବାର ସୁଯୋଗ ମିଳିଛି, ବୁଝି ବିଚାରି ଭୋଟ ଦିଅ’"
61
+ expected: "bidhāẏaka seୗmẏaraṃjanaṅka mārāthana pracāra: ‘dbitīẏabāra suyeāga miḷichi, bujhi bicāri bheāṭa dia’"
62
+ - source: "ଅଣ୍ଡା ବିଗାଡ଼ିଛି ପୁଷ୍ଟିକର ଖାଦ୍ୟ ଯୋଜନା ଅଙ୍କ"
63
+ expected: "aṇḍā bigāṙichi pushṭikara khādẏa yeājanā aṅka"
64
+ - source: "ପଥରଗଡ଼ ମଦ ମୃତ୍ୟୁ ମାମଲା : ଠିକାଦାର ସହ ବନ୍ଧାହେଲେ ୪"
65
+ expected: "patharagaḍa mada mṛtẏu māmalā : ṭhikādāra saha bandhāhele 4"
66
+ - source: "ତିର୍ତ୍ତୋଲର ବିକାଶ ନେଇ ବିଷ୍ଣୁବାବୁ ମୋତେ ବହୁ ବାର ଭେଟୁଥିଲେ: ନବୀନ"
67
+ expected: "tirtteālara bikāśa nei bishṇubābu mote bahu bāra bheṭuthile: nabīna"
68
+
69
+
70
+ map:
71
+
72
+ rules:
73
+ # Rule II
74
+ - pattern: ([କ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
75
+ result: 'k'
76
+ - pattern: ([ଖ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
77
+ result: 'kh'
78
+ - pattern: ([ଗ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
79
+ result: 'g'
80
+ - pattern: ([ଘ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
81
+ result: 'gh'
82
+ - pattern: ([ଙ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
83
+ result: 'ṅ'
84
+ - pattern: ([ଚ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
85
+ result: 'c'
86
+ - pattern: ([ଛ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
87
+ result: 'ch'
88
+ - pattern: ([ଜ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
89
+ result: 'j'
90
+ - pattern: ([ଝ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
91
+ result: 'jh'
92
+ - pattern: ([ଞ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
93
+ result: 'ñ'
94
+ - pattern: ([ଟ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
95
+ result: 'ṭ'
96
+ - pattern: ([ଠ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
97
+ result: 'ṭh'
98
+ - pattern: ([ଡ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
99
+ result: 'ḍ'
100
+ - pattern: ([ଢ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
101
+ result: 'ḍh'
102
+ - pattern: ([ଣ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
103
+ result: 'ṇ'
104
+ - pattern: ([ତ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
105
+ result: 't'
106
+ - pattern: ([ଥ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
107
+ result: 'th'
108
+ - pattern: ([ଦ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
109
+ result: 'd'
110
+ - pattern: ([ଧ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
111
+ result: 'dh'
112
+ - pattern: ([ନ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
113
+ result: 'n'
114
+ - pattern: ([ପ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
115
+ result: 'p'
116
+ - pattern: ([ଫ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
117
+ result: 'ph'
118
+ - pattern: ([ବ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
119
+ result: 'b'
120
+ - pattern: ([ଭ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
121
+ result: 'bh'
122
+ - pattern: ([ମ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
123
+ result: 'm'
124
+ - pattern: ([ଯ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
125
+ result: 'y'
126
+ - pattern: ([ୟ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
127
+ result: 'ẏ'
128
+ - pattern: ([ର]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
129
+ result: 'r'
130
+ - pattern: ([ଲ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
131
+ result: 'l'
132
+ - pattern: ([ଳ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
133
+ result: 'ḷ'
134
+ - pattern: ([ଶ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
135
+ result: 'ś'
136
+ - pattern: ([ଷ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
137
+ result: 'sh'
138
+ - pattern: ([ସ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
139
+ result: 's'
140
+ - pattern: ([ହ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
141
+ result: 'h'
142
+ - pattern: ([ୱ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
143
+ result: 'b'
144
+ - pattern: ([ଡ଼]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
145
+ result: 'ṙ'
146
+ - pattern: ([ଢ଼]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
147
+ result: 'ṙh'
148
+
149
+ # Rule III
150
+ - pattern: ([ବ]=?)(?=[\u0b2c])
151
+ result: 'bba'
152
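+ # Rule IV -- NOTE(review): \u0902 below is DEVANAGARI SIGN ANUSVARA; the Oriya anusvāra is \u0b02, so these patterns probably never match Oriya input, and note item e) "m before labials" has no rule -- confirm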
153
+ - pattern: \u0902(?=[କଖଗଘଙ])
154
+ result: ṅ
155
+ - pattern: \u0902(?=[ଚଛଜଝଞ])
156
+ result: ñ
157
+ - pattern: \u0902(?=[ଟଠଡଢଣ])
158
+ result: ṇ
159
+ - pattern: \u0902(?=[ତଥଦଧନ])
160
+ result: n
161
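+ # Rule V -- NOTE(review): the empty lookbehind "(?<=)" in the second pattern always succeeds and looks like a leftover; confirm the intended "final position" condition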
162
+ - pattern: \u0b01(?=[ପଫବଭମଯୟରଲଳଶଷସହଅଆଇଈଉଊଋୠଌଏଐଓଔ])
163
+ result: "m̐"
164
+ - pattern: (?<=)\u0b01(?=\b)
165
+ result: "m̐"
166
+
167
+ characters:
168
+ 'ଅ': 'a'
169
+ 'ଆ': 'ā'
170
+ 'ଇ': 'i'
171
+ 'ଈ': 'ī'
172
+ 'ଉ': 'u'
173
+ 'ଊ': 'ū'
174
+ 'ଋ': 'ṛ'
175
+ 'ୠ': 'ṝ'
176
+ 'ଌ': 'ḻ'
177
+ 'ଏ': 'e'
178
+ 'ଐ': 'ai'
179
+ 'ଓ': 'o'
180
+ 'ଔ': 'au'
181
+
182
+ # II. Consonants (see Note 2)
183
+ # Gutturals
184
+ 'କ': 'ka'
185
+ 'ଖ': 'kha'
186
+ 'ଗ': 'ga'
187
+ 'ଘ': 'gha'
188
+ 'ଙ': 'ṅa'
189
+
190
+ # Palatals
191
+ 'ଚ': 'ca'
192
+ 'ଛ': 'cha'
193
+ 'ଜ': 'ja'
194
+ 'ଝ': 'jha'
195
+ 'ଞ': 'ña'
196
+
197
+ # Cerebrals
198
+ 'ଟ': 'ṭa'
199
+ 'ଠ': 'ṭha'
200
+ 'ଡ': 'ḍa'
201
+ 'ଢ': 'ḍha'
202
+ 'ଣ': 'ṇa'
203
+
204
+ # Dentals
205
+ 'ତ': 'ta'
206
+ 'ଥ': 'tha'
207
+ 'ଦ': 'da'
208
+ 'ଧ': 'dha'
209
+ 'ନ': 'na'
210
+
211
+ # Labials
212
+ 'ପ': 'pa'
213
+ 'ଫ': 'pha'
214
+ 'ବ': 'ba'
215
+ 'ଭ': 'bha'
216
+ 'ମ': 'ma'
217
+
218
+ # Semivowels
219
+ 'ଯ': 'ya'
220
+ 'ୟ': 'ẏa'
221
+ 'ର': 'ra'
222
+ 'ଲ': 'la'
223
+ 'ଳ': 'ḷa'
224
+
225
+ # Sibilants
226
+ 'ଶ': 'śa'
227
+ 'ଷ': 'sha'
228
+ 'ସ': 'sa'
229
+
230
+
231
+ # Aspirate
232
+ 'ହ': 'ha'
233
+
234
+ # Candrabindu
235
+ 'ଁ': 'n̐'
236
+
237
+ # Bisarga
238
+ 'ଃ': 'ḥ'
239
+
240
+ # Anusvāra
241
+ 'ଂ': 'ṃ'
242
+
243
+ # Abagraha
244
+ 'ଽ': "’"
245
+
246
+ # Medials # Needed for connecting consonants
247
+
248
+ 'ା': 'ā'
249
+ 'ି': 'i'
250
+ 'ୀ': 'ī'
251
+ 'ୁ': 'u'
252
+ 'ୂ': 'ū'
253
+ 'ୃ': 'ṛ'
254
+ 'େ': 'e'
255
+ 'ୈ': 'ai'
256
+ 'ୋ': 'o'
257
+ 'ୌ': 'au'
258
+
259
+ '्': ''
260
+ '୍': ''
261
+ '़': ''
262
+ '଼': ''
263
+ '।': '.'
264
+ "‍": ''# Used for joining
265
+ "‌": ''# Used for non joining
266
+
267
+ #Absent but used
268
+ 'ୱ': 'wa'
269
+ 'ଡ଼': 'ṙa'
270
+ 'ଢ଼': 'ṙha'
271
+
272
+ # Numbers
273
+
274
+ '୦': '0'
275
+ '୧': '1'
276
+ '୨': '2'
277
+ '୩': '3'
278
+ '୪': '4'
279
+ '୫': '5'
280
+ '୬': '6'
281
+ '୭': '7'
282
+ '୮': '8'
283
+ '୯': '9'
284
+
@@ -0,0 +1,67 @@
1
+ ---
2
+ authority_id: alalc
3
+ id: 2011
4
+ language: iso-639-2:ori
5
+ source_script: Orya
6
+ destination_script: Latn
7
+ name: Oriya Romanization, 2011
8
+ alias:
9
+ ogc11122:
10
+ code: ori_Orya2Latn_ALA_2011
11
+ description: Oriya ALA-Library of Congress 2011 System
12
+ url: https://www.loc.gov/catdir/cpso/romanization/oriya.pdf
13
+ creation_date: 2011
14
+ description: |
15
+ ALA-LC Romanization table for Oriya
16
+
17
+ notes:
18
+ - |
19
+ Only the vowel forms that appear at the beginning of a syllable are listed; the forms used for vowels following a
20
+ consonant can be found in grammars; no distinction between the two is made in transliteration.
21
+ - |
22
+ The vowel a is implicit after all consonants and consonant clusters and is supplied in
23
+ transliteration, with the following exceptions:
24
+ a) when another vowel is indicated by its appropriate sign; and
25
+ b) when the absence of any vowel is indicated by the subscript sign ( ୍ ) called hasanta.
26
+ - |
27
+ ବ is used both as a labial and as a semivowel. When it occurs as the second consonant of a
28
+ consonant cluster, it is transliterated va. When ବ is doubled, it is transliterated bba.
29
+ - |
30
+ Exception: Anusvāra is transliterated by:
31
+ a) ṅ before gutturals,
32
+ b) ñ before palatals,
33
+ c) ṇ before cerebrals,
34
+ d) n before dentals, and
35
+ e) m before labials.
36
+ - |
37
+ Candrabindu before guttural, palatal, cerebral, and dental occlusives is transliterated n̐.
38
+ Before labials, sibilants, semivowels, the aspirate, vowels, and in final position it is
39
+ transliterated m̐.
40
+ - When doubled, abagraha is transliterated by two apostrophes ( ’’ ).
41
+ tests:
42
+ - source: "ବିହାର ନିର୍ବାଚନ: ସନ୍ଧ୍ୟା ୬ଟା ସୁଦ୍ଧା ୫୩.୫୪ ପ୍ରତିଶତ ମତଦାନ"
43
+ expected: "bihāra nirbācana: sandhẏā 6ṭā suddhā 53.54 pratiśata matadāna"
44
+ - source: "ଡିସେମ୍ବର ସୁଦ୍ଧା ପ୍ରସ୍ତୁତ ହୋଇଯିବ ଅକ୍ସଫୋର୍ଡ କରୋନାଭାଇରସ୍ ଟିକା: ଅଦର ପୁନାୱାଲା"
45
+ expected: "ḍisembara suddhā prastuta heāiyiba aksapheārḍa kareānābhāiras ṭikā: adara punābālā"
46
+ - source: "କରୋନା ଆକ୍ରାନ୍ତ ହେଲେ କେନ୍ଦ୍ରମନ୍ତ୍ରୀ ସ୍ମୃତି ଇରାନୀ"
47
+ expected: "karonā ākrānta hele kendramantrī smṛti irānī"
48
+ - source: "ଆମେରିକା ଉପରେ ଉତ୍‌କ୍ଷିପ୍ତ ହୋଇ ଚୀନ୍ କହିଲା: ଭାରତ ସହ ଆମର ସୀମା ବିବାଦ ଦ୍ବିପାକ୍ଷିକ ମାମଲା"
49
+ expected: "āmerikā upare utkshipta heāi cīn kahilā: bhārata saha āmara sīmā bibāda dbipākshika māmalā"
50
+ - source: "ପରଲୋକରେ ଦକ୍ଷିଣ କୋରିଆର ସବୁଠୁ ଧନୀବ୍ୟକ୍ତି ‘ସାମ୍‌ସଙ୍ଗ୍’ ଅଧ୍ୟକ୍ଷ ଲି କୁନ୍-ହି; ଛାଡ଼ିଯାଇଛନ୍ତି ୨୧ ବିଲିୟନ୍ ଡଲାର୍‌ର ସାମ୍ରାଜ୍ୟ"
51
+ expected: "paraleākare dakshiṇa keāriāra sabuṭhu dhanībẏakti ‘sāmsaṅg’ adhẏaksha li kun-hi; chāṙiyāichanti 21 biliẏan ḍalārra sāmrājẏa"
52
+ - source: "ଉପନିର୍ବାଚନ ପାଇଁ ବାଲେଶ୍ୱରରେ ବିଜେଡିର ସମାବେଶ। (ଫଟୋ: ମନୋଜ ବିଶ୍ୱାଳ)"
53
+ expected: "upanirbācana pāim̐ bāleśwarare bijeḍira samābeśa. (phaṭo: manoja biśbāḷa)"
54
+ - source: "ନୂଆପଲ୍ଲୀ ଦୁର୍ଗାପୂଜା ମଣ୍ଡପ ବାହାରେ ମା’ଙ୍କୁ ପୂଜାର୍ଚ୍ଚନା କରୁଛନ୍ତି ଭକ୍ତ। (ଫଟୋ: ବିଭୂତି)"
55
+ expected: "nūāpallī durgāpūjā maṇḍapa bāhāre mā’ṅku pūjārccanā karuchanti bhakta. (phaṭo: bibhūti)"
56
+ - source: "ମା ଶାରଳାଙ୍କ ପୀଠରେ ଦଶମୀ ପୂଜା। (ଫଟୋ: ସୋମନାଥ, ଜଗତସିଂହପୁର ଟାଉନ୍‌)"
57
+ expected: "mā śāraḷāṅka pīṭhare daśamī pūjā. (phaṭo: somanātha, jagatasiṃhapura ṭāun)"
58
+ - source: "ଆଜି ବିହାରରେ ପ୍ରଥମ ପର୍ଯ୍ୟାୟ ଭୋଟ, ମହାମେଣ୍ଟ-ଏନ୍‌ଡିଏ କଡ଼ା ଟକ୍କର"
59
+ expected: "āji bihārare prathama paryẏāẏa bheāṭa, mahāmeṇṭa-enḍie kaṙā ṭakkara"
60
+ - source: "ନିର୍ବାଚନ ପ୍ରଚାରରୁ ଫେରି ନିଜ ଅଭିଜ୍ଞତା ବଖାଣି ଅମିଷା କହିଲେ, ‘କୌଣସି ପରିସ୍ଥିତିରେ ମୋର ସହିତ ଦୁଷ୍କର୍ମ ହେବାର ଆଶଙ୍କା ରହିଥିଲା’"
61
+ expected: "nirbācana pracāraru pheri nija abhijñatā bakhāṇi amishā kahile, ‘keୗṇasi paristhitire meāra sahita dushkarma hebāra āśaṅkā rahithilā’"
62
+ - source: "ବ୍ଲୁ ଫ୍ଲାଗ ବିଚ୍‌ରେ ଅଘଟଣ: ମା’ ଆଗରେ ସମୁଦ୍ରରେ ଭାସିଗଲେ ପୁଅ, ଖୋଜିବା ପାଇଁ ଲାଇଫଗାର୍ଡ ଟିମ୍‌ ନିୟୋଜିତ"
63
+ expected: "blu phlāga bicre aghaṭaṇa: mā’ āgare samudrare bhāsigale pua, kheājibā pāim̐ lāiphagārḍa ṭim niẏeājita"
64
+
65
+ map:
66
+
67
+ inherit: alalc-ori-Orya-Latn-1997
@@ -38,9 +38,9 @@ notes:
38
38
 
39
39
  tests:
40
40
  - source: "सृष्टिस्थितिविनाशानां शक्तिभूते सनातनि"
41
- expected: "saṛṣaṭaisathaitaivainaāśaānaāṃ śakataibhaūtae sanaātanai"
41
+ expected: "sṛṣṭisthitivināśānāṃ śaktibhūte sanātani"
42
42
  - source: "गुणाश्रये गुणमये नारायणि नमोऽस्तु ते"
43
- expected: "gauṇaāśarayae gauṇamayae naāraāyaṇai namaosatau tae"
43
+ expected: "guṇāśraye guṇamaye nārāyaṇi namostu te"
44
44
 
45
45
  map:
46
46
 
@@ -38,27 +38,96 @@ notes:
38
38
 
39
39
  tests:
40
40
  - source: "पूर्णमदः पूर्णमिदं पूर्णात् पूर्ण्मुदच्यते"
41
- expected: "paūraṇamadaḥ paūraṇamaidaṃ paūraṇaāta paūraṇamaudacayatae"
41
+ expected: "pūrṇamadaḥ pūrṇamidaṃ pūrṇāt pūrṇmudacyate"
42
42
  - source: "पूर्णस्य पूर्णमादाय पूर्णमेवावशिष्यते"
43
- expected: "paūraṇasaya paūraṇamaādaāya paūraṇamaevaāvaśaiṣayatae"
43
+ expected: "pūrṇasya pūrṇamādāya pūrṇamevāvaśiṣyate"
44
44
  - source: "यथा चतुर्भिः कनकं परीक्ष्यते निर्घषणच्छेदन तापताडनैः"
45
- expected: "yathaā cataurabhaiḥ kanakaṃ paraīkaṣayatae nairaghaṣaṇacachaedana taāpataāḍanaaiḥ"
45
+ expected: "yathā caturbhiḥ kanakaṃ parīkṣyate nirghaṣaṇacchedana tāpatāḍanaiḥ"
46
46
  - source: "तथा चतुर्भिः पुरुषः परीक्ष्यते त्यागेन शीलेन गुणेन कर्मणा"
47
- expected: "tathaā cataurabhaiḥ paurauṣaḥ paraīkaṣayatae tayaāgaena śaīlaena gauṇaena karamaṇaā"
47
+ expected: "tathā caturbhiḥ puruṣaḥ parīkṣyate tyāgena śīlena guṇena karmaṇā"
48
48
  - source: "यो न हृष्यति न द्वेष्टि न शोचति न काङ्‍क्षति"
49
- expected: "yao na haṛṣayatai na davaeṣaṭai na śaocatai na kaāṅakaṣatai"
49
+ expected: "yo na hṛṣyati na dveṣṭi na śocati na kāṅkṣati"
50
50
  - source: "शुभाशुभपरित्यागी भक्तिमान्यः स मे प्रियः"
51
- expected: "śaubhaāśaubhaparaitayaāgaī bhakataimaānayaḥ sa mae paraiyaḥ"
51
+ expected: "śubhāśubhaparityāgī bhaktimānyaḥ sa me priyaḥ"
52
52
  - source: "सत्य -सत्यमेवेश्वरो लोके सत्ये धर्मः सदाश्रितः"
53
- expected: "sataya -satayamaevaeśavarao laokae satayae dharamaḥ sadaāśaraitaḥ"
53
+ expected: "satya -satyameveśvaro loke satye dharmaḥ sadāśritaḥ"
54
54
  - source: "सत्यमूलनि सर्वाणि सत्यान्नास्ति परं पदम्"
55
- expected: "satayamaūlanai saravaāṇai satayaānanaāsatai paraṃ padama"
55
+ expected: "satyamūlani sarvāṇi satyānnāsti paraṃ padam"
56
56
  - source: "पिता माताग्निरात्मा च गुरुश्च भरतर्षभ"
57
- expected: "paitaā maātaāganairaātamaā ca gaurauśaca bharataraṣabha"
57
+ expected: "pitā mātāgnirātmā ca guruśca bharatarṣabha"
58
58
 
59
59
  map:
60
60
 
61
61
  rules:
62
+ # note [2]
63
+ - pattern: (क=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
64
+ result: 'k'
65
+ - pattern: (ख=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
66
+ result: 'kh'
67
+ - pattern: (ग=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
68
+ result: 'g'
69
+ - pattern: (घ=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
70
+ result: 'gh'
71
+ - pattern: (ङ=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
72
+ result: 'ṅ'
73
+ - pattern: (च=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
74
+ result: 'c'
75
+ - pattern: (छ=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
76
+ result: 'ch'
77
+ - pattern: (ज=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
78
+ result: 'j'
79
+ - pattern: (झ=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
80
+ result: 'jh'
81
+ - pattern: (ञ=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
82
+ result: 'ñ'
83
+ - pattern: (ट=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
84
+ result: 'ṭ'
85
+ - pattern: (ठ=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
86
+ result: 'ṭh'
87
+ - pattern: (ड=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
88
+ result: 'ḍ'
89
+ - pattern: (ढ=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
90
+ result: 'ḍh'
91
+ - pattern: (ण=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
92
+ result: 'ṇ'
93
+ - pattern: (त=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
94
+ result: 't'
95
+ - pattern: (थ=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
96
+ result: 'th'
97
+ - pattern: (द=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
98
+ result: 'd'
99
+ - pattern: (ध=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
100
+ result: 'dh'
101
+ - pattern: (न=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
102
+ result: 'n'
103
+ - pattern: (प=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
104
+ result: 'p'
105
+ - pattern: (फ=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
106
+ result: 'ph'
107
+ - pattern: (ब=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
108
+ result: 'b'
109
+ - pattern: (भ=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
110
+ result: 'bh'
111
+ - pattern: (म=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
112
+ result: 'm'
113
+ - pattern: (य=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
114
+ result: 'y'
115
+ - pattern: (र=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
116
+ result: 'r'
117
+ - pattern: (ल=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
118
+ result: 'l'
119
+ - pattern: (ळ=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
120
+ result: 'ḻ'
121
+ - pattern: (व=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
122
+ result: 'v'
123
+ - pattern: (श=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
124
+ result: 'ś'
125
+ - pattern: (ष=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
126
+ result: 'ṣ'
127
+ - pattern: (स=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
128
+ result: 's'
129
+ - pattern: (ह=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
130
+ result: 'h'
62
131
  # note[3]
63
132
  - pattern: \u0902(?=[कखगघङ])
64
133
  result: ṅ