interscript 0.1.7 → 0.1.9
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/README.adoc +1 -3
- data/aliases.json +1 -0
- data/lib/interscript.rb +8 -3
- data/lib/interscript/fs.rb +27 -0
- data/lib/interscript/mapping.rb +3 -1
- data/lib/interscript/opal.rb +142 -3
- data/lib/interscript/opal/entrypoint.rb +8 -0
- data/lib/interscript/opal/exports.rb +11 -0
- data/lib/interscript/opal/maps.js.erb +2 -4
- data/lib/interscript/version.rb +1 -1
- data/maps/alalc-ara-Arab-Latn-1997.yaml +5 -5
- data/maps/alalc-asm-Deva-Latn-1997.yaml +104 -10
- data/maps/alalc-asm-Deva-Latn-2012.yaml +18 -3
- data/maps/alalc-aze-Arab-Latn-1997.yaml +376 -0
- data/maps/alalc-ben-Beng-Latn-1997.yaml +291 -0
- data/maps/alalc-div-Thaa-Latn-1997.yaml +211 -0
- data/maps/alalc-hin-Deva-Latn-1997.yaml +102 -10
- data/maps/alalc-hin-Deva-Latn-2011.yaml +19 -1
- data/maps/alalc-kan-Kana-Latn-1997.yaml +274 -0
- data/maps/alalc-kan-Kana-Latn-2011.yaml +63 -0
- data/maps/alalc-ori-Orya-Latn-1997.yaml +284 -0
- data/maps/alalc-ori-Orya-Latn-2011.yaml +67 -0
- data/maps/alalc-pra-Deva-Latn-2012.yaml +2 -2
- data/maps/alalc-san-Deva-Latn-2012.yaml +78 -9
- data/maps/alalc-tel-Telu-Latn-1997.yaml +284 -0
- data/maps/alalc-tel-Telu-Latn-2011.yaml +64 -0
- data/maps/az-aze-Cyrl-Latn-1939.yaml +105 -0
- data/maps/az-aze-Cyrl-Latn-1958.yaml +45 -0
- data/maps/bgnpcgn-ara-Arab-Latn-1956.yaml +3 -1
- data/maps/bgnpcgn-aze-Cyrl-Latn-1993.yaml +111 -104
- data/maps/bgnpcgn-bal-Arab-Latn-2008.yaml +329 -0
- data/maps/bgnpcgn-bul-Cyrl-Latn-1952.yaml +1 -1
- data/maps/bgnpcgn-div-Thaa-Latn-1988.yaml +75 -0
- data/maps/bgnpcgn-far-Latn-Latn-1964.yaml +28 -0
- data/maps/bgnpcgn-isl-Latn-Latn-1964.yaml +37 -0
- data/maps/bgnpcgn-kaz-Cyrl-Latn-1979.yaml +247 -0
- data/maps/bgnpcgn-kir-Cyrl-Latn-1979.yaml +218 -0
- data/maps/bgnpcgn-kur-Arab-Latn-2007.yaml +249 -0
- data/maps/bgnpcgn-per-Arab-Latn-1958.yaml +2 -0
- data/maps/bgnpcgn-prs-Arab-Latn-2007.yaml +87 -53
- data/maps/bgnpcgn-pus-Arab-Latn-1968.yaml +377 -0
- data/maps/bgnpcgn-srp-Cyrl-Latn-1962.yaml +73 -0
- data/maps/bgnpcgn-urd-Arab-Latn-2007.yaml +459 -0
- data/maps/{bis-knd-Knda-Latn-13194-1991.yaml → bis-kan-Kana-Latn-13194-1991.yaml} +2 -2
- data/maps/bis-ori-Orya-Latn-13194-1991.yaml +17 -2
- data/maps/iso-ara-Arab-Latn-233-1984.yaml +1 -1
- data/maps/{iso-kan-Knda-Latn-15919-2001.yaml → iso-kan-Kana-Latn-15919-2001.yaml} +1 -1
- data/maps/{mns-mon-Cyrl-Latn-5217-2012.yaml → masm-mon-Cyrl-Latn-5217-2012.yaml} +2 -2
- data/maps/{mns-mon-Latn-Cyrl-5217-2012.yaml → masm-mon-Latn-Cyrl-5217-2012.yaml} +1 -1
- data/maps/mv-div-Thaa-Latn-1987.yaml +200 -0
- data/maps/odni-ara-Arab-Latn-2004.yaml +137 -0
- data/maps/odni-ara-Arab-Latn-2015.yaml +20 -130
- data/maps/odni-bul-Cyrl-Latn-2005.yaml +90 -0
- data/maps/odni-fas-Arab-Latn-2004.yaml +276 -0
- data/maps/odni-hin-Deva-Latn-2004.yaml +182 -0
- data/maps/odni-mkd-Cyrl-Latn-2005.yaml +21 -0
- data/maps/odni-prs-Arab-Latn-2004.yaml +123 -0
- data/maps/{odni-per-Arab-Latn-2015.yaml → odni-prs-Arab-Latn-2015.yaml} +0 -0
- data/maps/odni-srp-Cyrl-Latn-2005.yaml +36 -0
- data/maps/odni-tuk-Cyrl-Latn-2015.yaml +170 -0
- data/maps/odni-ukr-Cyrl-Latn-2015.yaml +4 -0
- data/maps/un-ara-Arab-Latn-2017.yaml +1 -1
- data/maps/un-asm-Beng-Latn-1972.yaml +223 -0
- data/maps/un-guj-Gujr-Latn-1972.yaml +229 -0
- data/maps/un-hin-Deva-Latn-2016.yaml +104 -10
- data/maps/un-kan-Kana-Latn-2016.yaml +254 -0
- data/maps/un-mal-Mlym-Latn-1972.yaml +251 -0
- data/maps/un-mar-Deva-Latn-2016.yaml +24 -13
- data/maps/un-nep-Deva-Latn-1972.yaml +40 -121
- data/maps/un-ori-Orya-Latn-1972.yaml +247 -0
- data/maps/un-pan-Guru-Latn-1972.yaml +402 -0
- data/maps/un-prs-Arab-Latn-1967.yaml +236 -0
- data/maps/un-tam-Taml-Latn-1972.yaml +194 -0
- data/maps/un-tel-Telu-Latn-1972.yaml +270 -0
- data/maps/un-urd-Arab-Latn-1972.yaml +405 -0
- data/maps/var-amh-Ethi-Latn-eae-2003.yaml +466 -0
- data/maps/var-gez-Ethi-Latn-eae-2003.yaml +76 -0
- data/spec/interscript/filenames_spec.rb +6 -369
- data/spec/interscript_spec.rb +10 -2
- metadata +50 -7
- data/lib/interscript/opal/map_translate.rb +0 -7
|
@@ -0,0 +1,63 @@
|
|
|
1
|
+
---
|
|
2
|
+
authority_id: alalc
|
|
3
|
+
id: 2011
|
|
4
|
+
language: iso-639-2:kan
|
|
5
|
+
source_script: Kana
|
|
6
|
+
destination_script: Latn
|
|
7
|
+
name: Kannada Romanization, 2011
|
|
8
|
+
url: http://catdir.loc.gov/catdir/cpso/romanization/kannada.pdf
|
|
9
|
+
creation_date: 2011
|
|
10
|
+
description: |
|
|
11
|
+
ALA-LC Romanization table for Kannada
|
|
12
|
+
|
|
13
|
+
notes:
|
|
14
|
+
|
|
15
|
+
- Only the vowel forms that appear at the beginning of a syllable are listed; the forms used for
|
|
16
|
+
vowels following a consonant can be found in grammars; no distinction between the two is
|
|
17
|
+
made in transliteration.
|
|
18
|
+
|
|
19
|
+
- |
|
|
20
|
+
The vowel a is implicit after all consonants and consonant clusters and is supplied in
|
|
21
|
+
transliteration, with the following exceptions:
|
|
22
|
+
|
|
23
|
+
a) when another vowel is indicated by its appropriate sign; and
|
|
24
|
+
b) when the absence of any vowel is indicated by the superscript sign (◌್).
|
|
25
|
+
|
|
26
|
+
- |
|
|
27
|
+
Exception: Anusvāra is transliterated by:
|
|
28
|
+
|
|
29
|
+
a) ṅ before gutturals,
|
|
30
|
+
b) ñ before palatals,
|
|
31
|
+
c) ṇ before cerebrals,
|
|
32
|
+
d) n before dentals, and
|
|
33
|
+
e) m before labials.
|
|
34
|
+
|
|
35
|
+
|
|
36
|
+
tests:
|
|
37
|
+
- source: "ಕರ್ಣಾಟಕ"
|
|
38
|
+
expected: "karṇāṭaka"
|
|
39
|
+
- source: "ಬೆಂಗಳೂರು"
|
|
40
|
+
expected: "beṅgaḷūru"
|
|
41
|
+
- source: "ಭಾರತದಲ್ಲಿ ಗಾಳಿ ಕಲುಷಿತವಾಗಿದೆ: ಹವಾಮಾನ ಬದಲಾವಣೆ ಸಮರ್ಥನೆಗೆ ಭಾರತವನ್ನು ಟೀಕಿಸಿದ ಟ್ರಂಪ್"
|
|
42
|
+
expected: "bhāratadalli gāḷi kaluṣitavāgide: havāmāna badalāvaṇe samarthanege bhāratavannu ṭīkisida ṭraṃp"
|
|
43
|
+
- source: "ಅಮೆರಿಕ ಅಧ್ಯಕ್ಷೀಯ ಚುನಾವಣೆ ಅಂತಿಮ ಚರ್ಚೆ: ಭಾರತದ ವಿರುದ್ಧ ಟ್ರಂಪ್ ಆರೋಪವೇನು?!"
|
|
44
|
+
expected: "amerika adhyakṣīya cunāvaṇe aṃtima carce: bhāratada viruddha ṭraṃp ārōpavēnu?!"
|
|
45
|
+
- source: "ಹೇಗಿದೆ ಅಮೆರಿಕನ್ ಚುನಾವಣ ಕಣ?"
|
|
46
|
+
expected: "hēgide amerikan cunāvaṇa kaṇa?"
|
|
47
|
+
- source: "ಫ್ರೀಜರ್ ನಲ್ಲಿಟ್ಟ ನೂಡಲ್ಸ್ ತಿಂದು ಒಂದೇ ಕುಟುಂಬದ ೯ ಮಂದಿ ಸಾವು: ೩ ಮಕ್ಕಳು ಅಪಾಯದಿಂದ ಪಾರು"
|
|
48
|
+
expected: "phrījar nalliṭṭa nūḍals tiṃdu oṃdē kuṭuṃbada 9 maṃdi sāvu: 3 makkaḷu apāyadinda pāru"
|
|
49
|
+
- source: "ಉಡುಪಿಯಲ್ಲಿ ಪ್ರಪ್ರಥಮ ಬಾರಿಗೆ ಪ್ರಾರಂಭವಾಗಿರುವ ದೇಶಿ ಉತ್ಪನ್ನಗಳ ಮಳಿಗೆ"
|
|
50
|
+
expected: "uḍupiyalli praprathama bārige prāraṃbhavāgiruva dēśi utpannagaḷa maḷige"
|
|
51
|
+
- source: "ಚಿಕ್ಕಮಗಳೂರು : ಪುಷ್ಪ ಸಮರ್ಪಣೆ ವೇಳೆ ಮಗಳನ್ನ ನೆನೆದು ಕಣ್ಣೀರಿಟ್ಟ ಮೃತ ಪೇದೆ ತಾಯಿ"
|
|
52
|
+
expected: "cikkamagaḷūru : puṣpa samarpaṇe vēḷe magaḷanna nenedu kaṇṇīriṭṭa mṛta pēde tāyi"
|
|
53
|
+
- source: "ಸಮಂಗಳೂರು: ಡ್ರಗ್ಸ್ ಜಾಗೃತಿ ಬರಹದಿಂದ ಗಮನಸೆಳೆಯುತ್ತಿದೆ ಸಿಟಿ ಬಸ್"
|
|
54
|
+
expected: "samaṅgaḷūru: ḍrags jāgṛti barahadinda gamanaseḷeyuttide siṭi bas"
|
|
55
|
+
- source: "ಪುರಸಭೆ, ಪಪಂ ಅಧ್ಯಕ್ಷ-ಉಪಾಧ್ಯಕ್ಷ ಚುನಾವಣೆಗೆ ಹೈಕೋರ್ಟ್ ಅಸ್ತು"
|
|
56
|
+
expected: "purasabhe, papaṃ adhyakṣa-upādhyakṣa cunāvaṇege haikōrṭ astu"
|
|
57
|
+
- source: "ಅಮೆರಿಕ ಅಧ್ಯಕ್ಷೀಯ ಚುನಾವಣೆ ಅಂತಿಮ ಚರ್ಚೆ: ಭಾರತದ ವಿರುದ್ಧ ಟ್ರಂಪ್ ಆರೋಪವೇನು?"
|
|
58
|
+
expected: "amerika adhyakṣīya cunāvaṇe aṃtima carce: bhāratada viruddha ṭraṃp ārōpavēnu?"
|
|
59
|
+
- source: "ಮನೆ ಕುಸಿದು ತಂದೆ ಮತ್ತು ಮಗ ಸಾವು, ಇನ್ನಿಬ್ಬರಿಗೆ ಗಾಯ: ಸ್ಥಳಕ್ಕೆ ಶಾಸಕರ ಭೇಟಿ"
|
|
60
|
+
expected: "mane kusidu taṃde mattu maga sāvu, innibbarige gāya: sthaḷakke śāsakara bhēṭi"
|
|
61
|
+
|
|
62
|
+
map:
|
|
63
|
+
inherit: 'alalc-kan-Kana-Latn-1997'
|
|
@@ -0,0 +1,284 @@
|
|
|
1
|
+
---
|
|
2
|
+
authority_id: alalc
|
|
3
|
+
id: 1997
|
|
4
|
+
language: iso-639-2:ori
|
|
5
|
+
source_script: Orya
|
|
6
|
+
destination_script: Latn
|
|
7
|
+
name: Oriya Romanization, 1997
|
|
8
|
+
alias:
|
|
9
|
+
ogc11122:
|
|
10
|
+
code: ori_Orya2Latn_ALA_1997
|
|
11
|
+
description: Oriya ALA-Library of Congress 1997 System
|
|
12
|
+
url: http://catdir.loc.gov/catdir/cpso/romanization/oriya.pdf
|
|
13
|
+
creation_date: 1997
|
|
14
|
+
description: |
|
|
15
|
+
ALA-LC Romanization table for Oriya
|
|
16
|
+
|
|
17
|
+
notes:
|
|
18
|
+
- |
|
|
19
|
+
Only the vowel forms that appear at the beginning of a syllable are listed; the forms used for vowels following a
|
|
20
|
+
consonant can be found in grammars; no distinction between the two is made in transliteration.
|
|
21
|
+
- |
|
|
22
|
+
The vowel a is implicit after all consonants and consonant clusters and is supplied in
|
|
23
|
+
transliteration, with the following exceptions:
|
|
24
|
+
a) when another vowel is indicated by its appropriate sign; and
|
|
25
|
+
b) when the absence of any vowel is indicated by the subscript sign ( ୍ ) called hasanta.
|
|
26
|
+
- |
|
|
27
|
+
ବ is used both as a labial and as a semivowel. When it occurs as the second consonant of a
|
|
28
|
+
consonant cluster, it is transliterated va. When ବ is doubled, it is transliterated bba.
|
|
29
|
+
- |
|
|
30
|
+
Exception: Anusvāra is transliterated by:
|
|
31
|
+
a) ṅ before gutturals,
|
|
32
|
+
b) ñ before palatals,
|
|
33
|
+
c) ṇ before cerebrals,
|
|
34
|
+
d) n before dentals, and
|
|
35
|
+
e) m before labials.
|
|
36
|
+
- |
|
|
37
|
+
Candrabindu before guttural, palatal, cerebral, and dental occlusives is transliterated n̐.
|
|
38
|
+
Before labials, sibilants, semivowels, the aspirate, vowels, and in final position it is
|
|
39
|
+
transliterated m̐.
|
|
40
|
+
- When doubled, abagraha is transliterated by two apostrophes ( ’’ ).
|
|
41
|
+
tests:
|
|
42
|
+
- source: "ର୍କ"
|
|
43
|
+
expected: "rka"
|
|
44
|
+
- source: "ଓଡ଼ିଆ"
|
|
45
|
+
expected: "oṙiā"
|
|
46
|
+
- source: "ଓଡ଼ିଶା"
|
|
47
|
+
expected: "oṙiśā"
|
|
48
|
+
- source: "ଭୁବନେଶ୍ୱର"
|
|
49
|
+
expected: "bhubaneśwara"
|
|
50
|
+
- source: "ଆଇପିଏଲ୍-୧୩: ରୟାଲ ଚ୍ୟାଲେଞ୍ଜର୍ସ ବାଙ୍ଗାଲୋରକୁ ୫ ଓ୍ୱିକେଟରେ ପରାସ୍ତ କଲା ମୁମ୍ବାଇ ଇଣ୍ଡିଆନ୍ସ"
|
|
51
|
+
expected: "āipiel-13: raẏāla cẏāleñjarsa bāṅgāloraku 5 obikeṭare parāsta kalā mumbāi iṇḍiānsa"
|
|
52
|
+
- source: "ଓଡ଼ିଶା ସିଭିଲ ସର୍ଭିସେସ୍ ମେନ୍ ପରୀକ୍ଷା ଡିସେମ୍ବରରେ, ଜାଣନ୍ତୁ କେଉଁ ବିଷୟର ପରୀକ୍ଷା କେବେ"
|
|
53
|
+
expected: "oṙiśā sibhila sarbhises men parīkshā ḍisembarare, jāṇantu keum̐ bishaẏara parīkshā kebe"
|
|
54
|
+
- source: "ଗଞ୍ଜାମରେ କୋଭିଡ଼ ମୃତ୍ୟୁ ୨୨୮ରେ ପହଞ୍ଚିଲା"
|
|
55
|
+
expected: "gañjāmare keābhiṙa mṛtẏu 228re pahañcilā"
|
|
56
|
+
- source: "ଭାରତ ମହାସାଗର ଦ୍ବୀପରାଷ୍ଟ୍ର ଶ୍ରୀଲଙ୍କା ଓ ମାଳଦ୍ବୀପରେ ପମ୍ପିଓଙ୍କ ଚୀନ୍ବିରୋଧୀ ଅଭିଯାନ"
|
|
57
|
+
expected: "bhārata mahāsāgara dbīparāshṭra śrīlaṅkā o māḷadbīpare pampioṅka cīnbireādhī abhiyāna"
|
|
58
|
+
- source: "କଟକ ସହରରୁ ଆଜି ୩୯ କରୋନା ପଜିଟିଭ୍ ଚିହ୍ନଟ, ସ୍ଥାନୀୟ ଅଂଚଳରୁ ୨୪ ଜଣ ଆକ୍ରାନ୍ତ"
|
|
59
|
+
expected: "kaṭaka sahararu āji 39 karonā pajiṭibh cihnaṭa, sthānīẏa aṃcaḷaru 24 jaṇa ākrānta"
|
|
60
|
+
- source: "ବିଧାୟକ ସୌମ୍ୟରଂଜନଙ୍କ ମାରାଥନ ପ୍ରଚାର: ‘ଦ୍ୱିତୀୟବାର ସୁଯୋଗ ମିଳିଛି, ବୁଝି ବିଚାରି ଭୋଟ ଦିଅ’"
|
|
61
|
+
expected: "bidhāẏaka seୗmẏaraṃjanaṅka mārāthana pracāra: ‘dbitīẏabāra suyeāga miḷichi, bujhi bicāri bheāṭa dia’"
|
|
62
|
+
- source: "ଅଣ୍ଡା ବିଗାଡ଼ିଛି ପୁଷ୍ଟିକର ଖାଦ୍ୟ ଯୋଜନା ଅଙ୍କ"
|
|
63
|
+
expected: "aṇḍā bigāṙichi pushṭikara khādẏa yeājanā aṅka"
|
|
64
|
+
- source: "ପଥରଗଡ଼ ମଦ ମୃତ୍ୟୁ ମାମଲା : ଠିକାଦାର ସହ ବନ୍ଧାହେଲେ ୪"
|
|
65
|
+
expected: "patharagaḍa mada mṛtẏu māmalā : ṭhikādāra saha bandhāhele 4"
|
|
66
|
+
- source: "ତିର୍ତ୍ତୋଲର ବିକାଶ ନେଇ ବିଷ୍ଣୁବାବୁ ମୋତେ ବହୁ ବାର ଭେଟୁଥିଲେ: ନବୀନ"
|
|
67
|
+
expected: "tirtteālara bikāśa nei bishṇubābu mote bahu bāra bheṭuthile: nabīna"
|
|
68
|
+
|
|
69
|
+
|
|
70
|
+
map:
|
|
71
|
+
|
|
72
|
+
rules:
|
|
73
|
+
# Rule II
|
|
74
|
+
- pattern: ([କ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
|
75
|
+
result: 'k'
|
|
76
|
+
- pattern: ([ଖ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
|
77
|
+
result: 'kh'
|
|
78
|
+
- pattern: ([ଗ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
|
79
|
+
result: 'g'
|
|
80
|
+
- pattern: ([ଘ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
|
81
|
+
result: 'gh'
|
|
82
|
+
- pattern: ([ଙ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
|
83
|
+
result: 'ṅ'
|
|
84
|
+
- pattern: ([ଚ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
|
85
|
+
result: 'c'
|
|
86
|
+
- pattern: ([ଛ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
|
87
|
+
result: 'ch'
|
|
88
|
+
- pattern: ([ଜ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
|
89
|
+
result: 'j'
|
|
90
|
+
- pattern: ([ଝ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
|
91
|
+
result: 'jh'
|
|
92
|
+
- pattern: ([ଞ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
|
93
|
+
result: 'ñ'
|
|
94
|
+
- pattern: ([ଟ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
|
95
|
+
result: 'ṭ'
|
|
96
|
+
- pattern: ([ଠ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
|
97
|
+
result: 'ṭh'
|
|
98
|
+
- pattern: ([ଡ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
|
99
|
+
result: 'ḍ'
|
|
100
|
+
- pattern: ([ଢ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
|
101
|
+
result: 'ḍh'
|
|
102
|
+
- pattern: ([ଣ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
|
103
|
+
result: 'ṇ'
|
|
104
|
+
- pattern: ([ତ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
|
105
|
+
result: 't'
|
|
106
|
+
- pattern: ([ଥ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
|
107
|
+
result: 'th'
|
|
108
|
+
- pattern: ([ଦ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
|
109
|
+
result: 'd'
|
|
110
|
+
- pattern: ([ଧ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
|
111
|
+
result: 'dh'
|
|
112
|
+
- pattern: ([ନ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
|
113
|
+
result: 'n'
|
|
114
|
+
- pattern: ([ପ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
|
115
|
+
result: 'p'
|
|
116
|
+
- pattern: ([ଫ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
|
117
|
+
result: 'ph'
|
|
118
|
+
- pattern: ([ବ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
|
119
|
+
result: 'b'
|
|
120
|
+
- pattern: ([ଭ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
|
121
|
+
result: 'bh'
|
|
122
|
+
- pattern: ([ମ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
|
123
|
+
result: 'm'
|
|
124
|
+
- pattern: ([ଯ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
|
125
|
+
result: 'y'
|
|
126
|
+
- pattern: ([ୟ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
|
127
|
+
result: 'ẏ'
|
|
128
|
+
- pattern: ([ର]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
|
129
|
+
result: 'r'
|
|
130
|
+
- pattern: ([ଲ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
|
131
|
+
result: 'l'
|
|
132
|
+
- pattern: ([ଳ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
|
133
|
+
result: 'ḷ'
|
|
134
|
+
- pattern: ([ଶ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
|
135
|
+
result: 'ś'
|
|
136
|
+
- pattern: ([ଷ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
|
137
|
+
result: 'sh'
|
|
138
|
+
- pattern: ([ସ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
|
139
|
+
result: 's'
|
|
140
|
+
- pattern: ([ହ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
|
141
|
+
result: 'h'
|
|
142
|
+
- pattern: ([ୱ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
|
143
|
+
result: 'b'
|
|
144
|
+
- pattern: ([ଡ଼]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
|
145
|
+
result: 'ṙ'
|
|
146
|
+
- pattern: ([ଢ଼]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
|
147
|
+
result: 'ṙh'
|
|
148
|
+
|
|
149
|
+
# Rule III
|
|
150
|
+
- pattern: ([ବ]=?)(?=[\u0b2c])
|
|
151
|
+
result: 'bba'
|
|
152
|
+
# Rule IV
|
|
153
|
+
- pattern: \u0902(?=[କଖଗଘଙ])
|
|
154
|
+
result: ṅ
|
|
155
|
+
- pattern: \u0902(?=[ଚଛଜଝଞ])
|
|
156
|
+
result: ñ
|
|
157
|
+
- pattern: \u0902(?=[ଟଠଡଢଣ])
|
|
158
|
+
result: ṇ
|
|
159
|
+
- pattern: \u0902(?=[ତଥଦଧନ])
|
|
160
|
+
result: n
|
|
161
|
+
# Rule V
|
|
162
|
+
- pattern: \u0b01(?=[ପଫବଭମଯୟରଲଳଶଷସହଅଆଇଈଉଊଋୠଌଏଐଓଔ])
|
|
163
|
+
result: "m̐"
|
|
164
|
+
- pattern: (?<=)\u0b01(?=\b)
|
|
165
|
+
result: "m̐"
|
|
166
|
+
|
|
167
|
+
characters:
|
|
168
|
+
'ଅ': 'a'
|
|
169
|
+
'ଆ': 'ā'
|
|
170
|
+
'ଇ': 'i'
|
|
171
|
+
'ଈ': 'ī'
|
|
172
|
+
'ଉ': 'u'
|
|
173
|
+
'ଊ': 'ū'
|
|
174
|
+
'ଋ': 'ṛ'
|
|
175
|
+
'ୠ': 'ṝ'
|
|
176
|
+
'ଌ': 'ḻ'
|
|
177
|
+
'ଏ': 'e'
|
|
178
|
+
'ଐ': 'ai'
|
|
179
|
+
'ଓ': 'o'
|
|
180
|
+
'ଔ': 'au'
|
|
181
|
+
|
|
182
|
+
# II. Consonants (see Note 2)
|
|
183
|
+
# Gutturals
|
|
184
|
+
'କ': 'ka'
|
|
185
|
+
'ଖ': 'kha'
|
|
186
|
+
'ଗ': 'ga'
|
|
187
|
+
'ଘ': 'gha'
|
|
188
|
+
'ଙ': 'ṅa'
|
|
189
|
+
|
|
190
|
+
# Palatals
|
|
191
|
+
'ଚ': 'ca'
|
|
192
|
+
'ଛ': 'cha'
|
|
193
|
+
'ଜ': 'ja'
|
|
194
|
+
'ଝ': 'jha'
|
|
195
|
+
'ଞ': 'ña'
|
|
196
|
+
|
|
197
|
+
# Cerebrals
|
|
198
|
+
'ଟ': 'ṭa'
|
|
199
|
+
'ଠ': 'ṭha'
|
|
200
|
+
'ଡ': 'ḍa'
|
|
201
|
+
'ଢ': 'ḍha'
|
|
202
|
+
'ଣ': 'ṇa'
|
|
203
|
+
|
|
204
|
+
# Dentals
|
|
205
|
+
'ତ': 'ta'
|
|
206
|
+
'ଥ': 'tha'
|
|
207
|
+
'ଦ': 'da'
|
|
208
|
+
'ଧ': 'dha'
|
|
209
|
+
'ନ': 'na'
|
|
210
|
+
|
|
211
|
+
# Labials
|
|
212
|
+
'ପ': 'pa'
|
|
213
|
+
'ଫ': 'pha'
|
|
214
|
+
'ବ': 'ba'
|
|
215
|
+
'ଭ': 'bha'
|
|
216
|
+
'ମ': 'ma'
|
|
217
|
+
|
|
218
|
+
# Semivowels
|
|
219
|
+
'ଯ': 'ya'
|
|
220
|
+
'ୟ': 'ẏa'
|
|
221
|
+
'ର': 'ra'
|
|
222
|
+
'ଲ': 'la'
|
|
223
|
+
'ଳ': 'ḷa'
|
|
224
|
+
|
|
225
|
+
# Sibilants
|
|
226
|
+
'ଶ': 'śa'
|
|
227
|
+
'ଷ': 'sha'
|
|
228
|
+
'ସ': 'sa'
|
|
229
|
+
|
|
230
|
+
|
|
231
|
+
# Aspirate
|
|
232
|
+
'ହ': 'ha'
|
|
233
|
+
|
|
234
|
+
# Chandrabindu
|
|
235
|
+
'ଁ': 'n̐'
|
|
236
|
+
|
|
237
|
+
# Bisarga
|
|
238
|
+
'ଃ': 'ḥ'
|
|
239
|
+
|
|
240
|
+
# Anusvāra
|
|
241
|
+
'ଂ': 'ṃ'
|
|
242
|
+
|
|
243
|
+
# Abagraha
|
|
244
|
+
'ଽ': "’"
|
|
245
|
+
|
|
246
|
+
# Medials # Needed for connecting consonants
|
|
247
|
+
|
|
248
|
+
'ା': 'ā'
|
|
249
|
+
'ି': 'i'
|
|
250
|
+
'ୀ': 'ī'
|
|
251
|
+
'ୁ': 'u'
|
|
252
|
+
'ୂ': 'ū'
|
|
253
|
+
'ୃ': 'ṛ'
|
|
254
|
+
'େ': 'e'
|
|
255
|
+
'ୈ': 'ai'
|
|
256
|
+
'ୋ': 'o'
|
|
257
|
+
'ୌ': 'au'
|
|
258
|
+
|
|
259
|
+
'्': ''
|
|
260
|
+
'୍': ''
|
|
261
|
+
'़': ''
|
|
262
|
+
'଼': ''
|
|
263
|
+
'।': '.'
|
|
264
|
+
"": ''# Used for joining
|
|
265
|
+
"": ''# Used for non joining
|
|
266
|
+
|
|
267
|
+
#Absent but used
|
|
268
|
+
'ୱ': 'wa'
|
|
269
|
+
'ଡ଼': 'ṙa'
|
|
270
|
+
'ଢ଼': 'ṙha'
|
|
271
|
+
|
|
272
|
+
# Numbers
|
|
273
|
+
|
|
274
|
+
'୦': '0'
|
|
275
|
+
'୧': '1'
|
|
276
|
+
'୨': '2'
|
|
277
|
+
'୩': '3'
|
|
278
|
+
'୪': '4'
|
|
279
|
+
'୫': '5'
|
|
280
|
+
'୬': '6'
|
|
281
|
+
'୭': '7'
|
|
282
|
+
'୮': '8'
|
|
283
|
+
'୯': '9'
|
|
284
|
+
|
|
@@ -0,0 +1,67 @@
|
|
|
1
|
+
---
|
|
2
|
+
authority_id: alalc
|
|
3
|
+
id: 2011
|
|
4
|
+
language: iso-639-2:ori
|
|
5
|
+
source_script: Orya
|
|
6
|
+
destination_script: Latn
|
|
7
|
+
name: Oriya Romanization, 2011
|
|
8
|
+
alias:
|
|
9
|
+
ogc11122:
|
|
10
|
+
code: ori_Orya2Latn_ALA_2011
|
|
11
|
+
description: Oriya ALA-Library of Congress 2011 System
|
|
12
|
+
url: https://www.loc.gov/catdir/cpso/romanization/oriya.pdf
|
|
13
|
+
creation_date: 2011
|
|
14
|
+
description: |
|
|
15
|
+
ALA-LC Romanization table for Oriya
|
|
16
|
+
|
|
17
|
+
notes:
|
|
18
|
+
- |
|
|
19
|
+
Only the vowel forms that appear at the beginning of a syllable are listed; the forms used for vowels following a
|
|
20
|
+
consonant can be found in grammars; no distinction between the two is made in transliteration.
|
|
21
|
+
- |
|
|
22
|
+
The vowel a is implicit after all consonants and consonant clusters and is supplied in
|
|
23
|
+
transliteration, with the following exceptions:
|
|
24
|
+
a) when another vowel is indicated by its appropriate sign; and
|
|
25
|
+
b) when the absence of any vowel is indicated by the subscript sign ( ୍ ) called hasanta.
|
|
26
|
+
- |
|
|
27
|
+
ବ is used both as a labial and as a semivowel. When it occurs as the second consonant of a
|
|
28
|
+
consonant cluster, it is transliterated va. When ବ is doubled, it is transliterated bba.
|
|
29
|
+
- |
|
|
30
|
+
Exception: Anusvāra is transliterated by:
|
|
31
|
+
a) ṅ before gutturals,
|
|
32
|
+
b) ñ before palatals,
|
|
33
|
+
c) ṇ before cerebrals,
|
|
34
|
+
d) n before dentals, and
|
|
35
|
+
e) m before labials.
|
|
36
|
+
- |
|
|
37
|
+
Candrabindu before guttural, palatal, cerebral, and dental occlusives is transliterated n̐.
|
|
38
|
+
Before labials, sibilants, semivowels, the aspirate, vowels, and in final position it is
|
|
39
|
+
transliterated m̐.
|
|
40
|
+
- When doubled, abagraha is transliterated by two apostrophes ( ’’ ).
|
|
41
|
+
tests:
|
|
42
|
+
- source: "ବିହାର ନିର୍ବାଚନ: ସନ୍ଧ୍ୟା ୬ଟା ସୁଦ୍ଧା ୫୩.୫୪ ପ୍ରତିଶତ ମତଦାନ"
|
|
43
|
+
expected: "bihāra nirbācana: sandhẏā 6ṭā suddhā 53.54 pratiśata matadāna"
|
|
44
|
+
- source: "ଡିସେମ୍ବର ସୁଦ୍ଧା ପ୍ରସ୍ତୁତ ହୋଇଯିବ ଅକ୍ସଫୋର୍ଡ କରୋନାଭାଇରସ୍ ଟିକା: ଅଦର ପୁନାୱାଲା"
|
|
45
|
+
expected: "ḍisembara suddhā prastuta heāiyiba aksapheārḍa kareānābhāiras ṭikā: adara punābālā"
|
|
46
|
+
- source: "କରୋନା ଆକ୍ରାନ୍ତ ହେଲେ କେନ୍ଦ୍ରମନ୍ତ୍ରୀ ସ୍ମୃତି ଇରାନୀ"
|
|
47
|
+
expected: "karonā ākrānta hele kendramantrī smṛti irānī"
|
|
48
|
+
- source: "ଆମେରିକା ଉପରେ ଉତ୍କ୍ଷିପ୍ତ ହୋଇ ଚୀନ୍ କହିଲା: ଭାରତ ସହ ଆମର ସୀମା ବିବାଦ ଦ୍ବିପାକ୍ଷିକ ମାମଲା"
|
|
49
|
+
expected: "āmerikā upare utkshipta heāi cīn kahilā: bhārata saha āmara sīmā bibāda dbipākshika māmalā"
|
|
50
|
+
- source: "ପରଲୋକରେ ଦକ୍ଷିଣ କୋରିଆର ସବୁଠୁ ଧନୀବ୍ୟକ୍ତି ‘ସାମ୍ସଙ୍ଗ୍’ ଅଧ୍ୟକ୍ଷ ଲି କୁନ୍-ହି; ଛାଡ଼ିଯାଇଛନ୍ତି ୨୧ ବିଲିୟନ୍ ଡଲାର୍ର ସାମ୍ରାଜ୍ୟ"
|
|
51
|
+
expected: "paraleākare dakshiṇa keāriāra sabuṭhu dhanībẏakti ‘sāmsaṅg’ adhẏaksha li kun-hi; chāṙiyāichanti 21 biliẏan ḍalārra sāmrājẏa"
|
|
52
|
+
- source: "ଉପନିର୍ବାଚନ ପାଇଁ ବାଲେଶ୍ୱରରେ ବିଜେଡିର ସମାବେଶ। (ଫଟୋ: ମନୋଜ ବିଶ୍ୱାଳ)"
|
|
53
|
+
expected: "upanirbācana pāim̐ bāleśwarare bijeḍira samābeśa. (phaṭo: manoja biśbāḷa)"
|
|
54
|
+
- source: "ନୂଆପଲ୍ଲୀ ଦୁର୍ଗାପୂଜା ମଣ୍ଡପ ବାହାରେ ମା’ଙ୍କୁ ପୂଜାର୍ଚ୍ଚନା କରୁଛନ୍ତି ଭକ୍ତ। (ଫଟୋ: ବିଭୂତି)"
|
|
55
|
+
expected: "nūāpallī durgāpūjā maṇḍapa bāhāre mā’ṅku pūjārccanā karuchanti bhakta. (phaṭo: bibhūti)"
|
|
56
|
+
- source: "ମା ଶାରଳାଙ୍କ ପୀଠରେ ଦଶମୀ ପୂଜା। (ଫଟୋ: ସୋମନାଥ, ଜଗତସିଂହପୁର ଟାଉନ୍)"
|
|
57
|
+
expected: "mā śāraḷāṅka pīṭhare daśamī pūjā. (phaṭo: somanātha, jagatasiṃhapura ṭāun)"
|
|
58
|
+
- source: "ଆଜି ବିହାରରେ ପ୍ରଥମ ପର୍ଯ୍ୟାୟ ଭୋଟ, ମହାମେଣ୍ଟ-ଏନ୍ଡିଏ କଡ଼ା ଟକ୍କର"
|
|
59
|
+
expected: "āji bihārare prathama paryẏāẏa bheāṭa, mahāmeṇṭa-enḍie kaṙā ṭakkara"
|
|
60
|
+
- source: "ନିର୍ବାଚନ ପ୍ରଚାରରୁ ଫେରି ନିଜ ଅଭିଜ୍ଞତା ବଖାଣି ଅମିଷା କହିଲେ, ‘କୌଣସି ପରିସ୍ଥିତିରେ ମୋର ସହିତ ଦୁଷ୍କର୍ମ ହେବାର ଆଶଙ୍କା ରହିଥିଲା’"
|
|
61
|
+
expected: "nirbācana pracāraru pheri nija abhijñatā bakhāṇi amishā kahile, ‘keୗṇasi paristhitire meāra sahita dushkarma hebāra āśaṅkā rahithilā’"
|
|
62
|
+
- source: "ବ୍ଲୁ ଫ୍ଲାଗ ବିଚ୍ରେ ଅଘଟଣ: ମା’ ଆଗରେ ସମୁଦ୍ରରେ ଭାସିଗଲେ ପୁଅ, ଖୋଜିବା ପାଇଁ ଲାଇଫଗାର୍ଡ ଟିମ୍ ନିୟୋଜିତ"
|
|
63
|
+
expected: "blu phlāga bicre aghaṭaṇa: mā’ āgare samudrare bhāsigale pua, kheājibā pāim̐ lāiphagārḍa ṭim niẏeājita"
|
|
64
|
+
|
|
65
|
+
map:
|
|
66
|
+
|
|
67
|
+
inherit: alalc-ori-Orya-Latn-1997
|
|
@@ -38,9 +38,9 @@ notes:
|
|
|
38
38
|
|
|
39
39
|
tests:
|
|
40
40
|
- source: "सृष्टिस्थितिविनाशानां शक्तिभूते सनातनि"
|
|
41
|
-
expected: "
|
|
41
|
+
expected: "sṛṣṭisthitivināśānāṃ śaktibhūte sanātani"
|
|
42
42
|
- source: "गुणाश्रये गुणमये नारायणि नमोऽस्तु ते"
|
|
43
|
-
expected: "
|
|
43
|
+
expected: "guṇāśraye guṇamaye nārāyaṇi namo’stu te"
|
|
44
44
|
|
|
45
45
|
map:
|
|
46
46
|
|
|
@@ -38,27 +38,96 @@ notes:
|
|
|
38
38
|
|
|
39
39
|
tests:
|
|
40
40
|
- source: "पूर्णमदः पूर्णमिदं पूर्णात् पूर्ण्मुदच्यते"
|
|
41
|
-
expected: "
|
|
41
|
+
expected: "pūrṇamadaḥ pūrṇamidaṃ pūrṇāt pūrṇmudacyate"
|
|
42
42
|
- source: "पूर्णस्य पूर्णमादाय पूर्णमेवावशिष्यते"
|
|
43
|
-
expected: "
|
|
43
|
+
expected: "pūrṇasya pūrṇamādāya pūrṇamevāvaśiṣyate"
|
|
44
44
|
- source: "यथा चतुर्भिः कनकं परीक्ष्यते निर्घषणच्छेदन तापताडनैः"
|
|
45
|
-
expected: "
|
|
45
|
+
expected: "yathā caturbhiḥ kanakaṃ parīkṣyate nirghaṣaṇacchedana tāpatāḍanaiḥ"
|
|
46
46
|
- source: "तथा चतुर्भिः पुरुषः परीक्ष्यते त्यागेन शीलेन गुणेन कर्मणा"
|
|
47
|
-
expected: "
|
|
47
|
+
expected: "tathā caturbhiḥ puruṣaḥ parīkṣyate tyāgena śīlena guṇena karmaṇā"
|
|
48
48
|
- source: "यो न हृष्यति न द्वेष्टि न शोचति न काङ्क्षति"
|
|
49
|
-
expected: "
|
|
49
|
+
expected: "yo na hṛṣyati na dveṣṭi na śocati na kāṅkṣati"
|
|
50
50
|
- source: "शुभाशुभपरित्यागी भक्तिमान्यः स मे प्रियः"
|
|
51
|
-
expected: "
|
|
51
|
+
expected: "śubhāśubhaparityāgī bhaktimānyaḥ sa me priyaḥ"
|
|
52
52
|
- source: "सत्य -सत्यमेवेश्वरो लोके सत्ये धर्मः सदाश्रितः"
|
|
53
|
-
expected: "
|
|
53
|
+
expected: "satya -satyameveśvaro loke satye dharmaḥ sadāśritaḥ"
|
|
54
54
|
- source: "सत्यमूलनि सर्वाणि सत्यान्नास्ति परं पदम्"
|
|
55
|
-
expected: "
|
|
55
|
+
expected: "satyamūlani sarvāṇi satyānnāsti paraṃ padam"
|
|
56
56
|
- source: "पिता माताग्निरात्मा च गुरुश्च भरतर्षभ"
|
|
57
|
-
expected: "
|
|
57
|
+
expected: "pitā mātāgnirātmā ca guruśca bharatarṣabha"
|
|
58
58
|
|
|
59
59
|
map:
|
|
60
60
|
|
|
61
61
|
rules:
|
|
62
|
+
# note [2]
|
|
63
|
+
- pattern: (क=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
|
|
64
|
+
result: 'k'
|
|
65
|
+
- pattern: (ख=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
|
|
66
|
+
result: 'kh'
|
|
67
|
+
- pattern: (ग=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
|
|
68
|
+
result: 'g'
|
|
69
|
+
- pattern: (घ=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
|
|
70
|
+
result: 'gh'
|
|
71
|
+
- pattern: (ङ=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
|
|
72
|
+
result: 'ṅ'
|
|
73
|
+
- pattern: (च=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
|
|
74
|
+
result: 'c'
|
|
75
|
+
- pattern: (छ=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
|
|
76
|
+
result: 'ch'
|
|
77
|
+
- pattern: (ज=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
|
|
78
|
+
result: 'j'
|
|
79
|
+
- pattern: (झ=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
|
|
80
|
+
result: 'jh'
|
|
81
|
+
- pattern: (ञ=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
|
|
82
|
+
result: 'ñ'
|
|
83
|
+
- pattern: (ट=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
|
|
84
|
+
result: 'ṭ'
|
|
85
|
+
- pattern: (ठ=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
|
|
86
|
+
result: 'ṭh'
|
|
87
|
+
- pattern: (ड=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
|
|
88
|
+
result: 'ḍ'
|
|
89
|
+
- pattern: (ढ=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
|
|
90
|
+
result: 'ḍh'
|
|
91
|
+
- pattern: (ण=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
|
|
92
|
+
result: 'ṇ'
|
|
93
|
+
- pattern: (त=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
|
|
94
|
+
result: 't'
|
|
95
|
+
- pattern: (थ=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
|
|
96
|
+
result: 'th'
|
|
97
|
+
- pattern: (द=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
|
|
98
|
+
result: 'd'
|
|
99
|
+
- pattern: (ध=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
|
|
100
|
+
result: 'dh'
|
|
101
|
+
- pattern: (न=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
|
|
102
|
+
result: 'n'
|
|
103
|
+
- pattern: (प=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
|
|
104
|
+
result: 'p'
|
|
105
|
+
- pattern: (फ=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
|
|
106
|
+
result: 'ph'
|
|
107
|
+
- pattern: (ब=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
|
|
108
|
+
result: 'b'
|
|
109
|
+
- pattern: (भ=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
|
|
110
|
+
result: 'bh'
|
|
111
|
+
- pattern: (म=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
|
|
112
|
+
result: 'm'
|
|
113
|
+
- pattern: (य=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
|
|
114
|
+
result: 'y'
|
|
115
|
+
- pattern: (र=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
|
|
116
|
+
result: 'r'
|
|
117
|
+
- pattern: (ल=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
|
|
118
|
+
result: 'l'
|
|
119
|
+
- pattern: (ळ=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
|
|
120
|
+
result: 'ḻ'
|
|
121
|
+
- pattern: (व=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
|
|
122
|
+
result: 'v'
|
|
123
|
+
- pattern: (श=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
|
|
124
|
+
result: 'ś'
|
|
125
|
+
- pattern: (ष=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
|
|
126
|
+
result: 'ṣ'
|
|
127
|
+
- pattern: (स=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
|
|
128
|
+
result: 's'
|
|
129
|
+
- pattern: (ह=?)(?=[\u093e\u093f\u0940\u0941\u0942\u0943\u0944\u0947\u0948\u094b\u094c\u094d])
|
|
130
|
+
result: 'h'
|
|
62
131
|
# note[3]
|
|
63
132
|
- pattern: \u0902(?=[कखगघङ])
|
|
64
133
|
result: ṅ
|