interscript 0.1.7 → 0.1.9
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +4 -4
- data/README.adoc +1 -3
- data/aliases.json +1 -0
- data/lib/interscript.rb +8 -3
- data/lib/interscript/fs.rb +27 -0
- data/lib/interscript/mapping.rb +3 -1
- data/lib/interscript/opal.rb +142 -3
- data/lib/interscript/opal/entrypoint.rb +8 -0
- data/lib/interscript/opal/exports.rb +11 -0
- data/lib/interscript/opal/maps.js.erb +2 -4
- data/lib/interscript/version.rb +1 -1
- data/maps/alalc-ara-Arab-Latn-1997.yaml +5 -5
- data/maps/alalc-asm-Deva-Latn-1997.yaml +104 -10
- data/maps/alalc-asm-Deva-Latn-2012.yaml +18 -3
- data/maps/alalc-aze-Arab-Latn-1997.yaml +376 -0
- data/maps/alalc-ben-Beng-Latn-1997.yaml +291 -0
- data/maps/alalc-div-Thaa-Latn-1997.yaml +211 -0
- data/maps/alalc-hin-Deva-Latn-1997.yaml +102 -10
- data/maps/alalc-hin-Deva-Latn-2011.yaml +19 -1
- data/maps/alalc-kan-Kana-Latn-1997.yaml +274 -0
- data/maps/alalc-kan-Kana-Latn-2011.yaml +63 -0
- data/maps/alalc-ori-Orya-Latn-1997.yaml +284 -0
- data/maps/alalc-ori-Orya-Latn-2011.yaml +67 -0
- data/maps/alalc-pra-Deva-Latn-2012.yaml +2 -2
- data/maps/alalc-san-Deva-Latn-2012.yaml +78 -9
- data/maps/alalc-tel-Telu-Latn-1997.yaml +284 -0
- data/maps/alalc-tel-Telu-Latn-2011.yaml +64 -0
- data/maps/az-aze-Cyrl-Latn-1939.yaml +105 -0
- data/maps/az-aze-Cyrl-Latn-1958.yaml +45 -0
- data/maps/bgnpcgn-ara-Arab-Latn-1956.yaml +3 -1
- data/maps/bgnpcgn-aze-Cyrl-Latn-1993.yaml +111 -104
- data/maps/bgnpcgn-bal-Arab-Latn-2008.yaml +329 -0
- data/maps/bgnpcgn-bul-Cyrl-Latn-1952.yaml +1 -1
- data/maps/bgnpcgn-div-Thaa-Latn-1988.yaml +75 -0
- data/maps/bgnpcgn-far-Latn-Latn-1964.yaml +28 -0
- data/maps/bgnpcgn-isl-Latn-Latn-1964.yaml +37 -0
- data/maps/bgnpcgn-kaz-Cyrl-Latn-1979.yaml +247 -0
- data/maps/bgnpcgn-kir-Cyrl-Latn-1979.yaml +218 -0
- data/maps/bgnpcgn-kur-Arab-Latn-2007.yaml +249 -0
- data/maps/bgnpcgn-per-Arab-Latn-1958.yaml +2 -0
- data/maps/bgnpcgn-prs-Arab-Latn-2007.yaml +87 -53
- data/maps/bgnpcgn-pus-Arab-Latn-1968.yaml +377 -0
- data/maps/bgnpcgn-srp-Cyrl-Latn-1962.yaml +73 -0
- data/maps/bgnpcgn-urd-Arab-Latn-2007.yaml +459 -0
- data/maps/{bis-knd-Knda-Latn-13194-1991.yaml → bis-kan-Kana-Latn-13194-1991.yaml} +2 -2
- data/maps/bis-ori-Orya-Latn-13194-1991.yaml +17 -2
- data/maps/iso-ara-Arab-Latn-233-1984.yaml +1 -1
- data/maps/{iso-kan-Knda-Latn-15919-2001.yaml → iso-kan-Kana-Latn-15919-2001.yaml} +1 -1
- data/maps/{mns-mon-Cyrl-Latn-5217-2012.yaml → masm-mon-Cyrl-Latn-5217-2012.yaml} +2 -2
- data/maps/{mns-mon-Latn-Cyrl-5217-2012.yaml → masm-mon-Latn-Cyrl-5217-2012.yaml} +1 -1
- data/maps/mv-div-Thaa-Latn-1987.yaml +200 -0
- data/maps/odni-ara-Arab-Latn-2004.yaml +137 -0
- data/maps/odni-ara-Arab-Latn-2015.yaml +20 -130
- data/maps/odni-bul-Cyrl-Latn-2005.yaml +90 -0
- data/maps/odni-fas-Arab-Latn-2004.yaml +276 -0
- data/maps/odni-hin-Deva-Latn-2004.yaml +182 -0
- data/maps/odni-mkd-Cyrl-Latn-2005.yaml +21 -0
- data/maps/odni-prs-Arab-Latn-2004.yaml +123 -0
- data/maps/{odni-per-Arab-Latn-2015.yaml → odni-prs-Arab-Latn-2015.yaml} +0 -0
- data/maps/odni-srp-Cyrl-Latn-2005.yaml +36 -0
- data/maps/odni-tuk-Cyrl-Latn-2015.yaml +170 -0
- data/maps/odni-ukr-Cyrl-Latn-2015.yaml +4 -0
- data/maps/un-ara-Arab-Latn-2017.yaml +1 -1
- data/maps/un-asm-Beng-Latn-1972.yaml +223 -0
- data/maps/un-guj-Gujr-Latn-1972.yaml +229 -0
- data/maps/un-hin-Deva-Latn-2016.yaml +104 -10
- data/maps/un-kan-Kana-Latn-2016.yaml +254 -0
- data/maps/un-mal-Mlym-Latn-1972.yaml +251 -0
- data/maps/un-mar-Deva-Latn-2016.yaml +24 -13
- data/maps/un-nep-Deva-Latn-1972.yaml +40 -121
- data/maps/un-ori-Orya-Latn-1972.yaml +247 -0
- data/maps/un-pan-Guru-Latn-1972.yaml +402 -0
- data/maps/un-prs-Arab-Latn-1967.yaml +236 -0
- data/maps/un-tam-Taml-Latn-1972.yaml +194 -0
- data/maps/un-tel-Telu-Latn-1972.yaml +270 -0
- data/maps/un-urd-Arab-Latn-1972.yaml +405 -0
- data/maps/var-amh-Ethi-Latn-eae-2003.yaml +466 -0
- data/maps/var-gez-Ethi-Latn-eae-2003.yaml +76 -0
- data/spec/interscript/filenames_spec.rb +6 -369
- data/spec/interscript_spec.rb +10 -2
- metadata +50 -7
- data/lib/interscript/opal/map_translate.rb +0 -7
@@ -0,0 +1,247 @@
|
|
1
|
+
---
|
2
|
+
authority_id: ungegn
|
3
|
+
id: 1972
|
4
|
+
language: iso-639-2:ori
|
5
|
+
source_script: Orya
|
6
|
+
destination_script: Latn
|
7
|
+
name: REPORT ON THE CURRENT STATUS OF UNITED NATIONS ROMANIZATION SYSTEMS FOR GEOGRAPHICAL NAMES -- Oriya Romanization, 1972
|
8
|
+
url: http://www.eki.ee/wgrs/v2_2/rom1_or.pdf
|
9
|
+
creation_date: 1972
|
10
|
+
confirmation_date: 2003
|
11
|
+
description: |
|
12
|
+
The United Nations recommended system was approved in 1972 (II/11), based on a report
|
13
|
+
prepared by D. N. Sharma. The note on the system was published in volume II of the
|
14
|
+
conference reports.
|
15
|
+
|
16
|
+
There is no evidence of the use of the system either in India or in international cartographic
|
17
|
+
products.
|
18
|
+
|
19
|
+
Oriya uses an alphasyllabic script whereby each character represents a syllable rather than one sound.
|
20
|
+
Vowels and diphthongs are marked in two ways: as independent characters (used syllable-initially) and in an
|
21
|
+
abbreviated form, to denote vowels after consonants. The romanization table is unambiguous. The system is mostly
|
22
|
+
reversible but there may exist some ambiguities in the romanization of vowels (independent vs. abbreviated characters)
|
23
|
+
and consonants (combinations with subscript consonants vs. character sequences).
|
24
|
+
|
25
|
+
notes:
|
26
|
+
- Combinations with r as the first component are written with a special superscript symbol, e.g. ର୍କ rka.
|
27
|
+
|
28
|
+
tests:
|
29
|
+
- source: "ର୍କ"
|
30
|
+
expected: "rka"
|
31
|
+
- source: "ଓଡ଼ିଆ"
|
32
|
+
expected: "oṙiā"
|
33
|
+
- source: "ଓଡ଼ିଶା"
|
34
|
+
expected: "oṙishā"
|
35
|
+
- source: "ଭୁବନେଶ୍ୱର"
|
36
|
+
expected: "bhubaneshvara"
|
37
|
+
- source: "ଆଇପିଏଲ୍-୧୩: ଦିଲ୍ଲୀ କ୍ୟାପିଟାଲ୍ସକୁ ୮୮ ରନ୍ ପରାସ୍ତ କଲା ସନରାଇଜର୍ସ ହାଇଦ୍ରାବାଦ"
|
38
|
+
expected: "āipiel-13: dillī kyāpiṭālsaku 88 ran parāsta kalā sanarāijarsa hāidrābāda"
|
39
|
+
- source: "ପ୍ରେମ ସମ୍ପର୍କରେ ଭଟ୍ଟା: ରାଗରେ ପ୍ରେମିକାର ତଣ୍ଟି କାଟି ନିଜେ ବିଷ ପିଇଲା ପ୍ରେମିକ"
|
40
|
+
expected: "prema samparkare bhaṭṭā: rāgare premikāra taṇṭi kāṭi nije biṣha piilā premika"
|
41
|
+
- source: "ପ୍ରେମ ସମ୍ପର୍କରେ ଭଟ୍ଟା: ରାଗରେ ପ୍ରେମିକାର ତଣ୍ଟି କାଟି ନିଜେ ବିଷ ପିଇଲା ପ୍ରେମିକ"
|
42
|
+
expected: "prema samparkare bhaṭṭā: rāgare premikāra taṇṭi kāṭi nije biṣha piilā premika"
|
43
|
+
- source: "ହୋଟେଲ, ଲଜ୍ରେ ରୁମ୍ ମିଳୁନି: ନେତାଙ୍କ ନାଁରେ ଆଗୁଆ ହୋଇଯାଇଛି ବୁକିଂ"
|
44
|
+
expected: "heāṭela, lajre rum miḷuni: netāṅka nāmre āguā heāiỵāichhhi bukiṃ"
|
45
|
+
- source: "ପର୍ଯ୍ୟଟକମାନଙ୍କ ନିମନ୍ତେ ନଭେମ୍ବର ୧ରୁ ଖୋଲିବ ଶିମିଳିପାଳ ଅଭୟାରଣ୍ୟ"
|
46
|
+
expected: "parỵyaṭakamānaṅka nimante nabhembara 1ru kholiba shimiḷipāḷa abhayāraṇya"
|
47
|
+
- source: "ପାରିବାରିକ ଅଶାନ୍ତିର କରୁଣ ପରିଣତି: କୂଅକୁ ଡେଇଁଲେ ମା’-ଝିଅ, ଝିଅ ମୃତ"
|
48
|
+
expected: "pāribārika ashāntira karuṇa pariṇati: kūaku ḍeimle mā’-jhia, jhia mṛta"
|
49
|
+
- source: "‘ଭ୍ରଷ୍ଟାଚାରର ବଂଶବାଦ’ ଏବେ ସାଜିଛି ଦେଶ ପାଇଁ ନୂଆ ସମସ୍ୟା; ପ୍ରଧାନମନ୍ତ୍ରୀ ମୋଦୀ"
|
50
|
+
expected: "‘bhraṣhṭāchārara baṃshabāda’ ebe sājichhhi desha pāim nūā samasyā; pradhānamantrī modī"
|
51
|
+
- source: "ପାହାଡ଼ି ଇଲାକାବାସୀଙ୍କ ଆଶାର ବତୀ ‘ପାର୍ବତୀ’"
|
52
|
+
expected: "pāhāṙi ilākābāsīṅka āshāra batī ‘pārbatī’"
|
53
|
+
|
54
|
+
|
55
|
+
map:
|
56
|
+
|
57
|
+
rules:
|
58
|
+
- pattern: ([କ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
59
|
+
result: 'k'
|
60
|
+
- pattern: ([ଖ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
61
|
+
result: 'kh'
|
62
|
+
- pattern: ([ଗ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
63
|
+
result: 'g'
|
64
|
+
- pattern: ([ଘ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
65
|
+
result: 'gh'
|
66
|
+
- pattern: ([ଙ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
67
|
+
result: 'ṅ'
|
68
|
+
- pattern: ([ଚ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
69
|
+
result: 'ch'
|
70
|
+
- pattern: ([ଛ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
71
|
+
result: 'chhh'
|
72
|
+
- pattern: ([ଜ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
73
|
+
result: 'j'
|
74
|
+
- pattern: ([ଝ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
75
|
+
result: 'jh'
|
76
|
+
- pattern: ([ଞ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
77
|
+
result: 'ñ'
|
78
|
+
- pattern: ([ଟ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
79
|
+
result: 'ṭ'
|
80
|
+
- pattern: ([ଠ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
81
|
+
result: 'ṭh'
|
82
|
+
- pattern: ([ଡ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
83
|
+
result: 'ḍ'
|
84
|
+
- pattern: ([ଡ଼]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
85
|
+
result: 'ṙ'
|
86
|
+
- pattern: ([ଢ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
87
|
+
result: 'ḍh'
|
88
|
+
- pattern: ([ଢ଼]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
89
|
+
result: 'ṙh'
|
90
|
+
- pattern: ([ଣ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
91
|
+
result: 'ṇ'
|
92
|
+
- pattern: ([ତ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
93
|
+
result: 't'
|
94
|
+
- pattern: ([ଥ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
95
|
+
result: 'th'
|
96
|
+
- pattern: ([ଦ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
97
|
+
result: 'd'
|
98
|
+
- pattern: ([ଧ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
99
|
+
result: 'dh'
|
100
|
+
- pattern: ([ନ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
101
|
+
result: 'n'
|
102
|
+
- pattern: ([ପ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
103
|
+
result: 'p'
|
104
|
+
- pattern: ([ଫ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
105
|
+
result: 'ph'
|
106
|
+
- pattern: ([ବ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
107
|
+
result: 'b'
|
108
|
+
- pattern: ([ଭ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
109
|
+
result: 'bh'
|
110
|
+
- pattern: ([ମ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
111
|
+
result: 'm'
|
112
|
+
- pattern: ([ଯ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
113
|
+
result: 'ỵ'
|
114
|
+
- pattern: ([ୟ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
115
|
+
result: 'y'
|
116
|
+
- pattern: ([ର]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
117
|
+
result: 'r'
|
118
|
+
- pattern: ([ଲ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
119
|
+
result: 'l'
|
120
|
+
- pattern: ([ଳ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
121
|
+
result: 'ḷ'
|
122
|
+
- pattern: ([ଶ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
123
|
+
result: 'sh'
|
124
|
+
- pattern: ([ଷ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
125
|
+
result: 'ṣh'
|
126
|
+
- pattern: ([ସ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
127
|
+
result: 's'
|
128
|
+
- pattern: ([ହ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
129
|
+
result: 'h'
|
130
|
+
- pattern: ([କ୍ଷ]=?)(?=[\u0b4d\u0b3e\u0b3f\u0b40\u0b41\u0b42\u0b43\u0b47\u0b48\u0b4b\u0b4c])
|
131
|
+
result: 'kṣh'
|
132
|
+
|
133
|
+
characters:
|
134
|
+
'ଅ': 'a'
|
135
|
+
'ଆ': 'ā'
|
136
|
+
'ଇ': 'i'
|
137
|
+
'ଈ': 'ī'
|
138
|
+
'ଉ': 'u'
|
139
|
+
'ଊ': 'ū'
|
140
|
+
'ଋ': 'ṛ'
|
141
|
+
'ୠ': 'ṝ'
|
142
|
+
'ଌ': 'ḻ'
|
143
|
+
'ଏ': 'e'
|
144
|
+
'ଐ': 'ai'
|
145
|
+
'ଓ': 'o'
|
146
|
+
'ୱ': 'va'
|
147
|
+
'ଔ': 'au'
|
148
|
+
|
149
|
+
# II. Consonants
|
150
|
+
# Gutturals
|
151
|
+
'କ': 'ka'
|
152
|
+
'ଖ': 'kha'
|
153
|
+
'ଗ': 'ga'
|
154
|
+
'ଘ': 'gha'
|
155
|
+
'ଙ': 'ṅa'
|
156
|
+
|
157
|
+
# Palatals
|
158
|
+
'ଚ': 'cha'
|
159
|
+
'ଛ': 'chha'
|
160
|
+
'ଜ': 'ja'
|
161
|
+
'ଝ': 'jha'
|
162
|
+
'ଞ': 'ña'
|
163
|
+
|
164
|
+
# Cerebrals
|
165
|
+
'ଟ': 'ṭa'
|
166
|
+
'ଠ': 'ṭha'
|
167
|
+
'ଡ': 'ḍa'
|
168
|
+
'ଡ଼': 'ṙa'
|
169
|
+
'ଢ': 'ḍha'
|
170
|
+
'ଢ଼': 'ṙha'
|
171
|
+
'ଣ': 'ṇa'
|
172
|
+
|
173
|
+
# Dentals
|
174
|
+
'ତ': 'ta'
|
175
|
+
'ଥ': 'tha'
|
176
|
+
'ଦ': 'da'
|
177
|
+
'ଧ': 'dha'
|
178
|
+
'ନ': 'na'
|
179
|
+
|
180
|
+
# Labials
|
181
|
+
'ପ': 'pa'
|
182
|
+
'ଫ': 'pha'
|
183
|
+
'ବ': 'ba'
|
184
|
+
'ଭ': 'bha'
|
185
|
+
'ମ': 'ma'
|
186
|
+
|
187
|
+
# Semivowels
|
188
|
+
'ଯ': 'ỵa'
|
189
|
+
'ୟ': 'ya'
|
190
|
+
'ର': 'ra'
|
191
|
+
'ଲ': 'la'
|
192
|
+
'ଳ': 'ḷa'
|
193
|
+
|
194
|
+
# Sibilants
|
195
|
+
'ଶ': 'sha'
|
196
|
+
'ଷ': 'ṣha'
|
197
|
+
'ସ': 'sa'
|
198
|
+
|
199
|
+
|
200
|
+
# Aspirate
|
201
|
+
'ହ': 'ha'
|
202
|
+
|
203
|
+
'କ୍ଷ': 'kṣha'
|
204
|
+
|
205
|
+
# Chandrabindu
|
206
|
+
'ଁ': 'm'
|
207
|
+
|
208
|
+
# Bisarga
|
209
|
+
'ଃ': 'ḥ'
|
210
|
+
|
211
|
+
# Anusvāra
|
212
|
+
'ଂ': 'ṃ'
|
213
|
+
|
214
|
+
# Medials # Needed for connecting consonants
|
215
|
+
|
216
|
+
'ା': 'ā'
|
217
|
+
'ି': 'i'
|
218
|
+
'ୀ': 'ī'
|
219
|
+
'ୁ': 'u'
|
220
|
+
'ୂ': 'ū'
|
221
|
+
'ୃ': 'ṛ'
|
222
|
+
'େ': 'e'
|
223
|
+
'ୈ': 'ai'
|
224
|
+
'ୋ': 'o'
|
225
|
+
'ୌ': 'au'
|
226
|
+
|
227
|
+
'्': ''
|
228
|
+
'୍': ''
|
229
|
+
'़': ''
|
230
|
+
'଼': ''
|
231
|
+
'।': '.'
|
232
|
+
"": ''# Used for joining
|
233
|
+
"": ''# Used for non joining
|
234
|
+
|
235
|
+
# Numbers
|
236
|
+
|
237
|
+
'୦': '0'
|
238
|
+
'୧': '1'
|
239
|
+
'୨': '2'
|
240
|
+
'୩': '3'
|
241
|
+
'୪': '4'
|
242
|
+
'୫': '5'
|
243
|
+
'୬': '6'
|
244
|
+
'୭': '7'
|
245
|
+
'୮': '8'
|
246
|
+
'୯': '9'
|
247
|
+
|
@@ -0,0 +1,402 @@
|
|
1
|
+
---
|
2
|
+
authority_id: un
|
3
|
+
id: 1972
|
4
|
+
language: iso-639-2:pan
|
5
|
+
source_script: Guru
|
6
|
+
destination_script: Latn
|
7
|
+
name: REPORT ON THE CURRENT STATUS OF UNITED NATIONS ROMANIZATION SYSTEMS FOR GEOGRAPHICAL NAMES -- Panjabi Romanization Version 4.0
|
8
|
+
url: https://www.eki.ee/wgrs/rom1_pa.htm
|
9
|
+
creation_date: 1972
|
10
|
+
confirmation_date: 2016
|
11
|
+
description: |
|
12
|
+
The United Nations recommended system was approved in 1972 (II/11) and amended in 1977 (III/12),
|
13
|
+
based on a report prepared by D. N. Sharma. The tables and their corrections were published in volume
|
14
|
+
II of the conference reports [1, 2].
|
15
|
+
|
16
|
+
There is no evidence of the use of the system either in India or in international cartographic products.
|
17
|
+
|
18
|
+
Punjabi (Panjābī) in India uses an alphasyllabic script (Gurmukhi) whereby each character represents a syllable
|
19
|
+
rather than one sound. Vowels and diphthongs are marked in two ways: as independent characters (used syllable-initially)
|
20
|
+
and in an abbreviated form, to denote vowels after consonants. The romanization table is unambiguous. The system is mostly
|
21
|
+
reversible but there exist some ambiguities in the romanization of vowels (independent vs. abbreviated characters) and
|
22
|
+
consonants (combinations with subscript consonants vs. character sequences).
|
23
|
+
|
24
|
+
References
|
25
|
+
|
26
|
+
Second United Nations Conference on the Standardization of Geographical Names. London, 10–31 May 1972. Vol. II. Technical papers.
|
27
|
+
United Nations. New York 1974, pp. 136–138.
|
28
|
+
|
29
|
+
Third United Nations Conference on the Standardization of Geographical Names. Athens, 17 August – 7 September 1977. Vol. II,
|
30
|
+
Technical papers, pp. 393 etc.
|
31
|
+
|
32
|
+
|
33
|
+
|
34
|
+
notes:
|
35
|
+
- |
|
36
|
+
These characters are used in combination with abbreviated vowel characters: ਉ u, ਊ ū, ਅ a, ਆ ā, ਐ ai, ਔ au, ਇ i, ਈ ī, ਏ e; exceptional variation: ਓ o.
|
37
|
+
- |
|
38
|
+
Dotted variants of the characters: ਸ਼ sha, ਖ਼ ḳha, ਗ਼ g̣a, ਜ਼ za, ਫ਼ fa.
|
39
|
+
- |
|
40
|
+
(ੰ) Used if it is preceded by short vowels (a, i, u) and ū, excluding the independent vowel character ਉ (u, ū), e.g. ਸੰਗ saṁg, ਸਿੰਗ siṁg, ਬੁੰਦਾ buṁdā, ਬੂੰਦ būṁd, ਇੰਜਨ iṁjan.
|
41
|
+
- |
|
42
|
+
(ਂ) Used in all other occasions, e.g. ਝੋਂਕਾ jhoṁkā.
|
43
|
+
- |
|
44
|
+
(ੱ) Marks doubling of the following consonant: ਨਿੱਕਾ nikkā, ਲੱਭਣਾ labhbhṇā, ਕੁੱਤਾ kuttā, ਹਿੱਸਾ hissā, ਲੱਮਾ lammā.
|
45
|
+
- |
|
46
|
+
Absence of the inherent vowel (-a) is not marked in the spelling in any way except for the combinations
|
47
|
+
with subscript characters and those which are doubled by ੱ (adhaka).
|
48
|
+
|
49
|
+
tests:
|
50
|
+
- source: "ਪੰਜਾਬ 'ਚ ਵਧ ਰਿਹਾ ਖ਼ੁਦਕੁਸ਼ੀਆਂ ਦਾ ਰੁਝਾਨ"
|
51
|
+
expected: "paṁzāba 'cha vadha rihā khaḳhudakusḳhīāṁ dā rujhāna"
|
52
|
+
- source: "ਲੱਖ ਤੋਂ ਪਾਰ ਪੁੱਜਾ ਸਰਗਰਮ ਕੇਸਾਂ ਦਾ ਅੰਕੜਾ, ਦਿੱਲੀ 'ਚ ਦੋ ਲੱਖ ਤੋਂ ਪਾਰ ਇਨਫੈਕਟਿਡ"
|
53
|
+
expected: "lakkha toṁ pāra puzzā sragarama kesāṁ dā aṁkaṙā, dillī 'cha do lakkha toṁ pāra inaphaikaṭiḍa"
|
54
|
+
- source: "ਪਰਿਵਾਰਕ ਸਮੱਸਿਆਵਾਂ ਅਤੇ ਵਿਆਹ ਵੀ ਹੈ ਹੋਰ ਅਹਿਮ ਕਾਰਨ"
|
55
|
+
expected: "parivāraka smassiāvāṁ ate viāh vī hai hora ahima kārana"
|
56
|
+
- source: "ਮਰਦਾਂ 'ਚ ਔਰਤਾਂ ਨਾਲੋਂ ਵੱਧ ਹੈ ਖ਼ੁਦਕੁਸ਼ੀ ਦਾ ਰੁਝਾਨ"
|
57
|
+
expected: "maradāṁ 'cha auratāṁ nāloṁ vaddha hai khaḳhudakusḳhī dā rujhāna"
|
58
|
+
- source: "ਰਾਸ਼ਟਰੀ ਪੱਧਰ 'ਤੇ ਪੰਜਾਬ ਦੀ ਸਥਿਤੀ ਕਾਫ਼ੀ ਸੂਬਿਆਂ ਤੋਂ ਬਿਹਤਰ"
|
59
|
+
expected: "rāsṭarī paddhara 'te paṁzāba dī sthitī kāphaḳhī sūbiāṁ toṁ bihtara"
|
60
|
+
- source: "ਚੀਨੀ ਸੈਨਾ ਨੇ ਲਾਪਤਾ ਅਰੁਣਾਚਲ ਦੇ 5 ਨੌਜਵਾਨਾਂ ਬਾਰੇ ਦੱਸਿਆ"
|
61
|
+
expected: "chīnī sainā ne lāpatā aruṇāchala de 5 naujavānāṁ bāre dassiā"
|
62
|
+
- source: "ਸਾਖਰਤਾ ਦੇ ਮਾਮਲੇ 'ਚ ਦੇਸ਼ 'ਚ 7ਵੇਂ ਨੰਬਰ 'ਤੇ ਪੰਜਾਬ"
|
63
|
+
expected: "sākharatā de māmale 'cha des 'cha 7veṁ naṁbara 'te paṁzāba"
|
64
|
+
- source: "ਦਿੱਲੀ ਕਮੇਟੀ ਦੇ ਮੈਂਬਰ ਸ਼ੰਟੀ ਨੇ ਅਕਾਲੀ ਦਲ ਤੋਂ ਦਿੱਤਾ ਅਸਤੀਫ਼ਾ"
|
65
|
+
expected: "dillī kameṭī de maiṁbara sṁṭī ne akālī dala toṁ dittā astīphaḳhā"
|
66
|
+
- source: "੧੦੨ ਹੋਰ ਕੋਰੋਨਾ ਪਾਜ਼ੀਟਿਵ ਮਰੀਜ਼ਾਂ ਦੀ ਪੁਸ਼ਟੀ, ਇਕ ਦੀ ਮੌਤ"
|
67
|
+
expected: "102 hora koronā pājaḳhīṭiva marījaḳhāṁ dī pusṭī, ika dī mauta"
|
68
|
+
- source: "ਸੜਕ ਹਾਦਸੇ ਦੌਰਾਨ ਇਕ ਦੀ ਮੌਤ"
|
69
|
+
expected: "sṙaka hādase daurāna ika dī mauta"
|
70
|
+
|
71
|
+
map:
|
72
|
+
|
73
|
+
rules:
|
74
|
+
- pattern: (?<!ੱ)([ਕ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
75
|
+
result: 'k'
|
76
|
+
- pattern: (?<!ੱ)([ਖ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
77
|
+
result: 'kh'
|
78
|
+
- pattern: (?<!ੱ)([ਖ਼]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
79
|
+
result: 'ḳh'
|
80
|
+
- pattern: (?<!ੱ)([ਗ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
81
|
+
result: 'g'
|
82
|
+
- pattern: (?<!ੱ)([ਗ਼]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
83
|
+
result: 'g̣'
|
84
|
+
- pattern: (?<!ੱ)([ਘ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
85
|
+
result: 'gh'
|
86
|
+
- pattern: (?<!ੱ)([ਙ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
87
|
+
result: 'ṅ'
|
88
|
+
- pattern: (?<!ੱ)([ਚ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
89
|
+
result: 'ch'
|
90
|
+
- pattern: (?<!ੱ)([ਛ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
91
|
+
result: 'chh'
|
92
|
+
- pattern: (?<!ੱ)([ਜ਼]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
93
|
+
result: 'z'
|
94
|
+
- pattern: (?<!ੱ)([ਜ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
95
|
+
result: 'j'
|
96
|
+
- pattern: (?<!ੱ)([ਝ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
97
|
+
result: 'jh'
|
98
|
+
- pattern: (?<!ੱ)([ਞ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
99
|
+
result: 'ñ'
|
100
|
+
- pattern: (?<!ੱ)([ਟ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
101
|
+
result: 'ṭ'
|
102
|
+
- pattern: (?<!ੱ)([ਠ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
103
|
+
result: 'ṭh'
|
104
|
+
- pattern: (?<!ੱ)([ਡ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
105
|
+
result: 'ḍ'
|
106
|
+
- pattern: (?<!ੱ)([ਢ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
107
|
+
result: 'ḍh'
|
108
|
+
- pattern: (?<!ੱ)([ਣ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
109
|
+
result: 'ṇ'
|
110
|
+
- pattern: (?<!ੱ)([ਤ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
111
|
+
result: 't'
|
112
|
+
- pattern: (?<!ੱ)([ਥ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
113
|
+
result: 'th'
|
114
|
+
- pattern: (?<!ੱ)([ਦ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
115
|
+
result: 'd'
|
116
|
+
- pattern: (?<!ੱ)([ਧ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
117
|
+
result: 'dh'
|
118
|
+
- pattern: (?<!ੱ)([ਨ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
119
|
+
result: 'n'
|
120
|
+
- pattern: (?<!ੱ)([ਪ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
121
|
+
result: 'p'
|
122
|
+
- pattern: (?<!ੱ)([ਫ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
123
|
+
result: 'ph'
|
124
|
+
- pattern: (?<!ੱ)([ਫ਼]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
125
|
+
result: 'f'
|
126
|
+
- pattern: (?<!ੱ)([ਬ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
127
|
+
result: 'b'
|
128
|
+
- pattern: (?<!ੱ)([ਭ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
129
|
+
result: 'bh'
|
130
|
+
- pattern: (?<!ੱ)([ਮ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
131
|
+
result: 'm'
|
132
|
+
- pattern: (?<!ੱ)([ਯ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
133
|
+
result: 'y'
|
134
|
+
- pattern: (?<!ੱ)([ਰ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
135
|
+
result: 'r'
|
136
|
+
- pattern: (?<!ੱ)([ਲ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
137
|
+
result: 'l'
|
138
|
+
- pattern: (?<!ੱ)([ਲੵ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
139
|
+
result: 'l'
|
140
|
+
- pattern: (?<!ੱ)([ਲ਼]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
141
|
+
result: 'l'
|
142
|
+
- pattern: (?<!ੱ)([ਵ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
143
|
+
result: 'v'
|
144
|
+
- pattern: (?<!ੱ)([ੜ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
145
|
+
result: 'ṙ'
|
146
|
+
- pattern: (?<!ੱ)([ਸ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
147
|
+
result: 's'
|
148
|
+
- pattern: (?<!ੱ)([ਸ਼]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
149
|
+
result: 'sh'
|
150
|
+
- pattern: (?<!ੱ)([ਹ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
151
|
+
result: 'h'
|
152
|
+
|
153
|
+
- pattern: (?<=ੱ)([ਕ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
154
|
+
result: 'kk'
|
155
|
+
- pattern: (?<=ੱ)([ਖ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
156
|
+
result: 'kkh'
|
157
|
+
- pattern: (?<=ੱ)([ਖ਼]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
158
|
+
result: 'ḳḳh'
|
159
|
+
- pattern: (?<=ੱ)([ਗ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
160
|
+
result: 'gg'
|
161
|
+
- pattern: (?<=ੱ)([ਗ਼]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
162
|
+
result: 'gg̣'
|
163
|
+
- pattern: (?<=ੱ)([ਘ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
164
|
+
result: 'ggh'
|
165
|
+
- pattern: (?<=ੱ)([ਙ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
166
|
+
result: 'ṅṅ'
|
167
|
+
- pattern: (?<=ੱ)([ਚ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
168
|
+
result: 'cch'
|
169
|
+
- pattern: (?<=ੱ)([ਛ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
170
|
+
result: 'cchh'
|
171
|
+
- pattern: (?<=ੱ)([ਜ਼]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
172
|
+
result: 'zz'
|
173
|
+
- pattern: (?<=ੱ)([ਜ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
174
|
+
result: 'jj'
|
175
|
+
- pattern: (?<=ੱ)([ਝ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
176
|
+
result: 'jjh'
|
177
|
+
- pattern: (?<=ੱ)([ਞ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
178
|
+
result: 'ññ'
|
179
|
+
- pattern: (?<=ੱ)([ਟ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
180
|
+
result: 'ṭṭ'
|
181
|
+
- pattern: (?<=ੱ)([ਠ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
182
|
+
result: 'ṭṭh'
|
183
|
+
- pattern: (?<=ੱ)([ਡ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
184
|
+
result: 'ḍḍ'
|
185
|
+
- pattern: (?<=ੱ)([ਢ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
186
|
+
result: 'ḍḍh'
|
187
|
+
- pattern: (?<=ੱ)([ਣ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
188
|
+
result: 'ṇṇ'
|
189
|
+
- pattern: (?<=ੱ)([ਤ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
190
|
+
result: 'tt'
|
191
|
+
- pattern: (?<=ੱ)([ਥ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
192
|
+
result: 'tth'
|
193
|
+
- pattern: (?<=ੱ)([ਦ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
194
|
+
result: 'dd'
|
195
|
+
- pattern: (?<=ੱ)([ਧ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
196
|
+
result: 'ddh'
|
197
|
+
- pattern: (?<=ੱ)([ਨ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
198
|
+
result: 'nn'
|
199
|
+
- pattern: (?<=ੱ)([ਪ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
200
|
+
result: 'pp'
|
201
|
+
- pattern: (?<=ੱ)([ਫ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
202
|
+
result: 'pph'
|
203
|
+
- pattern: (?<=ੱ)([ਫ਼]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
204
|
+
result: 'ff'
|
205
|
+
- pattern: (?<=ੱ)([ਬ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
206
|
+
result: 'bb'
|
207
|
+
- pattern: (?<=ੱ)([ਭ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
208
|
+
result: 'bbh'
|
209
|
+
- pattern: (?<=ੱ)([ਮ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
210
|
+
result: 'mm'
|
211
|
+
- pattern: (?<=ੱ)([ਯ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
212
|
+
result: 'yy'
|
213
|
+
- pattern: (?<=ੱ)([ਰ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
214
|
+
result: 'rr'
|
215
|
+
- pattern: (?<=ੱ)([ਲ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
216
|
+
result: 'll'
|
217
|
+
- pattern: (?<=ੱ)([ਲੵ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
218
|
+
result: 'll'
|
219
|
+
- pattern: (?<=ੱ)([ਲ਼]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
220
|
+
result: 'll'
|
221
|
+
- pattern: (?<=ੱ)([ਵ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
222
|
+
result: 'vv'
|
223
|
+
- pattern: (?<=ੱ)([ੜ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
224
|
+
result: 'ṙṙ'
|
225
|
+
- pattern: (?<=ੱ)([ਸ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
226
|
+
result: 'ss'
|
227
|
+
- pattern: (?<=ੱ)([ਸ਼]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
228
|
+
result: 'ssh'
|
229
|
+
- pattern: (?<=ੱ)([ਹ]=?)(?=[\u0a3e\u0a3f\u0a40\u0a41\u0a42\u0a47\u0a48\u0a4b\u0a4c\u0a4d])
|
230
|
+
result: 'hh'
|
231
|
+
|
232
|
+
characters:
|
233
|
+
|
234
|
+
# I. Vowels and Diphthongs (see Note 1)
|
235
|
+
'ਅ': 'a'
|
236
|
+
'ਆ': 'ā'
|
237
|
+
'ਇ': 'i'
|
238
|
+
'ਈ': 'ī'
|
239
|
+
'ਉ': 'u'
|
240
|
+
'ਊ': 'ū'
|
241
|
+
'ਏ': 'e'
|
242
|
+
'ਐ': 'ai'
|
243
|
+
'ਓ': 'o'
|
244
|
+
'ਔ': 'au'
|
245
|
+
|
246
|
+
'ਾ': "ā"
|
247
|
+
'ਿ': "i"
|
248
|
+
'ੀ': "ī"
|
249
|
+
'ੁ': "u"
|
250
|
+
'ੂ': "ū"
|
251
|
+
'ੇ': "e"
|
252
|
+
'ੈ': "ai"
|
253
|
+
'ੋ': "o"
|
254
|
+
'ੌ': "au"
|
255
|
+
|
256
|
+
# II. Consonants
|
257
|
+
'ਕ': 'ka'
|
258
|
+
'ਖ': 'kha'
|
259
|
+
'ਖ਼': 'ḳha'
|
260
|
+
'ਗ': 'ga'
|
261
|
+
'ਗ਼': 'g̣a'
|
262
|
+
'ਘ': 'gha'
|
263
|
+
'ਙ': 'ṅa'
|
264
|
+
'ਚ': 'cha'
|
265
|
+
'ਛ': 'chha'
|
266
|
+
'ਜ਼': 'za'
|
267
|
+
'ਜ': 'ja'
|
268
|
+
'ਝ': 'jha'
|
269
|
+
'ਞ': 'ña'
|
270
|
+
'ਟ': 'ṭa'
|
271
|
+
'ਠ': 'ṭha'
|
272
|
+
'ਡ': 'ḍa'
|
273
|
+
'ਢ': 'ḍha'
|
274
|
+
'ਣ': 'ṇa'
|
275
|
+
'ਤ': 'ta'
|
276
|
+
'ਥ': 'tha'
|
277
|
+
'ਦ': 'da'
|
278
|
+
'ਧ': 'dha'
|
279
|
+
'ਨ': 'na'
|
280
|
+
'ਪ': 'pa'
|
281
|
+
'ਫ': 'pha'
|
282
|
+
'ਫ਼': 'fa'
|
283
|
+
'ਬ': 'ba'
|
284
|
+
'ਭ': 'bha'
|
285
|
+
'ਮ': 'ma'
|
286
|
+
'ਯ': 'ya'
|
287
|
+
'ਰ': 'ra'
|
288
|
+
'ਲ': 'la'
|
289
|
+
'ਲੵ': 'la'
|
290
|
+
'ਲ਼': 'la'
|
291
|
+
'ਵ': 'va'
|
292
|
+
'ੜ': 'ṙa'
|
293
|
+
'ਸ': 's'
|
294
|
+
'ਸ਼': 'sha'
|
295
|
+
'ਹ': 'h'
|
296
|
+
'ਂ': 'ṁ'
|
297
|
+
'ੰ': 'ṁ'
|
298
|
+
|
299
|
+
# Adhik character doubling of the following consonant [Note 5]
|
300
|
+
'ੱਕ': 'kka'
|
301
|
+
'ੱਖ': 'kkha'
|
302
|
+
'ੱਖ਼': 'ḳḳha'
|
303
|
+
'ੱਗ': 'gga'
|
304
|
+
'ੱਗ਼': 'gg̣a'
|
305
|
+
'ੱਘ': 'ggha'
|
306
|
+
'ੱਙ': 'ṅṅa'
|
307
|
+
'ੱਚ': 'ccha'
|
308
|
+
'ੱਛ': 'cchha'
|
309
|
+
'ੱਜ਼': 'zza'
|
310
|
+
'ੱਜ': 'jja'
|
311
|
+
'ੱਝ': 'jjha'
|
312
|
+
'ੱਞ': 'ñña'
|
313
|
+
'ੱਟ': 'ṭṭa'
|
314
|
+
'ੱਠ': 'ṭṭha'
|
315
|
+
'ੱਡ': 'ḍḍa'
|
316
|
+
'ੱਢ': 'ḍḍha'
|
317
|
+
'ੱਣ': 'ṇṇa'
|
318
|
+
'ੱਤ': 'tta'
|
319
|
+
'ੱਥ': 'ttha'
|
320
|
+
'ੱਦ': 'dda'
|
321
|
+
'ੱਧ': 'ddha'
|
322
|
+
'ੱਨ': 'nna'
|
323
|
+
'ੱਪ': 'ppa'
|
324
|
+
'ੱਫ': 'ppha'
|
325
|
+
'ੱਫ਼': 'ffa'
|
326
|
+
'ੱਬ': 'bba'
|
327
|
+
'ੱਭ': 'bbha'
|
328
|
+
'ੱਮ': 'mma'
|
329
|
+
'ੱਯ': 'yya'
|
330
|
+
'ੱਰ': 'rra'
|
331
|
+
'ੱਲ': 'lla'
|
332
|
+
'ੱਲੵ': 'lla'
|
333
|
+
'ੱਲ਼': 'lla'
|
334
|
+
'ੱਵ': 'vva'
|
335
|
+
'ੱੜ': 'ṙṙa'
|
336
|
+
'ੱਸ': 'ss'
|
337
|
+
'ੱਸ਼': 'ssha'
|
338
|
+
'ੱਹ': 'hh'
|
339
|
+
|
340
|
+
# Adhik character doubling of the following consonant and ends with ੍ [Note 5]
|
341
|
+
'ੱਕ੍': 'kk'
|
342
|
+
'ੱਖ੍': 'kkh'
|
343
|
+
'ੱਖ਼੍': 'ḳḳh'
|
344
|
+
'ੱਗ੍': 'gg'
|
345
|
+
'ੱਗ਼੍': 'gg̣'
|
346
|
+
'ੱਘ੍': 'ggh'
|
347
|
+
'ੱਙ੍': 'ṅṅ'
|
348
|
+
'ੱਚ੍': 'cch'
|
349
|
+
'ੱਛ੍': 'cchh'
|
350
|
+
'ੱਜ਼੍': 'zz'
|
351
|
+
'ੱਜ੍': 'jj'
|
352
|
+
'ੱਝ੍': 'jjh'
|
353
|
+
'ੱਞ੍': 'ññ'
|
354
|
+
'ੱਟ੍': 'ṭṭ'
|
355
|
+
'ੱਠ੍': 'ṭṭh'
|
356
|
+
'ੱਡ੍': 'ḍḍ'
|
357
|
+
'ੱਢ੍': 'ḍḍh'
|
358
|
+
'ੱਣ੍': 'ṇṇ'
|
359
|
+
'ੱਤ੍': 'tt'
|
360
|
+
'ੱਥ੍': 'tth'
|
361
|
+
'ੱਦ੍': 'dd'
|
362
|
+
'ੱਧ੍': 'ddh'
|
363
|
+
'ੱਨ੍': 'nn'
|
364
|
+
'ੱਪ੍': 'pp'
|
365
|
+
'ੱਫ੍': 'pph'
|
366
|
+
'ੱਫ਼੍': 'ff'
|
367
|
+
'ੱਬ੍': 'bb'
|
368
|
+
'ੱਭ੍': 'bbh'
|
369
|
+
'ੱਮ੍': 'mm'
|
370
|
+
'ੱਯ੍': 'yy'
|
371
|
+
'ੱਰ੍': 'rr'
|
372
|
+
'ੱਲ੍': 'll'
|
373
|
+
'ੱਲੵ੍': 'll'
|
374
|
+
'ੱਲ਼੍': 'll'
|
375
|
+
'ੱਵ੍': 'vv'
|
376
|
+
'ੱੜ੍': 'ṙṙ'
|
377
|
+
'ੱਸ੍': 'ss'
|
378
|
+
'ੱਸ਼੍': 'ssh'
|
379
|
+
'ੱਹ੍': 'hh'
|
380
|
+
|
381
|
+
|
382
|
+
# III. Subscript consonant characters
|
383
|
+
"੍ਹ": "-h"
|
384
|
+
"੍ਵ": "-v"
|
385
|
+
"੍ਰ": "-r"
|
386
|
+
"੍ਯ": "-y"
|
387
|
+
|
388
|
+
"੍": ""
|
389
|
+
"ੱ": ""
|
390
|
+
"਼": ""
|
391
|
+
|
392
|
+
# digits
|
393
|
+
'੦': '0'
|
394
|
+
'੧': '1'
|
395
|
+
'੨': '2'
|
396
|
+
'੩': '3'
|
397
|
+
'੪': '4'
|
398
|
+
'੫': '5'
|
399
|
+
'੬': '6'
|
400
|
+
'੭': '7'
|
401
|
+
'੮': '8'
|
402
|
+
'੯': '9'
|