interscript 0.1.2 → 0.1.3

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (120) hide show
  1. checksums.yaml +4 -4
  2. data/README.adoc +246 -14
  3. data/bin/interscript +38 -17
  4. data/bin/setup +8 -0
  5. data/lib/g2pwrapper.py +34 -0
  6. data/lib/interscript.rb +140 -16
  7. data/lib/interscript/command.rb +27 -0
  8. data/lib/interscript/mapping.rb +125 -0
  9. data/lib/interscript/version.rb +1 -1
  10. data/lib/model-7 +0 -0
  11. data/lib/tha-pt-b-7 +0 -0
  12. data/maps/acadsin-zho-Hani-Latn-2002.yaml +38912 -0
  13. data/maps/alalc-bel-cyrl-latn-1997.yaml +125 -0
  14. data/maps/alalc-ben-Beng-Latn-2017.yaml +130 -0
  15. data/maps/alalc-bul-Cyrl-Latn-1997.yaml +94 -0
  16. data/maps/alalc-ell-Grek-Latn-1997.yaml +625 -0
  17. data/maps/alalc-ell-Grek-Latn-2010.yaml +628 -0
  18. data/maps/alalc-kat-Geok-Latn-1997.yaml +112 -0
  19. data/maps/alalc-kat-Geor-Latn-1997.yaml +146 -0
  20. data/maps/alalc-kor-Hang-Latn-1997.yaml +94 -0
  21. data/maps/alalc-mkd-Cyrl-Latn-2013.yaml +103 -0
  22. data/maps/alalc-mkd-cyrl-latn-1997.yaml +114 -0
  23. data/maps/alalc-srp-Cyrl-Latn-1997.yaml +114 -0
  24. data/maps/alalc-srp-cyrl-latn-2013.yaml +135 -0
  25. data/maps/alalc-ukr-Cyrl-Latn-1997.yaml +141 -0
  26. data/maps/alalc-ukr-Cyrl-Latn-2011.yaml +16 -0
  27. data/maps/apcbg-bul-Cyrl-Latn-1995.yaml +283 -0
  28. data/maps/{bas-rus-Cyrl-Latn-bss.yaml → bas-rus-Cyrl-Latn-2017-bss.yaml} +57 -31
  29. data/maps/{bas-rus-Cyrl-Latn-oss.yaml → bas-rus-Cyrl-Latn-2017-oss.yaml} +54 -34
  30. data/maps/bgn-jpn-Hrkt-Latn-1962.yaml +294 -0
  31. data/maps/bgn-kor-Hang-Latn-1943.yaml +31 -0
  32. data/maps/bgn-kor-Kore-Latn-1943.yaml +31 -0
  33. data/maps/bgna-bul-Cyrl-Latn-2006.yaml +208 -0
  34. data/maps/bgna-bul-Cyrl-Latn-2009.yaml +208 -0
  35. data/maps/bgnpcgn-arm-Armn-Latn-1981.yaml +1 -2
  36. data/maps/bgnpcgn-aze-Cyrl-Latn-1993.yaml +104 -0
  37. data/maps/bgnpcgn-bel-cyrl-latn-1979.yaml +285 -0
  38. data/maps/bgnpcgn-bul-Cyrl-Latn-1952.yaml +115 -0
  39. data/maps/bgnpcgn-bul-Cyrl-Latn-2013.yaml +10 -64
  40. data/maps/bgnpcgn-chn-Hans-Latn-1979.yaml +7456 -0
  41. data/maps/bgnpcgn-ell-Grek-Latn-1962.yaml +702 -0
  42. data/maps/bgnpcgn-ell-Grek-Latn-1996.yaml +20 -0
  43. data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.yaml +257 -0
  44. data/maps/bgnpcgn-kat-Geor-Latn-1981.yaml +127 -0
  45. data/maps/bgnpcgn-kat-Geor-Latn-2009.yaml +43 -0
  46. data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.yaml +253 -0
  47. data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.yaml +48 -0
  48. data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.yaml +48 -0
  49. data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.yaml +159 -0
  50. data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.yaml +190 -0
  51. data/maps/bgnpcgn-rus-Cyrl-Latn-1947.yaml +145 -64
  52. data/maps/bgnpcgn-srp-Cyrl-Latn-2005.yaml +166 -0
  53. data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.yaml +75 -2
  54. data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.yaml +208 -0
  55. data/maps/by-bel-Cyrl-Latn-1998.yaml +168 -0
  56. data/maps/by-bel-Cyrl-Latn-2007.yaml +115 -0
  57. data/maps/elot-ell-Grek-Latn-743-1982-tl.yaml +685 -0
  58. data/maps/elot-ell-Grek-Latn-743-1982-ts.yaml +681 -0
  59. data/maps/elot-ell-Grek-Latn-743-2001-tl.yaml +20 -0
  60. data/maps/elot-ell-Grek-Latn-743-2001-ts.yaml +32 -0
  61. data/maps/ggg-kat-Geor-Latn-2002.yaml +89 -0
  62. data/maps/gki-bel-cyrl-latn-1992.yaml +33 -0
  63. data/maps/gki-bel-cyrl-latn-2000.yaml +201 -0
  64. data/maps/gost-rus-cyrl-latn-16876-71-1983.yaml +186 -0
  65. data/maps/hk-yue-Hani-Latn-1888.yaml +38497 -0
  66. data/maps/icao-bel-Cyrl-Latn-9303.yaml +108 -92
  67. data/maps/icao-bul-Cyrl-Latn-9303.yaml +1 -2
  68. data/maps/icao-heb-Hebr-Latn-9303.yaml +118 -124
  69. data/maps/icao-mkd-Cyrl-Latn-9303.yaml +1 -2
  70. data/maps/icao-per-Arab-Latn-9303.yaml +5 -6
  71. data/maps/icao-rus-Cyrl-Latn-9303.yaml +1 -2
  72. data/maps/icao-srp-Cyrl-Latn-9303.yaml +1 -2
  73. data/maps/icao-ukr-Cyrl-Latn-9303.yaml +1 -2
  74. data/maps/iso-ell-Grek-Latn-843-1997-t1.yaml +610 -0
  75. data/maps/iso-ell-Grek-Latn-843-1997-t2.yaml +41 -0
  76. data/maps/iso-jpn-Hrkt-Latn-3602-1989.yaml +62 -0
  77. data/maps/{iso-rus-Cyrl-Latn-iso9.yaml → iso-rus-Cyrl-Latn-9-1995.yaml} +2 -3
  78. data/maps/iso-tha-Thai-Latn-11940-1998.yaml +109 -0
  79. data/maps/kp-kor-Hang-Latn-2002.yaml +901 -0
  80. data/maps/lshk-yue-Hani-Latn-jyutping-1993.yaml +44820 -0
  81. data/maps/mext-jpn-Hrkt-Latn-1954.yaml +411 -0
  82. data/maps/moct-kor-Hang-Latn-2000.yaml +803 -0
  83. data/maps/mofa-jpn-Hrkt-Latn-1989.yaml +541 -0
  84. data/maps/nil-kor-Hang-Hang-jamo.yaml +11193 -0
  85. data/maps/odni-kat-Geor-Latn-2015.yaml +88 -0
  86. data/maps/odni-ukr-Cyrl-Latn-2015.yaml +157 -0
  87. data/maps/royin-tha-Thai-Latn-1939-generic.yaml +90 -0
  88. data/maps/royin-tha-Thai-Latn-1968.yaml +179 -0
  89. data/maps/royin-tha-Thai-Latn-1999-chained.yaml +180 -0
  90. data/maps/royin-tha-Thai-Latn-1999.yaml +76 -0
  91. data/maps/{cn-chn-Hans-Latn-pinyin.yaml → sac-zho-Hans-Latn-1979.yaml} +6 -7
  92. data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.yaml +222 -0
  93. data/maps/ua-ukr-Cyrl-Latn-1996.yaml +193 -0
  94. data/maps/un-bel-Cyrl-Latn-2007.yaml +114 -0
  95. data/maps/un-ben-Beng-Latn-2016.yaml +534 -0
  96. data/maps/un-ell-Grek-Latn-1987-tl.yaml +32 -0
  97. data/maps/un-ell-Grek-Latn-1987-ts.yaml +20 -0
  98. data/maps/un-ell-Grek-Latn-phonetic-1987.yaml +780 -0
  99. data/maps/un-mon-Mong-Latn-2013.yaml +19 -6
  100. data/maps/un-rus-Cyrl-Latn-1987.yaml +166 -0
  101. data/maps/un-ukr-cyrl-latn-1998.yaml +30 -0
  102. data/maps/var-jpn-Hrkt-Latn-hepburn-1886.yaml +406 -0
  103. data/maps/var-jpn-Hrkt-Latn-hepburn-1954.yaml +386 -0
  104. data/maps/var-kor-Hang-Latn-mr-1939.yaml +1054 -0
  105. data/maps/var-kor-Kore-Hang-2013.yaml +59754 -0
  106. data/maps/var-kor-Kore-Latn-mr-1939.yaml +37 -0
  107. data/maps/var-tha-Thai-Thai-phonemic.yaml +59 -0
  108. data/maps/var-tha-Thai-Zsym-ipa.yaml +301 -0
  109. data/maps/var-zho-Hani-Latn-1979.yaml +38908 -0
  110. data/spec/interscript/mapping_spec.rb +42 -0
  111. data/spec/interscript_spec.rb +20 -5
  112. data/spec/spec_helper.rb +3 -1
  113. metadata +149 -24
  114. data/maps/bgnpcgn-chn-Hans-Latn-pinyin.yaml +0 -7503
  115. data/maps/historic-jpn-Hrkt-Latn-hepburn.yaml +0 -336
  116. data/maps/icao-gre-Grek-Latn-9303.yaml +0 -101
  117. data/maps/mext-jpn-Hrkt-Latn-hepburn.yaml +0 -330
  118. data/maps/mext-jpn-Hrkt-Latn-kunrei.yaml +0 -308
  119. data/maps/un-jpn-Hrkt-Latn-hepburn.yaml +0 -313
  120. data/maps/un-jpn-Hrkt-Latn-kunrei.yaml +0 -354
@@ -0,0 +1,190 @@
1
+ ---
2
+ authority_id: bgnpcgn
3
+ id: 2013
4
+ language: mkd
5
+ source_script: Cyrl
6
+ destination_script: Latn
7
+ name: Macedonian Romanization, BGN/PCGN 2013 System
8
+ url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/811514/ROMANIZATION_OF_MACEDONIAN.pdf
9
+ creation_date: 2013
10
+ description: |
11
+ Macedonian was officially established as a written language in Yugoslavia during
12
+ World War II and is now the official language of North Macedonia.
13
+ This romanization system replaces the BGN/PCGN 1981 agreement and adheres
14
+ to the most widely-accepted standardization of Macedonian orthography.
15
+
16
+ notes:
17
+ - The Macedonian Cyrillic lowercase italic Д may sometimes be seen as g.
18
+ There is no specific Unicode encoding for this variant form so a comparable character
19
+ has been used here for illustrative purposes.
20
+ - The Macedonian Cyrillic lowercase italic Ѓ may sometimes be seen as ī.
21
+ There is no specific Unicode encoding for this variant form so a comparable character
22
+ has been used here for illustrative purposes.
23
+ - The Macedonian Cyrillic lowercase italic П may sometimes be seen as ū.
24
+ There is no specific Unicode encoding for this variant form so a comparable character
25
+ has been used here for illustrative purposes.
26
+ - The Macedonian Cyrillic lowercase italic Т may sometimes be seen as w̄.
27
+ There is no specific Unicode encoding for this variant form so a comparable character
28
+ has been used here for illustrative purposes.
29
+ - |
30
+ An inventory of letter-diacritic combinations, with their Unicode encoding,
31
+ in addition to the unmodified letters of the basic Roman script is:
32
+ | Ǵ (U+01F4) | ǵ (U+01F5) |
33
+ | Ž (U+017D) | ž (U+017E) |
34
+ | Dz (U+01F2)* | dz (U+01F3)* |
35
+ | Lj (U+01C8)* | lj (U+01C9)* |
36
+ | Nj (U+01CB)* | nj (U+01CC)* |
37
+ | Ḱ (U+1E30) | ḱ (U+1E31) |
38
+ | Č (U+010C) | č (U+010D) |
39
+ | Dž (U+01C5)* | dž (U+01C6)* |
40
+ | Š (U+0160) | š (U+0161) |
41
+ * Note that these characters can also be reproduced with individual letters (e.g. l+j).
42
+ - The Romanization column shows only lowercase forms but, when romanizing,
43
+ uppercase and lowercase Roman letters as appropriate should be used.
44
+
45
+ tests:
46
+ - source: Ѓенови Ливаѓе
47
+ expected: Ǵenovi Livaǵe
48
+ - source: ЛУЃЕ луѓе
49
+ expected: LUǴE luǵe
50
+ - source: ЅВЕЗДА ѕвезда Ѕвезда
51
+ expected: DZVEZDA dzvezda Dzvezda
52
+ - source: Јабежица
53
+ expected: Jabežica
54
+ - source: Љиќен и Бард
55
+ expected: Ljiḱen i Bard
56
+ - source: Ќамилов Чукар
57
+ expected: Ḱamilov Čukar
58
+ - source: Џавидин Кајнак
59
+ expected: Džavidin Kajnak
60
+ - source: Џамалџи
61
+ expected: Džamaldži
62
+ - source: Џибра Гури и Зи
63
+ expected: Džibra Guri i Zi
64
+ - source: Абазова Куќарица
65
+ expected: Abazova Kuḱarica
66
+ - source: Баба Анѓина Маала
67
+ expected: Baba Anǵina Maala
68
+ - source: Ваљановец
69
+ expected: Valjanovec
70
+ - source: Галал Једи Дереш
71
+ expected: Galal Jedi Dereš
72
+ - source: Дванаесет Клајнци
73
+ expected: Dvanaeset Klajnci
74
+ - source: Електродистрибуција Струга
75
+ expected: Elektrodistribucija Struga
76
+ - source: Железничка Станица Рајко Жинзифов
77
+ expected: Železnička Stanica Rajko Žinzifov
78
+ - source: Заедничко Речиште
79
+ expected: Zaedničko Rečište
80
+ - source: Испраена Плоча
81
+ expected: Ispraena Ploča
82
+ - source: Казнено-Поправна Установа Идризово
83
+ expected: Kazneno-Popravna Ustanova Idrizovo
84
+ - source: Лази и Зејнелит
85
+ expected: Lazi i Zejnelit
86
+ - source: Мавровско Езеро
87
+ expected: Mavrovsko Ezero
88
+ - source: Национален Парк Галичица
89
+ expected: Nacionalen Park Galičica
90
+ - source: Одморалиште Свети Стефан
91
+ expected: Odmoralište Sveti Stefan
92
+ - source: Планинарски Дом Караџица
93
+ expected: Planinarski Dom Karadžica
94
+ - source: Раса е Лисењит
95
+ expected: Rasa e Lisenjit
96
+ - source: Скочивирска Клисура
97
+ expected: Skočivirska Klisura
98
+ - source: Термо-електроцентрала Неготино
99
+ expected: Termo-elektrocentrala Negotino
100
+ - source: Узуновско Бресје
101
+ expected: Uzunovsko Bresje
102
+ - source: Фабрика Југохром
103
+ expected: Fabrika Jugohrom
104
+ - source: Хидроелектрана Сапунџица
105
+ expected: Hidroelektrana Sapundžica
106
+ - source: Цветковско Рамниште
107
+ expected: Cvetkovsko Ramnište
108
+ - source: Чалтанова Пештера
109
+ expected: Čaltanova Peštera
110
+ - source: Шкемби Вишнејц
111
+ expected: Škembi Višnejc
112
+
113
+ map:
114
+ postrules:
115
+ # DZ
116
+ - pattern: "((?<=[[:upper:]])Dz(?=[[:upper:]])?|(?<=[[:upper:]])?Dz(?=[[:upper:]]))"
117
+ result: "DZ"
118
+ #LJ
119
+ - pattern: "((?<=[[:upper:]])Lj(?=[[:upper:]])?|(?<=[[:upper:]])?Lj(?=[[:upper:]]))"
120
+ result: "LJ"
121
+ #NJ
122
+ - pattern: "((?<=[[:upper:]])Nj(?=[[:upper:]])?|(?<=[[:upper:]])?Nj(?=[[:upper:]]))"
123
+ result: "NJ"
124
+ #DŽ
125
+ - pattern: "((?<=[[:upper:]])Dž(?=[[:upper:]])?|(?<=[[:upper:]])?Dž(?=[[:upper:]]))"
126
+ result: "DŽ"
127
+
128
+ characters:
129
+ "\u0410": "A"
130
+ "\u0411": "B"
131
+ "\u0412": "V"
132
+ "\u0413": "G"
133
+ "\u0414": "D"
134
+ "\u0403": "\u01F4" # Ǵ
135
+ "\u0415": "E"
136
+ "\u0416": "\u005a\u030c" # Ž
137
+ "\u0417": "Z"
138
+ "\u0405": "Dz"
139
+ "\u0418": "I"
140
+ "\u0408": "J"
141
+ "\u041A": "K"
142
+ "\u041B": "L"
143
+ "\u0409": "Lj"
144
+ "\u041C": "M"
145
+ "\u041D": "N"
146
+ "\u040A": "Nj"
147
+ "\u041E": "O"
148
+ "\u041F": "P"
149
+ "\u0420": "R"
150
+ "\u0421": "S"
151
+ "\u0422": "T"
152
+ "\u040C": "\u004b\u0301" # Ḱ
153
+ "\u0423": "U"
154
+ "\u0424": "F"
155
+ "\u0425": "H"
156
+ "\u0426": "C"
157
+ "\u0427": "\u0043\u030c" # Č
158
+ "\u040F": "D\u007a\u030c" # Dž
159
+ "\u0428": "\u0053\u030c" # Š
160
+ "\u0430": "a"
161
+ "\u0431": "b"
162
+ "\u0432": "v"
163
+ "\u0433": "g"
164
+ "\u0434": "d"
165
+ "\u0453": "\u01F5" # ǵ
166
+ "\u0435": "e"
167
+ "\u0436": "\u007a\u030c" # ž
168
+ "\u0437": "z"
169
+ "\u0455": "dz"
170
+ "\u0438": "i"
171
+ "\u0458": "j"
172
+ "\u043A": "k"
173
+ "\u043B": "l"
174
+ "\u0459": "lj"
175
+ "\u043C": "m"
176
+ "\u043D": "n"
177
+ "\u045A": "nj"
178
+ "\u043E": "o"
179
+ "\u043F": "p"
180
+ "\u0440": "r"
181
+ "\u0441": "s"
182
+ "\u0442": "t"
183
+ "\u045C": "\u1E31" # ḱ
184
+ "\u0443": "u"
185
+ "\u0444": "f"
186
+ "\u0445": "h"
187
+ "\u0446": "c"
188
+ "\u0447": "\u0063\u030c" # č
189
+ "\u045F": "d\u007a\u030c" # dž
190
+ "\u0448": "\u0073\u030c" # š
@@ -102,69 +102,148 @@ tests:
102
102
  Число открепительных удостоверений, утраченных в окружной избирательной комиссии
103
103
 
104
104
  expected: |
105
- VYBORY DEPUTATOV GOSUDARSTVENNOY DUMY FEDERALNOGO SOBRANIYA ROSSIYSKOY FEDERATSII SEDMOGO SOZYVA
106
- DATA GOLOSOVANIYA: 18.09.2016
107
-
108
- NAIMENOVANIE IZBIRATELNOY KOMISSII: TSIK ROSSII
109
-
110
- SVODNAYA TABLITSA REZULTATOV VYBOROV PO FEDERALNOMU IZBIRATELNOMU OKRUGU
111
-
112
-
113
- CHISLO IZBIRATELEY, VNESENNYKH V SPISOK IZBIRATELEY NA MOMENT OKONCHANIYA GOLOSOVANIYA
114
- CHISLO IZBIRATELNYKH BYULLETENEY, POLUCHENNYKH UCHASTKOVOY IZBIRATELNOY KOMISSIEY
115
- CHISLO IZBIRATELNYKH BYULLETENEY, VYDANNYKH IZBIRATELYAM, PROGOLOSOVAVSHIM DOSROCHNO
116
- CHISLO IZBIRATELNYKH BYULLETENEY, VYDANNYKH V POMESHCHENII DLYA GOLOSOVANIYA V DENGOLOSOVANIYA
117
- CHISLO IZBIRATELNYKH BYULLETENEY, VYDANNYKH VNE POMESHCHENIYA DLYA GOLOSOVANIYA V DENGOLOSOVANIYA
118
- CHISLO POGASHENNYKH IZBIRATELNYKH BYULLETENEY
119
- CHISLO IZBIRATELNYKH BYULLETENEY, SODERZHASHCHIKHSYA V PERENOSNYKH YASHCHIKAKH DLYA GOLOSOVANIYA
120
- CHISLO IZBIRATELNYKH BYULLETENEY, SODERZHASHCHIKHSYA V STATSIONARNYKH YASHCHIKAKH DLYA GOLOSOVANIYA
121
- CHISLO NEDEYSTVITELNYKH IZBIRATELNYKH BYULLETENEY
122
- CHISLO DEYSTVITELNYKH IZBIRATELNYKH BYULLETENEY
123
- CHISLO OTKREPITELNYKH UDOSTOVERENIY, POLUCHENNYKH UCHASTKOVOY IZBIRATELNOY KOMISSIEY
124
- CHISLO OTKREPITELNYKH UDOSTOVERENIY, VYDANNYKH NA IZBIRATELNOM UCHASTKE DO DNYA GOLOSOVANIYA
125
- CHISLO IZBIRATELEY, PROGOLOSOVAVSHIKH PO OTKREPITELNYM UDOSTOVERENIYAM NA IZBIRATELNOM UCHASTKE
126
- CHISLO POGASHENNYKH NEISPOLZOVANNYKH OTKREPITELNYKH UDOSTOVERENIY
127
- CHISLO OTKREPITELNYKH UDOSTOVERENIY, VYDANNYKH IZBIRATELYAM TERRITORIALNOY IZBIRATELNOY KOMISSIEY
128
- CHISLO UTRACHENNYKH OTKREPITELNYKH UDOSTOVERENIY
129
- CHISLO UTRACHENNYKH IZBIRATELNYKH BYULLETENEY
130
- CHISLO IZBIRATELNYKH BYULLETENEY, NE UCHTENNYKH PRI POLUCHENII
105
+ Vybory deputatov Gosudarstvennoy Dumy Federalnogo Sobraniya Rossiyskoy Federatsii sedmogo sozyva
106
+ Data golosovaniya: 18.09.2016
107
+
108
+ Naimenovaniye Izbiratelnoy komissii: TSIK Rossii
109
+
110
+ Svodnaya tablitsa rezultatov vyborov po federalnomu izbiratelnomu okrugu
111
+
112
+
113
+ Chislo izbirateley, vnesennykh v spisok izbirateley na moment okonchaniya golosovaniya
114
+ Chislo izbiratelnykh byulleteney, poluchennykh uchastkovoy izbiratelnoy komissiyey
115
+ Chislo izbiratelnykh byulleteney, vydannykh izbiratelyam, progolosovavshim dosrochno
116
+ Chislo izbiratelnykh byulleteney, vydannykh v pomeshchenii dlya golosovaniya v dengolosovaniya
117
+ Chislo izbiratelnykh byulleteney, vydannykh vne pomeshcheniya dlya golosovaniya v dengolosovaniya
118
+ Chislo pogashennykh izbiratelnykh byulleteney
119
+ Chislo izbiratelnykh byulleteney, soderzhashchikhsya v perenosnykh yashchikakh dlya golosovaniya
120
+ Chislo izbiratelnykh byulleteney, soderzhashchikhsya v statsionarnykh yashchikakh dlya golosovaniya
121
+ Chislo nedeystvitelnykh izbiratelnykh byulleteney
122
+ Chislo deystvitelnykh izbiratelnykh byulleteney
123
+ Chislo otkrepitelnykh udostovereniy, poluchennykh uchastkovoy izbiratelnoy komissiyey
124
+ Chislo otkrepitelnykh udostovereniy, vydannykh na izbiratelnom uchastke do dnya golosovaniya
125
+ Chislo izbirateley, progolosovavshikh po otkrepitelnym udostovereniyam na izbiratelnom uchastke
126
+ Chislo pogashennykh neispolzovannykh otkrepitelnykh udostovereniy
127
+ Chislo otkrepitelnykh udostovereniy, vydannykh izbiratelyam territorialnoy izbiratelnoy komissiyey
128
+ Chislo utrachennykh otkrepitelnykh udostovereniy
129
+ Chislo utrachennykh izbiratelnykh byulleteney
130
+ Chislo izbiratelnykh byulleteney, ne uchtennykh pri poluchenii
131
131
  1. VSEROSSIYSKAYA POLITICHESKAYA PARTIYA "RODINA"
132
- 2. POLITICHESKAYA PARTIYA KOMMUNISTICHESKAYA PARTIYA KOMMUNISTY ROSSII
133
- 3. POLITICHESKAYA PARTIYA "ROSSIYSKAYA PARTIYA PENSIONEROV ZA SPRAVEDLIVOST’"
134
- 4. VSEROSSIYSKAYA POLITICHESKAYA PARTIYA "EDINAYA ROSSIYA"
135
- 5. POLITICHESKAYA PARTIYA "ROSSIYSKAYA EKOLOGICHESKAYA PARTIYA "ZELENYE"
136
- 6. POLITICHESKAYA PARTIYA "GRAZHDANSKAYA PLATFORMA"
137
- 7. POLITICHESKAYA PARTIYA LDPR - LIBERALNO-DEMOKRATICHESKAYA PARTIYA ROSSII
138
- 8. POLITICHESKAYA PARTIYA "PARTIYA NARODNOY SVOBODY" (PARNAS)
139
- 9. VSEROSSIYSKAYA POLITICHESKAYA PARTIYA "PARTIYA ROSTA"
140
- 10. OBSHCHESTVENNAYA ORGANIZATSIYA VSEROSSIYSKAYA POLITICHESKAYA PARTIYA "GRAZHDANSKAYA SILA"
141
- 11. POLITICHESKAYA PARTIYA "ROSSIYSKAYA OBEDINENNAYA DEMOKRATICHESKAYA PARTIYA ""YABLOKO"""
142
- 12. POLITICHESKAYA PARTIYA "KOMMUNISTICHESKAYA PARTIYA ROSSIYSKOY FEDERATSII"
143
- 13. POLITICHESKAYA PARTIYA "PATRIOTY ROSSII"
144
- 14. POLITICHESKAYA PARTIYA SPRAVEDLIVAYA ROSSIYA
145
-
146
- DANNYYE OKRUZHNYKH IZBIRATYELNYKH KOMISSIY O CHISLYE OTKRYEPITYELNYKH UDOSTOVYERYENIY
147
-
148
-
149
- CHISLO OTKREPITELNYKH UDOSTOVERENIY, POLUCHENNYKH OKRUZHNOY IZBIRATELNOY KOMISSIEY
150
- CHISLO OTKREPITELNYKH UDOSTOVERENIY, VYDANNYKH TERRITORIALNYM IZBIRATELNYM KOMISSIYAM
151
- CHISLO NEISPOLZOVANNYKH OTKREPITELNYKH UDOSTOVERENIY, POGASHENNYKH OKRUZHNOY IZBIRATELNOY KOMISSIEY
152
- CHISLO OTKREPITELNYKH UDOSTOVERENIY, UTRACHENNYKH V OKRUZHNOY IZBIRATELNOY KOMISSII
132
+ 2. Politicheskaya partiya KOMMUNISTICHESKAYA PARTIYA KOMMUNISTY ROSSII
133
+ 3. Politicheskaya partiya "Rossiyskaya partiya pensionerov za spravedlivost’"
134
+ 4. Vserossiyskaya politicheskaya partiya "YEDINAYA ROSSIYA"
135
+ 5. Politicheskaya partiya "Rossiyskaya ekologicheskaya partiya "Zelenyye"
136
+ 6. Politicheskaya partiya "Grazhdanskaya Platforma"
137
+ 7. Politicheskaya partiya LDPR - Liberalno-demokraticheskaya partiya Rossii
138
+ 8. Politicheskaya partiya "Partiya narodnoy svobody" (PARNAS)
139
+ 9. Vserossiyskaya politicheskaya partiya "PARTIYA ROSTA"
140
+ 10. Obshchestvennaya organizatsiya Vserossiyskaya politicheskaya partiya "Grazhdanskaya Sila"
141
+ 11. Politicheskaya partiya "Rossiyskaya ob"yedinennaya demokraticheskaya partiya "YABLOKO"
142
+ 12. Politicheskaya partiya "KOMMUNISTICHESKAYA PARTIYA ROSSIYSKOY FEDERATSII"
143
+ 13. Politicheskaya partiya "PATRIOTY ROSSII"
144
+ 14. Politicheskaya partiya SPRAVEDLIVAYA ROSSIYA
145
+
146
+ Dannyye okruzhnykh izbiratelnykh komissiy o chisle otkrepitelnykh udostovereniy
147
+
148
+
149
+ Chislo otkrepitelnykh udostovereniy, poluchennykh okruzhnoy izbiratelnoy komissiyey
150
+ Chislo otkrepitelnykh udostovereniy, vydannykh territorialnym izbiratelnym komissiyam
151
+ Chislo neispolzovannykh otkrepitelnykh udostovereniy, pogashennykh okruzhnoy izbiratelnoy komissiyey
152
+ Chislo otkrepitelnykh udostovereniy, utrachennykh v okruzhnoy izbiratelnoy komissii
153
+ - source: ДЛИННОЕ ПОКРЫВАЛО
154
+ expected: DLINNOYE POKRYVALO
155
+ - source: Еловая шишка
156
+ expected: Yelovaya shishka
157
+ - source: ЕЛОВАЯ ШИШКА
158
+ expected: YELOVAYA SHISHKA
159
+ - source: Длинное покрывало
160
+ expected: Dlinnoye pokryvalo
161
+ - source: В лесу еловые шишки
162
+ expected: V lesu yelovyye shishki
163
+ - source: OН ВИДЕЛ ЕЁ В ПЕРВЫЙ РАЗ
164
+ expected: ON VIDEL YEYË V PERVYY RAZ
165
+ - source: Ёж колючий
166
+ expected: Yëzh kolyuchiy
167
+ - source: ЁЖ КОЛЮЧИЙ
168
+ expected: YËZH KOLYUCHIY
169
+ - source: Он видел её в первый раз
170
+ expected: On videl yeyë v pervyy raz
171
+ - source: У ёжа колючки
172
+ expected: U yëzha kolyuchki
173
+ - source: ЙА Йа йа
174
+ expected: Y·A Y·a y·a
175
+ - source: ЫУ Ыу ыу
176
+ expected: Y·U Y·u y·u
177
+ - source: ОЫ Оы оы
178
+ expected: O·Y O·y o·y
179
+ - source: ОЫУ Оыу оыу
180
+ expected: O·Y·U O·y·u o·y·u
181
+ - source: СЭ Сэ сэ
182
+ expected: S·E S·e s·e
183
+ - source: ТС тс Тс тС
184
+ expected: T·S t·s T·s t·S
185
+ - source: ШЧ шч Шч шЧ
186
+ expected: SH·CH sh·ch Sh·ch sh·Ch
153
187
 
154
188
  map:
155
189
  rules:
156
- - pattern: ([ЄФІЦАаЕеИиЙйОоУуЫыЮюЯяії])\u0415
157
- result: "\\1YE"
158
- - pattern: \b\u0415
159
- result: YE
160
- - pattern: ([йьъ])\u0415
161
- result: "\\1YE"
162
- - pattern: ([ЄФІЦАаЕеИиЙйОоУуЫыЮюЯяії])\u0435
163
- result: "\\1ye"
164
- - pattern: \b\u0435
165
- result: ye
166
- - pattern: ([йьъ])\u0435
167
- result: "\\1ye"
190
+ - pattern: (?<=[АаЕеЁёИиОоУуЫыЭэЮюЯяЙйЪъЬь])\u0401 # Ё after a, e, ё, и, о, у, ы, э, ю, я, й, ъ, ь
191
+ result: "Y\u00eb"
192
+ - pattern: (?<=[АаЕеЁёИиОоУуЫыЭэЮюЯяЙйЪъЬь])\u0451 # ё after a, e, ё, и, о, у, ы, э, ю, я, й, ъ, ь
193
+ result: "y\u00eb"
194
+ - pattern: (?<=[АаЕеЁёИиОоУуЫыЭэЮюЯяЙйЪъЬь])\u0415 # Е after a, e, ё, и, о, у, ы, э, ю, я, й, ъ, ь
195
+ result: "Y\u0415"
196
+ - pattern: \b\u0415 # Е initially
197
+ result: "Y\u0435"
198
+ - pattern: (?<=[АаЕеЁёИиОоУуЫыЭэЮюЯяЙйЪъЬь])\u0435 # е after a, e, ё, и, о, у, ы, э, ю, я, й, ъ, ь
199
+ result: "y\u0435"
200
+ - pattern: \b\u0435 # е initially
201
+ result: "y\u0435"
202
+ - pattern: (?<=[АаЕеЁёИиОоУуЫыЭэЮюЯяЙйЪъЬь])\u0401 # Ё after a, e, ё, и, о, у, ы, э, ю, я, й, ъ, ь
203
+ result: "Y\u00eb"
204
+ - pattern: \b\u0401
205
+ result: "Y\u00eb"
206
+ - pattern: (?<=[АаЕеЁёИиОоУуЫыЭэЮюЯяЙйЪъЬь])\u0451 # ё after a, e, ё, и, о, у, ы, э, ю, я, й, ъ, ь
207
+ result: "y\u00eb"
208
+ - pattern: \b\u0451
209
+ result: "y\u00eb"
210
+ - pattern: \u0419(?=[АаУуЫыЭэ]) # Й before а, у, ы, or э
211
+ result: "Y\u00b7"
212
+ - pattern: \u0439(?=[АаУуЫыЭэ]) # й before а, у, ы, or э
213
+ result: "y\u00b7"
214
+ - pattern: (?<=[АаЕеЁёИиОоУуЫыЭэЮюЯя])\u042b(?=[АаУуЫыЭэ]) # Ы after any vowel character and before а, у, ы, or э
215
+ result: "\u00b7Y\u00b7"
216
+ - pattern: (?<=[АаЕеЁёИиОоУуЫыЭэЮюЯя])\u044b(?=[АаУуЫыЭэ]) # ы after any vowel character and before а, у, ы, or э
217
+ result: "\u00b7y\u00b7"
218
+ - pattern: \u042b(?=[АаУуЫыЭэ]) # Ы before а, у, ы, or э
219
+ result: "Ы\u00b7"
220
+ - pattern: \u044b(?=[АаУуЫыЭэ]) # ы before а, у, ы, or э
221
+ result: "ы\u00b7"
222
+ - pattern: (?<=[Оо])\u042b # Ы after о
223
+ result: "\u00b7Y"
224
+ - pattern: (?<=[Оо])\u044b # ы after о
225
+ result: "\u00b7y"
226
+ - pattern: \b\u0401
227
+ result: "Y\u00eb"
228
+ - pattern: \b\u0451
229
+ result: "y\u00eb"
230
+ - pattern: (?<=[БбВвГгДдЖжЗзКкЛлМмНнПпРрСсТтФфХхЦцЧчШшЩщ])\u042d # Э after any consonant character except й
231
+ result: "\u00b7E"
232
+ - pattern: (?<=[БбВвГгДдЖжЗзКкЛлМмНнПпРрСсТтФфХхЦцЧчШшЩщ])\u044d # э after any consonant character except й
233
+ result: "\u00b7e"
234
+ - pattern: (Т|т)(С|с) # тс => t·s
235
+ result: "\\1\u00b7\\2"
236
+ - pattern: (Ш|ш)(Ч|ч) # шч => sh·ch
237
+ result: "\\1\u00b7\\2"
238
+
239
+ postrules:
240
+
241
+ #YE
242
+ - pattern: "((?<=[[:upper:]])Ye(?=[[:upper:]])?|(?<=[[:upper:]])?Ye(?=[[:upper:]]))"
243
+ result: "YE"
244
+ #YË
245
+ - pattern: "((?<=[[:upper:]])Yë(?=[[:upper:]])?|(?<=[[:upper:]])?Yë(?=[[:upper:]]))"
246
+ result: "YË"
168
247
 
169
248
  characters:
170
249
  "\u0410": "A"
@@ -173,7 +252,7 @@ map:
173
252
  "\u0413": "G"
174
253
  "\u0414": "D"
175
254
  "\u0415": "E"
176
- "\u0435": "e"
255
+ "\u0401": "\u00cb" # Ё
177
256
  "\u0416": "Zh"
178
257
  "\u0417": "Z"
179
258
  "\u0418": "I"
@@ -194,9 +273,9 @@ map:
194
273
  "\u0427": "Ch"
195
274
  "\u0428": "Sh"
196
275
  "\u0429": "Shch"
197
- "\u042a": "\""
276
+ "\u042a": "\"" # Ъ
198
277
  "\u042b": "Y"
199
- "\u042c": "\u2019"
278
+ "\u042c": "\u2019" # Ь => ’
200
279
  "\u042d": "E"
201
280
  "\u042e": "Yu"
202
281
  "\u042f": "Ya"
@@ -205,6 +284,8 @@ map:
205
284
  "\u0432": "v"
206
285
  "\u0433": "g"
207
286
  "\u0434": "d"
287
+ "\u0435": "e"
288
+ "\u0451": "\u00eb" # ё
208
289
  "\u0436": "zh"
209
290
  "\u0437": "z"
210
291
  "\u0438": "i"
@@ -225,9 +306,9 @@ map:
225
306
  "\u0447": "ch"
226
307
  "\u0448": "sh"
227
308
  "\u0449": "shch"
228
- "\u044a": "\""
309
+ "\u044a": "\"" # ъ
229
310
  "\u044b": "y"
230
- "\u044c": "\u2019"
311
+ "\u044c": "\u2019" # ь => ’
231
312
  "\u044d": "e"
232
313
  "\u044e": "yu"
233
314
  "\u044f": "ya"
@@ -0,0 +1,166 @@
1
+ ---
2
+ authority_id: bgnpcgn
3
+ id: 2005
4
+ language: srp
5
+ source_script: Cyrl
6
+ destination_script: Latn
7
+ name: ROMANIZATION OF SERBIAN, BGN/PCGN 2005 System
8
+ url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/816783/TABLE_OF_CORRESPONDENCES_FOR_SERBIAN.pdf
9
+ creation_date: 2005
10
+ confirmation_date: 2019-06
11
+ description: |
12
+ The tabulation below reflects the Serbian Cyrillic alphabet and the standard Roman script equivalents
13
+ used in both Serbia and Montenegro.
14
+
15
+ notes:
16
+ - The Serbian Cyrillic lowercase italic Д may sometimes be seen as g.
17
+ There is no specific Unicode encoding for this variant form so a comparable character
18
+ has been used here for illustrative purposes.
19
+
20
+ - The digraph dj(Dj) will occasionally be found as an alternative form of đ(Đ).
21
+
22
+ - The Serbian Cyrillic lowercase italic П may sometimes be seen as ӣ.
23
+ There is no specific Unicode encoding for this variant form so a comparable character
24
+ has been used here for illustrative purposes.
25
+
26
+ - The Serbian Cyrillic lowercase italic Т may sometimes be seen as w.
27
+ There is no specific Unicode encoding for this variant form so a comparable character
28
+ has been used here for illustrative purposes.
29
+
30
+ - |
31
+ An inventory of letter-diacritic combinations, with their Unicode encoding,
32
+ in addition to the unmodified letters of the basic Roman script is:
33
+ | Đ (U+0110) | đ (U+0111) |
34
+ | Ž (U+017D) | ž (U+017E) |
35
+ | Lj (U+01C8)* | lj (U+01C9)* |
36
+ | Ć (U+0106) | ć (U+0107) |
37
+ | Dž (U+01C5)* | dž (U+01C6)* |
38
+ | Š (U+0160) | š (U+0161) |
39
+ * Note that these characters can also be reproduced with individual letters (e.g. l+j).
40
+
41
+ - The Roman-script columns show only lowercase forms but, when applying the table,
42
+ uppercase and lowercase Roman letters as appropriate should be used.
43
+
44
+ tests:
45
+ - source: Шупља Стена
46
+ expected: Šuplja Stena
47
+ - source: Чукарица
48
+ expected: Čukarica
49
+ - source: Црна Трава
50
+ expected: Crna Trava
51
+ - source: Херцег Нови
52
+ expected: Herceg Novi
53
+ - source: Улцињ
54
+ expected: Ulcinj
55
+ - source: Ужице
56
+ expected: Užice
57
+ - source: Тресаначка Река
58
+ expected: Tresanačka Reka
59
+ - source: Сјеница
60
+ expected: Sjenica
61
+ - source: Рожаје
62
+ expected: Rožaje
63
+ - source: Пљевља
64
+ expected: Pljevlja
65
+ - source: Оџаци
66
+ expected: Odžaci
67
+ - source: Никшић
68
+ expected: Nikšić
69
+ - source: Медвеђа
70
+ expected: Medveđa
71
+ - source: Лозница
72
+ expected: Loznica
73
+ - source: Књажевац
74
+ expected: Knjaževac
75
+ - source: Зрењанин
76
+ expected: Zrenjanin
77
+ - source: Житорађа
78
+ expected: Žitorađa
79
+ - source: Ервеник
80
+ expected: Ervenik
81
+ - source: Доње Љупче
82
+ expected: Donje Ljupče
83
+ - source: Гусиње
84
+ expected: Gusinje
85
+ - source: ГУСИЊЕ
86
+ expected: GUSINJE
87
+ - source: Врњачка Бања
88
+ expected: Vrnjačka Banja
89
+ - source: Бијело Поље
90
+ expected: Bijelo Polje
91
+ - source: Алибунар
92
+ expected: Alibunar
93
+
94
+ map:
95
+ postrules:
96
+ #LJ
97
+ - pattern: "((?<=[[:upper:]])Lj(?=[[:upper:]])?|(?<=[[:upper:]])?Lj(?=[[:upper:]]))"
98
+ result: "LJ"
99
+ #NJ
100
+ - pattern: "((?<=[[:upper:]])Nj(?=[[:upper:]])?|(?<=[[:upper:]])?Nj(?=[[:upper:]]))"
101
+ result: "NJ"
102
+ #DŽ
103
+ - pattern: "((?<=[[:upper:]])Dž(?=[[:upper:]])?|(?<=[[:upper:]])?Dž(?=[[:upper:]]))"
104
+ result: "DŽ"
105
+
106
+ characters:
107
+ "\u0410": "A"
108
+ "\u0411": "B"
109
+ "\u0412": "V"
110
+ "\u0413": "G"
111
+ "\u0414": "D"
112
+ "\u0402": "\u0110" # Đ
113
+ "\u0415": "E"
114
+ "\u0416": "\u005a\u030c" # Ž
115
+ "\u0417": "Z"
116
+ "\u0418": "I"
117
+ "\u0408": "J"
118
+ "\u041A": "K"
119
+ "\u041B": "L"
120
+ "\u0409": "Lj"
121
+ "\u041C": "M"
122
+ "\u041D": "N"
123
+ "\u040A": "Nj"
124
+ "\u041E": "O"
125
+ "\u041F": "P"
126
+ "\u0420": "R"
127
+ "\u0421": "S"
128
+ "\u0422": "T"
129
+ "\u040B": "\u0043\u0301" # Ć
130
+ "\u0423": "U"
131
+ "\u0424": "F"
132
+ "\u0425": "H"
133
+ "\u0426": "C"
134
+ "\u0427": "\u0043\u030c" # Č
135
+ "\u040F": "D\u007a\u030c" # Dž
136
+ "\u0428": "\u0053\u030c" # Š
137
+ "\u0430": "a"
138
+ "\u0431": "b"
139
+ "\u0432": "v"
140
+ "\u0433": "g"
141
+ "\u0434": "d"
142
+ "\u0452": "\u0111" # đ
143
+ "\u0435": "e"
144
+ "\u0436": "\u007a\u030c" # ž
145
+ "\u0437": "z"
146
+ "\u0438": "i"
147
+ "\u0458": "j"
148
+ "\u043A": "k"
149
+ "\u043B": "l"
150
+ "\u0459": "lj"
151
+ "\u043C": "m"
152
+ "\u043D": "n"
153
+ "\u045A": "nj"
154
+ "\u043E": "o"
155
+ "\u043F": "p"
156
+ "\u0440": "r"
157
+ "\u0441": "s"
158
+ "\u0442": "t"
159
+ "\u045B": "\u0063\u0301" # ć
160
+ "\u0443": "u"
161
+ "\u0444": "f"
162
+ "\u0445": "h"
163
+ "\u0446": "c"
164
+ "\u0447": "\u0063\u030c" # č
165
+ "\u045F": "d\u007a\u030c" # dž
166
+ "\u0448": "\u0073\u030c" # š