interscript 0.1.2 → 0.1.3

Sign up to get free protection for your applications and to get access to all the features.
Files changed (120) hide show
  1. checksums.yaml +4 -4
  2. data/README.adoc +246 -14
  3. data/bin/interscript +38 -17
  4. data/bin/setup +8 -0
  5. data/lib/g2pwrapper.py +34 -0
  6. data/lib/interscript.rb +140 -16
  7. data/lib/interscript/command.rb +27 -0
  8. data/lib/interscript/mapping.rb +125 -0
  9. data/lib/interscript/version.rb +1 -1
  10. data/lib/model-7 +0 -0
  11. data/lib/tha-pt-b-7 +0 -0
  12. data/maps/acadsin-zho-Hani-Latn-2002.yaml +38912 -0
  13. data/maps/alalc-bel-cyrl-latn-1997.yaml +125 -0
  14. data/maps/alalc-ben-Beng-Latn-2017.yaml +130 -0
  15. data/maps/alalc-bul-Cyrl-Latn-1997.yaml +94 -0
  16. data/maps/alalc-ell-Grek-Latn-1997.yaml +625 -0
  17. data/maps/alalc-ell-Grek-Latn-2010.yaml +628 -0
  18. data/maps/alalc-kat-Geok-Latn-1997.yaml +112 -0
  19. data/maps/alalc-kat-Geor-Latn-1997.yaml +146 -0
  20. data/maps/alalc-kor-Hang-Latn-1997.yaml +94 -0
  21. data/maps/alalc-mkd-Cyrl-Latn-2013.yaml +103 -0
  22. data/maps/alalc-mkd-cyrl-latn-1997.yaml +114 -0
  23. data/maps/alalc-srp-Cyrl-Latn-1997.yaml +114 -0
  24. data/maps/alalc-srp-cyrl-latn-2013.yaml +135 -0
  25. data/maps/alalc-ukr-Cyrl-Latn-1997.yaml +141 -0
  26. data/maps/alalc-ukr-Cyrl-Latn-2011.yaml +16 -0
  27. data/maps/apcbg-bul-Cyrl-Latn-1995.yaml +283 -0
  28. data/maps/{bas-rus-Cyrl-Latn-bss.yaml → bas-rus-Cyrl-Latn-2017-bss.yaml} +57 -31
  29. data/maps/{bas-rus-Cyrl-Latn-oss.yaml → bas-rus-Cyrl-Latn-2017-oss.yaml} +54 -34
  30. data/maps/bgn-jpn-Hrkt-Latn-1962.yaml +294 -0
  31. data/maps/bgn-kor-Hang-Latn-1943.yaml +31 -0
  32. data/maps/bgn-kor-Kore-Latn-1943.yaml +31 -0
  33. data/maps/bgna-bul-Cyrl-Latn-2006.yaml +208 -0
  34. data/maps/bgna-bul-Cyrl-Latn-2009.yaml +208 -0
  35. data/maps/bgnpcgn-arm-Armn-Latn-1981.yaml +1 -2
  36. data/maps/bgnpcgn-aze-Cyrl-Latn-1993.yaml +104 -0
  37. data/maps/bgnpcgn-bel-cyrl-latn-1979.yaml +285 -0
  38. data/maps/bgnpcgn-bul-Cyrl-Latn-1952.yaml +115 -0
  39. data/maps/bgnpcgn-bul-Cyrl-Latn-2013.yaml +10 -64
  40. data/maps/bgnpcgn-chn-Hans-Latn-1979.yaml +7456 -0
  41. data/maps/bgnpcgn-ell-Grek-Latn-1962.yaml +702 -0
  42. data/maps/bgnpcgn-ell-Grek-Latn-1996.yaml +20 -0
  43. data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.yaml +257 -0
  44. data/maps/bgnpcgn-kat-Geor-Latn-1981.yaml +127 -0
  45. data/maps/bgnpcgn-kat-Geor-Latn-2009.yaml +43 -0
  46. data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.yaml +253 -0
  47. data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.yaml +48 -0
  48. data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.yaml +48 -0
  49. data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.yaml +159 -0
  50. data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.yaml +190 -0
  51. data/maps/bgnpcgn-rus-Cyrl-Latn-1947.yaml +145 -64
  52. data/maps/bgnpcgn-srp-Cyrl-Latn-2005.yaml +166 -0
  53. data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.yaml +75 -2
  54. data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.yaml +208 -0
  55. data/maps/by-bel-Cyrl-Latn-1998.yaml +168 -0
  56. data/maps/by-bel-Cyrl-Latn-2007.yaml +115 -0
  57. data/maps/elot-ell-Grek-Latn-743-1982-tl.yaml +685 -0
  58. data/maps/elot-ell-Grek-Latn-743-1982-ts.yaml +681 -0
  59. data/maps/elot-ell-Grek-Latn-743-2001-tl.yaml +20 -0
  60. data/maps/elot-ell-Grek-Latn-743-2001-ts.yaml +32 -0
  61. data/maps/ggg-kat-Geor-Latn-2002.yaml +89 -0
  62. data/maps/gki-bel-cyrl-latn-1992.yaml +33 -0
  63. data/maps/gki-bel-cyrl-latn-2000.yaml +201 -0
  64. data/maps/gost-rus-cyrl-latn-16876-71-1983.yaml +186 -0
  65. data/maps/hk-yue-Hani-Latn-1888.yaml +38497 -0
  66. data/maps/icao-bel-Cyrl-Latn-9303.yaml +108 -92
  67. data/maps/icao-bul-Cyrl-Latn-9303.yaml +1 -2
  68. data/maps/icao-heb-Hebr-Latn-9303.yaml +118 -124
  69. data/maps/icao-mkd-Cyrl-Latn-9303.yaml +1 -2
  70. data/maps/icao-per-Arab-Latn-9303.yaml +5 -6
  71. data/maps/icao-rus-Cyrl-Latn-9303.yaml +1 -2
  72. data/maps/icao-srp-Cyrl-Latn-9303.yaml +1 -2
  73. data/maps/icao-ukr-Cyrl-Latn-9303.yaml +1 -2
  74. data/maps/iso-ell-Grek-Latn-843-1997-t1.yaml +610 -0
  75. data/maps/iso-ell-Grek-Latn-843-1997-t2.yaml +41 -0
  76. data/maps/iso-jpn-Hrkt-Latn-3602-1989.yaml +62 -0
  77. data/maps/{iso-rus-Cyrl-Latn-iso9.yaml → iso-rus-Cyrl-Latn-9-1995.yaml} +2 -3
  78. data/maps/iso-tha-Thai-Latn-11940-1998.yaml +109 -0
  79. data/maps/kp-kor-Hang-Latn-2002.yaml +901 -0
  80. data/maps/lshk-yue-Hani-Latn-jyutping-1993.yaml +44820 -0
  81. data/maps/mext-jpn-Hrkt-Latn-1954.yaml +411 -0
  82. data/maps/moct-kor-Hang-Latn-2000.yaml +803 -0
  83. data/maps/mofa-jpn-Hrkt-Latn-1989.yaml +541 -0
  84. data/maps/nil-kor-Hang-Hang-jamo.yaml +11193 -0
  85. data/maps/odni-kat-Geor-Latn-2015.yaml +88 -0
  86. data/maps/odni-ukr-Cyrl-Latn-2015.yaml +157 -0
  87. data/maps/royin-tha-Thai-Latn-1939-generic.yaml +90 -0
  88. data/maps/royin-tha-Thai-Latn-1968.yaml +179 -0
  89. data/maps/royin-tha-Thai-Latn-1999-chained.yaml +180 -0
  90. data/maps/royin-tha-Thai-Latn-1999.yaml +76 -0
  91. data/maps/{cn-chn-Hans-Latn-pinyin.yaml → sac-zho-Hans-Latn-1979.yaml} +6 -7
  92. data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.yaml +222 -0
  93. data/maps/ua-ukr-Cyrl-Latn-1996.yaml +193 -0
  94. data/maps/un-bel-Cyrl-Latn-2007.yaml +114 -0
  95. data/maps/un-ben-Beng-Latn-2016.yaml +534 -0
  96. data/maps/un-ell-Grek-Latn-1987-tl.yaml +32 -0
  97. data/maps/un-ell-Grek-Latn-1987-ts.yaml +20 -0
  98. data/maps/un-ell-Grek-Latn-phonetic-1987.yaml +780 -0
  99. data/maps/un-mon-Mong-Latn-2013.yaml +19 -6
  100. data/maps/un-rus-Cyrl-Latn-1987.yaml +166 -0
  101. data/maps/un-ukr-cyrl-latn-1998.yaml +30 -0
  102. data/maps/var-jpn-Hrkt-Latn-hepburn-1886.yaml +406 -0
  103. data/maps/var-jpn-Hrkt-Latn-hepburn-1954.yaml +386 -0
  104. data/maps/var-kor-Hang-Latn-mr-1939.yaml +1054 -0
  105. data/maps/var-kor-Kore-Hang-2013.yaml +59754 -0
  106. data/maps/var-kor-Kore-Latn-mr-1939.yaml +37 -0
  107. data/maps/var-tha-Thai-Thai-phonemic.yaml +59 -0
  108. data/maps/var-tha-Thai-Zsym-ipa.yaml +301 -0
  109. data/maps/var-zho-Hani-Latn-1979.yaml +38908 -0
  110. data/spec/interscript/mapping_spec.rb +42 -0
  111. data/spec/interscript_spec.rb +20 -5
  112. data/spec/spec_helper.rb +3 -1
  113. metadata +149 -24
  114. data/maps/bgnpcgn-chn-Hans-Latn-pinyin.yaml +0 -7503
  115. data/maps/historic-jpn-Hrkt-Latn-hepburn.yaml +0 -336
  116. data/maps/icao-gre-Grek-Latn-9303.yaml +0 -101
  117. data/maps/mext-jpn-Hrkt-Latn-hepburn.yaml +0 -330
  118. data/maps/mext-jpn-Hrkt-Latn-kunrei.yaml +0 -308
  119. data/maps/un-jpn-Hrkt-Latn-hepburn.yaml +0 -313
  120. data/maps/un-jpn-Hrkt-Latn-kunrei.yaml +0 -354
@@ -0,0 +1,190 @@
1
+ ---
2
+ authority_id: bgnpcgn
3
+ id: 2013
4
+ language: mkd
5
+ source_script: Cyrl
6
+ destination_script: Latn
7
+ name: Macedonian Romanization, BGN/PCGN 2013 System
8
+ url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/811514/ROMANIZATION_OF_MACEDONIAN.pdf
9
+ creation_date: 2013
10
+ description: |
11
+ Macedonian was officially established as a written language in Yugoslavia during
12
+ World War II and is now the official language of North Macedonia.
13
+ This romanization system replaces the BGN/PCGN 1981 agreement and adheres
14
+ to the most widely-accepted standardization of Macedonian orthography.
15
+
16
+ notes:
17
+ - The Macedonian Cyrillic lowercase italic Д may sometimes be seen as g.
18
+ There is no specific Unicode encoding for this variant form so a comparable character
19
+ has been used here for illustrative purposes.
20
+ - The Macedonian Cyrillic lowercase italic Ѓ may sometimes be seen as ī.
21
+ There is no specific Unicode encoding for this variant form so a comparable character
22
+ has been used here for illustrative purposes.
23
+ - The Macedonian Cyrillic lowercase italic П may sometimes be seen as ū.
24
+ There is no specific Unicode encoding for this variant form so a comparable character
25
+ has been used here for illustrative purposes.
26
+ - The Macedonian Cyrillic lowercase italic Т may sometimes be seen as w̄.
27
+ There is no specific Unicode encoding for this variant form so a comparable character
28
+ has been used here for illustrative purposes.
29
+ - |
30
+ An inventory of letter-diacritic combinations, with their Unicode encoding,
31
+ in addition to the unmodified letters of the basic Roman script is:
32
+ | Ǵ (U+01F4) | ǵ (U+01F5) |
33
+ | Ž (U+017D) | ž (U+017E) |
34
+ | Dz (U+01F2)* | dz (U+01F3)* |
35
+ | Lj (U+01C8)* | lj (U+01C9)* |
36
+ | Nj (U+01CB)* | nj (U+01CC)* |
37
+ | Ḱ (U+1E30) | ḱ (U+1E31) |
38
+ | Č (U+010C) | č (U+010D) |
39
+ | Dž (U+01C5)* | dž (U+01C6)* |
40
+ | Š (U+0160) | š (U+0161) |
41
+ * Note that these characters can also be reproduced with individual letters (e.g. l+j).
42
+ - The Romanization column shows only lowercase forms but, when romanizing,
43
+ uppercase and lowercase Roman letters as appropriate should be used.
44
+
45
+ tests:
46
+ - source: Ѓенови Ливаѓе
47
+ expected: Ǵenovi Livaǵe
48
+ - source: ЛУЃЕ луѓе
49
+ expected: LUǴE luǵe
50
+ - source: ЅВЕЗДА ѕвезда Ѕвезда
51
+ expected: DZVEZDA dzvezda Dzvezda
52
+ - source: Јабежица
53
+ expected: Jabežica
54
+ - source: Љиќен и Бард
55
+ expected: Ljiḱen i Bard
56
+ - source: Ќамилов Чукар
57
+ expected: Ḱamilov Čukar
58
+ - source: Џавидин Кајнак
59
+ expected: Džavidin Kajnak
60
+ - source: Џамалџи
61
+ expected: Džamaldži
62
+ - source: Џибра Гури и Зи
63
+ expected: Džibra Guri i Zi
64
+ - source: Абазова Куќарица
65
+ expected: Abazova Kuḱarica
66
+ - source: Баба Анѓина Маала
67
+ expected: Baba Anǵina Maala
68
+ - source: Ваљановец
69
+ expected: Valjanovec
70
+ - source: Галал Једи Дереш
71
+ expected: Galal Jedi Dereš
72
+ - source: Дванаесет Клајнци
73
+ expected: Dvanaeset Klajnci
74
+ - source: Електродистрибуција Струга
75
+ expected: Elektrodistribucija Struga
76
+ - source: Железничка Станица Рајко Жинзифов
77
+ expected: Železnička Stanica Rajko Žinzifov
78
+ - source: Заедничко Речиште
79
+ expected: Zaedničko Rečište
80
+ - source: Испраена Плоча
81
+ expected: Ispraena Ploča
82
+ - source: Казнено-Поправна Установа Идризово
83
+ expected: Kazneno-Popravna Ustanova Idrizovo
84
+ - source: Лази и Зејнелит
85
+ expected: Lazi i Zejnelit
86
+ - source: Мавровско Езеро
87
+ expected: Mavrovsko Ezero
88
+ - source: Национален Парк Галичица
89
+ expected: Nacionalen Park Galičica
90
+ - source: Одморалиште Свети Стефан
91
+ expected: Odmoralište Sveti Stefan
92
+ - source: Планинарски Дом Караџица
93
+ expected: Planinarski Dom Karadžica
94
+ - source: Раса е Лисењит
95
+ expected: Rasa e Lisenjit
96
+ - source: Скочивирска Клисура
97
+ expected: Skočivirska Klisura
98
+ - source: Термо-електроцентрала Неготино
99
+ expected: Termo-elektrocentrala Negotino
100
+ - source: Узуновско Бресје
101
+ expected: Uzunovsko Bresje
102
+ - source: Фабрика Југохром
103
+ expected: Fabrika Jugohrom
104
+ - source: Хидроелектрана Сапунџица
105
+ expected: Hidroelektrana Sapundžica
106
+ - source: Цветковско Рамниште
107
+ expected: Cvetkovsko Ramnište
108
+ - source: Чалтанова Пештера
109
+ expected: Čaltanova Peštera
110
+ - source: Шкемби Вишнејц
111
+ expected: Škembi Višnejc
112
+
113
+ map:
114
+ postrules:
115
+ # DZ
116
+ - pattern: "((?<=[[:upper:]])Dz(?=[[:upper:]])?|(?<=[[:upper:]])?Dz(?=[[:upper:]]))"
117
+ result: "DZ"
118
+ #LJ
119
+ - pattern: "((?<=[[:upper:]])Lj(?=[[:upper:]])?|(?<=[[:upper:]])?Lj(?=[[:upper:]]))"
120
+ result: "LJ"
121
+ #NJ
122
+ - pattern: "((?<=[[:upper:]])Nj(?=[[:upper:]])?|(?<=[[:upper:]])?Nj(?=[[:upper:]]))"
123
+ result: "NJ"
124
+ #DŽ
125
+ - pattern: "((?<=[[:upper:]])Dž(?=[[:upper:]])?|(?<=[[:upper:]])?Dž(?=[[:upper:]]))"
126
+ result: "DŽ"
127
+
128
+ characters:
129
+ "\u0410": "A"
130
+ "\u0411": "B"
131
+ "\u0412": "V"
132
+ "\u0413": "G"
133
+ "\u0414": "D"
134
+ "\u0403": "\u01F4" # Ǵ
135
+ "\u0415": "E"
136
+ "\u0416": "\u005a\u030c" # Ž
137
+ "\u0417": "Z"
138
+ "\u0405": "Dz"
139
+ "\u0418": "I"
140
+ "\u0408": "J"
141
+ "\u041A": "K"
142
+ "\u041B": "L"
143
+ "\u0409": "Lj"
144
+ "\u041C": "M"
145
+ "\u041D": "N"
146
+ "\u040A": "Nj"
147
+ "\u041E": "O"
148
+ "\u041F": "P"
149
+ "\u0420": "R"
150
+ "\u0421": "S"
151
+ "\u0422": "T"
152
+ "\u040C": "\u004b\u0301" # Ḱ
153
+ "\u0423": "U"
154
+ "\u0424": "F"
155
+ "\u0425": "H"
156
+ "\u0426": "C"
157
+ "\u0427": "\u0043\u030c" # Č
158
+ "\u040F": "D\u007a\u030c" # Dž
159
+ "\u0428": "\u0053\u030c" # Š
160
+ "\u0430": "a"
161
+ "\u0431": "b"
162
+ "\u0432": "v"
163
+ "\u0433": "g"
164
+ "\u0434": "d"
165
+ "\u0453": "\u01F5" # ǵ
166
+ "\u0435": "e"
167
+ "\u0436": "\u007a\u030c" # ž
168
+ "\u0437": "z"
169
+ "\u0455": "dz"
170
+ "\u0438": "i"
171
+ "\u0458": "j"
172
+ "\u043A": "k"
173
+ "\u043B": "l"
174
+ "\u0459": "lj"
175
+ "\u043C": "m"
176
+ "\u043D": "n"
177
+ "\u045A": "nj"
178
+ "\u043E": "o"
179
+ "\u043F": "p"
180
+ "\u0440": "r"
181
+ "\u0441": "s"
182
+ "\u0442": "t"
183
+ "\u045C": "\u1E31" # ḱ
184
+ "\u0443": "u"
185
+ "\u0444": "f"
186
+ "\u0445": "h"
187
+ "\u0446": "c"
188
+ "\u0447": "\u0063\u030c" # č
189
+ "\u045F": "d\u007a\u030c" # dž
190
+ "\u0448": "\u0073\u030c" # š
@@ -102,69 +102,148 @@ tests:
102
102
  Число открепительных удостоверений, утраченных в окружной избирательной комиссии
103
103
 
104
104
  expected: |
105
- VYBORY DEPUTATOV GOSUDARSTVENNOY DUMY FEDERALNOGO SOBRANIYA ROSSIYSKOY FEDERATSII SEDMOGO SOZYVA
106
- DATA GOLOSOVANIYA: 18.09.2016
107
-
108
- NAIMENOVANIE IZBIRATELNOY KOMISSII: TSIK ROSSII
109
-
110
- SVODNAYA TABLITSA REZULTATOV VYBOROV PO FEDERALNOMU IZBIRATELNOMU OKRUGU
111
-
112
-
113
- CHISLO IZBIRATELEY, VNESENNYKH V SPISOK IZBIRATELEY NA MOMENT OKONCHANIYA GOLOSOVANIYA
114
- CHISLO IZBIRATELNYKH BYULLETENEY, POLUCHENNYKH UCHASTKOVOY IZBIRATELNOY KOMISSIEY
115
- CHISLO IZBIRATELNYKH BYULLETENEY, VYDANNYKH IZBIRATELYAM, PROGOLOSOVAVSHIM DOSROCHNO
116
- CHISLO IZBIRATELNYKH BYULLETENEY, VYDANNYKH V POMESHCHENII DLYA GOLOSOVANIYA V DENGOLOSOVANIYA
117
- CHISLO IZBIRATELNYKH BYULLETENEY, VYDANNYKH VNE POMESHCHENIYA DLYA GOLOSOVANIYA V DENGOLOSOVANIYA
118
- CHISLO POGASHENNYKH IZBIRATELNYKH BYULLETENEY
119
- CHISLO IZBIRATELNYKH BYULLETENEY, SODERZHASHCHIKHSYA V PERENOSNYKH YASHCHIKAKH DLYA GOLOSOVANIYA
120
- CHISLO IZBIRATELNYKH BYULLETENEY, SODERZHASHCHIKHSYA V STATSIONARNYKH YASHCHIKAKH DLYA GOLOSOVANIYA
121
- CHISLO NEDEYSTVITELNYKH IZBIRATELNYKH BYULLETENEY
122
- CHISLO DEYSTVITELNYKH IZBIRATELNYKH BYULLETENEY
123
- CHISLO OTKREPITELNYKH UDOSTOVERENIY, POLUCHENNYKH UCHASTKOVOY IZBIRATELNOY KOMISSIEY
124
- CHISLO OTKREPITELNYKH UDOSTOVERENIY, VYDANNYKH NA IZBIRATELNOM UCHASTKE DO DNYA GOLOSOVANIYA
125
- CHISLO IZBIRATELEY, PROGOLOSOVAVSHIKH PO OTKREPITELNYM UDOSTOVERENIYAM NA IZBIRATELNOM UCHASTKE
126
- CHISLO POGASHENNYKH NEISPOLZOVANNYKH OTKREPITELNYKH UDOSTOVERENIY
127
- CHISLO OTKREPITELNYKH UDOSTOVERENIY, VYDANNYKH IZBIRATELYAM TERRITORIALNOY IZBIRATELNOY KOMISSIEY
128
- CHISLO UTRACHENNYKH OTKREPITELNYKH UDOSTOVERENIY
129
- CHISLO UTRACHENNYKH IZBIRATELNYKH BYULLETENEY
130
- CHISLO IZBIRATELNYKH BYULLETENEY, NE UCHTENNYKH PRI POLUCHENII
105
+ Vybory deputatov Gosudarstvennoy Dumy Federalnogo Sobraniya Rossiyskoy Federatsii sedmogo sozyva
106
+ Data golosovaniya: 18.09.2016
107
+
108
+ Naimenovaniye Izbiratelnoy komissii: TSIK Rossii
109
+
110
+ Svodnaya tablitsa rezultatov vyborov po federalnomu izbiratelnomu okrugu
111
+
112
+
113
+ Chislo izbirateley, vnesennykh v spisok izbirateley na moment okonchaniya golosovaniya
114
+ Chislo izbiratelnykh byulleteney, poluchennykh uchastkovoy izbiratelnoy komissiyey
115
+ Chislo izbiratelnykh byulleteney, vydannykh izbiratelyam, progolosovavshim dosrochno
116
+ Chislo izbiratelnykh byulleteney, vydannykh v pomeshchenii dlya golosovaniya v dengolosovaniya
117
+ Chislo izbiratelnykh byulleteney, vydannykh vne pomeshcheniya dlya golosovaniya v dengolosovaniya
118
+ Chislo pogashennykh izbiratelnykh byulleteney
119
+ Chislo izbiratelnykh byulleteney, soderzhashchikhsya v perenosnykh yashchikakh dlya golosovaniya
120
+ Chislo izbiratelnykh byulleteney, soderzhashchikhsya v statsionarnykh yashchikakh dlya golosovaniya
121
+ Chislo nedeystvitelnykh izbiratelnykh byulleteney
122
+ Chislo deystvitelnykh izbiratelnykh byulleteney
123
+ Chislo otkrepitelnykh udostovereniy, poluchennykh uchastkovoy izbiratelnoy komissiyey
124
+ Chislo otkrepitelnykh udostovereniy, vydannykh na izbiratelnom uchastke do dnya golosovaniya
125
+ Chislo izbirateley, progolosovavshikh po otkrepitelnym udostovereniyam na izbiratelnom uchastke
126
+ Chislo pogashennykh neispolzovannykh otkrepitelnykh udostovereniy
127
+ Chislo otkrepitelnykh udostovereniy, vydannykh izbiratelyam territorialnoy izbiratelnoy komissiyey
128
+ Chislo utrachennykh otkrepitelnykh udostovereniy
129
+ Chislo utrachennykh izbiratelnykh byulleteney
130
+ Chislo izbiratelnykh byulleteney, ne uchtennykh pri poluchenii
131
131
  1. VSEROSSIYSKAYA POLITICHESKAYA PARTIYA "RODINA"
132
- 2. POLITICHESKAYA PARTIYA KOMMUNISTICHESKAYA PARTIYA KOMMUNISTY ROSSII
133
- 3. POLITICHESKAYA PARTIYA "ROSSIYSKAYA PARTIYA PENSIONEROV ZA SPRAVEDLIVOST’"
134
- 4. VSEROSSIYSKAYA POLITICHESKAYA PARTIYA "EDINAYA ROSSIYA"
135
- 5. POLITICHESKAYA PARTIYA "ROSSIYSKAYA EKOLOGICHESKAYA PARTIYA "ZELENYE"
136
- 6. POLITICHESKAYA PARTIYA "GRAZHDANSKAYA PLATFORMA"
137
- 7. POLITICHESKAYA PARTIYA LDPR - LIBERALNO-DEMOKRATICHESKAYA PARTIYA ROSSII
138
- 8. POLITICHESKAYA PARTIYA "PARTIYA NARODNOY SVOBODY" (PARNAS)
139
- 9. VSEROSSIYSKAYA POLITICHESKAYA PARTIYA "PARTIYA ROSTA"
140
- 10. OBSHCHESTVENNAYA ORGANIZATSIYA VSEROSSIYSKAYA POLITICHESKAYA PARTIYA "GRAZHDANSKAYA SILA"
141
- 11. POLITICHESKAYA PARTIYA "ROSSIYSKAYA OBEDINENNAYA DEMOKRATICHESKAYA PARTIYA ""YABLOKO"""
142
- 12. POLITICHESKAYA PARTIYA "KOMMUNISTICHESKAYA PARTIYA ROSSIYSKOY FEDERATSII"
143
- 13. POLITICHESKAYA PARTIYA "PATRIOTY ROSSII"
144
- 14. POLITICHESKAYA PARTIYA SPRAVEDLIVAYA ROSSIYA
145
-
146
- DANNYYE OKRUZHNYKH IZBIRATYELNYKH KOMISSIY O CHISLYE OTKRYEPITYELNYKH UDOSTOVYERYENIY
147
-
148
-
149
- CHISLO OTKREPITELNYKH UDOSTOVERENIY, POLUCHENNYKH OKRUZHNOY IZBIRATELNOY KOMISSIEY
150
- CHISLO OTKREPITELNYKH UDOSTOVERENIY, VYDANNYKH TERRITORIALNYM IZBIRATELNYM KOMISSIYAM
151
- CHISLO NEISPOLZOVANNYKH OTKREPITELNYKH UDOSTOVERENIY, POGASHENNYKH OKRUZHNOY IZBIRATELNOY KOMISSIEY
152
- CHISLO OTKREPITELNYKH UDOSTOVERENIY, UTRACHENNYKH V OKRUZHNOY IZBIRATELNOY KOMISSII
132
+ 2. Politicheskaya partiya KOMMUNISTICHESKAYA PARTIYA KOMMUNISTY ROSSII
133
+ 3. Politicheskaya partiya "Rossiyskaya partiya pensionerov za spravedlivost’"
134
+ 4. Vserossiyskaya politicheskaya partiya "YEDINAYA ROSSIYA"
135
+ 5. Politicheskaya partiya "Rossiyskaya ekologicheskaya partiya "Zelenyye"
136
+ 6. Politicheskaya partiya "Grazhdanskaya Platforma"
137
+ 7. Politicheskaya partiya LDPR - Liberalno-demokraticheskaya partiya Rossii
138
+ 8. Politicheskaya partiya "Partiya narodnoy svobody" (PARNAS)
139
+ 9. Vserossiyskaya politicheskaya partiya "PARTIYA ROSTA"
140
+ 10. Obshchestvennaya organizatsiya Vserossiyskaya politicheskaya partiya "Grazhdanskaya Sila"
141
+ 11. Politicheskaya partiya "Rossiyskaya ob"yedinennaya demokraticheskaya partiya "YABLOKO"
142
+ 12. Politicheskaya partiya "KOMMUNISTICHESKAYA PARTIYA ROSSIYSKOY FEDERATSII"
143
+ 13. Politicheskaya partiya "PATRIOTY ROSSII"
144
+ 14. Politicheskaya partiya SPRAVEDLIVAYA ROSSIYA
145
+
146
+ Dannyye okruzhnykh izbiratelnykh komissiy o chisle otkrepitelnykh udostovereniy
147
+
148
+
149
+ Chislo otkrepitelnykh udostovereniy, poluchennykh okruzhnoy izbiratelnoy komissiyey
150
+ Chislo otkrepitelnykh udostovereniy, vydannykh territorialnym izbiratelnym komissiyam
151
+ Chislo neispolzovannykh otkrepitelnykh udostovereniy, pogashennykh okruzhnoy izbiratelnoy komissiyey
152
+ Chislo otkrepitelnykh udostovereniy, utrachennykh v okruzhnoy izbiratelnoy komissii
153
+ - source: ДЛИННОЕ ПОКРЫВАЛО
154
+ expected: DLINNOYE POKRYVALO
155
+ - source: Еловая шишка
156
+ expected: Yelovaya shishka
157
+ - source: ЕЛОВАЯ ШИШКА
158
+ expected: YELOVAYA SHISHKA
159
+ - source: Длинное покрывало
160
+ expected: Dlinnoye pokryvalo
161
+ - source: В лесу еловые шишки
162
+ expected: V lesu yelovyye shishki
163
+ - source: OН ВИДЕЛ ЕЁ В ПЕРВЫЙ РАЗ
164
+ expected: ON VIDEL YEYË V PERVYY RAZ
165
+ - source: Ёж колючий
166
+ expected: Yëzh kolyuchiy
167
+ - source: ЁЖ КОЛЮЧИЙ
168
+ expected: YËZH KOLYUCHIY
169
+ - source: Он видел её в первый раз
170
+ expected: On videl yeyë v pervyy raz
171
+ - source: У ёжа колючки
172
+ expected: U yëzha kolyuchki
173
+ - source: ЙА Йа йа
174
+ expected: Y·A Y·a y·a
175
+ - source: ЫУ Ыу ыу
176
+ expected: Y·U Y·u y·u
177
+ - source: ОЫ Оы оы
178
+ expected: O·Y O·y o·y
179
+ - source: ОЫУ Оыу оыу
180
+ expected: O·Y·U O·y·u o·y·u
181
+ - source: СЭ Сэ сэ
182
+ expected: S·E S·e s·e
183
+ - source: ТС тс Тс тС
184
+ expected: T·S t·s T·s t·S
185
+ - source: ШЧ шч Шч шЧ
186
+ expected: SH·CH sh·ch Sh·ch sh·Ch
153
187
 
154
188
  map:
155
189
  rules:
156
- - pattern: ([ЄФІЦАаЕеИиЙйОоУуЫыЮюЯяії])\u0415
157
- result: "\\1YE"
158
- - pattern: \b\u0415
159
- result: YE
160
- - pattern: ([йьъ])\u0415
161
- result: "\\1YE"
162
- - pattern: ([ЄФІЦАаЕеИиЙйОоУуЫыЮюЯяії])\u0435
163
- result: "\\1ye"
164
- - pattern: \b\u0435
165
- result: ye
166
- - pattern: ([йьъ])\u0435
167
- result: "\\1ye"
190
+ - pattern: (?<=[АаЕеЁёИиОоУуЫыЭэЮюЯяЙйЪъЬь])\u0401 # Ё after a, e, ё, и, о, у, ы, э, ю, я, й, ъ, ь
191
+ result: "Y\u00eb"
192
+ - pattern: (?<=[АаЕеЁёИиОоУуЫыЭэЮюЯяЙйЪъЬь])\u0451 # ё after a, e, ё, и, о, у, ы, э, ю, я, й, ъ, ь
193
+ result: "y\u00eb"
194
+ - pattern: (?<=[АаЕеЁёИиОоУуЫыЭэЮюЯяЙйЪъЬь])\u0415 # Е after a, e, ё, и, о, у, ы, э, ю, я, й, ъ, ь
195
+ result: "Y\u0415"
196
+ - pattern: \b\u0415 # Е initially
197
+ result: "Y\u0435"
198
+ - pattern: (?<=[АаЕеЁёИиОоУуЫыЭэЮюЯяЙйЪъЬь])\u0435 # е after a, e, ё, и, о, у, ы, э, ю, я, й, ъ, ь
199
+ result: "y\u0435"
200
+ - pattern: \b\u0435 # е initially
201
+ result: "y\u0435"
202
+ - pattern: (?<=[АаЕеЁёИиОоУуЫыЭэЮюЯяЙйЪъЬь])\u0401 # Ё after a, e, ё, и, о, у, ы, э, ю, я, й, ъ, ь
203
+ result: "Y\u00eb"
204
+ - pattern: \b\u0401
205
+ result: "Y\u00eb"
206
+ - pattern: (?<=[АаЕеЁёИиОоУуЫыЭэЮюЯяЙйЪъЬь])\u0451 # ё after a, e, ё, и, о, у, ы, э, ю, я, й, ъ, ь
207
+ result: "y\u00eb"
208
+ - pattern: \b\u0451
209
+ result: "y\u00eb"
210
+ - pattern: \u0419(?=[АаУуЫыЭэ]) # Й before а, у, ы, or э
211
+ result: "Y\u00b7"
212
+ - pattern: \u0439(?=[АаУуЫыЭэ]) # й before а, у, ы, or э
213
+ result: "y\u00b7"
214
+ - pattern: (?<=[АаЕеЁёИиОоУуЫыЭэЮюЯя])\u042b(?=[АаУуЫыЭэ]) # Ы after any vowel character and before а, у, ы, or э
215
+ result: "\u00b7Y\u00b7"
216
+ - pattern: (?<=[АаЕеЁёИиОоУуЫыЭэЮюЯя])\u044b(?=[АаУуЫыЭэ]) # ы after any vowel character and before а, у, ы, or э
217
+ result: "\u00b7y\u00b7"
218
+ - pattern: \u042b(?=[АаУуЫыЭэ]) # Ы before а, у, ы, or э
219
+ result: "Ы\u00b7"
220
+ - pattern: \u044b(?=[АаУуЫыЭэ]) # ы before а, у, ы, or э
221
+ result: "ы\u00b7"
222
+ - pattern: (?<=[Оо])\u042b # Ы after о
223
+ result: "\u00b7Y"
224
+ - pattern: (?<=[Оо])\u044b # ы after о
225
+ result: "\u00b7y"
226
+ - pattern: \b\u0401
227
+ result: "Y\u00eb"
228
+ - pattern: \b\u0451
229
+ result: "y\u00eb"
230
+ - pattern: (?<=[БбВвГгДдЖжЗзКкЛлМмНнПпРрСсТтФфХхЦцЧчШшЩщ])\u042d # Э after any consonant character except й
231
+ result: "\u00b7E"
232
+ - pattern: (?<=[БбВвГгДдЖжЗзКкЛлМмНнПпРрСсТтФфХхЦцЧчШшЩщ])\u044d # э after any consonant character except й
233
+ result: "\u00b7e"
234
+ - pattern: (Т|т)(С|с) # тс => t·s
235
+ result: "\\1\u00b7\\2"
236
+ - pattern: (Ш|ш)(Ч|ч) # шч => sh·ch
237
+ result: "\\1\u00b7\\2"
238
+
239
+ postrules:
240
+
241
+ #YE
242
+ - pattern: "((?<=[[:upper:]])Ye(?=[[:upper:]])?|(?<=[[:upper:]])?Ye(?=[[:upper:]]))"
243
+ result: "YE"
244
+ #YË
245
+ - pattern: "((?<=[[:upper:]])Yë(?=[[:upper:]])?|(?<=[[:upper:]])?Yë(?=[[:upper:]]))"
246
+ result: "YË"
168
247
 
169
248
  characters:
170
249
  "\u0410": "A"
@@ -173,7 +252,7 @@ map:
173
252
  "\u0413": "G"
174
253
  "\u0414": "D"
175
254
  "\u0415": "E"
176
- "\u0435": "e"
255
+ "\u0401": "\u00cb" # Ё
177
256
  "\u0416": "Zh"
178
257
  "\u0417": "Z"
179
258
  "\u0418": "I"
@@ -194,9 +273,9 @@ map:
194
273
  "\u0427": "Ch"
195
274
  "\u0428": "Sh"
196
275
  "\u0429": "Shch"
197
- "\u042a": "\""
276
+ "\u042a": "\"" # Ъ
198
277
  "\u042b": "Y"
199
- "\u042c": "\u2019"
278
+ "\u042c": "\u2019" # Ь => ’
200
279
  "\u042d": "E"
201
280
  "\u042e": "Yu"
202
281
  "\u042f": "Ya"
@@ -205,6 +284,8 @@ map:
205
284
  "\u0432": "v"
206
285
  "\u0433": "g"
207
286
  "\u0434": "d"
287
+ "\u0435": "e"
288
+ "\u0451": "\u00eb" # ё
208
289
  "\u0436": "zh"
209
290
  "\u0437": "z"
210
291
  "\u0438": "i"
@@ -225,9 +306,9 @@ map:
225
306
  "\u0447": "ch"
226
307
  "\u0448": "sh"
227
308
  "\u0449": "shch"
228
- "\u044a": "\""
309
+ "\u044a": "\"" # ъ
229
310
  "\u044b": "y"
230
- "\u044c": "\u2019"
311
+ "\u044c": "\u2019" # ь => ’
231
312
  "\u044d": "e"
232
313
  "\u044e": "yu"
233
314
  "\u044f": "ya"
@@ -0,0 +1,166 @@
1
+ ---
2
+ authority_id: bgnpcgn
3
+ id: 2005
4
+ language: srp
5
+ source_script: Cyrl
6
+ destination_script: Latn
7
+ name: ROMANIZATION OF SERBIAN, BGN/PCGN 2005 System
8
+ url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/816783/TABLE_OF_CORRESPONDENCES_FOR_SERBIAN.pdf
9
+ creation_date: 2005
10
+ confirmation_date: 2019-06
11
+ description: |
12
+ The tabulation below reflects the Serbian Cyrillic alphabet and the standard Roman script equivalents
13
+ used in both Serbia and Montenegro.
14
+
15
+ notes:
16
+ - The Serbian Cyrillic lowercase italic Д may sometimes be seen as g.
17
+ There is no specific Unicode encoding for this variant form so a comparable character
18
+ has been used here for illustrative purposes.
19
+
20
+ - The digraph dj(Dj) will occasionally be found as an alternative form of đ(Đ).
21
+
22
+ - The Serbian Cyrillic lowercase italic П may sometimes be seen as ӣ.
23
+ There is no specific Unicode encoding for this variant form so a comparable character
24
+ has been used here for illustrative purposes.
25
+
26
+ - The Serbian Cyrillic lowercase italic Т may sometimes be seen as w.
27
+ There is no specific Unicode encoding for this variant form so a comparable character
28
+ has been used here for illustrative purposes.
29
+
30
+ - |
31
+ An inventory of letter-diacritic combinations, with their Unicode encoding,
32
+ in addition to the unmodified letters of the basic Roman script is:
33
+ | Đ (U+0110) | đ (U+0111) |
34
+ | Ž (U+017D) | ž (U+017E) |
35
+ | Lj (U+01C8)* | lj (U+01C9)* |
36
+ | Ć (U+0106) | ć (U+0107) |
37
+ | Dž (U+01C5)* | dž (U+01C6)* |
38
+ | Š (U+0160) | š (U+0161) |
39
+ * Note that these characters can also be reproduced with individual letters (e.g. l+j).
40
+
41
+ - The Roman-script columns show only lowercase forms but, when applying the table,
42
+ uppercase and lowercase Roman letters as appropriate should be used.
43
+
44
+ tests:
45
+ - source: Шупља Стена
46
+ expected: Šuplja Stena
47
+ - source: Чукарица
48
+ expected: Čukarica
49
+ - source: Црна Трава
50
+ expected: Crna Trava
51
+ - source: Херцег Нови
52
+ expected: Herceg Novi
53
+ - source: Улцињ
54
+ expected: Ulcinj
55
+ - source: Ужице
56
+ expected: Užice
57
+ - source: Тресаначка Река
58
+ expected: Tresanačka Reka
59
+ - source: Сјеница
60
+ expected: Sjenica
61
+ - source: Рожаје
62
+ expected: Rožaje
63
+ - source: Пљевља
64
+ expected: Pljevlja
65
+ - source: Оџаци
66
+ expected: Odžaci
67
+ - source: Никшић
68
+ expected: Nikšić
69
+ - source: Медвеђа
70
+ expected: Medveđa
71
+ - source: Лозница
72
+ expected: Loznica
73
+ - source: Књажевац
74
+ expected: Knjaževac
75
+ - source: Зрењанин
76
+ expected: Zrenjanin
77
+ - source: Житорађа
78
+ expected: Žitorađa
79
+ - source: Ервеник
80
+ expected: Ervenik
81
+ - source: Доње Љупче
82
+ expected: Donje Ljupče
83
+ - source: Гусиње
84
+ expected: Gusinje
85
+ - source: ГУСИЊЕ
86
+ expected: GUSINJE
87
+ - source: Врњачка Бања
88
+ expected: Vrnjačka Banja
89
+ - source: Бијело Поље
90
+ expected: Bijelo Polje
91
+ - source: Алибунар
92
+ expected: Alibunar
93
+
94
+ map:
95
+ postrules:
96
+ #LJ
97
+ - pattern: "((?<=[[:upper:]])Lj(?=[[:upper:]])?|(?<=[[:upper:]])?Lj(?=[[:upper:]]))"
98
+ result: "LJ"
99
+ #NJ
100
+ - pattern: "((?<=[[:upper:]])Nj(?=[[:upper:]])?|(?<=[[:upper:]])?Nj(?=[[:upper:]]))"
101
+ result: "NJ"
102
+ #DŽ
103
+ - pattern: "((?<=[[:upper:]])Dž(?=[[:upper:]])?|(?<=[[:upper:]])?Dž(?=[[:upper:]]))"
104
+ result: "DŽ"
105
+
106
+ characters:
107
+ "\u0410": "A"
108
+ "\u0411": "B"
109
+ "\u0412": "V"
110
+ "\u0413": "G"
111
+ "\u0414": "D"
112
+ "\u0402": "\u0110" # Đ
113
+ "\u0415": "E"
114
+ "\u0416": "\u005a\u030c" # Ž
115
+ "\u0417": "Z"
116
+ "\u0418": "I"
117
+ "\u0408": "J"
118
+ "\u041A": "K"
119
+ "\u041B": "L"
120
+ "\u0409": "Lj"
121
+ "\u041C": "M"
122
+ "\u041D": "N"
123
+ "\u040A": "Nj"
124
+ "\u041E": "O"
125
+ "\u041F": "P"
126
+ "\u0420": "R"
127
+ "\u0421": "S"
128
+ "\u0422": "T"
129
+ "\u040B": "\u0043\u0301" # Ć
130
+ "\u0423": "U"
131
+ "\u0424": "F"
132
+ "\u0425": "H"
133
+ "\u0426": "C"
134
+ "\u0427": "\u0043\u030c" # Č
135
+ "\u040F": "D\u007a\u030c" # Dž
136
+ "\u0428": "\u0053\u030c" # Š
137
+ "\u0430": "a"
138
+ "\u0431": "b"
139
+ "\u0432": "v"
140
+ "\u0433": "g"
141
+ "\u0434": "d"
142
+ "\u0452": "\u0111" # đ
143
+ "\u0435": "e"
144
+ "\u0436": "\u007a\u030c" # ž
145
+ "\u0437": "z"
146
+ "\u0438": "i"
147
+ "\u0458": "j"
148
+ "\u043A": "k"
149
+ "\u043B": "l"
150
+ "\u0459": "lj"
151
+ "\u043C": "m"
152
+ "\u043D": "n"
153
+ "\u045A": "nj"
154
+ "\u043E": "o"
155
+ "\u043F": "p"
156
+ "\u0440": "r"
157
+ "\u0441": "s"
158
+ "\u0442": "t"
159
+ "\u045B": "\u0063\u0301" # ć
160
+ "\u0443": "u"
161
+ "\u0444": "f"
162
+ "\u0445": "h"
163
+ "\u0446": "c"
164
+ "\u0447": "\u0063\u030c" # č
165
+ "\u045F": "d\u007a\u030c" # dž
166
+ "\u0448": "\u0073\u030c" # š