taraskevizer 7.0.3 → 7.1.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +7 -7
- package/dist/bin.js +5 -5
- package/dist/index.cjs +247 -242
- package/dist/index.d.ts +54 -56
- package/dist/index.js +247 -241
- package/package.json +1 -1
package/README.md
CHANGED
|
@@ -27,7 +27,7 @@ import {
|
|
|
27
27
|
htmlPipeline,
|
|
28
28
|
abcOnlyPipeline,
|
|
29
29
|
TaraskConfig,
|
|
30
|
-
|
|
30
|
+
alphabets,
|
|
31
31
|
J,
|
|
32
32
|
VARIATION,
|
|
33
33
|
} from 'taraskevizer';
|
|
@@ -37,7 +37,7 @@ tarask('планета', plainTextPipeline);
|
|
|
37
37
|
|
|
38
38
|
const cfg = new TaraskConfig({
|
|
39
39
|
general: {
|
|
40
|
-
abc:
|
|
40
|
+
abc: alphabets.cyrillic,
|
|
41
41
|
j: J.ALWAYS,
|
|
42
42
|
},
|
|
43
43
|
nonHtml: {
|
|
@@ -51,7 +51,7 @@ tarask('планета і Гродна', plainTextPipeline, cfg);
|
|
|
51
51
|
|
|
52
52
|
const cfg = new TaraskConfig({
|
|
53
53
|
general: {
|
|
54
|
-
abc:
|
|
54
|
+
abc: alphabets.latin,
|
|
55
55
|
},
|
|
56
56
|
html: {
|
|
57
57
|
g: false, // ignored, because alphabet is set to latin
|
|
@@ -61,7 +61,7 @@ tarask('энергія планеты', htmlPipeline, cfg);
|
|
|
61
61
|
// "en<tarF>erg</tarF>ija p<tarF>lan</tarF>ety"
|
|
62
62
|
|
|
63
63
|
const latinWithJiCfg = new TaraskConfig({
|
|
64
|
-
general: { abc:
|
|
64
|
+
general: { abc: alphabets.latinJi },
|
|
65
65
|
});
|
|
66
66
|
|
|
67
67
|
tarask('яна і іншыя', abcOnlyPipeline, latinWithJiCfg);
|
|
@@ -83,10 +83,10 @@ Type: `object` with schema: `{lower: Dict, upper?: Dict}`,
|
|
|
83
83
|
where `Dict` is `[pattern: RegExp, result: string][]`
|
|
84
84
|
(may be empty)
|
|
85
85
|
|
|
86
|
-
`
|
|
87
|
-
`
|
|
86
|
+
`alphabets` contains the following pre-defined alphabets:
|
|
87
|
+
`cyrillic`, `latin`, `latinJi`, `arabic`
|
|
88
88
|
|
|
89
|
-
Default value: `
|
|
89
|
+
Default value: `alphabets.cyrillic`
|
|
90
90
|
|
|
91
91
|
### j
|
|
92
92
|
|
package/dist/bin.js
CHANGED
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
#!/usr/bin/env node
|
|
2
2
|
import {
|
|
3
|
-
|
|
3
|
+
dicts,
|
|
4
4
|
REPLACE_J,
|
|
5
5
|
VARIATION,
|
|
6
6
|
TaraskConfig,
|
|
@@ -16,7 +16,7 @@ const printWithPrefix = (msg) => {
|
|
|
16
16
|
process.argv.splice(0, 2);
|
|
17
17
|
const checkForOptions = (options) => process.argv[0] && options.includes(process.argv[0].toLowerCase());
|
|
18
18
|
if (checkForOptions(["-v", "--version"])) {
|
|
19
|
-
printWithPrefix("7.
|
|
19
|
+
printWithPrefix("7.1.1");
|
|
20
20
|
process.exit(0);
|
|
21
21
|
}
|
|
22
22
|
if (checkForOptions(["-h", "--help"])) {
|
|
@@ -88,19 +88,19 @@ const optionDict = toHashTable([
|
|
|
88
88
|
[
|
|
89
89
|
["--latin", "-l"],
|
|
90
90
|
() => {
|
|
91
|
-
general.abc =
|
|
91
|
+
general.abc = dicts.alphabets.latin;
|
|
92
92
|
}
|
|
93
93
|
],
|
|
94
94
|
[
|
|
95
95
|
["--latin-ji", "-lj"],
|
|
96
96
|
() => {
|
|
97
|
-
general.abc =
|
|
97
|
+
general.abc = dicts.alphabets.latinJi;
|
|
98
98
|
}
|
|
99
99
|
],
|
|
100
100
|
[
|
|
101
101
|
["--arabic", "-a"],
|
|
102
102
|
() => {
|
|
103
|
-
general.abc =
|
|
103
|
+
general.abc = dicts.alphabets.arabic;
|
|
104
104
|
}
|
|
105
105
|
],
|
|
106
106
|
[
|
package/dist/index.cjs
CHANGED
|
@@ -20,7 +20,6 @@ var __toCommonJS = (mod) => __copyProps(__defProp({}, "__esModule", { value: tru
|
|
|
20
20
|
// src/index.ts
|
|
21
21
|
var src_exports = {};
|
|
22
22
|
__export(src_exports, {
|
|
23
|
-
ALPHABET: () => ALPHABET,
|
|
24
23
|
REPLACE_J: () => REPLACE_J,
|
|
25
24
|
TaraskConfig: () => TaraskConfig,
|
|
26
25
|
VARIATION: () => VARIATION,
|
|
@@ -37,24 +36,28 @@ module.exports = __toCommonJS(src_exports);
|
|
|
37
36
|
// src/dict/index.ts
|
|
38
37
|
var dict_exports = {};
|
|
39
38
|
__export(dict_exports, {
|
|
40
|
-
|
|
39
|
+
alphabets: () => alphabets_exports,
|
|
41
40
|
gobj: () => gobj,
|
|
42
|
-
latinLettersLowerCase: () => latinLettersLowerCase,
|
|
43
|
-
latinLettersLowerCaseJi: () => latinLettersLowerCaseJi,
|
|
44
|
-
latinLettersUpperCase: () => latinLettersUpperCase,
|
|
45
|
-
latinLettersUpperCaseJi: () => latinLettersUpperCaseJi,
|
|
46
41
|
noSoften: () => noSoften,
|
|
47
42
|
softeners: () => softeners,
|
|
48
43
|
wordlist: () => wordlist
|
|
49
44
|
});
|
|
50
45
|
|
|
46
|
+
// src/dict/gobj.ts
|
|
47
|
+
var gobj = {
|
|
48
|
+
г: "ґ",
|
|
49
|
+
Г: "Ґ",
|
|
50
|
+
ґ: "г",
|
|
51
|
+
Ґ: "Г"
|
|
52
|
+
};
|
|
53
|
+
|
|
51
54
|
// src/dict/lib.ts
|
|
52
55
|
var dictFrom = {
|
|
53
|
-
raw: (dict) => {
|
|
56
|
+
raw: (dict, additionalFlags = "g") => {
|
|
54
57
|
for (const item of dict)
|
|
55
58
|
item[0] = RegExp(
|
|
56
59
|
item[0],
|
|
57
|
-
item[0] instanceof RegExp ? item[0].flags +
|
|
60
|
+
item[0] instanceof RegExp ? item[0].flags + additionalFlags : additionalFlags
|
|
58
61
|
);
|
|
59
62
|
return dict;
|
|
60
63
|
},
|
|
@@ -127,213 +130,6 @@ var iwords = toOneLine(`біс
|
|
|
127
130
|
ць?він
|
|
128
131
|
шыяс`);
|
|
129
132
|
|
|
130
|
-
// src/dict/latin.ts
|
|
131
|
-
var common = {
|
|
132
|
-
lower: [
|
|
133
|
-
[
|
|
134
|
-
[/(?<=[аеёіоуўыэюяьʼ| >АЕЁІОУЎЫЭЮЯЬ]|^)е/, "je"],
|
|
135
|
-
[/(?<=[eаеёіоуўыэюяьʼ| >АЕЁІОУЎЫЭЮЯЬ]|^)ё/, "jo"],
|
|
136
|
-
[/(?<=[eoаеёіоуўыэюяьʼ| >АЕЁІОУЎЫЭЮЯЬ]|^)ю/, "ju"],
|
|
137
|
-
[/(?<=[eouаеёіоуўыэюяьʼ| >АЕЁІОУЎЫЭЮЯЬ]|^)я/, "ja"]
|
|
138
|
-
],
|
|
139
|
-
[
|
|
140
|
-
[/ʼ/, ""],
|
|
141
|
-
[/ць/, "ć"],
|
|
142
|
-
[/зь/, "ź"],
|
|
143
|
-
[/сь/, "ś"],
|
|
144
|
-
[/нь/, "ń"],
|
|
145
|
-
[/ль/, "l"],
|
|
146
|
-
[/а/, "a"],
|
|
147
|
-
[/б/, "b"],
|
|
148
|
-
[/в/, "v"],
|
|
149
|
-
[/г/, "h"],
|
|
150
|
-
[/ґ/, "g"],
|
|
151
|
-
[/д/, "d"],
|
|
152
|
-
[/е/, "ie"],
|
|
153
|
-
[/ё/, "io"],
|
|
154
|
-
[/ж/, "ž"],
|
|
155
|
-
[/з/, "z"],
|
|
156
|
-
[/і/, "i"],
|
|
157
|
-
[/й/, "j"],
|
|
158
|
-
[/к/, "k"],
|
|
159
|
-
[/л/, "ł"],
|
|
160
|
-
[/м/, "m"],
|
|
161
|
-
[/н/, "n"],
|
|
162
|
-
[/о/, "o"],
|
|
163
|
-
[/п/, "p"],
|
|
164
|
-
[/р/, "r"],
|
|
165
|
-
[/с/, "s"],
|
|
166
|
-
[/т/, "t"],
|
|
167
|
-
[/у/, "u"],
|
|
168
|
-
[/ў/, "ŭ"],
|
|
169
|
-
[/ф/, "f"],
|
|
170
|
-
[/х/, "ch"],
|
|
171
|
-
[/ц/, "c"],
|
|
172
|
-
[/ч/, "č"],
|
|
173
|
-
[/ш/, "š"],
|
|
174
|
-
[/ы/, "y"],
|
|
175
|
-
[/э/, "e"],
|
|
176
|
-
[/ю/, "iu"],
|
|
177
|
-
[/я/, "ia"],
|
|
178
|
-
[/łi(?=[eoua])/, "l"],
|
|
179
|
-
[/łi/, "li"]
|
|
180
|
-
]
|
|
181
|
-
].map(dictFrom.nonGlobal),
|
|
182
|
-
upper: [
|
|
183
|
-
[
|
|
184
|
-
[new RegExp(" Е(?=[ \\p{P}\\d]*\\p{Lu}?\\p{Ll})", "u"), " Je"],
|
|
185
|
-
[new RegExp(" Ё(?=[ \\p{P}\\d]*\\p{Lu}?\\p{Ll})", "u"), " Jo"],
|
|
186
|
-
[new RegExp(" Ю(?=[ \\p{P}\\d]*\\p{Lu}?\\p{Ll})", "u"), " Ju"],
|
|
187
|
-
[new RegExp(" Я(?=[ \\p{P}\\d]*\\p{Lu}?\\p{Ll})", "u"), " Ja"]
|
|
188
|
-
],
|
|
189
|
-
[
|
|
190
|
-
[/([АЕЁІОУЎЫЭЮЯЬ| ]\(?)Е/, "$1JE"],
|
|
191
|
-
[/([EАЕЁІОУЎЫЭЮЯЬ| ]\(?)Ё/, "$1JO"],
|
|
192
|
-
[/([EOАЕЁІОУЎЫЭЮЯЬ| ]\(?)Ю/, "$1JU"],
|
|
193
|
-
[/([EOUАЕЁІОУЎЫЭЮЯЬ| ]\(?)Я/, "$1JA"]
|
|
194
|
-
],
|
|
195
|
-
[
|
|
196
|
-
[/Е/, "IE"],
|
|
197
|
-
[/Ё/, "IO"],
|
|
198
|
-
[/Ю/, "IU"],
|
|
199
|
-
[/Я/, "IA"],
|
|
200
|
-
[/Ц[Ьь]/, "Ć"],
|
|
201
|
-
[/З[Ьь]/, "Ź"],
|
|
202
|
-
[/С[Ьь]/, "Ś"],
|
|
203
|
-
[/Н[Ьь]/, "Ń"],
|
|
204
|
-
[/Л[Ьь]/, "L"],
|
|
205
|
-
[/А/, "A"],
|
|
206
|
-
[/Б/, "B"],
|
|
207
|
-
[/В/, "V"],
|
|
208
|
-
[/Г/, "H"],
|
|
209
|
-
[/Ґ/, "G"],
|
|
210
|
-
[/Д/, "D"],
|
|
211
|
-
[/Ж/, "Ž"],
|
|
212
|
-
[/З/, "Z"],
|
|
213
|
-
[/І/, "I"],
|
|
214
|
-
[/Й/, "J"],
|
|
215
|
-
[/К/, "K"],
|
|
216
|
-
[/Л/, "Ł"],
|
|
217
|
-
[/М/, "M"],
|
|
218
|
-
[/Н/, "N"],
|
|
219
|
-
[/О/, "O"],
|
|
220
|
-
[/П/, "P"],
|
|
221
|
-
[/Р/, "R"],
|
|
222
|
-
[/С/, "S"],
|
|
223
|
-
[/Т/, "T"],
|
|
224
|
-
[/У/, "U"],
|
|
225
|
-
[/Ў/, "Ŭ"],
|
|
226
|
-
[/Ф/, "F"],
|
|
227
|
-
[/ Х(?=[\p{Ll} ])/u, " Ch"],
|
|
228
|
-
[/Х/, "CH"],
|
|
229
|
-
[/Ц/, "C"],
|
|
230
|
-
[/Ч/, "Č"],
|
|
231
|
-
[/Ш/, "Š"],
|
|
232
|
-
[/Ы/, "Y"],
|
|
233
|
-
[/Э/, "E"],
|
|
234
|
-
[/Ł[Ii](?=[AEOUaeou])/, "L"],
|
|
235
|
-
[/Ł(?=[Ii])/, "L"]
|
|
236
|
-
]
|
|
237
|
-
].map(dictFrom.nonGlobal)
|
|
238
|
-
};
|
|
239
|
-
var latinLettersLowerCase = [
|
|
240
|
-
...common.lower[0],
|
|
241
|
-
[/ʼі/g, "ji"],
|
|
242
|
-
...common.lower[1]
|
|
243
|
-
];
|
|
244
|
-
var latinLettersUpperCase = common.upper.flat();
|
|
245
|
-
var latinLettersLowerCaseJi = dictFrom.raw([
|
|
246
|
-
[/([аеёіоуыэюяАЕЁІОУЫЭЮЯ] )і Ў/, "$1j U"],
|
|
247
|
-
[/([аеёіоуыэюяАЕЁІОУЫЭЮЯ] )і ў/, "$1j u"],
|
|
248
|
-
[/([аеёіоуыэюяАЕЁІОУЫЭЮЯ] )і /, "$1j "],
|
|
249
|
-
[/([аеёіоуыэюяАЕЁІОУЫЭЮЯ] )І Ў/, "$1J U"],
|
|
250
|
-
[/([аеёіоуыэюяАЕЁІОУЫЭЮЯ] )І ў/, "$1J u"],
|
|
251
|
-
[/([аеёіоуыэюяАЕЁІОУЫЭЮЯ] )І /, "$1J "],
|
|
252
|
-
[` і(?=${iwords})`, " ji"],
|
|
253
|
-
[` І(?=${iwords})`, " Ji"],
|
|
254
|
-
[` І(?=${iwords.toUpperCase()})`, " JI"]
|
|
255
|
-
]).concat([
|
|
256
|
-
...common.lower[0],
|
|
257
|
-
[/([eouaаеёіоуыэюяʼАЕЁІОУЫЭЮЯЬ] *)і/g, "$1ji"],
|
|
258
|
-
...common.lower[1]
|
|
259
|
-
]);
|
|
260
|
-
var latinLettersUpperCaseJi = [
|
|
261
|
-
...common.upper[0],
|
|
262
|
-
[new RegExp("([eoua] *)І(?=[ \\p{P}\\d]*\\p{Lu}?\\p{Ll})", "gu"), "$1Ji"],
|
|
263
|
-
...common.upper[1],
|
|
264
|
-
[/([AOEUАЕЁІОУЎЫЭЮЯ][( ]*)І/g, "$1JI"],
|
|
265
|
-
...common.upper[2],
|
|
266
|
-
[/ JIŁ -/g, " IŁ -"]
|
|
267
|
-
];
|
|
268
|
-
|
|
269
|
-
// src/dict/arabic.ts
|
|
270
|
-
var soft = "ْ(?=[еёіюяь])";
|
|
271
|
-
var presoft = "([تزكثࢮбвгджзйклмнпрстфхцчшў])ْ?(ّ?)";
|
|
272
|
-
var arabLetters = dictFrom.raw([
|
|
273
|
-
[/ л[ая]/, " لا"],
|
|
274
|
-
[/л[ая]/, "ـلا"],
|
|
275
|
-
// падваеньне зычнага, шадда
|
|
276
|
-
[/([бвгджзйклмнпрстфхцчшў]|д[зж])\1/, "$1ّ"],
|
|
277
|
-
// няма галоснага, сукун
|
|
278
|
-
[/([бвгджзйклмнпрстфхцчшў])/, "$1ْ"],
|
|
279
|
-
// а, аліф
|
|
280
|
-
[/а/, "اа"],
|
|
281
|
-
// першая галосная, аліф
|
|
282
|
-
[/ (?=[еэыуо])/, " ا"],
|
|
283
|
-
["дْз" + soft, "ࢮ"],
|
|
284
|
-
["з" + soft, "ز"],
|
|
285
|
-
["к" + soft, "ك"],
|
|
286
|
-
["с" + soft, "ث"],
|
|
287
|
-
["т" + soft, "ت"],
|
|
288
|
-
[/([تزكث])і/, "ы"],
|
|
289
|
-
// $2 - шадда
|
|
290
|
-
[presoft + "[аяэе]", "$1$2َ"],
|
|
291
|
-
[presoft + "[іы]", "$1$2ِ"],
|
|
292
|
-
[/ і /, " اِ "],
|
|
293
|
-
[presoft + "[оёую]", "$1$2ُ"],
|
|
294
|
-
[/ʼ/, "ع"],
|
|
295
|
-
[/ь/, ""],
|
|
296
|
-
// [/[ьʼ]/, ''],
|
|
297
|
-
[/[яе]/, "يَ"],
|
|
298
|
-
[/і/, "يِ"],
|
|
299
|
-
[/[ёю]/, "يُ"],
|
|
300
|
-
[/[аэ]/, "َ"],
|
|
301
|
-
[/[ыі]/, "ِ"],
|
|
302
|
-
[/[оу]/, "ُ"],
|
|
303
|
-
[/б/, "ب"],
|
|
304
|
-
[/[вў]/, "و"],
|
|
305
|
-
[/г/, "ه"],
|
|
306
|
-
[/ґ/, "غ"],
|
|
307
|
-
[/дْж/, "ج"],
|
|
308
|
-
[/д/, "د"],
|
|
309
|
-
[/ж/, "ژ"],
|
|
310
|
-
[/з/, "ض"],
|
|
311
|
-
[/й/, "ي"],
|
|
312
|
-
[/к/, "ق"],
|
|
313
|
-
[/л/, "ل"],
|
|
314
|
-
[/м/, "م"],
|
|
315
|
-
[/н/, "ن"],
|
|
316
|
-
[/п/, "پ"],
|
|
317
|
-
[/р/, "ر"],
|
|
318
|
-
[/с/, "ص"],
|
|
319
|
-
[/т/, "ط"],
|
|
320
|
-
[/ф/, "ف"],
|
|
321
|
-
[/х/, "ح"],
|
|
322
|
-
[/ц/, "ࢯ"],
|
|
323
|
-
[/ч/, "چ"],
|
|
324
|
-
[/ш/, "ش"],
|
|
325
|
-
[/,/, "،"],
|
|
326
|
-
[/\?/, "؟"]
|
|
327
|
-
]);
|
|
328
|
-
|
|
329
|
-
// src/dict/gobj.ts
|
|
330
|
-
var gobj = {
|
|
331
|
-
г: "ґ",
|
|
332
|
-
Г: "Ґ",
|
|
333
|
-
ґ: "г",
|
|
334
|
-
Ґ: "Г"
|
|
335
|
-
};
|
|
336
|
-
|
|
337
133
|
// src/dict/wordlist.ts
|
|
338
134
|
var chemicalElements1 = [
|
|
339
135
|
"сканд|ванад|рубід|род|ірыд|рэзэрфорд",
|
|
@@ -2032,23 +1828,223 @@ var softeners = dictFrom.raw([
|
|
|
2032
1828
|
[/([сз])ʼ(?=[яюеё])/, "$1ь"]
|
|
2033
1829
|
]);
|
|
2034
1830
|
|
|
2035
|
-
// src/
|
|
2036
|
-
var
|
|
2037
|
-
|
|
2038
|
-
|
|
2039
|
-
|
|
2040
|
-
|
|
2041
|
-
|
|
2042
|
-
|
|
2043
|
-
|
|
2044
|
-
|
|
2045
|
-
|
|
2046
|
-
|
|
2047
|
-
|
|
2048
|
-
|
|
2049
|
-
|
|
2050
|
-
|
|
2051
|
-
|
|
1831
|
+
// src/dict/alphabets/index.ts
|
|
1832
|
+
var alphabets_exports = {};
|
|
1833
|
+
__export(alphabets_exports, {
|
|
1834
|
+
arabic: () => arabic,
|
|
1835
|
+
cyrillic: () => cyrillic,
|
|
1836
|
+
latin: () => latin,
|
|
1837
|
+
latinJi: () => latinJi
|
|
1838
|
+
});
|
|
1839
|
+
|
|
1840
|
+
// src/dict/alphabets/cyrillic.ts
|
|
1841
|
+
var cyrillic = {
|
|
1842
|
+
lower: [],
|
|
1843
|
+
upper: []
|
|
1844
|
+
};
|
|
1845
|
+
|
|
1846
|
+
// src/dict/alphabets/latin.ts
|
|
1847
|
+
var common = {
|
|
1848
|
+
lower: [
|
|
1849
|
+
[
|
|
1850
|
+
[/(?<=[аеёіоуўыэюяьʼ| >АЕЁІОУЎЫЭЮЯЬ]|^)е/, "je"],
|
|
1851
|
+
[/(?<=[eаеёіоуўыэюяьʼ| >АЕЁІОУЎЫЭЮЯЬ]|^)ё/, "jo"],
|
|
1852
|
+
[/(?<=[eoаеёіоуўыэюяьʼ| >АЕЁІОУЎЫЭЮЯЬ]|^)ю/, "ju"],
|
|
1853
|
+
[/(?<=[eouаеёіоуўыэюяьʼ| >АЕЁІОУЎЫЭЮЯЬ]|^)я/, "ja"]
|
|
1854
|
+
],
|
|
1855
|
+
[
|
|
1856
|
+
[/ʼ/, ""],
|
|
1857
|
+
[/ць/, "ć"],
|
|
1858
|
+
[/зь/, "ź"],
|
|
1859
|
+
[/сь/, "ś"],
|
|
1860
|
+
[/нь/, "ń"],
|
|
1861
|
+
[/ль/, "l"],
|
|
1862
|
+
[/а/, "a"],
|
|
1863
|
+
[/б/, "b"],
|
|
1864
|
+
[/в/, "v"],
|
|
1865
|
+
[/г/, "h"],
|
|
1866
|
+
[/ґ/, "g"],
|
|
1867
|
+
[/д/, "d"],
|
|
1868
|
+
[/е/, "ie"],
|
|
1869
|
+
[/ё/, "io"],
|
|
1870
|
+
[/ж/, "ž"],
|
|
1871
|
+
[/з/, "z"],
|
|
1872
|
+
[/і/, "i"],
|
|
1873
|
+
[/й/, "j"],
|
|
1874
|
+
[/к/, "k"],
|
|
1875
|
+
[/л/, "ł"],
|
|
1876
|
+
[/м/, "m"],
|
|
1877
|
+
[/н/, "n"],
|
|
1878
|
+
[/о/, "o"],
|
|
1879
|
+
[/п/, "p"],
|
|
1880
|
+
[/р/, "r"],
|
|
1881
|
+
[/с/, "s"],
|
|
1882
|
+
[/т/, "t"],
|
|
1883
|
+
[/у/, "u"],
|
|
1884
|
+
[/ў/, "ŭ"],
|
|
1885
|
+
[/ф/, "f"],
|
|
1886
|
+
[/х/, "ch"],
|
|
1887
|
+
[/ц/, "c"],
|
|
1888
|
+
[/ч/, "č"],
|
|
1889
|
+
[/ш/, "š"],
|
|
1890
|
+
[/ы/, "y"],
|
|
1891
|
+
[/э/, "e"],
|
|
1892
|
+
[/ю/, "iu"],
|
|
1893
|
+
[/я/, "ia"],
|
|
1894
|
+
[/łi(?=[eoua])/, "l"],
|
|
1895
|
+
[/łi/, "li"]
|
|
1896
|
+
]
|
|
1897
|
+
].map(dictFrom.nonGlobal),
|
|
1898
|
+
upper: [
|
|
1899
|
+
[
|
|
1900
|
+
[new RegExp(" Е(?=[ \\p{P}\\d]*\\p{Lu}?\\p{Ll})", "u"), " Je"],
|
|
1901
|
+
[new RegExp(" Ё(?=[ \\p{P}\\d]*\\p{Lu}?\\p{Ll})", "u"), " Jo"],
|
|
1902
|
+
[new RegExp(" Ю(?=[ \\p{P}\\d]*\\p{Lu}?\\p{Ll})", "u"), " Ju"],
|
|
1903
|
+
[new RegExp(" Я(?=[ \\p{P}\\d]*\\p{Lu}?\\p{Ll})", "u"), " Ja"]
|
|
1904
|
+
],
|
|
1905
|
+
[
|
|
1906
|
+
[/([АЕЁІОУЎЫЭЮЯЬ| ]\(?)Е/, "$1JE"],
|
|
1907
|
+
[/([EАЕЁІОУЎЫЭЮЯЬ| ]\(?)Ё/, "$1JO"],
|
|
1908
|
+
[/([EOАЕЁІОУЎЫЭЮЯЬ| ]\(?)Ю/, "$1JU"],
|
|
1909
|
+
[/([EOUАЕЁІОУЎЫЭЮЯЬ| ]\(?)Я/, "$1JA"]
|
|
1910
|
+
],
|
|
1911
|
+
[
|
|
1912
|
+
[/Е/, "IE"],
|
|
1913
|
+
[/Ё/, "IO"],
|
|
1914
|
+
[/Ю/, "IU"],
|
|
1915
|
+
[/Я/, "IA"],
|
|
1916
|
+
[/Ц[Ьь]/, "Ć"],
|
|
1917
|
+
[/З[Ьь]/, "Ź"],
|
|
1918
|
+
[/С[Ьь]/, "Ś"],
|
|
1919
|
+
[/Н[Ьь]/, "Ń"],
|
|
1920
|
+
[/Л[Ьь]/, "L"],
|
|
1921
|
+
[/А/, "A"],
|
|
1922
|
+
[/Б/, "B"],
|
|
1923
|
+
[/В/, "V"],
|
|
1924
|
+
[/Г/, "H"],
|
|
1925
|
+
[/Ґ/, "G"],
|
|
1926
|
+
[/Д/, "D"],
|
|
1927
|
+
[/Ж/, "Ž"],
|
|
1928
|
+
[/З/, "Z"],
|
|
1929
|
+
[/І/, "I"],
|
|
1930
|
+
[/Й/, "J"],
|
|
1931
|
+
[/К/, "K"],
|
|
1932
|
+
[/Л/, "Ł"],
|
|
1933
|
+
[/М/, "M"],
|
|
1934
|
+
[/Н/, "N"],
|
|
1935
|
+
[/О/, "O"],
|
|
1936
|
+
[/П/, "P"],
|
|
1937
|
+
[/Р/, "R"],
|
|
1938
|
+
[/С/, "S"],
|
|
1939
|
+
[/Т/, "T"],
|
|
1940
|
+
[/У/, "U"],
|
|
1941
|
+
[/Ў/, "Ŭ"],
|
|
1942
|
+
[/Ф/, "F"],
|
|
1943
|
+
[/ Х(?=[\p{Ll} ])/u, " Ch"],
|
|
1944
|
+
[/Х/, "CH"],
|
|
1945
|
+
[/Ц/, "C"],
|
|
1946
|
+
[/Ч/, "Č"],
|
|
1947
|
+
[/Ш/, "Š"],
|
|
1948
|
+
[/Ы/, "Y"],
|
|
1949
|
+
[/Э/, "E"],
|
|
1950
|
+
[/Ł[Ii](?=[AEOUaeou])/, "L"],
|
|
1951
|
+
[/Ł(?=[Ii])/, "L"]
|
|
1952
|
+
]
|
|
1953
|
+
].map(dictFrom.nonGlobal)
|
|
1954
|
+
};
|
|
1955
|
+
var latin = {
|
|
1956
|
+
lower: [...common.lower[0], [/ʼі/g, "ji"], ...common.lower[1]],
|
|
1957
|
+
upper: common.upper.flat()
|
|
1958
|
+
};
|
|
1959
|
+
var latinJi = {
|
|
1960
|
+
lower: dictFrom.raw([
|
|
1961
|
+
[/([аеёіоуыэюяАЕЁІОУЫЭЮЯ] )і Ў/, "$1j U"],
|
|
1962
|
+
[/([аеёіоуыэюяАЕЁІОУЫЭЮЯ] )і ў/, "$1j u"],
|
|
1963
|
+
[/([аеёіоуыэюяАЕЁІОУЫЭЮЯ] )і /, "$1j "],
|
|
1964
|
+
[/([аеёіоуыэюяАЕЁІОУЫЭЮЯ] )І Ў/, "$1J U"],
|
|
1965
|
+
[/([аеёіоуыэюяАЕЁІОУЫЭЮЯ] )І ў/, "$1J u"],
|
|
1966
|
+
[/([аеёіоуыэюяАЕЁІОУЫЭЮЯ] )І /, "$1J "],
|
|
1967
|
+
[` і(?=${iwords})`, " ji"],
|
|
1968
|
+
[` І(?=${iwords})`, " Ji"],
|
|
1969
|
+
[` І(?=${iwords.toUpperCase()})`, " JI"]
|
|
1970
|
+
]).concat([
|
|
1971
|
+
...common.lower[0],
|
|
1972
|
+
[/([eouaаеёіоуыэюяʼАЕЁІОУЫЭЮЯЬ] *)і/g, "$1ji"],
|
|
1973
|
+
...common.lower[1]
|
|
1974
|
+
]),
|
|
1975
|
+
upper: [
|
|
1976
|
+
...common.upper[0],
|
|
1977
|
+
[new RegExp("([eoua] *)І(?=[ \\p{P}\\d]*\\p{Lu}?\\p{Ll})", "gu"), "$1Ji"],
|
|
1978
|
+
...common.upper[1],
|
|
1979
|
+
[/([AOEUАЕЁІОУЎЫЭЮЯ][( ]*)І/g, "$1JI"],
|
|
1980
|
+
...common.upper[2],
|
|
1981
|
+
[/ JIŁ -/g, " IŁ -"]
|
|
1982
|
+
]
|
|
1983
|
+
};
|
|
1984
|
+
|
|
1985
|
+
// src/dict/alphabets/arabic.ts
|
|
1986
|
+
var soft = "ْ(?=[еёіюяь])";
|
|
1987
|
+
var presoft = "([تزكثࢮбвгджзйклмнпрстфхцчшў])ْ?(ّ?)";
|
|
1988
|
+
var arabic = {
|
|
1989
|
+
lower: dictFrom.raw(
|
|
1990
|
+
[
|
|
1991
|
+
[/ л[ая]/, " لا"],
|
|
1992
|
+
[/л[ая]/, "ـلا"],
|
|
1993
|
+
// падваеньне зычнага, шадда
|
|
1994
|
+
[/([бвгджзйклмнпрстфхцчшў]|д[зж])\1/, "$1ّ"],
|
|
1995
|
+
// няма галоснага, сукун
|
|
1996
|
+
[/([бвгджзйклмнпрстфхцчшў])/, "$1ْ"],
|
|
1997
|
+
// а, аліф
|
|
1998
|
+
[/а/, "اа"],
|
|
1999
|
+
// першая галосная, аліф
|
|
2000
|
+
[/ (?=[еэыуо])/, " ا"],
|
|
2001
|
+
["дْз" + soft, "ࢮ"],
|
|
2002
|
+
["з" + soft, "ز"],
|
|
2003
|
+
["к" + soft, "ك"],
|
|
2004
|
+
["с" + soft, "ث"],
|
|
2005
|
+
["т" + soft, "ت"],
|
|
2006
|
+
[/([تزكث])і/, "ы"],
|
|
2007
|
+
// $2 - шадда
|
|
2008
|
+
[presoft + "[аяэе]", "$1$2َ"],
|
|
2009
|
+
[presoft + "[іы]", "$1$2ِ"],
|
|
2010
|
+
[/ і /, " اِ "],
|
|
2011
|
+
[presoft + "[оёую]", "$1$2ُ"],
|
|
2012
|
+
[/ʼ/, "ع"],
|
|
2013
|
+
[/ь/, ""],
|
|
2014
|
+
// [/[ьʼ]/, ''],
|
|
2015
|
+
[/[яе]/, "يَ"],
|
|
2016
|
+
[/і/, "يِ"],
|
|
2017
|
+
[/[ёю]/, "يُ"],
|
|
2018
|
+
[/[аэ]/, "َ"],
|
|
2019
|
+
[/[ыі]/, "ِ"],
|
|
2020
|
+
[/[оу]/, "ُ"],
|
|
2021
|
+
[/б/, "ب"],
|
|
2022
|
+
[/[вў]/, "و"],
|
|
2023
|
+
[/г/, "ه"],
|
|
2024
|
+
[/ґ/, "غ"],
|
|
2025
|
+
[/дْж/, "ج"],
|
|
2026
|
+
[/д/, "د"],
|
|
2027
|
+
[/ж/, "ژ"],
|
|
2028
|
+
[/з/, "ض"],
|
|
2029
|
+
[/й/, "ي"],
|
|
2030
|
+
[/к/, "ق"],
|
|
2031
|
+
[/л/, "ل"],
|
|
2032
|
+
[/м/, "م"],
|
|
2033
|
+
[/н/, "ن"],
|
|
2034
|
+
[/п/, "پ"],
|
|
2035
|
+
[/р/, "ر"],
|
|
2036
|
+
[/с/, "ص"],
|
|
2037
|
+
[/т/, "ط"],
|
|
2038
|
+
[/ф/, "ف"],
|
|
2039
|
+
[/х/, "ح"],
|
|
2040
|
+
[/ц/, "ࢯ"],
|
|
2041
|
+
[/ч/, "چ"],
|
|
2042
|
+
[/ш/, "ش"],
|
|
2043
|
+
[/,/, "،"],
|
|
2044
|
+
[/\?/, "؟"]
|
|
2045
|
+
],
|
|
2046
|
+
"gi"
|
|
2047
|
+
)
|
|
2052
2048
|
};
|
|
2053
2049
|
|
|
2054
2050
|
// src/config.ts
|
|
@@ -2069,7 +2065,7 @@ var TaraskConfig = class {
|
|
|
2069
2065
|
}
|
|
2070
2066
|
}
|
|
2071
2067
|
general = {
|
|
2072
|
-
abc:
|
|
2068
|
+
abc: alphabets_exports.cyrillic,
|
|
2073
2069
|
j: REPLACE_J.NEVER,
|
|
2074
2070
|
doEscapeCapitalized: true
|
|
2075
2071
|
};
|
|
@@ -2294,7 +2290,7 @@ var highlightDiffStep = (highlight) => (_, {
|
|
|
2294
2290
|
},
|
|
2295
2291
|
storage: { text, orig }
|
|
2296
2292
|
}) => {
|
|
2297
|
-
highlightDiff(text, orig, abc ===
|
|
2293
|
+
highlightDiff(text, orig, abc === alphabets_exports.cyrillic, highlight);
|
|
2298
2294
|
return _;
|
|
2299
2295
|
};
|
|
2300
2296
|
var highlightDiffNonHtmlStep = (_, {
|
|
@@ -2305,7 +2301,12 @@ var highlightDiffNonHtmlStep = (_, {
|
|
|
2305
2301
|
storage: { text, orig }
|
|
2306
2302
|
}) => {
|
|
2307
2303
|
if (ansiColors)
|
|
2308
|
-
highlightDiff(
|
|
2304
|
+
highlightDiff(
|
|
2305
|
+
text,
|
|
2306
|
+
orig,
|
|
2307
|
+
abc === alphabets_exports.cyrillic,
|
|
2308
|
+
ansiColorWrappers.fix
|
|
2309
|
+
);
|
|
2309
2310
|
return _;
|
|
2310
2311
|
};
|
|
2311
2312
|
|
|
@@ -2394,7 +2395,7 @@ var applyHtmlG = (text, {
|
|
|
2394
2395
|
}
|
|
2395
2396
|
}) => {
|
|
2396
2397
|
const colorize = htmlWrappers.letterH;
|
|
2397
|
-
return abc ===
|
|
2398
|
+
return abc === alphabets_exports.cyrillic ? replaceG(g ? colorize("$&") : ($0) => colorize(gobj[$0]))(text) : text;
|
|
2398
2399
|
};
|
|
2399
2400
|
|
|
2400
2401
|
// src/steps/i-to-j.ts
|
|
@@ -2403,7 +2404,7 @@ var replaceIbyJ = (text, {
|
|
|
2403
2404
|
cfg: {
|
|
2404
2405
|
general: { j, abc }
|
|
2405
2406
|
}
|
|
2406
|
-
}) => j && abc !==
|
|
2407
|
+
}) => j && abc !== alphabets_exports.latinJi ? text.replace(
|
|
2407
2408
|
/(?<=[аеёіоуыэюя] )і (ў?)/g,
|
|
2408
2409
|
j === REPLACE_J.ALWAYS ? ($0, $1) => toJ($1) : ($0, $1) => Math.random() >= 0.5 ? toJ($1) : $0
|
|
2409
2410
|
) : text;
|
|
@@ -2426,7 +2427,7 @@ var applyNonHtmlG = (text, {
|
|
|
2426
2427
|
}
|
|
2427
2428
|
}) => {
|
|
2428
2429
|
const colorize = ansiColorWrappers.variable;
|
|
2429
|
-
return abc ===
|
|
2430
|
+
return abc === alphabets_exports.cyrillic && (h || ansiColors) ? replaceG(
|
|
2430
2431
|
ansiColors ? h ? ($0) => colorize(gobj[$0]) : colorize("$&") : ($0) => gobj[$0]
|
|
2431
2432
|
)(text) : text;
|
|
2432
2433
|
};
|
|
@@ -2439,10 +2440,15 @@ var restoreCaseStep = (_, {
|
|
|
2439
2440
|
cfg: {
|
|
2440
2441
|
general: { abc }
|
|
2441
2442
|
},
|
|
2442
|
-
storage
|
|
2443
|
+
storage: { text, orig }
|
|
2443
2444
|
}) => {
|
|
2444
|
-
if (abc
|
|
2445
|
-
|
|
2445
|
+
if (abc.upper) {
|
|
2446
|
+
restoreCase(text, orig);
|
|
2447
|
+
} else {
|
|
2448
|
+
for (let i = 0; i < text.length; i++) {
|
|
2449
|
+
if (orig[i] !== orig[i].toLowerCase())
|
|
2450
|
+
text[i] = orig[i];
|
|
2451
|
+
}
|
|
2446
2452
|
}
|
|
2447
2453
|
return _;
|
|
2448
2454
|
};
|
|
@@ -2556,7 +2562,6 @@ var htmlPipeline = createPipeline(
|
|
|
2556
2562
|
);
|
|
2557
2563
|
// Annotate the CommonJS export names for ESM import in node:
|
|
2558
2564
|
0 && (module.exports = {
|
|
2559
|
-
ALPHABET,
|
|
2560
2565
|
REPLACE_J,
|
|
2561
2566
|
TaraskConfig,
|
|
2562
2567
|
VARIATION,
|