taraskevizer 4.1.1 → 5.0.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +0 -2
- package/dist/bin.js +0 -6
- package/dist/index.cjs +10 -135
- package/dist/index.d.ts +1 -2
- package/dist/index.js +10 -135
- package/package.json +1 -1
package/README.md
CHANGED
|
@@ -57,7 +57,6 @@ Default value: `0`
|
|
|
57
57
|
| 0 | cyrillic |
|
|
58
58
|
| 1 | latin |
|
|
59
59
|
| 2 | arabic |
|
|
60
|
-
| 3 | greek |
|
|
61
60
|
|
|
62
61
|
### j
|
|
63
62
|
|
|
@@ -191,7 +190,6 @@ $ tarask "планета"
|
|
|
191
190
|
# Alpabet
|
|
192
191
|
--latin (-l)
|
|
193
192
|
--arabic (-a)
|
|
194
|
-
--greek (-gr)
|
|
195
193
|
# When to replace і(i) by й(j) after vowels
|
|
196
194
|
--jrandom (-jr)
|
|
197
195
|
--jalways (-ja)
|
package/dist/bin.js
CHANGED
package/dist/index.cjs
CHANGED
|
@@ -129,126 +129,6 @@ var latinLettersUpperCase = [
|
|
|
129
129
|
[/ŁI/, "LI"]
|
|
130
130
|
];
|
|
131
131
|
|
|
132
|
-
// src/dict/greek.ts
|
|
133
|
-
var greekLetters = [
|
|
134
|
-
[/а/, "α"],
|
|
135
|
-
[/б/, "μπ"],
|
|
136
|
-
[/в/, "β"],
|
|
137
|
-
[/г/, "γ"],
|
|
138
|
-
[/ґ/, "γκ"],
|
|
139
|
-
[/д/, "δ"],
|
|
140
|
-
[/е/, "η"],
|
|
141
|
-
[/ё/, "υο"],
|
|
142
|
-
[/ж/, "ζ̌"],
|
|
143
|
-
[/з/, "ζ"],
|
|
144
|
-
[/і/, "ι"],
|
|
145
|
-
[/й/, "υ"],
|
|
146
|
-
[/к/, "κ"],
|
|
147
|
-
[/л/, "λ"],
|
|
148
|
-
[/мп/, "μ‘π"],
|
|
149
|
-
[/м/, "μ"],
|
|
150
|
-
[/н/, "ν"],
|
|
151
|
-
[/о/, "ο"],
|
|
152
|
-
[/п/, "π"],
|
|
153
|
-
[/р/, "ρ"],
|
|
154
|
-
[/с/, "σ"],
|
|
155
|
-
[/сь/, "ς"],
|
|
156
|
-
[/т/, "τ"],
|
|
157
|
-
[/у/, "ϋ"],
|
|
158
|
-
[/ў/, "ΰ"],
|
|
159
|
-
[/ф/, "φ"],
|
|
160
|
-
[/х/, "χ"],
|
|
161
|
-
[/ц/, "τσ"],
|
|
162
|
-
[/ць/, "τς"],
|
|
163
|
-
[/ч/, "τσ̌"],
|
|
164
|
-
[/ш/, "σ̌"],
|
|
165
|
-
[/ы/, "ί"],
|
|
166
|
-
[/э/, "ε"],
|
|
167
|
-
[/ю/, "υϋ"],
|
|
168
|
-
[/я/, "υα"],
|
|
169
|
-
[/ь/, "’"]
|
|
170
|
-
];
|
|
171
|
-
var greekLettersUpperCase = [
|
|
172
|
-
[new RegExp(" Б(?= *\\p{Ll})", "u"), " Μπ"],
|
|
173
|
-
[new RegExp(" Ґ(?= *\\p{Ll})", "u"), " Γκ"],
|
|
174
|
-
[new RegExp(" Ё(?= *\\p{Ll})", "u"), " Υο"],
|
|
175
|
-
[new RegExp(" Ю(?= *\\p{Ll})", "u"), " Υϋ"],
|
|
176
|
-
[new RegExp(" Я(?= *\\p{Ll})", "u"), " Υα"],
|
|
177
|
-
[new RegExp(" Ч(?= *\\p{Ll})", "u"), " Τσ̌"],
|
|
178
|
-
[/Б/, "ΜΠ"],
|
|
179
|
-
[/Ґ/, "ΓΚ"],
|
|
180
|
-
[/Ё/, "ΥΟ"],
|
|
181
|
-
[/Ю/, "ΥΫ"],
|
|
182
|
-
[/Я/, "ΥΑ"],
|
|
183
|
-
[/Ч/, "ΤΣ̌"],
|
|
184
|
-
[/А/, "Α"],
|
|
185
|
-
[/В/, "Β"],
|
|
186
|
-
[/Г/, "Γ"],
|
|
187
|
-
[/Д/, "Δ"],
|
|
188
|
-
[/Е/, "Η"],
|
|
189
|
-
[/Ж/, "Ζ̌"],
|
|
190
|
-
[/З/, "Ζ"],
|
|
191
|
-
[/І/, "Ι"],
|
|
192
|
-
[/Й/, "Υ"],
|
|
193
|
-
[/К/, "Κ"],
|
|
194
|
-
[/Л/, "Λ"],
|
|
195
|
-
[/МП/, "Μ‘Π"],
|
|
196
|
-
[/Мп/, "Μ‘π"],
|
|
197
|
-
[/М/, "Μ"],
|
|
198
|
-
[/Н/, "Ν"],
|
|
199
|
-
[/О/, "Ο"],
|
|
200
|
-
[/П/, "Π"],
|
|
201
|
-
[/Р/, "Ρ"],
|
|
202
|
-
[/С/, "Σ"],
|
|
203
|
-
[/С[Ьь]/, "ς"],
|
|
204
|
-
[/Т/, "Τ"],
|
|
205
|
-
[/У/, "Ϋ"],
|
|
206
|
-
[/Ў/, "Ϋ́"],
|
|
207
|
-
[/Ф/, "Φ"],
|
|
208
|
-
[/Х/, "Χ"],
|
|
209
|
-
[/Ц/, "Τσ"],
|
|
210
|
-
[/Ц[Ьь]/, "Τς"],
|
|
211
|
-
[/Ш/, "Σ̌"],
|
|
212
|
-
[/Ы/, "Ί"],
|
|
213
|
-
[/Э/, "Ε"],
|
|
214
|
-
[/Ь/, "’"]
|
|
215
|
-
];
|
|
216
|
-
var thWords = [
|
|
217
|
-
[/тэі(?=зм|ст)/, "θει"],
|
|
218
|
-
[/ агат/, " αγαθ"],
|
|
219
|
-
[/ анатэм/, " αναθεμ"],
|
|
220
|
-
[/антрапа/, "ανθραπα"],
|
|
221
|
-
[/ апатэ(?=оз|аты|м)/, " απαθε"],
|
|
222
|
-
[/ арта(?=графі|д[ао]кс|эпі)/, " αρθα"],
|
|
223
|
-
[/ арытмэт/, " αρίθμετ"],
|
|
224
|
-
[/ атэн/, " αθεν"],
|
|
225
|
-
[/ калітэ/, " καλιθε"],
|
|
226
|
-
[/ катэд(?=\(?а?р)/, " καθεδ"],
|
|
227
|
-
[/лябірынт/, "λυαμπιρίνθ"],
|
|
228
|
-
[/лягарытм/, "λυαγαρίθμ"],
|
|
229
|
-
[/ мар[фт]ы /, " μαρθί "],
|
|
230
|
-
[/ марфе /, " μαρθη "],
|
|
231
|
-
[/ матэматы/, " μαθεματί"],
|
|
232
|
-
[/ міт(?=[ауы]|оляг| )/, " μιθ"],
|
|
233
|
-
[/ мэт(?=[ао]д)/, " μεθ"],
|
|
234
|
-
[/пат(?=ал[ёя]гі|оляг|ычн|ыя|ы[ійю] |[ауы] |а[ўм] |амі | )/, "παθ"],
|
|
235
|
-
[/ пітагор/, " πιθαγορ"],
|
|
236
|
-
[/ ры[тф]м/, " ρίθμ"],
|
|
237
|
-
[/сынтэ[зт]/, "σίνθετ"],
|
|
238
|
-
[/ томас/, " θομασ"],
|
|
239
|
-
[/ тромб/, " θρομμπ"],
|
|
240
|
-
[/ трон/, " θρον"],
|
|
241
|
-
[/трамбоз/, "θραμμποζ"],
|
|
242
|
-
[/ тэадос/, " θεαδοσ"],
|
|
243
|
-
[/ тэарэм/, " θεαρεμ"],
|
|
244
|
-
[/ тэат(?=ар |р)/, " θεατ"],
|
|
245
|
-
[/ тэм(?=[аеуы])/, " θεμ"],
|
|
246
|
-
[/ тэ(?=[ао]р|салёнік|сал)/, " θε"],
|
|
247
|
-
[/тэ(?=с\S*алёнік|салё\)нік|\S*зіс)/, "θε"],
|
|
248
|
-
[/тэрма/, "θερμα"],
|
|
249
|
-
[/ эт(?=ы[кч]|эр)/, " εθ"]
|
|
250
|
-
];
|
|
251
|
-
|
|
252
132
|
// src/dict/arabic.ts
|
|
253
133
|
var soft = "ْ(?=[еёіюяь])";
|
|
254
134
|
var presoft = "([تزكثࢮбвгджзйклмнпрстфхцчшў])ْ?(ّ?)";
|
|
@@ -1992,7 +1872,7 @@ var rawWordlist = [
|
|
|
1992
1872
|
[/ расей /, " расе(й|яў) "],
|
|
1993
1873
|
[//, ""]
|
|
1994
1874
|
];
|
|
1995
|
-
var
|
|
1875
|
+
var rawsofteners = [
|
|
1996
1876
|
[/([лнц])\1(?=[еёіюяь])/, "$1ь$1"],
|
|
1997
1877
|
[/(\S\S)дз?дз(?=[еёіюяь])/, "$1дзьдз"],
|
|
1998
1878
|
[/адзьдз([ея])л/, "аддз$1л"],
|
|
@@ -2112,17 +1992,17 @@ var gobj = {
|
|
|
2112
1992
|
"Ґ": "Г"
|
|
2113
1993
|
};
|
|
2114
1994
|
var wordlist = [];
|
|
2115
|
-
var
|
|
1995
|
+
var softeners = [];
|
|
2116
1996
|
var arabLetters = [];
|
|
2117
1997
|
var arr = [
|
|
2118
1998
|
[rawWordlist, wordlist],
|
|
2119
|
-
[
|
|
1999
|
+
[rawsofteners, softeners],
|
|
2120
2000
|
[rawArabLetters, arabLetters]
|
|
2121
2001
|
];
|
|
2122
2002
|
for (const [raw, obj] of arr)
|
|
2123
2003
|
for (const [pattern, result] of raw)
|
|
2124
2004
|
obj.push([RegExp(pattern, "g"), result]);
|
|
2125
|
-
for (const obj of [latinLetters, latinLettersUpperCase
|
|
2005
|
+
for (const obj of [latinLetters, latinLettersUpperCase])
|
|
2126
2006
|
for (const item of obj)
|
|
2127
2007
|
item[0] = RegExp(item[0], "g" + item[0].flags);
|
|
2128
2008
|
for (const word of gwords)
|
|
@@ -2143,8 +2023,7 @@ var G_REGEX = /[Ґґ]/g;
|
|
|
2143
2023
|
var ALPHABET = {
|
|
2144
2024
|
CYRILLIC: 0,
|
|
2145
2025
|
LATIN: 1,
|
|
2146
|
-
ARABIC: 2
|
|
2147
|
-
GREEK: 3
|
|
2026
|
+
ARABIC: 2
|
|
2148
2027
|
};
|
|
2149
2028
|
var REPLACE_J = {
|
|
2150
2029
|
NEVER: 0,
|
|
@@ -2158,12 +2037,10 @@ var VARIATION = {
|
|
|
2158
2037
|
};
|
|
2159
2038
|
var letters = {
|
|
2160
2039
|
[ALPHABET.LATIN]: latinLetters,
|
|
2161
|
-
[ALPHABET.ARABIC]: arabLetters
|
|
2162
|
-
[ALPHABET.GREEK]: greekLetters
|
|
2040
|
+
[ALPHABET.ARABIC]: arabLetters
|
|
2163
2041
|
};
|
|
2164
2042
|
var lettersUpperCase = {
|
|
2165
|
-
[ALPHABET.LATIN]: latinLettersUpperCase
|
|
2166
|
-
[ALPHABET.GREEK]: greekLettersUpperCase
|
|
2043
|
+
[ALPHABET.LATIN]: latinLettersUpperCase
|
|
2167
2044
|
};
|
|
2168
2045
|
var wrappers = {
|
|
2169
2046
|
html: {
|
|
@@ -2290,7 +2167,7 @@ var replaceIbyJ = (text, always = false) => text.replace(
|
|
|
2290
2167
|
);
|
|
2291
2168
|
var __tarask__ = {
|
|
2292
2169
|
wordlist,
|
|
2293
|
-
|
|
2170
|
+
softeners,
|
|
2294
2171
|
replaceWithDict,
|
|
2295
2172
|
afterTarask
|
|
2296
2173
|
};
|
|
@@ -2379,8 +2256,6 @@ var Taraskevizer = class {
|
|
|
2379
2256
|
text = this.taraskevize(text.toLowerCase());
|
|
2380
2257
|
if (j)
|
|
2381
2258
|
text = replaceIbyJ(text, j === REPLACE_J.ALWAYS);
|
|
2382
|
-
if (abc === ALPHABET.GREEK)
|
|
2383
|
-
text = replaceWithDict(text, thWords);
|
|
2384
2259
|
text = replaceWithDict(text, letters[abc]);
|
|
2385
2260
|
splitted = text.split(" ");
|
|
2386
2261
|
if (abc !== ALPHABET.ARABIC)
|
|
@@ -2391,8 +2266,8 @@ var Taraskevizer = class {
|
|
|
2391
2266
|
text = replaceWithDict(text, wordlist);
|
|
2392
2267
|
softening:
|
|
2393
2268
|
do {
|
|
2394
|
-
text = replaceWithDict(text,
|
|
2395
|
-
for (const [pattern, result] of
|
|
2269
|
+
text = replaceWithDict(text, softeners);
|
|
2270
|
+
for (const [pattern, result] of softeners)
|
|
2396
2271
|
if (result !== "$1дзьдз" && pattern.test(text))
|
|
2397
2272
|
continue softening;
|
|
2398
2273
|
break;
|
package/dist/index.d.ts
CHANGED
|
@@ -27,7 +27,6 @@ declare const ALPHABET: {
|
|
|
27
27
|
readonly CYRILLIC: 0;
|
|
28
28
|
readonly LATIN: 1;
|
|
29
29
|
readonly ARABIC: 2;
|
|
30
|
-
readonly GREEK: 3;
|
|
31
30
|
};
|
|
32
31
|
declare const REPLACE_J: {
|
|
33
32
|
readonly NEVER: 0;
|
|
@@ -41,7 +40,7 @@ declare const VARIATION: {
|
|
|
41
40
|
};
|
|
42
41
|
declare const __tarask__: {
|
|
43
42
|
readonly wordlist: Dict;
|
|
44
|
-
readonly
|
|
43
|
+
readonly softeners: Dict;
|
|
45
44
|
readonly replaceWithDict: (text: string, dict?: ExtendedDict) => string;
|
|
46
45
|
readonly afterTarask: ExtendedDict;
|
|
47
46
|
};
|
package/dist/index.js
CHANGED
|
@@ -98,126 +98,6 @@ var latinLettersUpperCase = [
|
|
|
98
98
|
[/ŁI/, "LI"]
|
|
99
99
|
];
|
|
100
100
|
|
|
101
|
-
// src/dict/greek.ts
|
|
102
|
-
var greekLetters = [
|
|
103
|
-
[/а/, "α"],
|
|
104
|
-
[/б/, "μπ"],
|
|
105
|
-
[/в/, "β"],
|
|
106
|
-
[/г/, "γ"],
|
|
107
|
-
[/ґ/, "γκ"],
|
|
108
|
-
[/д/, "δ"],
|
|
109
|
-
[/е/, "η"],
|
|
110
|
-
[/ё/, "υο"],
|
|
111
|
-
[/ж/, "ζ̌"],
|
|
112
|
-
[/з/, "ζ"],
|
|
113
|
-
[/і/, "ι"],
|
|
114
|
-
[/й/, "υ"],
|
|
115
|
-
[/к/, "κ"],
|
|
116
|
-
[/л/, "λ"],
|
|
117
|
-
[/мп/, "μ‘π"],
|
|
118
|
-
[/м/, "μ"],
|
|
119
|
-
[/н/, "ν"],
|
|
120
|
-
[/о/, "ο"],
|
|
121
|
-
[/п/, "π"],
|
|
122
|
-
[/р/, "ρ"],
|
|
123
|
-
[/с/, "σ"],
|
|
124
|
-
[/сь/, "ς"],
|
|
125
|
-
[/т/, "τ"],
|
|
126
|
-
[/у/, "ϋ"],
|
|
127
|
-
[/ў/, "ΰ"],
|
|
128
|
-
[/ф/, "φ"],
|
|
129
|
-
[/х/, "χ"],
|
|
130
|
-
[/ц/, "τσ"],
|
|
131
|
-
[/ць/, "τς"],
|
|
132
|
-
[/ч/, "τσ̌"],
|
|
133
|
-
[/ш/, "σ̌"],
|
|
134
|
-
[/ы/, "ί"],
|
|
135
|
-
[/э/, "ε"],
|
|
136
|
-
[/ю/, "υϋ"],
|
|
137
|
-
[/я/, "υα"],
|
|
138
|
-
[/ь/, "’"]
|
|
139
|
-
];
|
|
140
|
-
var greekLettersUpperCase = [
|
|
141
|
-
[new RegExp(" Б(?= *\\p{Ll})", "u"), " Μπ"],
|
|
142
|
-
[new RegExp(" Ґ(?= *\\p{Ll})", "u"), " Γκ"],
|
|
143
|
-
[new RegExp(" Ё(?= *\\p{Ll})", "u"), " Υο"],
|
|
144
|
-
[new RegExp(" Ю(?= *\\p{Ll})", "u"), " Υϋ"],
|
|
145
|
-
[new RegExp(" Я(?= *\\p{Ll})", "u"), " Υα"],
|
|
146
|
-
[new RegExp(" Ч(?= *\\p{Ll})", "u"), " Τσ̌"],
|
|
147
|
-
[/Б/, "ΜΠ"],
|
|
148
|
-
[/Ґ/, "ΓΚ"],
|
|
149
|
-
[/Ё/, "ΥΟ"],
|
|
150
|
-
[/Ю/, "ΥΫ"],
|
|
151
|
-
[/Я/, "ΥΑ"],
|
|
152
|
-
[/Ч/, "ΤΣ̌"],
|
|
153
|
-
[/А/, "Α"],
|
|
154
|
-
[/В/, "Β"],
|
|
155
|
-
[/Г/, "Γ"],
|
|
156
|
-
[/Д/, "Δ"],
|
|
157
|
-
[/Е/, "Η"],
|
|
158
|
-
[/Ж/, "Ζ̌"],
|
|
159
|
-
[/З/, "Ζ"],
|
|
160
|
-
[/І/, "Ι"],
|
|
161
|
-
[/Й/, "Υ"],
|
|
162
|
-
[/К/, "Κ"],
|
|
163
|
-
[/Л/, "Λ"],
|
|
164
|
-
[/МП/, "Μ‘Π"],
|
|
165
|
-
[/Мп/, "Μ‘π"],
|
|
166
|
-
[/М/, "Μ"],
|
|
167
|
-
[/Н/, "Ν"],
|
|
168
|
-
[/О/, "Ο"],
|
|
169
|
-
[/П/, "Π"],
|
|
170
|
-
[/Р/, "Ρ"],
|
|
171
|
-
[/С/, "Σ"],
|
|
172
|
-
[/С[Ьь]/, "ς"],
|
|
173
|
-
[/Т/, "Τ"],
|
|
174
|
-
[/У/, "Ϋ"],
|
|
175
|
-
[/Ў/, "Ϋ́"],
|
|
176
|
-
[/Ф/, "Φ"],
|
|
177
|
-
[/Х/, "Χ"],
|
|
178
|
-
[/Ц/, "Τσ"],
|
|
179
|
-
[/Ц[Ьь]/, "Τς"],
|
|
180
|
-
[/Ш/, "Σ̌"],
|
|
181
|
-
[/Ы/, "Ί"],
|
|
182
|
-
[/Э/, "Ε"],
|
|
183
|
-
[/Ь/, "’"]
|
|
184
|
-
];
|
|
185
|
-
var thWords = [
|
|
186
|
-
[/тэі(?=зм|ст)/, "θει"],
|
|
187
|
-
[/ агат/, " αγαθ"],
|
|
188
|
-
[/ анатэм/, " αναθεμ"],
|
|
189
|
-
[/антрапа/, "ανθραπα"],
|
|
190
|
-
[/ апатэ(?=оз|аты|м)/, " απαθε"],
|
|
191
|
-
[/ арта(?=графі|д[ао]кс|эпі)/, " αρθα"],
|
|
192
|
-
[/ арытмэт/, " αρίθμετ"],
|
|
193
|
-
[/ атэн/, " αθεν"],
|
|
194
|
-
[/ калітэ/, " καλιθε"],
|
|
195
|
-
[/ катэд(?=\(?а?р)/, " καθεδ"],
|
|
196
|
-
[/лябірынт/, "λυαμπιρίνθ"],
|
|
197
|
-
[/лягарытм/, "λυαγαρίθμ"],
|
|
198
|
-
[/ мар[фт]ы /, " μαρθί "],
|
|
199
|
-
[/ марфе /, " μαρθη "],
|
|
200
|
-
[/ матэматы/, " μαθεματί"],
|
|
201
|
-
[/ міт(?=[ауы]|оляг| )/, " μιθ"],
|
|
202
|
-
[/ мэт(?=[ао]д)/, " μεθ"],
|
|
203
|
-
[/пат(?=ал[ёя]гі|оляг|ычн|ыя|ы[ійю] |[ауы] |а[ўм] |амі | )/, "παθ"],
|
|
204
|
-
[/ пітагор/, " πιθαγορ"],
|
|
205
|
-
[/ ры[тф]м/, " ρίθμ"],
|
|
206
|
-
[/сынтэ[зт]/, "σίνθετ"],
|
|
207
|
-
[/ томас/, " θομασ"],
|
|
208
|
-
[/ тромб/, " θρομμπ"],
|
|
209
|
-
[/ трон/, " θρον"],
|
|
210
|
-
[/трамбоз/, "θραμμποζ"],
|
|
211
|
-
[/ тэадос/, " θεαδοσ"],
|
|
212
|
-
[/ тэарэм/, " θεαρεμ"],
|
|
213
|
-
[/ тэат(?=ар |р)/, " θεατ"],
|
|
214
|
-
[/ тэм(?=[аеуы])/, " θεμ"],
|
|
215
|
-
[/ тэ(?=[ао]р|салёнік|сал)/, " θε"],
|
|
216
|
-
[/тэ(?=с\S*алёнік|салё\)нік|\S*зіс)/, "θε"],
|
|
217
|
-
[/тэрма/, "θερμα"],
|
|
218
|
-
[/ эт(?=ы[кч]|эр)/, " εθ"]
|
|
219
|
-
];
|
|
220
|
-
|
|
221
101
|
// src/dict/arabic.ts
|
|
222
102
|
var soft = "ْ(?=[еёіюяь])";
|
|
223
103
|
var presoft = "([تزكثࢮбвгджзйклмнпрстфхцчшў])ْ?(ّ?)";
|
|
@@ -1961,7 +1841,7 @@ var rawWordlist = [
|
|
|
1961
1841
|
[/ расей /, " расе(й|яў) "],
|
|
1962
1842
|
[//, ""]
|
|
1963
1843
|
];
|
|
1964
|
-
var
|
|
1844
|
+
var rawsofteners = [
|
|
1965
1845
|
[/([лнц])\1(?=[еёіюяь])/, "$1ь$1"],
|
|
1966
1846
|
[/(\S\S)дз?дз(?=[еёіюяь])/, "$1дзьдз"],
|
|
1967
1847
|
[/адзьдз([ея])л/, "аддз$1л"],
|
|
@@ -2081,17 +1961,17 @@ var gobj = {
|
|
|
2081
1961
|
"Ґ": "Г"
|
|
2082
1962
|
};
|
|
2083
1963
|
var wordlist = [];
|
|
2084
|
-
var
|
|
1964
|
+
var softeners = [];
|
|
2085
1965
|
var arabLetters = [];
|
|
2086
1966
|
var arr = [
|
|
2087
1967
|
[rawWordlist, wordlist],
|
|
2088
|
-
[
|
|
1968
|
+
[rawsofteners, softeners],
|
|
2089
1969
|
[rawArabLetters, arabLetters]
|
|
2090
1970
|
];
|
|
2091
1971
|
for (const [raw, obj] of arr)
|
|
2092
1972
|
for (const [pattern, result] of raw)
|
|
2093
1973
|
obj.push([RegExp(pattern, "g"), result]);
|
|
2094
|
-
for (const obj of [latinLetters, latinLettersUpperCase
|
|
1974
|
+
for (const obj of [latinLetters, latinLettersUpperCase])
|
|
2095
1975
|
for (const item of obj)
|
|
2096
1976
|
item[0] = RegExp(item[0], "g" + item[0].flags);
|
|
2097
1977
|
for (const word of gwords)
|
|
@@ -2112,8 +1992,7 @@ var G_REGEX = /[Ґґ]/g;
|
|
|
2112
1992
|
var ALPHABET = {
|
|
2113
1993
|
CYRILLIC: 0,
|
|
2114
1994
|
LATIN: 1,
|
|
2115
|
-
ARABIC: 2
|
|
2116
|
-
GREEK: 3
|
|
1995
|
+
ARABIC: 2
|
|
2117
1996
|
};
|
|
2118
1997
|
var REPLACE_J = {
|
|
2119
1998
|
NEVER: 0,
|
|
@@ -2127,12 +2006,10 @@ var VARIATION = {
|
|
|
2127
2006
|
};
|
|
2128
2007
|
var letters = {
|
|
2129
2008
|
[ALPHABET.LATIN]: latinLetters,
|
|
2130
|
-
[ALPHABET.ARABIC]: arabLetters
|
|
2131
|
-
[ALPHABET.GREEK]: greekLetters
|
|
2009
|
+
[ALPHABET.ARABIC]: arabLetters
|
|
2132
2010
|
};
|
|
2133
2011
|
var lettersUpperCase = {
|
|
2134
|
-
[ALPHABET.LATIN]: latinLettersUpperCase
|
|
2135
|
-
[ALPHABET.GREEK]: greekLettersUpperCase
|
|
2012
|
+
[ALPHABET.LATIN]: latinLettersUpperCase
|
|
2136
2013
|
};
|
|
2137
2014
|
var wrappers = {
|
|
2138
2015
|
html: {
|
|
@@ -2259,7 +2136,7 @@ var replaceIbyJ = (text, always = false) => text.replace(
|
|
|
2259
2136
|
);
|
|
2260
2137
|
var __tarask__ = {
|
|
2261
2138
|
wordlist,
|
|
2262
|
-
|
|
2139
|
+
softeners,
|
|
2263
2140
|
replaceWithDict,
|
|
2264
2141
|
afterTarask
|
|
2265
2142
|
};
|
|
@@ -2348,8 +2225,6 @@ var Taraskevizer = class {
|
|
|
2348
2225
|
text = this.taraskevize(text.toLowerCase());
|
|
2349
2226
|
if (j)
|
|
2350
2227
|
text = replaceIbyJ(text, j === REPLACE_J.ALWAYS);
|
|
2351
|
-
if (abc === ALPHABET.GREEK)
|
|
2352
|
-
text = replaceWithDict(text, thWords);
|
|
2353
2228
|
text = replaceWithDict(text, letters[abc]);
|
|
2354
2229
|
splitted = text.split(" ");
|
|
2355
2230
|
if (abc !== ALPHABET.ARABIC)
|
|
@@ -2360,8 +2235,8 @@ var Taraskevizer = class {
|
|
|
2360
2235
|
text = replaceWithDict(text, wordlist);
|
|
2361
2236
|
softening:
|
|
2362
2237
|
do {
|
|
2363
|
-
text = replaceWithDict(text,
|
|
2364
|
-
for (const [pattern, result] of
|
|
2238
|
+
text = replaceWithDict(text, softeners);
|
|
2239
|
+
for (const [pattern, result] of softeners)
|
|
2365
2240
|
if (result !== "$1дзьдз" && pattern.test(text))
|
|
2366
2241
|
continue softening;
|
|
2367
2242
|
break;
|