@qvac/translation-nmtcpp 0.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (109) hide show
  1. package/LICENSE +202 -0
  2. package/README.md +470 -0
  3. package/binding.js +1 -0
  4. package/index.d.ts +82 -0
  5. package/index.js +188 -0
  6. package/lib/error.js +65 -0
  7. package/marian.js +186 -0
  8. package/package.json +69 -0
  9. package/prebuilds/android-arm/qvac__translation-nmtcpp.bare +0 -0
  10. package/prebuilds/android-arm64/qvac__translation-nmtcpp.bare +0 -0
  11. package/prebuilds/android-ia32/qvac__translation-nmtcpp.bare +0 -0
  12. package/prebuilds/android-x64/qvac__translation-nmtcpp.bare +0 -0
  13. package/prebuilds/darwin-arm64/qvac__translation-nmtcpp.bare +0 -0
  14. package/prebuilds/darwin-arm64/qvac__translation-nmtcpp.bare.exports +3622 -0
  15. package/prebuilds/darwin-x64/qvac__translation-nmtcpp.bare +0 -0
  16. package/prebuilds/darwin-x64/qvac__translation-nmtcpp.bare.exports +3731 -0
  17. package/prebuilds/ios-arm64/qvac__translation-nmtcpp.bare +0 -0
  18. package/prebuilds/ios-arm64/qvac__translation-nmtcpp.bare.exports +3603 -0
  19. package/prebuilds/ios-arm64-simulator/qvac__translation-nmtcpp.bare +0 -0
  20. package/prebuilds/ios-arm64-simulator/qvac__translation-nmtcpp.bare.exports +3603 -0
  21. package/prebuilds/ios-x64-simulator/qvac__translation-nmtcpp.bare +0 -0
  22. package/prebuilds/ios-x64-simulator/qvac__translation-nmtcpp.bare.exports +3720 -0
  23. package/prebuilds/linux-x64/qvac__translation-nmtcpp.bare +0 -0
  24. package/prebuilds/win32-x64/qvac__translation-nmtcpp.bare +0 -0
  25. package/prebuilds/win32-x64/qvac__translation-nmtcpp.bare.exports +0 -0
  26. package/third-party/indic-processor-deps/indicnlp/INDIC_NLP_LICENCE +9 -0
  27. package/third-party/indic-processor-deps/indicnlp/index.js +11 -0
  28. package/third-party/indic-processor-deps/indicnlp/indic_detokenize.js +141 -0
  29. package/third-party/indic-processor-deps/indicnlp/indic_normalize.js +1213 -0
  30. package/third-party/indic-processor-deps/indicnlp/indic_tokenize.js +123 -0
  31. package/third-party/indic-processor-deps/indicnlp/langinfo.js +609 -0
  32. package/third-party/indic-processor-deps/indicnlp/sinhala_transliterator.js +197 -0
  33. package/third-party/indic-processor-deps/indicnlp/unicode_transliterator.js +120 -0
  34. package/third-party/indic-processor-deps/sacremoses/SACREMOSES_LICENCE +21 -0
  35. package/third-party/indic-processor-deps/sacremoses/cjk.js +202 -0
  36. package/third-party/indic-processor-deps/sacremoses/data/nonbreaking_prefixes/README.txt +8 -0
  37. package/third-party/indic-processor-deps/sacremoses/data/nonbreaking_prefixes/nonbreaking_prefix.as +65 -0
  38. package/third-party/indic-processor-deps/sacremoses/data/nonbreaking_prefixes/nonbreaking_prefix.bn +65 -0
  39. package/third-party/indic-processor-deps/sacremoses/data/nonbreaking_prefixes/nonbreaking_prefix.ca +75 -0
  40. package/third-party/indic-processor-deps/sacremoses/data/nonbreaking_prefixes/nonbreaking_prefix.cs +390 -0
  41. package/third-party/indic-processor-deps/sacremoses/data/nonbreaking_prefixes/nonbreaking_prefix.de +325 -0
  42. package/third-party/indic-processor-deps/sacremoses/data/nonbreaking_prefixes/nonbreaking_prefix.el +1568 -0
  43. package/third-party/indic-processor-deps/sacremoses/data/nonbreaking_prefixes/nonbreaking_prefix.en +123 -0
  44. package/third-party/indic-processor-deps/sacremoses/data/nonbreaking_prefixes/nonbreaking_prefix.es +118 -0
  45. package/third-party/indic-processor-deps/sacremoses/data/nonbreaking_prefixes/nonbreaking_prefix.et +138 -0
  46. package/third-party/indic-processor-deps/sacremoses/data/nonbreaking_prefixes/nonbreaking_prefix.fi +138 -0
  47. package/third-party/indic-processor-deps/sacremoses/data/nonbreaking_prefixes/nonbreaking_prefix.fr +153 -0
  48. package/third-party/indic-processor-deps/sacremoses/data/nonbreaking_prefixes/nonbreaking_prefix.ga +48 -0
  49. package/third-party/indic-processor-deps/sacremoses/data/nonbreaking_prefixes/nonbreaking_prefix.gu +105 -0
  50. package/third-party/indic-processor-deps/sacremoses/data/nonbreaking_prefixes/nonbreaking_prefix.hi +113 -0
  51. package/third-party/indic-processor-deps/sacremoses/data/nonbreaking_prefixes/nonbreaking_prefix.hu +103 -0
  52. package/third-party/indic-processor-deps/sacremoses/data/nonbreaking_prefixes/nonbreaking_prefix.is +251 -0
  53. package/third-party/indic-processor-deps/sacremoses/data/nonbreaking_prefixes/nonbreaking_prefix.it +180 -0
  54. package/third-party/indic-processor-deps/sacremoses/data/nonbreaking_prefixes/nonbreaking_prefix.kn +70 -0
  55. package/third-party/indic-processor-deps/sacremoses/data/nonbreaking_prefixes/nonbreaking_prefix.lt +698 -0
  56. package/third-party/indic-processor-deps/sacremoses/data/nonbreaking_prefixes/nonbreaking_prefix.lv +100 -0
  57. package/third-party/indic-processor-deps/sacremoses/data/nonbreaking_prefixes/nonbreaking_prefix.ml +67 -0
  58. package/third-party/indic-processor-deps/sacremoses/data/nonbreaking_prefixes/nonbreaking_prefix.mni +65 -0
  59. package/third-party/indic-processor-deps/sacremoses/data/nonbreaking_prefixes/nonbreaking_prefix.mr +113 -0
  60. package/third-party/indic-processor-deps/sacremoses/data/nonbreaking_prefixes/nonbreaking_prefix.nl +115 -0
  61. package/third-party/indic-processor-deps/sacremoses/data/nonbreaking_prefixes/nonbreaking_prefix.or +101 -0
  62. package/third-party/indic-processor-deps/sacremoses/data/nonbreaking_prefixes/nonbreaking_prefix.pa +102 -0
  63. package/third-party/indic-processor-deps/sacremoses/data/nonbreaking_prefixes/nonbreaking_prefix.pl +283 -0
  64. package/third-party/indic-processor-deps/sacremoses/data/nonbreaking_prefixes/nonbreaking_prefix.pt +210 -0
  65. package/third-party/indic-processor-deps/sacremoses/data/nonbreaking_prefixes/nonbreaking_prefix.ro +38 -0
  66. package/third-party/indic-processor-deps/sacremoses/data/nonbreaking_prefixes/nonbreaking_prefix.ru +293 -0
  67. package/third-party/indic-processor-deps/sacremoses/data/nonbreaking_prefixes/nonbreaking_prefix.sk +474 -0
  68. package/third-party/indic-processor-deps/sacremoses/data/nonbreaking_prefixes/nonbreaking_prefix.sl +78 -0
  69. package/third-party/indic-processor-deps/sacremoses/data/nonbreaking_prefixes/nonbreaking_prefix.sv +97 -0
  70. package/third-party/indic-processor-deps/sacremoses/data/nonbreaking_prefixes/nonbreaking_prefix.ta +71 -0
  71. package/third-party/indic-processor-deps/sacremoses/data/nonbreaking_prefixes/nonbreaking_prefix.tdt +210 -0
  72. package/third-party/indic-processor-deps/sacremoses/data/nonbreaking_prefixes/nonbreaking_prefix.te +70 -0
  73. package/third-party/indic-processor-deps/sacremoses/data/nonbreaking_prefixes/nonbreaking_prefix.yue +53 -0
  74. package/third-party/indic-processor-deps/sacremoses/data/nonbreaking_prefixes/nonbreaking_prefix.zh +53 -0
  75. package/third-party/indic-processor-deps/sacremoses/data/perluniprops/CJK.txt +23246 -0
  76. package/third-party/indic-processor-deps/sacremoses/data/perluniprops/CJKSymbols.txt +1 -0
  77. package/third-party/indic-processor-deps/sacremoses/data/perluniprops/Close_Punctuation.txt +1 -0
  78. package/third-party/indic-processor-deps/sacremoses/data/perluniprops/Currency_Symbol.txt +1 -0
  79. package/third-party/indic-processor-deps/sacremoses/data/perluniprops/Han.txt +1 -0
  80. package/third-party/indic-processor-deps/sacremoses/data/perluniprops/Hangul.txt +1 -0
  81. package/third-party/indic-processor-deps/sacremoses/data/perluniprops/Hangul_Syllables.txt +1 -0
  82. package/third-party/indic-processor-deps/sacremoses/data/perluniprops/Hiragana.txt +1 -0
  83. package/third-party/indic-processor-deps/sacremoses/data/perluniprops/IsAlnum-unichars-au.txt +1 -0
  84. package/third-party/indic-processor-deps/sacremoses/data/perluniprops/IsAlnum.txt +1 -0
  85. package/third-party/indic-processor-deps/sacremoses/data/perluniprops/IsAlpha-unichars-au.txt +1 -0
  86. package/third-party/indic-processor-deps/sacremoses/data/perluniprops/IsAlpha.txt +1 -0
  87. package/third-party/indic-processor-deps/sacremoses/data/perluniprops/IsLower.txt +1 -0
  88. package/third-party/indic-processor-deps/sacremoses/data/perluniprops/IsN.txt +1 -0
  89. package/third-party/indic-processor-deps/sacremoses/data/perluniprops/IsPf.txt +1 -0
  90. package/third-party/indic-processor-deps/sacremoses/data/perluniprops/IsPi.txt +1 -0
  91. package/third-party/indic-processor-deps/sacremoses/data/perluniprops/IsSc.txt +1 -0
  92. package/third-party/indic-processor-deps/sacremoses/data/perluniprops/IsSo.txt +1 -0
  93. package/third-party/indic-processor-deps/sacremoses/data/perluniprops/IsUpper.txt +1 -0
  94. package/third-party/indic-processor-deps/sacremoses/data/perluniprops/Katakana.txt +1 -0
  95. package/third-party/indic-processor-deps/sacremoses/data/perluniprops/Line_Separator.txt +1 -0
  96. package/third-party/indic-processor-deps/sacremoses/data/perluniprops/Lowercase_Letter.txt +1 -0
  97. package/third-party/indic-processor-deps/sacremoses/data/perluniprops/Number.txt +1 -0
  98. package/third-party/indic-processor-deps/sacremoses/data/perluniprops/Open_Punctuation.txt +1 -0
  99. package/third-party/indic-processor-deps/sacremoses/data/perluniprops/Punctuation.txt +1 -0
  100. package/third-party/indic-processor-deps/sacremoses/data/perluniprops/Separator.txt +1 -0
  101. package/third-party/indic-processor-deps/sacremoses/data/perluniprops/Symbol.txt +1 -0
  102. package/third-party/indic-processor-deps/sacremoses/data/perluniprops/Titlecase_Letter.txt +1 -0
  103. package/third-party/indic-processor-deps/sacremoses/data/perluniprops/Uppercase_Letter.txt +1 -0
  104. package/third-party/indic-processor-deps/sacremoses/index.js +8 -0
  105. package/third-party/indic-processor-deps/sacremoses/indic.js +76 -0
  106. package/third-party/indic-processor-deps/sacremoses/normalizer.js +264 -0
  107. package/third-party/indic-processor-deps/sacremoses/pernuliprops.js +287 -0
  108. package/third-party/indic-processor-deps/sacremoses/tokenizer.js +1217 -0
  109. package/third-party/indic-processor.js +565 -0
@@ -0,0 +1,70 @@
1
+ #Anything in this file, followed by a period (and an upper-case word), does NOT indicate an end-of-sentence marker.
2
+
3
+ #common exceptions
4
+ # Rs
5
+ ರೂ
6
+ # Dr
7
+ ಡಾ
8
+ # Mr
9
+ ಶ್ರೀ
10
+
11
+ #others
12
+
13
+
14
+ #phonetics
15
+ # A
16
+
17
+ # B
18
+ ಬಿ
19
+ # C
20
+ ಸಿ
21
+ # D
22
+ ಡಿ
23
+ # E
24
+
25
+ # F
26
+ ಎಫ್
27
+ # G
28
+ ಜಿ
29
+ # H
30
+ ಹೆಚ್
31
+ ಎಚ್‌
32
+ # I
33
+
34
+ # J
35
+ ಜೆ
36
+ # K
37
+ ಕೆ
38
+ # L
39
+ ಎಲ್
40
+ # M
41
+ ಎಂ
42
+ # N
43
+ ಎನ್
44
+ # O
45
+
46
+ # P
47
+ ಪಿ
48
+ # Q
49
+ ಕ್ಯೂ
50
+ # R
51
+ ಆರ್
52
+ # S
53
+ ಎಸ್
54
+ # T
55
+ ಟಿ
56
+ # U
57
+ ಯು
58
+ # V
59
+ ವಿ
60
+ # W
61
+ ಡಬ್ಲ್ಯೂ
62
+ # X
63
+ ಎಕ್ಸ್
64
+ # Y
65
+ ವೈ
66
+ # Z
67
+ ಜೆಡ್
68
+
69
+ #consonants
70
+
@@ -0,0 +1,698 @@
1
+ # Anything in this file, followed by a period (and an upper-case word),
2
+ # does NOT indicate an end-of-sentence marker.
3
+ # Special cases are included for prefixes that ONLY appear before 0-9 numbers.
4
+
5
+ # Any single upper case letter followed by a period is not a sentence ender
6
+ # (excluding I occasionally, but we leave it in)
7
+ # usually upper case letters are initials in a name
8
+ A
9
+ Ā
10
+ B
11
+ C
12
+ Č
13
+ D
14
+ E
15
+ Ē
16
+ F
17
+ G
18
+ Ģ
19
+ H
20
+ I
21
+ Ī
22
+ J
23
+ K
24
+ Ķ
25
+ L
26
+ Ļ
27
+ M
28
+ N
29
+ Ņ
30
+ O
31
+ P
32
+ Q
33
+ R
34
+ S
35
+ Š
36
+ T
37
+ U
38
+ Ū
39
+ V
40
+ W
41
+ X
42
+ Y
43
+ Z
44
+ Ž
45
+
46
+ # Initialis -- Džonas
47
+ Dz
48
+
49
+ Just
50
+
51
+ # Day and month abbreviations
52
+ # m. menesis d. diena g. gimes
53
+ m
54
+ mėn
55
+ d
56
+ g
57
+ gim
58
+ # Pirmadienis Penktadienis
59
+ Pr
60
+ Pn
61
+ Pirm
62
+ Antr
63
+ Treč
64
+ Ketv
65
+ Penkt
66
+ Šešt
67
+ Sekm
68
+ Saus
69
+ Vas
70
+ Kov
71
+ Bal
72
+ Geg
73
+ Birž
74
+ Liep
75
+ Rugpj
76
+ Rugs
77
+ Spal
78
+ Lapkr
79
+ Gruod
80
+
81
+ # Business, governmental, geographical terms
82
+ a
83
+ # aikštė
84
+ adv
85
+ # advokatas
86
+ akad
87
+ # akademikas
88
+ aklg
89
+ # akligatvis
90
+ akt
91
+ # aktorius
92
+ al
93
+ # alėja
94
+ A.V
95
+ # antspaudo vieta
96
+ aps
97
+ apskr
98
+ # apskritis
99
+ apyg
100
+ # apygarda
101
+ aps
102
+ apskr
103
+ # apskritis
104
+ asist
105
+ # asistentas
106
+ asmv
107
+ avd
108
+ # asmenvardis
109
+ a.k
110
+ asm
111
+ asm.k
112
+ # asmens kodas
113
+ atsak
114
+ # atsakingasis
115
+ atsisk
116
+ sąsk
117
+ # atsiskaitomoji sąskaita
118
+ aut
119
+ # autorius
120
+ b
121
+ k
122
+ b.k
123
+ # banko kodas
124
+ bkl
125
+ # bakalauras
126
+ bt
127
+ # butas
128
+ buv
129
+ # buvęs, -usi
130
+ dail
131
+ # dailininkas
132
+ dek
133
+ # dekanas
134
+ dėst
135
+ # dėstytojas
136
+ dir
137
+ # direktorius
138
+ dirig
139
+ # dirigentas
140
+ doc
141
+ # docentas
142
+ drp
143
+ # durpynas
144
+
145
+ # dešinysis
146
+ egz
147
+ # egzempliorius
148
+ eil
149
+ # eilutė
150
+ ekon
151
+ # ekonomika
152
+ el
153
+ # elektroninis
154
+ etc
155
+
156
+ # ežeras
157
+ faks
158
+ # faksas
159
+ fak
160
+ # fakultetas
161
+ gen
162
+ # generolas
163
+ gyd
164
+ # gydytojas
165
+ gv
166
+ # gyvenvietė
167
+ įl
168
+ # įlanka
169
+ Įn
170
+ # įnagininkas
171
+ insp
172
+ # inspektorius
173
+ pan
174
+ # ir panašiai
175
+ t.t
176
+ # ir taip toliau
177
+ k.a
178
+ # kaip antai
179
+ kand
180
+ # kandidatas
181
+ kat
182
+ # katedra
183
+ kyš
184
+ # kyšulys
185
+ kl
186
+ # klasė
187
+ kln
188
+ # kalnas
189
+ kn
190
+ # knyga
191
+ koresp
192
+ # korespondentas
193
+ kpt
194
+ # kapitonas
195
+ kr
196
+ # kairysis
197
+ kt
198
+ # kitas
199
+ kun
200
+ # kunigas
201
+ l
202
+ e
203
+ p
204
+ l.e.p
205
+ # laikinai einantis pareigas
206
+ ltn
207
+ # leitenantas
208
+ m
209
+ mst
210
+ # miestas
211
+ m.e
212
+ # mūsų eros
213
+ m.m
214
+ # mokslo metai
215
+ mot
216
+ # moteris
217
+ mstl
218
+ # miestelis
219
+ mgr
220
+ # magistras
221
+ mgnt
222
+ # magistrantas
223
+ mjr
224
+ # majoras
225
+ mln
226
+ # milijonas
227
+ mlrd
228
+ # milijardas
229
+ mok
230
+ # mokinys
231
+ mokyt
232
+ # mokytojas
233
+ moksl
234
+ # mokslinis
235
+ nkt
236
+ # nekaitomas
237
+ ntk
238
+ # neteiktinas
239
+ Nr
240
+ nr
241
+ # numeris
242
+ p
243
+ # ponas
244
+ p.d
245
+ a.d
246
+ # pašto dėžutė, abonentinė dėžutė
247
+ p.m.e
248
+ # prieš mūsų erą
249
+ pan
250
+ # ir panašiai
251
+ pav
252
+ # paveikslas
253
+ pavad
254
+ # pavaduotojas
255
+ pirm
256
+ # pirmininkas
257
+ pl
258
+ # plentas
259
+ plg
260
+ # palygink
261
+ plk
262
+ # pulkininkas; pelkė
263
+ pr
264
+ # prospektas
265
+ Kr
266
+ pr.Kr
267
+ # prieš Kristų
268
+ prok
269
+ # prokuroras
270
+ prot
271
+ # protokolas
272
+ pss
273
+ # pusiasalis
274
+ pšt
275
+ # paštas
276
+ pvz
277
+ # pavyzdžiui
278
+ r
279
+ # rajonas
280
+ red
281
+ # redaktorius
282
+
283
+ # raštų kalbos
284
+ sąs
285
+ # sąsiuvinis
286
+ saviv
287
+ sav
288
+ # savivaldybė
289
+ sekr
290
+ # sekretorius
291
+ sen
292
+ # seniūnija, seniūnas
293
+ sk
294
+ # skaityk; skyrius
295
+ skg
296
+ # skersgatvis
297
+ skyr
298
+ sk
299
+ # skyrius
300
+ skv
301
+ # skveras
302
+ sp
303
+ # spauda; spaustuvė
304
+ spec
305
+ # specialistas
306
+ sr
307
+ # sritis
308
+ st
309
+ # stotis
310
+ str
311
+ # straipsnis
312
+ stud
313
+ # studentas
314
+ š
315
+ š.m
316
+ # šių metų
317
+ šnek
318
+ # šnekamosios
319
+ tir
320
+ # tiražas
321
+ tūkst
322
+ # tūkstantis
323
+ up
324
+ # upė
325
+ upl
326
+ # upelis
327
+ vad
328
+ # vadinamasis, -oji
329
+ vlsč
330
+ # valsčius
331
+ ved
332
+ # vedėjas
333
+ vet
334
+ # veterinarija
335
+ virš
336
+ # viršininkas, viršaitis
337
+ vyr
338
+ # vyriausiasis, -ioji; vyras
339
+ vyresn
340
+ # vyresnysis
341
+ vlsč
342
+ # valsčius
343
+ vs
344
+ # viensėdis
345
+ Vt
346
+ vt
347
+ # vietininkas
348
+ vtv
349
+ vv
350
+ # vietovardis
351
+ žml
352
+ # žemėlapis
353
+
354
+ # Technical terms, abbreviations used in guidebooks, advertisments, etc.
355
+ # Generally lower-case.
356
+ air
357
+ # airiškai
358
+ amer
359
+ # amerikanizmas
360
+ anat
361
+ # anatomija
362
+ angl
363
+ # angl. angliskai
364
+ arab
365
+ # arabų
366
+ archeol
367
+ archit
368
+ asm
369
+ # asmuo
370
+ astr
371
+ # astronomija
372
+ austral
373
+ # australiškai
374
+ aut
375
+ # automobilis
376
+ av
377
+ # aviacija
378
+ bažn
379
+ bdv
380
+ # būdvardis
381
+ bibl
382
+ # Biblija
383
+ biol
384
+ # biologija
385
+ bot
386
+ # botanika
387
+ brt
388
+ # burtai, burtažodis.
389
+ brus
390
+ # baltarusių
391
+ buh
392
+ # buhalterija
393
+ chem
394
+ # chemija
395
+ col
396
+ # collectivum
397
+ con
398
+ conj
399
+ # conjunctivus, jungtukas
400
+ dab
401
+ # dab. dabartine
402
+ dgs
403
+ # daugiskaita
404
+ dial
405
+ # dialektizmas
406
+ dipl
407
+ dktv
408
+ # daiktavardis
409
+ džn
410
+ # dažnai
411
+ ekon
412
+ el
413
+ # elektra
414
+ esam
415
+ # esamasis laikas
416
+ euf
417
+ # eufemizmas
418
+ fam
419
+ # familiariai
420
+ farm
421
+ # farmacija
422
+ filol
423
+ # filologija
424
+ filos
425
+ # filosofija
426
+ fin
427
+ # finansai
428
+ fiz
429
+ # fizika
430
+ fiziol
431
+ # fiziologija
432
+ flk
433
+ # folkloras
434
+ fon
435
+ # fonetika
436
+ fot
437
+ # fotografija
438
+ geod
439
+ # geodezija
440
+ geogr
441
+ geol
442
+ # geologija
443
+ geom
444
+ # geometrija
445
+ glžk
446
+ gr
447
+ # graikų
448
+ gram
449
+ her
450
+ # heraldika
451
+ hidr
452
+ # hidrotechnika
453
+ ind
454
+ # Indų
455
+ iron
456
+ # ironiškai
457
+ isp
458
+ # ispanų
459
+ ist
460
+ istor
461
+ # istorija
462
+ it
463
+ # italų
464
+ įv
465
+ reikšm
466
+ įv.reikšm
467
+ # įvairiomis reikšmėmis
468
+ jap
469
+ # japonų
470
+ juok
471
+ # juokaujamai
472
+ jūr
473
+ # jūrininkystė
474
+ kalb
475
+ # kalbotyra
476
+ kar
477
+ # karyba
478
+ kas
479
+ # kasyba
480
+ kin
481
+ # kinematografija
482
+ klaus
483
+ # klausiamasis
484
+ knyg
485
+ # knyginis
486
+ kom
487
+ # komercija
488
+ komp
489
+ # kompiuteris
490
+ kosm
491
+ # kosmonautika
492
+ kt
493
+ # kitas
494
+ kul
495
+ # kulinarija
496
+ kuop
497
+ # kuopine
498
+ l
499
+ # laikas
500
+ lit
501
+ # literatūrinis
502
+ lingv
503
+ # lingvistika
504
+ log
505
+ # logika
506
+ lot
507
+ # lotynų
508
+ mat
509
+ # matematika
510
+ maž
511
+ # mažybinis
512
+ med
513
+ # medicina
514
+ medž
515
+ # medžioklė
516
+ men
517
+ # menas
518
+ menk
519
+ # menkinamai
520
+ metal
521
+ # metalurgija
522
+ meteor
523
+ min
524
+ # mineralogija
525
+ mit
526
+ # mitologija
527
+ mok
528
+ # mokyklinis
529
+ ms
530
+ # mįslė
531
+ muz
532
+ # muzikinis
533
+ n
534
+ # naujasis
535
+ neig
536
+ # neigiamasis
537
+ neol
538
+ # neologizmas
539
+ niek
540
+ # niekinamai
541
+ ofic
542
+ # oficialus
543
+ opt
544
+ # optika
545
+ orig
546
+ # original
547
+ p
548
+ # pietūs
549
+ pan
550
+ # panašiai
551
+ parl
552
+ # parlamentas
553
+ pat
554
+ # patarlė
555
+ paž
556
+ # pažodžiui
557
+ plg
558
+ # palygink
559
+ poet
560
+ # poetizmas
561
+ poez
562
+ # poezija
563
+ poligr
564
+ # poligrafija
565
+ polit
566
+ # politika
567
+ ppr
568
+ # paprastai
569
+ pranc
570
+ pr
571
+ # prancūzų, prūsų
572
+ priet
573
+ # prietaras
574
+ prek
575
+ # prekyba
576
+ prk
577
+ # perkeltine
578
+ prs
579
+ # persona, asmuo
580
+ psn
581
+ # pasenęs žodis
582
+ psich
583
+ # psichologija
584
+ pvz
585
+ # pavyzdžiui
586
+ r
587
+ # rytai
588
+ rad
589
+ # radiotechnika
590
+ rel
591
+ # religija
592
+ ret
593
+ # retai
594
+ rus
595
+ # rusų
596
+ sen
597
+ # senasis
598
+ sl
599
+ # slengas, slavų
600
+ sov
601
+ # sovietinis
602
+ spec
603
+ # specialus
604
+ sport
605
+ stat
606
+ # statyba
607
+ sudurt
608
+ # sudurtinis
609
+ sutr
610
+ # sutrumpintas
611
+ suv
612
+ # suvalkiečių
613
+ š
614
+ # šiaurė
615
+ šach
616
+ # šachmatai
617
+ šiaur
618
+ škot
619
+ # škotiškai
620
+ šnek
621
+ # šnekamoji
622
+ teatr
623
+ tech
624
+ techn
625
+ # technika
626
+ teig
627
+ # teigiamas
628
+ teis
629
+ # teisė
630
+ tekst
631
+ # tekstilė
632
+ tel
633
+ # telefonas
634
+ teol
635
+ # teologija
636
+ v
637
+ # tik vyriškosios, vakarai
638
+ t.p
639
+ t
640
+ p
641
+ # ir taip pat
642
+ t.t
643
+ # ir taip toliau
644
+ t.y
645
+ # tai yra
646
+ vaik
647
+ # vaikų
648
+ vart
649
+ # vartojama
650
+ vet
651
+ # veterinarija
652
+ vid
653
+ # vidurinis
654
+ vksm
655
+ # veiksmažodis
656
+ vns
657
+ # vienaskaita
658
+ vok
659
+ # vokiečių
660
+ vulg
661
+ # vulgariai
662
+ zool
663
+ # zoologija
664
+ žr
665
+ # žiūrėk
666
+ ž.ū
667
+ ž
668
+ ū
669
+ # žemės ūkis
670
+
671
+ # List of titles. These are often followed by upper-case names, but do
672
+ # not indicate sentence breaks
673
+ #
674
+ # Jo Eminencija
675
+ Em.
676
+ # Gerbiamasis
677
+ Gerb
678
+ gerb
679
+ # malonus
680
+ malon
681
+ # profesorius
682
+ Prof
683
+ prof
684
+ # daktaras (mokslų)
685
+ Dr
686
+ dr
687
+ habil
688
+ med
689
+ # inž inžinierius
690
+ inž
691
+ Inž
692
+
693
+
694
+ #Numbers only. These act as non-breaking prefixes only when followed by a numeric sequence
695
+ # add NUMERIC_ONLY after the word for this function
696
+ #This case is mostly for the English "No." which can either be a sentence of its own, or
697
+ #if followed by a number, a non-breaking prefix
698
+ No #NUMERIC_ONLY#