readsight 1.0.0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- readsight/__init__.py +35 -0
- readsight/config.py +22 -0
- readsight/data/languages/af.json +31 -0
- readsight/data/languages/ar.json +31 -0
- readsight/data/languages/as.json +31 -0
- readsight/data/languages/be.json +31 -0
- readsight/data/languages/bg.json +31 -0
- readsight/data/languages/bn.json +31 -0
- readsight/data/languages/ca.json +31 -0
- readsight/data/languages/cop.json +31 -0
- readsight/data/languages/cs.json +31 -0
- readsight/data/languages/cu.json +31 -0
- readsight/data/languages/cy.json +31 -0
- readsight/data/languages/da.json +31 -0
- readsight/data/languages/de-1901.json +43 -0
- readsight/data/languages/de-1996.json +43 -0
- readsight/data/languages/de-ch-1901.json +43 -0
- readsight/data/languages/el-monoton.json +31 -0
- readsight/data/languages/el-polyton.json +31 -0
- readsight/data/languages/en-gb.json +93 -0
- readsight/data/languages/en-us.json +117 -0
- readsight/data/languages/eo.json +31 -0
- readsight/data/languages/es.json +52 -0
- readsight/data/languages/et.json +31 -0
- readsight/data/languages/eu.json +31 -0
- readsight/data/languages/fa.json +31 -0
- readsight/data/languages/fi-x-school.json +31 -0
- readsight/data/languages/fi.json +31 -0
- readsight/data/languages/fr.json +40 -0
- readsight/data/languages/fur.json +31 -0
- readsight/data/languages/ga.json +31 -0
- readsight/data/languages/gl.json +31 -0
- readsight/data/languages/grc.json +31 -0
- readsight/data/languages/gu.json +31 -0
- readsight/data/languages/he.json +31 -0
- readsight/data/languages/hi.json +31 -0
- readsight/data/languages/hr.json +31 -0
- readsight/data/languages/hsb.json +31 -0
- readsight/data/languages/hu.json +31 -0
- readsight/data/languages/hy.json +31 -0
- readsight/data/languages/ia.json +31 -0
- readsight/data/languages/id.json +31 -0
- readsight/data/languages/is.json +31 -0
- readsight/data/languages/it.json +43 -0
- readsight/data/languages/ka.json +31 -0
- readsight/data/languages/kk.json +31 -0
- readsight/data/languages/kmr.json +31 -0
- readsight/data/languages/kn.json +31 -0
- readsight/data/languages/la-x-classic.json +31 -0
- readsight/data/languages/la-x-liturgic.json +31 -0
- readsight/data/languages/la.json +31 -0
- readsight/data/languages/lt.json +31 -0
- readsight/data/languages/lv.json +31 -0
- readsight/data/languages/mk.json +31 -0
- readsight/data/languages/ml.json +31 -0
- readsight/data/languages/mn-cyrl-x-lmc.json +31 -0
- readsight/data/languages/mn-cyrl.json +31 -0
- readsight/data/languages/mr.json +31 -0
- readsight/data/languages/mul-ethi.json +31 -0
- readsight/data/languages/nb.json +31 -0
- readsight/data/languages/nl.json +40 -0
- readsight/data/languages/nn.json +31 -0
- readsight/data/languages/oc.json +31 -0
- readsight/data/languages/or.json +31 -0
- readsight/data/languages/pa.json +31 -0
- readsight/data/languages/pi.json +31 -0
- readsight/data/languages/pl.json +34 -0
- readsight/data/languages/pms.json +31 -0
- readsight/data/languages/pt.json +40 -0
- readsight/data/languages/rm.json +31 -0
- readsight/data/languages/ro.json +31 -0
- readsight/data/languages/ru.json +40 -0
- readsight/data/languages/sa.json +31 -0
- readsight/data/languages/sh-cyrl.json +31 -0
- readsight/data/languages/sh-latn.json +31 -0
- readsight/data/languages/sk.json +31 -0
- readsight/data/languages/sl.json +31 -0
- readsight/data/languages/sq.json +31 -0
- readsight/data/languages/sr-cyrl.json +31 -0
- readsight/data/languages/sv.json +31 -0
- readsight/data/languages/ta.json +31 -0
- readsight/data/languages/te.json +31 -0
- readsight/data/languages/th.json +31 -0
- readsight/data/languages/tk.json +31 -0
- readsight/data/languages/tr.json +40 -0
- readsight/data/languages/uk.json +31 -0
- readsight/data/languages/vi.json +31 -0
- readsight/data/languages/zh-latn-pinyin.json +31 -0
- readsight/data/patterns/hyph-af.tex +10594 -0
- readsight/data/patterns/hyph-ar.tex +24 -0
- readsight/data/patterns/hyph-as.tex +142 -0
- readsight/data/patterns/hyph-be.tex +1630 -0
- readsight/data/patterns/hyph-bg.tex +7785 -0
- readsight/data/patterns/hyph-bn.tex +142 -0
- readsight/data/patterns/hyph-ca.tex +296 -0
- readsight/data/patterns/hyph-cop.tex +267 -0
- readsight/data/patterns/hyph-cs.tex +3684 -0
- readsight/data/patterns/hyph-cu.tex +14727 -0
- readsight/data/patterns/hyph-cy.tex +6791 -0
- readsight/data/patterns/hyph-da.tex +1202 -0
- readsight/data/patterns/hyph-de-1901.tex +36485 -0
- readsight/data/patterns/hyph-de-1996.tex +36797 -0
- readsight/data/patterns/hyph-de-ch-1901.tex +35926 -0
- readsight/data/patterns/hyph-el-monoton.tex +505 -0
- readsight/data/patterns/hyph-el-polyton.tex +881 -0
- readsight/data/patterns/hyph-en-gb.tex +8615 -0
- readsight/data/patterns/hyph-en-us.tex +5018 -0
- readsight/data/patterns/hyph-eo.tex +528 -0
- readsight/data/patterns/hyph-es.tex +2175 -0
- readsight/data/patterns/hyph-et.tex +3754 -0
- readsight/data/patterns/hyph-eu.tex +123 -0
- readsight/data/patterns/hyph-fa.tex +26 -0
- readsight/data/patterns/hyph-fi-x-school.tex +349 -0
- readsight/data/patterns/hyph-fi.tex +330 -0
- readsight/data/patterns/hyph-fr.tex +1372 -0
- readsight/data/patterns/hyph-fur.tex +488 -0
- readsight/data/patterns/hyph-ga.tex +6152 -0
- readsight/data/patterns/hyph-gl.tex +749 -0
- readsight/data/patterns/hyph-grc.tex +2149 -0
- readsight/data/patterns/hyph-gu.tex +135 -0
- readsight/data/patterns/hyph-he.tex +25 -0
- readsight/data/patterns/hyph-hi.tex +139 -0
- readsight/data/patterns/hyph-hr.tex +1543 -0
- readsight/data/patterns/hyph-hsb.tex +1591 -0
- readsight/data/patterns/hyph-hu.tex +62894 -0
- readsight/data/patterns/hyph-hy.tex +260 -0
- readsight/data/patterns/hyph-ia.tex +686 -0
- readsight/data/patterns/hyph-id.tex +101 -0
- readsight/data/patterns/hyph-is.tex +4223 -0
- readsight/data/patterns/hyph-it.tex +431 -0
- readsight/data/patterns/hyph-ka.tex +2145 -0
- readsight/data/patterns/hyph-kk.tex +5806 -0
- readsight/data/patterns/hyph-kmr.tex +349 -0
- readsight/data/patterns/hyph-kn.tex +142 -0
- readsight/data/patterns/hyph-la-x-classic.tex +26160 -0
- readsight/data/patterns/hyph-la-x-liturgic.tex +2008 -0
- readsight/data/patterns/hyph-la.tex +237 -0
- readsight/data/patterns/hyph-lt.tex +1618 -0
- readsight/data/patterns/hyph-lv.tex +11621 -0
- readsight/data/patterns/hyph-mk.tex +759 -0
- readsight/data/patterns/hyph-ml.tex +157 -0
- readsight/data/patterns/hyph-mn-cyrl-x-lmc.tex +578 -0
- readsight/data/patterns/hyph-mn-cyrl.tex +1060 -0
- readsight/data/patterns/hyph-mr.tex +139 -0
- readsight/data/patterns/hyph-mul-ethi.tex +518 -0
- readsight/data/patterns/hyph-nb.tex +50 -0
- readsight/data/patterns/hyph-nl.tex +12892 -0
- readsight/data/patterns/hyph-nn.tex +48 -0
- readsight/data/patterns/hyph-oc.tex +345 -0
- readsight/data/patterns/hyph-or.tex +133 -0
- readsight/data/patterns/hyph-pa.tex +129 -0
- readsight/data/patterns/hyph-pi.tex +140 -0
- readsight/data/patterns/hyph-pl.tex +4154 -0
- readsight/data/patterns/hyph-pms.tex +434 -0
- readsight/data/patterns/hyph-pt.tex +503 -0
- readsight/data/patterns/hyph-rm.tex +452 -0
- readsight/data/patterns/hyph-ro.tex +688 -0
- readsight/data/patterns/hyph-ru.tex +7255 -0
- readsight/data/patterns/hyph-sa.tex +899 -0
- readsight/data/patterns/hyph-sh-cyrl.tex +2822 -0
- readsight/data/patterns/hyph-sh-latn.tex +2839 -0
- readsight/data/patterns/hyph-sk.tex +2529 -0
- readsight/data/patterns/hyph-sl.tex +1144 -0
- readsight/data/patterns/hyph-sq.tex +108 -0
- readsight/data/patterns/hyph-sr-cyrl.tex +2724 -0
- readsight/data/patterns/hyph-sv.tex +4750 -0
- readsight/data/patterns/hyph-ta.tex +140 -0
- readsight/data/patterns/hyph-te.tex +141 -0
- readsight/data/patterns/hyph-th.tex +4888 -0
- readsight/data/patterns/hyph-tk.tex +2423 -0
- readsight/data/patterns/hyph-tr.tex +671 -0
- readsight/data/patterns/hyph-uk.tex +3661 -0
- readsight/data/patterns/hyph-vi.tex +25 -0
- readsight/data/patterns/hyph-zh-latn-pinyin.tex +262 -0
- readsight/engine.py +260 -0
- readsight/exceptions.py +35 -0
- readsight/formula/__init__.py +0 -0
- readsight/formula/automated_readability_index.py +36 -0
- readsight/formula/coleman_liau.py +41 -0
- readsight/formula/crawford.py +50 -0
- readsight/formula/dale_chall.py +53 -0
- readsight/formula/fernandez_huerta.py +49 -0
- readsight/formula/flesch_kincaid_grade_level.py +67 -0
- readsight/formula/flesch_reading_ease.py +69 -0
- readsight/formula/fog_pl.py +51 -0
- readsight/formula/formula.py +21 -0
- readsight/formula/formula_registry.py +45 -0
- readsight/formula/formula_registry_factory.py +44 -0
- readsight/formula/formula_result.py +13 -0
- readsight/formula/grade_level_interpretation.py +36 -0
- readsight/formula/gulpease.py +45 -0
- readsight/formula/gunning_fog.py +54 -0
- readsight/formula/gutierrez_polini.py +46 -0
- readsight/formula/lix.py +62 -0
- readsight/formula/osman.py +52 -0
- readsight/formula/smog_index.py +36 -0
- readsight/formula/spache.py +47 -0
- readsight/formula/szigriszt_pazos.py +54 -0
- readsight/formula/text_statistics_helper.py +18 -0
- readsight/formula/wiener_sachtextformel.py +93 -0
- readsight/hyphenation/__init__.py +0 -0
- readsight/hyphenation/cache/__init__.py +0 -0
- readsight/hyphenation/cache/json_pattern_cache.py +87 -0
- readsight/hyphenation/cache/pattern_cache.py +25 -0
- readsight/hyphenation/hyphenation_exceptions_collection.py +26 -0
- readsight/hyphenation/hyphenation_override.py +9 -0
- readsight/hyphenation/hyphenator.py +13 -0
- readsight/hyphenation/liang_hyphenator.py +124 -0
- readsight/hyphenation/pattern.py +15 -0
- readsight/hyphenation/patterns_collection.py +31 -0
- readsight/hyphenation/source/__init__.py +0 -0
- readsight/hyphenation/source/pattern_source.py +9 -0
- readsight/hyphenation/source/tex_source.py +123 -0
- readsight/language/__init__.py +0 -0
- readsight/language/json_language_repository.py +44 -0
- readsight/language/language.py +48 -0
- readsight/language/language_code.py +30 -0
- readsight/language/language_repository.py +19 -0
- readsight/language/script.py +27 -0
- readsight/syllable/__init__.py +0 -0
- readsight/syllable/composite_syllable_counter.py +31 -0
- readsight/syllable/heuristic_syllable_counter.py +110 -0
- readsight/syllable/syllable_counter.py +13 -0
- readsight/syllable/tex_syllable_counter.py +15 -0
- readsight/text/__init__.py +0 -0
- readsight/text/text_analyzer.py +142 -0
- readsight/text/text_splitter.py +59 -0
- readsight/text/text_statistics.py +16 -0
- readsight-1.0.0.dist-info/METADATA +339 -0
- readsight-1.0.0.dist-info/RECORD +233 -0
- readsight-1.0.0.dist-info/WHEEL +5 -0
- readsight-1.0.0.dist-info/licenses/LICENSE +21 -0
- readsight-1.0.0.dist-info/top_level.txt +1 -0
readsight/__init__.py
ADDED
|
@@ -0,0 +1,35 @@
|
|
|
1
|
+
"""
|
|
2
|
+
ReadSight - Multilingual Readability Library for Python.
|
|
3
|
+
|
|
4
|
+
86 languages, 17 readability formulas, TeX-based syllable counting
|
|
5
|
+
via the Frank M. Liang hyphenation algorithm.
|
|
6
|
+
"""
|
|
7
|
+
|
|
8
|
+
from __future__ import annotations
|
|
9
|
+
|
|
10
|
+
from .config import Config
|
|
11
|
+
from .engine import ReadSight
|
|
12
|
+
from .exceptions import (
|
|
13
|
+
EmptyTextException,
|
|
14
|
+
ReadabilityEngineException,
|
|
15
|
+
UnsupportedFormulaException,
|
|
16
|
+
UnsupportedLanguageException,
|
|
17
|
+
)
|
|
18
|
+
from .formula.formula_result import FormulaResult
|
|
19
|
+
from .language.language import Language
|
|
20
|
+
from .language.script import Script
|
|
21
|
+
from .text.text_statistics import TextStatistics
|
|
22
|
+
|
|
23
|
+
__version__ = "1.0.0"
|
|
24
|
+
__all__ = [
|
|
25
|
+
"Config",
|
|
26
|
+
"EmptyTextException",
|
|
27
|
+
"FormulaResult",
|
|
28
|
+
"Language",
|
|
29
|
+
"ReadSight",
|
|
30
|
+
"ReadabilityEngineException",
|
|
31
|
+
"Script",
|
|
32
|
+
"TextStatistics",
|
|
33
|
+
"UnsupportedFormulaException",
|
|
34
|
+
"UnsupportedLanguageException",
|
|
35
|
+
]
|
readsight/config.py
ADDED
|
@@ -0,0 +1,22 @@
|
|
|
1
|
+
from __future__ import annotations
|
|
2
|
+
|
|
3
|
+
from dataclasses import dataclass
|
|
4
|
+
from pathlib import Path
|
|
5
|
+
|
|
6
|
+
|
|
7
|
+
@dataclass(frozen=True, slots=True)
|
|
8
|
+
class Config:
|
|
9
|
+
patterns_dir: str
|
|
10
|
+
languages_dir: str
|
|
11
|
+
cache_dir: str
|
|
12
|
+
|
|
13
|
+
@classmethod
|
|
14
|
+
def default(cls) -> Config:
|
|
15
|
+
import platformdirs
|
|
16
|
+
|
|
17
|
+
pkg_dir = Path(__file__).resolve().parent
|
|
18
|
+
return cls(
|
|
19
|
+
patterns_dir=str(pkg_dir / "data" / "patterns"),
|
|
20
|
+
languages_dir=str(pkg_dir / "data" / "languages"),
|
|
21
|
+
cache_dir=str(Path(platformdirs.user_cache_dir("readsight", ensure_exists=True))),
|
|
22
|
+
)
|
|
@@ -0,0 +1,31 @@
|
|
|
1
|
+
{
|
|
2
|
+
"code": "af",
|
|
3
|
+
"name": "Afrikaans",
|
|
4
|
+
"nativeName": "Afrikaans",
|
|
5
|
+
"script": "Latin",
|
|
6
|
+
"hyphenMins": {
|
|
7
|
+
"left": 1,
|
|
8
|
+
"right": 2
|
|
9
|
+
},
|
|
10
|
+
"letterPattern": "[A-Za-zÀ-ÖØ-öø-ÿĀ-žƀ-ɏḀ-ỿ]",
|
|
11
|
+
"wordSplitPattern": "[^\\p{L}'’-]+",
|
|
12
|
+
"sentenceBoundaryPattern": "[.!?]+",
|
|
13
|
+
"formulas": {
|
|
14
|
+
"gunning_fog": {
|
|
15
|
+
"enabled": true
|
|
16
|
+
},
|
|
17
|
+
"smog": {
|
|
18
|
+
"enabled": true
|
|
19
|
+
},
|
|
20
|
+
"coleman_liau": {
|
|
21
|
+
"enabled": true
|
|
22
|
+
},
|
|
23
|
+
"ari": {
|
|
24
|
+
"enabled": true
|
|
25
|
+
},
|
|
26
|
+
"lix": {
|
|
27
|
+
"enabled": true,
|
|
28
|
+
"longWordThreshold": 6
|
|
29
|
+
}
|
|
30
|
+
}
|
|
31
|
+
}
|
|
@@ -0,0 +1,31 @@
|
|
|
1
|
+
{
|
|
2
|
+
"code": "ar",
|
|
3
|
+
"name": "Arabic",
|
|
4
|
+
"nativeName": "العربية",
|
|
5
|
+
"script": "Arabic",
|
|
6
|
+
"hyphenMins": {
|
|
7
|
+
"left": 0,
|
|
8
|
+
"right": 0
|
|
9
|
+
},
|
|
10
|
+
"letterPattern": "[\u0600-\u06FF]",
|
|
11
|
+
"wordSplitPattern": "[^\\p{L}]+",
|
|
12
|
+
"sentenceBoundaryPattern": "[.!?۔]+",
|
|
13
|
+
"formulas": {
|
|
14
|
+
"gunning_fog": {
|
|
15
|
+
"enabled": true
|
|
16
|
+
},
|
|
17
|
+
"smog": {
|
|
18
|
+
"enabled": true
|
|
19
|
+
},
|
|
20
|
+
"coleman_liau": {
|
|
21
|
+
"enabled": true
|
|
22
|
+
},
|
|
23
|
+
"ari": {
|
|
24
|
+
"enabled": true
|
|
25
|
+
},
|
|
26
|
+
"lix": {
|
|
27
|
+
"enabled": true,
|
|
28
|
+
"longWordThreshold": 5
|
|
29
|
+
}
|
|
30
|
+
}
|
|
31
|
+
}
|
|
@@ -0,0 +1,31 @@
|
|
|
1
|
+
{
|
|
2
|
+
"code": "as",
|
|
3
|
+
"name": "Assamese",
|
|
4
|
+
"nativeName": "অসমীয়া",
|
|
5
|
+
"script": "Other",
|
|
6
|
+
"hyphenMins": {
|
|
7
|
+
"left": 1,
|
|
8
|
+
"right": 1
|
|
9
|
+
},
|
|
10
|
+
"letterPattern": "\\p{L}",
|
|
11
|
+
"wordSplitPattern": "[^\\p{L}'’-]+",
|
|
12
|
+
"sentenceBoundaryPattern": "[.!?]+",
|
|
13
|
+
"formulas": {
|
|
14
|
+
"gunning_fog": {
|
|
15
|
+
"enabled": true
|
|
16
|
+
},
|
|
17
|
+
"smog": {
|
|
18
|
+
"enabled": true
|
|
19
|
+
},
|
|
20
|
+
"coleman_liau": {
|
|
21
|
+
"enabled": true
|
|
22
|
+
},
|
|
23
|
+
"ari": {
|
|
24
|
+
"enabled": true
|
|
25
|
+
},
|
|
26
|
+
"lix": {
|
|
27
|
+
"enabled": true,
|
|
28
|
+
"longWordThreshold": 6
|
|
29
|
+
}
|
|
30
|
+
}
|
|
31
|
+
}
|
|
@@ -0,0 +1,31 @@
|
|
|
1
|
+
{
|
|
2
|
+
"code": "be",
|
|
3
|
+
"name": "Belarusian",
|
|
4
|
+
"nativeName": "Беларуская",
|
|
5
|
+
"script": "Cyrillic",
|
|
6
|
+
"hyphenMins": {
|
|
7
|
+
"left": 2,
|
|
8
|
+
"right": 2
|
|
9
|
+
},
|
|
10
|
+
"letterPattern": "[А-Яа-яЁёҐ-ӿЀ-ӿ]",
|
|
11
|
+
"wordSplitPattern": "[^\\p{L}'’-]+",
|
|
12
|
+
"sentenceBoundaryPattern": "[.!?…]+",
|
|
13
|
+
"formulas": {
|
|
14
|
+
"gunning_fog": {
|
|
15
|
+
"enabled": true
|
|
16
|
+
},
|
|
17
|
+
"smog": {
|
|
18
|
+
"enabled": true
|
|
19
|
+
},
|
|
20
|
+
"coleman_liau": {
|
|
21
|
+
"enabled": true
|
|
22
|
+
},
|
|
23
|
+
"ari": {
|
|
24
|
+
"enabled": true
|
|
25
|
+
},
|
|
26
|
+
"lix": {
|
|
27
|
+
"enabled": true,
|
|
28
|
+
"longWordThreshold": 6
|
|
29
|
+
}
|
|
30
|
+
}
|
|
31
|
+
}
|
|
@@ -0,0 +1,31 @@
|
|
|
1
|
+
{
|
|
2
|
+
"code": "bg",
|
|
3
|
+
"name": "Bulgarian",
|
|
4
|
+
"nativeName": "Български",
|
|
5
|
+
"script": "Cyrillic",
|
|
6
|
+
"hyphenMins": {
|
|
7
|
+
"left": 2,
|
|
8
|
+
"right": 2
|
|
9
|
+
},
|
|
10
|
+
"letterPattern": "[А-Яа-яЁёҐ-ӿЀ-ӿ]",
|
|
11
|
+
"wordSplitPattern": "[^\\p{L}'’-]+",
|
|
12
|
+
"sentenceBoundaryPattern": "[.!?…]+",
|
|
13
|
+
"formulas": {
|
|
14
|
+
"gunning_fog": {
|
|
15
|
+
"enabled": true
|
|
16
|
+
},
|
|
17
|
+
"smog": {
|
|
18
|
+
"enabled": true
|
|
19
|
+
},
|
|
20
|
+
"coleman_liau": {
|
|
21
|
+
"enabled": true
|
|
22
|
+
},
|
|
23
|
+
"ari": {
|
|
24
|
+
"enabled": true
|
|
25
|
+
},
|
|
26
|
+
"lix": {
|
|
27
|
+
"enabled": true,
|
|
28
|
+
"longWordThreshold": 6
|
|
29
|
+
}
|
|
30
|
+
}
|
|
31
|
+
}
|
|
@@ -0,0 +1,31 @@
|
|
|
1
|
+
{
|
|
2
|
+
"code": "bn",
|
|
3
|
+
"name": "Bengali",
|
|
4
|
+
"nativeName": "বাংলা",
|
|
5
|
+
"script": "Bengali",
|
|
6
|
+
"hyphenMins": {
|
|
7
|
+
"left": 1,
|
|
8
|
+
"right": 1
|
|
9
|
+
},
|
|
10
|
+
"letterPattern": "[\u0980-\u09FF]",
|
|
11
|
+
"wordSplitPattern": "[^\\p{L}]+",
|
|
12
|
+
"sentenceBoundaryPattern": "[।.!?]+",
|
|
13
|
+
"formulas": {
|
|
14
|
+
"gunning_fog": {
|
|
15
|
+
"enabled": true
|
|
16
|
+
},
|
|
17
|
+
"smog": {
|
|
18
|
+
"enabled": true
|
|
19
|
+
},
|
|
20
|
+
"coleman_liau": {
|
|
21
|
+
"enabled": true
|
|
22
|
+
},
|
|
23
|
+
"ari": {
|
|
24
|
+
"enabled": true
|
|
25
|
+
},
|
|
26
|
+
"lix": {
|
|
27
|
+
"enabled": true,
|
|
28
|
+
"longWordThreshold": 6
|
|
29
|
+
}
|
|
30
|
+
}
|
|
31
|
+
}
|
|
@@ -0,0 +1,31 @@
|
|
|
1
|
+
{
|
|
2
|
+
"code": "ca",
|
|
3
|
+
"name": "Catalan",
|
|
4
|
+
"nativeName": "Català",
|
|
5
|
+
"script": "Latin",
|
|
6
|
+
"hyphenMins": {
|
|
7
|
+
"left": 2,
|
|
8
|
+
"right": 2
|
|
9
|
+
},
|
|
10
|
+
"letterPattern": "[A-Za-zÀ-ÖØ-öø-ÿĀ-žƀ-ɏḀ-ỿ]",
|
|
11
|
+
"wordSplitPattern": "[^\\p{L}'’-]+",
|
|
12
|
+
"sentenceBoundaryPattern": "[.!?]+",
|
|
13
|
+
"formulas": {
|
|
14
|
+
"gunning_fog": {
|
|
15
|
+
"enabled": true
|
|
16
|
+
},
|
|
17
|
+
"smog": {
|
|
18
|
+
"enabled": true
|
|
19
|
+
},
|
|
20
|
+
"coleman_liau": {
|
|
21
|
+
"enabled": true
|
|
22
|
+
},
|
|
23
|
+
"ari": {
|
|
24
|
+
"enabled": true
|
|
25
|
+
},
|
|
26
|
+
"lix": {
|
|
27
|
+
"enabled": true,
|
|
28
|
+
"longWordThreshold": 6
|
|
29
|
+
}
|
|
30
|
+
}
|
|
31
|
+
}
|
|
@@ -0,0 +1,31 @@
|
|
|
1
|
+
{
|
|
2
|
+
"code": "cop",
|
|
3
|
+
"name": "Coptic",
|
|
4
|
+
"nativeName": "ϯⲙⲉⲧⲣⲉⲙⲛⲭⲏⲙⲓ",
|
|
5
|
+
"script": "Coptic",
|
|
6
|
+
"hyphenMins": {
|
|
7
|
+
"left": 1,
|
|
8
|
+
"right": 1
|
|
9
|
+
},
|
|
10
|
+
"letterPattern": "[Ⲁ-⳿]",
|
|
11
|
+
"wordSplitPattern": "[^\\p{L}]+",
|
|
12
|
+
"sentenceBoundaryPattern": "[.!?]+",
|
|
13
|
+
"formulas": {
|
|
14
|
+
"gunning_fog": {
|
|
15
|
+
"enabled": true
|
|
16
|
+
},
|
|
17
|
+
"smog": {
|
|
18
|
+
"enabled": true
|
|
19
|
+
},
|
|
20
|
+
"coleman_liau": {
|
|
21
|
+
"enabled": true
|
|
22
|
+
},
|
|
23
|
+
"ari": {
|
|
24
|
+
"enabled": true
|
|
25
|
+
},
|
|
26
|
+
"lix": {
|
|
27
|
+
"enabled": true,
|
|
28
|
+
"longWordThreshold": 6
|
|
29
|
+
}
|
|
30
|
+
}
|
|
31
|
+
}
|
|
@@ -0,0 +1,31 @@
|
|
|
1
|
+
{
|
|
2
|
+
"code": "cs",
|
|
3
|
+
"name": "Czech",
|
|
4
|
+
"nativeName": "Čeština",
|
|
5
|
+
"script": "Latin",
|
|
6
|
+
"hyphenMins": {
|
|
7
|
+
"left": 2,
|
|
8
|
+
"right": 3
|
|
9
|
+
},
|
|
10
|
+
"letterPattern": "[A-Za-zÀ-ÖØ-öø-ÿĀ-žƀ-ɏḀ-ỿ]",
|
|
11
|
+
"wordSplitPattern": "[^\\p{L}'’-]+",
|
|
12
|
+
"sentenceBoundaryPattern": "[.!?]+",
|
|
13
|
+
"formulas": {
|
|
14
|
+
"gunning_fog": {
|
|
15
|
+
"enabled": true
|
|
16
|
+
},
|
|
17
|
+
"smog": {
|
|
18
|
+
"enabled": true
|
|
19
|
+
},
|
|
20
|
+
"coleman_liau": {
|
|
21
|
+
"enabled": true
|
|
22
|
+
},
|
|
23
|
+
"ari": {
|
|
24
|
+
"enabled": true
|
|
25
|
+
},
|
|
26
|
+
"lix": {
|
|
27
|
+
"enabled": true,
|
|
28
|
+
"longWordThreshold": 6
|
|
29
|
+
}
|
|
30
|
+
}
|
|
31
|
+
}
|
|
@@ -0,0 +1,31 @@
|
|
|
1
|
+
{
|
|
2
|
+
"code": "cu",
|
|
3
|
+
"name": "Church Slavonic",
|
|
4
|
+
"nativeName": "ⰔⰎⰑⰂⰡⰐⰠⰔⰍⰟ",
|
|
5
|
+
"script": "Cyrillic",
|
|
6
|
+
"hyphenMins": {
|
|
7
|
+
"left": 2,
|
|
8
|
+
"right": 2
|
|
9
|
+
},
|
|
10
|
+
"letterPattern": "[А-Яа-яЁёҐ-ӿЀ-ӿ]",
|
|
11
|
+
"wordSplitPattern": "[^\\p{L}'’-]+",
|
|
12
|
+
"sentenceBoundaryPattern": "[.!?…]+",
|
|
13
|
+
"formulas": {
|
|
14
|
+
"gunning_fog": {
|
|
15
|
+
"enabled": true
|
|
16
|
+
},
|
|
17
|
+
"smog": {
|
|
18
|
+
"enabled": true
|
|
19
|
+
},
|
|
20
|
+
"coleman_liau": {
|
|
21
|
+
"enabled": true
|
|
22
|
+
},
|
|
23
|
+
"ari": {
|
|
24
|
+
"enabled": true
|
|
25
|
+
},
|
|
26
|
+
"lix": {
|
|
27
|
+
"enabled": true,
|
|
28
|
+
"longWordThreshold": 6
|
|
29
|
+
}
|
|
30
|
+
}
|
|
31
|
+
}
|
|
@@ -0,0 +1,31 @@
|
|
|
1
|
+
{
|
|
2
|
+
"code": "cy",
|
|
3
|
+
"name": "Welsh",
|
|
4
|
+
"nativeName": "Cymraeg",
|
|
5
|
+
"script": "Latin",
|
|
6
|
+
"hyphenMins": {
|
|
7
|
+
"left": 2,
|
|
8
|
+
"right": 3
|
|
9
|
+
},
|
|
10
|
+
"letterPattern": "[A-Za-zÀ-ÖØ-öø-ÿĀ-žƀ-ɏḀ-ỿ]",
|
|
11
|
+
"wordSplitPattern": "[^\\p{L}'’-]+",
|
|
12
|
+
"sentenceBoundaryPattern": "[.!?]+",
|
|
13
|
+
"formulas": {
|
|
14
|
+
"gunning_fog": {
|
|
15
|
+
"enabled": true
|
|
16
|
+
},
|
|
17
|
+
"smog": {
|
|
18
|
+
"enabled": true
|
|
19
|
+
},
|
|
20
|
+
"coleman_liau": {
|
|
21
|
+
"enabled": true
|
|
22
|
+
},
|
|
23
|
+
"ari": {
|
|
24
|
+
"enabled": true
|
|
25
|
+
},
|
|
26
|
+
"lix": {
|
|
27
|
+
"enabled": true,
|
|
28
|
+
"longWordThreshold": 6
|
|
29
|
+
}
|
|
30
|
+
}
|
|
31
|
+
}
|
|
@@ -0,0 +1,31 @@
|
|
|
1
|
+
{
|
|
2
|
+
"code": "da",
|
|
3
|
+
"name": "Danish",
|
|
4
|
+
"nativeName": "Dansk",
|
|
5
|
+
"script": "Latin",
|
|
6
|
+
"hyphenMins": {
|
|
7
|
+
"left": 2,
|
|
8
|
+
"right": 2
|
|
9
|
+
},
|
|
10
|
+
"letterPattern": "[A-Za-zÀ-ÖØ-öø-ÿĀ-žƀ-ɏḀ-ỿ]",
|
|
11
|
+
"wordSplitPattern": "[^\\p{L}'’-]+",
|
|
12
|
+
"sentenceBoundaryPattern": "[.!?]+",
|
|
13
|
+
"formulas": {
|
|
14
|
+
"gunning_fog": {
|
|
15
|
+
"enabled": true
|
|
16
|
+
},
|
|
17
|
+
"smog": {
|
|
18
|
+
"enabled": true
|
|
19
|
+
},
|
|
20
|
+
"coleman_liau": {
|
|
21
|
+
"enabled": true
|
|
22
|
+
},
|
|
23
|
+
"ari": {
|
|
24
|
+
"enabled": true
|
|
25
|
+
},
|
|
26
|
+
"lix": {
|
|
27
|
+
"enabled": true,
|
|
28
|
+
"longWordThreshold": 6
|
|
29
|
+
}
|
|
30
|
+
}
|
|
31
|
+
}
|
|
@@ -0,0 +1,43 @@
|
|
|
1
|
+
{
|
|
2
|
+
"code": "de-1901",
|
|
3
|
+
"name": "German (traditional)",
|
|
4
|
+
"nativeName": "Deutsch (traditionell)",
|
|
5
|
+
"script": "Latin",
|
|
6
|
+
"hyphenMins": {
|
|
7
|
+
"left": 2,
|
|
8
|
+
"right": 2
|
|
9
|
+
},
|
|
10
|
+
"letterPattern": "[A-Za-zÀ-ÖØ-öø-ÿĀ-žƀ-ɏḀ-ỿ]",
|
|
11
|
+
"wordSplitPattern": "[^\\p{L}'’-]+",
|
|
12
|
+
"sentenceBoundaryPattern": "[.!?]+",
|
|
13
|
+
"formulas": {
|
|
14
|
+
"gunning_fog": {
|
|
15
|
+
"enabled": true
|
|
16
|
+
},
|
|
17
|
+
"smog": {
|
|
18
|
+
"enabled": true
|
|
19
|
+
},
|
|
20
|
+
"coleman_liau": {
|
|
21
|
+
"enabled": true
|
|
22
|
+
},
|
|
23
|
+
"ari": {
|
|
24
|
+
"enabled": true
|
|
25
|
+
},
|
|
26
|
+
"lix": {
|
|
27
|
+
"enabled": true,
|
|
28
|
+
"longWordThreshold": 6
|
|
29
|
+
},
|
|
30
|
+
"flesch_reading_ease": {
|
|
31
|
+
"enabled": true,
|
|
32
|
+
"base": 180,
|
|
33
|
+
"aslMult": 1,
|
|
34
|
+
"aswMult": 58.5
|
|
35
|
+
},
|
|
36
|
+
"flesch_kincaid_grade_level": {
|
|
37
|
+
"enabled": true
|
|
38
|
+
},
|
|
39
|
+
"wiener_sachtextformel": {
|
|
40
|
+
"enabled": true
|
|
41
|
+
}
|
|
42
|
+
}
|
|
43
|
+
}
|
|
@@ -0,0 +1,43 @@
|
|
|
1
|
+
{
|
|
2
|
+
"code": "de-1996",
|
|
3
|
+
"name": "German (reformed)",
|
|
4
|
+
"nativeName": "Deutsch (reformiert)",
|
|
5
|
+
"script": "Latin",
|
|
6
|
+
"hyphenMins": {
|
|
7
|
+
"left": 2,
|
|
8
|
+
"right": 2
|
|
9
|
+
},
|
|
10
|
+
"letterPattern": "[A-Za-zÀ-ÖØ-öø-ÿĀ-žƀ-ɏḀ-ỿ]",
|
|
11
|
+
"wordSplitPattern": "[^\\p{L}'’-]+",
|
|
12
|
+
"sentenceBoundaryPattern": "[.!?]+",
|
|
13
|
+
"formulas": {
|
|
14
|
+
"gunning_fog": {
|
|
15
|
+
"enabled": true
|
|
16
|
+
},
|
|
17
|
+
"smog": {
|
|
18
|
+
"enabled": true
|
|
19
|
+
},
|
|
20
|
+
"coleman_liau": {
|
|
21
|
+
"enabled": true
|
|
22
|
+
},
|
|
23
|
+
"ari": {
|
|
24
|
+
"enabled": true
|
|
25
|
+
},
|
|
26
|
+
"lix": {
|
|
27
|
+
"enabled": true,
|
|
28
|
+
"longWordThreshold": 6
|
|
29
|
+
},
|
|
30
|
+
"flesch_reading_ease": {
|
|
31
|
+
"enabled": true,
|
|
32
|
+
"base": 180,
|
|
33
|
+
"aslMult": 1,
|
|
34
|
+
"aswMult": 58.5
|
|
35
|
+
},
|
|
36
|
+
"flesch_kincaid_grade_level": {
|
|
37
|
+
"enabled": true
|
|
38
|
+
},
|
|
39
|
+
"wiener_sachtextformel": {
|
|
40
|
+
"enabled": true
|
|
41
|
+
}
|
|
42
|
+
}
|
|
43
|
+
}
|
|
@@ -0,0 +1,43 @@
|
|
|
1
|
+
{
|
|
2
|
+
"code": "de-ch-1901",
|
|
3
|
+
"name": "German (Swiss traditional)",
|
|
4
|
+
"nativeName": "Deutsch (Schweiz, traditionell)",
|
|
5
|
+
"script": "Latin",
|
|
6
|
+
"hyphenMins": {
|
|
7
|
+
"left": 2,
|
|
8
|
+
"right": 2
|
|
9
|
+
},
|
|
10
|
+
"letterPattern": "[A-Za-zÀ-ÖØ-öø-ÿĀ-žƀ-ɏḀ-ỿ]",
|
|
11
|
+
"wordSplitPattern": "[^\\p{L}'’-]+",
|
|
12
|
+
"sentenceBoundaryPattern": "[.!?]+",
|
|
13
|
+
"formulas": {
|
|
14
|
+
"gunning_fog": {
|
|
15
|
+
"enabled": true
|
|
16
|
+
},
|
|
17
|
+
"smog": {
|
|
18
|
+
"enabled": true
|
|
19
|
+
},
|
|
20
|
+
"coleman_liau": {
|
|
21
|
+
"enabled": true
|
|
22
|
+
},
|
|
23
|
+
"ari": {
|
|
24
|
+
"enabled": true
|
|
25
|
+
},
|
|
26
|
+
"lix": {
|
|
27
|
+
"enabled": true,
|
|
28
|
+
"longWordThreshold": 6
|
|
29
|
+
},
|
|
30
|
+
"flesch_reading_ease": {
|
|
31
|
+
"enabled": true,
|
|
32
|
+
"base": 180,
|
|
33
|
+
"aslMult": 1,
|
|
34
|
+
"aswMult": 58.5
|
|
35
|
+
},
|
|
36
|
+
"flesch_kincaid_grade_level": {
|
|
37
|
+
"enabled": true
|
|
38
|
+
},
|
|
39
|
+
"wiener_sachtextformel": {
|
|
40
|
+
"enabled": true
|
|
41
|
+
}
|
|
42
|
+
}
|
|
43
|
+
}
|
|
@@ -0,0 +1,31 @@
|
|
|
1
|
+
{
|
|
2
|
+
"code": "el-monoton",
|
|
3
|
+
"name": "Modern Greek (monotonic)",
|
|
4
|
+
"nativeName": "Νέα Ελληνικά (μονοτονικό)",
|
|
5
|
+
"script": "Greek",
|
|
6
|
+
"hyphenMins": {
|
|
7
|
+
"left": 1,
|
|
8
|
+
"right": 1
|
|
9
|
+
},
|
|
10
|
+
"letterPattern": "[Α-Ωα-ωἀ-῾]",
|
|
11
|
+
"wordSplitPattern": "[^\\p{L}'’-]+",
|
|
12
|
+
"sentenceBoundaryPattern": "[.!?;]+",
|
|
13
|
+
"formulas": {
|
|
14
|
+
"gunning_fog": {
|
|
15
|
+
"enabled": true
|
|
16
|
+
},
|
|
17
|
+
"smog": {
|
|
18
|
+
"enabled": true
|
|
19
|
+
},
|
|
20
|
+
"coleman_liau": {
|
|
21
|
+
"enabled": true
|
|
22
|
+
},
|
|
23
|
+
"ari": {
|
|
24
|
+
"enabled": true
|
|
25
|
+
},
|
|
26
|
+
"lix": {
|
|
27
|
+
"enabled": true,
|
|
28
|
+
"longWordThreshold": 6
|
|
29
|
+
}
|
|
30
|
+
}
|
|
31
|
+
}
|
|
@@ -0,0 +1,31 @@
|
|
|
1
|
+
{
|
|
2
|
+
"code": "el-polyton",
|
|
3
|
+
"name": "Modern Greek (polytonic)",
|
|
4
|
+
"nativeName": "Νέα Ελληνικά (πολυτονικό)",
|
|
5
|
+
"script": "Greek",
|
|
6
|
+
"hyphenMins": {
|
|
7
|
+
"left": 1,
|
|
8
|
+
"right": 1
|
|
9
|
+
},
|
|
10
|
+
"letterPattern": "[Α-Ωα-ωἀ-῾]",
|
|
11
|
+
"wordSplitPattern": "[^\\p{L}'’-]+",
|
|
12
|
+
"sentenceBoundaryPattern": "[.!?;]+",
|
|
13
|
+
"formulas": {
|
|
14
|
+
"gunning_fog": {
|
|
15
|
+
"enabled": true
|
|
16
|
+
},
|
|
17
|
+
"smog": {
|
|
18
|
+
"enabled": true
|
|
19
|
+
},
|
|
20
|
+
"coleman_liau": {
|
|
21
|
+
"enabled": true
|
|
22
|
+
},
|
|
23
|
+
"ari": {
|
|
24
|
+
"enabled": true
|
|
25
|
+
},
|
|
26
|
+
"lix": {
|
|
27
|
+
"enabled": true,
|
|
28
|
+
"longWordThreshold": 6
|
|
29
|
+
}
|
|
30
|
+
}
|
|
31
|
+
}
|