axyseo 2.0.0-alpha.0.0.4 → 2.0.0-alpha.0.0.6

This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the package versions as they appear in their respective public registries.
Files changed (637)
  1. package/package.json +5 -2
  2. package/.browserslistrc +0 -1
  3. package/.gitattributes +0 -1
  4. package/babel.config.js +0 -3
  5. package/eslint.config.mjs +0 -119
  6. package/src/bundledPlugins/index.js +0 -5
  7. package/src/bundledPlugins/previouslyUsedKeywords.js +0 -192
  8. package/src/config/diacritics.js +0 -106
  9. package/src/config/getTransliterations.js +0 -1447
  10. package/src/config/transliterationsWPstyle.js +0 -774
  11. package/src/config/wordBoundaries.js +0 -23
  12. package/src/config/wordBoundariesWithoutPunctuation.js +0 -9
  13. package/src/const/analysis.js +0 -41
  14. package/src/errors/invalidType.js +0 -14
  15. package/src/errors/missingArgument.js +0 -14
  16. package/src/helpers/createMeasurementElement.js +0 -40
  17. package/src/helpers/domManipulation.js +0 -65
  18. package/src/helpers/errors.js +0 -26
  19. package/src/helpers/factory.js +0 -219
  20. package/src/helpers/formatNumber.js +0 -12
  21. package/src/helpers/formatString.js +0 -33
  22. package/src/helpers/getLanguagesWithWordComplexity.js +0 -8
  23. package/src/helpers/getLanguagesWithWordFormSupport.js +0 -11
  24. package/src/helpers/getWordComplexityConfig.js +0 -20
  25. package/src/helpers/getWordComplexityHelper.js +0 -20
  26. package/src/helpers/htmlEntities.js +0 -41
  27. package/src/helpers/includesAny.js +0 -19
  28. package/src/helpers/index.js +0 -127
  29. package/src/helpers/shortlinker/Shortlinker.js +0 -75
  30. package/src/helpers/shortlinker/index.js +0 -1
  31. package/src/helpers/shortlinker/singleton.js +0 -68
  32. package/src/helpers/types.js +0 -34
  33. package/src/index.js +0 -60
  34. package/src/languageProcessing/AbstractResearcher.js +0 -366
  35. package/src/languageProcessing/helpers/highlighting/getMarkingsInSentence.js +0 -125
  36. package/src/languageProcessing/helpers/html/getFieldsToMark.js +0 -29
  37. package/src/languageProcessing/helpers/html/getSubheadingTexts.js +0 -47
  38. package/src/languageProcessing/helpers/html/getSubheadings.js +0 -95
  39. package/src/languageProcessing/helpers/html/html.js +0 -176
  40. package/src/languageProcessing/helpers/html/htmlParser.js +0 -145
  41. package/src/languageProcessing/helpers/html/matchParagraphs.js +0 -62
  42. package/src/languageProcessing/helpers/html/normalizeHTML.js +0 -16
  43. package/src/languageProcessing/helpers/image/getAltAttribute.js +0 -20
  44. package/src/languageProcessing/helpers/image/getImagesInTree.js +0 -16
  45. package/src/languageProcessing/helpers/image/imageInText.js +0 -19
  46. package/src/languageProcessing/helpers/index.js +0 -12
  47. package/src/languageProcessing/helpers/language/getLanguage.js +0 -9
  48. package/src/languageProcessing/helpers/link/checkNofollow.js +0 -38
  49. package/src/languageProcessing/helpers/link/getAnchorsFromText.js +0 -32
  50. package/src/languageProcessing/helpers/link/getLinkType.js +0 -32
  51. package/src/languageProcessing/helpers/match/findKeywordFormsInString.js +0 -101
  52. package/src/languageProcessing/helpers/match/isDoubleQuoted.js +0 -13
  53. package/src/languageProcessing/helpers/match/matchTextWithArray.js +0 -36
  54. package/src/languageProcessing/helpers/match/matchTextWithTransliteration.js +0 -58
  55. package/src/languageProcessing/helpers/match/matchTextWithWord.js +0 -45
  56. package/src/languageProcessing/helpers/match/matchWordFormsWithSentence.js +0 -164
  57. package/src/languageProcessing/helpers/match/processExactMatchRequest.js +0 -20
  58. package/src/languageProcessing/helpers/morphology/baseStemmer.js +0 -11
  59. package/src/languageProcessing/helpers/morphology/buildFormRule.js +0 -19
  60. package/src/languageProcessing/helpers/morphology/buildTopicStems.js +0 -169
  61. package/src/languageProcessing/helpers/morphology/createRulesFromArrays.js +0 -45
  62. package/src/languageProcessing/helpers/morphology/exceptionListHelpers.js +0 -65
  63. package/src/languageProcessing/helpers/morphology/findMatchingEndingInArray.js +0 -24
  64. package/src/languageProcessing/helpers/morphology/flattenSortLength.js +0 -14
  65. package/src/languageProcessing/helpers/morphology/getAllWordsFromPaper.js +0 -39
  66. package/src/languageProcessing/helpers/morphology/regexHelpers.js +0 -44
  67. package/src/languageProcessing/helpers/morphology/stemHelpers.js +0 -38
  68. package/src/languageProcessing/helpers/morphology/stemPrefixedFunctionWords.js +0 -31
  69. package/src/languageProcessing/helpers/passiveVoice/periphrastic/directPrecedenceException.js +0 -36
  70. package/src/languageProcessing/helpers/passiveVoice/periphrastic/freeAuxiliaryParticipleOrder/getClausesSplitOnStopWords.js +0 -113
  71. package/src/languageProcessing/helpers/passiveVoice/periphrastic/freeAuxiliaryParticipleOrder/nonDirectParticiplePrecedenceException.js +0 -45
  72. package/src/languageProcessing/helpers/passiveVoice/periphrastic/getClauses.js +0 -231
  73. package/src/languageProcessing/helpers/passiveVoice/periphrastic/getIndicesWithRegex.js +0 -20
  74. package/src/languageProcessing/helpers/passiveVoice/periphrastic/matchRegularParticiples.js +0 -23
  75. package/src/languageProcessing/helpers/passiveVoice/periphrastic/precedenceException.js +0 -40
  76. package/src/languageProcessing/helpers/prominentWords/determineProminentWords.js +0 -238
  77. package/src/languageProcessing/helpers/regex/createRegexFromArray.js +0 -35
  78. package/src/languageProcessing/helpers/regex/createRegexFromDoubleArray.js +0 -34
  79. package/src/languageProcessing/helpers/regex/createWordRegex.js +0 -30
  80. package/src/languageProcessing/helpers/regex/matchStringWithRegex.js +0 -19
  81. package/src/languageProcessing/helpers/regex/searchAndReplaceWithOneRegex.js +0 -14
  82. package/src/languageProcessing/helpers/sanitize/doubleQuotes.js +0 -12
  83. package/src/languageProcessing/helpers/sanitize/filterShortcodesFromTree.js +0 -131
  84. package/src/languageProcessing/helpers/sanitize/mergeListItems.js +0 -24
  85. package/src/languageProcessing/helpers/sanitize/parseSynonyms.js +0 -20
  86. package/src/languageProcessing/helpers/sanitize/quotes.js +0 -46
  87. package/src/languageProcessing/helpers/sanitize/removeEmailAddresses.js +0 -12
  88. package/src/languageProcessing/helpers/sanitize/removePunctuation.js +0 -64
  89. package/src/languageProcessing/helpers/sanitize/removePunctuationExceptQuotes.js +0 -18
  90. package/src/languageProcessing/helpers/sanitize/removeSentenceTerminators.js +0 -13
  91. package/src/languageProcessing/helpers/sanitize/removeURLs.js +0 -13
  92. package/src/languageProcessing/helpers/sanitize/sanitizeLineBreakTag.js +0 -11
  93. package/src/languageProcessing/helpers/sanitize/sanitizeString.js +0 -18
  94. package/src/languageProcessing/helpers/sanitize/stripHTMLTags.js +0 -57
  95. package/src/languageProcessing/helpers/sanitize/stripNonTextTags.js +0 -15
  96. package/src/languageProcessing/helpers/sanitize/stripNumbers.js +0 -21
  97. package/src/languageProcessing/helpers/sanitize/stripSpaces.js +0 -23
  98. package/src/languageProcessing/helpers/sanitize/stripWordBoundaries.js +0 -65
  99. package/src/languageProcessing/helpers/sanitize/unifyWhitespace.js +0 -61
  100. package/src/languageProcessing/helpers/sentence/SentenceTokenizer.js +0 -640
  101. package/src/languageProcessing/helpers/sentence/countSentences.js +0 -20
  102. package/src/languageProcessing/helpers/sentence/getSentences.js +0 -65
  103. package/src/languageProcessing/helpers/sentence/getSentencesFromTree.js +0 -55
  104. package/src/languageProcessing/helpers/sentence/memoizedSentenceTokenizer.js +0 -28
  105. package/src/languageProcessing/helpers/sentence/sentencesLength.js +0 -31
  106. package/src/languageProcessing/helpers/syllables/DeviationFragment.js +0 -112
  107. package/src/languageProcessing/helpers/syllables/countSyllables.js +0 -182
  108. package/src/languageProcessing/helpers/syllables/syllableCountIterator.js +0 -56
  109. package/src/languageProcessing/helpers/syllables/syllableCountStep.js +0 -68
  110. package/src/languageProcessing/helpers/transform/transformWordsWithHyphens.js +0 -17
  111. package/src/languageProcessing/helpers/transliterate/replaceDiacritics.js +0 -22
  112. package/src/languageProcessing/helpers/transliterate/specialCharacterMappings.js +0 -214
  113. package/src/languageProcessing/helpers/transliterate/transliterate.js +0 -20
  114. package/src/languageProcessing/helpers/transliterate/transliterateWPstyle.js +0 -21
  115. package/src/languageProcessing/helpers/url/parseSlug.js +0 -10
  116. package/src/languageProcessing/helpers/url/url.js +0 -172
  117. package/src/languageProcessing/helpers/word/addWordboundary.js +0 -37
  118. package/src/languageProcessing/helpers/word/areWordsInSentence.js +0 -16
  119. package/src/languageProcessing/helpers/word/countMetaDescriptionLength.js +0 -18
  120. package/src/languageProcessing/helpers/word/countWords.js +0 -14
  121. package/src/languageProcessing/helpers/word/createPunctuationTokens.js +0 -42
  122. package/src/languageProcessing/helpers/word/filterWordsFromArray.js +0 -15
  123. package/src/languageProcessing/helpers/word/followsIndex.js +0 -25
  124. package/src/languageProcessing/helpers/word/getAllWordsFromTree.js +0 -23
  125. package/src/languageProcessing/helpers/word/getWords.js +0 -43
  126. package/src/languageProcessing/helpers/word/includesIndex.js +0 -30
  127. package/src/languageProcessing/helpers/word/indices.js +0 -146
  128. package/src/languageProcessing/helpers/word/markWordsInSentences.js +0 -173
  129. package/src/languageProcessing/helpers/word/matchWordInSentence.js +0 -61
  130. package/src/languageProcessing/helpers/word/splitIntoTokens.js +0 -46
  131. package/src/languageProcessing/index.js +0 -91
  132. package/src/languageProcessing/languages/_default/Researcher.js +0 -34
  133. package/src/languageProcessing/languages/_default/helpers/getStemmer.js +0 -11
  134. package/src/languageProcessing/languages/ar/Researcher.js +0 -46
  135. package/src/languageProcessing/languages/ar/config/firstWordExceptions.js +0 -14
  136. package/src/languageProcessing/languages/ar/config/functionWords.js +0 -329
  137. package/src/languageProcessing/languages/ar/config/internal/passiveVerbsWithLongVowel.js +0 -570
  138. package/src/languageProcessing/languages/ar/config/prefixedFunctionWords.js +0 -5
  139. package/src/languageProcessing/languages/ar/config/transitionWords.js +0 -19
  140. package/src/languageProcessing/languages/ar/config/twoPartTransitionWords.js +0 -7
  141. package/src/languageProcessing/languages/ar/helpers/createBasicWordForms.js +0 -32
  142. package/src/languageProcessing/languages/ar/helpers/getStemmer.js +0 -22
  143. package/src/languageProcessing/languages/ar/helpers/internal/stem.js +0 -632
  144. package/src/languageProcessing/languages/ar/helpers/isPassiveSentence.js +0 -33
  145. package/src/languageProcessing/languages/ca/Researcher.js +0 -43
  146. package/src/languageProcessing/languages/ca/config/sentenceLength.js +0 -3
  147. package/src/languageProcessing/languages/ca/config/transitionWords.js +0 -31
  148. package/src/languageProcessing/languages/ca/config/twoPartTransitionWords.js +0 -7
  149. package/src/languageProcessing/languages/ca/helpers/getStemmer.js +0 -11
  150. package/src/languageProcessing/languages/cs/Researcher.js +0 -44
  151. package/src/languageProcessing/languages/cs/config/firstWordExceptions.js +0 -15
  152. package/src/languageProcessing/languages/cs/config/functionWords.js +0 -121
  153. package/src/languageProcessing/languages/cs/config/internal/passiveVoiceAuxiliaries.js +0 -38
  154. package/src/languageProcessing/languages/cs/config/internal/passiveVoiceEndings.js +0 -54
  155. package/src/languageProcessing/languages/cs/config/stopWords.js +0 -42
  156. package/src/languageProcessing/languages/cs/config/transitionWords.js +0 -26
  157. package/src/languageProcessing/languages/cs/config/twoPartTransitionWords.js +0 -8
  158. package/src/languageProcessing/languages/cs/helpers/getClauses.js +0 -26
  159. package/src/languageProcessing/languages/cs/helpers/getStemmer.js +0 -22
  160. package/src/languageProcessing/languages/cs/helpers/internal/getParticiples.js +0 -16
  161. package/src/languageProcessing/languages/cs/helpers/internal/stem.js +0 -499
  162. package/src/languageProcessing/languages/cs/values/Clause.js +0 -34
  163. package/src/languageProcessing/languages/de/Researcher.js +0 -52
  164. package/src/languageProcessing/languages/de/config/firstWordExceptions.js +0 -17
  165. package/src/languageProcessing/languages/de/config/functionWords.js +0 -303
  166. package/src/languageProcessing/languages/de/config/internal/exceptionsParticiplesActive.js +0 -2231
  167. package/src/languageProcessing/languages/de/config/internal/passiveVoiceAuxiliaries.js +0 -96
  168. package/src/languageProcessing/languages/de/config/internal/passiveVoiceIrregulars.js +0 -368
  169. package/src/languageProcessing/languages/de/config/internal/passiveVoiceRegex.js +0 -72
  170. package/src/languageProcessing/languages/de/config/keyphraseLength.js +0 -11
  171. package/src/languageProcessing/languages/de/config/stopWords.js +0 -67
  172. package/src/languageProcessing/languages/de/config/syllables.json +0 -460
  173. package/src/languageProcessing/languages/de/config/transitionWords.js +0 -31
  174. package/src/languageProcessing/languages/de/config/twoPartTransitionWords.js +0 -12
  175. package/src/languageProcessing/languages/de/config/wordComplexity.js +0 -4
  176. package/src/languageProcessing/languages/de/helpers/calculateFleschReadingScore.js +0 -18
  177. package/src/languageProcessing/languages/de/helpers/checkIfWordIsComplex.js +0 -40
  178. package/src/languageProcessing/languages/de/helpers/checkIfWordIsFunction.js +0 -15
  179. package/src/languageProcessing/languages/de/helpers/getClauses.js +0 -25
  180. package/src/languageProcessing/languages/de/helpers/getStemmer.js +0 -22
  181. package/src/languageProcessing/languages/de/helpers/internal/SentenceTokenizer.js +0 -31
  182. package/src/languageProcessing/languages/de/helpers/internal/detectAndStemRegularParticiple.js +0 -128
  183. package/src/languageProcessing/languages/de/helpers/internal/determineStem.js +0 -128
  184. package/src/languageProcessing/languages/de/helpers/internal/getParticiples.js +0 -40
  185. package/src/languageProcessing/languages/de/helpers/internal/stem.js +0 -215
  186. package/src/languageProcessing/languages/de/helpers/memoizedSentenceTokenizer.js +0 -28
  187. package/src/languageProcessing/languages/de/values/Clause.js +0 -85
  188. package/src/languageProcessing/languages/el/Researcher.js +0 -46
  189. package/src/languageProcessing/languages/el/config/firstWordExceptions.js +0 -47
  190. package/src/languageProcessing/languages/el/config/functionWords.js +0 -116
  191. package/src/languageProcessing/languages/el/config/internal/auxiliaries.js +0 -19
  192. package/src/languageProcessing/languages/el/config/internal/morphologicalPassiveSuffixes.js +0 -87
  193. package/src/languageProcessing/languages/el/config/internal/nonPassiveVerbStems.js +0 -138
  194. package/src/languageProcessing/languages/el/config/stopWords.js +0 -854
  195. package/src/languageProcessing/languages/el/config/transitionWords.js +0 -26
  196. package/src/languageProcessing/languages/el/config/twoPartTransitionWords.js +0 -10
  197. package/src/languageProcessing/languages/el/helpers/getClauses.js +0 -25
  198. package/src/languageProcessing/languages/el/helpers/getStemmer.js +0 -21
  199. package/src/languageProcessing/languages/el/helpers/internal/getParticiples.js +0 -20
  200. package/src/languageProcessing/languages/el/helpers/internal/stem.js +0 -368
  201. package/src/languageProcessing/languages/el/helpers/isPassiveSentence.js +0 -38
  202. package/src/languageProcessing/languages/el/values/Clause.js +0 -37
  203. package/src/languageProcessing/languages/en/Researcher.js +0 -46
  204. package/src/languageProcessing/languages/en/config/abbreviations.js +0 -55
  205. package/src/languageProcessing/languages/en/config/firstWordExceptions.js +0 -14
  206. package/src/languageProcessing/languages/en/config/functionWords.js +0 -186
  207. package/src/languageProcessing/languages/en/config/internal/passiveVoiceAuxiliaries.js +0 -44
  208. package/src/languageProcessing/languages/en/config/internal/passiveVoiceIrregulars.js +0 -354
  209. package/src/languageProcessing/languages/en/config/internal/passiveVoiceNonVerbEndingEd.js +0 -3047
  210. package/src/languageProcessing/languages/en/config/regularParticiplesRegex.js +0 -5
  211. package/src/languageProcessing/languages/en/config/stopWords.js +0 -52
  212. package/src/languageProcessing/languages/en/config/syllables.json +0 -86
  213. package/src/languageProcessing/languages/en/config/transitionWords.js +0 -48
  214. package/src/languageProcessing/languages/en/config/twoPartTransitionWords.js +0 -7
  215. package/src/languageProcessing/languages/en/config/wordComplexity.js +0 -5
  216. package/src/languageProcessing/languages/en/helpers/calculateFleschReadingScore.js +0 -18
  217. package/src/languageProcessing/languages/en/helpers/checkIfWordIsComplex.js +0 -43
  218. package/src/languageProcessing/languages/en/helpers/getClauses.js +0 -49
  219. package/src/languageProcessing/languages/en/helpers/getStemmer.js +0 -22
  220. package/src/languageProcessing/languages/en/helpers/internal/determineStem.js +0 -178
  221. package/src/languageProcessing/languages/en/helpers/internal/getAdjectiveStem.js +0 -162
  222. package/src/languageProcessing/languages/en/helpers/internal/getParticiples.js +0 -25
  223. package/src/languageProcessing/languages/en/helpers/internal/getVerbStem.js +0 -237
  224. package/src/languageProcessing/languages/en/values/Clause.js +0 -68
  225. package/src/languageProcessing/languages/es/Researcher.js +0 -48
  226. package/src/languageProcessing/languages/es/config/firstWordExceptions.js +0 -16
  227. package/src/languageProcessing/languages/es/config/functionWords.js +0 -321
  228. package/src/languageProcessing/languages/es/config/internal/passiveVoiceAuxiliaries.js +0 -60
  229. package/src/languageProcessing/languages/es/config/internal/passiveVoiceParticiples.js +0 -7327
  230. package/src/languageProcessing/languages/es/config/sentenceLength.js +0 -3
  231. package/src/languageProcessing/languages/es/config/stopWords.js +0 -33
  232. package/src/languageProcessing/languages/es/config/syllables.json +0 -176
  233. package/src/languageProcessing/languages/es/config/transitionWords.js +0 -40
  234. package/src/languageProcessing/languages/es/config/twoPartTransitionWords.js +0 -10
  235. package/src/languageProcessing/languages/es/config/wordComplexity.js +0 -4
  236. package/src/languageProcessing/languages/es/helpers/calculateFleschReadingScore.js +0 -18
  237. package/src/languageProcessing/languages/es/helpers/checkIfWordIsComplex.js +0 -56
  238. package/src/languageProcessing/languages/es/helpers/getClauses.js +0 -29
  239. package/src/languageProcessing/languages/es/helpers/getStemmer.js +0 -22
  240. package/src/languageProcessing/languages/es/helpers/internal/checkVerbStemModifications.js +0 -41
  241. package/src/languageProcessing/languages/es/helpers/internal/getParticiples.js +0 -35
  242. package/src/languageProcessing/languages/es/helpers/internal/stem.js +0 -793
  243. package/src/languageProcessing/languages/es/values/Clause.js +0 -47
  244. package/src/languageProcessing/languages/fa/Researcher.js +0 -47
  245. package/src/languageProcessing/languages/fa/config/firstWordExceptions.js +0 -12
  246. package/src/languageProcessing/languages/fa/config/functionWords.js +0 -122
  247. package/src/languageProcessing/languages/fa/config/internal/participles.js +0 -1429
  248. package/src/languageProcessing/languages/fa/config/sentenceLength.js +0 -3
  249. package/src/languageProcessing/languages/fa/config/transitionWords.js +0 -20
  250. package/src/languageProcessing/languages/fa/config/twoPartTransitionWords.js +0 -9
  251. package/src/languageProcessing/languages/fa/helpers/createBasicWordForms.js +0 -97
  252. package/src/languageProcessing/languages/fa/helpers/getStemmer.js +0 -13
  253. package/src/languageProcessing/languages/fa/helpers/isPassiveSentence.js +0 -14
  254. package/src/languageProcessing/languages/fr/Researcher.js +0 -46
  255. package/src/languageProcessing/languages/fr/config/firstWordExceptions.js +0 -16
  256. package/src/languageProcessing/languages/fr/config/functionWords.js +0 -281
  257. package/src/languageProcessing/languages/fr/config/internal/exceptionsParticiplesActive.js +0 -1510
  258. package/src/languageProcessing/languages/fr/config/internal/passiveVoiceAuxiliaries.js +0 -108
  259. package/src/languageProcessing/languages/fr/config/internal/passiveVoiceIrregulars.js +0 -565
  260. package/src/languageProcessing/languages/fr/config/stopWords.js +0 -119
  261. package/src/languageProcessing/languages/fr/config/syllables.json +0 -1426
  262. package/src/languageProcessing/languages/fr/config/transitionWords.js +0 -59
  263. package/src/languageProcessing/languages/fr/config/twoPartTransitionWords.js +0 -15
  264. package/src/languageProcessing/languages/fr/config/wordComplexity.js +0 -4
  265. package/src/languageProcessing/languages/fr/helpers/calculateFleschReadingScore.js +0 -18
  266. package/src/languageProcessing/languages/fr/helpers/checkIfWordIsComplex.js +0 -67
  267. package/src/languageProcessing/languages/fr/helpers/getClauses.js +0 -34
  268. package/src/languageProcessing/languages/fr/helpers/getStemmer.js +0 -22
  269. package/src/languageProcessing/languages/fr/helpers/internal/getParticiples.js +0 -72
  270. package/src/languageProcessing/languages/fr/helpers/internal/stem.js +0 -633
  271. package/src/languageProcessing/languages/fr/values/Clause.js +0 -96
  272. package/src/languageProcessing/languages/he/Researcher.js +0 -50
  273. package/src/languageProcessing/languages/he/config/firstWordExceptions.js +0 -13
  274. package/src/languageProcessing/languages/he/config/functionWords.js +0 -564
  275. package/src/languageProcessing/languages/he/config/internal/regularRootsHufal.js +0 -186
  276. package/src/languageProcessing/languages/he/config/internal/regularRootsNifal.js +0 -195
  277. package/src/languageProcessing/languages/he/config/internal/regularRootsPual.js +0 -168
  278. package/src/languageProcessing/languages/he/config/passiveVoice/regularRootsHufal.js +0 -188
  279. package/src/languageProcessing/languages/he/config/passiveVoice/regularRootsNifal.js +0 -197
  280. package/src/languageProcessing/languages/he/config/passiveVoice/regularRootsPual.js +0 -170
  281. package/src/languageProcessing/languages/he/config/prefixedFunctionWords.js +0 -2
  282. package/src/languageProcessing/languages/he/config/sentenceLength.js +0 -3
  283. package/src/languageProcessing/languages/he/config/transitionWords.js +0 -28
  284. package/src/languageProcessing/languages/he/config/twoPartTransitionWords.js +0 -8
  285. package/src/languageProcessing/languages/he/helpers/createBasicWordForms.js +0 -33
  286. package/src/languageProcessing/languages/he/helpers/getStemmer.js +0 -22
  287. package/src/languageProcessing/languages/he/helpers/internal/stem.js +0 -52
  288. package/src/languageProcessing/languages/he/helpers/isPassiveSentence.js +0 -96
  289. package/src/languageProcessing/languages/he/helpers/stem.js +0 -52
  290. package/src/languageProcessing/languages/hu/Researcher.js +0 -48
  291. package/src/languageProcessing/languages/hu/config/firstWordExceptions.js +0 -31
  292. package/src/languageProcessing/languages/hu/config/functionWords.js +0 -284
  293. package/src/languageProcessing/languages/hu/config/internal/auxiliaries.js +0 -97
  294. package/src/languageProcessing/languages/hu/config/internal/morphologicalPassiveAffixes.js +0 -125
  295. package/src/languageProcessing/languages/hu/config/internal/nonPassivesInVaAndVe.js +0 -265
  296. package/src/languageProcessing/languages/hu/config/internal/odikVerbs.js +0 -273
  297. package/src/languageProcessing/languages/hu/config/internal/participles.js +0 -412
  298. package/src/languageProcessing/languages/hu/config/stopWords.js +0 -213
  299. package/src/languageProcessing/languages/hu/config/transitionWords.js +0 -42
  300. package/src/languageProcessing/languages/hu/config/twoPartTransitionWords.js +0 -34
  301. package/src/languageProcessing/languages/hu/helpers/getClauses.js +0 -25
  302. package/src/languageProcessing/languages/hu/helpers/getStemmer.js +0 -22
  303. package/src/languageProcessing/languages/hu/helpers/internal/getParticiples.js +0 -21
  304. package/src/languageProcessing/languages/hu/helpers/internal/stem.js +0 -389
  305. package/src/languageProcessing/languages/hu/helpers/isPassiveSentence.js +0 -54
  306. package/src/languageProcessing/languages/hu/values/Clause.js +0 -41
  307. package/src/languageProcessing/languages/id/Researcher.js +0 -46
  308. package/src/languageProcessing/languages/id/config/firstWordExceptions.js +0 -13
  309. package/src/languageProcessing/languages/id/config/functionWords.js +0 -202
  310. package/src/languageProcessing/languages/id/config/internal/nonPassiveVerbsStartingDi.js +0 -215
  311. package/src/languageProcessing/languages/id/config/transitionWords.js +0 -62
  312. package/src/languageProcessing/languages/id/config/twoPartTransitionWords.js +0 -13
  313. package/src/languageProcessing/languages/id/helpers/getStemmer.js +0 -22
  314. package/src/languageProcessing/languages/id/helpers/internal/stem.js +0 -462
  315. package/src/languageProcessing/languages/id/helpers/internal/stemHelpers.js +0 -78
  316. package/src/languageProcessing/languages/id/helpers/isPassiveSentence.js +0 -39
  317. package/src/languageProcessing/languages/id/helpers/splitIntoTokensCustom.js +0 -47
  318. package/src/languageProcessing/languages/it/Researcher.js +0 -48
  319. package/src/languageProcessing/languages/it/config/firstWordExceptions.js +0 -17
  320. package/src/languageProcessing/languages/it/config/functionWords.js +0 -277
  321. package/src/languageProcessing/languages/it/config/internal/passiveVoiceAuxiliaries.js +0 -98
  322. package/src/languageProcessing/languages/it/config/internal/passiveVoiceParticiples.js +0 -7197
  323. package/src/languageProcessing/languages/it/config/sentenceLength.js +0 -3
  324. package/src/languageProcessing/languages/it/config/stopWords.js +0 -57
  325. package/src/languageProcessing/languages/it/config/syllables.json +0 -573
  326. package/src/languageProcessing/languages/it/config/transitionWords.js +0 -104
  327. package/src/languageProcessing/languages/it/config/twoPartTransitionWords.js +0 -9
  328. package/src/languageProcessing/languages/it/helpers/calculateFleschReadingScore.js +0 -15
  329. package/src/languageProcessing/languages/it/helpers/getClauses.js +0 -32
  330. package/src/languageProcessing/languages/it/helpers/getStemmer.js +0 -22
  331. package/src/languageProcessing/languages/it/helpers/internal/getParticiples.js +0 -34
  332. package/src/languageProcessing/languages/it/helpers/internal/stem.js +0 -436
  333. package/src/languageProcessing/languages/it/values/Clause.js +0 -47
  334. package/src/languageProcessing/languages/ja/Researcher.js +0 -86
  335. package/src/languageProcessing/languages/ja/config/assessmentApplicabilityCharacterCount.js +0 -4
  336. package/src/languageProcessing/languages/ja/config/firstWordExceptions.js +0 -8
  337. package/src/languageProcessing/languages/ja/config/functionWords.js +0 -563
  338. package/src/languageProcessing/languages/ja/config/keyphraseLength.js +0 -16
  339. package/src/languageProcessing/languages/ja/config/metaDescriptionLength.js +0 -4
  340. package/src/languageProcessing/languages/ja/config/paragraphLength.js +0 -10
  341. package/src/languageProcessing/languages/ja/config/sentenceLength.js +0 -4
  342. package/src/languageProcessing/languages/ja/config/subheadingsTooLong.js +0 -18
  343. package/src/languageProcessing/languages/ja/config/textLength.js +0 -47
  344. package/src/languageProcessing/languages/ja/config/topicLength.js +0 -5
  345. package/src/languageProcessing/languages/ja/config/transitionWords.js +0 -354
  346. package/src/languageProcessing/languages/ja/customResearches/findKeyphraseInSEOTitle.js +0 -98
  347. package/src/languageProcessing/languages/ja/customResearches/getKeyphraseLength.js +0 -19
  348. package/src/languageProcessing/languages/ja/customResearches/getWordForms.js +0 -50
  349. package/src/languageProcessing/languages/ja/customResearches/textLength.js +0 -24
  350. package/src/languageProcessing/languages/ja/helpers/countCharacters.js +0 -19
  351. package/src/languageProcessing/languages/ja/helpers/customGetStemmer.js +0 -21
  352. package/src/languageProcessing/languages/ja/helpers/getContentWords.js +0 -21
  353. package/src/languageProcessing/languages/ja/helpers/getWords.js +0 -31
  354. package/src/languageProcessing/languages/ja/helpers/internal/SentenceTokenizer.js +0 -102
  355. package/src/languageProcessing/languages/ja/helpers/internal/createWordForms.js +0 -68
  356. package/src/languageProcessing/languages/ja/helpers/internal/determineStem.js +0 -17
  357. package/src/languageProcessing/languages/ja/helpers/matchTextWithWord.js +0 -53
  358. package/src/languageProcessing/languages/ja/helpers/matchTransitionWords.js +0 -25
  359. package/src/languageProcessing/languages/ja/helpers/memoizedSentenceTokenizer.js +0 -28
  360. package/src/languageProcessing/languages/ja/helpers/splitIntoTokensCustom.js +0 -20
  361. package/src/languageProcessing/languages/ja/helpers/wordsCharacterCount.js +0 -13
  362. package/src/languageProcessing/languages/nb/Researcher.js +0 -45
  363. package/src/languageProcessing/languages/nb/config/firstWordExceptions.js +0 -12
  364. package/src/languageProcessing/languages/nb/config/functionWords.js +0 -106
  365. package/src/languageProcessing/languages/nb/config/internal/participles.js +0 -3127
  366. package/src/languageProcessing/languages/nb/config/internal/passiveVoiceAuxiliaries.js +0 -15
  367. package/src/languageProcessing/languages/nb/config/stopWords.js +0 -39
  368. package/src/languageProcessing/languages/nb/config/transitionWords.js +0 -21
  369. package/src/languageProcessing/languages/nb/config/twoPartTransitionWords.js +0 -10
  370. package/src/languageProcessing/languages/nb/helpers/getClauses.js +0 -28
  371. package/src/languageProcessing/languages/nb/helpers/getStemmer.js +0 -22
  372. package/src/languageProcessing/languages/nb/helpers/internal/getParticiples.js +0 -24
  373. package/src/languageProcessing/languages/nb/helpers/internal/stem.js +0 -133
  374. package/src/languageProcessing/languages/nb/values/Clause.js +0 -43
  375. package/src/languageProcessing/languages/nl/Researcher.js +0 -48
  376. package/src/languageProcessing/languages/nl/config/firstWordExceptions.js +0 -15
  377. package/src/languageProcessing/languages/nl/config/functionWords.js +0 -233
  378. package/src/languageProcessing/languages/nl/config/internal/nonParticiples.js +0 -2515
  379. package/src/languageProcessing/languages/nl/config/internal/passiveVoiceAuxiliaries.js +0 -13
  380. package/src/languageProcessing/languages/nl/config/internal/passiveVoiceIrregulars.js +0 -474
  381. package/src/languageProcessing/languages/nl/config/keyphraseLength.js +0 -10
  382. package/src/languageProcessing/languages/nl/config/stopWords.js +0 -35
  383. package/src/languageProcessing/languages/nl/config/syllables.json +0 -343
  384. package/src/languageProcessing/languages/nl/config/transitionWords.js +0 -22
  385. package/src/languageProcessing/languages/nl/config/twoPartTransitionWords.js +0 -8
  386. package/src/languageProcessing/languages/nl/helpers/calculateFleschReadingScore.js +0 -15
  387. package/src/languageProcessing/languages/nl/helpers/getClauses.js +0 -25
  388. package/src/languageProcessing/languages/nl/helpers/getStemmer.js +0 -22
  389. package/src/languageProcessing/languages/nl/helpers/internal/checkExceptionsWithFullForms.js +0 -128
  390. package/src/languageProcessing/languages/nl/helpers/internal/detectAndStemRegularParticiple.js +0 -324
  391. package/src/languageProcessing/languages/nl/helpers/internal/detectAndStemSuffixes.js +0 -164
  392. package/src/languageProcessing/languages/nl/helpers/internal/determineStem.js +0 -133
  393. package/src/languageProcessing/languages/nl/helpers/internal/getParticiples.js +0 -25
  394. package/src/languageProcessing/languages/nl/helpers/internal/getStemWordsWithTAndDEnding.js +0 -183
  395. package/src/languageProcessing/languages/nl/helpers/internal/stem.js +0 -146
  396. package/src/languageProcessing/languages/nl/helpers/internal/stemModificationHelpers.js +0 -109
  397. package/src/languageProcessing/languages/nl/helpers/internal/stemTOrDFromEndOfWord.js +0 -65
  398. package/src/languageProcessing/languages/nl/values/Clause.js +0 -62
  399. package/src/languageProcessing/languages/pl/Researcher.js +0 -47
  400. package/src/languageProcessing/languages/pl/config/firstWordExceptions.js +0 -12
  401. package/src/languageProcessing/languages/pl/config/functionWords.js +0 -421
  402. package/src/languageProcessing/languages/pl/config/internal/auxiliaries.js +0 -85
  403. package/src/languageProcessing/languages/pl/config/internal/participles.js +0 -26433
  404. package/src/languageProcessing/languages/pl/config/sentenceLength.js +0 -10
  405. package/src/languageProcessing/languages/pl/config/stopWords.js +0 -36
  406. package/src/languageProcessing/languages/pl/config/transitionWords.js +0 -42
  407. package/src/languageProcessing/languages/pl/config/twoPartTransitionWords.js +0 -8
  408. package/src/languageProcessing/languages/pl/helpers/getClauses.js +0 -25
  409. package/src/languageProcessing/languages/pl/helpers/getStemmer.js +0 -22
  410. package/src/languageProcessing/languages/pl/helpers/internal/getParticiples.js +0 -18
  411. package/src/languageProcessing/languages/pl/helpers/internal/stem.js +0 -161
  412. package/src/languageProcessing/languages/pl/values/Clause.js +0 -53
  413. package/src/languageProcessing/languages/pt/Researcher.js +0 -48
  414. package/src/languageProcessing/languages/pt/config/firstWordExceptions.js +0 -15
  415. package/src/languageProcessing/languages/pt/config/functionWords.js +0 -226
  416. package/src/languageProcessing/languages/pt/config/internal/passiveVoiceAuxiliaries.js +0 -66
  417. package/src/languageProcessing/languages/pt/config/internal/passiveVoiceParticiples.js +0 -4088
  418. package/src/languageProcessing/languages/pt/config/sentenceLength.js +0 -3
  419. package/src/languageProcessing/languages/pt/config/stopWords.js +0 -50
  420. package/src/languageProcessing/languages/pt/config/syllables.json +0 -38
  421. package/src/languageProcessing/languages/pt/config/transitionWords.js +0 -34
  422. package/src/languageProcessing/languages/pt/config/twoPartTransitionWords.js +0 -9
  423. package/src/languageProcessing/languages/pt/helpers/calculateFleschReadingScore.js +0 -15
  424. package/src/languageProcessing/languages/pt/helpers/getClauses.js +0 -29
  425. package/src/languageProcessing/languages/pt/helpers/getStemmer.js +0 -22
  426. package/src/languageProcessing/languages/pt/helpers/internal/getParticiples.js +0 -35
  427. package/src/languageProcessing/languages/pt/helpers/internal/stem.js +0 -319
  428. package/src/languageProcessing/languages/pt/values/Clause.js +0 -43
  429. package/src/languageProcessing/languages/ru/Researcher.js +0 -48
  430. package/src/languageProcessing/languages/ru/config/firstWordExceptions.js +0 -14
  431. package/src/languageProcessing/languages/ru/config/fleschReadingEaseScores.js +0 -20
  432. package/src/languageProcessing/languages/ru/config/functionWords.js +0 -519
  433. package/src/languageProcessing/languages/ru/config/internal/participlesShortenedList.js +0 -2914
  434. package/src/languageProcessing/languages/ru/config/internal/passiveVoiceParticiples.js +0 -6295
  435. package/src/languageProcessing/languages/ru/config/sentenceLength.js +0 -3
  436. package/src/languageProcessing/languages/ru/config/syllables.json +0 -19
  437. package/src/languageProcessing/languages/ru/config/transitionWords.js +0 -62
  438. package/src/languageProcessing/languages/ru/config/twoPartTransitionWords.js +0 -14
  439. package/src/languageProcessing/languages/ru/helpers/calculateFleschReadingScore.js +0 -16
  440. package/src/languageProcessing/languages/ru/helpers/getStemmer.js +0 -22
  441. package/src/languageProcessing/languages/ru/helpers/internal/stem.js +0 -288
  442. package/src/languageProcessing/languages/ru/helpers/isPassiveSentence.js +0 -14
  443. package/src/languageProcessing/languages/sk/Researcher.js +0 -46
  444. package/src/languageProcessing/languages/sk/config/firstWordExceptions.js +0 -14
  445. package/src/languageProcessing/languages/sk/config/functionWords.js +0 -855
  446. package/src/languageProcessing/languages/sk/config/internal/nonPassives.js +0 -1074
  447. package/src/languageProcessing/languages/sk/config/internal/passiveVoiceAuxiliaries.js +0 -22
  448. package/src/languageProcessing/languages/sk/config/stopWords.js +0 -34
  449. package/src/languageProcessing/languages/sk/config/transitionWords.js +0 -23
  450. package/src/languageProcessing/languages/sk/config/twoPartTransitionWords.js +0 -10
  451. package/src/languageProcessing/languages/sk/helpers/getClauses.js +0 -26
  452. package/src/languageProcessing/languages/sk/helpers/getStemmer.js +0 -22
  453. package/src/languageProcessing/languages/sk/helpers/internal/getParticiples.js +0 -16
  454. package/src/languageProcessing/languages/sk/helpers/internal/stem.js +0 -319
  455. package/src/languageProcessing/languages/sk/values/Clause.js +0 -39
  456. package/src/languageProcessing/languages/sv/Researcher.js +0 -45
  457. package/src/languageProcessing/languages/sv/config/firstWordExceptions.js +0 -15
  458. package/src/languageProcessing/languages/sv/config/functionWords.js +0 -176
  459. package/src/languageProcessing/languages/sv/config/internal/passiveVerbs.js +0 -10400
  460. package/src/languageProcessing/languages/sv/config/keyphraseLength.js +0 -11
  461. package/src/languageProcessing/languages/sv/config/transitionWords.js +0 -35
  462. package/src/languageProcessing/languages/sv/config/twoPartTransitionWords.js +0 -8
  463. package/src/languageProcessing/languages/sv/helpers/getStemmer.js +0 -22
  464. package/src/languageProcessing/languages/sv/helpers/internal/stem.js +0 -152
  465. package/src/languageProcessing/languages/sv/helpers/isPassiveSentence.js +0 -14
  466. package/src/languageProcessing/languages/tr/Researcher.js +0 -44
  467. package/src/languageProcessing/languages/tr/config/firstWordExceptions.js +0 -13
  468. package/src/languageProcessing/languages/tr/config/functionWords.js +0 -116
  469. package/src/languageProcessing/languages/tr/config/internal/nonPassiveExceptions.js +0 -574
  470. package/src/languageProcessing/languages/tr/config/internal/passiveEndings.js +0 -151
  471. package/src/languageProcessing/languages/tr/config/sentenceLength.js +0 -7
  472. package/src/languageProcessing/languages/tr/config/transitionWords.js +0 -42
  473. package/src/languageProcessing/languages/tr/config/twoPartTransitionWords.js +0 -7
  474. package/src/languageProcessing/languages/tr/helpers/getStemmer.js +0 -22
  475. package/src/languageProcessing/languages/tr/helpers/internal/stem.js +0 -20
  476. package/src/languageProcessing/languages/tr/helpers/isPassiveSentence.js +0 -43
  477. package/src/languageProcessing/researches/altTagCount.js +0 -70
  478. package/src/languageProcessing/researches/countSentencesFromText.js +0 -19
  479. package/src/languageProcessing/researches/findKeyphraseInSEOTitle.js +0 -257
  480. package/src/languageProcessing/researches/findKeywordInFirstParagraph.js +0 -86
  481. package/src/languageProcessing/researches/findTransitionWords.js +0 -123
  482. package/src/languageProcessing/researches/functionWordsInKeyphrase.js +0 -44
  483. package/src/languageProcessing/researches/getAnchorsWithKeyphrase.js +0 -227
  484. package/src/languageProcessing/researches/getFleschReadingScore.js +0 -150
  485. package/src/languageProcessing/researches/getKeywordDensity.js +0 -44
  486. package/src/languageProcessing/researches/getLinkStatistics.js +0 -54
  487. package/src/languageProcessing/researches/getLinks.js +0 -18
  488. package/src/languageProcessing/researches/getLongCenterAlignedTexts.js +0 -37
  489. package/src/languageProcessing/researches/getParagraphLength.js +0 -44
  490. package/src/languageProcessing/researches/getParagraphs.js +0 -18
  491. package/src/languageProcessing/researches/getPassiveVoiceResult.js +0 -129
  492. package/src/languageProcessing/researches/getProminentWordsForInsights.js +0 -48
  493. package/src/languageProcessing/researches/getProminentWordsForInternalLinking.js +0 -119
  494. package/src/languageProcessing/researches/getSentenceBeginnings.js +0 -124
  495. package/src/languageProcessing/researches/getSubheadingTextLengths.js +0 -59
  496. package/src/languageProcessing/researches/getWordForms.js +0 -204
  497. package/src/languageProcessing/researches/h1s.js +0 -10
  498. package/src/languageProcessing/researches/imageCount.js +0 -16
  499. package/src/languageProcessing/researches/index.js +0 -5
  500. package/src/languageProcessing/researches/keyphraseDistribution.js +0 -249
  501. package/src/languageProcessing/researches/keyphraseLength.js +0 -17
  502. package/src/languageProcessing/researches/keywordCount.js +0 -134
  503. package/src/languageProcessing/researches/keywordCountInUrl.js +0 -57
  504. package/src/languageProcessing/researches/matchKeywordInSubheadings.js +0 -62
  505. package/src/languageProcessing/researches/metaDescriptionKeyword.js +0 -85
  506. package/src/languageProcessing/researches/metaDescriptionLength.js +0 -12
  507. package/src/languageProcessing/researches/pageTitleWidth.js +0 -11
  508. package/src/languageProcessing/researches/readingTime.js +0 -82
  509. package/src/languageProcessing/researches/sentences.js +0 -20
  510. package/src/languageProcessing/researches/videoCount.js +0 -32
  511. package/src/languageProcessing/researches/wordComplexity.js +0 -129
  512. package/src/languageProcessing/researches/wordCountInText.js +0 -29
  513. package/src/languageProcessing/values/Clause.js +0 -108
  514. package/src/languageProcessing/values/ProminentWord.js +0 -95
  515. package/src/languageProcessing/values/Sentence.js +0 -111
  516. package/src/languageProcessing/values/index.js +0 -9
  517. package/src/markers/addMark.js +0 -9
  518. package/src/markers/addMarkSingleWord.js +0 -32
  519. package/src/markers/index.js +0 -7
  520. package/src/markers/removeDuplicateMarks.js +0 -27
  521. package/src/markers/removeMarks.js +0 -11
  522. package/src/parse/build/build.js +0 -52
  523. package/src/parse/build/index.js +0 -10
  524. package/src/parse/build/private/adapt.js +0 -113
  525. package/src/parse/build/private/adaptAttributes.js +0 -36
  526. package/src/parse/build/private/alwaysFilterElements.js +0 -75
  527. package/src/parse/build/private/combineIntoImplicitParagraphs.js +0 -130
  528. package/src/parse/build/private/filterBeforeTokenizing.js +0 -32
  529. package/src/parse/build/private/filterHelpers.js +0 -44
  530. package/src/parse/build/private/filterTree.js +0 -42
  531. package/src/parse/build/private/getTextElementPositions.js +0 -184
  532. package/src/parse/build/private/helpers/parseClassAttribute.js +0 -9
  533. package/src/parse/build/private/isPhrasingContent.js +0 -28
  534. package/src/parse/build/private/parseBlocks.js +0 -151
  535. package/src/parse/build/private/tokenize.js +0 -74
  536. package/src/parse/language/LanguageProcessor.js +0 -74
  537. package/src/parse/structure/Heading.js +0 -26
  538. package/src/parse/structure/Node.js +0 -69
  539. package/src/parse/structure/Paragraph.js +0 -48
  540. package/src/parse/structure/Sentence.js +0 -30
  541. package/src/parse/structure/SourceCodeLocation.js +0 -41
  542. package/src/parse/structure/Text.js +0 -27
  543. package/src/parse/structure/Token.js +0 -24
  544. package/src/parse/structure/index.js +0 -16
  545. package/src/parse/traverse/findAllInTree.js +0 -58
  546. package/src/parse/traverse/index.js +0 -12
  547. package/src/parse/traverse/innerText.js +0 -26
  548. package/src/parsedPaper/ParsedPaper.js +0 -92
  549. package/src/parsedPaper/assess/TreeAssessor.js +0 -184
  550. package/src/parsedPaper/assess/assessmentListFactories.js +0 -73
  551. package/src/parsedPaper/assess/assessments/Assessment.js +0 -79
  552. package/src/parsedPaper/assess/assessments/index.js +0 -6
  553. package/src/parsedPaper/assess/assessorFactories.js +0 -104
  554. package/src/parsedPaper/assess/cornerstone/assessmentListFactories.js +0 -47
  555. package/src/parsedPaper/assess/cornerstone/index.js +0 -5
  556. package/src/parsedPaper/assess/index.js +0 -20
  557. package/src/parsedPaper/build/PaperParser.js +0 -105
  558. package/src/parsedPaper/build/linguisticParsing/Sentence.js +0 -89
  559. package/src/parsedPaper/build/linguisticParsing/SentenceTokenizer.js +0 -323
  560. package/src/parsedPaper/build/linguisticParsing/parseText.js +0 -20
  561. package/src/parsedPaper/build/tree/TreeBuilder.js +0 -75
  562. package/src/parsedPaper/build/tree/cleanup/calculateTextIndices.js +0 -190
  563. package/src/parsedPaper/build/tree/cleanup/getElementContent.js +0 -21
  564. package/src/parsedPaper/build/tree/cleanup/postParsing.js +0 -37
  565. package/src/parsedPaper/build/tree/html/HTMLTreeConverter.js +0 -230
  566. package/src/parsedPaper/build/tree/html/buildTree.js +0 -31
  567. package/src/parsedPaper/build/tree/html/htmlConstants.js +0 -37
  568. package/src/parsedPaper/build/tree/index.js +0 -14
  569. package/src/parsedPaper/build/tree/metadata/buildTree.js +0 -32
  570. package/src/parsedPaper/research/TreeResearcher.js +0 -134
  571. package/src/parsedPaper/research/index.js +0 -13
  572. package/src/parsedPaper/research/researches/Headings.js +0 -20
  573. package/src/parsedPaper/research/researches/LinkStatistics.js +0 -128
  574. package/src/parsedPaper/research/researches/Research.js +0 -50
  575. package/src/parsedPaper/research/researches/index.js +0 -1
  576. package/src/parsedPaper/structure/tree/FormattingElement.js +0 -67
  577. package/src/parsedPaper/structure/tree/SourceCodeLocation.js +0 -31
  578. package/src/parsedPaper/structure/tree/TextContainer.js +0 -85
  579. package/src/parsedPaper/structure/tree/index.js +0 -22
  580. package/src/parsedPaper/structure/tree/nodes/Heading.js +0 -26
  581. package/src/parsedPaper/structure/tree/nodes/LeafNode.js +0 -75
  582. package/src/parsedPaper/structure/tree/nodes/List.js +0 -47
  583. package/src/parsedPaper/structure/tree/nodes/ListItem.js +0 -26
  584. package/src/parsedPaper/structure/tree/nodes/MetadataMiscellaneous.js +0 -46
  585. package/src/parsedPaper/structure/tree/nodes/MetadataText.js +0 -26
  586. package/src/parsedPaper/structure/tree/nodes/Node.js +0 -154
  587. package/src/parsedPaper/structure/tree/nodes/Paragraph.js +0 -24
  588. package/src/parsedPaper/structure/tree/nodes/StructuredNode.js +0 -52
  589. package/src/parsedPaper/structure/tree/nodes/index.js +0 -21
  590. package/src/scoring/assessments/assessment.js +0 -63
  591. package/src/scoring/assessments/index.js +0 -58
  592. package/src/scoring/assessments/readability/ParagraphTooLongAssessment.js +0 -173
  593. package/src/scoring/assessments/readability/SentenceBeginningsAssessment.js +0 -132
  594. package/src/scoring/assessments/readability/SentenceLengthInTextAssessment.js +0 -186
  595. package/src/scoring/assessments/readability/TransitionWordsAssessment.js +0 -168
  596. package/src/scoring/assessments/seo/ImageCountAssessment.js +0 -112
  597. package/src/scoring/assessments/seo/InternalLinksAssessment.js +0 -114
  598. package/src/scoring/assessments/seo/IntroductionKeywordAssessment.js +0 -110
  599. package/src/scoring/assessments/seo/KeyphraseAssessment.js +0 -104
  600. package/src/scoring/assessments/seo/KeyphraseLengthAssessment.js +0 -110
  601. package/src/scoring/assessments/seo/KeywordDensityAssessment.js +0 -116
  602. package/src/scoring/assessments/seo/MetaDescriptionKeywordAssessment.js +0 -114
  603. package/src/scoring/assessments/seo/MetaDescriptionLengthAssessment.js +0 -112
  604. package/src/scoring/assessments/seo/MetaTitleKeywordAssessment.js +0 -111
  605. package/src/scoring/assessments/seo/NumberInMetaTitleAssessment.js +0 -107
  606. package/src/scoring/assessments/seo/OutboundLinksAssessment.js +0 -111
  607. package/src/scoring/assessments/seo/PageTitleWidthAssessment.js +0 -104
  608. package/src/scoring/assessments/seo/SingleH1Assessment.js +0 -118
  609. package/src/scoring/assessments/seo/SingleTitleAssessment.js +0 -108
  610. package/src/scoring/assessments/seo/SubHeadingsKeywordAssessment.js +0 -107
  611. package/src/scoring/assessments/seo/TextImagesAssessment.js +0 -144
  612. package/src/scoring/assessments/seo/TextLengthAssessment.js +0 -100
  613. package/src/scoring/assessments/seo/UrlKeywordAssessment.js +0 -111
  614. package/src/scoring/assessments/seo/UrlLengthAssessment.js +0 -103
  615. package/src/scoring/assessors/assessor.js +0 -269
  616. package/src/scoring/assessors/avadaAssessor.js +0 -67
  617. package/src/scoring/assessors/contentAssessor.js +0 -159
  618. package/src/scoring/assessors/index.js +0 -4
  619. package/src/scoring/assessors/seoAssessor.js +0 -57
  620. package/src/scoring/helpers/assessments/checkForTooLongSentences.js +0 -13
  621. package/src/scoring/helpers/assessments/inRange.js +0 -49
  622. package/src/scoring/helpers/assessments/keyphraseLengthFactor.js +0 -10
  623. package/src/scoring/helpers/assessments/recommendedKeywordCount.js +0 -43
  624. package/src/scoring/helpers/index.js +0 -74
  625. package/src/scoring/interpreters/index.js +0 -5
  626. package/src/scoring/interpreters/scoreToRating.js +0 -31
  627. package/src/scoring/renderers/AssessorPresenter.js +0 -360
  628. package/src/scoring/scoreAggregators/ReadabilityScoreAggregator.js +0 -203
  629. package/src/scoring/scoreAggregators/SEOScoreAggregator.js +0 -54
  630. package/src/scoring/scoreAggregators/ScoreAggregator.js +0 -23
  631. package/src/scoring/scoreAggregators/index.js +0 -3
  632. package/src/values/AssessmentResult.js +0 -496
  633. package/src/values/Mark.js +0 -271
  634. package/src/values/Paper.js +0 -425
  635. package/src/values/index.js +0 -9
  636. package/src/vendor/turkishStemmer.js +0 -3435
  637. package/tsconfig.json +0 -15
@@ -1,34 +0,0 @@
1
- /** @module config/twoPartTransitionWords */
2
-
3
- /**
4
- * Returns an array with two-part transition words to be used by the assessments.
5
- * @returns {Array} The array filled with two-part transition words.
6
- */
7
- export default [ [ "nemcsak", "hanem", "is" ], [ "ahogy", "akkor" ], [ "ahogy", "azonnal" ], [ "ahogy", "azután" ],
8
- [ "ahogy", "máris" ], [ "ahogy", "nyomban" ], [ "ahogy", "tüstént" ], [ "akkor", "amikor" ], [ "akkor", "ha" ],
9
- [ "akkor", "hogy" ], [ "akkor", "hogyha" ], [ "akkor", "mikor" ], [ "akkorra", "amikorra" ],
10
- [ "akkorra", "mikorra" ], [ "akkorra", "mire" ], [ "akkortól", "amikor" ], [ "akkortól", "mikor" ],
11
- [ "alighogy", "máris" ], [ "alighogy", "nyomban" ], [ "alighogy", "tüstént" ], [ "addig", "ameddig" ],
12
- [ "ameddig", "addig" ], [ "abba", "hogy" ], [ "abban", "hogy" ], [ "abból", "hogy" ], [ "addig", "amíg" ],
13
- [ "addig", "hogy" ], [ "addig", "míg" ], [ "afelé", "hogy" ], [ "ahelyett", "hogy" ], [ "ahhoz", "hogy" ],
14
- [ "akként", "hogy" ], [ "akkorra", "hogy" ], [ "amiatt", "hogy" ], [ "amellett", "hogy" ], [ "anélkül", "hogy" ],
15
- [ "annyi", "hogy" ], [ "annyi", "mint" ], [ "annyira", "hogy" ], [ "annyira", "mint" ], [ "arra", "hogy" ],
16
- [ "arról", "hogy" ], [ "attól fogva", "hogy" ], [ "attól", "hogy" ], [ "avégett", "hogy" ], [ "avégre", "hogy" ],
17
- [ "az ellen", "hogy" ], [ "az iránt", "hogy" ], [ "azelőtt", "hogy" ], [ "azért", "hogy" ], [ "azon", "hogy" ],
18
- [ "azonkívül", "hogy" ], [ "azóta", "hogy" ], [ "azután", "hogy" ], [ "azzal", "hogy" ], [ "hol", "hol" ],
19
- [ "igaz", "hogy" ], [ "mind", "mind" ], [ "nem úgy", "mint" ], [ "oly módon", "hogy" ], [ "inkább", "semhogy" ],
20
- [ "úgy", "hogy" ], [ "úgy", "mint" ], [ "vagy", "vagy" ], [ "se", "se" ], [ "sem", "sem" ], [ "is", "is" ],
21
- [ "akár", "akár" ], [ "is", "meg" ], [ "nem", "hanem" ], [ "egyrészt", "másrészt" ], [ "minél", "annál" ],
22
- [ "amíg", "addig" ], [ "amíg", "addigra" ], [ "amikor", "akkor" ], [ "akkor", "amikor" ], [ "amikor", "aközben" ],
23
- [ "amikor", "azalatt" ], [ "addigra", "amikorra" ], [ "amikorra", "addigra" ], [ "amikorra", "akkorra" ],
24
- [ "amint", "akkor" ], [ "amint", "azonnal" ], [ "amint", "máris" ], [ "amint", "nyomban" ], [ "amint", "tüstént" ],
25
- [ "amióta", "attól kezdve" ], [ "azóta", "amióta" ], [ "amióta", "azóta" ], [ "amire", "addig" ],
26
- [ "amire", "addigra" ], [ "azóta", "hogy" ], [ "ha", "akkor" ], [ "hogyha", "akkor" ], [ "is", "is" ],
27
- [ "azalatt", "mialatt" ], [ "mialatt", "azalatt" ], [ "mielőtt", "azelőtt" ],
28
- [ "azelőtt", "mielőtt" ], [ "mihelyt", "azonnal" ], [ "mihelyt", "máris" ], [ "mihelyt", "nyomban" ],
29
- [ "mihelyt", "tüstént" ], [ "mikor", "akkor" ], [ "mikor", "aközben" ], [ "mikor", "azalatt" ],
30
- [ "mikor", "azután" ], [ "mikorra", "addigra" ], [ "akkorra", "mikorra" ], [ "mikorra", "akkorra" ],
31
- [ "miközben", "azalatt" ], [ "mióta", "attól kezdve" ], [ "mire", "addigra" ], [ "miután", "azután" ],
32
- [ "attól kezdve", "mióta" ], [ "mióta", "azóta" ], [ "azóta", "mióta" ], [ "mire", "addig" ], [ "addigra", "mire" ],
33
- [ "azután", "miután" ], [ "nemcsak", "hanem" ], [ "sem", "sem" ], [ "vagy", "vagy" ] ];
34
-
@@ -1,25 +0,0 @@
1
- import {languageProcessing} from '../../../index';
2
- const {getClausesSplitOnStopWords, createRegexFromArray} = languageProcessing;
3
-
4
- import HungarianClause from '../values/Clause';
5
- import auxiliaries from '../config/internal/auxiliaries.js';
6
- import stopWords from '../config/stopWords.js';
7
-
8
- const options = {
9
- Clause: HungarianClause,
10
- regexes: {
11
- auxiliaryRegex: createRegexFromArray(auxiliaries.allAuxiliaries),
12
- stopwordRegex: createRegexFromArray(stopWords)
13
- }
14
- };
15
-
16
- /**
17
- * Gets the clauses from a sentence by determining sentence breakers.
18
- *
19
- * @param {string} sentence The sentence to split up in clauses.
20
- *
21
- * @returns {Array} The array with all clauses that have an auxiliary.
22
- */
23
- export default function getHungarianClauses(sentence) {
24
- return getClausesSplitOnStopWords(sentence, options);
25
- }
@@ -1,22 +0,0 @@
1
- import {get} from 'lodash';
2
- import {languageProcessing} from '../../../index';
3
- const {baseStemmer} = languageProcessing;
4
-
5
- import stem from './internal/stem';
6
-
7
- /**
8
- * Returns the stemmer for a researcher.
9
- *
10
- * @param {Researcher} researcher The researcher.
11
- *
12
- * @returns {Function} The stemmer.
13
- */
14
- export default function getStemmer(researcher) {
15
- const morphologyData = get(researcher.getData('morphology'), 'hu', false);
16
-
17
- if (morphologyData) {
18
- return word => stem(word, morphologyData);
19
- }
20
-
21
- return baseStemmer;
22
- }
@@ -1,21 +0,0 @@
1
- import {languageProcessing} from '../../../index';
2
- const {getWords} = languageProcessing;
3
-
4
- import participlesInReAndRa from '../../config/internal/participles.js';
5
-
6
- /**
7
- * Creates an array of participles found in a clause.
8
- *
9
- * @param {string} clauseText The clause to find participles in.
10
- *
11
- * @returns {Array} The array with the participles.
12
- */
13
- export default function(clauseText) {
14
- const words = getWords(clauseText);
15
-
16
- const participleEndingsRegex = new RegExp('(ve|va|ódni|ődni)$');
17
-
18
- return words.filter(
19
- word => participleEndingsRegex.test(word) || participlesInReAndRa.includes(word)
20
- );
21
- }
@@ -1,389 +0,0 @@
1
- /*
2
- * Copyright (c) 2001, Dr Martin Porter,
3
- * Copyright (c) 2002, Richard Boulton.
4
- *
5
- * All rights reserved.
6
- * Redistribution and use in source and binary forms, with or without modification, are permitted provided
7
- * that the following conditions are met:
8
- * 1. Redistributions of source code must retain the above copyright notice, this list of conditions and the following disclaimer.
9
- * 2. Redistributions in binary form must reproduce the above copyright notice, this list of conditions and the following disclaimer
10
- * in the documentation and/or other materials provided with the distribution.
11
- * 3. Neither the name of the copyright holder nor the names of its contributors may be used to endorse or promote products
12
- * derived from this software without specific prior written permission.
13
- *
14
- * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES,
15
- * INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
16
- * IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY,
17
- * OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
18
- * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
19
- * STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE,
20
- * EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
21
- */
22
-
23
- /**
24
- * Finds the position of the first match of the Hungarian vowel pattern in a word.
25
- *
26
- * @param {Object} morphologyData The Hungarian morphology data.
27
- * @param {string} word The word to check
28
- * @returns {number} The index of the first match of the vowel pattern in the word, or -1 if there is no match.
29
- */
30
- const isVowel = function( morphologyData, word ) {
31
- const vowels = morphologyData.externalStemmer.vowels;
32
- const regex = new RegExp( vowels );
33
- return word.search( regex );
34
- };
35
-
36
- /**
37
- * Defines consonants or digraphs position.
38
- *
39
- * @param {Object} morphologyData Morphology data file
40
- * @param {string} word The word to check
41
- * @returns {number} the position of the digraph or consonant
42
- */
43
- const consonantOrDigraphPosition = function( morphologyData, word ) {
44
- const digraphRegex = new RegExp( morphologyData.externalStemmer.digraphs );
45
- const consonantRegex = new RegExp( morphologyData.externalStemmer.consonants );
46
- const digraphPosition = word.search( digraphRegex );
47
- const consonantPosition = word.search( consonantRegex );
48
- if ( digraphPosition === consonantPosition ) {
49
- return digraphPosition + 1;
50
- }
51
- return consonantPosition;
52
- };
53
-
54
- /**
55
- * Defines the R1 region: Checks if the word begins with a vowel: defines R1 as the region after the first consonant or digraph
56
- * Checks if the word begins with a consonant: defines R1 as the region after the first vowel
57
- *
58
- * @param {Object} morphologyData The Morphology data file
59
- * @param {string} word The word to stem
60
- * @returns {number} The R1 region index.
61
- */
62
- const findR1Position = function( morphologyData, word ) {
63
- const vowelPosition = isVowel( morphologyData, word );
64
- if ( vowelPosition === 0 ) {
65
- const consonantOrDigraph = consonantOrDigraphPosition( morphologyData, word );
66
- return ( consonantOrDigraph + 1 );
67
- }
68
- return ( vowelPosition + 1 );
69
- };
70
-
71
- /**
72
- * Searches for one of the following noun case suffixes: al, el and stems the suffix if found in R1 and preceded by a double consonant
73
- * and removes one of the double consonants
74
- *
75
- * @param {string} word The word to stem
76
- * @param {Object} morphologyData The morphology data file with suffix list
77
- *
78
- * @returns {string} The stemmed word.
79
- *
80
- */
81
- const stemSuffixes1 = function( word, morphologyData ) {
82
- if ( word.length < 3 ) {
83
- return word;
84
- }
85
- const r1Position = findR1Position( morphologyData, word );
86
- const suffix = word.search( new RegExp( morphologyData.externalStemmer.suffixes1 ) );
87
- if ( suffix >= r1Position ) {
88
- let wordAfterStemming = word.slice( 0, -2 );
89
-
90
- const doubleConsonantRegex = new RegExp( morphologyData.externalStemmer.doubleConsonants );
91
- const checkIfWordEndsOnDoubleConsonant = wordAfterStemming.search( doubleConsonantRegex );
92
- if ( checkIfWordEndsOnDoubleConsonant !== -1 ) {
93
- wordAfterStemming = wordAfterStemming.slice( 0, -1 );
94
- }
95
-
96
- const tripleConsonantsRegex = new RegExp( morphologyData.externalStemmer.tripleDoubleConsonants );
97
- const checkIfWordEndsOnTripleDoubleConsonant = wordAfterStemming.search( tripleConsonantsRegex );
98
- if ( checkIfWordEndsOnTripleDoubleConsonant !== -1 ) {
99
- wordAfterStemming = wordAfterStemming.slice( 0, -2 ) + wordAfterStemming.charAt( wordAfterStemming.length - 1 );
100
- }
101
-
102
- if ( wordAfterStemming.length !== word.slice( 0, -2 ).length ) {
103
- return wordAfterStemming;
104
- }
105
- }
106
- return word;
107
- };
108
-
109
- /**
110
- * Searches for the longer of the following suffixes: ban ben ba be ra re nak nek val vel tól tõl
111
- * ról rõl ból bõl hoz hez höz nál nél ig at et ot öt ért képp képpen kor ul ül
112
- * vá vé onként enként anként ként en on an ön n t and stems the suffix if found in R1
113
- * If the suffix is preceded by á replaces with a. If the suffix is preceded by é replaces with e
114
- *
115
- * @param {string} word The word to stem
116
- * @param {string} suffixes2 The suffixes from group 2
117
- * @param {Object} morphologyData The Morphology data file
118
- *
119
- * @returns {string} The stemmed word
120
- */
121
- const stemSuffixes2 = function( word, suffixes2, morphologyData ) {
122
- if ( word.length < 3 ) {
123
- return word;
124
- }
125
- const r1Position = findR1Position( morphologyData, word );
126
- const suffix2 = word.search( new RegExp( suffixes2 ) );
127
- if ( suffix2 >= r1Position ) {
128
- const wordAfterStemming = word.substring( 0, suffix2 );
129
- if ( wordAfterStemming.endsWith( "á" ) ) {
130
- return wordAfterStemming.replace( /á$/i, "a" );
131
- }
132
- if ( wordAfterStemming.endsWith( "é" ) ) {
133
- return wordAfterStemming.replace( /é$/i, "e" );
134
- }
135
- return wordAfterStemming;
136
- }
137
- return word;
138
- };
139
-
140
/**
 * Replaces a group 3 suffix (described upstream as án and ánként) with "a".
 *
 * The first match of the supplied pattern is located in the word; when that match starts at or after the
 * R1 position, everything from the match onwards is replaced by "a". Words shorter than three characters
 * are returned unchanged.
 *
 * NOTE(review): the previous description also promised that én is replaced with "e", but this function
 * always appends "a". Confirm whether the suffixes3 pattern is expected to cover én.
 *
 * @param {string} word           The word to check for the suffix.
 * @param {string} suffixes3      The regex source describing the suffixes to look for.
 * @param {Object} morphologyData The Morphology data file.
 *
 * @returns {string} The word with the suffix replaced, or the original word.
 */
const stemSuffixes3 = function( word, suffixes3, morphologyData ) {
	if ( word.length < 3 ) {
		return word;
	}

	const r1Start = findR1Position( morphologyData, word );
	const matchIndex = word.search( new RegExp( suffixes3 ) );

	return matchIndex >= r1Start ? word.substring( 0, matchIndex ) + "a" : word;
};
162
-
163
/**
 * Removes a group 4 suffix (described upstream as astul, estül, stul and stül) from the word.
 *
 * The word is cut at the first match of the supplied pattern, provided that match starts at or after the
 * R1 position. Words shorter than three characters are returned unchanged.
 *
 * @param {string} word           The word to check for the suffix.
 * @param {string} suffixes4      The regex source describing the suffixes to look for.
 * @param {Object} morphologyData The Morphology data file.
 *
 * @returns {string} The word without the suffix, or the original word.
 */
const stemSuffixes4 = function( word, suffixes4, morphologyData ) {
	if ( word.length < 3 ) {
		return word;
	}

	const r1Start = findR1Position( morphologyData, word );
	const suffixPattern = new RegExp( suffixes4 );
	const matchIndex = word.search( suffixPattern );

	return matchIndex >= r1Start ? word.substring( 0, matchIndex ) : word;
};
183
-
184
/**
 * Removes a one-letter group 5 suffix (described upstream as á and é) and undoubles a preceding double consonant.
 *
 * When the supplied pattern matches at or after the R1 position, the last character of the word is dropped.
 * If the remainder matches the doubleConsonants pattern from the morphology data, one more character is dropped.
 * Words shorter than three characters are returned unchanged.
 *
 * The second parameter keeps its historical name; the stem function passes the suffixes5 data into it.
 *
 * @param {string} word           The word to check for the suffix.
 * @param {string} suffixes6      The regex source describing the suffixes to look for.
 * @param {Object} morphologyData The Morphology data file.
 *
 * @returns {string} The word without the suffix, or the original word.
 */
const stemSuffixes5 = function( word, suffixes6, morphologyData ) {
	if ( word.length < 3 ) {
		return word;
	}

	const r1Start = findR1Position( morphologyData, word );
	const matchIndex = word.search( new RegExp( suffixes6 ) );

	if ( matchIndex >= r1Start ) {
		// The suffix is a single letter, so dropping the final character removes it.
		const withoutSuffix = word.slice( 0, -1 );
		const doubleConsonantPattern = new RegExp( morphologyData.externalStemmer.doubleConsonants );

		return doubleConsonantPattern.test( withoutSuffix ) ? withoutSuffix.slice( 0, -1 ) : withoutSuffix;
	}

	return word;
};
211
-
212
/**
 * Removes a group 6 suffix (described upstream as oké, öké, aké, eké, ké, éi and é) from the word.
 *
 * The word is cut at the first match of the supplied pattern, provided that match starts at or after the
 * R1 position. Words shorter than three characters are returned unchanged.
 *
 * @param {string} word           The word to check for the suffix.
 * @param {string} suffixes6      The regex source describing the suffixes to look for.
 * @param {Object} morphologyData The Morphology data file.
 *
 * @returns {string} The word without the suffix, or the original word.
 */
const stemSuffixes6 = function( word, suffixes6, morphologyData ) {
	if ( word.length < 3 ) {
		return word;
	}

	const r1Start = findR1Position( morphologyData, word );
	const matchIndex = word.search( new RegExp( suffixes6 ) );
	const suffixIsInR1 = matchIndex >= r1Start;

	return suffixIsInR1 ? word.substring( 0, matchIndex ) : word;
};
232
-
233
-
234
/**
 * Removes a group 7 suffix from the word. Upstream lists these as ünk, unk, nk, juk, jük, uk, ük, em, om, am,
 * m, od, ed, ad, öd, d, ja, je, a, e and o.
 *
 * The word is cut at the first match of the supplied pattern, provided that match starts at or after the
 * R1 position. Words shorter than three characters are returned unchanged.
 *
 * @param {string} word           The word to check for the suffix.
 * @param {string} suffixes7      The regex source describing the suffixes to look for.
 * @param {Object} morphologyData The Morphology data file.
 *
 * @returns {string} The word without the suffix, or the original word.
 */
const stemSuffixes7 = function( word, suffixes7, morphologyData ) {
	if ( word.length < 3 ) {
		return word;
	}

	const r1Start = findR1Position( morphologyData, word );
	const suffixPattern = new RegExp( suffixes7 );
	const matchIndex = word.search( suffixPattern );

	let result = word;
	if ( matchIndex >= r1Start ) {
		result = word.substring( 0, matchIndex );
	}
	return result;
};
253
-
254
/**
 * Removes a group 8 suffix from the word. Upstream lists these as jaim, jeim, aim, eim, im, jaid, jeid, aid, eid,
 * id, jai, jei, ai, ei, i, jaink, jeink, eink, aink, ink, jaitok, jeitek, aitok, eitek, itek, jeik, jaik, aik,
 * eik and ik.
 *
 * The word is cut at the first match of the supplied pattern, provided that match starts at or after the
 * R1 position. Words shorter than three characters are returned unchanged.
 *
 * @param {string} word           The word to check.
 * @param {string} suffixes8      The regex source describing the suffixes to look for.
 * @param {Object} morphologyData The Morphology data file.
 *
 * @returns {string} The stemmed word, or the original word.
 */
const stemSuffixes8 = function( word, suffixes8, morphologyData ) {
	if ( word.length < 3 ) {
		return word;
	}

	const r1Start = findR1Position( morphologyData, word );
	const matchIndex = word.search( new RegExp( suffixes8 ) );

	return matchIndex >= r1Start ? word.substring( 0, matchIndex ) : word;
};
274
-
275
/**
 * Replaces a group 9 suffix with its short vowel.
 *
 * The suffixes9a pattern (described upstream as ánk, ájuk, ám, ád and á) is tried first and replaced by "a".
 * Only if it does not apply is the suffixes9b pattern (énk, éjük, ém, éd and é) tried and replaced by "e".
 * A pattern applies when its first match starts at or after the R1 position. Words shorter than three
 * characters are returned unchanged.
 *
 * @param {string} word           The word to check for the suffix.
 * @param {Object} suffixes9      Object holding the suffixes9a and suffixes9b regex sources.
 * @param {Object} morphologyData The Morphology data file.
 *
 * @returns {string} The word with the suffix replaced, or the original word.
 */
const stemSuffixes9 = function( word, suffixes9, morphologyData ) {
	if ( word.length < 3 ) {
		return word;
	}

	const r1Start = findR1Position( morphologyData, word );

	// Ordered list of pattern key and replacement vowel; the first applicable entry wins.
	const replacements = [
		[ "suffixes9a", "a" ],
		[ "suffixes9b", "e" ],
	];
	for ( const [ patternKey, vowel ] of replacements ) {
		const matchIndex = word.search( new RegExp( suffixes9[ patternKey ] ) );
		if ( matchIndex >= r1Start ) {
			return word.substring( 0, matchIndex ) + vowel;
		}
	}

	return word;
};
300
-
301
/**
 * Replaces a group 10 suffix (described upstream as áim, áid, ái, áink, áitok and áik) with "a".
 *
 * The first match of the supplied pattern is located in the word; when that match starts at or after the
 * R1 position, everything from the match onwards is replaced by "a". Words shorter than three characters
 * are returned unchanged.
 *
 * NOTE(review): the previous description also promised that éim, éid, éi, éink, éitek and éik are replaced
 * with "e", but this function always appends "a". Confirm against the suffixes10 pattern.
 *
 * @param {string} word           The word to check.
 * @param {string} suffixes10     The regex source describing the suffixes to look for.
 * @param {Object} morphologyData The Morphology data file.
 *
 * @returns {string} The stemmed word, or the original word.
 */
const stemSuffixes10 = function( word, suffixes10, morphologyData ) {
	if ( word.length < 3 ) {
		return word;
	}

	const r1Start = findR1Position( morphologyData, word );
	const suffixPattern = new RegExp( suffixes10 );
	const matchIndex = word.search( suffixPattern );

	return matchIndex >= r1Start ? word.substring( 0, matchIndex ) + "a" : word;
};
321
-
322
/**
 * Replaces the group 11 suffixes (described upstream as ák and ék) with "a" and "e" respectively.
 *
 * The suffixes11a pattern is tried first, then suffixes11b. A pattern applies when its first match starts at
 * or after the R1 position; the last two characters of the word are then swapped for the short vowel.
 * Words shorter than three characters are returned unchanged.
 *
 * @param {string} word           The word to check.
 * @param {Object} suffixes11     Object holding the suffixes11a and suffixes11b regex sources.
 * @param {Object} morphologyData The Morphology data file.
 *
 * @returns {string} The stemmed word, or the original word.
 */
const stemSuffixes11 = function( word, suffixes11, morphologyData ) {
	if ( word.length < 3 ) {
		return word;
	}

	const r1Start = findR1Position( morphologyData, word );

	// Ordered list of pattern key and replacement vowel; the first applicable entry wins.
	const replacements = [
		[ "suffixes11a", "a" ],
		[ "suffixes11b", "e" ],
	];
	for ( const [ patternKey, vowel ] of replacements ) {
		const matchIndex = word.search( new RegExp( suffixes11[ patternKey ] ) );
		if ( matchIndex >= r1Start ) {
			// Both suffixes are two letters long, so the final two characters are dropped.
			return word.slice( 0, -2 ) + vowel;
		}
	}

	return word;
};
346
-
347
/**
 * Removes a group 12 suffix (described upstream as ök, ok, ek, ak and k) from the word.
 *
 * The word is cut at the first match of the supplied pattern, provided that match starts at or after the
 * R1 position. Words shorter than three characters are returned unchanged.
 *
 * @param {string} word           The word to check.
 * @param {string} suffixes12     The regex source describing the suffixes to look for.
 * @param {Object} morphologyData The Morphology data file.
 *
 * @returns {string} The stemmed word, or the original word.
 */
const stemSuffixes12 = function( word, suffixes12, morphologyData ) {
	if ( word.length < 3 ) {
		return word;
	}

	const r1Start = findR1Position( morphologyData, word );
	const matchIndex = word.search( new RegExp( suffixes12 ) );

	if ( matchIndex >= r1Start ) {
		const stemmed = word.substring( 0, matchIndex );
		return stemmed;
	}
	return word;
};
366
-
367
/**
 * Stems Hungarian words by running the word through the suffix steps 1 to 12 in order.
 *
 * Each step receives the output of the previous one. Step 1 only takes the morphology data; every later step
 * additionally receives its own entry from morphologyData.externalStemmer.
 *
 * @param {string} word           The word to stem.
 * @param {Object} morphologyData The Hungarian morphology data.
 *
 * @returns {string} The stemmed word.
 */
export default function stem( word, morphologyData ) {
	let stemmed = stemSuffixes1( word, morphologyData );

	// Each entry pairs a stemming step with the key of the suffix data it needs.
	const steps = [
		[ stemSuffixes2, "suffixes2" ],
		[ stemSuffixes3, "suffixes3" ],
		[ stemSuffixes4, "suffixes4" ],
		[ stemSuffixes5, "suffixes5" ],
		[ stemSuffixes6, "suffixes6" ],
		[ stemSuffixes7, "suffixes7" ],
		[ stemSuffixes8, "suffixes8" ],
		[ stemSuffixes9, "suffixes9" ],
		[ stemSuffixes10, "suffixes10" ],
		[ stemSuffixes11, "suffixes11" ],
		[ stemSuffixes12, "suffixes12" ],
	];

	for ( const [ runStep, dataKey ] of steps ) {
		stemmed = runStep( stemmed, morphologyData.externalStemmer[ dataKey ], morphologyData );
	}

	return stemmed;
}
@@ -1,54 +0,0 @@
1
- import {languageProcessing} from '../../../index';
2
- const {getWords} = languageProcessing;
3
-
4
- import passiveVerbs from '../config/internal/odikVerbs';
5
- import {
6
- verbPrefixes,
7
- odikSuffixes1,
8
- odikSuffixes2
9
- } from '../config/internal/morphologicalPassiveAffixes';
10
-
11
/**
 * Checks if the input word's root is in the Hungarian verb roots list.
 *
 * A word qualifies when it ends in one of the root + suffix combinations and the part in front of that
 * combination is either empty or exactly one of the given prefixes.
 *
 * @param {string}   word          The word to check.
 * @param {string[]} verbRootsList The Hungarian verb roots list.
 * @param {string[]} prefixes      The list of prefixes.
 * @param {string[]} suffixes      The list of suffixes.
 *
 * @returns {Boolean} Returns true if the root of the input word is in the list.
 */
const checkHungarianPassive = function(word, verbRootsList, prefixes, suffixes) {
  return verbRootsList.some(root =>
    suffixes.some(suffix => {
      const rootAndSuffix = root + suffix;

      // Only words that end in this root + suffix combination can qualify.
      if (!word.endsWith(rootAndSuffix)) {
        return false;
      }

      // Cut from the end of the word: the combination is known to be the ending, and searching for its
      // first occurrence would give the wrong prefix when the same letters also appear earlier in the word.
      const beforeRoot = word.slice(0, word.length - rootAndSuffix.length);

      // Word is passive if nothing precedes the root or the root is preceded by a valid prefix.
      return beforeRoot === '' || prefixes.includes(beforeRoot);
    })
  );
};
36
-
37
/**
 * Determines whether a sentence contains a Hungarian morphological passive verb form.
 *
 * Every word of the sentence is checked against two sets of verb stems, each paired with its own suffix list;
 * both sets share the same verb prefixes.
 *
 * @param {string} sentence The sentence to match against.
 *
 * @returns {Boolean} Whether the sentence contains Hungarian passive voice.
 */
export default function isPassiveSentence(sentence) {
  const sentenceWords = getWords(sentence);

  // Each stem list is only valid in combination with its matching suffix list.
  const stemAndSuffixSets = [
    [passiveVerbs.odikVerbStems1, odikSuffixes1],
    [passiveVerbs.odikVerbStems2, odikSuffixes2]
  ];

  return sentenceWords.some(candidate =>
    stemAndSuffixSets.some(([stems, suffixes]) =>
      checkHungarianPassive(candidate, stems, verbPrefixes, suffixes)
    )
  );
}
@@ -1,41 +0,0 @@
1
- import {languageProcessing} from '../../../index';
2
- const {values} = languageProcessing;
3
- const {Clause} = values;
4
-
5
- import getParticiples from '../helpers/internal/getParticiples';
6
- import nonPassivesInVaAndVe from '../config/internal/nonPassivesInVaAndVe';
7
-
8
/**
 * Clause implementation used for Hungarian passive voice detection.
 */
class HungarianClause extends Clause {
  /**
   * Builds the clause, collects its participles and determines whether it is passive.
   *
   * @param {string} clauseText  The text of the clause.
   * @param {Array}  auxiliaries The auxiliaries.
   *
   * @constructor
   */
  constructor(clauseText, auxiliaries) {
    super(clauseText, auxiliaries);

    const text = this.getClauseText();
    this._participles = getParticiples(text);
    this.checkParticiples();
  }

  /**
   * Marks the clause as passive when at least one of its participles is not listed among the
   * non-passive exceptions; otherwise marks it as not passive.
   *
   * @returns {void}
   */
  checkParticiples() {
    const isException = participle => nonPassivesInVaAndVe.includes(participle);
    const hasPassiveParticiple = this.getParticiples().some(participle => !isException(participle));

    this.setPassive(hasPassiveParticiple);
  }
}
40
-
41
- export default HungarianClause;
@@ -1,46 +0,0 @@
1
- import {languageProcessing} from '../../../index';
2
- const {AbstractResearcher} = languageProcessing;
3
-
4
- // All config
5
- import firstWordExceptions from './config/firstWordExceptions';
6
- import {all as functionWords} from './config/functionWords';
7
- import transitionWords from './config/transitionWords';
8
- import twoPartTransitionWords from './config/twoPartTransitionWords';
9
-
10
- // All helpers
11
- import getStemmer from './helpers/getStemmer';
12
- import isPassiveSentence from './helpers/isPassiveSentence';
13
- import splitIntoTokensCustom from './helpers/splitIntoTokensCustom';
14
-
15
/**
 * The Indonesian researcher: extends the abstract researcher with Indonesian config and helpers.
 */
export default class Researcher extends AbstractResearcher {
  /**
   * Sets up the researcher for the given paper.
   *
   * @param {Paper} paper The Paper object that is needed within the researches.
   * @constructor
   */
  constructor(paper) {
    super(paper);

    // The Flesch reading score research is not available for Indonesian.
    delete this.defaultResearches.getFleschReadingScore;

    const languageConfig = {
      language: 'id',
      passiveConstructionType: 'morphological',
      firstWordExceptions,
      functionWords,
      transitionWords,
      twoPartTransitionWords,
      areHyphensWordBoundaries: false
    };
    const languageHelpers = {
      getStemmer,
      isPassiveSentence,
      splitIntoTokensCustom
    };

    Object.assign(this.config, languageConfig);
    Object.assign(this.helpers, languageHelpers);
  }
}
@@ -1,13 +0,0 @@
1
- /**
2
- * Returns a list of exceptions for the sentence beginning research.
3
- * @returns {Array} The list of exceptions.
4
- */
5
- export default [
6
- // Indefinite articles:
7
- "sebuah", "seorang", "sang", "si",
8
- // Numbers 1-11, plus hundred, thousand, million, billion and trillion:
9
- "satu", "dua", "tiga", "empat", "lima", "enam", "tujuh", "delapan", "sembilan",
10
- "sepuluh", "sebelas", "seratus", "seribu", "sejuta", "semiliar", "setriliun",
11
- // Demonstrative pronouns and other frequent sentence openers:
12
- "ini", "itu", "hal", "ia",
13
- ];