axyseo 2.0.0-alpha.0.0.4 → 2.0.0-alpha.0.0.6
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/package.json +5 -2
- package/.browserslistrc +0 -1
- package/.gitattributes +0 -1
- package/babel.config.js +0 -3
- package/eslint.config.mjs +0 -119
- package/src/bundledPlugins/index.js +0 -5
- package/src/bundledPlugins/previouslyUsedKeywords.js +0 -192
- package/src/config/diacritics.js +0 -106
- package/src/config/getTransliterations.js +0 -1447
- package/src/config/transliterationsWPstyle.js +0 -774
- package/src/config/wordBoundaries.js +0 -23
- package/src/config/wordBoundariesWithoutPunctuation.js +0 -9
- package/src/const/analysis.js +0 -41
- package/src/errors/invalidType.js +0 -14
- package/src/errors/missingArgument.js +0 -14
- package/src/helpers/createMeasurementElement.js +0 -40
- package/src/helpers/domManipulation.js +0 -65
- package/src/helpers/errors.js +0 -26
- package/src/helpers/factory.js +0 -219
- package/src/helpers/formatNumber.js +0 -12
- package/src/helpers/formatString.js +0 -33
- package/src/helpers/getLanguagesWithWordComplexity.js +0 -8
- package/src/helpers/getLanguagesWithWordFormSupport.js +0 -11
- package/src/helpers/getWordComplexityConfig.js +0 -20
- package/src/helpers/getWordComplexityHelper.js +0 -20
- package/src/helpers/htmlEntities.js +0 -41
- package/src/helpers/includesAny.js +0 -19
- package/src/helpers/index.js +0 -127
- package/src/helpers/shortlinker/Shortlinker.js +0 -75
- package/src/helpers/shortlinker/index.js +0 -1
- package/src/helpers/shortlinker/singleton.js +0 -68
- package/src/helpers/types.js +0 -34
- package/src/index.js +0 -60
- package/src/languageProcessing/AbstractResearcher.js +0 -366
- package/src/languageProcessing/helpers/highlighting/getMarkingsInSentence.js +0 -125
- package/src/languageProcessing/helpers/html/getFieldsToMark.js +0 -29
- package/src/languageProcessing/helpers/html/getSubheadingTexts.js +0 -47
- package/src/languageProcessing/helpers/html/getSubheadings.js +0 -95
- package/src/languageProcessing/helpers/html/html.js +0 -176
- package/src/languageProcessing/helpers/html/htmlParser.js +0 -145
- package/src/languageProcessing/helpers/html/matchParagraphs.js +0 -62
- package/src/languageProcessing/helpers/html/normalizeHTML.js +0 -16
- package/src/languageProcessing/helpers/image/getAltAttribute.js +0 -20
- package/src/languageProcessing/helpers/image/getImagesInTree.js +0 -16
- package/src/languageProcessing/helpers/image/imageInText.js +0 -19
- package/src/languageProcessing/helpers/index.js +0 -12
- package/src/languageProcessing/helpers/language/getLanguage.js +0 -9
- package/src/languageProcessing/helpers/link/checkNofollow.js +0 -38
- package/src/languageProcessing/helpers/link/getAnchorsFromText.js +0 -32
- package/src/languageProcessing/helpers/link/getLinkType.js +0 -32
- package/src/languageProcessing/helpers/match/findKeywordFormsInString.js +0 -101
- package/src/languageProcessing/helpers/match/isDoubleQuoted.js +0 -13
- package/src/languageProcessing/helpers/match/matchTextWithArray.js +0 -36
- package/src/languageProcessing/helpers/match/matchTextWithTransliteration.js +0 -58
- package/src/languageProcessing/helpers/match/matchTextWithWord.js +0 -45
- package/src/languageProcessing/helpers/match/matchWordFormsWithSentence.js +0 -164
- package/src/languageProcessing/helpers/match/processExactMatchRequest.js +0 -20
- package/src/languageProcessing/helpers/morphology/baseStemmer.js +0 -11
- package/src/languageProcessing/helpers/morphology/buildFormRule.js +0 -19
- package/src/languageProcessing/helpers/morphology/buildTopicStems.js +0 -169
- package/src/languageProcessing/helpers/morphology/createRulesFromArrays.js +0 -45
- package/src/languageProcessing/helpers/morphology/exceptionListHelpers.js +0 -65
- package/src/languageProcessing/helpers/morphology/findMatchingEndingInArray.js +0 -24
- package/src/languageProcessing/helpers/morphology/flattenSortLength.js +0 -14
- package/src/languageProcessing/helpers/morphology/getAllWordsFromPaper.js +0 -39
- package/src/languageProcessing/helpers/morphology/regexHelpers.js +0 -44
- package/src/languageProcessing/helpers/morphology/stemHelpers.js +0 -38
- package/src/languageProcessing/helpers/morphology/stemPrefixedFunctionWords.js +0 -31
- package/src/languageProcessing/helpers/passiveVoice/periphrastic/directPrecedenceException.js +0 -36
- package/src/languageProcessing/helpers/passiveVoice/periphrastic/freeAuxiliaryParticipleOrder/getClausesSplitOnStopWords.js +0 -113
- package/src/languageProcessing/helpers/passiveVoice/periphrastic/freeAuxiliaryParticipleOrder/nonDirectParticiplePrecedenceException.js +0 -45
- package/src/languageProcessing/helpers/passiveVoice/periphrastic/getClauses.js +0 -231
- package/src/languageProcessing/helpers/passiveVoice/periphrastic/getIndicesWithRegex.js +0 -20
- package/src/languageProcessing/helpers/passiveVoice/periphrastic/matchRegularParticiples.js +0 -23
- package/src/languageProcessing/helpers/passiveVoice/periphrastic/precedenceException.js +0 -40
- package/src/languageProcessing/helpers/prominentWords/determineProminentWords.js +0 -238
- package/src/languageProcessing/helpers/regex/createRegexFromArray.js +0 -35
- package/src/languageProcessing/helpers/regex/createRegexFromDoubleArray.js +0 -34
- package/src/languageProcessing/helpers/regex/createWordRegex.js +0 -30
- package/src/languageProcessing/helpers/regex/matchStringWithRegex.js +0 -19
- package/src/languageProcessing/helpers/regex/searchAndReplaceWithOneRegex.js +0 -14
- package/src/languageProcessing/helpers/sanitize/doubleQuotes.js +0 -12
- package/src/languageProcessing/helpers/sanitize/filterShortcodesFromTree.js +0 -131
- package/src/languageProcessing/helpers/sanitize/mergeListItems.js +0 -24
- package/src/languageProcessing/helpers/sanitize/parseSynonyms.js +0 -20
- package/src/languageProcessing/helpers/sanitize/quotes.js +0 -46
- package/src/languageProcessing/helpers/sanitize/removeEmailAddresses.js +0 -12
- package/src/languageProcessing/helpers/sanitize/removePunctuation.js +0 -64
- package/src/languageProcessing/helpers/sanitize/removePunctuationExceptQuotes.js +0 -18
- package/src/languageProcessing/helpers/sanitize/removeSentenceTerminators.js +0 -13
- package/src/languageProcessing/helpers/sanitize/removeURLs.js +0 -13
- package/src/languageProcessing/helpers/sanitize/sanitizeLineBreakTag.js +0 -11
- package/src/languageProcessing/helpers/sanitize/sanitizeString.js +0 -18
- package/src/languageProcessing/helpers/sanitize/stripHTMLTags.js +0 -57
- package/src/languageProcessing/helpers/sanitize/stripNonTextTags.js +0 -15
- package/src/languageProcessing/helpers/sanitize/stripNumbers.js +0 -21
- package/src/languageProcessing/helpers/sanitize/stripSpaces.js +0 -23
- package/src/languageProcessing/helpers/sanitize/stripWordBoundaries.js +0 -65
- package/src/languageProcessing/helpers/sanitize/unifyWhitespace.js +0 -61
- package/src/languageProcessing/helpers/sentence/SentenceTokenizer.js +0 -640
- package/src/languageProcessing/helpers/sentence/countSentences.js +0 -20
- package/src/languageProcessing/helpers/sentence/getSentences.js +0 -65
- package/src/languageProcessing/helpers/sentence/getSentencesFromTree.js +0 -55
- package/src/languageProcessing/helpers/sentence/memoizedSentenceTokenizer.js +0 -28
- package/src/languageProcessing/helpers/sentence/sentencesLength.js +0 -31
- package/src/languageProcessing/helpers/syllables/DeviationFragment.js +0 -112
- package/src/languageProcessing/helpers/syllables/countSyllables.js +0 -182
- package/src/languageProcessing/helpers/syllables/syllableCountIterator.js +0 -56
- package/src/languageProcessing/helpers/syllables/syllableCountStep.js +0 -68
- package/src/languageProcessing/helpers/transform/transformWordsWithHyphens.js +0 -17
- package/src/languageProcessing/helpers/transliterate/replaceDiacritics.js +0 -22
- package/src/languageProcessing/helpers/transliterate/specialCharacterMappings.js +0 -214
- package/src/languageProcessing/helpers/transliterate/transliterate.js +0 -20
- package/src/languageProcessing/helpers/transliterate/transliterateWPstyle.js +0 -21
- package/src/languageProcessing/helpers/url/parseSlug.js +0 -10
- package/src/languageProcessing/helpers/url/url.js +0 -172
- package/src/languageProcessing/helpers/word/addWordboundary.js +0 -37
- package/src/languageProcessing/helpers/word/areWordsInSentence.js +0 -16
- package/src/languageProcessing/helpers/word/countMetaDescriptionLength.js +0 -18
- package/src/languageProcessing/helpers/word/countWords.js +0 -14
- package/src/languageProcessing/helpers/word/createPunctuationTokens.js +0 -42
- package/src/languageProcessing/helpers/word/filterWordsFromArray.js +0 -15
- package/src/languageProcessing/helpers/word/followsIndex.js +0 -25
- package/src/languageProcessing/helpers/word/getAllWordsFromTree.js +0 -23
- package/src/languageProcessing/helpers/word/getWords.js +0 -43
- package/src/languageProcessing/helpers/word/includesIndex.js +0 -30
- package/src/languageProcessing/helpers/word/indices.js +0 -146
- package/src/languageProcessing/helpers/word/markWordsInSentences.js +0 -173
- package/src/languageProcessing/helpers/word/matchWordInSentence.js +0 -61
- package/src/languageProcessing/helpers/word/splitIntoTokens.js +0 -46
- package/src/languageProcessing/index.js +0 -91
- package/src/languageProcessing/languages/_default/Researcher.js +0 -34
- package/src/languageProcessing/languages/_default/helpers/getStemmer.js +0 -11
- package/src/languageProcessing/languages/ar/Researcher.js +0 -46
- package/src/languageProcessing/languages/ar/config/firstWordExceptions.js +0 -14
- package/src/languageProcessing/languages/ar/config/functionWords.js +0 -329
- package/src/languageProcessing/languages/ar/config/internal/passiveVerbsWithLongVowel.js +0 -570
- package/src/languageProcessing/languages/ar/config/prefixedFunctionWords.js +0 -5
- package/src/languageProcessing/languages/ar/config/transitionWords.js +0 -19
- package/src/languageProcessing/languages/ar/config/twoPartTransitionWords.js +0 -7
- package/src/languageProcessing/languages/ar/helpers/createBasicWordForms.js +0 -32
- package/src/languageProcessing/languages/ar/helpers/getStemmer.js +0 -22
- package/src/languageProcessing/languages/ar/helpers/internal/stem.js +0 -632
- package/src/languageProcessing/languages/ar/helpers/isPassiveSentence.js +0 -33
- package/src/languageProcessing/languages/ca/Researcher.js +0 -43
- package/src/languageProcessing/languages/ca/config/sentenceLength.js +0 -3
- package/src/languageProcessing/languages/ca/config/transitionWords.js +0 -31
- package/src/languageProcessing/languages/ca/config/twoPartTransitionWords.js +0 -7
- package/src/languageProcessing/languages/ca/helpers/getStemmer.js +0 -11
- package/src/languageProcessing/languages/cs/Researcher.js +0 -44
- package/src/languageProcessing/languages/cs/config/firstWordExceptions.js +0 -15
- package/src/languageProcessing/languages/cs/config/functionWords.js +0 -121
- package/src/languageProcessing/languages/cs/config/internal/passiveVoiceAuxiliaries.js +0 -38
- package/src/languageProcessing/languages/cs/config/internal/passiveVoiceEndings.js +0 -54
- package/src/languageProcessing/languages/cs/config/stopWords.js +0 -42
- package/src/languageProcessing/languages/cs/config/transitionWords.js +0 -26
- package/src/languageProcessing/languages/cs/config/twoPartTransitionWords.js +0 -8
- package/src/languageProcessing/languages/cs/helpers/getClauses.js +0 -26
- package/src/languageProcessing/languages/cs/helpers/getStemmer.js +0 -22
- package/src/languageProcessing/languages/cs/helpers/internal/getParticiples.js +0 -16
- package/src/languageProcessing/languages/cs/helpers/internal/stem.js +0 -499
- package/src/languageProcessing/languages/cs/values/Clause.js +0 -34
- package/src/languageProcessing/languages/de/Researcher.js +0 -52
- package/src/languageProcessing/languages/de/config/firstWordExceptions.js +0 -17
- package/src/languageProcessing/languages/de/config/functionWords.js +0 -303
- package/src/languageProcessing/languages/de/config/internal/exceptionsParticiplesActive.js +0 -2231
- package/src/languageProcessing/languages/de/config/internal/passiveVoiceAuxiliaries.js +0 -96
- package/src/languageProcessing/languages/de/config/internal/passiveVoiceIrregulars.js +0 -368
- package/src/languageProcessing/languages/de/config/internal/passiveVoiceRegex.js +0 -72
- package/src/languageProcessing/languages/de/config/keyphraseLength.js +0 -11
- package/src/languageProcessing/languages/de/config/stopWords.js +0 -67
- package/src/languageProcessing/languages/de/config/syllables.json +0 -460
- package/src/languageProcessing/languages/de/config/transitionWords.js +0 -31
- package/src/languageProcessing/languages/de/config/twoPartTransitionWords.js +0 -12
- package/src/languageProcessing/languages/de/config/wordComplexity.js +0 -4
- package/src/languageProcessing/languages/de/helpers/calculateFleschReadingScore.js +0 -18
- package/src/languageProcessing/languages/de/helpers/checkIfWordIsComplex.js +0 -40
- package/src/languageProcessing/languages/de/helpers/checkIfWordIsFunction.js +0 -15
- package/src/languageProcessing/languages/de/helpers/getClauses.js +0 -25
- package/src/languageProcessing/languages/de/helpers/getStemmer.js +0 -22
- package/src/languageProcessing/languages/de/helpers/internal/SentenceTokenizer.js +0 -31
- package/src/languageProcessing/languages/de/helpers/internal/detectAndStemRegularParticiple.js +0 -128
- package/src/languageProcessing/languages/de/helpers/internal/determineStem.js +0 -128
- package/src/languageProcessing/languages/de/helpers/internal/getParticiples.js +0 -40
- package/src/languageProcessing/languages/de/helpers/internal/stem.js +0 -215
- package/src/languageProcessing/languages/de/helpers/memoizedSentenceTokenizer.js +0 -28
- package/src/languageProcessing/languages/de/values/Clause.js +0 -85
- package/src/languageProcessing/languages/el/Researcher.js +0 -46
- package/src/languageProcessing/languages/el/config/firstWordExceptions.js +0 -47
- package/src/languageProcessing/languages/el/config/functionWords.js +0 -116
- package/src/languageProcessing/languages/el/config/internal/auxiliaries.js +0 -19
- package/src/languageProcessing/languages/el/config/internal/morphologicalPassiveSuffixes.js +0 -87
- package/src/languageProcessing/languages/el/config/internal/nonPassiveVerbStems.js +0 -138
- package/src/languageProcessing/languages/el/config/stopWords.js +0 -854
- package/src/languageProcessing/languages/el/config/transitionWords.js +0 -26
- package/src/languageProcessing/languages/el/config/twoPartTransitionWords.js +0 -10
- package/src/languageProcessing/languages/el/helpers/getClauses.js +0 -25
- package/src/languageProcessing/languages/el/helpers/getStemmer.js +0 -21
- package/src/languageProcessing/languages/el/helpers/internal/getParticiples.js +0 -20
- package/src/languageProcessing/languages/el/helpers/internal/stem.js +0 -368
- package/src/languageProcessing/languages/el/helpers/isPassiveSentence.js +0 -38
- package/src/languageProcessing/languages/el/values/Clause.js +0 -37
- package/src/languageProcessing/languages/en/Researcher.js +0 -46
- package/src/languageProcessing/languages/en/config/abbreviations.js +0 -55
- package/src/languageProcessing/languages/en/config/firstWordExceptions.js +0 -14
- package/src/languageProcessing/languages/en/config/functionWords.js +0 -186
- package/src/languageProcessing/languages/en/config/internal/passiveVoiceAuxiliaries.js +0 -44
- package/src/languageProcessing/languages/en/config/internal/passiveVoiceIrregulars.js +0 -354
- package/src/languageProcessing/languages/en/config/internal/passiveVoiceNonVerbEndingEd.js +0 -3047
- package/src/languageProcessing/languages/en/config/regularParticiplesRegex.js +0 -5
- package/src/languageProcessing/languages/en/config/stopWords.js +0 -52
- package/src/languageProcessing/languages/en/config/syllables.json +0 -86
- package/src/languageProcessing/languages/en/config/transitionWords.js +0 -48
- package/src/languageProcessing/languages/en/config/twoPartTransitionWords.js +0 -7
- package/src/languageProcessing/languages/en/config/wordComplexity.js +0 -5
- package/src/languageProcessing/languages/en/helpers/calculateFleschReadingScore.js +0 -18
- package/src/languageProcessing/languages/en/helpers/checkIfWordIsComplex.js +0 -43
- package/src/languageProcessing/languages/en/helpers/getClauses.js +0 -49
- package/src/languageProcessing/languages/en/helpers/getStemmer.js +0 -22
- package/src/languageProcessing/languages/en/helpers/internal/determineStem.js +0 -178
- package/src/languageProcessing/languages/en/helpers/internal/getAdjectiveStem.js +0 -162
- package/src/languageProcessing/languages/en/helpers/internal/getParticiples.js +0 -25
- package/src/languageProcessing/languages/en/helpers/internal/getVerbStem.js +0 -237
- package/src/languageProcessing/languages/en/values/Clause.js +0 -68
- package/src/languageProcessing/languages/es/Researcher.js +0 -48
- package/src/languageProcessing/languages/es/config/firstWordExceptions.js +0 -16
- package/src/languageProcessing/languages/es/config/functionWords.js +0 -321
- package/src/languageProcessing/languages/es/config/internal/passiveVoiceAuxiliaries.js +0 -60
- package/src/languageProcessing/languages/es/config/internal/passiveVoiceParticiples.js +0 -7327
- package/src/languageProcessing/languages/es/config/sentenceLength.js +0 -3
- package/src/languageProcessing/languages/es/config/stopWords.js +0 -33
- package/src/languageProcessing/languages/es/config/syllables.json +0 -176
- package/src/languageProcessing/languages/es/config/transitionWords.js +0 -40
- package/src/languageProcessing/languages/es/config/twoPartTransitionWords.js +0 -10
- package/src/languageProcessing/languages/es/config/wordComplexity.js +0 -4
- package/src/languageProcessing/languages/es/helpers/calculateFleschReadingScore.js +0 -18
- package/src/languageProcessing/languages/es/helpers/checkIfWordIsComplex.js +0 -56
- package/src/languageProcessing/languages/es/helpers/getClauses.js +0 -29
- package/src/languageProcessing/languages/es/helpers/getStemmer.js +0 -22
- package/src/languageProcessing/languages/es/helpers/internal/checkVerbStemModifications.js +0 -41
- package/src/languageProcessing/languages/es/helpers/internal/getParticiples.js +0 -35
- package/src/languageProcessing/languages/es/helpers/internal/stem.js +0 -793
- package/src/languageProcessing/languages/es/values/Clause.js +0 -47
- package/src/languageProcessing/languages/fa/Researcher.js +0 -47
- package/src/languageProcessing/languages/fa/config/firstWordExceptions.js +0 -12
- package/src/languageProcessing/languages/fa/config/functionWords.js +0 -122
- package/src/languageProcessing/languages/fa/config/internal/participles.js +0 -1429
- package/src/languageProcessing/languages/fa/config/sentenceLength.js +0 -3
- package/src/languageProcessing/languages/fa/config/transitionWords.js +0 -20
- package/src/languageProcessing/languages/fa/config/twoPartTransitionWords.js +0 -9
- package/src/languageProcessing/languages/fa/helpers/createBasicWordForms.js +0 -97
- package/src/languageProcessing/languages/fa/helpers/getStemmer.js +0 -13
- package/src/languageProcessing/languages/fa/helpers/isPassiveSentence.js +0 -14
- package/src/languageProcessing/languages/fr/Researcher.js +0 -46
- package/src/languageProcessing/languages/fr/config/firstWordExceptions.js +0 -16
- package/src/languageProcessing/languages/fr/config/functionWords.js +0 -281
- package/src/languageProcessing/languages/fr/config/internal/exceptionsParticiplesActive.js +0 -1510
- package/src/languageProcessing/languages/fr/config/internal/passiveVoiceAuxiliaries.js +0 -108
- package/src/languageProcessing/languages/fr/config/internal/passiveVoiceIrregulars.js +0 -565
- package/src/languageProcessing/languages/fr/config/stopWords.js +0 -119
- package/src/languageProcessing/languages/fr/config/syllables.json +0 -1426
- package/src/languageProcessing/languages/fr/config/transitionWords.js +0 -59
- package/src/languageProcessing/languages/fr/config/twoPartTransitionWords.js +0 -15
- package/src/languageProcessing/languages/fr/config/wordComplexity.js +0 -4
- package/src/languageProcessing/languages/fr/helpers/calculateFleschReadingScore.js +0 -18
- package/src/languageProcessing/languages/fr/helpers/checkIfWordIsComplex.js +0 -67
- package/src/languageProcessing/languages/fr/helpers/getClauses.js +0 -34
- package/src/languageProcessing/languages/fr/helpers/getStemmer.js +0 -22
- package/src/languageProcessing/languages/fr/helpers/internal/getParticiples.js +0 -72
- package/src/languageProcessing/languages/fr/helpers/internal/stem.js +0 -633
- package/src/languageProcessing/languages/fr/values/Clause.js +0 -96
- package/src/languageProcessing/languages/he/Researcher.js +0 -50
- package/src/languageProcessing/languages/he/config/firstWordExceptions.js +0 -13
- package/src/languageProcessing/languages/he/config/functionWords.js +0 -564
- package/src/languageProcessing/languages/he/config/internal/regularRootsHufal.js +0 -186
- package/src/languageProcessing/languages/he/config/internal/regularRootsNifal.js +0 -195
- package/src/languageProcessing/languages/he/config/internal/regularRootsPual.js +0 -168
- package/src/languageProcessing/languages/he/config/passiveVoice/regularRootsHufal.js +0 -188
- package/src/languageProcessing/languages/he/config/passiveVoice/regularRootsNifal.js +0 -197
- package/src/languageProcessing/languages/he/config/passiveVoice/regularRootsPual.js +0 -170
- package/src/languageProcessing/languages/he/config/prefixedFunctionWords.js +0 -2
- package/src/languageProcessing/languages/he/config/sentenceLength.js +0 -3
- package/src/languageProcessing/languages/he/config/transitionWords.js +0 -28
- package/src/languageProcessing/languages/he/config/twoPartTransitionWords.js +0 -8
- package/src/languageProcessing/languages/he/helpers/createBasicWordForms.js +0 -33
- package/src/languageProcessing/languages/he/helpers/getStemmer.js +0 -22
- package/src/languageProcessing/languages/he/helpers/internal/stem.js +0 -52
- package/src/languageProcessing/languages/he/helpers/isPassiveSentence.js +0 -96
- package/src/languageProcessing/languages/he/helpers/stem.js +0 -52
- package/src/languageProcessing/languages/hu/Researcher.js +0 -48
- package/src/languageProcessing/languages/hu/config/firstWordExceptions.js +0 -31
- package/src/languageProcessing/languages/hu/config/functionWords.js +0 -284
- package/src/languageProcessing/languages/hu/config/internal/auxiliaries.js +0 -97
- package/src/languageProcessing/languages/hu/config/internal/morphologicalPassiveAffixes.js +0 -125
- package/src/languageProcessing/languages/hu/config/internal/nonPassivesInVaAndVe.js +0 -265
- package/src/languageProcessing/languages/hu/config/internal/odikVerbs.js +0 -273
- package/src/languageProcessing/languages/hu/config/internal/participles.js +0 -412
- package/src/languageProcessing/languages/hu/config/stopWords.js +0 -213
- package/src/languageProcessing/languages/hu/config/transitionWords.js +0 -42
- package/src/languageProcessing/languages/hu/config/twoPartTransitionWords.js +0 -34
- package/src/languageProcessing/languages/hu/helpers/getClauses.js +0 -25
- package/src/languageProcessing/languages/hu/helpers/getStemmer.js +0 -22
- package/src/languageProcessing/languages/hu/helpers/internal/getParticiples.js +0 -21
- package/src/languageProcessing/languages/hu/helpers/internal/stem.js +0 -389
- package/src/languageProcessing/languages/hu/helpers/isPassiveSentence.js +0 -54
- package/src/languageProcessing/languages/hu/values/Clause.js +0 -41
- package/src/languageProcessing/languages/id/Researcher.js +0 -46
- package/src/languageProcessing/languages/id/config/firstWordExceptions.js +0 -13
- package/src/languageProcessing/languages/id/config/functionWords.js +0 -202
- package/src/languageProcessing/languages/id/config/internal/nonPassiveVerbsStartingDi.js +0 -215
- package/src/languageProcessing/languages/id/config/transitionWords.js +0 -62
- package/src/languageProcessing/languages/id/config/twoPartTransitionWords.js +0 -13
- package/src/languageProcessing/languages/id/helpers/getStemmer.js +0 -22
- package/src/languageProcessing/languages/id/helpers/internal/stem.js +0 -462
- package/src/languageProcessing/languages/id/helpers/internal/stemHelpers.js +0 -78
- package/src/languageProcessing/languages/id/helpers/isPassiveSentence.js +0 -39
- package/src/languageProcessing/languages/id/helpers/splitIntoTokensCustom.js +0 -47
- package/src/languageProcessing/languages/it/Researcher.js +0 -48
- package/src/languageProcessing/languages/it/config/firstWordExceptions.js +0 -17
- package/src/languageProcessing/languages/it/config/functionWords.js +0 -277
- package/src/languageProcessing/languages/it/config/internal/passiveVoiceAuxiliaries.js +0 -98
- package/src/languageProcessing/languages/it/config/internal/passiveVoiceParticiples.js +0 -7197
- package/src/languageProcessing/languages/it/config/sentenceLength.js +0 -3
- package/src/languageProcessing/languages/it/config/stopWords.js +0 -57
- package/src/languageProcessing/languages/it/config/syllables.json +0 -573
- package/src/languageProcessing/languages/it/config/transitionWords.js +0 -104
- package/src/languageProcessing/languages/it/config/twoPartTransitionWords.js +0 -9
- package/src/languageProcessing/languages/it/helpers/calculateFleschReadingScore.js +0 -15
- package/src/languageProcessing/languages/it/helpers/getClauses.js +0 -32
- package/src/languageProcessing/languages/it/helpers/getStemmer.js +0 -22
- package/src/languageProcessing/languages/it/helpers/internal/getParticiples.js +0 -34
- package/src/languageProcessing/languages/it/helpers/internal/stem.js +0 -436
- package/src/languageProcessing/languages/it/values/Clause.js +0 -47
- package/src/languageProcessing/languages/ja/Researcher.js +0 -86
- package/src/languageProcessing/languages/ja/config/assessmentApplicabilityCharacterCount.js +0 -4
- package/src/languageProcessing/languages/ja/config/firstWordExceptions.js +0 -8
- package/src/languageProcessing/languages/ja/config/functionWords.js +0 -563
- package/src/languageProcessing/languages/ja/config/keyphraseLength.js +0 -16
- package/src/languageProcessing/languages/ja/config/metaDescriptionLength.js +0 -4
- package/src/languageProcessing/languages/ja/config/paragraphLength.js +0 -10
- package/src/languageProcessing/languages/ja/config/sentenceLength.js +0 -4
- package/src/languageProcessing/languages/ja/config/subheadingsTooLong.js +0 -18
- package/src/languageProcessing/languages/ja/config/textLength.js +0 -47
- package/src/languageProcessing/languages/ja/config/topicLength.js +0 -5
- package/src/languageProcessing/languages/ja/config/transitionWords.js +0 -354
- package/src/languageProcessing/languages/ja/customResearches/findKeyphraseInSEOTitle.js +0 -98
- package/src/languageProcessing/languages/ja/customResearches/getKeyphraseLength.js +0 -19
- package/src/languageProcessing/languages/ja/customResearches/getWordForms.js +0 -50
- package/src/languageProcessing/languages/ja/customResearches/textLength.js +0 -24
- package/src/languageProcessing/languages/ja/helpers/countCharacters.js +0 -19
- package/src/languageProcessing/languages/ja/helpers/customGetStemmer.js +0 -21
- package/src/languageProcessing/languages/ja/helpers/getContentWords.js +0 -21
- package/src/languageProcessing/languages/ja/helpers/getWords.js +0 -31
- package/src/languageProcessing/languages/ja/helpers/internal/SentenceTokenizer.js +0 -102
- package/src/languageProcessing/languages/ja/helpers/internal/createWordForms.js +0 -68
- package/src/languageProcessing/languages/ja/helpers/internal/determineStem.js +0 -17
- package/src/languageProcessing/languages/ja/helpers/matchTextWithWord.js +0 -53
- package/src/languageProcessing/languages/ja/helpers/matchTransitionWords.js +0 -25
- package/src/languageProcessing/languages/ja/helpers/memoizedSentenceTokenizer.js +0 -28
- package/src/languageProcessing/languages/ja/helpers/splitIntoTokensCustom.js +0 -20
- package/src/languageProcessing/languages/ja/helpers/wordsCharacterCount.js +0 -13
- package/src/languageProcessing/languages/nb/Researcher.js +0 -45
- package/src/languageProcessing/languages/nb/config/firstWordExceptions.js +0 -12
- package/src/languageProcessing/languages/nb/config/functionWords.js +0 -106
- package/src/languageProcessing/languages/nb/config/internal/participles.js +0 -3127
- package/src/languageProcessing/languages/nb/config/internal/passiveVoiceAuxiliaries.js +0 -15
- package/src/languageProcessing/languages/nb/config/stopWords.js +0 -39
- package/src/languageProcessing/languages/nb/config/transitionWords.js +0 -21
- package/src/languageProcessing/languages/nb/config/twoPartTransitionWords.js +0 -10
- package/src/languageProcessing/languages/nb/helpers/getClauses.js +0 -28
- package/src/languageProcessing/languages/nb/helpers/getStemmer.js +0 -22
- package/src/languageProcessing/languages/nb/helpers/internal/getParticiples.js +0 -24
- package/src/languageProcessing/languages/nb/helpers/internal/stem.js +0 -133
- package/src/languageProcessing/languages/nb/values/Clause.js +0 -43
- package/src/languageProcessing/languages/nl/Researcher.js +0 -48
- package/src/languageProcessing/languages/nl/config/firstWordExceptions.js +0 -15
- package/src/languageProcessing/languages/nl/config/functionWords.js +0 -233
- package/src/languageProcessing/languages/nl/config/internal/nonParticiples.js +0 -2515
- package/src/languageProcessing/languages/nl/config/internal/passiveVoiceAuxiliaries.js +0 -13
- package/src/languageProcessing/languages/nl/config/internal/passiveVoiceIrregulars.js +0 -474
- package/src/languageProcessing/languages/nl/config/keyphraseLength.js +0 -10
- package/src/languageProcessing/languages/nl/config/stopWords.js +0 -35
- package/src/languageProcessing/languages/nl/config/syllables.json +0 -343
- package/src/languageProcessing/languages/nl/config/transitionWords.js +0 -22
- package/src/languageProcessing/languages/nl/config/twoPartTransitionWords.js +0 -8
- package/src/languageProcessing/languages/nl/helpers/calculateFleschReadingScore.js +0 -15
- package/src/languageProcessing/languages/nl/helpers/getClauses.js +0 -25
- package/src/languageProcessing/languages/nl/helpers/getStemmer.js +0 -22
- package/src/languageProcessing/languages/nl/helpers/internal/checkExceptionsWithFullForms.js +0 -128
- package/src/languageProcessing/languages/nl/helpers/internal/detectAndStemRegularParticiple.js +0 -324
- package/src/languageProcessing/languages/nl/helpers/internal/detectAndStemSuffixes.js +0 -164
- package/src/languageProcessing/languages/nl/helpers/internal/determineStem.js +0 -133
- package/src/languageProcessing/languages/nl/helpers/internal/getParticiples.js +0 -25
- package/src/languageProcessing/languages/nl/helpers/internal/getStemWordsWithTAndDEnding.js +0 -183
- package/src/languageProcessing/languages/nl/helpers/internal/stem.js +0 -146
- package/src/languageProcessing/languages/nl/helpers/internal/stemModificationHelpers.js +0 -109
- package/src/languageProcessing/languages/nl/helpers/internal/stemTOrDFromEndOfWord.js +0 -65
- package/src/languageProcessing/languages/nl/values/Clause.js +0 -62
- package/src/languageProcessing/languages/pl/Researcher.js +0 -47
- package/src/languageProcessing/languages/pl/config/firstWordExceptions.js +0 -12
- package/src/languageProcessing/languages/pl/config/functionWords.js +0 -421
- package/src/languageProcessing/languages/pl/config/internal/auxiliaries.js +0 -85
- package/src/languageProcessing/languages/pl/config/internal/participles.js +0 -26433
- package/src/languageProcessing/languages/pl/config/sentenceLength.js +0 -10
- package/src/languageProcessing/languages/pl/config/stopWords.js +0 -36
- package/src/languageProcessing/languages/pl/config/transitionWords.js +0 -42
- package/src/languageProcessing/languages/pl/config/twoPartTransitionWords.js +0 -8
- package/src/languageProcessing/languages/pl/helpers/getClauses.js +0 -25
- package/src/languageProcessing/languages/pl/helpers/getStemmer.js +0 -22
- package/src/languageProcessing/languages/pl/helpers/internal/getParticiples.js +0 -18
- package/src/languageProcessing/languages/pl/helpers/internal/stem.js +0 -161
- package/src/languageProcessing/languages/pl/values/Clause.js +0 -53
- package/src/languageProcessing/languages/pt/Researcher.js +0 -48
- package/src/languageProcessing/languages/pt/config/firstWordExceptions.js +0 -15
- package/src/languageProcessing/languages/pt/config/functionWords.js +0 -226
- package/src/languageProcessing/languages/pt/config/internal/passiveVoiceAuxiliaries.js +0 -66
- package/src/languageProcessing/languages/pt/config/internal/passiveVoiceParticiples.js +0 -4088
- package/src/languageProcessing/languages/pt/config/sentenceLength.js +0 -3
- package/src/languageProcessing/languages/pt/config/stopWords.js +0 -50
- package/src/languageProcessing/languages/pt/config/syllables.json +0 -38
- package/src/languageProcessing/languages/pt/config/transitionWords.js +0 -34
- package/src/languageProcessing/languages/pt/config/twoPartTransitionWords.js +0 -9
- package/src/languageProcessing/languages/pt/helpers/calculateFleschReadingScore.js +0 -15
- package/src/languageProcessing/languages/pt/helpers/getClauses.js +0 -29
- package/src/languageProcessing/languages/pt/helpers/getStemmer.js +0 -22
- package/src/languageProcessing/languages/pt/helpers/internal/getParticiples.js +0 -35
- package/src/languageProcessing/languages/pt/helpers/internal/stem.js +0 -319
- package/src/languageProcessing/languages/pt/values/Clause.js +0 -43
- package/src/languageProcessing/languages/ru/Researcher.js +0 -48
- package/src/languageProcessing/languages/ru/config/firstWordExceptions.js +0 -14
- package/src/languageProcessing/languages/ru/config/fleschReadingEaseScores.js +0 -20
- package/src/languageProcessing/languages/ru/config/functionWords.js +0 -519
- package/src/languageProcessing/languages/ru/config/internal/participlesShortenedList.js +0 -2914
- package/src/languageProcessing/languages/ru/config/internal/passiveVoiceParticiples.js +0 -6295
- package/src/languageProcessing/languages/ru/config/sentenceLength.js +0 -3
- package/src/languageProcessing/languages/ru/config/syllables.json +0 -19
- package/src/languageProcessing/languages/ru/config/transitionWords.js +0 -62
- package/src/languageProcessing/languages/ru/config/twoPartTransitionWords.js +0 -14
- package/src/languageProcessing/languages/ru/helpers/calculateFleschReadingScore.js +0 -16
- package/src/languageProcessing/languages/ru/helpers/getStemmer.js +0 -22
- package/src/languageProcessing/languages/ru/helpers/internal/stem.js +0 -288
- package/src/languageProcessing/languages/ru/helpers/isPassiveSentence.js +0 -14
- package/src/languageProcessing/languages/sk/Researcher.js +0 -46
- package/src/languageProcessing/languages/sk/config/firstWordExceptions.js +0 -14
- package/src/languageProcessing/languages/sk/config/functionWords.js +0 -855
- package/src/languageProcessing/languages/sk/config/internal/nonPassives.js +0 -1074
- package/src/languageProcessing/languages/sk/config/internal/passiveVoiceAuxiliaries.js +0 -22
- package/src/languageProcessing/languages/sk/config/stopWords.js +0 -34
- package/src/languageProcessing/languages/sk/config/transitionWords.js +0 -23
- package/src/languageProcessing/languages/sk/config/twoPartTransitionWords.js +0 -10
- package/src/languageProcessing/languages/sk/helpers/getClauses.js +0 -26
- package/src/languageProcessing/languages/sk/helpers/getStemmer.js +0 -22
- package/src/languageProcessing/languages/sk/helpers/internal/getParticiples.js +0 -16
- package/src/languageProcessing/languages/sk/helpers/internal/stem.js +0 -319
- package/src/languageProcessing/languages/sk/values/Clause.js +0 -39
- package/src/languageProcessing/languages/sv/Researcher.js +0 -45
- package/src/languageProcessing/languages/sv/config/firstWordExceptions.js +0 -15
- package/src/languageProcessing/languages/sv/config/functionWords.js +0 -176
- package/src/languageProcessing/languages/sv/config/internal/passiveVerbs.js +0 -10400
- package/src/languageProcessing/languages/sv/config/keyphraseLength.js +0 -11
- package/src/languageProcessing/languages/sv/config/transitionWords.js +0 -35
- package/src/languageProcessing/languages/sv/config/twoPartTransitionWords.js +0 -8
- package/src/languageProcessing/languages/sv/helpers/getStemmer.js +0 -22
- package/src/languageProcessing/languages/sv/helpers/internal/stem.js +0 -152
- package/src/languageProcessing/languages/sv/helpers/isPassiveSentence.js +0 -14
- package/src/languageProcessing/languages/tr/Researcher.js +0 -44
- package/src/languageProcessing/languages/tr/config/firstWordExceptions.js +0 -13
- package/src/languageProcessing/languages/tr/config/functionWords.js +0 -116
- package/src/languageProcessing/languages/tr/config/internal/nonPassiveExceptions.js +0 -574
- package/src/languageProcessing/languages/tr/config/internal/passiveEndings.js +0 -151
- package/src/languageProcessing/languages/tr/config/sentenceLength.js +0 -7
- package/src/languageProcessing/languages/tr/config/transitionWords.js +0 -42
- package/src/languageProcessing/languages/tr/config/twoPartTransitionWords.js +0 -7
- package/src/languageProcessing/languages/tr/helpers/getStemmer.js +0 -22
- package/src/languageProcessing/languages/tr/helpers/internal/stem.js +0 -20
- package/src/languageProcessing/languages/tr/helpers/isPassiveSentence.js +0 -43
- package/src/languageProcessing/researches/altTagCount.js +0 -70
- package/src/languageProcessing/researches/countSentencesFromText.js +0 -19
- package/src/languageProcessing/researches/findKeyphraseInSEOTitle.js +0 -257
- package/src/languageProcessing/researches/findKeywordInFirstParagraph.js +0 -86
- package/src/languageProcessing/researches/findTransitionWords.js +0 -123
- package/src/languageProcessing/researches/functionWordsInKeyphrase.js +0 -44
- package/src/languageProcessing/researches/getAnchorsWithKeyphrase.js +0 -227
- package/src/languageProcessing/researches/getFleschReadingScore.js +0 -150
- package/src/languageProcessing/researches/getKeywordDensity.js +0 -44
- package/src/languageProcessing/researches/getLinkStatistics.js +0 -54
- package/src/languageProcessing/researches/getLinks.js +0 -18
- package/src/languageProcessing/researches/getLongCenterAlignedTexts.js +0 -37
- package/src/languageProcessing/researches/getParagraphLength.js +0 -44
- package/src/languageProcessing/researches/getParagraphs.js +0 -18
- package/src/languageProcessing/researches/getPassiveVoiceResult.js +0 -129
- package/src/languageProcessing/researches/getProminentWordsForInsights.js +0 -48
- package/src/languageProcessing/researches/getProminentWordsForInternalLinking.js +0 -119
- package/src/languageProcessing/researches/getSentenceBeginnings.js +0 -124
- package/src/languageProcessing/researches/getSubheadingTextLengths.js +0 -59
- package/src/languageProcessing/researches/getWordForms.js +0 -204
- package/src/languageProcessing/researches/h1s.js +0 -10
- package/src/languageProcessing/researches/imageCount.js +0 -16
- package/src/languageProcessing/researches/index.js +0 -5
- package/src/languageProcessing/researches/keyphraseDistribution.js +0 -249
- package/src/languageProcessing/researches/keyphraseLength.js +0 -17
- package/src/languageProcessing/researches/keywordCount.js +0 -134
- package/src/languageProcessing/researches/keywordCountInUrl.js +0 -57
- package/src/languageProcessing/researches/matchKeywordInSubheadings.js +0 -62
- package/src/languageProcessing/researches/metaDescriptionKeyword.js +0 -85
- package/src/languageProcessing/researches/metaDescriptionLength.js +0 -12
- package/src/languageProcessing/researches/pageTitleWidth.js +0 -11
- package/src/languageProcessing/researches/readingTime.js +0 -82
- package/src/languageProcessing/researches/sentences.js +0 -20
- package/src/languageProcessing/researches/videoCount.js +0 -32
- package/src/languageProcessing/researches/wordComplexity.js +0 -129
- package/src/languageProcessing/researches/wordCountInText.js +0 -29
- package/src/languageProcessing/values/Clause.js +0 -108
- package/src/languageProcessing/values/ProminentWord.js +0 -95
- package/src/languageProcessing/values/Sentence.js +0 -111
- package/src/languageProcessing/values/index.js +0 -9
- package/src/markers/addMark.js +0 -9
- package/src/markers/addMarkSingleWord.js +0 -32
- package/src/markers/index.js +0 -7
- package/src/markers/removeDuplicateMarks.js +0 -27
- package/src/markers/removeMarks.js +0 -11
- package/src/parse/build/build.js +0 -52
- package/src/parse/build/index.js +0 -10
- package/src/parse/build/private/adapt.js +0 -113
- package/src/parse/build/private/adaptAttributes.js +0 -36
- package/src/parse/build/private/alwaysFilterElements.js +0 -75
- package/src/parse/build/private/combineIntoImplicitParagraphs.js +0 -130
- package/src/parse/build/private/filterBeforeTokenizing.js +0 -32
- package/src/parse/build/private/filterHelpers.js +0 -44
- package/src/parse/build/private/filterTree.js +0 -42
- package/src/parse/build/private/getTextElementPositions.js +0 -184
- package/src/parse/build/private/helpers/parseClassAttribute.js +0 -9
- package/src/parse/build/private/isPhrasingContent.js +0 -28
- package/src/parse/build/private/parseBlocks.js +0 -151
- package/src/parse/build/private/tokenize.js +0 -74
- package/src/parse/language/LanguageProcessor.js +0 -74
- package/src/parse/structure/Heading.js +0 -26
- package/src/parse/structure/Node.js +0 -69
- package/src/parse/structure/Paragraph.js +0 -48
- package/src/parse/structure/Sentence.js +0 -30
- package/src/parse/structure/SourceCodeLocation.js +0 -41
- package/src/parse/structure/Text.js +0 -27
- package/src/parse/structure/Token.js +0 -24
- package/src/parse/structure/index.js +0 -16
- package/src/parse/traverse/findAllInTree.js +0 -58
- package/src/parse/traverse/index.js +0 -12
- package/src/parse/traverse/innerText.js +0 -26
- package/src/parsedPaper/ParsedPaper.js +0 -92
- package/src/parsedPaper/assess/TreeAssessor.js +0 -184
- package/src/parsedPaper/assess/assessmentListFactories.js +0 -73
- package/src/parsedPaper/assess/assessments/Assessment.js +0 -79
- package/src/parsedPaper/assess/assessments/index.js +0 -6
- package/src/parsedPaper/assess/assessorFactories.js +0 -104
- package/src/parsedPaper/assess/cornerstone/assessmentListFactories.js +0 -47
- package/src/parsedPaper/assess/cornerstone/index.js +0 -5
- package/src/parsedPaper/assess/index.js +0 -20
- package/src/parsedPaper/build/PaperParser.js +0 -105
- package/src/parsedPaper/build/linguisticParsing/Sentence.js +0 -89
- package/src/parsedPaper/build/linguisticParsing/SentenceTokenizer.js +0 -323
- package/src/parsedPaper/build/linguisticParsing/parseText.js +0 -20
- package/src/parsedPaper/build/tree/TreeBuilder.js +0 -75
- package/src/parsedPaper/build/tree/cleanup/calculateTextIndices.js +0 -190
- package/src/parsedPaper/build/tree/cleanup/getElementContent.js +0 -21
- package/src/parsedPaper/build/tree/cleanup/postParsing.js +0 -37
- package/src/parsedPaper/build/tree/html/HTMLTreeConverter.js +0 -230
- package/src/parsedPaper/build/tree/html/buildTree.js +0 -31
- package/src/parsedPaper/build/tree/html/htmlConstants.js +0 -37
- package/src/parsedPaper/build/tree/index.js +0 -14
- package/src/parsedPaper/build/tree/metadata/buildTree.js +0 -32
- package/src/parsedPaper/research/TreeResearcher.js +0 -134
- package/src/parsedPaper/research/index.js +0 -13
- package/src/parsedPaper/research/researches/Headings.js +0 -20
- package/src/parsedPaper/research/researches/LinkStatistics.js +0 -128
- package/src/parsedPaper/research/researches/Research.js +0 -50
- package/src/parsedPaper/research/researches/index.js +0 -1
- package/src/parsedPaper/structure/tree/FormattingElement.js +0 -67
- package/src/parsedPaper/structure/tree/SourceCodeLocation.js +0 -31
- package/src/parsedPaper/structure/tree/TextContainer.js +0 -85
- package/src/parsedPaper/structure/tree/index.js +0 -22
- package/src/parsedPaper/structure/tree/nodes/Heading.js +0 -26
- package/src/parsedPaper/structure/tree/nodes/LeafNode.js +0 -75
- package/src/parsedPaper/structure/tree/nodes/List.js +0 -47
- package/src/parsedPaper/structure/tree/nodes/ListItem.js +0 -26
- package/src/parsedPaper/structure/tree/nodes/MetadataMiscellaneous.js +0 -46
- package/src/parsedPaper/structure/tree/nodes/MetadataText.js +0 -26
- package/src/parsedPaper/structure/tree/nodes/Node.js +0 -154
- package/src/parsedPaper/structure/tree/nodes/Paragraph.js +0 -24
- package/src/parsedPaper/structure/tree/nodes/StructuredNode.js +0 -52
- package/src/parsedPaper/structure/tree/nodes/index.js +0 -21
- package/src/scoring/assessments/assessment.js +0 -63
- package/src/scoring/assessments/index.js +0 -58
- package/src/scoring/assessments/readability/ParagraphTooLongAssessment.js +0 -173
- package/src/scoring/assessments/readability/SentenceBeginningsAssessment.js +0 -132
- package/src/scoring/assessments/readability/SentenceLengthInTextAssessment.js +0 -186
- package/src/scoring/assessments/readability/TransitionWordsAssessment.js +0 -168
- package/src/scoring/assessments/seo/ImageCountAssessment.js +0 -112
- package/src/scoring/assessments/seo/InternalLinksAssessment.js +0 -114
- package/src/scoring/assessments/seo/IntroductionKeywordAssessment.js +0 -110
- package/src/scoring/assessments/seo/KeyphraseAssessment.js +0 -104
- package/src/scoring/assessments/seo/KeyphraseLengthAssessment.js +0 -110
- package/src/scoring/assessments/seo/KeywordDensityAssessment.js +0 -116
- package/src/scoring/assessments/seo/MetaDescriptionKeywordAssessment.js +0 -114
- package/src/scoring/assessments/seo/MetaDescriptionLengthAssessment.js +0 -112
- package/src/scoring/assessments/seo/MetaTitleKeywordAssessment.js +0 -111
- package/src/scoring/assessments/seo/NumberInMetaTitleAssessment.js +0 -107
- package/src/scoring/assessments/seo/OutboundLinksAssessment.js +0 -111
- package/src/scoring/assessments/seo/PageTitleWidthAssessment.js +0 -104
- package/src/scoring/assessments/seo/SingleH1Assessment.js +0 -118
- package/src/scoring/assessments/seo/SingleTitleAssessment.js +0 -108
- package/src/scoring/assessments/seo/SubHeadingsKeywordAssessment.js +0 -107
- package/src/scoring/assessments/seo/TextImagesAssessment.js +0 -144
- package/src/scoring/assessments/seo/TextLengthAssessment.js +0 -100
- package/src/scoring/assessments/seo/UrlKeywordAssessment.js +0 -111
- package/src/scoring/assessments/seo/UrlLengthAssessment.js +0 -103
- package/src/scoring/assessors/assessor.js +0 -269
- package/src/scoring/assessors/avadaAssessor.js +0 -67
- package/src/scoring/assessors/contentAssessor.js +0 -159
- package/src/scoring/assessors/index.js +0 -4
- package/src/scoring/assessors/seoAssessor.js +0 -57
- package/src/scoring/helpers/assessments/checkForTooLongSentences.js +0 -13
- package/src/scoring/helpers/assessments/inRange.js +0 -49
- package/src/scoring/helpers/assessments/keyphraseLengthFactor.js +0 -10
- package/src/scoring/helpers/assessments/recommendedKeywordCount.js +0 -43
- package/src/scoring/helpers/index.js +0 -74
- package/src/scoring/interpreters/index.js +0 -5
- package/src/scoring/interpreters/scoreToRating.js +0 -31
- package/src/scoring/renderers/AssessorPresenter.js +0 -360
- package/src/scoring/scoreAggregators/ReadabilityScoreAggregator.js +0 -203
- package/src/scoring/scoreAggregators/SEOScoreAggregator.js +0 -54
- package/src/scoring/scoreAggregators/ScoreAggregator.js +0 -23
- package/src/scoring/scoreAggregators/index.js +0 -3
- package/src/values/AssessmentResult.js +0 -496
- package/src/values/Mark.js +0 -271
- package/src/values/Paper.js +0 -425
- package/src/values/index.js +0 -9
- package/src/vendor/turkishStemmer.js +0 -3435
- package/tsconfig.json +0 -15
|
@@ -1,26 +0,0 @@
|
|
|
1
|
-
/** @module config/transitionWords */

/**
 * Greek transition words that consist of a single word.
 *
 * Every entry is stored without leading or trailing whitespace, so that an
 * entry is exactly the word itself.
 *
 * NOTE(review): "καθ΄ψς", "προγουμένως" and "πρωταρχικα" look like misspellings;
 * they are kept unchanged here and should be confirmed by a Greek speaker.
 *
 * @type {string[]} The list of single transition words.
 */
export const singleWords = [ "εξαιτίας", "επειδή", "γιατί", "διότι", "καθώς", "ώστε", "λοιπόν", "αλλά", "μα", "όμως", "παρά", "μόνο", "μόλο",
	"ωστόσο", "εντούτοις", "έπειτα", "μολαταύτα", "μάλιστα", "εξάλλου", "αντίθετα", "απεναντίας", "διαφορετικά", "ειδάλλως", "ειδεμή", "αλλιώς",
	"αλλιώτικα", "πάλι", "ενώ", "μολονότι", "αντίστροφα", "αρχικά", "προγουμένως", "πρώτα", "ύστερα", "πριν", "εντωμεταξύ", "τέλος", "όταν",
	"καθ΄ψς", "όποτε", "μόλις", "αργότερα", "αν", "δηλαδή", "ειδικότερα", "ήτοι", "συγκεκριμένα", "ειδικά", "καταρχήν", "κατόπιν", "πρωταρχικα",
	"συγκεφαλαιωτικά", "συγκεφαλαιώνοντας", "συγκεντρωτικά", "συνοπτικά", "επιλογικά", "ανακεφαλαιώνοντας", "τελικά", "γενικά", "ευρύτερα",
	"επιπλέον", "επιπρόσθετα", "επίσης", "ακόμη", "πρόσθετα", "όπως", "ομοίως", "σαν", "επομένως", "συνεπώς", "πράγματι", "βέβαια", "όντως",
	"αφού", "αφότου", "καταρχάς", "ακολούθως", "εφόσον", "κυρίως", "φυσικά", "ασφαλώς", "οπωσδήποτε", "αναντίρρητα", "προφανώς" ];

/**
 * Greek transition phrases that consist of more than one word.
 *
 * Every entry is stored without leading or trailing whitespace.
 *
 * NOTE(review): "αυτό δικαιλογείται" looks like a misspelling; it is kept
 * unchanged here and should be confirmed by a Greek speaker.
 *
 * @type {string[]} The list of multi-word transition phrases.
 */
export const multipleWords = [ "παρόλο που", "ένας ακόμα λόγος", "αυτό οφείλεται", "αυτό εξηγείται", "αυτό δικαιλογείται", "η αιτία είναι",
	"ο λόγος είναι", "γι'αυτό τον λόγο", "παρόλα ταύτα", "ως επακόλουθο", "ως αποτέλεσμα", "κατά συνέπεια", "έτσι που", "και όμως", "και γι'αυτό",
	"σε αντίθεση", "από την άλλη πλευρά", "αν και", "και αν", "στον αντίποδα", "ακόμη κι αν", "παρ'όλα αυτά", "στη συνέχεια", "είναι γεγονός ότι",
	"αξίζει να σημειωθεί", "με άλλα λόγια", "αυτό σημαίνει ότι", "για παράδειγμα", "παραδείγματος χάριν", "λόγου χάριν", "σε περίπτωση που",
	"εκτός κι αν", "εξαιτίας αυτού", "με τον ίδιο τρόπο", "με παρόμοιο τρόπο", "με την προϋπόθεση να", "υπό τον όρο να", "εν κατακλείδι",
	"χάρη σε αυτό", "από την στιγμή που", "έχει μεγάλη σημασία να", "είναι απαραίτητο να", "είναι αναγκαίο να", "είναι αξιοσημείωτο", "στο μεταξύ",
	"στην αρχή", "με δεδομένο" ];

/**
 * All Greek transition words: the single words followed by the multi-word phrases.
 *
 * @type {string[]}
 */
export const allWords = [ ...singleWords, ...multipleWords ];

export default allWords;
|
|
@@ -1,10 +0,0 @@
|
|
|
1
|
-
/** @module config/twoPartTransitionWords */

/**
 * Greek two-part transition words.
 *
 * Each entry is a pair: the first element is the opening part and the second
 * element is the part that goes with it.
 *
 * @type {Array<string[]>}
 */
export default [
	[ "όχι μόνο", "αλλά και" ],
	[ "όχι μόνο να μην", "αλλά ούτε και να" ],
	[ "από την μία", "από την άλλη" ],
	[ "αφενός", "αφετέρου" ],
	[ "μεν", "δε" ],
	[ "είτε", "είτε" ],
];
|
|
@@ -1,25 +0,0 @@
|
|
|
1
|
-
import {languageProcessing} from '../../../index';
|
|
2
|
-
const {getClausesSplitOnStopWords, createRegexFromArray} = languageProcessing;
|
|
3
|
-
|
|
4
|
-
import GreekClause from '../values/Clause';
|
|
5
|
-
import auxiliaries from '../config/internal/auxiliaries.js';
|
|
6
|
-
import stopWords from '../config/stopWords';
|
|
7
|
-
|
|
8
|
-
// Both regexes are built once, when the module is loaded, and reused for every sentence.
const auxiliaryRegex = createRegexFromArray(auxiliaries);
const stopwordRegex = createRegexFromArray(stopWords);

// Settings handed to the shared clause splitter: the Greek clause class plus the two regexes.
const greekClauseOptions = {
  Clause: GreekClause,
  regexes: {auxiliaryRegex, stopwordRegex}
};

/**
 * Splits a Greek sentence into clauses.
 *
 * Delegates to `getClausesSplitOnStopWords`, configured with the Greek clause
 * class and with regexes created from the Greek auxiliaries and stop words.
 *
 * @param {string} sentence The sentence to split up in clauses.
 *
 * @returns {Array} The clauses as returned by `getClausesSplitOnStopWords`.
 */
export default function getGreekClauses(sentence) {
  return getClausesSplitOnStopWords(sentence, greekClauseOptions);
}
|
|
@@ -1,21 +0,0 @@
|
|
|
1
|
-
import {get} from 'lodash';
|
|
2
|
-
import {languageProcessing} from '../../../index';
|
|
3
|
-
import stem from './internal/stem';
|
|
4
|
-
const {baseStemmer} = languageProcessing;
|
|
5
|
-
|
|
6
|
-
/**
 * Picks the stemming function for Greek.
 *
 * Looks up the `el` entry in the researcher's `morphology` data. When that
 * entry is present, the returned function stems a word with it; otherwise
 * `baseStemmer` is returned.
 *
 * @param {Researcher} researcher The researcher that provides the morphology data.
 *
 * @returns {Function} The stemmer.
 */
export default function getStemmer(researcher) {
  const greekMorphology = get(researcher.getData('morphology'), 'el', false);

  return greekMorphology ? word => stem(word, greekMorphology) : baseStemmer;
}
|
|
@@ -1,20 +0,0 @@
|
|
|
1
|
-
import {languageProcessing} from '../../../index';
|
|
2
|
-
const {getWords} = languageProcessing;
|
|
3
|
-
|
|
4
|
-
// Alternation of the word endings that mark a passive participle, anchored at the end of the word.
const passiveParticipleEndings =
  '(ούμενους|ημένους|ούμενος|ούμενου|ούμενον|ούμενης|ούμενοι|ούμενων|ούμενες|μένους|' +
  'ημένος|ημένου|ημένον|ημένοι|ημένων|ημένης|ημένες|ούμενη|ούμενο|ούμενα|μένος|μένου|μένον|μένοι|μένης|μένες|' +
  'μένων|ημένη|ημένο|ημένα|μένη|μένο|μένα)$';

// Compiled once at module load instead of once per word. The regex has no
// global/sticky flag, so reusing it across `test` calls carries no state.
const passiveParticipleRegex = new RegExp(passiveParticipleEndings);

/**
 * Creates an array of participles found in a clause.
 *
 * A word counts as a participle when it ends in one of the passive participle endings.
 *
 * @param {string} clauseText The clause to find participles in.
 *
 * @returns {Array} The array with the participles found.
 */
export default function(clauseText) {
  return getWords(clauseText).filter(word => passiveParticipleRegex.test(word));
}
|
|
@@ -1,368 +0,0 @@
|
|
|
1
|
-
/* eslint-disable max-statements,complexity */
|
|
2
|
-
/**
|
|
3
|
-
* MIT License
|
|
4
|
-
*
|
|
5
|
-
* Copyright (c) 2015 apmats <amatsagkas@gmail.com>
|
|
6
|
-
*
|
|
7
|
-
* Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
8
|
-
* of this software and associated documentation files (the "Software"), to deal
|
|
9
|
-
* in the Software without restriction, including without limitation the rights
|
|
10
|
-
* to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
11
|
-
* copies of the Software, and to permit persons to whom the Software is
|
|
12
|
-
* furnished to do so, subject to the following conditions:
|
|
13
|
-
*
|
|
14
|
-
* The above copyright notice and this permission notice shall be included in all
|
|
15
|
-
* copies or substantial portions of the Software.
|
|
16
|
-
*
|
|
17
|
-
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
18
|
-
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
19
|
-
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
|
20
|
-
* AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
21
|
-
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
22
|
-
* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
|
|
23
|
-
* SOFTWARE.
|
|
24
|
-
*
|
|
25
|
-
* https://github.com/Apmats/greekstemmerjs
|
|
26
|
-
*/
|
|
27
|
-
|
|
28
|
-
/**
 * Runs the word through a list of stemming regexes, one after the other.
 *
 * For every regex in the first array that matches the current word, the word is replaced by the
 * first capture group of that match. If the shortened word then matches the regex at the same
 * position in the second array, the ending at that position is appended. Later regexes are applied
 * to the result of earlier ones.
 *
 * @param {string}  word        The word to check.
 * @param {Array}   regexes1    The first array of regexes to check.
 * @param {Array}   regexes2    The second array of regexes to check.
 * @param {Array}   endings     The array of endings to attach to the stemmed word
 *                              if the previously stemmed word matches the regex at the same index in the second array.
 * @returns {string} The stemmed word if there are any matches, or otherwise the original word.
 */
export function matchAndStemWordWithRegexArray( word, regexes1, regexes2, endings ) {
	let current = word;

	for ( const [ index, pattern ] of regexes1.entries() ) {
		const found = new RegExp( pattern ).exec( current );
		if ( found === null ) {
			continue;
		}

		current = found[ 1 ];
		if ( new RegExp( regexes2[ index ] ).test( current ) ) {
			current += endings[ index ];
		}
	}

	return current;
}
|
|
51
|
-
|
|
52
|
-
/**
 * Stems the word with a single regex: when the regex matches, the first capture group is returned.
 *
 * @param {string} word     The word to check.
 * @param {string} regex    The regex to match.
 *
 * @returns {string} The stemmed word if there is a match, or otherwise the original word.
 */
export function matchAndStemWordWithOneRegex( word, regex ) {
	const found = new RegExp( regex ).exec( word );

	return found === null ? word : found[ 1 ];
}
|
|
67
|
-
|
|
68
|
-
/**
 * Stems the word with one regex and conditionally re-attaches an ending.
 *
 * When the first regex matches, the word is replaced by the first capture group. If that shortened
 * word matches the second or the third regex, the given ending is appended to it.
 *
 * @param {string} word     The word to check.
 * @param {string} regex1   The first regex to match.
 * @param {string} regex2   The second regex to match.
 * @param {string} regex3   The third regex to match.
 * @param {string} ending   The ending to attach to the stemmed word
 *                          if the stemmed word matches the second or the third regex.
 * @returns {string} The stemmed word if there is a match, or otherwise the original word.
 */
export function matchAndStemWord( word, regex1, regex2, regex3, ending ) {
	const found = new RegExp( regex1 ).exec( word );
	if ( found === null ) {
		return word;
	}

	const shortened = found[ 1 ];
	// The third regex is only evaluated when the second one does not match.
	const needsEnding = new RegExp( regex2 ).test( shortened ) || new RegExp( regex3 ).test( shortened );

	return needsEnding ? shortened + ending : shortened;
}
|
|
90
|
-
|
|
91
|
-
/**
 * Checks if a word ends in one of the step 1 exceptions and, if so, replaces that ending.
 *
 * The keys of `step1Exceptions` are the endings to look for; the value of the matched key replaces
 * the ending, while the part of the word before it is kept.
 *
 * @param {string} word             The word to check.
 * @param {Object} morphologyData   The Greek morphology data.
 * @returns {string} The word with the exception ending replaced, or the original word if no exception applies.
 */
function checkExceptionStep1( word, morphologyData ) {
	const exceptions = morphologyData.externalStemmer.step1Exceptions;
	const exceptionEndings = Object.keys( exceptions );

	// Without this guard an empty exception map yields the regex "(.*)()$", which matches every
	// word with an empty ending and would append the string "undefined" to the word.
	if ( exceptionEndings.length === 0 ) {
		return word;
	}

	const match = new RegExp( `(.*)(${ exceptionEndings.join( "|" ) })$` ).exec( word );

	return match === null ? word : match[ 1 ] + exceptions[ match[ 2 ] ];
}
|
|
107
|
-
|
|
108
|
-
/**
 * Applies the step 1 suffix rules.
 *
 * First, when `regex1a` matches, the word is cut down to the first capture group and "ΑΔ" is
 * appended unless the shortened word matches `regex1b`. The result is then passed through the
 * step 1 regex arrays (match regexes, follow-up regexes and endings).
 *
 * @param {string} word             The word to stem.
 * @param {Object} morphologyData   The Greek morphology data.
 *
 * @returns {string} The word without suffixes or the original word if no such suffix is found.
 */
function stemWordStep1( word, morphologyData ) {
	const step1 = morphologyData.externalStemmer.regexesStep1;
	const arrays = step1.regexesArrays;

	let stemmed = word;
	const found = new RegExp( step1.regex1a ).exec( stemmed );
	if ( found !== null ) {
		const shortened = found[ 1 ];
		stemmed = new RegExp( step1.regex1b ).test( shortened ) ? shortened : shortened + "ΑΔ";
	}

	return matchAndStemWordWithRegexArray( stemmed, arrays[ 0 ], arrays[ 1 ], arrays[ 2 ] );
}
|
|
130
|
-
|
|
131
|
-
/**
 * Applies the step 2 suffix rules.
 *
 * `regex2a` shortens the word to its first capture group, but only when that group is longer than
 * four characters. Then, when `regex2b` matches, the word becomes the first capture group of that
 * match; "Ι" is appended when the group matches `vowelRegex1`, is shorter than two characters or
 * matches `regex2c`, and "ΑΙ" is appended when the group matches `regex2d`.
 *
 * @param {string} word             The word to stem.
 * @param {Object} morphologyData   The Greek morphology data.
 *
 * @returns {string} The word without suffixes or the original word if no such suffix is found.
 */
function stemWordStep2( word, morphologyData ) {
	const patterns = morphologyData.externalStemmer.regexesStep2;
	const vowelPattern = new RegExp( morphologyData.externalStemmer.vowelRegex1 );

	const firstPass = new RegExp( patterns.regex2a ).exec( word );
	const afterFirstPass = ( firstPass !== null && firstPass[ 1 ].length > 4 ) ? firstPass[ 1 ] : word;

	const secondPass = new RegExp( patterns.regex2b ).exec( afterFirstPass );
	if ( secondPass === null ) {
		return afterFirstPass;
	}

	const base = secondPass[ 1 ];
	let result = base;

	if ( vowelPattern.test( base ) || base.length < 2 || new RegExp( patterns.regex2c ).test( base ) ) {
		result += "Ι";
	}
	// Checked against the bare capture group, so both endings can be appended in turn.
	if ( new RegExp( patterns.regex2d ).test( base ) ) {
		result += "ΑΙ";
	}

	return result;
}
|
|
158
|
-
|
|
159
|
-
/**
 * Applies the step 3 suffix rules.
 *
 * When `regex3a` matches, the word is cut down to the first capture group. "ΙΚ" is appended again
 * when the shortened word matches `vowelRegex1`, `regex3b` or `regex3c`.
 *
 * @param {string} word             The word to stem.
 * @param {Object} morphologyData   The Greek morphology data.
 *
 * @returns {string} The word without suffixes or the original word if no such suffix is found.
 */
function stemWordStep3( word, morphologyData ) {
	const vowelPattern = new RegExp( morphologyData.externalStemmer.vowelRegex1 );
	const patterns = morphologyData.externalStemmer.regexesStep3;

	const found = new RegExp( patterns.regex3a ).exec( word );
	if ( found === null ) {
		return word;
	}

	const base = found[ 1 ];
	const needsEnding = vowelPattern.test( base ) ||
		new RegExp( patterns.regex3b ).test( base ) ||
		new RegExp( patterns.regex3c ).test( base );

	return needsEnding ? base + "ΙΚ" : base;
}
|
|
179
|
-
|
|
180
|
-
/**
 * Applies step 4 of the Greek stemmer (verb and noun suffixes).
 *
 * The sub-steps run strictly in sequence and each one works on the output of the previous one.
 * Most sub-steps strip a suffix via a pattern from `regexesStep4` and, when the remaining stem
 * matches one of the accompanying patterns, append a fixed ending again.
 *
 * @param {string} word           The word to stem.
 * @param {Object} morphologyData The Greek morphology data.
 *
 * @returns {string} The word without suffixes or the original word if no such suffix is found.
 */
function stemWordStep4( word, morphologyData ) {
	const { regexesStep4, vowelRegex1, vowelRegex2 } = morphologyData.externalStemmer;
	const { regexesArrays } = regexesStep4;

	// Hard-coded exception that bypasses all pattern-based sub-steps.
	if ( word === "ΑΓΑΜΕ" ) {
		return "ΑΓΑΜ";
	}

	// True as soon as one of the patterns matches the text (patterns are tried in order).
	const matchesAny = ( text, patterns ) => patterns.some( ( pattern ) => new RegExp( pattern ).test( text ) );

	// Keeps the first capture group of the suffix pattern and lets `rebuild` decide the final form.
	const stripSuffix = ( current, suffixPattern, rebuild ) => {
		const found = new RegExp( suffixPattern ).exec( current );
		return found === null ? current : rebuild( found[ 1 ] );
	};

	// Forwards the first three entries of a regex array to the shared array-based helper.
	const applyRegexArray = ( current, regexes ) =>
		matchAndStemWordWithRegexArray( current, regexes[ 0 ], regexes[ 1 ], regexes[ 2 ] );

	let stemmed = matchAndStemWordWithOneRegex( word, regexesStep4.regex4a );

	stemmed = applyRegexArray( stemmed, regexesArrays.arrays1 );

	stemmed = matchAndStemWord( stemmed, regexesStep4.regex4b, vowelRegex2, regexesStep4.regex4c, "ΑΝ" );

	stemmed = matchAndStemWordWithOneRegex( stemmed, regexesStep4.regex4d );

	stemmed = stripSuffix( stemmed, regexesStep4.regex4e, ( base ) => {
		const keepsEnding = matchesAny( base, [ vowelRegex2, regexesStep4.regex4f, regexesStep4.regex4g ] );
		return keepsEnding ? base + "ΕΤ" : base;
	} );

	stemmed = stripSuffix( stemmed, regexesStep4.regex4h, ( base ) => {
		if ( new RegExp( regexesStep4.regex4i ).test( base ) ) {
			return base + "ΟΝΤ";
		}
		if ( new RegExp( regexesStep4.regex4j ).test( base ) ) {
			return base + "ΩΝΤ";
		}
		return base;
	} );

	stemmed = applyRegexArray( stemmed, regexesArrays.arrays2 );

	stemmed = matchAndStemWordWithOneRegex( stemmed, regexesStep4.regex4k );

	stemmed = matchAndStemWord( stemmed, regexesStep4.regex4l, regexesStep4.regex4m, regexesStep4.regex4n, "ΗΚ" );

	stemmed = stripSuffix( stemmed, regexesStep4.regex4o, ( base ) => {
		const keepsEnding = matchesAny( base, [ vowelRegex1, regexesStep4.regex4p, regexesStep4.regex4q ] );
		return keepsEnding ? base + "ΟΥΣ" : base;
	} );

	stemmed = stripSuffix( stemmed, regexesStep4.regex4r, ( base ) => {
		const keepsEnding = new RegExp( regexesStep4.regex4s ).test( base ) ||
			( new RegExp( regexesStep4.regex4t ).test( base ) && ! new RegExp( regexesStep4.regex4u ).test( base ) );
		return keepsEnding ? base + "ΑΓ" : base;
	} );

	return applyRegexArray( stemmed, regexesArrays.arrays3 );
}
|
|
248
|
-
|
|
249
|
-
/**
 * Applies step 5 of the Greek stemmer (adjective suffixes).
 *
 * First sub-step: when `regex5a` matches, the word becomes the first capture group plus "Μ",
 * followed by "Α" if the captured stem matches `regex5b`, or otherwise by "ΑΤ" if it matches `regex5c`.
 * Second sub-step: when `regex5d` matches the (possibly already changed) word, the word becomes
 * the first capture group plus "ΟΥ".
 *
 * @param {string} word           The word to stem.
 * @param {Object} morphologyData The Greek morphology data.
 *
 * @returns {string} The word without suffixes or the original word if no such suffix is found.
 */
function stemWordStep5( word, morphologyData ) {
	const { regex5a, regex5b, regex5c, regex5d } = morphologyData.externalStemmer.regexesStep5;
	const matches = ( pattern, text ) => new RegExp( pattern ).test( text );

	let stemmed = word;

	const firstMatch = new RegExp( regex5a ).exec( stemmed );
	if ( firstMatch !== null ) {
		const base = firstMatch[ 1 ];
		let extra = "";
		if ( matches( regex5b, base ) ) {
			extra = "Α";
		} else if ( matches( regex5c, base ) ) {
			extra = "ΑΤ";
		}
		stemmed = base + "Μ" + extra;
	}

	const secondMatch = new RegExp( regex5d ).exec( stemmed );
	return secondMatch === null ? stemmed : secondMatch[ 1 ] + "ΟΥ";
}
|
|
275
|
-
|
|
276
|
-
/**
 * Applies step 6 of the Greek stemmer (superlative and comparative suffixes).
 *
 * When `regex6a` matches, the word is reduced to the first capture group unless that group
 * matches `regex6b`, in which case the word is left as it is. Independently of that, "ΥΤ" is appended
 * when the captured group matches `regex6c`.
 *
 * @param {string} word           The word to stem.
 * @param {Object} morphologyData The Greek morphology data.
 *
 * @returns {string} The word without suffixes or the original word if no such suffix is found.
 */
function stemWordStep6( word, morphologyData ) {
	const { regex6a, regex6b, regex6c } = morphologyData.externalStemmer.regexesStep6;

	const suffixMatch = new RegExp( regex6a ).exec( word );
	if ( suffixMatch === null ) {
		return word;
	}

	const base = suffixMatch[ 1 ];
	const isProtected = new RegExp( regex6b ).test( base );
	const stemmed = isProtected ? word : base;

	return new RegExp( regex6c ).test( base ) ? stemmed + "ΥΤ" : stemmed;
}
|
|
299
|
-
|
|
300
|
-
/**
 * Normalizes Greek text to plain lowercase vowels and a single sigma form.
 *
 * Every accented, diaeresis-bearing or uppercase variant of a vowel listed in the table below
 * is replaced by its unaccented lowercase letter, and both "Σ" and final "ς" become "σ".
 * All other characters are left untouched.
 *
 * @param {string} text The text that should be normalized.
 *
 * @returns {string} The normalized text.
 */
function normalizeGreek( text ) {
	// Pairs of [ characters to replace, plain replacement ]; applied in this order.
	const replacements = [
		[ /[ΆΑά]/g, "α" ],
		[ /[ΈΕέ]/g, "ε" ],
		[ /[ΉΗή]/g, "η" ],
		[ /[ΊΪΙίΐϊ]/g, "ι" ],
		[ /[ΌΟό]/g, "ο" ],
		[ /[ΎΫΥύΰϋ]/g, "υ" ],
		[ /[ΏΩώ]/g, "ω" ],
		[ /[Σς]/g, "σ" ],
	];

	return replacements.reduce(
		( normalized, [ variants, plain ] ) => normalized.replace( variants, plain ),
		text
	);
}
|
|
317
|
-
|
|
318
|
-
/**
 * Stems a Greek word.
 *
 * The word is normalized, upper-cased, run through the exception check and stemming steps 1-5,
 * optionally through the long-word rule, then through step 6, and finally lower-cased again.
 *
 * @param {string} word           The word to stem.
 * @param {Object} morphologyData The object that contains regex-based rules and exception lists for Greek stemming.
 *
 * @returns {string} The stem of a Greek word.
 */
export default function stem( word, morphologyData ) {
	// Stemming happens in uppercase because a lowercase character can change depending on its position in the word.
	const upperCased = normalizeGreek( word ).toLocaleUpperCase( "el" );

	// Very short words and words on the do-not-stem list are returned as they are (lower-cased).
	const doNotStemWords = morphologyData.externalStemmer.doNotStemWords;
	if ( upperCased.length < 3 || doNotStemWords.includes( upperCased ) ) {
		return upperCased.toLocaleLowerCase( "el" );
	}

	// The exception check runs first, followed by steps 1 to 5; each step receives the previous step's result.
	const steps = [
		checkExceptionStep1,
		stemWordStep1,
		stemWordStep2,
		stemWordStep3,
		stemWordStep4,
		stemWordStep5,
	];
	let stemmed = steps.reduce( ( current, applyStep ) => applyStep( current, morphologyData ), upperCased );

	// Long-word handling only applies when the length is still the same as before the steps above.
	if ( upperCased.length === stemmed.length ) {
		stemmed = matchAndStemWordWithOneRegex( stemmed, morphologyData.externalStemmer.longWordRegex );
	}

	// Step 6, then back to lowercase now that stemming is complete.
	return stemWordStep6( stemmed, morphologyData ).toLocaleLowerCase( "el" );
}
|
|
@@ -1,38 +0,0 @@
|
|
|
1
|
-
import {languageProcessing} from '../../../index';
|
|
2
|
-
const {getWords, directPrecedenceException} = languageProcessing;
|
|
3
|
-
|
|
4
|
-
import nonPassiveVerbStems from '../config/internal/nonPassiveVerbStems';
|
|
5
|
-
import {passiveSuffixes} from '../config/internal/morphologicalPassiveSuffixes.js';
|
|
6
|
-
|
|
7
|
-
const directPrecedenceExceptionList = ['να'];

/**
 * Checks the passed sentence to see if it contains Greek passive verb-forms.
 *
 * A word counts as passive when it is longer than 4 characters, ends with one of the passive
 * suffixes, and the stem left after removing that suffix is not in the non-passive exception list.
 * A form ending in -θεί/-τεί is additionally rejected when it is directly preceded by "να".
 *
 * Every word of the sentence is examined: a suffix-matching word that turns out not to be passive
 * no longer ends the search, so a genuine passive later in the sentence is still found.
 *
 * @param {string} sentence The sentence to match against.
 *
 * @returns {Boolean} Whether the sentence is passive or not.
 */
export default function isPassiveSentence(sentence) {
  const words = getWords(sentence);

  for (const word of words) {
    if (word.length <= 4) {
      continue;
    }

    for (const suffix of passiveSuffixes) {
      if (!word.endsWith(suffix)) {
        continue;
      }

      // Get the stem of the word.
      const stem = word.slice(0, -suffix.length);
      const isInfinitiveSuffix = /^(θεί|τεί)$/.test(suffix);

      const isPassive =
        !nonPassiveVerbStems.includes(stem) &&
        !(
          isInfinitiveSuffix &&
          directPrecedenceException(sentence, word, directPrecedenceExceptionList)
        );

      if (isPassive) {
        return true;
      }

      // Only the first matching suffix decides for this word; move on to the next word.
      break;
    }
  }

  return false;
}
|
|
@@ -1,37 +0,0 @@
|
|
|
1
|
-
import {languageProcessing} from '../../../index';
|
|
2
|
-
const {values} = languageProcessing;
|
|
3
|
-
const {Clause} = values;
|
|
4
|
-
import getParticiples from '../helpers/internal/getParticiples';
|
|
5
|
-
|
|
6
|
-
/**
 * Clause implementation for the Greek language.
 *
 * On construction the participles found in the clause text are stored and the passiveness
 * of the clause is derived from them.
 */
class GreekClause extends Clause {
  /**
   * Creates the clause, collects its participles and sets its passiveness.
   *
   * @param {string} clauseText   The text of the clause.
   * @param {Array}  auxiliaries  The auxiliaries.
   *
   * @constructor
   */
  constructor(clauseText, auxiliaries) {
    super(clauseText, auxiliaries);

    const text = this.getClauseText();
    this._participles = getParticiples(text);

    this.checkParticiples();
  }

  /**
   * Marks the clause as passive when it has at least one participle.
   *
   * NOTE(review): the original comment says only clauses with an auxiliary are processed here;
   * no such check is visible in this method, so that presumably happens in the caller — confirm.
   *
   * @returns {void}
   */
  checkParticiples() {
    const hasParticiple = this.getParticiples().length > 0;

    this.setPassive(hasParticiple);
  }
}
|
|
36
|
-
|
|
37
|
-
export default GreekClause;
|
|
@@ -1,46 +0,0 @@
|
|
|
1
|
-
import {languageProcessing} from '../../../index';
|
|
2
|
-
const {AbstractResearcher} = languageProcessing;
|
|
3
|
-
|
|
4
|
-
// All config
|
|
5
|
-
import firstWordExceptions from './config/firstWordExceptions';
|
|
6
|
-
import {all as functionWords} from './config/functionWords';
|
|
7
|
-
import stopWords from './config/stopWords';
|
|
8
|
-
import transitionWords from './config/transitionWords';
|
|
9
|
-
import twoPartTransitionWords from './config/twoPartTransitionWords';
|
|
10
|
-
import syllables from './config/syllables.json';
|
|
11
|
-
|
|
12
|
-
// All helpers
|
|
13
|
-
import getClauses from './helpers/getClauses';
|
|
14
|
-
import getStemmer from './helpers/getStemmer';
|
|
15
|
-
import fleschReadingScore from './helpers/calculateFleschReadingScore';
|
|
16
|
-
|
|
17
|
-
/**
 * Language-specific researcher: extends the abstract researcher with this language's
 * configuration data and helper functions.
 */
export default class Researcher extends AbstractResearcher {
  /**
   * Creates the researcher and registers the language-specific config and helpers.
   *
   * @param {Paper} paper The Paper object that is needed within the researches.
   * @constructor
   */
  constructor(paper) {
    super(paper);

    // Merged into the config object set up by the parent constructor.
    const languageConfig = {
      language: 'en',
      passiveConstructionType: 'periphrastic',
      firstWordExceptions,
      functionWords,
      stopWords,
      transitionWords,
      twoPartTransitionWords,
      syllables
    };

    // Merged into the helpers object set up by the parent constructor.
    const languageHelpers = {
      getClauses,
      getStemmer,
      fleschReadingScore
    };

    Object.assign(this.config, languageConfig);
    Object.assign(this.helpers, languageHelpers);
  }
}
|
|
@@ -1,55 +0,0 @@
|
|
|
1
|
-
/**
 * List of abbreviations, originally created for use in
 * avadaseo/src/languageProcessing/helpers/sentence/SentenceTokenizer.js.
 * The abbreviations were originally sourced from: https://github.com/Yoast/YoastSEO.js/issues/698
 *
 * IMPORTANT! For the use in the SentenceTokenizer every entry must:
 * - end in a full stop;
 * - contain more than one letter, to prevent clashes with the check for initials.
 *
 * @type {Array} The list with abbreviations.
 */
export default [
	"A.D.", "Adm.", "Adv.", "B.C.", "Br.", "Brig.", "Cmrd.", "Col.", "Cpl.", "Cpt.",
	"Dr.", "Esq.", "Fr.", "Gen.", "Gov.", "Hon.", "Jr.", "Lieut.", "Lt.", "Maj.",
	"Mr.", "Mrs.", "Ms.", "Msgr.", "Mx.", "No.", "Pfc.", "Pr.", "Prof.", "Pvt.",
	"Rep.", "Reps.", "Rev.", "Rt. Hon.", "Sen.", "Sens.", "Sgt.", "Sps.", "Sr.", "St.",
	"vs.", "i.e.", "e.g.", "viz.", "Mt.",
];
|
|
@@ -1,14 +0,0 @@
|
|
|
1
|
-
// Word groups that make up the exception list, kept separate so each category is easy to maintain.
const definiteArticles = [ "the" ];
const indefiniteArticles = [ "a", "an" ];
const numbersOneToTen = [ "one", "two", "three", "four", "five", "six", "seven", "eight", "nine", "ten" ];
const demonstrativePronouns = [ "this", "that", "these", "those" ];

/**
 * Exceptions for the sentence beginning researcher: articles, the numbers 1-10 and demonstrative pronouns.
 * @type {Array} The array filled with exceptions.
 */
export default [
	...definiteArticles,
	...indefiniteArticles,
	...numbersOneToTen,
	...demonstrativePronouns,
];
|