axyseo 2.0.0-alpha.0.0.4 → 2.0.0-alpha.0.0.5
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/package.json +5 -2
- package/.browserslistrc +0 -1
- package/.gitattributes +0 -1
- package/babel.config.js +0 -3
- package/eslint.config.mjs +0 -119
- package/src/bundledPlugins/index.js +0 -5
- package/src/bundledPlugins/previouslyUsedKeywords.js +0 -192
- package/src/config/diacritics.js +0 -106
- package/src/config/getTransliterations.js +0 -1447
- package/src/config/transliterationsWPstyle.js +0 -774
- package/src/config/wordBoundaries.js +0 -23
- package/src/config/wordBoundariesWithoutPunctuation.js +0 -9
- package/src/const/analysis.js +0 -41
- package/src/errors/invalidType.js +0 -14
- package/src/errors/missingArgument.js +0 -14
- package/src/helpers/createMeasurementElement.js +0 -40
- package/src/helpers/domManipulation.js +0 -65
- package/src/helpers/errors.js +0 -26
- package/src/helpers/factory.js +0 -219
- package/src/helpers/formatNumber.js +0 -12
- package/src/helpers/formatString.js +0 -33
- package/src/helpers/getLanguagesWithWordComplexity.js +0 -8
- package/src/helpers/getLanguagesWithWordFormSupport.js +0 -11
- package/src/helpers/getWordComplexityConfig.js +0 -20
- package/src/helpers/getWordComplexityHelper.js +0 -20
- package/src/helpers/htmlEntities.js +0 -41
- package/src/helpers/includesAny.js +0 -19
- package/src/helpers/index.js +0 -127
- package/src/helpers/shortlinker/Shortlinker.js +0 -75
- package/src/helpers/shortlinker/index.js +0 -1
- package/src/helpers/shortlinker/singleton.js +0 -68
- package/src/helpers/types.js +0 -34
- package/src/index.js +0 -60
- package/src/languageProcessing/AbstractResearcher.js +0 -366
- package/src/languageProcessing/helpers/highlighting/getMarkingsInSentence.js +0 -125
- package/src/languageProcessing/helpers/html/getFieldsToMark.js +0 -29
- package/src/languageProcessing/helpers/html/getSubheadingTexts.js +0 -47
- package/src/languageProcessing/helpers/html/getSubheadings.js +0 -95
- package/src/languageProcessing/helpers/html/html.js +0 -176
- package/src/languageProcessing/helpers/html/htmlParser.js +0 -145
- package/src/languageProcessing/helpers/html/matchParagraphs.js +0 -62
- package/src/languageProcessing/helpers/html/normalizeHTML.js +0 -16
- package/src/languageProcessing/helpers/image/getAltAttribute.js +0 -20
- package/src/languageProcessing/helpers/image/getImagesInTree.js +0 -16
- package/src/languageProcessing/helpers/image/imageInText.js +0 -19
- package/src/languageProcessing/helpers/index.js +0 -12
- package/src/languageProcessing/helpers/language/getLanguage.js +0 -9
- package/src/languageProcessing/helpers/link/checkNofollow.js +0 -38
- package/src/languageProcessing/helpers/link/getAnchorsFromText.js +0 -32
- package/src/languageProcessing/helpers/link/getLinkType.js +0 -32
- package/src/languageProcessing/helpers/match/findKeywordFormsInString.js +0 -101
- package/src/languageProcessing/helpers/match/isDoubleQuoted.js +0 -13
- package/src/languageProcessing/helpers/match/matchTextWithArray.js +0 -36
- package/src/languageProcessing/helpers/match/matchTextWithTransliteration.js +0 -58
- package/src/languageProcessing/helpers/match/matchTextWithWord.js +0 -45
- package/src/languageProcessing/helpers/match/matchWordFormsWithSentence.js +0 -164
- package/src/languageProcessing/helpers/match/processExactMatchRequest.js +0 -20
- package/src/languageProcessing/helpers/morphology/baseStemmer.js +0 -11
- package/src/languageProcessing/helpers/morphology/buildFormRule.js +0 -19
- package/src/languageProcessing/helpers/morphology/buildTopicStems.js +0 -169
- package/src/languageProcessing/helpers/morphology/createRulesFromArrays.js +0 -45
- package/src/languageProcessing/helpers/morphology/exceptionListHelpers.js +0 -65
- package/src/languageProcessing/helpers/morphology/findMatchingEndingInArray.js +0 -24
- package/src/languageProcessing/helpers/morphology/flattenSortLength.js +0 -14
- package/src/languageProcessing/helpers/morphology/getAllWordsFromPaper.js +0 -39
- package/src/languageProcessing/helpers/morphology/regexHelpers.js +0 -44
- package/src/languageProcessing/helpers/morphology/stemHelpers.js +0 -38
- package/src/languageProcessing/helpers/morphology/stemPrefixedFunctionWords.js +0 -31
- package/src/languageProcessing/helpers/passiveVoice/periphrastic/directPrecedenceException.js +0 -36
- package/src/languageProcessing/helpers/passiveVoice/periphrastic/freeAuxiliaryParticipleOrder/getClausesSplitOnStopWords.js +0 -113
- package/src/languageProcessing/helpers/passiveVoice/periphrastic/freeAuxiliaryParticipleOrder/nonDirectParticiplePrecedenceException.js +0 -45
- package/src/languageProcessing/helpers/passiveVoice/periphrastic/getClauses.js +0 -231
- package/src/languageProcessing/helpers/passiveVoice/periphrastic/getIndicesWithRegex.js +0 -20
- package/src/languageProcessing/helpers/passiveVoice/periphrastic/matchRegularParticiples.js +0 -23
- package/src/languageProcessing/helpers/passiveVoice/periphrastic/precedenceException.js +0 -40
- package/src/languageProcessing/helpers/prominentWords/determineProminentWords.js +0 -238
- package/src/languageProcessing/helpers/regex/createRegexFromArray.js +0 -35
- package/src/languageProcessing/helpers/regex/createRegexFromDoubleArray.js +0 -34
- package/src/languageProcessing/helpers/regex/createWordRegex.js +0 -30
- package/src/languageProcessing/helpers/regex/matchStringWithRegex.js +0 -19
- package/src/languageProcessing/helpers/regex/searchAndReplaceWithOneRegex.js +0 -14
- package/src/languageProcessing/helpers/sanitize/doubleQuotes.js +0 -12
- package/src/languageProcessing/helpers/sanitize/filterShortcodesFromTree.js +0 -131
- package/src/languageProcessing/helpers/sanitize/mergeListItems.js +0 -24
- package/src/languageProcessing/helpers/sanitize/parseSynonyms.js +0 -20
- package/src/languageProcessing/helpers/sanitize/quotes.js +0 -46
- package/src/languageProcessing/helpers/sanitize/removeEmailAddresses.js +0 -12
- package/src/languageProcessing/helpers/sanitize/removePunctuation.js +0 -64
- package/src/languageProcessing/helpers/sanitize/removePunctuationExceptQuotes.js +0 -18
- package/src/languageProcessing/helpers/sanitize/removeSentenceTerminators.js +0 -13
- package/src/languageProcessing/helpers/sanitize/removeURLs.js +0 -13
- package/src/languageProcessing/helpers/sanitize/sanitizeLineBreakTag.js +0 -11
- package/src/languageProcessing/helpers/sanitize/sanitizeString.js +0 -18
- package/src/languageProcessing/helpers/sanitize/stripHTMLTags.js +0 -57
- package/src/languageProcessing/helpers/sanitize/stripNonTextTags.js +0 -15
- package/src/languageProcessing/helpers/sanitize/stripNumbers.js +0 -21
- package/src/languageProcessing/helpers/sanitize/stripSpaces.js +0 -23
- package/src/languageProcessing/helpers/sanitize/stripWordBoundaries.js +0 -65
- package/src/languageProcessing/helpers/sanitize/unifyWhitespace.js +0 -61
- package/src/languageProcessing/helpers/sentence/SentenceTokenizer.js +0 -640
- package/src/languageProcessing/helpers/sentence/countSentences.js +0 -20
- package/src/languageProcessing/helpers/sentence/getSentences.js +0 -65
- package/src/languageProcessing/helpers/sentence/getSentencesFromTree.js +0 -55
- package/src/languageProcessing/helpers/sentence/memoizedSentenceTokenizer.js +0 -28
- package/src/languageProcessing/helpers/sentence/sentencesLength.js +0 -31
- package/src/languageProcessing/helpers/syllables/DeviationFragment.js +0 -112
- package/src/languageProcessing/helpers/syllables/countSyllables.js +0 -182
- package/src/languageProcessing/helpers/syllables/syllableCountIterator.js +0 -56
- package/src/languageProcessing/helpers/syllables/syllableCountStep.js +0 -68
- package/src/languageProcessing/helpers/transform/transformWordsWithHyphens.js +0 -17
- package/src/languageProcessing/helpers/transliterate/replaceDiacritics.js +0 -22
- package/src/languageProcessing/helpers/transliterate/specialCharacterMappings.js +0 -214
- package/src/languageProcessing/helpers/transliterate/transliterate.js +0 -20
- package/src/languageProcessing/helpers/transliterate/transliterateWPstyle.js +0 -21
- package/src/languageProcessing/helpers/url/parseSlug.js +0 -10
- package/src/languageProcessing/helpers/url/url.js +0 -172
- package/src/languageProcessing/helpers/word/addWordboundary.js +0 -37
- package/src/languageProcessing/helpers/word/areWordsInSentence.js +0 -16
- package/src/languageProcessing/helpers/word/countMetaDescriptionLength.js +0 -18
- package/src/languageProcessing/helpers/word/countWords.js +0 -14
- package/src/languageProcessing/helpers/word/createPunctuationTokens.js +0 -42
- package/src/languageProcessing/helpers/word/filterWordsFromArray.js +0 -15
- package/src/languageProcessing/helpers/word/followsIndex.js +0 -25
- package/src/languageProcessing/helpers/word/getAllWordsFromTree.js +0 -23
- package/src/languageProcessing/helpers/word/getWords.js +0 -43
- package/src/languageProcessing/helpers/word/includesIndex.js +0 -30
- package/src/languageProcessing/helpers/word/indices.js +0 -146
- package/src/languageProcessing/helpers/word/markWordsInSentences.js +0 -173
- package/src/languageProcessing/helpers/word/matchWordInSentence.js +0 -61
- package/src/languageProcessing/helpers/word/splitIntoTokens.js +0 -46
- package/src/languageProcessing/index.js +0 -91
- package/src/languageProcessing/languages/_default/Researcher.js +0 -34
- package/src/languageProcessing/languages/_default/helpers/getStemmer.js +0 -11
- package/src/languageProcessing/languages/ar/Researcher.js +0 -46
- package/src/languageProcessing/languages/ar/config/firstWordExceptions.js +0 -14
- package/src/languageProcessing/languages/ar/config/functionWords.js +0 -329
- package/src/languageProcessing/languages/ar/config/internal/passiveVerbsWithLongVowel.js +0 -570
- package/src/languageProcessing/languages/ar/config/prefixedFunctionWords.js +0 -5
- package/src/languageProcessing/languages/ar/config/transitionWords.js +0 -19
- package/src/languageProcessing/languages/ar/config/twoPartTransitionWords.js +0 -7
- package/src/languageProcessing/languages/ar/helpers/createBasicWordForms.js +0 -32
- package/src/languageProcessing/languages/ar/helpers/getStemmer.js +0 -22
- package/src/languageProcessing/languages/ar/helpers/internal/stem.js +0 -632
- package/src/languageProcessing/languages/ar/helpers/isPassiveSentence.js +0 -33
- package/src/languageProcessing/languages/ca/Researcher.js +0 -43
- package/src/languageProcessing/languages/ca/config/sentenceLength.js +0 -3
- package/src/languageProcessing/languages/ca/config/transitionWords.js +0 -31
- package/src/languageProcessing/languages/ca/config/twoPartTransitionWords.js +0 -7
- package/src/languageProcessing/languages/ca/helpers/getStemmer.js +0 -11
- package/src/languageProcessing/languages/cs/Researcher.js +0 -44
- package/src/languageProcessing/languages/cs/config/firstWordExceptions.js +0 -15
- package/src/languageProcessing/languages/cs/config/functionWords.js +0 -121
- package/src/languageProcessing/languages/cs/config/internal/passiveVoiceAuxiliaries.js +0 -38
- package/src/languageProcessing/languages/cs/config/internal/passiveVoiceEndings.js +0 -54
- package/src/languageProcessing/languages/cs/config/stopWords.js +0 -42
- package/src/languageProcessing/languages/cs/config/transitionWords.js +0 -26
- package/src/languageProcessing/languages/cs/config/twoPartTransitionWords.js +0 -8
- package/src/languageProcessing/languages/cs/helpers/getClauses.js +0 -26
- package/src/languageProcessing/languages/cs/helpers/getStemmer.js +0 -22
- package/src/languageProcessing/languages/cs/helpers/internal/getParticiples.js +0 -16
- package/src/languageProcessing/languages/cs/helpers/internal/stem.js +0 -499
- package/src/languageProcessing/languages/cs/values/Clause.js +0 -34
- package/src/languageProcessing/languages/de/Researcher.js +0 -52
- package/src/languageProcessing/languages/de/config/firstWordExceptions.js +0 -17
- package/src/languageProcessing/languages/de/config/functionWords.js +0 -303
- package/src/languageProcessing/languages/de/config/internal/exceptionsParticiplesActive.js +0 -2231
- package/src/languageProcessing/languages/de/config/internal/passiveVoiceAuxiliaries.js +0 -96
- package/src/languageProcessing/languages/de/config/internal/passiveVoiceIrregulars.js +0 -368
- package/src/languageProcessing/languages/de/config/internal/passiveVoiceRegex.js +0 -72
- package/src/languageProcessing/languages/de/config/keyphraseLength.js +0 -11
- package/src/languageProcessing/languages/de/config/stopWords.js +0 -67
- package/src/languageProcessing/languages/de/config/syllables.json +0 -460
- package/src/languageProcessing/languages/de/config/transitionWords.js +0 -31
- package/src/languageProcessing/languages/de/config/twoPartTransitionWords.js +0 -12
- package/src/languageProcessing/languages/de/config/wordComplexity.js +0 -4
- package/src/languageProcessing/languages/de/helpers/calculateFleschReadingScore.js +0 -18
- package/src/languageProcessing/languages/de/helpers/checkIfWordIsComplex.js +0 -40
- package/src/languageProcessing/languages/de/helpers/checkIfWordIsFunction.js +0 -15
- package/src/languageProcessing/languages/de/helpers/getClauses.js +0 -25
- package/src/languageProcessing/languages/de/helpers/getStemmer.js +0 -22
- package/src/languageProcessing/languages/de/helpers/internal/SentenceTokenizer.js +0 -31
- package/src/languageProcessing/languages/de/helpers/internal/detectAndStemRegularParticiple.js +0 -128
- package/src/languageProcessing/languages/de/helpers/internal/determineStem.js +0 -128
- package/src/languageProcessing/languages/de/helpers/internal/getParticiples.js +0 -40
- package/src/languageProcessing/languages/de/helpers/internal/stem.js +0 -215
- package/src/languageProcessing/languages/de/helpers/memoizedSentenceTokenizer.js +0 -28
- package/src/languageProcessing/languages/de/values/Clause.js +0 -85
- package/src/languageProcessing/languages/el/Researcher.js +0 -46
- package/src/languageProcessing/languages/el/config/firstWordExceptions.js +0 -47
- package/src/languageProcessing/languages/el/config/functionWords.js +0 -116
- package/src/languageProcessing/languages/el/config/internal/auxiliaries.js +0 -19
- package/src/languageProcessing/languages/el/config/internal/morphologicalPassiveSuffixes.js +0 -87
- package/src/languageProcessing/languages/el/config/internal/nonPassiveVerbStems.js +0 -138
- package/src/languageProcessing/languages/el/config/stopWords.js +0 -854
- package/src/languageProcessing/languages/el/config/transitionWords.js +0 -26
- package/src/languageProcessing/languages/el/config/twoPartTransitionWords.js +0 -10
- package/src/languageProcessing/languages/el/helpers/getClauses.js +0 -25
- package/src/languageProcessing/languages/el/helpers/getStemmer.js +0 -21
- package/src/languageProcessing/languages/el/helpers/internal/getParticiples.js +0 -20
- package/src/languageProcessing/languages/el/helpers/internal/stem.js +0 -368
- package/src/languageProcessing/languages/el/helpers/isPassiveSentence.js +0 -38
- package/src/languageProcessing/languages/el/values/Clause.js +0 -37
- package/src/languageProcessing/languages/en/Researcher.js +0 -46
- package/src/languageProcessing/languages/en/config/abbreviations.js +0 -55
- package/src/languageProcessing/languages/en/config/firstWordExceptions.js +0 -14
- package/src/languageProcessing/languages/en/config/functionWords.js +0 -186
- package/src/languageProcessing/languages/en/config/internal/passiveVoiceAuxiliaries.js +0 -44
- package/src/languageProcessing/languages/en/config/internal/passiveVoiceIrregulars.js +0 -354
- package/src/languageProcessing/languages/en/config/internal/passiveVoiceNonVerbEndingEd.js +0 -3047
- package/src/languageProcessing/languages/en/config/regularParticiplesRegex.js +0 -5
- package/src/languageProcessing/languages/en/config/stopWords.js +0 -52
- package/src/languageProcessing/languages/en/config/syllables.json +0 -86
- package/src/languageProcessing/languages/en/config/transitionWords.js +0 -48
- package/src/languageProcessing/languages/en/config/twoPartTransitionWords.js +0 -7
- package/src/languageProcessing/languages/en/config/wordComplexity.js +0 -5
- package/src/languageProcessing/languages/en/helpers/calculateFleschReadingScore.js +0 -18
- package/src/languageProcessing/languages/en/helpers/checkIfWordIsComplex.js +0 -43
- package/src/languageProcessing/languages/en/helpers/getClauses.js +0 -49
- package/src/languageProcessing/languages/en/helpers/getStemmer.js +0 -22
- package/src/languageProcessing/languages/en/helpers/internal/determineStem.js +0 -178
- package/src/languageProcessing/languages/en/helpers/internal/getAdjectiveStem.js +0 -162
- package/src/languageProcessing/languages/en/helpers/internal/getParticiples.js +0 -25
- package/src/languageProcessing/languages/en/helpers/internal/getVerbStem.js +0 -237
- package/src/languageProcessing/languages/en/values/Clause.js +0 -68
- package/src/languageProcessing/languages/es/Researcher.js +0 -48
- package/src/languageProcessing/languages/es/config/firstWordExceptions.js +0 -16
- package/src/languageProcessing/languages/es/config/functionWords.js +0 -321
- package/src/languageProcessing/languages/es/config/internal/passiveVoiceAuxiliaries.js +0 -60
- package/src/languageProcessing/languages/es/config/internal/passiveVoiceParticiples.js +0 -7327
- package/src/languageProcessing/languages/es/config/sentenceLength.js +0 -3
- package/src/languageProcessing/languages/es/config/stopWords.js +0 -33
- package/src/languageProcessing/languages/es/config/syllables.json +0 -176
- package/src/languageProcessing/languages/es/config/transitionWords.js +0 -40
- package/src/languageProcessing/languages/es/config/twoPartTransitionWords.js +0 -10
- package/src/languageProcessing/languages/es/config/wordComplexity.js +0 -4
- package/src/languageProcessing/languages/es/helpers/calculateFleschReadingScore.js +0 -18
- package/src/languageProcessing/languages/es/helpers/checkIfWordIsComplex.js +0 -56
- package/src/languageProcessing/languages/es/helpers/getClauses.js +0 -29
- package/src/languageProcessing/languages/es/helpers/getStemmer.js +0 -22
- package/src/languageProcessing/languages/es/helpers/internal/checkVerbStemModifications.js +0 -41
- package/src/languageProcessing/languages/es/helpers/internal/getParticiples.js +0 -35
- package/src/languageProcessing/languages/es/helpers/internal/stem.js +0 -793
- package/src/languageProcessing/languages/es/values/Clause.js +0 -47
- package/src/languageProcessing/languages/fa/Researcher.js +0 -47
- package/src/languageProcessing/languages/fa/config/firstWordExceptions.js +0 -12
- package/src/languageProcessing/languages/fa/config/functionWords.js +0 -122
- package/src/languageProcessing/languages/fa/config/internal/participles.js +0 -1429
- package/src/languageProcessing/languages/fa/config/sentenceLength.js +0 -3
- package/src/languageProcessing/languages/fa/config/transitionWords.js +0 -20
- package/src/languageProcessing/languages/fa/config/twoPartTransitionWords.js +0 -9
- package/src/languageProcessing/languages/fa/helpers/createBasicWordForms.js +0 -97
- package/src/languageProcessing/languages/fa/helpers/getStemmer.js +0 -13
- package/src/languageProcessing/languages/fa/helpers/isPassiveSentence.js +0 -14
- package/src/languageProcessing/languages/fr/Researcher.js +0 -46
- package/src/languageProcessing/languages/fr/config/firstWordExceptions.js +0 -16
- package/src/languageProcessing/languages/fr/config/functionWords.js +0 -281
- package/src/languageProcessing/languages/fr/config/internal/exceptionsParticiplesActive.js +0 -1510
- package/src/languageProcessing/languages/fr/config/internal/passiveVoiceAuxiliaries.js +0 -108
- package/src/languageProcessing/languages/fr/config/internal/passiveVoiceIrregulars.js +0 -565
- package/src/languageProcessing/languages/fr/config/stopWords.js +0 -119
- package/src/languageProcessing/languages/fr/config/syllables.json +0 -1426
- package/src/languageProcessing/languages/fr/config/transitionWords.js +0 -59
- package/src/languageProcessing/languages/fr/config/twoPartTransitionWords.js +0 -15
- package/src/languageProcessing/languages/fr/config/wordComplexity.js +0 -4
- package/src/languageProcessing/languages/fr/helpers/calculateFleschReadingScore.js +0 -18
- package/src/languageProcessing/languages/fr/helpers/checkIfWordIsComplex.js +0 -67
- package/src/languageProcessing/languages/fr/helpers/getClauses.js +0 -34
- package/src/languageProcessing/languages/fr/helpers/getStemmer.js +0 -22
- package/src/languageProcessing/languages/fr/helpers/internal/getParticiples.js +0 -72
- package/src/languageProcessing/languages/fr/helpers/internal/stem.js +0 -633
- package/src/languageProcessing/languages/fr/values/Clause.js +0 -96
- package/src/languageProcessing/languages/he/Researcher.js +0 -50
- package/src/languageProcessing/languages/he/config/firstWordExceptions.js +0 -13
- package/src/languageProcessing/languages/he/config/functionWords.js +0 -564
- package/src/languageProcessing/languages/he/config/internal/regularRootsHufal.js +0 -186
- package/src/languageProcessing/languages/he/config/internal/regularRootsNifal.js +0 -195
- package/src/languageProcessing/languages/he/config/internal/regularRootsPual.js +0 -168
- package/src/languageProcessing/languages/he/config/passiveVoice/regularRootsHufal.js +0 -188
- package/src/languageProcessing/languages/he/config/passiveVoice/regularRootsNifal.js +0 -197
- package/src/languageProcessing/languages/he/config/passiveVoice/regularRootsPual.js +0 -170
- package/src/languageProcessing/languages/he/config/prefixedFunctionWords.js +0 -2
- package/src/languageProcessing/languages/he/config/sentenceLength.js +0 -3
- package/src/languageProcessing/languages/he/config/transitionWords.js +0 -28
- package/src/languageProcessing/languages/he/config/twoPartTransitionWords.js +0 -8
- package/src/languageProcessing/languages/he/helpers/createBasicWordForms.js +0 -33
- package/src/languageProcessing/languages/he/helpers/getStemmer.js +0 -22
- package/src/languageProcessing/languages/he/helpers/internal/stem.js +0 -52
- package/src/languageProcessing/languages/he/helpers/isPassiveSentence.js +0 -96
- package/src/languageProcessing/languages/he/helpers/stem.js +0 -52
- package/src/languageProcessing/languages/hu/Researcher.js +0 -48
- package/src/languageProcessing/languages/hu/config/firstWordExceptions.js +0 -31
- package/src/languageProcessing/languages/hu/config/functionWords.js +0 -284
- package/src/languageProcessing/languages/hu/config/internal/auxiliaries.js +0 -97
- package/src/languageProcessing/languages/hu/config/internal/morphologicalPassiveAffixes.js +0 -125
- package/src/languageProcessing/languages/hu/config/internal/nonPassivesInVaAndVe.js +0 -265
- package/src/languageProcessing/languages/hu/config/internal/odikVerbs.js +0 -273
- package/src/languageProcessing/languages/hu/config/internal/participles.js +0 -412
- package/src/languageProcessing/languages/hu/config/stopWords.js +0 -213
- package/src/languageProcessing/languages/hu/config/transitionWords.js +0 -42
- package/src/languageProcessing/languages/hu/config/twoPartTransitionWords.js +0 -34
- package/src/languageProcessing/languages/hu/helpers/getClauses.js +0 -25
- package/src/languageProcessing/languages/hu/helpers/getStemmer.js +0 -22
- package/src/languageProcessing/languages/hu/helpers/internal/getParticiples.js +0 -21
- package/src/languageProcessing/languages/hu/helpers/internal/stem.js +0 -389
- package/src/languageProcessing/languages/hu/helpers/isPassiveSentence.js +0 -54
- package/src/languageProcessing/languages/hu/values/Clause.js +0 -41
- package/src/languageProcessing/languages/id/Researcher.js +0 -46
- package/src/languageProcessing/languages/id/config/firstWordExceptions.js +0 -13
- package/src/languageProcessing/languages/id/config/functionWords.js +0 -202
- package/src/languageProcessing/languages/id/config/internal/nonPassiveVerbsStartingDi.js +0 -215
- package/src/languageProcessing/languages/id/config/transitionWords.js +0 -62
- package/src/languageProcessing/languages/id/config/twoPartTransitionWords.js +0 -13
- package/src/languageProcessing/languages/id/helpers/getStemmer.js +0 -22
- package/src/languageProcessing/languages/id/helpers/internal/stem.js +0 -462
- package/src/languageProcessing/languages/id/helpers/internal/stemHelpers.js +0 -78
- package/src/languageProcessing/languages/id/helpers/isPassiveSentence.js +0 -39
- package/src/languageProcessing/languages/id/helpers/splitIntoTokensCustom.js +0 -47
- package/src/languageProcessing/languages/it/Researcher.js +0 -48
- package/src/languageProcessing/languages/it/config/firstWordExceptions.js +0 -17
- package/src/languageProcessing/languages/it/config/functionWords.js +0 -277
- package/src/languageProcessing/languages/it/config/internal/passiveVoiceAuxiliaries.js +0 -98
- package/src/languageProcessing/languages/it/config/internal/passiveVoiceParticiples.js +0 -7197
- package/src/languageProcessing/languages/it/config/sentenceLength.js +0 -3
- package/src/languageProcessing/languages/it/config/stopWords.js +0 -57
- package/src/languageProcessing/languages/it/config/syllables.json +0 -573
- package/src/languageProcessing/languages/it/config/transitionWords.js +0 -104
- package/src/languageProcessing/languages/it/config/twoPartTransitionWords.js +0 -9
- package/src/languageProcessing/languages/it/helpers/calculateFleschReadingScore.js +0 -15
- package/src/languageProcessing/languages/it/helpers/getClauses.js +0 -32
- package/src/languageProcessing/languages/it/helpers/getStemmer.js +0 -22
- package/src/languageProcessing/languages/it/helpers/internal/getParticiples.js +0 -34
- package/src/languageProcessing/languages/it/helpers/internal/stem.js +0 -436
- package/src/languageProcessing/languages/it/values/Clause.js +0 -47
- package/src/languageProcessing/languages/ja/Researcher.js +0 -86
- package/src/languageProcessing/languages/ja/config/assessmentApplicabilityCharacterCount.js +0 -4
- package/src/languageProcessing/languages/ja/config/firstWordExceptions.js +0 -8
- package/src/languageProcessing/languages/ja/config/functionWords.js +0 -563
- package/src/languageProcessing/languages/ja/config/keyphraseLength.js +0 -16
- package/src/languageProcessing/languages/ja/config/metaDescriptionLength.js +0 -4
- package/src/languageProcessing/languages/ja/config/paragraphLength.js +0 -10
- package/src/languageProcessing/languages/ja/config/sentenceLength.js +0 -4
- package/src/languageProcessing/languages/ja/config/subheadingsTooLong.js +0 -18
- package/src/languageProcessing/languages/ja/config/textLength.js +0 -47
- package/src/languageProcessing/languages/ja/config/topicLength.js +0 -5
- package/src/languageProcessing/languages/ja/config/transitionWords.js +0 -354
- package/src/languageProcessing/languages/ja/customResearches/findKeyphraseInSEOTitle.js +0 -98
- package/src/languageProcessing/languages/ja/customResearches/getKeyphraseLength.js +0 -19
- package/src/languageProcessing/languages/ja/customResearches/getWordForms.js +0 -50
- package/src/languageProcessing/languages/ja/customResearches/textLength.js +0 -24
- package/src/languageProcessing/languages/ja/helpers/countCharacters.js +0 -19
- package/src/languageProcessing/languages/ja/helpers/customGetStemmer.js +0 -21
- package/src/languageProcessing/languages/ja/helpers/getContentWords.js +0 -21
- package/src/languageProcessing/languages/ja/helpers/getWords.js +0 -31
- package/src/languageProcessing/languages/ja/helpers/internal/SentenceTokenizer.js +0 -102
- package/src/languageProcessing/languages/ja/helpers/internal/createWordForms.js +0 -68
- package/src/languageProcessing/languages/ja/helpers/internal/determineStem.js +0 -17
- package/src/languageProcessing/languages/ja/helpers/matchTextWithWord.js +0 -53
- package/src/languageProcessing/languages/ja/helpers/matchTransitionWords.js +0 -25
- package/src/languageProcessing/languages/ja/helpers/memoizedSentenceTokenizer.js +0 -28
- package/src/languageProcessing/languages/ja/helpers/splitIntoTokensCustom.js +0 -20
- package/src/languageProcessing/languages/ja/helpers/wordsCharacterCount.js +0 -13
- package/src/languageProcessing/languages/nb/Researcher.js +0 -45
- package/src/languageProcessing/languages/nb/config/firstWordExceptions.js +0 -12
- package/src/languageProcessing/languages/nb/config/functionWords.js +0 -106
- package/src/languageProcessing/languages/nb/config/internal/participles.js +0 -3127
- package/src/languageProcessing/languages/nb/config/internal/passiveVoiceAuxiliaries.js +0 -15
- package/src/languageProcessing/languages/nb/config/stopWords.js +0 -39
- package/src/languageProcessing/languages/nb/config/transitionWords.js +0 -21
- package/src/languageProcessing/languages/nb/config/twoPartTransitionWords.js +0 -10
- package/src/languageProcessing/languages/nb/helpers/getClauses.js +0 -28
- package/src/languageProcessing/languages/nb/helpers/getStemmer.js +0 -22
- package/src/languageProcessing/languages/nb/helpers/internal/getParticiples.js +0 -24
- package/src/languageProcessing/languages/nb/helpers/internal/stem.js +0 -133
- package/src/languageProcessing/languages/nb/values/Clause.js +0 -43
- package/src/languageProcessing/languages/nl/Researcher.js +0 -48
- package/src/languageProcessing/languages/nl/config/firstWordExceptions.js +0 -15
- package/src/languageProcessing/languages/nl/config/functionWords.js +0 -233
- package/src/languageProcessing/languages/nl/config/internal/nonParticiples.js +0 -2515
- package/src/languageProcessing/languages/nl/config/internal/passiveVoiceAuxiliaries.js +0 -13
- package/src/languageProcessing/languages/nl/config/internal/passiveVoiceIrregulars.js +0 -474
- package/src/languageProcessing/languages/nl/config/keyphraseLength.js +0 -10
- package/src/languageProcessing/languages/nl/config/stopWords.js +0 -35
- package/src/languageProcessing/languages/nl/config/syllables.json +0 -343
- package/src/languageProcessing/languages/nl/config/transitionWords.js +0 -22
- package/src/languageProcessing/languages/nl/config/twoPartTransitionWords.js +0 -8
- package/src/languageProcessing/languages/nl/helpers/calculateFleschReadingScore.js +0 -15
- package/src/languageProcessing/languages/nl/helpers/getClauses.js +0 -25
- package/src/languageProcessing/languages/nl/helpers/getStemmer.js +0 -22
- package/src/languageProcessing/languages/nl/helpers/internal/checkExceptionsWithFullForms.js +0 -128
- package/src/languageProcessing/languages/nl/helpers/internal/detectAndStemRegularParticiple.js +0 -324
- package/src/languageProcessing/languages/nl/helpers/internal/detectAndStemSuffixes.js +0 -164
- package/src/languageProcessing/languages/nl/helpers/internal/determineStem.js +0 -133
- package/src/languageProcessing/languages/nl/helpers/internal/getParticiples.js +0 -25
- package/src/languageProcessing/languages/nl/helpers/internal/getStemWordsWithTAndDEnding.js +0 -183
- package/src/languageProcessing/languages/nl/helpers/internal/stem.js +0 -146
- package/src/languageProcessing/languages/nl/helpers/internal/stemModificationHelpers.js +0 -109
- package/src/languageProcessing/languages/nl/helpers/internal/stemTOrDFromEndOfWord.js +0 -65
- package/src/languageProcessing/languages/nl/values/Clause.js +0 -62
- package/src/languageProcessing/languages/pl/Researcher.js +0 -47
- package/src/languageProcessing/languages/pl/config/firstWordExceptions.js +0 -12
- package/src/languageProcessing/languages/pl/config/functionWords.js +0 -421
- package/src/languageProcessing/languages/pl/config/internal/auxiliaries.js +0 -85
- package/src/languageProcessing/languages/pl/config/internal/participles.js +0 -26433
- package/src/languageProcessing/languages/pl/config/sentenceLength.js +0 -10
- package/src/languageProcessing/languages/pl/config/stopWords.js +0 -36
- package/src/languageProcessing/languages/pl/config/transitionWords.js +0 -42
- package/src/languageProcessing/languages/pl/config/twoPartTransitionWords.js +0 -8
- package/src/languageProcessing/languages/pl/helpers/getClauses.js +0 -25
- package/src/languageProcessing/languages/pl/helpers/getStemmer.js +0 -22
- package/src/languageProcessing/languages/pl/helpers/internal/getParticiples.js +0 -18
- package/src/languageProcessing/languages/pl/helpers/internal/stem.js +0 -161
- package/src/languageProcessing/languages/pl/values/Clause.js +0 -53
- package/src/languageProcessing/languages/pt/Researcher.js +0 -48
- package/src/languageProcessing/languages/pt/config/firstWordExceptions.js +0 -15
- package/src/languageProcessing/languages/pt/config/functionWords.js +0 -226
- package/src/languageProcessing/languages/pt/config/internal/passiveVoiceAuxiliaries.js +0 -66
- package/src/languageProcessing/languages/pt/config/internal/passiveVoiceParticiples.js +0 -4088
- package/src/languageProcessing/languages/pt/config/sentenceLength.js +0 -3
- package/src/languageProcessing/languages/pt/config/stopWords.js +0 -50
- package/src/languageProcessing/languages/pt/config/syllables.json +0 -38
- package/src/languageProcessing/languages/pt/config/transitionWords.js +0 -34
- package/src/languageProcessing/languages/pt/config/twoPartTransitionWords.js +0 -9
- package/src/languageProcessing/languages/pt/helpers/calculateFleschReadingScore.js +0 -15
- package/src/languageProcessing/languages/pt/helpers/getClauses.js +0 -29
- package/src/languageProcessing/languages/pt/helpers/getStemmer.js +0 -22
- package/src/languageProcessing/languages/pt/helpers/internal/getParticiples.js +0 -35
- package/src/languageProcessing/languages/pt/helpers/internal/stem.js +0 -319
- package/src/languageProcessing/languages/pt/values/Clause.js +0 -43
- package/src/languageProcessing/languages/ru/Researcher.js +0 -48
- package/src/languageProcessing/languages/ru/config/firstWordExceptions.js +0 -14
- package/src/languageProcessing/languages/ru/config/fleschReadingEaseScores.js +0 -20
- package/src/languageProcessing/languages/ru/config/functionWords.js +0 -519
- package/src/languageProcessing/languages/ru/config/internal/participlesShortenedList.js +0 -2914
- package/src/languageProcessing/languages/ru/config/internal/passiveVoiceParticiples.js +0 -6295
- package/src/languageProcessing/languages/ru/config/sentenceLength.js +0 -3
- package/src/languageProcessing/languages/ru/config/syllables.json +0 -19
- package/src/languageProcessing/languages/ru/config/transitionWords.js +0 -62
- package/src/languageProcessing/languages/ru/config/twoPartTransitionWords.js +0 -14
- package/src/languageProcessing/languages/ru/helpers/calculateFleschReadingScore.js +0 -16
- package/src/languageProcessing/languages/ru/helpers/getStemmer.js +0 -22
- package/src/languageProcessing/languages/ru/helpers/internal/stem.js +0 -288
- package/src/languageProcessing/languages/ru/helpers/isPassiveSentence.js +0 -14
- package/src/languageProcessing/languages/sk/Researcher.js +0 -46
- package/src/languageProcessing/languages/sk/config/firstWordExceptions.js +0 -14
- package/src/languageProcessing/languages/sk/config/functionWords.js +0 -855
- package/src/languageProcessing/languages/sk/config/internal/nonPassives.js +0 -1074
- package/src/languageProcessing/languages/sk/config/internal/passiveVoiceAuxiliaries.js +0 -22
- package/src/languageProcessing/languages/sk/config/stopWords.js +0 -34
- package/src/languageProcessing/languages/sk/config/transitionWords.js +0 -23
- package/src/languageProcessing/languages/sk/config/twoPartTransitionWords.js +0 -10
- package/src/languageProcessing/languages/sk/helpers/getClauses.js +0 -26
- package/src/languageProcessing/languages/sk/helpers/getStemmer.js +0 -22
- package/src/languageProcessing/languages/sk/helpers/internal/getParticiples.js +0 -16
- package/src/languageProcessing/languages/sk/helpers/internal/stem.js +0 -319
- package/src/languageProcessing/languages/sk/values/Clause.js +0 -39
- package/src/languageProcessing/languages/sv/Researcher.js +0 -45
- package/src/languageProcessing/languages/sv/config/firstWordExceptions.js +0 -15
- package/src/languageProcessing/languages/sv/config/functionWords.js +0 -176
- package/src/languageProcessing/languages/sv/config/internal/passiveVerbs.js +0 -10400
- package/src/languageProcessing/languages/sv/config/keyphraseLength.js +0 -11
- package/src/languageProcessing/languages/sv/config/transitionWords.js +0 -35
- package/src/languageProcessing/languages/sv/config/twoPartTransitionWords.js +0 -8
- package/src/languageProcessing/languages/sv/helpers/getStemmer.js +0 -22
- package/src/languageProcessing/languages/sv/helpers/internal/stem.js +0 -152
- package/src/languageProcessing/languages/sv/helpers/isPassiveSentence.js +0 -14
- package/src/languageProcessing/languages/tr/Researcher.js +0 -44
- package/src/languageProcessing/languages/tr/config/firstWordExceptions.js +0 -13
- package/src/languageProcessing/languages/tr/config/functionWords.js +0 -116
- package/src/languageProcessing/languages/tr/config/internal/nonPassiveExceptions.js +0 -574
- package/src/languageProcessing/languages/tr/config/internal/passiveEndings.js +0 -151
- package/src/languageProcessing/languages/tr/config/sentenceLength.js +0 -7
- package/src/languageProcessing/languages/tr/config/transitionWords.js +0 -42
- package/src/languageProcessing/languages/tr/config/twoPartTransitionWords.js +0 -7
- package/src/languageProcessing/languages/tr/helpers/getStemmer.js +0 -22
- package/src/languageProcessing/languages/tr/helpers/internal/stem.js +0 -20
- package/src/languageProcessing/languages/tr/helpers/isPassiveSentence.js +0 -43
- package/src/languageProcessing/researches/altTagCount.js +0 -70
- package/src/languageProcessing/researches/countSentencesFromText.js +0 -19
- package/src/languageProcessing/researches/findKeyphraseInSEOTitle.js +0 -257
- package/src/languageProcessing/researches/findKeywordInFirstParagraph.js +0 -86
- package/src/languageProcessing/researches/findTransitionWords.js +0 -123
- package/src/languageProcessing/researches/functionWordsInKeyphrase.js +0 -44
- package/src/languageProcessing/researches/getAnchorsWithKeyphrase.js +0 -227
- package/src/languageProcessing/researches/getFleschReadingScore.js +0 -150
- package/src/languageProcessing/researches/getKeywordDensity.js +0 -44
- package/src/languageProcessing/researches/getLinkStatistics.js +0 -54
- package/src/languageProcessing/researches/getLinks.js +0 -18
- package/src/languageProcessing/researches/getLongCenterAlignedTexts.js +0 -37
- package/src/languageProcessing/researches/getParagraphLength.js +0 -44
- package/src/languageProcessing/researches/getParagraphs.js +0 -18
- package/src/languageProcessing/researches/getPassiveVoiceResult.js +0 -129
- package/src/languageProcessing/researches/getProminentWordsForInsights.js +0 -48
- package/src/languageProcessing/researches/getProminentWordsForInternalLinking.js +0 -119
- package/src/languageProcessing/researches/getSentenceBeginnings.js +0 -124
- package/src/languageProcessing/researches/getSubheadingTextLengths.js +0 -59
- package/src/languageProcessing/researches/getWordForms.js +0 -204
- package/src/languageProcessing/researches/h1s.js +0 -10
- package/src/languageProcessing/researches/imageCount.js +0 -16
- package/src/languageProcessing/researches/index.js +0 -5
- package/src/languageProcessing/researches/keyphraseDistribution.js +0 -249
- package/src/languageProcessing/researches/keyphraseLength.js +0 -17
- package/src/languageProcessing/researches/keywordCount.js +0 -134
- package/src/languageProcessing/researches/keywordCountInUrl.js +0 -57
- package/src/languageProcessing/researches/matchKeywordInSubheadings.js +0 -62
- package/src/languageProcessing/researches/metaDescriptionKeyword.js +0 -85
- package/src/languageProcessing/researches/metaDescriptionLength.js +0 -12
- package/src/languageProcessing/researches/pageTitleWidth.js +0 -11
- package/src/languageProcessing/researches/readingTime.js +0 -82
- package/src/languageProcessing/researches/sentences.js +0 -20
- package/src/languageProcessing/researches/videoCount.js +0 -32
- package/src/languageProcessing/researches/wordComplexity.js +0 -129
- package/src/languageProcessing/researches/wordCountInText.js +0 -29
- package/src/languageProcessing/values/Clause.js +0 -108
- package/src/languageProcessing/values/ProminentWord.js +0 -95
- package/src/languageProcessing/values/Sentence.js +0 -111
- package/src/languageProcessing/values/index.js +0 -9
- package/src/markers/addMark.js +0 -9
- package/src/markers/addMarkSingleWord.js +0 -32
- package/src/markers/index.js +0 -7
- package/src/markers/removeDuplicateMarks.js +0 -27
- package/src/markers/removeMarks.js +0 -11
- package/src/parse/build/build.js +0 -52
- package/src/parse/build/index.js +0 -10
- package/src/parse/build/private/adapt.js +0 -113
- package/src/parse/build/private/adaptAttributes.js +0 -36
- package/src/parse/build/private/alwaysFilterElements.js +0 -75
- package/src/parse/build/private/combineIntoImplicitParagraphs.js +0 -130
- package/src/parse/build/private/filterBeforeTokenizing.js +0 -32
- package/src/parse/build/private/filterHelpers.js +0 -44
- package/src/parse/build/private/filterTree.js +0 -42
- package/src/parse/build/private/getTextElementPositions.js +0 -184
- package/src/parse/build/private/helpers/parseClassAttribute.js +0 -9
- package/src/parse/build/private/isPhrasingContent.js +0 -28
- package/src/parse/build/private/parseBlocks.js +0 -151
- package/src/parse/build/private/tokenize.js +0 -74
- package/src/parse/language/LanguageProcessor.js +0 -74
- package/src/parse/structure/Heading.js +0 -26
- package/src/parse/structure/Node.js +0 -69
- package/src/parse/structure/Paragraph.js +0 -48
- package/src/parse/structure/Sentence.js +0 -30
- package/src/parse/structure/SourceCodeLocation.js +0 -41
- package/src/parse/structure/Text.js +0 -27
- package/src/parse/structure/Token.js +0 -24
- package/src/parse/structure/index.js +0 -16
- package/src/parse/traverse/findAllInTree.js +0 -58
- package/src/parse/traverse/index.js +0 -12
- package/src/parse/traverse/innerText.js +0 -26
- package/src/parsedPaper/ParsedPaper.js +0 -92
- package/src/parsedPaper/assess/TreeAssessor.js +0 -184
- package/src/parsedPaper/assess/assessmentListFactories.js +0 -73
- package/src/parsedPaper/assess/assessments/Assessment.js +0 -79
- package/src/parsedPaper/assess/assessments/index.js +0 -6
- package/src/parsedPaper/assess/assessorFactories.js +0 -104
- package/src/parsedPaper/assess/cornerstone/assessmentListFactories.js +0 -47
- package/src/parsedPaper/assess/cornerstone/index.js +0 -5
- package/src/parsedPaper/assess/index.js +0 -20
- package/src/parsedPaper/build/PaperParser.js +0 -105
- package/src/parsedPaper/build/linguisticParsing/Sentence.js +0 -89
- package/src/parsedPaper/build/linguisticParsing/SentenceTokenizer.js +0 -323
- package/src/parsedPaper/build/linguisticParsing/parseText.js +0 -20
- package/src/parsedPaper/build/tree/TreeBuilder.js +0 -75
- package/src/parsedPaper/build/tree/cleanup/calculateTextIndices.js +0 -190
- package/src/parsedPaper/build/tree/cleanup/getElementContent.js +0 -21
- package/src/parsedPaper/build/tree/cleanup/postParsing.js +0 -37
- package/src/parsedPaper/build/tree/html/HTMLTreeConverter.js +0 -230
- package/src/parsedPaper/build/tree/html/buildTree.js +0 -31
- package/src/parsedPaper/build/tree/html/htmlConstants.js +0 -37
- package/src/parsedPaper/build/tree/index.js +0 -14
- package/src/parsedPaper/build/tree/metadata/buildTree.js +0 -32
- package/src/parsedPaper/research/TreeResearcher.js +0 -134
- package/src/parsedPaper/research/index.js +0 -13
- package/src/parsedPaper/research/researches/Headings.js +0 -20
- package/src/parsedPaper/research/researches/LinkStatistics.js +0 -128
- package/src/parsedPaper/research/researches/Research.js +0 -50
- package/src/parsedPaper/research/researches/index.js +0 -1
- package/src/parsedPaper/structure/tree/FormattingElement.js +0 -67
- package/src/parsedPaper/structure/tree/SourceCodeLocation.js +0 -31
- package/src/parsedPaper/structure/tree/TextContainer.js +0 -85
- package/src/parsedPaper/structure/tree/index.js +0 -22
- package/src/parsedPaper/structure/tree/nodes/Heading.js +0 -26
- package/src/parsedPaper/structure/tree/nodes/LeafNode.js +0 -75
- package/src/parsedPaper/structure/tree/nodes/List.js +0 -47
- package/src/parsedPaper/structure/tree/nodes/ListItem.js +0 -26
- package/src/parsedPaper/structure/tree/nodes/MetadataMiscellaneous.js +0 -46
- package/src/parsedPaper/structure/tree/nodes/MetadataText.js +0 -26
- package/src/parsedPaper/structure/tree/nodes/Node.js +0 -154
- package/src/parsedPaper/structure/tree/nodes/Paragraph.js +0 -24
- package/src/parsedPaper/structure/tree/nodes/StructuredNode.js +0 -52
- package/src/parsedPaper/structure/tree/nodes/index.js +0 -21
- package/src/scoring/assessments/assessment.js +0 -63
- package/src/scoring/assessments/index.js +0 -58
- package/src/scoring/assessments/readability/ParagraphTooLongAssessment.js +0 -173
- package/src/scoring/assessments/readability/SentenceBeginningsAssessment.js +0 -132
- package/src/scoring/assessments/readability/SentenceLengthInTextAssessment.js +0 -186
- package/src/scoring/assessments/readability/TransitionWordsAssessment.js +0 -168
- package/src/scoring/assessments/seo/ImageCountAssessment.js +0 -112
- package/src/scoring/assessments/seo/InternalLinksAssessment.js +0 -114
- package/src/scoring/assessments/seo/IntroductionKeywordAssessment.js +0 -110
- package/src/scoring/assessments/seo/KeyphraseAssessment.js +0 -104
- package/src/scoring/assessments/seo/KeyphraseLengthAssessment.js +0 -110
- package/src/scoring/assessments/seo/KeywordDensityAssessment.js +0 -116
- package/src/scoring/assessments/seo/MetaDescriptionKeywordAssessment.js +0 -114
- package/src/scoring/assessments/seo/MetaDescriptionLengthAssessment.js +0 -112
- package/src/scoring/assessments/seo/MetaTitleKeywordAssessment.js +0 -111
- package/src/scoring/assessments/seo/NumberInMetaTitleAssessment.js +0 -107
- package/src/scoring/assessments/seo/OutboundLinksAssessment.js +0 -111
- package/src/scoring/assessments/seo/PageTitleWidthAssessment.js +0 -104
- package/src/scoring/assessments/seo/SingleH1Assessment.js +0 -118
- package/src/scoring/assessments/seo/SingleTitleAssessment.js +0 -108
- package/src/scoring/assessments/seo/SubHeadingsKeywordAssessment.js +0 -107
- package/src/scoring/assessments/seo/TextImagesAssessment.js +0 -144
- package/src/scoring/assessments/seo/TextLengthAssessment.js +0 -100
- package/src/scoring/assessments/seo/UrlKeywordAssessment.js +0 -111
- package/src/scoring/assessments/seo/UrlLengthAssessment.js +0 -103
- package/src/scoring/assessors/assessor.js +0 -269
- package/src/scoring/assessors/avadaAssessor.js +0 -67
- package/src/scoring/assessors/contentAssessor.js +0 -159
- package/src/scoring/assessors/index.js +0 -4
- package/src/scoring/assessors/seoAssessor.js +0 -57
- package/src/scoring/helpers/assessments/checkForTooLongSentences.js +0 -13
- package/src/scoring/helpers/assessments/inRange.js +0 -49
- package/src/scoring/helpers/assessments/keyphraseLengthFactor.js +0 -10
- package/src/scoring/helpers/assessments/recommendedKeywordCount.js +0 -43
- package/src/scoring/helpers/index.js +0 -74
- package/src/scoring/interpreters/index.js +0 -5
- package/src/scoring/interpreters/scoreToRating.js +0 -31
- package/src/scoring/renderers/AssessorPresenter.js +0 -360
- package/src/scoring/scoreAggregators/ReadabilityScoreAggregator.js +0 -203
- package/src/scoring/scoreAggregators/SEOScoreAggregator.js +0 -54
- package/src/scoring/scoreAggregators/ScoreAggregator.js +0 -23
- package/src/scoring/scoreAggregators/index.js +0 -3
- package/src/values/AssessmentResult.js +0 -496
- package/src/values/Mark.js +0 -271
- package/src/values/Paper.js +0 -425
- package/src/values/index.js +0 -9
- package/src/vendor/turkishStemmer.js +0 -3435
- package/tsconfig.json +0 -15
|
@@ -1,22 +0,0 @@
|
|
|
1
|
-
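// Forms of the Slovak verb "byť" (to be). Used as the passive voice auxiliaries when splitting sentences into clauses; also filtered from the beginning of word combinations in the prominent words.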
|
|
2
|
-
export const filteredAuxiliaries = [
|
|
3
|
-
"byť",
|
|
4
|
-
"som",
|
|
5
|
-
"si",
|
|
6
|
-
"je",
|
|
7
|
-
"sme",
|
|
8
|
-
"ste",
|
|
9
|
-
"sú",
|
|
10
|
-
"bol",
|
|
11
|
-
"bola",
|
|
12
|
-
"boli",
|
|
13
|
-
"bolo",
|
|
14
|
-
"budem",
|
|
15
|
-
"budeš",
|
|
16
|
-
"bude",
|
|
17
|
-
"budeme",
|
|
18
|
-
"budete",
|
|
19
|
-
"budú",
|
|
20
|
-
];
|
|
21
|
-
|
|
22
|
-
export default filteredAuxiliaries;
|
|
@@ -1,34 +0,0 @@
|
|
|
1
|
-
/**
|
|
2
|
-
* Returns a list with stopwords for the Slovak passive voice assessment.
|
|
3
|
-
*
|
|
4
|
-
* @returns {Array} The list with stopwords.
|
|
5
|
-
*/
|
|
6
|
-
export default [
|
|
7
|
-
"ktorí",
|
|
8
|
-
"ktorých",
|
|
9
|
-
"ktorými",
|
|
10
|
-
"ktorá",
|
|
11
|
-
"ktorého",
|
|
12
|
-
"ktorému",
|
|
13
|
-
"ktorom",
|
|
14
|
-
"ktorým",
|
|
15
|
-
"ktorý",
|
|
16
|
-
"ktoré",
|
|
17
|
-
"ktorej",
|
|
18
|
-
"ktorou",
|
|
19
|
-
"ktorú",
|
|
20
|
-
"lebo",
|
|
21
|
-
"keby",
|
|
22
|
-
"že",
|
|
23
|
-
"aby",
|
|
24
|
-
"alebo",
|
|
25
|
-
"keďže",
|
|
26
|
-
"kedže",
|
|
27
|
-
"lenže",
|
|
28
|
-
"ale",
|
|
29
|
-
"nakoľko",
|
|
30
|
-
"pretože",
|
|
31
|
-
"či",
|
|
32
|
-
"ak",
|
|
33
|
-
"kedy",
|
|
34
|
-
];
|
|
@@ -1,23 +0,0 @@
|
|
|
1
|
-
/** @module config/transitionWords */
|
|
2
|
-
|
|
3
|
-
// Slovak transition words that consist of a single word.
// Entries must not carry leading or trailing whitespace, otherwise they can never match a word in the text.
export const singleWords = [ "kvôli", "miesto", "pre", "oproti", "aj", "i", "ani", "ale", "avšak", "však", "preto", "tak", "teda",
	"hoci", "aby", "ako", "keď", "keďže", "kým", "pokiaľ", "ohľadne", "takto", "tiež", "potom", "takže", "odtiaľ", "odteraz",
	"lebo", "akonáhle", "lenže", "okrem", "nakoľko", "pokým", "pretože", "čiže", "jednako", "doteraz", "dosiaľ", "najmä",
	"napríklad", "napr.", "napokon", "predsa", "určite", "dodatočne", "ďalej", "následne", "napriek", "hlavne", "nakoniec",
	"medzitým", "inak", "ináč", "obdobne", "podobne", "predovšetkým", "naozaj", "spočiatku", "najprv", "najskôr", "stručne",
	"všeobecne", "samozrejme", "pravdaže", "doposiaľ", "nielen", "než", "síce", "pričom", "až", "jednak", "zato", "nielenže",
	"ibaže", "skôr", "prv", "hoc", "namiesto", "buďto", "inakšie", "hneď", "kedykoľvek" ];

// Slovak transition phrases that consist of more than one word.
// The misspelt "pretor, aby" was dropped because the correct "preto, aby" is already listed,
// and "zatiar čo" was corrected to "zatiaľ čo".
export const multipleWords = [ "ako aj", "ako i", "a tak ďalej", "a tak", "aj tak", "a jednako", "a naopak", "a predsa", "ale jednako",
	"ale predsa", "a tým", "a to", "i to", "jednako však", "predsa však", "to jest", "a preto", "i keby", "i keď", "čo aj",
	"keby aj", "odvtedy čo", "zatiaľ čo", "vzhľadom na to, že", "berúc do úvahy, že", "napriek tomu, že",
	"preto, aby", "za účelom", "za týmto účelom", "skôr či neskôr", "hneď ako", "len čo", "pokiaľ ide o", "pokiaľ nie",
	"pokiaľ viem", "po prvé", "čo sa týka", "až do", "až na", "až po", "z tohto dôvodu", "z toho dôvodu", "no predsa",
	"iba ak", "ak nie", "keď nie", "tobôž nie", "pravdu povediac", "ako napríklad", "okrem toho", "v podstate", "ako je uvedené",
	"v každom prípade", "na rozdiel od", "v porovnaní s", "v oboch prípadoch", "stručne povedané", "inými slovami",
	"na jednej strane", "na druhej strane", "s týmto cieľom" ];

// All transition words: the single words followed by the multiple-word phrases.
export const allWords = singleWords.concat( multipleWords );

export default allWords;
|
|
23
|
-
|
|
@@ -1,10 +0,0 @@
|
|
|
1
|
-
/** @module config/twoPartTransitionWords */
|
|
2
|
-
|
|
3
|
-
/**
|
|
4
|
-
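* An array with two-part transition words to be used by the assessments. NOTE(review): each entry is a one-element array holding both parts in a single comma-separated string; confirm the consumer does not expect [ firstPart, secondPart ] pairs.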
|
|
5
|
-
* @returns {Array} The array filled with two-part transition words.
|
|
6
|
-
*/
|
|
7
|
-
export default [ [ "buď, buď" ], [ "buď, alebo" ], [ "ani, ani" ], [ "aj, aj" ], [ "tak, ako" ], [ "nielenže, lež aj" ],
|
|
8
|
-
[ "nielen, lež aj" ], [ "nielen, lež i" ], [ "nielenže, lež ai" ], [ "či, alebo" ], [ "i, i" ], [ "nielen, ale i" ],
|
|
9
|
-
[ "síce, ale" ] ];
|
|
10
|
-
|
|
@@ -1,26 +0,0 @@
|
|
|
1
|
-
import {languageProcessing} from '../../../index';
|
|
2
|
-
const {getClausesSplitOnStopWords, createRegexFromArray} = languageProcessing;
|
|
3
|
-
|
|
4
|
-
import SlovakClause from '../values/Clause';
|
|
5
|
-
import auxiliaries from '../config/internal/passiveVoiceAuxiliaries.js';
|
|
6
|
-
import stopwords from '../config/stopWords.js';
|
|
7
|
-
|
|
8
|
-
// Regexes used to find the places where a Slovak sentence is split into clauses.
const slovakClauseRegexes = {
  auxiliaryRegex: createRegexFromArray(auxiliaries),
  stopCharacterRegex: /([:,])(?=[ \n\r\t'"+\-»«‹›<>])/gi,
  stopwordRegex: createRegexFromArray(stopwords)
};

// Settings handed to the generic clause splitter: the clause class to use plus the regexes above.
const options = {
  Clause: SlovakClause,
  regexes: slovakClauseRegexes
};

/**
 * Splits a Slovak sentence into clauses by delegating to the shared stop-word based splitter.
 *
 * @param {string} sentence The sentence to split up into clauses.
 *
 * @returns {Array} The clauses as returned by `getClausesSplitOnStopWords` for the Slovak options.
 */
export default function getSlovakClauses(sentence) {
  const clauses = getClausesSplitOnStopWords(sentence, options);
  return clauses;
}
|
|
@@ -1,22 +0,0 @@
|
|
|
1
|
-
import {get} from 'lodash';
|
|
2
|
-
import {languageProcessing} from '../../../index';
|
|
3
|
-
const {baseStemmer} = languageProcessing;
|
|
4
|
-
|
|
5
|
-
import stem from './internal/stem';
|
|
6
|
-
|
|
7
|
-
/**
 * Picks the stemming function to use for Slovak.
 *
 * When the researcher provides Slovak ('sk') morphology data, the returned function stems a word with that data.
 * Otherwise the base stemmer is returned.
 *
 * @param {Researcher} researcher The researcher.
 *
 * @returns {Function} The stemmer.
 */
export default function getStemmer(researcher) {
  const slovakMorphology = get(researcher.getData('morphology'), 'sk', false);

  return slovakMorphology ? word => stem(word, slovakMorphology) : baseStemmer;
}
|
|
@@ -1,16 +0,0 @@
|
|
|
1
|
-
import {languageProcessing} from '../../../index';
|
|
2
|
-
const {getWords} = languageProcessing;
|
|
3
|
-
|
|
4
|
-
/**
 * Collects the words of a clause that end in one of the participle endings
 * (ný, ní, tý, ná, tá, né, té).
 *
 * @param {string} clauseText The clause to find participles in.
 *
 * @returns {Array} The list with participles found.
 */
export default function(clauseText) {
  const participleEnding = /(ný|ní|tý|ná|tá|né|té)$/;

  return getWords(clauseText).filter(candidate => participleEnding.test(candidate));
}
|
|
@@ -1,319 +0,0 @@
|
|
|
1
|
-
/* eslint-disable max-statements,complexity */
|
|
2
|
-
/*
|
|
3
|
-
* The MIT License (MIT)
|
|
4
|
-
*
|
|
5
|
-
* Copyright (c) 2015 Marek Šuppa
|
|
6
|
-
*
|
|
7
|
-
* Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
8
|
-
* of this software and associated documentation files (the "Software"), to deal
|
|
9
|
-
* in the Software without restriction, including without limitation the rights
|
|
10
|
-
* to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
11
|
-
* copies of the Software, and to permit persons to whom the Software is
|
|
12
|
-
* furnished to do so, subject to the following conditions:
|
|
13
|
-
*
|
|
14
|
-
* The above copyright notice and this permission notice shall be included in all
|
|
15
|
-
* copies or substantial portions of the Software.
|
|
16
|
-
*
|
|
17
|
-
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
18
|
-
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
19
|
-
* FITNESS FOR A PARTICULAR PURPOSE AND NON INFRINGEMENT. IN NO EVENT SHALL THE
|
|
20
|
-
* AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
21
|
-
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
22
|
-
* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
|
|
23
|
-
* SOFTWARE.
|
|
24
|
-
*/
|
|
25
|
-
|
|
26
|
-
/**
 * Takes care of palatalisation.
 *
 * Every entry of `palatalEndingsRegexes` is read as a `[ pattern, replacement ]` pair. The first pattern that
 * matches the word is replaced by its replacement. When no pattern matches, the last character of the word is removed.
 *
 * @param {string} word The word to stem.
 * @param {Object} morphologyData The Slovak morphology data.
 *
 * @returns {string} The word with its palatal ending replaced, or the word without its last character
 * if no palatal ending is found.
 */
function palatalise( word, morphologyData ) {
	const palatalEndingsRegexes = morphologyData.externalStemmer.palatalEndingsRegexes;

	for ( const [ pattern, replacement ] of palatalEndingsRegexes ) {
		// Compile the pattern once and use it for both the check and the replacement.
		const palatalEnding = new RegExp( pattern );
		if ( palatalEnding.test( word ) ) {
			return word.replace( palatalEnding, replacement );
		}
	}

	// No palatal ending found: only the final character is dropped.
	return word.slice( 0, -1 );
}
|
|
43
|
-
|
|
44
|
-
/**
 * Strips a case suffix from a word.
 *
 * The suffix groups are tried from the longest to the shortest; each group is only considered for words
 * that are longer than the minimum length of that group. Some groups additionally palatalise the result.
 *
 * @param {string} word The word to stem.
 * @param {Object} morphologyData The Slovak morphology data.
 *
 * @returns {string} The word without its case suffix, or the unchanged word when no case suffix applies.
 */
function removeCases( word, morphologyData ) {
	const { caseSuffixes: suffixes, caseRegexes: regexes } = morphologyData.externalStemmer;
	const size = word.length;

	// Small helpers so that the rules below read as "ending -> action".
	const tail = count => word.slice( -count );
	const dropLast = count => word.slice( 0, -count );
	const dropLastAndPalatalise = count => palatalise( dropLast( count ), morphologyData );

	if ( size > 7 && word.endsWith( suffixes.caseSuffix1 ) ) {
		return dropLast( 5 );
	}

	if ( size > 6 && word.endsWith( suffixes.caseSuffix2 ) ) {
		return dropLastAndPalatalise( 3 );
	}

	if ( size > 5 ) {
		if ( suffixes.caseSuffixes3.includes( tail( 3 ) ) ) {
			return dropLastAndPalatalise( 2 );
		}
		if ( suffixes.caseSuffixes4.includes( tail( 3 ) ) ) {
			return dropLast( 3 );
		}
	}

	if ( size > 4 ) {
		if ( word.endsWith( suffixes.caseSuffix5 ) ) {
			return dropLastAndPalatalise( 1 );
		}
		if ( suffixes.caseSuffixes6.includes( tail( 2 ) ) ) {
			return dropLastAndPalatalise( 2 );
		}
		if ( suffixes.caseSuffixes7.includes( tail( 2 ) ) ) {
			return dropLast( 2 );
		}
	}

	if ( size > 3 ) {
		if ( new RegExp( regexes.caseRegex1 ).test( word ) ) {
			// The whole word is handed over; palatalise takes care of the ending.
			return palatalise( word, morphologyData );
		}
		if ( new RegExp( regexes.caseRegex2 ).test( word ) ) {
			return dropLast( 1 );
		}
	}

	return word;
}
|
|
88
|
-
|
|
89
|
-
/**
 * Strips a possessive suffix from a word.
 *
 * Only words longer than five characters are considered.
 *
 * @param {string} word The word to stem.
 * @param {Object} morphologyData The Slovak morphology data.
 *
 * @returns {string} The word without its possessive suffix, or the unchanged word when no such suffix applies.
 */
function removePossessives( word, morphologyData ) {
	const suffixes = morphologyData.externalStemmer.possessiveSuffixes;

	// Shorter words are returned untouched.
	if ( ! ( word.length > 5 ) ) {
		return word;
	}

	if ( word.endsWith( suffixes.posSuffixOv ) ) {
		return word.slice( 0, -2 );
	}

	return word.endsWith( suffixes.posSuffixIn )
		? palatalise( word.slice( 0, -1 ), morphologyData )
		: word;
}
|
|
110
|
-
|
|
111
|
-
/**
 * Removes comparative and superlative affixes.
 *
 * First the superlative prefix is stripped from words longer than six characters. After that, if the remaining
 * word is longer than five characters and its last three characters are a comparative suffix, the last two
 * characters are removed and the result is palatalised.
 *
 * @param {string} word The word to stem.
 * @param {Object} morphologyData The Slovak morphology data.
 *
 * @returns {string} The word without comparative and superlative affixes or the original word if no such affix is found.
 */
function removeComparativeAndSuperlative( word, morphologyData ) {
	const superlativePrefix = morphologyData.externalStemmer.superlativePrefix;
	// Work on a local copy instead of reassigning the parameter.
	let stemmedWord = word;

	if ( stemmedWord.length > 6 && stemmedWord.startsWith( superlativePrefix ) ) {
		// Strip exactly the configured prefix instead of a hard-coded number of characters.
		stemmedWord = stemmedWord.slice( superlativePrefix.length );
	}

	if ( stemmedWord.length > 5 ) {
		const comparativeSuffixes = morphologyData.externalStemmer.comparativeSuffixes;
		if ( comparativeSuffixes.includes( stemmedWord.slice( -3 ) ) ) {
			stemmedWord = palatalise( stemmedWord.slice( 0, -2 ), morphologyData );
		}
	}

	return stemmedWord;
}
|
|
133
|
-
|
|
134
|
-
/**
 * Strips a diminutive suffix from a word.
 *
 * The suffix groups are tried from the longest to the shortest; each group is only considered for words
 * that are longer than the minimum length of that group. Some groups additionally palatalise the result.
 * As a last rule, a final "k" is removed from words longer than three characters unless the word ends in "isk".
 *
 * @param {string} word The word to stem.
 * @param {Object} morphologyData The Slovak morphology data.
 *
 * @returns {string} The word without its diminutive suffix, or the unchanged word when no such suffix applies.
 */
function removeDiminutives( word, morphologyData ) {
	const suffixes = morphologyData.externalStemmer.diminutiveSuffixes;
	const size = word.length;

	// Small helpers so that the rules below read as "ending -> action".
	const tail = count => word.slice( -count );
	const dropLast = count => word.slice( 0, -count );
	const dropLastAndPalatalise = count => palatalise( dropLast( count ), morphologyData );

	if ( size > 7 && word.endsWith( suffixes.diminutiveSuffix1 ) ) {
		return dropLast( 5 );
	}

	if ( size > 6 ) {
		if ( suffixes.diminutiveSuffixes2.includes( tail( 4 ) ) ) {
			return dropLastAndPalatalise( 3 );
		}
		if ( suffixes.diminutiveSuffixes3.includes( tail( 4 ) ) ) {
			return dropLastAndPalatalise( 4 );
		}
	}

	if ( size > 5 ) {
		if ( suffixes.diminutiveSuffixes4.includes( tail( 3 ) ) ) {
			return dropLastAndPalatalise( 3 );
		}
		if ( suffixes.diminutiveSuffixes5.includes( tail( 3 ) ) ) {
			return dropLast( 3 );
		}
	}

	if ( size > 4 ) {
		if ( suffixes.diminutiveSuffixes6.includes( tail( 2 ) ) ) {
			return dropLastAndPalatalise( 1 );
		}
		if ( suffixes.diminutiveSuffixes7.includes( tail( 2 ) ) ) {
			return dropLast( 1 );
		}
	}

	const endsInPlainK = word.endsWith( "k" ) && ! word.endsWith( "isk" );
	return size > 3 && endsInPlainK ? dropLast( 1 ) : word;
}
|
|
176
|
-
|
|
177
|
-
/**
 * Strips an augmentative suffix from a word.
 *
 * @param {string} word The word to stem.
 * @param {Object} morphologyData The Slovak morphology data.
 *
 * @returns {string} The word without its augmentative suffix, or the unchanged word when no such suffix applies.
 */
function removeAugmentatives( word, morphologyData ) {
	const suffixes = morphologyData.externalStemmer.augmentativeSuffixes;
	const size = word.length;

	// The longer suffix is checked first: its last four characters are cut off without palatalisation.
	const hasLongSuffix = size > 6 && word.endsWith( suffixes.augmentativeSuffix1 );
	if ( hasLongSuffix ) {
		return word.slice( 0, -4 );
	}

	// Three-character suffixes: two characters are cut off and the result is palatalised.
	const hasShortSuffix = size > 5 && suffixes.augmentativeSuffixes2.includes( word.slice( -3 ) );
	if ( hasShortSuffix ) {
		return palatalise( word.slice( 0, -2 ), morphologyData );
	}

	return word;
}
|
|
195
|
-
|
|
196
|
-
/**
 * Strips a derivational suffix from a word.
 *
 * The suffix rules are tried from the longest minimum word length to the shortest, and the first rule
 * that matches decides the result. Each rule requires the word to be longer than a given length, removes
 * a fixed number of trailing characters, and optionally passes the remainder through `palatalise`.
 * If no suffix rule matches, a word longer than 3 characters that matches `derivationalRegex`
 * loses its last character.
 *
 * @param {string} word           The word to stem.
 * @param {Object} morphologyData The Slovak morphology data.
 *
 * @returns {string} The word without its derivational suffix, or the unchanged word if nothing matches.
 */
function stemDerivational( word, morphologyData ) {
	const suffixes = morphologyData.externalStemmer.derivationalSuffixes;
	const ending = ( size ) => word.slice( -size );

	// Order matters: the first matching rule wins. Predicates are thunks so that the suffix data
	// is only read once the length condition of the rule has been met.
	const rules = [
		{ longerThan: 8, matches: () => word.endsWith( suffixes.derivationalSuffix1 ), strip: 6, palatalised: false },
		{ longerThan: 7, matches: () => word.endsWith( suffixes.derivationalSuffix2 ), strip: 4, palatalised: true },
		{ longerThan: 7, matches: () => suffixes.derivationalSuffixes3.includes( ending( 5 ) ), strip: 5, palatalised: false },
		{ longerThan: 6, matches: () => suffixes.derivationalSuffixes4.includes( ending( 4 ) ), strip: 4, palatalised: false },
		{ longerThan: 6, matches: () => suffixes.derivationalSuffixes5.includes( ending( 4 ) ), strip: 3, palatalised: true },
		{ longerThan: 5, matches: () => word.endsWith( suffixes.derivationalSuffix6 ), strip: 3, palatalised: false },
		{ longerThan: 5, matches: () => suffixes.derivationalSuffixes7.includes( ending( 3 ) ), strip: 2, palatalised: true },
		{ longerThan: 5, matches: () => suffixes.derivationalSuffixes8.includes( ending( 3 ) ), strip: 3, palatalised: false },
		{ longerThan: 4, matches: () => suffixes.derivationalSuffixes9.includes( ending( 2 ) ), strip: 2, palatalised: false },
		{ longerThan: 4, matches: () => suffixes.derivationalSuffixes10.includes( ending( 2 ) ), strip: 1, palatalised: true },
	];

	for ( const rule of rules ) {
		if ( word.length > rule.longerThan && rule.matches() ) {
			const remainder = word.slice( 0, -rule.strip );
			return rule.palatalised ? palatalise( remainder, morphologyData ) : remainder;
		}
	}

	// Fallback: drop a single trailing character when the word matches the derivational pattern.
	const derivationalRegex = new RegExp( morphologyData.externalStemmer.derivationalRegex );
	const matchesFallback = word.length > 3 && derivationalRegex.test( word );

	return matchesFallback ? word.slice( 0, -1 ) : word;
}
|
|
250
|
-
|
|
251
|
-
/**
 * Looks a word up in the full-form exception list and returns the stem of the paradigm that lists it.
 *
 * Every entry of the list is read as a pair: the stem at index 0 and the collection of full forms
 * at index 1. The entries are checked in order and the first one whose full forms include the word wins.
 *
 * @param {string}  word                       The word to be checked.
 * @param {Array[]} exceptionListWithFullForms The exception list to check, as `[ stem, fullForms ]` entries.
 *
 * @returns {null|string} The stem of the matching paradigm, or null if the word is not on the list.
 */
const checkWordInFullFormExceptions = function( word, exceptionListWithFullForms ) {
	for ( const paradigm of exceptionListWithFullForms ) {
		const fullForms = paradigm[ 1 ];
		if ( fullForms.includes( word ) ) {
			return paradigm[ 0 ];
		}
	}

	// Callers treat a falsy result as "not an exception", so the word itself is never returned here.
	return null;
};
|
|
267
|
-
|
|
268
|
-
/**
 * Maps a stem onto the canonical stem of its group, for words that end up with several different stems.
 *
 * Each group is a list of stems that belong to one word; the first element of the group is the canonical one.
 *
 * @param {string} stemmedWord              The stemmed word to be checked.
 * @param {Object} stemsThatBelongToOneWord The data that shows how non-canonical stems should be canonicalized.
 *
 * @returns {null|string} The canonical stem, or null if the stem is not part of any group.
 */
const canonicalizeStem = function( stemmedWord, stemsThatBelongToOneWord ) {
	let canonicalStem = null;

	for ( const stemGroup of stemsThatBelongToOneWord ) {
		if ( ! stemGroup.includes( stemmedWord ) ) {
			continue;
		}
		// The first matching group decides the result.
		canonicalStem = stemGroup[ 0 ];
		break;
	}

	return canonicalStem;
};
|
|
284
|
-
|
|
285
|
-
/**
 * Stems a Slovak word.
 *
 * A word found on the full-form exception list is resolved straight to the stem stored there.
 * Any other word goes through the suffix-stripping steps in a fixed order (cases, possessives,
 * comparative/superlative, diminutives, augmentatives, derivational suffixes), after which the result
 * is replaced by its canonical stem if it belongs to a group of stems of one word.
 *
 * @param {string} word           The word to stem.
 * @param {Object} morphologyData The Slovak morphology data.
 *
 * @returns {string} The stemmed word.
 */
export default function stem( word, morphologyData ) {
	const exceptionLists = morphologyData.exceptionLists;

	// Words on the full-form exception list skip the suffix stripping entirely.
	const stemFromExceptionList = checkWordInFullFormExceptions( word, exceptionLists.exceptionStemsWithFullForms );
	if ( stemFromExceptionList ) {
		return stemFromExceptionList;
	}

	// Each step receives the output of the previous one, so the order of this list is significant.
	const strippingSteps = [
		removeCases,
		removePossessives,
		removeComparativeAndSuperlative,
		removeDiminutives,
		removeAugmentatives,
		stemDerivational,
	];
	const strippedWord = strippingSteps.reduce(
		( intermediate, applyStep ) => applyStep( intermediate, morphologyData ),
		word
	);

	// Prefer the canonical stem for words that get different stems depending on the form.
	return canonicalizeStem( strippedWord, exceptionLists.stemsThatBelongToOneWord ) || strippedWord;
}
|
|
@@ -1,39 +0,0 @@
|
|
|
1
|
-
import {languageProcessing} from '../../../index';
|
|
2
|
-
const {values} = languageProcessing;
|
|
3
|
-
const {Clause} = values;
|
|
4
|
-
import getParticiples from '../helpers/internal/getParticiples';
|
|
5
|
-
import nonPassives from '../../sk/config/internal/nonPassives';
|
|
6
|
-
|
|
7
|
-
/**
 * A Clause for the Slovak language that determines its own passiveness on construction.
 */
class SlovakClause extends Clause {
  /**
   * Creates the clause, collects its participles and evaluates whether it is passive.
   *
   * @param {string} clauseText   The text of the clause.
   * @param {Array}  auxiliaries  The auxiliaries.
   *
   * @constructor
   */
  constructor(clauseText, auxiliaries) {
    super(clauseText, auxiliaries);

    const clauseParticiples = getParticiples(this.getClauseText());
    this._participles = clauseParticiples;

    this.checkParticiples();
  }

  /**
   * Marks the clause as passive when at least one of its participles is not on the non-passives list.
   *
   * @returns {void}
   */
  checkParticiples() {
    const isNonPassive = participle => nonPassives.includes(participle);
    const hasPassiveParticiple = this.getParticiples().some(
      participle => !isNonPassive(participle)
    );

    this.setPassive(hasPassiveParticiple);
  }
}
|
|
38
|
-
|
|
39
|
-
export default SlovakClause;
|
|
@@ -1,45 +0,0 @@
|
|
|
1
|
-
import {languageProcessing} from '../../../index';
|
|
2
|
-
const {AbstractResearcher} = languageProcessing;
|
|
3
|
-
|
|
4
|
-
// All config
|
|
5
|
-
import firstWordExceptions from './config/firstWordExceptions';
|
|
6
|
-
import {all as functionWords} from './config/functionWords';
|
|
7
|
-
import transitionWords from './config/transitionWords';
|
|
8
|
-
import twoPartTransitionWords from './config/twoPartTransitionWords';
|
|
9
|
-
import keyphraseLength from './config/keyphraseLength';
|
|
10
|
-
|
|
11
|
-
// All helpers
|
|
12
|
-
import getStemmer from './helpers/getStemmer';
|
|
13
|
-
import isPassiveSentence from './helpers/isPassiveSentence';
|
|
14
|
-
|
|
15
|
-
/**
 * The Swedish researcher: the abstract researcher extended with the Swedish config and helpers.
 */
export default class Researcher extends AbstractResearcher {
  /**
   * Sets up the researcher for Swedish.
   *
   * @param {Paper} paper The Paper object that is needed within the researches.
   * @constructor
   */
  constructor(paper) {
    super(paper);

    // The Flesch reading score research is not available in Swedish.
    delete this.defaultResearches.getFleschReadingScore;

    const swedishConfig = {
      language: 'sv',
      passiveConstructionType: 'morphological',
      firstWordExceptions,
      functionWords,
      transitionWords,
      twoPartTransitionWords,
      keyphraseLength
    };
    const swedishHelpers = {
      getStemmer,
      isPassiveSentence
    };

    // Merge into the existing objects so that whatever the parent class registered is kept.
    Object.assign(this.config, swedishConfig);
    Object.assign(this.helpers, swedishHelpers);
  }
}
|
|
@@ -1,15 +0,0 @@
|
|
|
1
|
-
/**
 * The list of exceptions for the sentence beginning researcher.
 *
 * The module exports the array itself (not a function that returns it).
 * The words are grouped by the categories noted in the comments below.
 *
 * @type {string[]}
 */
export default [
	// Indefinite articles:
	// NOTE(review): "en" is not repeated here; it is already listed under the numbers below.
	"ett",
	// Definite articles:
	"det", "den", "de",
	// Numbers 1-10:
	"en", "två", "tre", "fyra", "fem", "sex", "sju", "åtta", "nio", "tio",
	// Demonstrative pronouns:
	"denne", "denna", "detta", "dessa",
];
|