npm - henkan - Versions diffs - 0.2.1 → 0.3.1 - Mend

henkan 0.2.1 → 0.3.1

This diff shows the changes between publicly available versions of a package that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects the differences between package versions as they appear in their respective public registries.

Files changed (58) hide show

package/dist/index.cjs.js +91 -54
package/dist/index.cjs.js.map +3 -3
package/dist/index.mjs +91 -54
package/dist/index.mjs.map +3 -3
package/dist/types/constants.d.ts.map +1 -1
package/dist/types/types.d.ts +8 -0
package/dist/types/types.d.ts.map +1 -1
package/dist/types/utils.d.ts.map +1 -1
package/docs/api/functions/capitalizeString.md +1 -1
package/docs/api/functions/convertJMdict.md +1 -1
package/docs/api/functions/convertKanjiDic.md +1 -1
package/docs/api/functions/convertKradFile.md +1 -1
package/docs/api/functions/convertRadkFile.md +1 -1
package/docs/api/functions/convertTanakaCorpus.md +1 -1
package/docs/api/functions/generateAnkiNote.md +1 -1
package/docs/api/functions/generateAnkiNotesFile.md +1 -1
package/docs/api/functions/getKanji.md +1 -1
package/docs/api/functions/getKanjiExtended.md +1 -1
package/docs/api/functions/getWord.md +1 -1
package/docs/api/functions/isStringArray.md +1 -1
package/docs/api/functions/isValidArray.md +1 -1
package/docs/api/functions/isValidArrayWithFirstElement.md +1 -1
package/docs/api/functions/makeSSML.md +1 -1
package/docs/api/functions/shuffleArray.md +1 -1
package/docs/api/functions/synthesizeSpeech.md +1 -1
package/docs/api/interfaces/DictKanji.md +5 -5
package/docs/api/interfaces/DictKanjiForm.md +4 -4
package/docs/api/interfaces/DictKanjiMisc.md +5 -5
package/docs/api/interfaces/DictKanjiReading.md +3 -3
package/docs/api/interfaces/DictKanjiReadingMeaning.md +3 -3
package/docs/api/interfaces/DictKanjiReadingMeaningGroup.md +3 -3
package/docs/api/interfaces/DictKanjiWithRadicals.md +3 -3
package/docs/api/interfaces/DictMeaning.md +11 -11
package/docs/api/interfaces/DictRadical.md +4 -4
package/docs/api/interfaces/DictReading.md +5 -5
package/docs/api/interfaces/DictWord.md +7 -7
package/docs/api/interfaces/ExamplePart.md +7 -7
package/docs/api/interfaces/Grammar.md +15 -15
package/docs/api/interfaces/GrammarMeaning.md +3 -3
package/docs/api/interfaces/Kana.md +11 -11
package/docs/api/interfaces/Kanji.md +22 -22
package/docs/api/interfaces/KanjiComponent.md +3 -3
package/docs/api/interfaces/KanjiForm.md +13 -3
package/docs/api/interfaces/NoteAndTag.md +3 -3
package/docs/api/interfaces/Phrase.md +4 -4
package/docs/api/interfaces/Radical.md +16 -16
package/docs/api/interfaces/Reading.md +14 -4
package/docs/api/interfaces/ResultEntry.md +7 -7
package/docs/api/interfaces/TanakaExample.md +5 -5
package/docs/api/interfaces/Translation.md +3 -3
package/docs/api/interfaces/UsefulRegExps.md +9 -9
package/docs/api/interfaces/Word.md +14 -14
package/docs/api/type-aliases/Dict.md +1 -1
package/docs/api/type-aliases/DictName.md +1 -1
package/docs/api/type-aliases/EntryType.md +1 -1
package/docs/api/type-aliases/JLPT.md +1 -1
package/docs/api/type-aliases/Result.md +1 -1
package/package.json +8 -8

package/dist/index.mjs CHANGED Viewed

@@ -65,10 +65,21 @@ var symbolMap = {
   "&": "\u30A2\u30F3\u30C9"
 };
 var notSearchedForms = /* @__PURE__ */ new Set([
+  "search-only kana form",
   "Search-only kana form",
+  "rarely used kana form",
   "Rarely used kana form",
+  "out-dated or obsolete kana usage",
   "Out-dated or obsolete kana usage",
-  "Word containing out-dated kanji or kanji usage"
+  "search-only kanji form",
+  "Search-only kanji form",
+  "rarely-used kanji form",
+  "Rarely-used kanji form",
+  "out-dated kanji",
+  "Out-dated kanji form",
+  "out-dated kanji or kanji usage",
+  "word containing out-dated kanji or kanji usage",
+  "Out-dated kanji or kanji usage"
 ]);
 var noteMap = /* @__PURE__ */ new Map([
   ["brazilian", ["dialect::brazilian", "Dialect: Brazilian"]],
@@ -1160,13 +1171,15 @@ function convertJMdict(xmlString, examples) {
     const dict = [];
     xml.parseString(dictParsed, (err, result) => {
       if (err) throw err;
-      let tanakaBaseParts = void 0;
-      if (examples)
-        tanakaBaseParts = new Set(
-          examples.map(
-            (example) => example.parts.map((part) => part.baseForm)
-          ).flat()
-        );
+      const tanakaParts = examples && examples.length > 0 ? new Set(
+        examples.map(
+          (example) => example.parts.map((part) => [
+            part.baseForm,
+            ...part.reading ? [part.reading] : [],
+            ...part.referenceID ? [part.referenceID] : []
+          ])
+        ).flat(2)
+      ) : void 0;
       if (result.JMdict && typeof result.JMdict === "object" && isValidArray(result.JMdict.entry))
         for (const entry of result.JMdict.entry) {
           const entryObj = {
@@ -1250,34 +1263,36 @@ function convertJMdict(xmlString, examples) {
           if (examples) {
             const readings2 = new Set(
               entryObj.readings.filter(
-                (reading) => !reading.notes || reading.notes && !reading.notes.some(
+                (reading) => (!reading.notes || !reading.notes.some(
                   (note) => notSearchedForms.has(note)
-                )
+                )) && (entryObj.isCommon === void 0 || reading.commonness && reading.commonness.length > 0)
               ).map((reading) => reading.reading)
             );
             const kanjiForms2 = entryObj.kanjiForms ? new Set(
-              entryObj.kanjiForms.map(
-                (kanjiForm) => kanjiForm.form
-              )
+              entryObj.kanjiForms.filter(
+                (kanjiForm) => (!kanjiForm.notes || !kanjiForm.notes.some(
+                  (note) => notSearchedForms.has(note)
+                )) && (entryObj.isCommon === void 0 || kanjiForm.commonness && kanjiForm.commonness.length > 0)
+              ).map((kanjiForm) => kanjiForm.form)
             ) : void 0;
-            let kanjiFormExamples = false;
-            let readingExamples = false;
-            if (kanjiForms2 && kanjiForms2.size > 0 && tanakaBaseParts) {
+            let existsExample = false;
+            if (kanjiForms2 && kanjiForms2.size > 0 && tanakaParts) {
               for (const kf of kanjiForms2)
-                if (tanakaBaseParts.has(kf)) {
-                  kanjiFormExamples = true;
+                if (tanakaParts.has(kf)) {
+                  existsExample = true;
                   break;
                 }
             }
-            if (!kanjiFormExamples && readings2.size > 0 && tanakaBaseParts) {
+            if (!existsExample && readings2.size > 0 && tanakaParts) {
               for (const r of readings2)
-                if (tanakaBaseParts.has(r)) {
-                  readingExamples = true;
+                if (tanakaParts.has(r)) {
+                  existsExample = true;
                   break;
                 }
             }
-            if (kanjiFormExamples || readingExamples)
-              entryObj.hasPhrases = true;
+            if (!existsExample && tanakaParts && tanakaParts.has(entryObj.id))
+              existsExample = true;
+            if (existsExample) entryObj.hasPhrases = true;
           }
           if (entryObj.id.length > 0 && entryObj.readings.length > 0 && entryObj.meanings.length > 0)
             dict.push(entryObj);
@@ -1570,7 +1585,8 @@ function getWord(dict, id, kanjiDic, examples, dictWord, noteTypeName, deckPath)
                 );
                 return capitalizeString(noteAndTag.note ?? note);
               })
-            } : {}
+            } : {},
+            ...dictKanjiForm.commonness && dictKanjiForm.commonness.length > 0 ? { common: true } : {}
           })
         );
       word.readings = dictWord.readings.map((dictReading) => ({
@@ -1591,7 +1607,8 @@ function getWord(dict, id, kanjiDic, examples, dictWord, noteTypeName, deckPath)
               return capitalizeString(noteAndTag.note ?? note);
             }) : []
           ]
-        } : {}
+        } : {},
+        ...dictReading.commonness && dictReading.commonness.length > 0 ? { common: true } : {}
       }));
       let usuallyInKanaMeanings = 0;
       word.translations = dictWord.meanings.map((dictMeaning) => {
@@ -1684,36 +1701,61 @@ function getWord(dict, id, kanjiDic, examples, dictWord, noteTypeName, deckPath)
         if (word.kanji.length === 0) delete word.kanji;
       }
       if (examples && dictWord.hasPhrases === true) {
+        let pushIfUnique2 = function(ex) {
+          if (!seenPhrases.has(ex.phrase)) {
+            wordExamples.push(ex);
+            seenPhrases.add(ex.phrase);
+          }
+        };
+        var pushIfUnique = pushIfUnique2;
         const readings = new Set(
           word.readings.filter(
-            (reading) => !reading.notes || reading.notes && !reading.notes.some(
+            (reading) => (!reading.notes || !reading.notes.some(
               (note) => notSearchedForms.has(note)
-            )
+            )) && (word.common === void 0 || reading.common === true)
           ).map((reading) => reading.reading)
         );
         const kanjiForms = word.kanjiForms ? new Set(
-          word.kanjiForms.map(
-            (kanjiForm) => kanjiForm.kanjiForm
-          )
+          word.kanjiForms.filter(
+            (kanjiForm) => (!kanjiForm.notes || !kanjiForm.notes.some(
+              (note) => notSearchedForms.has(note)
+            )) && (word.common === void 0 || kanjiForm.common === true)
+          ).map((kanjiForm) => kanjiForm.kanjiForm)
         ) : void 0;
         const kanjiFormExamples = [];
+        const readingMatchingKanjiFormExamples = [];
         const readingExamples = [];
-        if (kanjiForms) {
-          for (const example of examples)
-            for (const part of example.parts)
-              if (kanjiForms.has(part.baseForm))
-                kanjiFormExamples.push(example);
-        }
-        if (kanjiFormExamples.length === 0) {
-          for (const example of examples)
-            for (const part of example.parts)
-              if (readings.has(part.baseForm)) readingExamples.push(example);
-        }
-        examples = [...kanjiFormExamples, ...readingExamples];
+        for (const example of examples)
+          for (const part of example.parts) {
+            const readingMatch = part.reading && readings.has(part.reading) || readings.has(part.baseForm);
+            if (kanjiForms && kanjiForms.size > 0 && kanjiForms.has(part.baseForm)) {
+              if (readingMatch) readingMatchingKanjiFormExamples.push(example);
+              else kanjiFormExamples.push(example);
+              break;
+            }
+            if (readingMatch || part.referenceID && word.id && part.referenceID === word.id) {
+              readingExamples.push(example);
+              break;
+            }
+          }
+        const exampleSize = (/* @__PURE__ */ new Set([
+          ...readingMatchingKanjiFormExamples,
+          ...kanjiFormExamples,
+          ...readingExamples
+        ])).size;
+        const includeKanjiFormExamples = readingMatchingKanjiFormExamples.length < Math.max(2, Math.round(exampleSize * 0.05));
+        const includeReadingExamples = word.usuallyInKana === void 0 && includeKanjiFormExamples && readingExamples.length >= Math.max(10, Math.round(exampleSize * 0.15)) || word.usuallyInKana === true && readingExamples.length >= Math.max(2, Math.round(exampleSize * 0.5));
+        const seenPhrases = /* @__PURE__ */ new Set();
+        let wordExamples = [];
+        for (const ex of readingMatchingKanjiFormExamples) pushIfUnique2(ex);
+        if (includeKanjiFormExamples)
+          for (const ex of kanjiFormExamples) pushIfUnique2(ex);
+        if (includeReadingExamples)
+          for (const ex of readingExamples) pushIfUnique2(ex);
         if (word.translations) {
           const glossSpecificExamples = [];
           for (let i = 0; i < word.translations.length; i++) {
-            outer: for (const example of examples)
+            outer: for (const example of wordExamples)
               for (const part of example.parts)
                 if (part.glossNumber === i + 1) {
                   glossSpecificExamples.push(example);
@@ -1722,24 +1764,19 @@ function getWord(dict, id, kanjiDic, examples, dictWord, noteTypeName, deckPath)
             if (glossSpecificExamples.length === 5) break;
           }
           if (glossSpecificExamples.length === 5)
-            examples = glossSpecificExamples;
+            wordExamples = glossSpecificExamples;
           else if (glossSpecificExamples.length > 0) {
-            const seenPhrases = new Set(
+            const seenPhrases2 = new Set(
               glossSpecificExamples.map((ex) => ex.phrase)
             );
-            examples = [
+            wordExamples = [
               ...glossSpecificExamples,
-              ...examples.filter((ex) => !seenPhrases.has(ex.phrase)).slice(0, 5 - glossSpecificExamples.length)
+              ...wordExamples.filter((ex) => !seenPhrases2.has(ex.phrase)).slice(0, 5 - glossSpecificExamples.length)
             ];
           }
         }
-        examples = examples.filter(
-          (example, index, arr) => arr.findIndex(
-            (ex) => ex.phrase === example.phrase
-          ) === index
-        );
-        if (examples.length > 0)
-          word.phrases = (examples.length > 5 ? examples.slice(0, 5) : examples).map((ex) => ({
+        if (wordExamples.length > 0)
+          word.phrases = (wordExamples.length > 5 ? wordExamples.slice(0, 5) : wordExamples).map((ex) => ({
             phrase: ex.furigana ?? ex.phrase,
             translation: ex.translation,
             originalPhrase: ex.phrase