npm - henkan - Versions diffs - 0.3.1 → 0.3.3 - Mend

henkan 0.3.1 → 0.3.3

This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the package contents as they appear in their respective public registries.

Files changed (55)

package/dist/index.cjs.js +34 -31
package/dist/index.cjs.js.map +3 -3
package/dist/index.mjs +34 -31
package/dist/index.mjs.map +3 -3
package/dist/types/utils.d.ts.map +1 -1
package/docs/api/functions/capitalizeString.md +1 -1
package/docs/api/functions/convertJMdict.md +1 -1
package/docs/api/functions/convertKanjiDic.md +1 -1
package/docs/api/functions/convertKradFile.md +1 -1
package/docs/api/functions/convertRadkFile.md +1 -1
package/docs/api/functions/convertTanakaCorpus.md +1 -1
package/docs/api/functions/generateAnkiNote.md +1 -1
package/docs/api/functions/generateAnkiNotesFile.md +1 -1
package/docs/api/functions/getKanji.md +1 -1
package/docs/api/functions/getKanjiExtended.md +1 -1
package/docs/api/functions/getWord.md +1 -1
package/docs/api/functions/isStringArray.md +1 -1
package/docs/api/functions/isValidArray.md +1 -1
package/docs/api/functions/isValidArrayWithFirstElement.md +1 -1
package/docs/api/functions/makeSSML.md +1 -1
package/docs/api/functions/shuffleArray.md +1 -1
package/docs/api/functions/synthesizeSpeech.md +1 -1
package/docs/api/interfaces/DictKanji.md +5 -5
package/docs/api/interfaces/DictKanjiForm.md +4 -4
package/docs/api/interfaces/DictKanjiMisc.md +5 -5
package/docs/api/interfaces/DictKanjiReading.md +3 -3
package/docs/api/interfaces/DictKanjiReadingMeaning.md +3 -3
package/docs/api/interfaces/DictKanjiReadingMeaningGroup.md +3 -3
package/docs/api/interfaces/DictKanjiWithRadicals.md +3 -3
package/docs/api/interfaces/DictMeaning.md +11 -11
package/docs/api/interfaces/DictRadical.md +4 -4
package/docs/api/interfaces/DictReading.md +5 -5
package/docs/api/interfaces/DictWord.md +7 -7
package/docs/api/interfaces/ExamplePart.md +7 -7
package/docs/api/interfaces/Grammar.md +15 -15
package/docs/api/interfaces/GrammarMeaning.md +3 -3
package/docs/api/interfaces/Kana.md +11 -11
package/docs/api/interfaces/Kanji.md +22 -22
package/docs/api/interfaces/KanjiComponent.md +3 -3
package/docs/api/interfaces/KanjiForm.md +4 -4
package/docs/api/interfaces/NoteAndTag.md +3 -3
package/docs/api/interfaces/Phrase.md +4 -4
package/docs/api/interfaces/Radical.md +16 -16
package/docs/api/interfaces/Reading.md +5 -5
package/docs/api/interfaces/ResultEntry.md +7 -7
package/docs/api/interfaces/TanakaExample.md +5 -5
package/docs/api/interfaces/Translation.md +3 -3
package/docs/api/interfaces/UsefulRegExps.md +9 -9
package/docs/api/interfaces/Word.md +14 -14
package/docs/api/type-aliases/Dict.md +1 -1
package/docs/api/type-aliases/DictName.md +1 -1
package/docs/api/type-aliases/EntryType.md +1 -1
package/docs/api/type-aliases/JLPT.md +1 -1
package/docs/api/type-aliases/Result.md +1 -1
package/package.json +2 -2

package/dist/index.mjs CHANGED

@@ -14,7 +14,7 @@ var regexps = {
   regExChars: /[-\/\\^$*+?.()|[\]{}]/,
   tanakaID: /#ID=\d+_\d+$/,
   tanakaPart: /(?<base>[^()\[\]\{\}\s]+)(?:\((?<reading>[\S]+)\))?(?:\[(?<glossnum>[\S]+)\])?(?:\{(?<inflection>[\S]+)\})?/,
-  tanakaReferenceID: /#([\d]+)/
+  tanakaReferenceID: /#(?<entryid>[\d]+)/
 };
 var romajiMap = {
   A: "\u30A8\u30FC",
@@ -1408,9 +1408,9 @@ async function convertTanakaCorpus(tanakaString, generateFurigana) {
               if (reading)
                 if (regexps.tanakaReferenceID.test(reading)) {
                   const referenceID = regexps.tanakaReferenceID.exec(reading);
-                  if (!referenceID)
+                  if (!referenceID || !referenceID.groups || !referenceID.groups["entryid"])
                     throw new Error(`Invalid reference ID: ${reading}`);
-                  examplePart.referenceID = referenceID[0];
+                  examplePart.referenceID = referenceID.groups["entryid"];
                 } else examplePart.reading = reading;
               if (glossNumber)
                 examplePart.glossNumber = glossNumber.startsWith("0") ? Number.parseInt(glossNumber.substring(1)) : Number.parseInt(glossNumber);
@@ -1547,9 +1547,10 @@ function lookupWordNote(key, notes, tags, required, fallback) {
     if (notes) notes.push(fallback ?? key);
     return { note: fallback ?? key };
   }
-  if (tags) tags.push(`word::${info[0]}`);
+  const tag = `word::${info[0]}`;
+  if (tags && !tags.includes(tag)) tags.push(tag);
   if (notes) notes.push(info[1]);
-  return { note: info[1], tag: `word::${info[0]}` };
+  return { note: info[1], tag };
 }
 var wordAddNoteArray = (arr, cb) => {
   if (!arr) return;
@@ -1701,13 +1702,6 @@ function getWord(dict, id, kanjiDic, examples, dictWord, noteTypeName, deckPath)
         if (word.kanji.length === 0) delete word.kanji;
       }
       if (examples && dictWord.hasPhrases === true) {
-        let pushIfUnique2 = function(ex) {
-          if (!seenPhrases.has(ex.phrase)) {
-            wordExamples.push(ex);
-            seenPhrases.add(ex.phrase);
-          }
-        };
-        var pushIfUnique = pushIfUnique2;
         const readings = new Set(
           word.readings.filter(
             (reading) => (!reading.notes || !reading.notes.some(
@@ -1725,46 +1719,55 @@ function getWord(dict, id, kanjiDic, examples, dictWord, noteTypeName, deckPath)
         const kanjiFormExamples = [];
         const readingMatchingKanjiFormExamples = [];
         const readingExamples = [];
+        const partParts = /* @__PURE__ */ new Set();
         for (const example of examples)
           for (const part of example.parts) {
-            const readingMatch = part.reading && readings.has(part.reading) || readings.has(part.baseForm);
+            const readingAsReadingMatch = part.reading !== void 0 && readings.has(part.reading);
             if (kanjiForms && kanjiForms.size > 0 && kanjiForms.has(part.baseForm)) {
-              if (readingMatch) readingMatchingKanjiFormExamples.push(example);
-              else kanjiFormExamples.push(example);
+              if (readingAsReadingMatch) {
+                readingMatchingKanjiFormExamples.push(example);
+                partParts.add(part.baseForm).add(part.reading);
+              } else {
+                kanjiFormExamples.push(example);
+                partParts.add(part.baseForm);
+              }
               break;
             }
-            if (readingMatch || part.referenceID && word.id && part.referenceID === word.id) {
+            const readingAsBaseFormMatch = readings.has(part.baseForm);
+            const referenceIDMatch = part.referenceID !== void 0 && word.id !== void 0 && part.referenceID === word.id;
+            if (readingAsReadingMatch || readingAsBaseFormMatch || referenceIDMatch) {
               readingExamples.push(example);
+              if (readingAsReadingMatch) partParts.add(part.reading);
+              if (readingAsBaseFormMatch) partParts.add(part.baseForm);
+              if (referenceIDMatch) partParts.add(part.referenceID);
               break;
             }
           }
-        const exampleSize = (/* @__PURE__ */ new Set([
-          ...readingMatchingKanjiFormExamples,
-          ...kanjiFormExamples,
-          ...readingExamples
-        ])).size;
+        const exampleSize = readingMatchingKanjiFormExamples.length + kanjiFormExamples.length + readingExamples.length;
         const includeKanjiFormExamples = readingMatchingKanjiFormExamples.length < Math.max(2, Math.round(exampleSize * 0.05));
         const includeReadingExamples = word.usuallyInKana === void 0 && includeKanjiFormExamples && readingExamples.length >= Math.max(10, Math.round(exampleSize * 0.15)) || word.usuallyInKana === true && readingExamples.length >= Math.max(2, Math.round(exampleSize * 0.5));
-        const seenPhrases = /* @__PURE__ */ new Set();
-        let wordExamples = [];
-        for (const ex of readingMatchingKanjiFormExamples) pushIfUnique2(ex);
-        if (includeKanjiFormExamples)
-          for (const ex of kanjiFormExamples) pushIfUnique2(ex);
-        if (includeReadingExamples)
-          for (const ex of readingExamples) pushIfUnique2(ex);
+        let wordExamples = [
+          ...readingMatchingKanjiFormExamples,
+          ...includeKanjiFormExamples ? kanjiFormExamples : [],
+          ...includeReadingExamples ? readingExamples : []
+        ];
         if (word.translations) {
           const glossSpecificExamples = [];
+          const seenPhrases = /* @__PURE__ */ new Set();
           for (let i = 0; i < word.translations.length; i++) {
-            outer: for (const example of wordExamples)
+            outer: for (const example of wordExamples) {
+              if (seenPhrases.has(example.phrase)) continue;
               for (const part of example.parts)
-                if (part.glossNumber === i + 1) {
+                if (part.glossNumber === i + 1 && (partParts.has(part.baseForm) || part.reading && partParts.has(part.reading) || part.referenceID && partParts.has(part.referenceID))) {
                   glossSpecificExamples.push(example);
+                  seenPhrases.add(example.phrase);
                   break outer;
                 }
+            }
             if (glossSpecificExamples.length === 5) break;
           }
           if (glossSpecificExamples.length === 5)
-            wordExamples = glossSpecificExamples;
+            wordExamples = [...glossSpecificExamples];
           else if (glossSpecificExamples.length > 0) {
             const seenPhrases2 = new Set(
               glossSpecificExamples.map((ex) => ex.phrase)