npm - henkan - Versions diffs - 0.4.1 → 0.6.0 - Mend

henkan 0.4.1 → 0.6.0

This diff shows the changes between two publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the contents of those package versions as they appear in their respective public registries.

Files changed (57) hide show

package/dist/index.cjs.js +127 -124
package/dist/index.cjs.js.map +3 -3
package/dist/index.mjs +123 -122
package/dist/index.mjs.map +3 -3
package/dist/types/types.d.ts +9 -7
package/dist/types/types.d.ts.map +1 -1
package/dist/types/utils.d.ts.map +1 -1
package/docs/api/functions/capitalizeString.md +1 -1
package/docs/api/functions/convertJMdict.md +1 -1
package/docs/api/functions/convertKanjiDic.md +1 -1
package/docs/api/functions/convertKradFile.md +1 -1
package/docs/api/functions/convertRadkFile.md +1 -1
package/docs/api/functions/convertTanakaCorpus.md +1 -1
package/docs/api/functions/generateAnkiNote.md +1 -1
package/docs/api/functions/generateAnkiNotesFile.md +1 -1
package/docs/api/functions/getKanji.md +1 -1
package/docs/api/functions/getKanjiExtended.md +1 -1
package/docs/api/functions/getWord.md +1 -1
package/docs/api/functions/isStringArray.md +1 -1
package/docs/api/functions/isValidArray.md +1 -1
package/docs/api/functions/isValidArrayWithFirstElement.md +1 -1
package/docs/api/functions/makeSSML.md +1 -1
package/docs/api/functions/shuffleArray.md +1 -1
package/docs/api/functions/synthesizeSpeech.md +1 -1
package/docs/api/interfaces/DictKanji.md +5 -5
package/docs/api/interfaces/DictKanjiForm.md +4 -4
package/docs/api/interfaces/DictKanjiMisc.md +5 -5
package/docs/api/interfaces/DictKanjiReading.md +3 -3
package/docs/api/interfaces/DictKanjiReadingMeaning.md +3 -3
package/docs/api/interfaces/DictKanjiReadingMeaningGroup.md +3 -3
package/docs/api/interfaces/DictKanjiWithRadicals.md +3 -3
package/docs/api/interfaces/DictMeaning.md +11 -11
package/docs/api/interfaces/DictRadical.md +7 -7
package/docs/api/interfaces/DictReading.md +5 -5
package/docs/api/interfaces/DictWord.md +19 -17
package/docs/api/interfaces/ExamplePart.md +7 -7
package/docs/api/interfaces/Grammar.md +15 -15
package/docs/api/interfaces/GrammarMeaning.md +3 -3
package/docs/api/interfaces/Kana.md +11 -11
package/docs/api/interfaces/Kanji.md +22 -22
package/docs/api/interfaces/KanjiComponent.md +3 -3
package/docs/api/interfaces/KanjiForm.md +4 -4
package/docs/api/interfaces/NoteAndTag.md +3 -3
package/docs/api/interfaces/Phrase.md +4 -4
package/docs/api/interfaces/Radical.md +16 -16
package/docs/api/interfaces/Reading.md +5 -5
package/docs/api/interfaces/ResultEntry.md +7 -7
package/docs/api/interfaces/TanakaExample.md +6 -6
package/docs/api/interfaces/Translation.md +3 -3
package/docs/api/interfaces/UsefulRegExps.md +9 -9
package/docs/api/interfaces/Word.md +16 -16
package/docs/api/type-aliases/Dict.md +1 -1
package/docs/api/type-aliases/DictName.md +1 -1
package/docs/api/type-aliases/EntryType.md +1 -1
package/docs/api/type-aliases/JLPT.md +1 -1
package/docs/api/type-aliases/Result.md +1 -1
package/package.json +1 -1

package/dist/index.mjs CHANGED Viewed

@@ -1168,10 +1168,18 @@ function convertJMdict(xmlString, examples) {
       noent: true,
       recover: false
     });
-    let dict = [];
-    const partMatches = /* @__PURE__ */ new Set();
+    const dict = [];
     xml.parseString(dictParsed, (err, result) => {
       if (err) throw err;
+      const tanakaParts = examples && examples.length > 0 ? new Set(
+        examples.map(
+          (example) => example.parts.map((part) => [
+            part.baseForm,
+            ...part.reading ? [part.reading] : [],
+            ...part.referenceID ? [part.referenceID] : []
+          ])
+        ).flat(2)
+      ) : void 0;
       if (result.JMdict && typeof result.JMdict === "object" && isValidArray(result.JMdict.entry))
         for (const entry of result.JMdict.entry) {
           const entryObj = {
@@ -1263,117 +1271,43 @@ function convertJMdict(xmlString, examples) {
               entryObj.usuallyInKana = true;
           }
           if (examples) {
-            const readings2 = entryObj.readings.filter(
-              (reading) => (!reading.notes || !reading.notes.some(
-                (note) => notSearchedForms.has(note)
-              )) && (entryObj.isCommon === void 0 || reading.commonness && reading.commonness.length > 0)
-            ).map((reading) => reading.reading);
-            const kanjiForms2 = entryObj.kanjiForms ? entryObj.kanjiForms.filter(
-              (kanjiForm) => (!kanjiForm.notes || !kanjiForm.notes.some(
-                (note) => notSearchedForms.has(note)
-              )) && (entryObj.isCommon === void 0 || kanjiForm.commonness && kanjiForm.commonness.length > 0)
-            ).map((kanjiForm) => kanjiForm.form) : void 0;
-            for (const reading of readings2) partMatches.add(reading);
-            if (kanjiForms2)
-              for (const kanjiForm of kanjiForms2) partMatches.add(kanjiForm);
-            partMatches.add(entryObj.id);
+            const readings2 = new Set(
+              entryObj.readings.filter(
+                (reading) => (!reading.notes || !reading.notes.some(
+                  (note) => notSearchedForms.has(note)
+                )) && (entryObj.isCommon === void 0 || reading.commonness && reading.commonness.length > 0)
+              ).map((reading) => reading.reading)
+            );
+            const kanjiForms2 = entryObj.kanjiForms ? new Set(
+              entryObj.kanjiForms.filter(
+                (kanjiForm) => (!kanjiForm.notes || !kanjiForm.notes.some(
+                  (note) => notSearchedForms.has(note)
+                )) && (entryObj.isCommon === void 0 || kanjiForm.commonness && kanjiForm.commonness.length > 0)
+              ).map((kanjiForm) => kanjiForm.form)
+            ) : void 0;
+            let existsExample = false;
+            if (kanjiForms2 && kanjiForms2.size > 0 && tanakaParts) {
+              for (const kf of kanjiForms2)
+                if (tanakaParts.has(kf)) {
+                  existsExample = true;
+                  break;
+                }
+            }
+            if (!existsExample && readings2.size > 0 && tanakaParts) {
+              for (const r of readings2)
+                if (tanakaParts.has(r)) {
+                  existsExample = true;
+                  break;
+                }
+            }
+            if (!existsExample && tanakaParts && tanakaParts.has(entryObj.id))
+              existsExample = true;
+            if (existsExample) entryObj.hasPhrases = true;
           }
           if (entryObj.id.length > 0 && entryObj.readings.length > 0 && entryObj.meanings.length > 0)
             dict.push(entryObj);
         }
     });
-    if (examples && dict.length > 0) {
-      const filteredExamples = examples.filter(
-        (ex) => {
-          const parts = ex.parts.flatMap((part) => [
-            part.baseForm,
-            ...part.reading ? [part.reading] : [],
-            ...part.referenceID ? [part.referenceID] : []
-          ]);
-          for (const part of parts) if (partMatches.has(part)) return true;
-          return false;
-        }
-      );
-      dict = dict.map((entryObj) => {
-        const readings = new Set(
-          entryObj.readings.filter(
-            (reading) => (!reading.notes || !reading.notes.some(
-              (note) => notSearchedForms.has(note)
-            )) && (entryObj.isCommon === void 0 || reading.commonness && reading.commonness.length > 0)
-          ).map((reading) => reading.reading)
-        );
-        const kanjiForms = entryObj.kanjiForms ? new Set(
-          entryObj.kanjiForms.filter(
-            (kanjiForm) => (!kanjiForm.notes || !kanjiForm.notes.some(
-              (note) => notSearchedForms.has(note)
-            )) && (entryObj.isCommon === void 0 || kanjiForm.commonness && kanjiForm.commonness.length > 0)
-          ).map((kanjiForm) => kanjiForm.form)
-        ) : void 0;
-        const kanjiFormExamples = [];
-        const readingMatchingKanjiFormExamples = [];
-        const readingExamples = [];
-        const partParts = /* @__PURE__ */ new Set();
-        for (const example of filteredExamples)
-          for (const part of example.parts) {
-            const readingAsReadingMatch = part.reading !== void 0 && readings.has(part.reading);
-            if (kanjiForms && kanjiForms.size > 0 && kanjiForms.has(part.baseForm)) {
-              if (readingAsReadingMatch) {
-                readingMatchingKanjiFormExamples.push(example);
-                partParts.add(part.baseForm).add(part.reading);
-              } else {
-                kanjiFormExamples.push(example);
-                partParts.add(part.baseForm);
-              }
-              break;
-            }
-            const readingAsBaseFormMatch = readings.has(part.baseForm);
-            const referenceIDMatch = part.referenceID !== void 0 && entryObj.id !== void 0 && part.referenceID === entryObj.id;
-            if (readingAsReadingMatch || readingAsBaseFormMatch || referenceIDMatch) {
-              readingExamples.push(example);
-              if (readingAsReadingMatch) partParts.add(part.reading);
-              if (readingAsBaseFormMatch) partParts.add(part.baseForm);
-              if (referenceIDMatch) partParts.add(part.referenceID);
-              break;
-            }
-          }
-        const exampleSize = readingMatchingKanjiFormExamples.length + kanjiFormExamples.length + readingExamples.length;
-        const includeKanjiFormExamples = readingMatchingKanjiFormExamples.length < Math.max(2, Math.round(exampleSize * 0.05));
-        const includeReadingExamples = entryObj.usuallyInKana === void 0 && includeKanjiFormExamples && readingExamples.length >= Math.max(10, Math.round(exampleSize * 0.15)) || entryObj.usuallyInKana === true && readingExamples.length >= Math.max(2, Math.round(exampleSize * 0.5));
-        let wordExamples = [
-          ...readingMatchingKanjiFormExamples,
-          ...includeKanjiFormExamples ? kanjiFormExamples : [],
-          ...includeReadingExamples ? readingExamples : []
-        ];
-        const glossSpecificExamples = [];
-        const seenPhrases = /* @__PURE__ */ new Set();
-        for (let i = 0; i < entryObj.meanings.length; i++) {
-          outer: for (const example of wordExamples) {
-            if (seenPhrases.has(example.phrase)) continue;
-            for (const part of example.parts)
-              if (part.glossNumber === i + 1 && (partParts.has(part.baseForm) || part.reading && partParts.has(part.reading) || part.referenceID && partParts.has(part.referenceID))) {
-                glossSpecificExamples.push(example);
-                seenPhrases.add(example.phrase);
-                break outer;
-              }
-          }
-          if (glossSpecificExamples.length === 5) break;
-        }
-        if (glossSpecificExamples.length === 5)
-          wordExamples = glossSpecificExamples;
-        else if (glossSpecificExamples.length > 0) {
-          const seenPhrases2 = new Set(
-            glossSpecificExamples.map((ex) => ex.phrase)
-          );
-          wordExamples = [
-            ...glossSpecificExamples,
-            ...wordExamples.filter((ex) => !seenPhrases2.has(ex.phrase)).slice(0, 5 - glossSpecificExamples.length)
-          ];
-        }
-        if (wordExamples.length > 0)
-          entryObj.phraseIDs = (wordExamples.length > 5 ? wordExamples.slice(0, 5) : wordExamples).map((ex) => ex.id);
-        return entryObj;
-      });
-    }
     return dict;
   } catch (err) {
     throw err;
@@ -1537,27 +1471,27 @@ function convertRadkFile(radkBuffer, kanjiDic) {
       if (line.startsWith("$ ")) {
         const radical = {
           radical: line.charAt(2),
-          kanji: [],
           strokes: line.substring(4)
         };
         let j = i + 1;
         let kanjiLine = fileParsed[j];
         if (!kanjiLine) continue;
+        const kanjiList = [];
         while (kanjiLine && !kanjiLine.startsWith("$ ")) {
           const kanjis = kanjiLine.split("");
           for (const kanji of kanjis) {
             const foundKanji = kanjiDic.find(
               (dictKanji) => dictKanji.kanji === kanji
             );
-            if (!foundKanji) throw new Error("Kanji not found");
-            radical.kanji.push(foundKanji);
+            if (foundKanji) kanjiList.push(foundKanji);
           }
           j++;
           kanjiLine = fileParsed[j];
           if (!kanjiLine) continue;
           if (kanjiLine.startsWith("$ ")) i = j - 1;
         }
-        if (radical.radical.length > 0 && radical.strokes.length > 0 && radical.kanji.length > 0)
+        if (kanjiList.length > 0) radical.kanji = kanjiList;
+        if (radical.radical.length > 0 && radical.strokes.length > 0)
           radicals.push(radical);
       }
     }
@@ -1778,16 +1712,83 @@ function getWord(dict, id, kanjiDic, examples, dictWord, noteTypeName, deckPath)
           }
         if (word.kanji.length === 0) delete word.kanji;
       }
-      if (examples && dictWord.phraseIDs && dictWord.phraseIDs.length > 0) {
-        word.phrases = [];
-        const phraseIDs = new Set(dictWord.phraseIDs);
-        for (const ex of examples)
-          if (phraseIDs.has(ex.id))
-            word.phrases.push({
-              phrase: ex.furigana ?? ex.phrase,
-              translation: ex.translation,
-              originalPhrase: ex.phrase
-            });
+      if (dictWord.hasPhrases === true && examples) {
+        const readings = new Set(
+          word.readings.filter(
+            (reading) => (!reading.notes || !reading.notes.some(
+              (note) => notSearchedForms.has(note)
+            )) && (word.common === void 0 || reading.common === true)
+          ).map((reading) => reading.reading)
+        );
+        const kanjiForms = word.kanjiForms ? new Set(
+          word.kanjiForms.filter(
+            (kanjiForm) => (!kanjiForm.notes || !kanjiForm.notes.some(
+              (note) => notSearchedForms.has(note)
+            )) && (word.common === void 0 || kanjiForm.common === true)
+          ).map((kanjiForm) => kanjiForm.kanjiForm)
+        ) : void 0;
+        const kanjiFormExamples = [];
+        const readingMatchingKanjiFormExamples = [];
+        const readingExamples = [];
+        const partParts = /* @__PURE__ */ new Set();
+        for (const example of examples)
+          for (const part of example.parts) {
+            const readingAsReadingMatch = part.reading !== void 0 && readings.has(part.reading);
+            if (kanjiForms && kanjiForms.size > 0 && kanjiForms.has(part.baseForm)) {
+              if (readingAsReadingMatch) {
+                readingMatchingKanjiFormExamples.push(example);
+                partParts.add(part.baseForm).add(part.reading);
+              } else {
+                kanjiFormExamples.push(example);
+                partParts.add(part.baseForm);
+              }
+              break;
+            }
+            const readingAsBaseFormMatch = readings.has(part.baseForm);
+            const referenceIDMatch = part.referenceID !== void 0 && word.id !== void 0 && part.referenceID === word.id;
+            if (readingAsReadingMatch || readingAsBaseFormMatch || referenceIDMatch) {
+              readingExamples.push(example);
+              if (readingAsReadingMatch) partParts.add(part.reading);
+              if (readingAsBaseFormMatch) partParts.add(part.baseForm);
+              if (referenceIDMatch) partParts.add(part.referenceID);
+              break;
+            }
+          }
+        const exampleSize = readingMatchingKanjiFormExamples.length + kanjiFormExamples.length + readingExamples.length;
+        const includeKanjiFormExamples = readingMatchingKanjiFormExamples.length < Math.max(2, Math.round(exampleSize * 0.05));
+        const includeReadingExamples = word.usuallyInKana === void 0 && includeKanjiFormExamples && readingExamples.length >= Math.max(10, Math.round(exampleSize * 0.15)) || word.usuallyInKana === true && readingExamples.length >= Math.max(2, Math.round(exampleSize * 0.5));
+        let wordExamples = [
+          ...readingMatchingKanjiFormExamples,
+          ...includeKanjiFormExamples ? kanjiFormExamples : [],
+          ...includeReadingExamples ? readingExamples : []
+        ];
+        const glossSpecificExamples = [];
+        const seenPhrases = /* @__PURE__ */ new Set();
+        for (let i = 0; i < word.translations.length; i++) {
+          outer: for (const example of wordExamples) {
+            if (seenPhrases.has(example.phrase)) continue;
+            for (const part of example.parts)
+              if (part.glossNumber === i + 1 && (partParts.has(part.baseForm) || part.reading && partParts.has(part.reading) || part.referenceID && partParts.has(part.referenceID))) {
+                glossSpecificExamples.push(example);
+                seenPhrases.add(example.phrase);
+                break outer;
+              }
+          }
+          if (glossSpecificExamples.length === 5) break;
+        }
+        if (glossSpecificExamples.length === 5)
+          wordExamples = [...glossSpecificExamples];
+        else if (glossSpecificExamples.length > 0)
+          wordExamples = [
+            ...glossSpecificExamples,
+            ...wordExamples.filter((ex) => !seenPhrases.has(ex.phrase)).slice(0, 5 - glossSpecificExamples.length)
+          ];
+        if (wordExamples.length > 0)
+          word.phrases = (wordExamples.length > 5 ? wordExamples.slice(0, 5) : wordExamples).map((ex) => ({
+            phrase: ex.furigana ?? ex.phrase,
+            translation: ex.translation,
+            originalPhrase: ex.phrase
+          }));
       }
       return word;
     } else throw new Error(`Word${id ? ` ${id}` : ""} not found`);