npm - twl-generator - Versions diffs - 1.4.7 → 1.4.9 - Mend

twl-generator 1.4.7 → 1.4.9

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (3)

package/package.json +1 -1
package/src/index.js +25 -7
package/src/utils/zipProcessor.js +11 -2

package/package.json CHANGED

@@ -1,6 +1,6 @@
 {
   "name": "twl-generator",
-  "version": "1.4.7",
+  "version": "1.4.9",
   "description": "Generate term-to-article lists from unfoldingWord en_tw archive for Bible books. Works in both Node.js (CLI) and React.js (browser) environments.",
   "main": "src/index.js",
   "bin": {

package/src/index.js CHANGED

@@ -866,17 +866,32 @@ export async function generateTwlByBook(bookCode, options = {}) {
   // Helpers for Variant of decision (allow only plural/-ed/-ing without marking variant)
   const pluralizeWord = (w) => {
-    return new Inflectors(w).toPlural();
+    if (/[^aeiou]y$/i.test(w)) return w.replace(/y$/i, 'ies');
+    if (/(s|x|z|ch|sh)$/i.test(w)) return w + 'es';
+    if (/f$/i.test(w) && !/(roof|belief|chief|proof)$/i.test(w)) return w.replace(/f$/i, 'ves');
+    if (/fe$/i.test(w)) return w.replace(/fe$/i, 'ves');
+    if (/o$/i.test(w)) return w + 'es';
+    return w + 's';
   };
+  const isVowel = (ch) => /[aeiou]/i.test(ch);
+  const isConsonant = (ch) => /[a-z]/i.test(ch) && !isVowel(ch);
+  const endsWithCVC = (w) => w.length >= 3 && isConsonant(w[w.length - 3]) && isVowel(w[w.length - 2]) && isConsonant(w[w.length - 1]) && !/[wxy]/i.test(w[w.length - 1]);
   const edForm = (w) => {
-    return new Inflectors(w).toPast()
+    if (/e$/i.test(w)) return w + 'd';
+    if (/[^aeiou]y$/i.test(w)) return w.replace(/y$/i, 'ied');
+    // Do not double the final consonant for words ending in "er" (e.g., gather -> gathered)
+    const lastCh = w[w.length - 1];
+    if (endsWithCVC(w) && !/(?:er|en|or|on|al)$/i.test(w)) return w + lastCh + 'ed';
+    return w + 'ed';
   };
   const ingForm = (w) => {
-    return new Inflectors(w).toGerund()
+    if (/ie$/i.test(w)) return w.replace(/ie$/i, 'ying');
+    if (/ee$/i.test(w)) return w + 'ing';
+    if (/e$/i.test(w)) return w.replace(/e$/i, 'ing');
+    const lastCh = w[w.length - 1];
+    if (endsWithCVC(w) && !/(?:er|en|or|on|al)$/i.test(w)) return w + lastCh + 'ing';
+    return w + 'ing';
   };
-  const singularForm = (w) => {
-    return new Inflectors(w).toSingular();
-  }
   const allowNoVariant = (base, match) => {
     const b = String(base || '');
@@ -888,9 +903,12 @@ export async function generateTwlByBook(bookCode, options = {}) {
     const last = parts[parts.length - 1];
     const allowed = new Set([
       head + pluralizeWord(last),
+      head + new Inflectors(last).toPlural(),
+      head + new Inflectors(last).toSingular(),
       head + edForm(last),
+      head + new Inflectors(last).toPast(),
       head + ingForm(last),
-      head + singularForm(last),
+      head + new Inflectors(last).toGerund(),
     ].map(x => x.toLowerCase()));
     return allowed.has(m.toLowerCase());
   };

package/src/utils/zipProcessor.js CHANGED

@@ -43,12 +43,21 @@ async function processZipBuffer(zipBuffer) {
     for (const term of terms) {
       // Normalize terms by removing parentheses and spaces before them
       // e.g., "Joseph (OT)" -> "Joseph", "Mary (sister of Martha)" -> "Mary"
-      const normalizedTerm = term.replace(/\s+\([^)]*\)$/, '').trim();
+      let normalizedTerm = term.replace(/\s+\([^)]*\)$/, '').trim();
+      // Strip leading articles, demonstratives, and possessive pronouns (allow repeated prefixes)
+      const prefixRegex = /^(?:(?:a|an|the|this|that|these|those|my|your|his|her|its|our|their)\s+)+/i;
+      let cleaned = normalizedTerm.trim();
+      while (prefixRegex.test(cleaned)) {
+        cleaned = cleaned.replace(prefixRegex, '').trim();
+      }
+      normalizedTerm = cleaned;
       if (!termMap[normalizedTerm]) {
         termMap[normalizedTerm] = [];
       }
-      termMap[normalizedTerm].push(truncated);
+      if (!termMap[normalizedTerm].includes(truncated)) {
+        termMap[normalizedTerm].push(truncated);
+      }
     }
   }