npm - @unlaxer/dde-toolkit - Versions diffs - 0.1.6 → 0.1.8 - Mend

@unlaxer/dde-toolkit 0.1.6 → 0.1.8

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (4) hide show

package/lib/dictionary.js CHANGED Viewed

@@ -110,7 +110,33 @@ export function buildDictionary(glossaryDir, dictionaryPath, lang = 'en') {
     }
   }
-  // 3. 文字数降順ソート（最長一致のため）
+  // 3. .ja.md の H1 から日本語用語を自動補完
+  //    dictionary.yaml に ja: エントリがない .ja.md が対象（lang=ja のみ）
+  if (lang === 'ja' && existsSync(glossaryDir)) {
+    const jaFiles = readdirSync(glossaryDir).filter(f => f.endsWith('.ja.md') && f !== 'README.ja.md');
+    for (const jaFile of jaFiles) {
+      const jaFilePath = join(glossaryDir, jaFile);
+      // 既に ja: エントリがあればスキップ
+      if (entries.some(e => e.file === jaFilePath && e.lang === 'ja')) continue;
+      // H1 から日本語用語を抽出
+      try {
+        const content = readFileSync(jaFilePath, 'utf8');
+        const h1Match = content.match(/^#\s+(.+)$/m);
+        if (!h1Match) continue;
+        const jaTerm = h1Match[1]
+          .replace(/（[^）]*）/g, '')  // 全角括弧内を削除
+          .replace(/\([^)]*\)/g, '')   // 半角括弧内を削除
+          .trim();
+        if (jaTerm) {
+          entries.push({ term: jaTerm, file: jaFilePath, lang: 'ja' });
+        }
+      } catch {
+        // 読み取り失敗は無視
+      }
+    }
+  }
+  // 4. 文字数降順ソート（最長一致のため）
   entries.sort((a, b) => b.term.length - a.term.length);
   return entries;

package/lib/markdown.js CHANGED Viewed

@@ -85,6 +85,7 @@ export function processMarkdown(content, dictionary, lang = 'en', sourceFile = n
  * テキスト内で用語の置換箇所を検出する
  * - 段落ごとに 1 用語 1 回まで
  * - 最長一致（辞書はすでに降順ソート済み）
+ * - ASCII 用語は単語境界チェックを適用（複合語内マッチを防ぐ）
  */
 function findReplacements(text, dictionary, alreadyMatched, lang) {
   // 使用済み範囲を追跡（重複マッチ防止）
@@ -95,7 +96,20 @@ function findReplacements(text, dictionary, alreadyMatched, lang) {
     if (entry.lang !== lang && entry.lang !== 'en') continue;
     if (alreadyMatched.has(entry.term)) continue;
-    const idx = text.indexOf(entry.term);
+    // 単語境界チェックが必要な ASCII 用語は、条件を満たす最初の出現を探す
+    let idx = -1;
+    const needsBoundary = isAsciiTerm(entry.term);
+    let searchFrom = 0;
+    while (true) {
+      const found = text.indexOf(entry.term, searchFrom);
+      if (found === -1) break;
+      if (needsBoundary && !hasWordBoundary(text, found, found + entry.term.length)) {
+        searchFrom = found + 1;
+        continue;
+      }
+      idx = found;
+      break;
+    }
     if (idx === -1) continue;
     // 重複範囲チェック
@@ -113,6 +127,23 @@ function findReplacements(text, dictionary, alreadyMatched, lang) {
   return replacements;
 }
+/**
+ * Returns true only when `term` is non-empty and consists solely of ASCII characters (U+0000–U+007F); Japanese and other non-ASCII terms yield false.
+ */
+function isAsciiTerm(term) {
+  return /^[\x00-\x7F]+$/.test(term);
+}
+/**
+ * Returns true when neither the character just before `start` nor the character at index `end` of `text` is a word character (\w); the edges of `text` count as boundaries.
+ */
+function hasWordBoundary(text, start, end) {
+  const wordChar = /\w/;
+  if (start > 0 && wordChar.test(text[start - 1])) return false;
+  if (end < text.length && wordChar.test(text[end])) return false;
+  return true;
+}
 /**
  * テキストと置換リストから AST ノード配列を生成
  * @param {string} sourceFile - リンクを埋め込むファイルのパス（相対パス計算用）
@@ -185,7 +216,21 @@ export function findUnlinked(content, dictionary, lang = 'en') {
     for (const entry of dictionary) {
       if (entry.lang !== lang && entry.lang !== 'en') continue;
-      if (node.value.includes(entry.term)) {
+      const text = node.value;
+      const needsBoundary = isAsciiTerm(entry.term);
+      let found = false;
+      let searchFrom = 0;
+      while (true) {
+        const idx = text.indexOf(entry.term, searchFrom);
+        if (idx === -1) break;
+        if (needsBoundary && !hasWordBoundary(text, idx, idx + entry.term.length)) {
+          searchFrom = idx + 1;
+          continue;
+        }
+        found = true;
+        break;
+      }
+      if (found) {
         const key = entry.term;
         if (!unlinked.has(key)) {
           unlinked.set(key, { term: entry.term, file: entry.file, count: 0 });

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@unlaxer/dde-toolkit",
-  "version": "0.1.6",
+  "version": "0.1.8",
   "description": "Document Deficit Extraction — find what's not understood in your docs",
   "license": "MIT",
   "type": "module",

package/version.txt CHANGED Viewed

	@@ -1 +1 @@
1	- 0.1.6
1	+ 0.1.8