npm - sigmap - Versions diffs - 7.21.0 → 7.22.1 - Mend

sigmap 7.21.0 → 7.22.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (11)

package/CHANGELOG.md +21 -0
package/README.md +1 -1
package/gen-context.js +197 -184
package/llms-full.txt +2 -2
package/llms.txt +2 -2
package/package.json +1 -1
package/packages/cli/package.json +1 -1
package/packages/core/package.json +1 -1
package/src/eval/llm-ablation.js +58 -32
package/src/mcp/server.js +1 -1
package/src/verify/parsers.js +14 -0

package/CHANGELOG.md CHANGED Viewed

@@ -10,6 +10,27 @@ Format: [Semantic Versioning](https://semver.org/)
 ---
+## [7.22.1] — 2026-06-18
+Patch release — hardens the `verify-ai-output` file-path extractor against the dominant false-positive class.
+### Fixed
+- **`verify-ai-output` no longer flags runtime/library names or placeholder filenames (#347):** `extractFilePaths` now skips well-known `X.js` product names (`node.js`, `next.js`, `vue.js`, `express.js`, `three.js`, `d3.js`, …) and illustrative placeholder basenames (`example`/`sample`/`demo`/`placeholder`, including `minimal-example.js`). Genuine repo-shaped paths (`src/foo/bar.js`, `main.js`, `index.ts`) are still extracted, so real hallucinations are unaffected. This removes the dominant Hallucination Guard false-positive class — in the §9 ablation, 22 of ~34 flags were literally "Node.js" — turning the directional grounding delta into a clean signal. The bundled `src/verify/parsers` factory was regenerated for standalone-binary parity.
+---
+## [7.22.0] — 2026-06-18
+Minor release — realistic §9 ablation (real-symbol corpus, exact-signature grounding, --verbose) + Gemini model fix.
+### Added
+- **Realistic §9 ablation — real-symbol corpus, exact-signature grounding, `--verbose` (#344):** the LLM A/B ablation now measures something meaningful. `buildGrounding` emits **exact signatures grouped by file** (what `get_callee_signatures` returns, bounded by `maxSignatures`) instead of a flat symbol-name dump — the real product behavior. New `scripts/gen-ablation-corpus.mjs` generates ~40 tasks from the repo's actual exported symbols/files (`benchmarks/llm-ablation-tasks.json`). `src/eval/llm-ablation.js` adds `scoreAnswerDetail` (count + issues) and `runAblation`'s `collectIssues`; the runner's `--verbose` prints every flagged item per arm. A 40-task Gemini run showed grounding reduced flagged errors 62.5 → 22.5 per 100 (directionally positive vs the earlier 4-task noise) — and `--verbose` revealed most flags are `verify-ai-output` file-path false-positives (e.g. "Node.js"), the next thing to harden before publishing a number.
+### Fixed
+- **Gemini default model (#343):** the ablation runner's default `gemini-2.0-flash` was retired by AI Studio (404 NOT_FOUND); the default is now the live `gemini-2.5-flash`. The `--model` flag selects any model.
+---
 ## [7.21.0] — 2026-06-18
 Minor release — LLM ablation runner gains a Gemini (AI Studio) provider.

package/README.md CHANGED Viewed

@@ -88,7 +88,7 @@ Ask → Rank → Context → Validate → Judge → Learn
 ```
 Benchmark : sigmap-v7.0-main (21 repositories, including R language)
-Date      : 2026-06-14
+Date      : 2026-06-18
 Hit@5          : 75.6%   (baseline 13.6%  — 5.6× lift)
 Token reduction: 97.0%   (across 21 repos)

package/gen-context.js CHANGED Viewed

@@ -7931,7 +7931,7 @@ __factories["./src/mcp/server"] = function(module, exports) {
   const SERVER_INFO = {
     name: 'sigmap',
-    version: '7.21.0',
+    version: '7.22.1',
     description: 'SigMap MCP server — code signatures on demand',
   };
@@ -12756,207 +12756,220 @@ module.exports = { checkStarNudge, readUsage, usagePath, showStarNudge, RUN_THRE
 // ── ./src/verify/parsers ──
 __factories["./src/verify/parsers"] = function(module, exports) {
-'use strict';
+  /**
+   * Parsers for the Hallucination Guard (verify-ai-output).
+   *
+   * Extract the verifiable claims an AI answer makes about a codebase:
+   *   - file paths it references
+   *   - import / require statements it shows
+   *   - function / class symbols it calls
+   *   - fenced code blocks (so callers can scope checks to code vs prose)
+   *
+   * Everything here is deterministic and offline — pure string analysis.
+   */
-/**
- * Parsers for the Hallucination Guard (verify-ai-output).
- *
- * Extract the verifiable claims an AI answer makes about a codebase:
- *   - file paths it references
- *   - import / require statements it shows
- *   - function / class symbols it calls
- *   - fenced code blocks (so callers can scope checks to code vs prose)
- *
- * Everything here is deterministic and offline — pure string analysis.
- */
+  // Extensions we are confident name a source/code/config file (no slash required).
+  const KNOWN_CODE_EXT = new Set([
+    'js', 'jsx', 'mjs', 'cjs', 'ts', 'tsx', 'py', 'pyw', 'rb', 'go', 'rs',
+    'java', 'kt', 'swift', 'c', 'h', 'cpp', 'hpp', 'cs', 'php', 'r',
+    'vue', 'svelte', 'css', 'scss', 'less', 'html', 'json', 'yml', 'yaml',
+    'toml', 'xml', 'sql', 'graphql', 'gql', 'proto', 'tf', 'md', 'sh',
+    'gd', 'gdscript',
+  ]);
-// Extensions we are confident name a source/code/config file (no slash required).
-const KNOWN_CODE_EXT = new Set([
-  'js', 'jsx', 'mjs', 'cjs', 'ts', 'tsx', 'py', 'pyw', 'rb', 'go', 'rs',
-  'java', 'kt', 'swift', 'c', 'h', 'cpp', 'hpp', 'cs', 'php', 'r',
-  'vue', 'svelte', 'css', 'scss', 'less', 'html', 'json', 'yml', 'yaml',
-  'toml', 'xml', 'sql', 'graphql', 'gql', 'proto', 'tf', 'md', 'sh',
-  'gd', 'gdscript',
-]);
+  // Well-known "X.js" runtime/library product names — never repo files.
+  const LIBRARY_TOKENS = new Set([
+    'node.js', 'next.js', 'nuxt.js', 'vue.js', 'react.js', 'express.js', 'koa.js',
+    'nest.js', 'three.js', 'd3.js', 'chart.js', 'ember.js', 'backbone.js',
+    'angular.js', 'meteor.js', 'moment.js', 'anime.js', 'p5.js', 'next.config.js',
+  ]);
-/**
- * Extract fenced code blocks.
- * @param {string} text
- * @returns {{ lang: string, content: string, line: number }[]}
- */
-function extractCodeBlocks(text) {
-  const blocks = [];
-  const lines = text.split('\n');
-  let inBlock = false;
-  let lang = '';
-  let buf = [];
-  let startLine = 0;
-  for (let i = 0; i < lines.length; i++) {
-    const m = lines[i].match(/^```(\w*)/);
-    if (m) {
-      if (!inBlock) {
-        inBlock = true;
-        lang = m[1] || '';
-        buf = [];
-        startLine = i + 2; // first content line (1-based)
-      } else {
-        blocks.push({ lang, content: buf.join('\n'), line: startLine });
-        inBlock = false;
+  // Illustrative placeholder names the model writes in prose, not repo claims:
+  // e.g. example.js, minimal-example.js, sample.ts, demo.js, placeholder.js.
+  const PLACEHOLDER_RE = /(?:^|[-_.])(?:example|sample|demo|placeholder)(?:[-_.]|$)/i;
+  /**
+   * Extract fenced code blocks.
+   * @param {string} text
+   * @returns {{ lang: string, content: string, line: number }[]}
+   */
+  function extractCodeBlocks(text) {
+    const blocks = [];
+    const lines = text.split('\n');
+    let inBlock = false;
+    let lang = '';
+    let buf = [];
+    let startLine = 0;
+    for (let i = 0; i < lines.length; i++) {
+      const m = lines[i].match(/^```(\w*)/);
+      if (m) {
+        if (!inBlock) {
+          inBlock = true;
+          lang = m[1] || '';
+          buf = [];
+          startLine = i + 2; // first content line (1-based)
+        } else {
+          blocks.push({ lang, content: buf.join('\n'), line: startLine });
+          inBlock = false;
+        }
+        continue;
       }
-      continue;
+      if (inBlock) buf.push(lines[i]);
     }
-    if (inBlock) buf.push(lines[i]);
+    return blocks;
   }
-  return blocks;
-}
-/**
- * Extract file-path references (deduped, first-seen line kept).
- * A token counts as a path when it has a `.<letter…>` extension AND
- * either contains a `/` or carries a known code/config extension.
- * @param {string} text
- * @returns {{ path: string, line: number }[]}
- */
-function extractFilePaths(text) {
-  const lines = text.split('\n');
-  const seen = new Map();
-  const re = /(?:^|[\s`"'(\[<])([A-Za-z0-9_][\w./-]*\.[A-Za-z][A-Za-z0-9]*)/g;
-  for (let i = 0; i < lines.length; i++) {
-    const line = lines[i];
-    let m;
-    re.lastIndex = 0;
-    while ((m = re.exec(line)) !== null) {
-      const p = m[1];
-      if (/^https?:/i.test(p)) continue;
-      const ext = (p.split('.').pop() || '').toLowerCase();
-      const hasSlash = p.includes('/');
-      if (!hasSlash && !KNOWN_CODE_EXT.has(ext)) continue;
-      if (!seen.has(p)) seen.set(p, i + 1);
+  /**
+   * Extract file-path references (deduped, first-seen line kept).
+   * A token counts as a path when it has a `.<letter…>` extension AND
+   * either contains a `/` or carries a known code/config extension.
+   * @param {string} text
+   * @returns {{ path: string, line: number }[]}
+   */
+  function extractFilePaths(text) {
+    const lines = text.split('\n');
+    const seen = new Map();
+    const re = /(?:^|[\s`"'(\[<])([A-Za-z0-9_][\w./-]*\.[A-Za-z][A-Za-z0-9]*)/g;
+    for (let i = 0; i < lines.length; i++) {
+      const line = lines[i];
+      let m;
+      re.lastIndex = 0;
+      while ((m = re.exec(line)) !== null) {
+        const p = m[1];
+        if (/^https?:/i.test(p)) continue;
+        const ext = (p.split('.').pop() || '').toLowerCase();
+        const hasSlash = p.includes('/');
+        if (!hasSlash && !KNOWN_CODE_EXT.has(ext)) continue;
+        if (LIBRARY_TOKENS.has(p.toLowerCase())) continue;
+        const base = p.split('/').pop();
+        if (PLACEHOLDER_RE.test(base)) continue;
+        if (!seen.has(p)) seen.set(p, i + 1);
+      }
     }
+    return [...seen.entries()].map(([p, line]) => ({ path: p, line }));
   }
-  return [...seen.entries()].map(([p, line]) => ({ path: p, line }));
-}
-/**
- * Extract import / require statements.
- * @param {string} text
- * @returns {{ module: string, kind: 'js'|'py', relative: boolean, line: number, raw: string }[]}
- */
-function extractImports(text) {
-  const lines = text.split('\n');
-  const out = [];
-  const push = (module, kind, line, raw) => {
-    if (!module) return;
-    out.push({ module, kind, relative: /^[./]/.test(module), line, raw: raw.trim() });
-  };
-  for (let i = 0; i < lines.length; i++) {
-    const line = lines[i];
-    let m;
-    // JS/TS: import ... from 'x'  |  export ... from 'x'
-    if ((m = line.match(/\b(?:import|export)\b[^'"]*\bfrom\s*['"]([^'"]+)['"]/))) {
-      push(m[1], 'js', i + 1, line);
-    } else if ((m = line.match(/\bimport\s*['"]([^'"]+)['"]/))) {
-      // side-effect import 'x'
-      push(m[1], 'js', i + 1, line);
-    }
-    // require('x') / dynamic import('x') — may co-occur, scan separately
-    const reqRe = /\b(?:require|import)\s*\(\s*['"]([^'"]+)['"]\s*\)/g;
-    let r;
-    while ((r = reqRe.exec(line)) !== null) push(r[1], 'js', i + 1, line);
-    // TS: import X = require('mod')
-    if ((m = line.match(/\bimport\s+[A-Za-z_$][\w$]*\s*=\s*require\s*\(\s*['"]([^'"]+)['"]\s*\)/))) {
-      push(m[1], 'js', i + 1, line);
-    }
-    // Python: from x import y  |  import x
-    if ((m = line.match(/^\s*from\s+([.\w]+)\s+import\b/))) {
-      push(m[1], 'py', i + 1, line);
-    } else if ((m = line.match(/^\s*import\s+([A-Za-z_][\w.]*)/))) {
-      push(m[1], 'py', i + 1, line);
-    }
-  }
-  // Multi-line JS/TS imports, e.g.
-  //   import {
-  //     A as B,
-  //   } from './mod';
-  // The per-line pass above misses these because `from '…'` sits on a later
-  // line. Trigger only when the opening line has no quote and no `from` yet,
-  // then gather forward until the source string appears.
-  for (let i = 0; i < lines.length; i++) {
-    const start = lines[i];
-    if (!/^\s*(?:import|export)\b/.test(start)) continue;
-    if (/['"]/.test(start) || /\bfrom\b/.test(start)) continue; // single-line, already handled
-    let joined = start;
-    for (let j = i + 1; j < Math.min(lines.length, i + 12); j++) {
-      joined += ' ' + lines[j];
-      const fm = joined.match(/\bfrom\s*['"]([^'"]+)['"]/);
-      if (fm) { push(fm[1], 'js', i + 1, start.trim()); break; }
-      if (/['"]/.test(lines[j]) && !/\bfrom\b/.test(joined)) break; // a string that isn't a source — bail
+  /**
+   * Extract import / require statements.
+   * @param {string} text
+   * @returns {{ module: string, kind: 'js'|'py', relative: boolean, line: number, raw: string }[]}
+   */
+  function extractImports(text) {
+    const lines = text.split('\n');
+    const out = [];
+    const push = (module, kind, line, raw) => {
+      if (!module) return;
+      out.push({ module, kind, relative: /^[./]/.test(module), line, raw: raw.trim() });
+    };
+    for (let i = 0; i < lines.length; i++) {
+      const line = lines[i];
+      let m;
+      // JS/TS: import ... from 'x'  |  export ... from 'x'
+      if ((m = line.match(/\b(?:import|export)\b[^'"]*\bfrom\s*['"]([^'"]+)['"]/))) {
+        push(m[1], 'js', i + 1, line);
+      } else if ((m = line.match(/\bimport\s*['"]([^'"]+)['"]/))) {
+        // side-effect import 'x'
+        push(m[1], 'js', i + 1, line);
+      }
+      // require('x') / dynamic import('x') — may co-occur, scan separately
+      const reqRe = /\b(?:require|import)\s*\(\s*['"]([^'"]+)['"]\s*\)/g;
+      let r;
+      while ((r = reqRe.exec(line)) !== null) push(r[1], 'js', i + 1, line);
+      // TS: import X = require('mod')
+      if ((m = line.match(/\bimport\s+[A-Za-z_$][\w$]*\s*=\s*require\s*\(\s*['"]([^'"]+)['"]\s*\)/))) {
+        push(m[1], 'js', i + 1, line);
+      }
+      // Python: from x import y  |  import x
+      if ((m = line.match(/^\s*from\s+([.\w]+)\s+import\b/))) {
+        push(m[1], 'py', i + 1, line);
+      } else if ((m = line.match(/^\s*import\s+([A-Za-z_][\w.]*)/))) {
+        push(m[1], 'py', i + 1, line);
+      }
+    }
+    // Multi-line JS/TS imports, e.g.
+    //   import {
+    //     A as B,
+    //   } from './mod';
+    // The per-line pass above misses these because `from '…'` sits on a later
+    // line. Trigger only when the opening line has no quote and no `from` yet,
+    // then gather forward until the source string appears.
+    for (let i = 0; i < lines.length; i++) {
+      const start = lines[i];
+      if (!/^\s*(?:import|export)\b/.test(start)) continue;
+      if (/['"]/.test(start) || /\bfrom\b/.test(start)) continue; // single-line, already handled
+      let joined = start;
+      for (let j = i + 1; j < Math.min(lines.length, i + 12); j++) {
+        joined += ' ' + lines[j];
+        const fm = joined.match(/\bfrom\s*['"]([^'"]+)['"]/);
+        if (fm) { push(fm[1], 'js', i + 1, start.trim()); break; }
+        if (/['"]/.test(lines[j]) && !/\bfrom\b/.test(joined)) break; // a string that isn't a source — bail
+      }
     }
+    return out;
   }
-  return out;
-}
-/**
- * Extract npm/pnpm/yarn script invocations (`npm run <name>`).
- * Only the explicit `run` form is matched, to avoid confusing package-manager
- * subcommands (`yarn add`, `pnpm install`) with script names.
- * @param {string} text
- * @returns {{ name: string, line: number }[]}
- */
-function extractNpmScripts(text) {
-  const lines = text.split('\n');
-  const out = [];
-  const seen = new Set();
-  const re = /\b(?:npm|pnpm|yarn)\s+run(?:-script)?\s+([A-Za-z0-9:_-]+)/g;
-  for (let i = 0; i < lines.length; i++) {
-    let m;
-    re.lastIndex = 0;
-    while ((m = re.exec(lines[i])) !== null) {
-      const name = m[1];
-      if (seen.has(name)) continue;
-      seen.add(name);
-      out.push({ name, line: i + 1 });
+  /**
+   * Extract npm/pnpm/yarn script invocations (`npm run <name>`).
+   * Only the explicit `run` form is matched, to avoid confusing package-manager
+   * subcommands (`yarn add`, `pnpm install`) with script names.
+   * @param {string} text
+   * @returns {{ name: string, line: number }[]}
+   */
+  function extractNpmScripts(text) {
+    const lines = text.split('\n');
+    const out = [];
+    const seen = new Set();
+    const re = /\b(?:npm|pnpm|yarn)\s+run(?:-script)?\s+([A-Za-z0-9:_-]+)/g;
+    for (let i = 0; i < lines.length; i++) {
+      let m;
+      re.lastIndex = 0;
+      while ((m = re.exec(lines[i])) !== null) {
+        const name = m[1];
+        if (seen.has(name)) continue;
+        seen.add(name);
+        out.push({ name, line: i + 1 });
+      }
     }
+    return out;
   }
-  return out;
-}
-/**
- * Extract function/class symbol references that look like calls.
- * Restricted to backtick-wrapped calls (`foo(...)`) for high precision.
- * @param {string} text
- * @returns {{ name: string, line: number }[]}
- */
-function extractSymbols(text) {
-  const lines = text.split('\n');
-  const out = [];
-  const seen = new Set();
-  const re = /`([A-Za-z_$][\w$]*)\s*\([^`]*\)`/g;
-  for (let i = 0; i < lines.length; i++) {
-    let m;
-    re.lastIndex = 0;
-    while ((m = re.exec(lines[i])) !== null) {
-      const name = m[1];
-      const key = name + '@' + (i + 1);
-      if (seen.has(key)) continue;
-      seen.add(key);
-      out.push({ name, line: i + 1 });
+  /**
+   * Extract function/class symbol references that look like calls.
+   * Restricted to backtick-wrapped calls (`foo(...)`) for high precision.
+   * @param {string} text
+   * @returns {{ name: string, line: number }[]}
+   */
+  function extractSymbols(text) {
+    const lines = text.split('\n');
+    const out = [];
+    const seen = new Set();
+    const re = /`([A-Za-z_$][\w$]*)\s*\([^`]*\)`/g;
+    for (let i = 0; i < lines.length; i++) {
+      let m;
+      re.lastIndex = 0;
+      while ((m = re.exec(lines[i])) !== null) {
+        const name = m[1];
+        const key = name + '@' + (i + 1);
+        if (seen.has(key)) continue;
+        seen.add(key);
+        out.push({ name, line: i + 1 });
+      }
     }
+    return out;
   }
-  return out;
-}
-module.exports = {
-  extractCodeBlocks,
-  extractFilePaths,
-  extractImports,
-  extractSymbols,
-  extractNpmScripts,
-};
+  module.exports = {
+    extractCodeBlocks,
+    extractFilePaths,
+    extractImports,
+    extractSymbols,
+    extractNpmScripts,
+  };
 };
 // ── ./src/verify/closest-match ──
@@ -13609,7 +13622,7 @@ function __tryGit(args, opts = {}) {
   catch (_) { return ''; }
 }
-const VERSION = '7.21.0';
+const VERSION = '7.22.1';
 const MARKER = '\n\n## Auto-generated signatures\n<!-- Updated by gen-context.js -->\n';
 function requireSourceOrBundled(key) {

package/llms-full.txt CHANGED Viewed

@@ -9,13 +9,13 @@ the files relevant to the task — cutting tokens ~97% while keeping answers
 grounded. Deterministic, offline, no embeddings or vector database. Works with
 Claude, Cursor, GitHub Copilot, Aider, Windsurf, local LLMs, and MCP.
-# Version: 7.21.0 | Benchmark: sigmap-v7.0-main (2026-06-14)
+# Version: 7.22.1 | Benchmark: sigmap-v7.0-main (2026-06-18)
 # Source: auto-generated from package.json, version.json, src/mcp/tools.js, src/config/defaults.js
 # Regenerate: npm run generate:llms   |   Validate: npm run validate:llms
 ---
-## Core metrics (benchmark: sigmap-v7.0-main, 2026-06-14)
+## Core metrics (benchmark: sigmap-v7.0-main, 2026-06-18)
 | Metric | Without SigMap | With SigMap |
 |--------|----------------|-------------|

package/llms.txt CHANGED Viewed

@@ -9,7 +9,7 @@ the files relevant to the task — cutting tokens ~97% while keeping answers
 grounded. Deterministic, offline, no embeddings or vector database. Works with
 Claude, Cursor, GitHub Copilot, Aider, Windsurf, local LLMs, and MCP.
-# Version: 7.21.0 | Benchmark: sigmap-v7.0-main (2026-06-14)
+# Version: 7.22.1 | Benchmark: sigmap-v7.0-main (2026-06-18)
 # Source: auto-generated from package.json, version.json, src/mcp/tools.js, src/config/defaults.js
 # Regenerate: npm run generate:llms   |   Validate: npm run validate:llms
@@ -21,7 +21,7 @@ Claude, Cursor, GitHub Copilot, Aider, Windsurf, local LLMs, and MCP.
 - No blast-radius awareness before editing a hub file — `--impact` shows every file a change touches.
 - Pasted stack traces, CI logs, and JSON bloat the prompt — `squeeze` minimizes them and enriches the top frame from the symbol index.
-## Core metrics (benchmark: sigmap-v7.0-main, 2026-06-14)
+## Core metrics (benchmark: sigmap-v7.0-main, 2026-06-18)
 - hit@5 retrieval: 75.6% vs 13.6% random baseline (5.6× lift)
 - Token reduction: 97.0% average across benchmark repos

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "sigmap",
-  "version": "7.21.0",
+  "version": "7.22.1",
   "description": "97% token reduction for AI coding. Extracts function & class signatures with TF-IDF ranking to feed only the right files to Claude, Cursor, Copilot, Aider, Windsurf, local LLMs & MCP. Zero dependencies, runs offline via npx.",
   "main": "packages/core/index.js",
   "exports": {

package/packages/cli/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "sigmap-cli",
-  "version": "7.21.0",
+  "version": "7.22.1",
   "description": "SigMap CLI wrapper — thin adapter for programmatic CLI invocation",
   "main": "index.js",
   "keywords": [

package/packages/core/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "sigmap-core",
-  "version": "7.21.0",
+  "version": "7.22.1",
   "description": "SigMap core library — zero-dependency code signature extraction, retrieval, and security scanning",
   "main": "index.js",
   "keywords": [

package/src/eval/llm-ablation.js CHANGED Viewed

@@ -13,59 +13,82 @@
 const { verify } = require('../verify/hallucination-guard');
+const path = require('path');
+/** Strip a signature's trailing line anchor (` :12-20`) for prompt cleanliness. */
+function _cleanSig(sig) {
+  return String(sig).replace(/\s*:\d+(?:-\d+)?\s*$/, '').trim();
+}
 /**
  * Build the SigMap grounding block for a repo — what we prepend to a task
- * prompt in arm B. Conventions (the house style) + the known-symbol list
- * (so the model can reference real names instead of guessing).
+ * prompt in arm B. Conventions (the house style) + **exact signatures** grouped
+ * by file (what `get_callee_signatures` returns), so the model references the
+ * real surface instead of guessing — the actual product behavior, not a flat
+ * name dump.
  * @param {string} cwd
  * @param {object} [opts]
- * @param {number} [opts.maxSymbols=80]
+ * @param {number} [opts.maxSignatures=150] cap on signature lines (bounds prompt size)
  * @returns {string}
  */
 function buildGrounding(cwd, opts = {}) {
-  const maxSymbols = opts.maxSymbols != null ? opts.maxSymbols : 80;
+  const maxSignatures = opts.maxSignatures != null ? opts.maxSignatures : 150;
   const parts = [];
+  let index = null;
   try {
-    const { extractConventions } = require('../conventions/extract');
-    const { renderConventionsBlock } = require('../conventions/inject');
-    const { loadConfig } = require('../config/loader');
-    let files = [];
-    try {
-      const cfg = loadConfig(cwd);
-      const { buildSigIndex } = require('../retrieval/ranker');
-      files = [...buildSigIndex(cwd).keys()];
-      void cfg;
-    } catch (_) {}
-    const conv = extractConventions(cwd, files);
-    parts.push(renderConventionsBlock(conv));
+    const { buildSigIndex } = require('../retrieval/ranker');
+    index = buildSigIndex(cwd);
   } catch (_) {}
   try {
-    const { buildSymbolSet } = require('../verify/hallucination-guard');
-    const { set } = buildSymbolSet(cwd);
-    const names = [...set].slice(0, maxSymbols);
-    if (names.length) parts.push(`## Known symbols (reference these exactly)\n${names.join(', ')}`);
+    const { extractConventions } = require('../conventions/extract');
+    const { renderConventionsBlock } = require('../conventions/inject');
+    const files = index ? [...index.keys()] : [];
+    parts.push(renderConventionsBlock(extractConventions(cwd, files)));
   } catch (_) {}
+  if (index) {
+    const lines = ['## Exact signatures (use these — do not invent symbols or paths)'];
+    let count = 0;
+    for (const [file, sigs] of index) {
+      if (count >= maxSignatures) break;
+      const rel = path.relative(cwd, file).replace(/\\/g, '/');
+      const clean = (sigs || []).map(_cleanSig).filter(Boolean);
+      if (!clean.length) continue;
+      lines.push(`### ${rel}`);
+      for (const s of clean) {
+        if (count >= maxSignatures) break;
+        lines.push(s);
+        count++;
+      }
+    }
+    if (count > 0) parts.push(lines.join('\n'));
+  }
   return parts.join('\n\n');
 }
 /**
- * Count flagged codebase-fact errors in an answer (the §9 metric).
+ * Score an answer: flagged codebase-fact errors + the issue list (the §9 metric).
  * @param {string} answerText
  * @param {string} cwd
- * @returns {number}
+ * @returns {{ total: number, issues: object[] }}
  */
-function scoreAnswer(answerText, cwd) {
+function scoreAnswerDetail(answerText, cwd) {
   try {
-    const { summary } = verify(String(answerText || ''), cwd);
-    return summary.total || 0;
+    const { issues, summary } = verify(String(answerText || ''), cwd);
+    return { total: summary.total || 0, issues: issues || [] };
   } catch (_) {
-    return 0;
+    return { total: 0, issues: [] };
   }
 }
+/** Count flagged codebase-fact errors in an answer (the §9 metric). */
+function scoreAnswer(answerText, cwd) {
+  return scoreAnswerDetail(answerText, cwd).total;
+}
 /**
  * Run the A/B ablation over a task corpus.
  * @param {Array<{id:string, prompt:string}>} tasks
@@ -73,6 +96,7 @@ function scoreAnswer(answerText, cwd) {
  * @param {(prompt:string, meta:object)=>string} complete injected model call
  * @param {object} [opts]
  * @param {string} [opts.grounding] precomputed grounding (else built from cwd)
+ * @param {boolean} [opts.collectIssues] attach `aIssues`/`bIssues` per task
  * @returns {{ tasks: object[], aggregate: object }}
  */
 function runAblation(tasks, cwd, complete, opts = {}) {
@@ -88,11 +112,13 @@ function runAblation(tasks, cwd, complete, opts = {}) {
     const outA = String(complete(basePrompt, { id: task.id, grounded: false }) || '');
     const outB = String(complete(groundedPrompt, { id: task.id, grounded: true }) || '');
-    const aFlagged = scoreAnswer(outA, cwd);
-    const bFlagged = scoreAnswer(outB, cwd);
-    sumA += aFlagged;
-    sumB += bFlagged;
-    rows.push({ id: task.id, aFlagged, bFlagged });
+    const a = scoreAnswerDetail(outA, cwd);
+    const b = scoreAnswerDetail(outB, cwd);
+    sumA += a.total;
+    sumB += b.total;
+    const row = { id: task.id, aFlagged: a.total, bFlagged: b.total };
+    if (opts.collectIssues) { row.aIssues = a.issues; row.bIssues = b.issues; }
+    rows.push(row);
   }
   const n = rows.length;
@@ -110,4 +136,4 @@ function runAblation(tasks, cwd, complete, opts = {}) {
   };
 }
-module.exports = { buildGrounding, scoreAnswer, runAblation };
+module.exports = { buildGrounding, scoreAnswer, scoreAnswerDetail, runAblation };

package/src/mcp/server.js CHANGED Viewed

@@ -18,7 +18,7 @@ const { readContext, searchSignatures, getMap, createCheckpoint, getRouting, exp
 const SERVER_INFO = {
   name: 'sigmap',
-  version: '7.21.0',
+  version: '7.22.1',
   description: 'SigMap MCP server — code signatures on demand',
 };

package/src/verify/parsers.js CHANGED Viewed

@@ -21,6 +21,17 @@ const KNOWN_CODE_EXT = new Set([
   'gd', 'gdscript',
 ]);
+// Well-known "X.js" runtime/library product names — never repo files.
+const LIBRARY_TOKENS = new Set([
+  'node.js', 'next.js', 'nuxt.js', 'vue.js', 'react.js', 'express.js', 'koa.js',
+  'nest.js', 'three.js', 'd3.js', 'chart.js', 'ember.js', 'backbone.js',
+  'angular.js', 'meteor.js', 'moment.js', 'anime.js', 'p5.js', 'next.config.js',
+]);
+// Illustrative placeholder names the model writes in prose, not repo claims:
+// e.g. example.js, minimal-example.js, sample.ts, demo.js, placeholder.js.
+const PLACEHOLDER_RE = /(?:^|[-_.])(?:example|sample|demo|placeholder)(?:[-_.]|$)/i;
 /**
  * Extract fenced code blocks.
  * @param {string} text
@@ -73,6 +84,9 @@ function extractFilePaths(text) {
       const ext = (p.split('.').pop() || '').toLowerCase();
       const hasSlash = p.includes('/');
       if (!hasSlash && !KNOWN_CODE_EXT.has(ext)) continue;
+      if (LIBRARY_TOKENS.has(p.toLowerCase())) continue;
+      const base = p.split('/').pop();
+      if (PLACEHOLDER_RE.test(base)) continue;
       if (!seen.has(p)) seen.set(p, i + 1);
     }
   }