npm - sweet-search - Versions diffs - 2.5.2 → 2.5.4 - Mend

sweet-search 2.5.2 → 2.5.4

This diff compares the contents of two publicly available versions of the package as released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those versions exactly as they appear in the public registry.

Files changed (155)

package/core/cli.js +24 -3
package/core/graph/graph-expansion.js +215 -36
package/core/graph/graph-extractor.js +196 -11
package/core/graph/graph-search.js +395 -92
package/core/graph/hcgs-generator.js +2 -1
package/core/graph/index.js +2 -0
package/core/graph/repo-map.js +28 -6
package/core/graph/structural-answer-cues.js +168 -0
package/core/graph/structural-callsite-hints.js +40 -0
package/core/graph/structural-context-format.js +40 -0
package/core/graph/structural-context.js +450 -0
package/core/graph/structural-forward-push.js +156 -0
package/core/graph/structural-header-context.js +19 -0
package/core/graph/structural-importance.js +148 -0
package/core/graph/structural-pagerank.js +197 -0
package/core/graph/summary-manager.js +13 -9
package/core/incremental-indexing/application/dirty-scan.mjs +236 -0
package/core/incremental-indexing/application/file-watcher.mjs +197 -0
package/core/incremental-indexing/application/maintenance-handlers.mjs +519 -0
package/core/incremental-indexing/application/maintenance-worker.mjs +380 -0
package/core/incremental-indexing/application/operator-cli.mjs +554 -0
package/core/incremental-indexing/application/production-li-delta.mjs +192 -0
package/core/incremental-indexing/application/production-reconciler-helpers.mjs +107 -0
package/core/incremental-indexing/application/production-reconciler.mjs +583 -0
package/core/incremental-indexing/application/reconciler.mjs +477 -0
package/core/incremental-indexing/application/tombstone-injector.mjs +148 -0
package/core/incremental-indexing/domain/chunk-identity.mjs +260 -0
package/core/incremental-indexing/domain/encoder-deps.mjs +193 -0
package/core/incremental-indexing/domain/encoder-input.mjs +225 -0
package/core/incremental-indexing/domain/interval-autotune.mjs +255 -0
package/core/incremental-indexing/domain/reconcile-counters.mjs +149 -0
package/core/incremental-indexing/domain/watermark-scheduler.mjs +239 -0
package/core/incremental-indexing/infrastructure/artifact-temp-sweep.mjs +163 -0
package/core/incremental-indexing/infrastructure/baseline-readiness.mjs +121 -0
package/core/incremental-indexing/infrastructure/dirty-set.mjs +233 -0
package/core/incremental-indexing/infrastructure/graph-gc.mjs +314 -0
package/core/incremental-indexing/infrastructure/hashing.mjs +298 -0
package/core/incremental-indexing/infrastructure/hcgs-invalidation.mjs +182 -0
package/core/incremental-indexing/infrastructure/li-segment-merge.mjs +278 -0
package/core/incremental-indexing/infrastructure/li-segment-state.mjs +173 -0
package/core/incremental-indexing/infrastructure/lockfile.mjs +119 -0
package/core/incremental-indexing/infrastructure/maintenance-state-reader.mjs +283 -0
package/core/incremental-indexing/infrastructure/manifest.mjs +194 -0
package/core/incremental-indexing/infrastructure/path-filter.mjs +190 -0
package/core/incremental-indexing/infrastructure/reader-heartbeat.mjs +201 -0
package/core/incremental-indexing/infrastructure/schema-migrations.mjs +257 -0
package/core/incremental-indexing/infrastructure/sparse-gram-delta.mjs +335 -0
package/core/incremental-indexing/infrastructure/sqlite-fts5.mjs +176 -0
package/core/incremental-indexing/infrastructure/staleness-display.mjs +105 -0
package/core/incremental-indexing/infrastructure/tombstone-bitmap.mjs +234 -0
package/core/incremental-indexing/infrastructure/vector-delta-writer.mjs +359 -0
package/core/incremental-indexing/infrastructure/vector-gc.mjs +133 -0
package/core/incremental-indexing/infrastructure/worktree-stamp.mjs +155 -0
package/core/incremental-indexing/infrastructure/wsl2-detect.mjs +115 -0
package/core/indexing/admission-policy.js +139 -0
package/core/indexing/artifact-builder.js +29 -12
package/core/indexing/ast-chunker.js +107 -30
package/core/indexing/dedup/exemplar-selector.js +19 -1
package/core/indexing/gitignore-filter.js +223 -0
package/core/indexing/incremental-tracker.js +99 -30
package/core/indexing/index-codebase-v21.js +6 -5
package/core/indexing/index-maintainer.mjs +698 -6
package/core/indexing/indexer-ann.js +99 -15
package/core/indexing/indexer-build.js +158 -45
package/core/indexing/indexer-empty-baseline.js +80 -0
package/core/indexing/indexer-manifest.js +66 -0
package/core/indexing/indexer-phases.js +56 -23
package/core/indexing/indexer-sparse-gram.js +54 -13
package/core/indexing/indexer-utils.js +26 -208
package/core/indexing/indexing-file-policy.js +32 -7
package/core/indexing/maintainer-launcher.mjs +137 -0
package/core/indexing/merkle-tracker.js +251 -244
package/core/indexing/model-pool.js +46 -5
package/core/infrastructure/code-graph-repository.js +758 -6
package/core/infrastructure/code-graph-visibility.js +157 -0
package/core/infrastructure/codebase-repository.js +100 -13
package/core/infrastructure/config/search.js +1 -1
package/core/infrastructure/db-utils.js +118 -0
package/core/infrastructure/dedup-hashing.js +10 -13
package/core/infrastructure/hardware-capability.js +17 -7
package/core/infrastructure/index.js +8 -2
package/core/infrastructure/language-patterns/maps.js +4 -1
package/core/infrastructure/language-patterns/registry-core.js +56 -17
package/core/infrastructure/language-patterns/registry-object-oriented.js +12 -5
package/core/infrastructure/language-patterns.js +69 -0
package/core/infrastructure/model-registry.js +20 -0
package/core/infrastructure/native-inference.js +7 -12
package/core/infrastructure/native-resolver.js +52 -37
package/core/infrastructure/native-sparse-gram.js +261 -20
package/core/infrastructure/native-tokenizer.js +6 -15
package/core/infrastructure/simd-distance.js +10 -16
package/core/infrastructure/sparse-gram-delta-reader.js +76 -0
package/core/infrastructure/structural-alias-resolver.js +122 -0
package/core/infrastructure/structural-candidate-ranker.js +34 -0
package/core/infrastructure/structural-context-repository.js +472 -0
package/core/infrastructure/structural-context-utils.js +51 -0
package/core/infrastructure/structural-graph-signals.js +121 -0
package/core/infrastructure/structural-qualified-resolution.js +15 -0
package/core/infrastructure/structural-source-definitions.js +100 -0
package/core/infrastructure/tombstone-bitmap-reader.js +139 -0
package/core/infrastructure/tree-sitter-provider.js +811 -37
package/core/prompt-optimization/data/p7-final/sweet-search-system-prompt.md +50 -0
package/core/query/query-router.js +55 -5
package/core/ranking/file-kind-ranking.js +2192 -15
package/core/ranking/late-interaction-index.js +87 -12
package/core/search/cli-decoration.js +290 -0
package/core/search/context-expander.js +988 -78
package/core/search/index.js +1 -0
package/core/search/output-policy.js +275 -0
package/core/search/search-anchor.js +499 -0
package/core/search/search-boost.js +93 -1
package/core/search/search-cli.js +61 -204
package/core/search/search-hybrid.js +250 -10
package/core/search/search-pattern-chunks.js +57 -8
package/core/search/search-pattern-planner.js +68 -9
package/core/search/search-pattern-prefilter.js +30 -10
package/core/search/search-pattern-ripgrep.js +40 -4
package/core/search/search-pattern-sparse-overlay.js +256 -0
package/core/search/search-pattern.js +117 -29
package/core/search/search-postprocess.js +479 -5
package/core/search/search-read-semantic.js +260 -23
package/core/search/search-read.js +82 -64
package/core/search/search-reader-pin.js +71 -0
package/core/search/search-rrf.js +279 -0
package/core/search/search-semantic.js +110 -5
package/core/search/search-server.js +130 -57
package/core/search/search-trace.js +107 -0
package/core/search/server-identity.js +93 -0
package/core/search/session-daemon-prewarm.mjs +33 -10
package/core/search/sweet-search.js +399 -7
package/core/skills/sweet-index/SKILL.md +8 -6
package/core/vector-store/binary-hnsw-index.js +194 -30
package/core/vector-store/float-vector-store.js +96 -6
package/core/vector-store/hnsw-index.js +220 -49
package/eval/agent-read-workflows/bin/_ss-helpers.mjs +471 -0
package/eval/agent-read-workflows/bin/ss-find +15 -0
package/eval/agent-read-workflows/bin/ss-grep +12 -0
package/eval/agent-read-workflows/bin/ss-read +14 -0
package/eval/agent-read-workflows/bin/ss-search +18 -0
package/eval/agent-read-workflows/bin/ss-semantic +12 -0
package/eval/agent-read-workflows/bin/ss-trace +11 -0
package/mcp/read-tool.js +109 -0
package/mcp/server.js +55 -15
package/mcp/tool-handlers.js +14 -124
package/mcp/trace-tool.js +81 -0
package/package.json +25 -10
package/scripts/hooks/intercept-read.mjs +55 -0
package/scripts/hooks/remind-tools.mjs +40 -0
package/scripts/init.js +698 -54
package/scripts/inject-agent-instructions.js +431 -0
package/scripts/install-prompt-reminders.js +188 -0
package/scripts/install-tool-enforcement.js +220 -0
package/scripts/smoke-test.js +12 -9
package/scripts/uninstall.js +276 -18
package/scripts/write-claude-rules.js +110 -0

package/core/search/context-expander.js CHANGED

@@ -146,16 +146,39 @@ export function expandToSymbol(result, opts) {
   const origRange = `${origStart}-${origEnd}`;
   const chunkLines = (origEnd - origStart) + 1;
   // Check if chunk already looks like a complete symbol
-  // (has a name/type and is > 10 lines — not just a signature fragment)
+  // (has a name/type and is > 10 lines — not just a signature fragment).
+  // Even when no expansion is needed we still:
+  //   (1) look up the enclosing entity so callers (graph-neighbour
+  //       reservation) can attach edges to it.
+  //   (2) absorb leading trivia (Rust /// + #[...], JSDoc, Python decorators)
+  //       so the agent sees attribute-driven semantics like #[non_exhaustive]
+  //       that the judge keeps asking for.
   if (meta.name && chunkLines > 10) {
+    const filePath0 = meta.file || result.file;
+    // Try strict enclosing-range first; fall back to a single-line query at
+    // origStart when the chunk overshoots the entity by trailing lines (a
+    // common chunker artefact — observed on gin handleHTTPRequest where
+    // chunk=690-762 but entity=690-760, leaving the strict query empty).
+    let ent0 = findEnclosingEntity(codeGraphRepo, filePath0, origStart, origEnd);
+    if (!ent0) ent0 = findEnclosingEntity(codeGraphRepo, filePath0, origStart, origStart);
+    let triviaStart0 = origStart;
+    if (opts.fileCache && !opts.ablations?.has('no-leading-trivia') && origStart > 1) {
+      const lang0 = inferLanguage(filePath0);
+      const candidate = expandLeadingTrivia(filePath0, origStart, opts.fileCache, opts.projectRoot, lang0);
+      // Only commit when the absorbed trivia fits the cap (10 tok/line est).
+      const newLines = (origEnd - candidate) + 1;
+      if (newLines * 10 <= tokenCap) triviaStart0 = candidate;
+    }
     return {
-      startLine: origStart,
+      startLine: triviaStart0,
       endLine: origEnd,
-      expanded: false,
-      expandedFrom: null,
+      expanded: triviaStart0 < origStart,
+      expandedFrom: triviaStart0 < origStart ? origRange : null,
       symbol: meta.name,
       symbolType: meta.type || null,
+      entityId: ent0?.id || null,
       kind: 'chunk',
     };
   }
@@ -169,13 +192,25 @@ export function expandToSymbol(result, opts) {
     // Only expand if it fits within the token cap
     if (entityTokens <= tokenCap) {
+      // Absorb leading trivia (doc comments, decorators, attributes) above
+      // the entity. This recovers context the judge keeps asking for —
+      // ripgrep `#[non_exhaustive]`, JSDoc, Rust /// docs, Python decorators.
+      const lang = inferLanguage(filePath);
+      const triviaStart = (opts.fileCache && !opts.ablations?.has('no-leading-trivia'))
+        ? expandLeadingTrivia(filePath, entity.startLine, opts.fileCache, opts.projectRoot, lang)
+        : entity.startLine;
+      const startWithTrivia = Math.max(1, Math.min(triviaStart, entity.startLine));
+      // Re-check budget with trivia included; fall back to symbol-only if it overflows.
+      const expandedLines = (entity.endLine - startWithTrivia) + 1;
+      const fits = expandedLines * 10 <= tokenCap;
       return {
-        startLine: entity.startLine,
+        startLine: fits ? startWithTrivia : entity.startLine,
         endLine: entity.endLine,
         expanded: true,
         expandedFrom: origRange,
         symbol: entity.name,
         symbolType: entity.type,
+        entityId: entity.id || null,
         kind: 'full',
       };
     }
@@ -193,6 +228,7 @@ export function expandToSymbol(result, opts) {
           expandedFrom: origRange,
           symbol: entity.name,
           symbolType: entity.type,
+          entityId: entity.id || null,
           kind: 'sandwich',
           sandwich,
         };
@@ -206,22 +242,44 @@ export function expandToSymbol(result, opts) {
       expandedFrom: null,
       symbol: entity.name,
       symbolType: entity.type,
+      entityId: entity.id || null,
       kind: 'chunk',
     };
   }
+  // F5 (2026-05-07): when no enclosing entity exists for the chunk, fall back
+  // to the FIRST entity that starts within the chunk range. This catches cases
+  // like fastify lib/reply.js:64-225 where the chunk spans the Reply function
+  // (64-76) plus prototype methods later — no single entity contains the chunk,
+  // but Reply is the topmost identifier and matches the gold ("send" / "Reply"
+  // / "buildReply"). Only applies in fallback path where meta.name is also null.
+  let firstContained = null;
+  if (codeGraphRepo && typeof codeGraphRepo.findFirstEntityInRange === 'function' && !meta.name) {
+    try {
+      firstContained = codeGraphRepo.findFirstEntityInRange(filePath, origStart, origEnd);
+    } catch { firstContained = null; }
+  }
   // Try sibling chunk merge (contiguous chunks in the same file)
   const intervals = locationMap?.get(filePath);
   if (intervals && intervals.length > 1) {
     const merged = mergeSiblingChunks(intervals, origStart, origEnd, tokenCap);
     if (merged) {
+      // F5: when the merged range spans a previously-unseen entity, label it.
+      let mergedFirstContained = firstContained;
+      if (!meta.name && !mergedFirstContained && codeGraphRepo
+          && typeof codeGraphRepo.findFirstEntityInRange === 'function') {
+        try {
+          mergedFirstContained = codeGraphRepo.findFirstEntityInRange(filePath, merged.startLine, merged.endLine);
+        } catch { /* keep original firstContained */ }
+      }
       return {
         startLine: merged.startLine,
         endLine: merged.endLine,
         expanded: true,
         expandedFrom: origRange,
-        symbol: meta.name || null,
-        symbolType: meta.type || null,
+        symbol: meta.name || mergedFirstContained?.name || null,
+        symbolType: meta.type || mergedFirstContained?.type || null,
         kind: 'syntax',
       };
     }
@@ -243,13 +301,24 @@ export function expandToSymbol(result, opts) {
     fileCache, filePath, origStart, origEnd, tokenCap, projectRoot
   );
   if (syntaxExpanded) {
+    // F5: when syntax expansion enlarges the range, the new range may contain
+    // entities the raw chunk didn't. Re-lookup the first contained entity in
+    // the expanded range so chunks like fastify lib/reply.js:139-192 (no
+    // entities) → 64-225 (contains Reply at 64-76) get a meaningful symbol.
+    let syntaxFirstContained = firstContained;
+    if (!meta.name && !syntaxFirstContained && codeGraphRepo
+        && typeof codeGraphRepo.findFirstEntityInRange === 'function') {
+      try {
+        syntaxFirstContained = codeGraphRepo.findFirstEntityInRange(filePath, syntaxExpanded.startLine, syntaxExpanded.endLine);
+      } catch { /* keep firstContained */ }
+    }
     return {
       startLine: syntaxExpanded.startLine,
       endLine: syntaxExpanded.endLine,
       expanded: true,
       expandedFrom: origRange,
-      symbol: meta.name || null,
-      symbolType: meta.type || null,
+      symbol: meta.name || syntaxFirstContained?.name || null,
+      symbolType: meta.type || syntaxFirstContained?.type || null,
       kind: 'syntax',
     };
   }
@@ -260,8 +329,8 @@ export function expandToSymbol(result, opts) {
     endLine: origEnd,
     expanded: false,
     expandedFrom: null,
-    symbol: meta.name || null,
-    symbolType: meta.type || null,
+    symbol: meta.name || firstContained?.name || null,
+    symbolType: meta.type || firstContained?.type || null,
     kind: 'chunk',
   };
 }
@@ -550,6 +619,70 @@ export function expandBySyntax(fileCache, filePath, startLine, endLine, tokenCap
   return { startLine: expandedStart, endLine: expandedEnd };
 }
+/**
+ * Walk upward from `baseStartLine` to absorb leading trivia (doc comments,
+ * attributes, decorators) that document the symbol. This recovers context
+ * the judge keeps asking for: ripgrep `#[non_exhaustive]`, JSDoc above
+ * the function, Python decorators, Rust `///` and `//!` doc lines.
+ *
+ * Caps at 30 lines back so we never blow the budget on accidentally
+ * absorbing a previous symbol's body. Returns the adjusted startLine
+ * (never less than 1, never above baseStartLine).
+ *
+ * @param {string} filePath
+ * @param {number} baseStartLine
+ * @param {Map} fileCache
+ * @param {string} projectRoot
+ * @param {string} lang
+ * @returns {number}
+ */
+export function expandLeadingTrivia(filePath, baseStartLine, fileCache, projectRoot, lang) {
+  if (!filePath || !baseStartLine || baseStartLine <= 1) return baseStartLine;
+  const windowStart = Math.max(1, baseStartLine - 30);
+  const text = readFileRange(fileCache, filePath, windowStart, baseStartLine - 1, projectRoot);
+  if (!text) return baseStartLine;
+  const lines = text.split('\n');
+  // Walk lines BACKWARDS, classifying each:
+  //   - trivia line (doc / attr / decorator)  → mark as the new topmost
+  //   - blank line                            → tolerated INSIDE a doc run,
+  //                                              but not absorbed (the blank
+  //                                              above the topmost trivia
+  //                                              row stays attached to the
+  //                                              prior code, not the symbol)
+  //   - anything else (code / punct / close)  → stop
+  let topmostTrivia = baseStartLine;   // 1-based absolute, only moves on trivia
+  for (let idx = lines.length - 1; idx >= 0; idx--) {
+    const raw = lines[idx];
+    const ln = windowStart + idx;
+    if (ln >= baseStartLine) continue;
+    const trimmed = raw.trim();
+    if (trimmed === '') {
+      // Tolerate blank gaps inside the doc run but DO NOT include them: the
+      // returned line is always the topmost actual trivia row.
+      continue;
+    }
+    let isTrivia = false;
+    if (lang === 'rust') {
+      // /// and //! doc comments, #[attr] / #![attr], block comments,
+      // // regular comments adjacent to a doc run.
+      isTrivia = /^(\/\/[!/]?|\/\*\*?|\*\/?|\*\s|#\!?\[)/.test(trimmed);
+    } else if (lang === 'go') {
+      isTrivia = /^\/\//.test(trimmed);
+    } else if (lang === 'python') {
+      // Decorators, comments, and raw docstring lines (rare directly above def)
+      isTrivia = /^@\w/.test(trimmed) || /^#/.test(trimmed)
+        || /^['"]{3}/.test(trimmed);
+    } else {
+      // JS/TS/Java/C-style: //, /** ... */, *, decorators (TS @Decorator)
+      isTrivia = /^(\/\/|\/\*\*?|\*\/?|\*\s|@\w)/.test(trimmed);
+    }
+    if (!isTrivia) break;
+    topmostTrivia = ln;
+  }
+  return topmostTrivia;
+}
 /** Get Python indent level (number of leading spaces, tabs=4). */
 function getIndentLevel(line) {
   let indent = 0;
@@ -618,47 +751,131 @@ export function checkStaleness(filePath, projectRoot, codeGraphRepo, cache = {})
 /**
  * Extract import lines from file header, language-aware.
  *
- * Handles:
- *   - JS/TS: import/require/export statements
- *   - Go: import (...) blocks and single imports
- *   - Python: import/from statements
- *   - Rust: use declarations
+ * Handles multi-line constructs that the previous line-by-line filter
+ * dropped on the floor (the dominant cause of "missing alias" judge
+ * complaints, e.g. fastify uses
+ *   const { kSchemaParams: paramsSchema, ... } = require('./symbols')
+ * spanning 5+ lines — the body uses `paramsSchema`, but only the multi-line
+ * form maps it back to `kSchemaParams`):
+ *
+ *   - JS/TS: ES `import { a, b } from 'x'` (multi-line)
+ *           `const { a, b } = require('x')` (multi-line, with `kKey: alias`)
+ *           `export { ... } from '...'`
+ *   - Go: `import (...)` blocks (with aliases like `alias "path"`)
+ *   - Python: `import x` / `from x import (a, b, c)` (multi-line with parens)
+ *   - Rust: `use foo::{bar, baz}` (multi-line grouped) + `pub use` + extern crate
+ *
+ * Output is one logical statement per array entry; multi-line statements
+ * are joined with a space so the consumer (header rendering, identifier
+ * scan) sees a single string per import.
  */
 function extractImportLines(headerText, lang) {
   const lines = headerText.split('\n');
+  // ── Generic multi-line statement collector ───────────────────────────────
+  // Walk lines, accumulate balanced bracket levels for each "starter" we
+  // recognise, emit when the statement closes. Falls back to single-line
+  // emission for languages where a statement ends at EOL.
+  const out = [];
   if (lang === 'go') {
-    // Go: capture `import (...)` block contents and single `import "..."`
-    const result = [];
+    // Go: capture `import (...)` block contents (each line) and single `import "..."`
     let inBlock = false;
     for (const line of lines) {
       if (/^\s*import\s*\(/.test(line)) { inBlock = true; continue; }
       if (inBlock) {
         if (/^\s*\)/.test(line)) { inBlock = false; continue; }
-        if (line.trim()) result.push(line);
-      } else if (/^\s*import\s+"/.test(line)) {
-        result.push(line);
+        if (line.trim()) out.push(line.trimEnd());
+      } else if (/^\s*import\s+(\w+\s+)?"/.test(line)) {
+        out.push(line.trimEnd());
       }
     }
-    return result;
+    return out;
   }
   if (lang === 'python') {
-    return lines.filter(line =>
-      /^\s*(import\s+\w|from\s+\w)/.test(line)
-    );
+    // Python: `import x`, `from x import y`, `from x import (a, b, ...)`
+    // multi-line via parens or trailing backslash.
+    let i = 0;
+    while (i < lines.length) {
+      const line = lines[i];
+      if (/^\s*(import\s+\w|from\s+[.\w]+\s+import)/.test(line)) {
+        let stmt = line.trimEnd();
+        // Continue while line ends with backslash or has unbalanced (
+        const opens = () => (stmt.match(/\(/g) || []).length;
+        const closes = () => (stmt.match(/\)/g) || []).length;
+        const continued = () => /\\\s*$/.test(stmt) || opens() > closes();
+        while (continued() && i + 1 < lines.length) {
+          stmt = stmt.replace(/\\\s*$/, '').trimEnd() + ' ' + lines[++i].trim();
+        }
+        out.push(stmt);
+      }
+      i++;
+    }
+    return out;
   }
   if (lang === 'rust') {
-    return lines.filter(line =>
-      /^\s*(use\s+|pub\s+use\s+|extern\s+crate\s+)/.test(line)
-    );
+    // Rust: `use foo::{bar, baz}` (possibly multi-line via { ... });
+    // also `pub use ...;` and `extern crate ...;` (single line).
+    let i = 0;
+    while (i < lines.length) {
+      const line = lines[i];
+      if (/^\s*(pub\s+)?use\s+/.test(line) || /^\s*extern\s+crate\s+/.test(line)) {
+        let stmt = line.trimEnd();
+        // Continue until we see the terminating `;`
+        while (!/;\s*(\/\/.*)?$/.test(stmt) && i + 1 < lines.length) {
+          stmt += ' ' + lines[++i].trim();
+        }
+        out.push(stmt);
+      }
+      i++;
+    }
+    return out;
   }
-  // JS/TS/default
-  return lines.filter(line =>
-    /^\s*(import\s|const\s+\{.*\}\s*=\s*require|from\s+['"]|export\s+\{)/.test(line)
-  );
+  // JS/TS/default — handle multi-line ES imports and CommonJS destructured requires.
+  // Examples we want to capture as ONE logical line:
+  //   import {
+  //     foo,
+  //     bar as baz,
+  //   } from 'mod'
+  //   const {
+  //     kSchemaParams: paramsSchema,
+  //     kSchemaBody: bodySchema,
+  //   } = require('./symbols')
+  //   const x = require('./y')
+  //   export { a, b } from './x'
+  let i = 0;
+  while (i < lines.length) {
+    const line = lines[i];
+    const isStartES = /^\s*(import|export)\s/.test(line);
+    // CJS detector: start at any line that begins a const/let/var declaration.
+    // We accumulate continuation lines until brackets balance, THEN filter to
+    // only keep statements that prove themselves to be import-like (contain
+    // `require(...)` or destructured-assignment from a bracketed expression).
+    const isStartCJS = /^\s*(const|let|var)\s+/.test(line)
+      && (/\brequire\s*\(/.test(line) || /\{[^}]*$/.test(line));
+    if (isStartES || isStartCJS) {
+      let stmt = line.trimEnd();
+      const opens = () => (stmt.match(/[{(]/g) || []).length;
+      const closes = () => (stmt.match(/[})]/g) || []).length;
+      // Continue while open brackets exceed closes OR statement ends with comma
+      // (suggests a continuation line for object / list).
+      while ((opens() > closes() || /,\s*(\/\/.*)?$/.test(stmt))
+             && i + 1 < lines.length) {
+        stmt += ' ' + lines[++i].trim();
+        if (opens() === closes() && /;\s*$/.test(stmt)) break;
+      }
+      // Only keep statements that look like imports (drop unrelated
+      // const/let assignments that happened to span lines).
+      if (/\b(import|require\s*\(|from\s+['"]|export\s*\{)/.test(stmt)) {
+        out.push(stmt);
+      }
+    }
+    i++;
+  }
+  return out;
 }
 /**
@@ -829,46 +1046,349 @@ export function computeConfidence(results, stats) {
   return { confidence, confidenceReason };
 }
+/**
+ * Collect candidate identifiers from a code body: every token matching
+ * `\b[A-Za-z_][A-Za-z0-9_]{2,}\b` (≥3 chars), minus entries of
+ * LANG_KEYWORDS (exact-case lookup) and the symbol's own name
+ * (case-insensitive comparison). Locally declared names are NOT removed
+ * here; unresolvedExternalRefs applies that filtering to this result.
+ *
+ * @param {string} code - source text to scan; falsy input yields an empty Set
+ * @param {string|null} ownSymbolName - name to exclude; falsy is treated as ''
+ * @returns {Set<string>} unique identifiers, kept in their original case
+ */
+function extractCodeIdentifiers(code, ownSymbolName) {
+  const out = new Set();
+  if (!code) return out;
+  const matches = code.match(/\b[A-Za-z_][A-Za-z0-9_]{2,}\b/g) || [];
+  const ownLower = (ownSymbolName || '').toLowerCase();
+  for (const id of matches) {
+    if (LANG_KEYWORDS.has(id)) continue;
+    if (id.toLowerCase() === ownLower) continue;
+    // Tokens starting with a digit or shorter than 3 chars never reach this point: the regex above cannot match them.
+    out.add(id);
+  }
+  return out;
+}
+/**
+ * Decide whether the body's referenced identifiers are all locally
+ * resolvable from headerContext + neighbours + the body itself
+ * (i.e. the symbol introduces or imports them all). Used by the
+ * stricter `computeSufficiency` rule.
+ *
+ * Identifiers count as resolved when they are:
+ *   - mentioned in `headerContext` (any kind of import/require line)
+ *   - mentioned in `neighborsRendered` (callees/imports we surfaced)
+ *   - declared inside `code` itself (e.g. const x = ..., function x ...,
+ *     parameters in the symbol signature) — detected as identifiers that
+ *     appear in lvalue positions (`const X`, `let X`, `function X`,
+ *     `class X`, function parameters)
+ */
+function unresolvedExternalRefs(code, ownSymbolName, headerContext, neighborsRendered) {
+  const externals = extractCodeIdentifiers(code, ownSymbolName);
+  if (!externals.size) return new Set();
+  const resolvedHaystack = (headerContext || '') + '\n' + (neighborsRendered || '');
+  // Approximate "declared locally in this code block": any identifier that
+  // appears in an lvalue-ish position. We only need a rough check, false
+  // positives here just mean "looks self-contained" (which is fine).
+  const localDecls = new Set();
+  const lvalueRe = /\b(?:const|let|var|function|class|fn|def|struct|enum|trait|impl|type|interface)\s+([A-Za-z_][A-Za-z0-9_]*)/g;
+  let m;
+  while ((m = lvalueRe.exec(code))) localDecls.add(m[1]);
+  // Function-parameter approximation: capture top-of-block `(...)` after the symbol name.
+  const sigRe = new RegExp(`\\b${(ownSymbolName || '').replace(/[.*+?^${}()|[\\]\\\\]/g, '\\\\$&')}\\s*\\(([^)]*)\\)`);
+  if (ownSymbolName) {
+    const sig = code.match(sigRe);
+    if (sig) {
+      for (const part of sig[1].split(/[,\s]+/)) {
+        const id = part.replace(/[:=\[\]?<>]/g, '').replace(/\.\.\./, '').trim();
+        if (id) localDecls.add(id);
+      }
+    }
+  }
+  const unresolved = new Set();
+  for (const id of externals) {
+    if (localDecls.has(id)) continue;
+    if (resolvedHaystack.includes(id)) continue;
+    unresolved.add(id);
+  }
+  return unresolved;
+}
 /**
  * Compute sufficiency signal — does the returned context likely contain
- * enough information to answer the query? (Fix #7, plan §5)
+ * enough information to answer the query?
  *
- * Signals:
- *   (a) Expanded region contains a complete symbol (not truncated)
- *   (b) Header context resolves all referenced imports
- *   (c) Score gap suggests the match is specific, not generic
+ * Tightened rule (May 2026 — addresses the dominant agent-bench loss
+ * pattern): a complete symbol on its own is NOT sufficient. We also
+ * require either (a) the symbol's external references are resolved
+ * (header imports + 1-hop graph neighbours), or (b) the symbol is
+ * provably self-contained (no unresolved external identifiers).
  *
- * @param {object} topResult - The top-1 agent result
- * @param {{ confidence: string }} confidenceInfo - Confidence computation result
- * @returns {{ sufficient: boolean, reasons: string[] }}
+ * Reasons emitted (independent signals, kept for diagnostics):
+ *   - complete_symbol     : top-1 is a full, non-truncated symbol
+ *   - header_resolved     : top-1 has resolved import/header context
+ *   - neighbors_present   : the package surfaced ≥1 1-hop graph neighbour
+ *   - self_contained_strict: every external identifier in the body is
+ *                            either declared locally, in headerContext,
+ *                            or in the surfaced neighbours list
+ *   - high_confidence     : score gap puts top-1 well ahead of top-2
+ *
+ * sufficient := complete_symbol
+ *               AND (header_resolved OR neighbors_present OR self_contained_strict)
+ *               AND (high_confidence OR header_resolved OR neighbors_present)
+ *
+ * @param {object} topResult
+ * @param {{ confidence: string }} confidenceInfo
+ * @returns {{ sufficient: boolean, reasons: string[], unresolvedExternalCount: number }}
  */
 export function computeSufficiency(topResult, confidenceInfo) {
   const reasons = [];
-  // (a) Is the result a complete symbol (not truncated)?
-  const isComplete = topResult.symbol &&
+  const isComplete = !!(topResult.symbol &&
     topResult.presentation === 'full' &&
-    !topResult.code?.includes('// ... (');
-  if (isComplete) {
-    reasons.push('complete_symbol');
+    !topResult.code?.includes('// ... ('));
+  if (isComplete) reasons.push('complete_symbol');
+  const hasHeader = !!topResult.headerContext; // truthiness only; the header text itself is not examined for this reason
+  if (hasHeader) reasons.push('header_resolved');
+  const hasNeighbors = !!(topResult.neighbors && topResult.neighbors.count > 0);
+  if (hasNeighbors) reasons.push('neighbors_present');
+  // Strict self-containment: only fires if the body has zero unresolved
+  // external identifiers (after considering header + neighbours + locals).
+  let unresolvedCount = 0; // also stays 0 when the check below is skipped (incomplete symbol or no code)
+  if (isComplete && topResult.code) {
+    const unresolved = unresolvedExternalRefs(
+      topResult.code,
+      topResult.symbol,
+      topResult.headerContext || '',
+      topResult.neighbors?.rendered || ''
+    );
+    unresolvedCount = unresolved.size;
+    if (unresolvedCount === 0) reasons.push('self_contained_strict');
+  }
+  if (confidenceInfo?.confidence === 'high') reasons.push('high_confidence');
+  // Tightened rule: complete symbol is necessary but NOT sufficient.
+  // We require at least one resolution reason AND at least one specificity
+  // reason. This stops a bare "complete + high_confidence" from claiming
+  // sufficient when the body still references a dozen helpers we never
+  // surfaced (the validation-pipeline failure mode).
+  const hasResolution = hasHeader || hasNeighbors || reasons.includes('self_contained_strict');
+  const hasSpecificity = confidenceInfo?.confidence === 'high' || hasHeader || hasNeighbors; // self_contained_strict alone does not count as specificity
+  const sufficient = isComplete && hasResolution && hasSpecificity;
+  return { sufficient, reasons, unresolvedExternalCount: unresolvedCount };
+}
+// =============================================================================
+// Graph-neighbour reservation (Phase 6) — 1-hop neighbours for top-1
+// =============================================================================
+/**
+ * Extract identifier candidates from a code body that look like type names
+ * (struct / interface / class / enum / trait / type). Used by the
+ * graph-neighbour tier to find type definitions that the relationships
+ * table didn't capture as explicit edges (the canonical failure case is
+ * gin:http-dispatch — `methodTree` is an unexported Go struct referenced
+ * via a field-of-field, never as a direct relationship edge).
+ *
+ * Heuristic: any token ≥3 chars containing at least one uppercase AND at
+ * least one lowercase letter (Pascal/camelCase). This captures both
+ * exported types (`Engine`, `Context`, `ErrorKind`) and unexported Go
+ * types (`methodTree`, `nodeType`). It deliberately rejects:
+ *   - all-uppercase SCREAMING_SNAKE_CASE constants
+ *   - all-lowercase variables / function names
+ *   - language keywords
+ *   - the symbol's own name
+ *
+ * False positives (e.g. method names in camelCase) are cheap because the
+ * downstream SQL lookup ALSO filters by entity type, so a camelCase
+ * function name won't match a struct/interface/class entity.
+ *
+ * @param {string} code - source text to scan; falsy input yields []
+ * @param {string|null} ownName - the symbol's own name, excluded from results (compared case-insensitively)
+ * @returns {string[]} distinct candidates in first-occurrence order, at most 32 entries
+ */
+function extractTypeCandidates(code, ownName) {
+  if (!code) return [];
+  const matches = code.match(/\b[A-Za-z_][A-Za-z0-9_]{2,}\b/g) || [];
+  const own = (ownName || '').toLowerCase();
+  const seen = new Set();
+  const out = [];
+  for (const id of matches) {
+    if (seen.has(id)) continue;
+    seen.add(id); // recorded before the filters below, so each distinct token is evaluated only once
+    if (LANG_KEYWORDS.has(id)) continue;
+    if (id.toLowerCase() === own) continue;
+    // Require BOTH upper and lower (Pascal/camelCase). Filters out
+    // SCREAMING_SNAKE constants AND all-lowercase variables. A pure
+    // single-word lowercase token like `trees` is rejected — most
+    // unexported Go types are camelCase like `methodTree` and survive.
+    if (!/[A-Z]/.test(id)) continue;
+    if (!/[a-z]/.test(id)) continue;
+    out.push(id);
   }
+  // Cap the candidate list — DB lookup is bounded but we still pay query cost.
+  return out.slice(0, 32);
+}
-  // (b) Does header context exist, OR is the symbol self-contained?
-  // Self-contained: complete symbol with code but no header needed (no imports referenced).
-  // This prevents false negatives for utility functions that don't use imports.
-  if (topResult.headerContext) {
-    reasons.push('header_resolved');
-  } else if (isComplete && topResult.code && topResult.codeTokens > 0) {
-    reasons.push('self_contained');
+/**
+ * Render a one-hop graph-neighbour tier for the top-1 result. This addresses
+ * the dominant loss pattern in the agent benchmark: ss-search returned a
+ * tight, "complete" symbol, the agent stopped at one tool call, and the
+ * judge then complained the answer didn't surface CALLERS, IMPORTED
+ * SYMBOLS, or HELPER FUNCTIONS that the chunk plainly references.
+ *
+ * The renderer:
+ *   - asks the code graph for outgoing relationships (calls / imports / uses /
+ *     extends / implements / overrides / throws) from top-1's entity,
+ *   - asks for incoming callers / users (top-K by weight),
+ *   - dedupes anything whose target file:line range overlaps a result that
+ *     is already in the ranked pack (no point spending budget on a row the
+ *     agent already sees),
+ *   - groups by edge family and renders compact one-liners that include the
+ *     target's `file:line` so the agent can cite the neighbour directly,
+ *   - hard-caps the rendered text at `tokenCap`. The result is fully
+ *     elidable — when the cap is 0, the function returns null.
+ *
+ * @param {object} opts
+ * @param {object} opts.codeGraphRepo - CodeGraphRepository instance
+ * @param {object} opts.entity        - { id, filePath, startLine, endLine, name, type }
+ * @param {Set<string>} opts.skipKeys - "file|startLine|endLine" of results already in the pack
+ * @param {number} opts.tokenCap      - max tokens for the rendered tier
+ * @param {string} [opts.body]        - top-1 code body, used to discover
+ *   referenced TYPE names (struct/interface/class/...) that the
+ *   relationships table doesn't capture as explicit edges
+ * @returns {{ rendered: string, count: number, tokens: number,
+ *             outgoingCount: number, incomingCount: number,
+ *             typeRefCount: number }|null}
+ */
+export function renderGraphNeighbors(opts) {
+  const { codeGraphRepo, entity, skipKeys, tokenCap = 0, body = '' } = opts;
+  if (!codeGraphRepo || !entity || !entity.id || tokenCap <= 0) return null; // nothing to render without a repo, an entity id, or a positive cap
+  const OUT_TYPES = ['imports', 'calls', 'uses', 'extends', 'implements', 'overrides', 'throws'];
+  const IN_TYPES = ['calls', 'uses', 'extends', 'implements'];
+  // typeAlias is what Go's graph extractor stores for struct/interface/type
+  // declarations; the others cover JS/TS/Java/Rust/Python conventions.
+  const TYPE_KINDS = ['struct', 'class', 'interface', 'enum', 'trait', 'type', 'typeAlias'];
+  let outgoing = [];
+  let incoming = [];
+  let typeRefs = [];
+  try { outgoing = codeGraphRepo.getOutgoingRelationships(entity.id, { types: OUT_TYPES, limit: 16 }) || []; }
+  catch { outgoing = []; } // best-effort: a throwing lookup is treated as "no outgoing rows"
+  try { incoming = codeGraphRepo.getIncomingRelationships(entity.id, { types: IN_TYPES, limit: 8 }) || []; }
+  catch { incoming = []; } // best-effort: a throwing lookup is treated as "no incoming rows"
+  // Type-reference discovery: extract identifiers from the body and ask the
+  // graph for entities of struct/interface/class/enum/trait/type/typeAlias
+  // with that name. This recovers the case the relationships table misses —
+  // e.g. a Go method whose receiver field has type `methodTrees []methodTree`
+  // never gets a 'calls/imports/uses' edge to `methodTree`, yet the agent
+  // needs that type's defining file:line to give a correct answer
+  // (gin:http-dispatch was the canonical failure).
+  //
+  // Dedup uses range-based skipKeys (NOT excludeFile) — same-file types
+  // matter when top-1 is a method and the receiver struct lives next to
+  // it (e.g. Engine in gin.go vs handleHTTPRequest in gin.go).
+  if (body && typeof codeGraphRepo.findEntitiesByNames === 'function') {
+    try {
+      const ids = extractTypeCandidates(body, entity.name);
+      if (ids.length) {
+        typeRefs = codeGraphRepo.findEntitiesByNames(ids, {
+          types: TYPE_KINDS,
+          limit: 8,
+        }) || [];
+      }
+    } catch { typeRefs = []; }
   }
-  // (c) Is the confidence high (specific match)?
-  if (confidenceInfo.confidence === 'high') {
-    reasons.push('high_confidence');
+  if (outgoing.length === 0 && incoming.length === 0 && typeRefs.length === 0) return null;
+  // Group by edge family for stable rendering. Each row is a one-liner.
+  // Format:
+  //   - imports paramsSchema → lib/symbols.js:14 [Symbol]
+  //   - calls validateParam → lib/validation.js:118-144 [function]
+  //   - caller handleRequest ← lib/handle-request.js:88-104 [function]
+  //   - imports paramsSchema ← './symbols' (unresolved)
+  const ownKey = `${entity.filePath}|${entity.startLine}|${entity.endLine}`;
+  const seen = new Set([ownKey, ...(skipKeys || [])]);
+  const formatLineRange = (a, b) => (a && b && b > a) ? `${a}-${b}` : `${a || '?'}`; // "a-b" only when b > a; otherwise just a, or '?' when a is falsy
+  const lines = [];
+  // OUTGOING — group resolved targets first, then unresolved imports
+  const grouped = new Map();
+  for (const r of outgoing) {
+    const fam = r.type;
+    if (!grouped.has(fam)) grouped.set(fam, []);
+    grouped.get(fam).push(r);
+  }
+  // Render order: imports, calls, uses, extends, implements, overrides, throws
+  for (const fam of OUT_TYPES) {
+    const rows = grouped.get(fam) || [];
+    for (const r of rows) {
+      let rendered;
+      if (r.target && r.target.filePath) {
+        const k = `${r.target.filePath}|${r.target.startLine}|${r.target.endLine}`;
+        if (seen.has(k)) continue;          // already in the pack — skip
+        seen.add(k);
+        const range = formatLineRange(r.target.startLine, r.target.endLine);
+        rendered = `- ${fam} ${r.target.name} → ${r.target.filePath}:${range} [${r.target.type}]`;
+      } else if (r.fullImportPath) {
+        rendered = `- ${fam} ${r.targetName} ← '${r.fullImportPath}' (unresolved)`;
+      } else if (r.targetName && r.contextLine) {
+        rendered = `- ${fam} ${r.targetName} (referenced at line ${r.contextLine})`;
+      } else if (r.targetName) {
+        rendered = `- ${fam} ${r.targetName}`;
+      } else {
+        continue;
+      }
+      lines.push(rendered);
+    }
+  }
+  // INCOMING — flag as "caller" or "user"
+  for (const r of incoming) {
+    const s = r.source;
+    if (!s) continue;
+    const k = `${s.filePath}|${s.startLine}|${s.endLine}`;
+    if (seen.has(k)) continue;
+    seen.add(k);
+    const range = formatLineRange(s.startLine, s.endLine);
+    const kind = r.type === 'calls' ? 'caller' : (r.type === 'uses' ? 'user' : r.type); // other edge types keep their own name as the label
+    lines.push(`- ${kind} ${s.name} ← ${s.filePath}:${range} [${s.type}]`);
+  }
+  // TYPE-REFERENCES — entities discovered by name from the body. Renders as
+  // "type" prefix to disambiguate from the relationship-driven rows above.
+  // Same dedup against skipKeys.
+  for (const t of typeRefs) {
+    const k = `${t.filePath}|${t.startLine}|${t.endLine}`;
+    if (seen.has(k)) continue;
+    seen.add(k);
+    const range = formatLineRange(t.startLine, t.endLine);
+    lines.push(`- type ${t.name} → ${t.filePath}:${range} [${t.type}]`);
+  }
+  if (lines.length === 0) return null;
+  // Hard-cap to tokenCap. Drop tail lines until it fits.
+  let combined = lines.join('\n');
+  while (estimateTokens(combined) > tokenCap && lines.length > 1) {
+    lines.pop();
+    combined = lines.join('\n');
   }
+  if (estimateTokens(combined) > tokenCap) return null; // even the single remaining row exceeds the cap
-  const sufficient = reasons.length >= 2;
-  return { sufficient, reasons };
+  return {
+    rendered: combined,
+    count: lines.length, // rows actually rendered, after dedup and cap trimming
+    tokens: estimateTokens(combined),
+    outgoingCount: outgoing.length, // rows fetched from the graph, before dedup and cap trimming
+    incomingCount: incoming.length, // rows fetched from the graph, before dedup and cap trimming
+    typeRefCount: typeRefs.length, // rows fetched from the graph, before dedup and cap trimming
+  };
 }
 // =============================================================================
@@ -1069,11 +1589,21 @@ function compressToPreview(code, tokenCap) {
 /**
  * Resolve the effective sub-mode from the format string.
- *   'agent' / 'agent_preview' → 'agent_preview' (compact 4k budget)
- *   'agent_full'               → 'agent_full' (8k budget)
- *   'agent_full_xl'            → 'agent_full_xl' (12k budget, opt-in only;
- *                                falls back to agent_full at allocation time
- *                                when the dominance gate fails)
+ *
+ * EXPLICIT TIERS (caller picks):
+ *   'agent_preview' → 'agent_preview' (compact 4k budget)
+ *   'agent_full'    → 'agent_full'    (8k budget)
+ *   'agent_full_xl' → 'agent_full_xl' (12k budget, opt-in only;
+ *                                      falls back to per-result baseline cap
+ *                                      at allocation time when the top-1
+ *                                      dominance gate fails)
+ *
+ * AUTO-PICK (default for the bare 'agent' format):
+ *   'agent'         → tier chosen by selectAgentBudget(); see that fn.
+ *
+ * Used as a fallback when caller bypasses the auto-pick path (e.g. unit tests
+ * that call resolveSubMode directly). Production code goes through
+ * selectAgentBudget(format, signals) which understands auto-pick.
  */
 function resolveSubMode(format) {
   if (format === 'agent_full_xl') return 'agent_full_xl';
@@ -1081,6 +1611,256 @@ function resolveSubMode(format) {
   return 'agent_preview'; // 'agent' and 'agent_preview' both map here
 }
+// =============================================================================
+// Auto-tier selection — selectAgentBudget
+// =============================================================================
+//
+// Picks the agent-mode budget tier (preview 4k / full 8k / xl 12k) from
+// post-ranking signals when callers pass the bare format='agent'.
+//
+// DESIGN PRINCIPLE: 4k is enough for ~99% of queries.
+//
+// Lost-in-the-middle and RAG-vs-long-context studies (Liu et al., Xu et al.)
+// consistently show that smaller, focused context outperforms bigger context
+// for retrieval tasks. The preview tier already renders top-1 fully (up to
+// 2000 tokens) and gives ranks 2-3 a signature + 5-line snippet — that's
+// enough for the agent to either answer or to escalate via an explicit
+// `format='agent_full'` re-query. Auto should NOT silently pay an 8k or 12k
+// token bill on every borderline query.
+//
+// When does extra budget STRICTLY beat preview?
+//
+//   XL: top-1 itself needs >2k tokens. The dominance gate at allocation
+//       (allocateBudget L1448-1454) raises top-1's per-result cap from 2k
+//       → 8k IFF top-1 >= 2 * top-2. Without the gate, XL caps top-1 at
+//       2k anyway — identical to preview for the top-1 case. So XL only
+//       pays off when BOTH conditions hold: chunk really is big, AND
+//       dominance gate will fire.
+//
+//   FULL: rank 2/3 need full body (each up to 2000 tokens) instead of a
+//         signature + 5 lines. That's only useful when several results
+//         are TIGHTLY tied — i.e. when there's no single answer, just a
+//         set the agent must compare. A query with moderate dominance
+//         (top-1 = 0.9, top-2 = 0.6) doesn't qualify; the agent can read
+//         top-1 fully and re-query if needed.
+//
+// Decision tree (only fires when format='agent'; explicit tiers are pass-thru):
+//
+//   numResults == 0                                       → preview ('auto_empty')
+//   top1Tokens >= 2400 AND (numResults == 1 OR D >= 2.5)  → xl      ('auto_xl_*')
+//   numResults >= 10 AND D < 1.05 AND top1Tokens >= 600   → full    ('auto_full_tight_cluster')
+//   default                                               → preview ('auto_preview_default')
+//
+// Thresholds are deliberately tight — designed so XL+FULL combined fire on
+// roughly 1-5% of queries. On a fastify spot-check (NL queries with k=10),
+// all 6 representative queries land on preview under this rule. Single
+// dominant answers stay on preview unless the chunk is genuinely huge
+// (267+ lines × 9 tokens/line ≥ 2400). Multi-result sets need 10+ results
+// with top-2 within 5% of the top score (D < 1.05) before auto goes to full.
+//
+// Crucially: dominance answers "is top-1 the answer?", NOT "is top-1 big?".
+// We require both signals (and a high-bar threshold on each) before paying
+// the XL token cost. Likewise, "many results" alone is not a reason to
+// upgrade — the cluster has to be tight (D < 1.05) AND deep (≥ 10 items).
+//
+// Signals (computeBudgetSignals, all post-ranking — pure):
+//   - numResults  : ranked-results length
+//   - dominance   : top1.score / top2.score (sentinel 99 for single result)
+//   - top1Tokens  : estimated tokens of top-1 chunk (lineCount * 9, the
+//                   same per-line conversion the rest of the packager uses).
+//                   Equals 0 when start/end lines are unavailable — those
+//                   results stay on preview.
+//
+// `breadth` (grepMatches / candidatePoolSize) and `entropy` are still
+// computed and surfaced in `budgetSignals` for diagnostics, but neither
+// drives the decision: a broad pool is not a reason to give top-1 more
+// space, and small-N entropy is dominated by the 1/log(n) denominator and
+// stops being a reliable distribution-width signal.
+const BUDGET_TIERS = { // tier key → sub-mode label and that tier's default token budget
+  preview: { subMode: 'agent_preview', budget: 4000 },
+  full:    { subMode: 'agent_full',    budget: 8000 },
+  xl:      { subMode: 'agent_full_xl', budget: 12000 },
+};
+/**
+ * Compute auto-pick signals from ranked results + searchStats.
+ * Pure: does not look at file content or call into expensive code paths.
+ *
+ * Only finite, strictly positive scores take part in `dominance` and
+ * `entropy`. When no such score exists, `dominance`, `entropy` and
+ * `breadth` are all 0; when exactly one exists, `dominance` is the
+ * sentinel 99. A non-array or empty `rankedResults` yields all zeros.
+ *
+ * @param {Array} rankedResults - Results after ranking pipeline (PRE-packaging)
+ * @param {object} searchStats - Stats from the retrieval pipeline
+ * @returns {{
+ *   numResults: number, breadth: number, dominance: number,
+ *   entropy: number, top1Tokens: number, top1LineCount: number
+ * }}
+ */
+export function computeBudgetSignals(rankedResults, searchStats = {}) {
+  const numResults = Array.isArray(rankedResults) ? rankedResults.length : 0;
+  if (numResults === 0) {
+    return { numResults: 0, breadth: 0, dominance: 0, entropy: 0, top1Tokens: 0, top1LineCount: 0 };
+  }
+  // Use whichever score field the ranker emitted. Pattern (colgrep) emits
+  // `lateInteractionScore`; hybrid/semantic/lexical emit `score`. Keep both
+  // paths working without renaming.
+  const scores = rankedResults
+    .map(r => Number(r?.score ?? r?.lateInteractionScore ?? 0))
+    .filter(s => Number.isFinite(s) && s > 0); // dropped entries shift indices, so scores[i] is not guaranteed to belong to rank i
+  // Top-1 size proxy — derived from the chunk's start/end lines. Uses the
+  // same 9 tokens/line conversion the rest of the packager applies (see
+  // expandToSymbol / renderCode in structural-context.js). Returns 0 when
+  // either bound is missing, in which case the auto-pick falls back to the
+  // preview branch instead of guessing.
+  const top1 = rankedResults[0] || {};
+  const top1Start = top1.metadata?.startLine ?? top1.startLine ?? null;
+  const top1End = top1.metadata?.endLine ?? top1.endLine ?? null;
+  const top1LineCount = (top1Start != null && top1End != null && top1End >= top1Start)
+    ? (top1End - top1Start + 1)
+    : 0;
+  const top1Tokens = top1LineCount * 9;
+  if (scores.length === 0) {
+    return { numResults, breadth: 0, dominance: 0, entropy: 0, top1Tokens, top1LineCount };
+  }
+  const topScore = scores[0];
+  const secondScore = scores[1] ?? 0;
+  // Sentinel "very high" dominance (99) when there is no second positive score.
+  // In selectAgentBudget this rules out the FULL tier but still passes the XL dominance gate.
+  const dominance = secondScore > 0 ? topScore / secondScore : 99;
+  // Normalised Shannon entropy — KEPT FOR DIAGNOSTIC OUTPUT only. Not used
+  // by selectAgentBudget after the small-N flaw was identified (2-result
+  // entropy is forced into [0.7, 1.0] by the 1/log(n) denominator).
+  let entropy = 0;
+  if (scores.length > 1) {
+    const sum = scores.reduce((a, b) => a + b, 0);
+    if (sum > 0) {
+      let H = 0;
+      for (const s of scores) {
+        const p = s / sum;
+        if (p > 0) H -= p * Math.log(p);
+      }
+      entropy = H / Math.log(scores.length);
+    }
+  }
+  // Breadth — KEPT FOR DIAGNOSTIC OUTPUT only. Not used by tier selection
+  // (broad candidate pools aren't a reason to give top-1 more tokens; only
+  // top-1 actually being big is). `allocateBudget` still uses breadth for
+  // its within-tier top-1-share sharpening (its job, not ours).
+  const breadth = Number(
+    searchStats?.grepMatches
+    ?? searchStats?.candidatePoolSize
+    ?? 0
+  ) || 0;
+  return { numResults, breadth, dominance, entropy, top1Tokens, top1LineCount };
+}
+/**
+ * Pick the agent-mode tier for a request.
+ *
+ * Explicit tier formats (agent_preview / agent_full / agent_full_xl) are
+ * pass-through. The bare 'agent' format triggers the auto-pick decision
+ * tree using the signals above.
+ *
+ * Format-gating note: all return values keep `format='agent_*'` semantics,
+ * so the `_isAgentFormat` ranking flag (file-kind-ranking.js:1443) remains
+ * TRUE regardless of which tier we land on. Ranking is unchanged.
+ *
+ * @param {string} format - 'agent' | 'agent_preview' | 'agent_full' | 'agent_full_xl'
+ * @param {object} signals - From computeBudgetSignals()
+ * @param {object} [opts]
+ * @param {number} [opts.explicitBudget] - Caller-supplied tokenBudget; if set,
+ *   bypass auto-pick and infer the tier from the value (matches trace's
+ *   selectBudget contract).
+ * @returns {{ tier: 'preview'|'full'|'xl', subMode: string, tokenBudget: number, reason: string }}
+ *   The explicit-format branches (reasons explicit_preview / explicit_full /
+ *   explicit_xl) additionally carry a `budget` key, because they spread the
+ *   matching BUDGET_TIERS entry into the result.
+ */
+export function selectAgentBudget(format, signals, opts = {}) {
+  // Explicit numeric budget always wins. Pass the value through unchanged
+  // (callers that pass tiny budgets — e.g. `tokenBudget: 1` for hard-ceiling
+  // tests — expect the packager to honour them as a strict cap). We only
+  // clamp the value used for tier inference, so the subMode label stays sane.
+  if (opts.explicitBudget != null && Number.isFinite(opts.explicitBudget)) {
+    const n = Math.floor(opts.explicitBudget);
+    const tierBound = Math.max(1000, Math.min(16000, n));
+    const tier = tierBound >= 11000 ? 'xl' : tierBound >= 7000 ? 'full' : 'preview';
+    return { tier, subMode: BUDGET_TIERS[tier].subMode, tokenBudget: n, reason: 'explicit_budget' };
+  }
+  // Explicit tier flags — caller is asking for a specific budget.
+  if (format === 'agent_preview') {
+    return { tier: 'preview', ...BUDGET_TIERS.preview, tokenBudget: BUDGET_TIERS.preview.budget, reason: 'explicit_preview' };
+  }
+  if (format === 'agent_full') {
+    return { tier: 'full', ...BUDGET_TIERS.full, tokenBudget: BUDGET_TIERS.full.budget, reason: 'explicit_full' };
+  }
+  if (format === 'agent_full_xl') {
+    return { tier: 'xl', ...BUDGET_TIERS.xl, tokenBudget: BUDGET_TIERS.xl.budget, reason: 'explicit_xl' };
+  }
+  // Auto-pick: format === 'agent' (or anything unrecognised — defensive).
+  // Design target: preview fires on ~99% of queries; XL+FULL combined ~1-5%.
+  const { numResults, dominance, top1Tokens } = signals || {};
+  const N = Number(numResults) || 0;
+  const D = Number.isFinite(dominance) ? dominance : 0;
+  const T1 = Number(top1Tokens) || 0;
+  const pick = (tier, reason) => ({
+    tier,
+    subMode: BUDGET_TIERS[tier].subMode,
+    tokenBudget: BUDGET_TIERS[tier].budget,
+    reason,
+  });
+  // Tight thresholds. Both upgrade paths require strong, hard-to-fake signals.
+  //   XL_TOP1_TOKENS = ~267 lines × 9 t/line. Below this, top-1's render fits
+  //                    inside the 2000-token per-result preview cap and XL
+  //                    adds no usable budget.
+  //   XL_DOMINANCE   = 2.5×. We need the dominance gate to FIRE at
+  //                    allocation time (allocateBudget L1448-1454 needs
+  //                    top1 ≥ 2 × top2); we add headroom (2.5 vs 2.0) so
+  //                    we don't pick XL on borderline cases that the gate
+  //                    might miss.
+  //   FULL_MIN_N     = 10 results. Fewer than this and the agent can
+  //                    re-read rank 2 (which is shown as a preview anyway).
+  //   FULL_MAX_DOM   = 1.05. Strictly tied cluster — top-1 is at most 5%
+  //                    ahead of top-2. Anything wider and the agent
+  //                    can treat top-1 as the answer.
+  //   FULL_MIN_TOP1  = 600 t (~67 lines). If top-1 is tiny, ranks 2-3
+  //                    being expanded buys nothing — preview's signature
+  //                    already shows everything.
+  const XL_TOP1_TOKENS = 2400;
+  const XL_DOMINANCE = 2.5;
+  const FULL_MIN_N = 10;
+  const FULL_MAX_DOM = 1.05;
+  const FULL_MIN_TOP1 = 600;
+  if (N === 0) return pick('preview', 'auto_empty');
+  // XL path: huge top-1 that dominates. Single-result counts as "dominates"
+  // (no top-2 to compete). Both branches gate on T1 >= XL_TOP1_TOKENS so we
+  // never pick XL when extra space would go unused.
+  if (T1 >= XL_TOP1_TOKENS) {
+    if (N === 1) return pick('xl', 'auto_xl_single_huge');
+    if (D >= XL_DOMINANCE) return pick('xl', 'auto_xl_dominant_huge_top1');
+  }
+  // FULL path: tightly-clustered multi-result set with non-trivial chunks.
+  // All three conditions must hold — comparison-shaped queries with many
+  // tied alternatives are the narrow profile where rank 2/3 full bodies
+  // pay off. Single dominant answers and small clusters stay on preview.
+  if (N >= FULL_MIN_N && D < FULL_MAX_DOM && T1 >= FULL_MIN_TOP1) { // D compares only top-1 against top-2; lower ranks are not inspected
+    return pick('full', 'auto_full_tight_cluster');
+  }
+  // PREVIEW: default for ~99% of queries. The agent can always escalate
+  // to full or xl with an explicit format flag if the answer needs more.
+  return pick('preview', 'auto_preview_default');
+}
 /**
  * Package ranked results into agent-mode context blocks.
  *
@@ -1119,28 +1899,86 @@ export function packageForAgent(rankedResults, searchStats, opts) {
   } = opts;
   const ablations = opts.ablations || new Set();
-  const subMode = resolveSubMode(formatOpt);
-  const defaultBudget = subMode === 'agent_full_xl' ? AGENT_FULL_XL_TOKEN_BUDGET
-    : subMode === 'agent_full' ? AGENT_FULL_TOKEN_BUDGET
-    : DEFAULT_TOKEN_BUDGET;
-  const tokenBudget = opts.tokenBudget ?? defaultBudget;
+  // Auto-tier selection: pick preview / full / xl based on score-distribution
+  // signals when format='agent'. Explicit format=='agent_preview|full|full_xl'
+  // and explicit numeric tokenBudget remain as overrides. Mirrors trace's
+  // adaptive selectBudget (core/graph/structural-context.js:37). See
+  // selectAgentBudget() above for the decision tree.
+  //
+  // Disabled by 'no-auto-budget' ablation — falls back to the legacy
+  // resolveSubMode mapping (which treats 'agent' as 'agent_preview').
+  let subMode, tokenBudget, budgetReason, budgetSignals;
+  if (ablations.has('no-auto-budget')) {
+    subMode = resolveSubMode(formatOpt);
+    const defaultBudget = subMode === 'agent_full_xl' ? AGENT_FULL_XL_TOKEN_BUDGET
+      : subMode === 'agent_full' ? AGENT_FULL_TOKEN_BUDGET
+      : DEFAULT_TOKEN_BUDGET;
+    tokenBudget = opts.tokenBudget ?? defaultBudget;
+    budgetReason = 'ablation_no_auto_budget';
+    budgetSignals = null;
+  } else {
+    budgetSignals = computeBudgetSignals(rankedResults, searchStats);
+    const pick = selectAgentBudget(formatOpt, budgetSignals, {
+      explicitBudget: opts.tokenBudget,
+    });
+    subMode = pick.subMode;
+    tokenBudget = pick.tokenBudget;
+    budgetReason = pick.reason;
+  }
   const start = performance.now();
   const fileCache = new Map();
+  // Locality clustering: pull up to two non-overlapping companion results
+  // from the SAME file as top-1 (when their score is competitive, ≥ top-1/3)
+  // ahead of unrelated higher-scoring distractors. This addresses the
+  // dominant agent-bench loss pattern where the right helper symbol existed
+  // in the ranked list at rank 4 but got demoted to summary because a
+  // tangential file scored slightly higher. Top-1 is never moved.
+  // Disabled by 'no-locality-cluster' ablation.
+  let workingResults = rankedResults;
+  if (!ablations.has('no-locality-cluster') && rankedResults.length >= 3) {
+    const top = rankedResults[0];
+    const topFile = top?.metadata?.file || top?.file;
+    const topScore = top?.score || top?.lateInteractionScore || 0;
+    if (topFile && topScore > 0) {
+      const sameFile = [];
+      const other = [];
+      for (let i = 1; i < rankedResults.length; i++) {
+        const r = rankedResults[i];
+        const f = r.metadata?.file || r.file;
+        const s = r.score || r.lateInteractionScore || 0;
+        // Don't pull up overlapping same-file ranges (those are diversity dups).
+        const ts = top.metadata?.startLine || top.startLine;
+        const te = top.metadata?.endLine || top.endLine;
+        const rs = r.metadata?.startLine || r.startLine;
+        const re = r.metadata?.endLine || r.endLine;
+        const overlapsTop = (rs != null && re != null && ts != null && te != null)
+          && rs <= te + 10 && re >= ts - 10;
+        if (f === topFile && s >= topScore / 3 && !overlapsTop) sameFile.push(r);
+        else other.push(r);
+      }
+      // Promote up to 2 companion results into ranks 2 and 3, push the
+      // rest behind. We deliberately keep `score` untouched so callers
+      // can still inspect the original ranking signal.
+      workingResults = [top, ...sameFile.slice(0, 2), ...other, ...sameFile.slice(2)]
+        .map((r, idx) => ({ ...r, rank: idx + 1 }));
+    }
+  }
   // Diversity: demote results that cluster in same file+region as a higher-ranked result.
   // Skipped when 'no-diversity' ablation is active.
   // This prevents wasting preview/full budget on near-duplicate chunks from the same symbol.
   const diversityDemotions = new Set();
   if (ablations.has('no-diversity')) { /* skip diversity check */ }
-  else for (let i = 0; i < Math.min(rankedResults.length, 5); i++) {
-    const ri = rankedResults[i];
+  else for (let i = 0; i < Math.min(workingResults.length, 5); i++) {
+    const ri = workingResults[i];
     const fi = ri.metadata?.file || ri.file;
     const si = ri.metadata?.startLine || ri.startLine;
     const ei = ri.metadata?.endLine || ri.endLine;
-    for (let j = i + 1; j < Math.min(rankedResults.length, 5); j++) {
+    for (let j = i + 1; j < Math.min(workingResults.length, 5); j++) {
       if (diversityDemotions.has(j)) continue;
-      const rj = rankedResults[j];
+      const rj = workingResults[j];
       const fj = rj.metadata?.file || rj.file;
       if (fi !== fj) continue;
       const sj = rj.metadata?.startLine || rj.startLine;
@@ -1159,12 +1997,12 @@ export function packageForAgent(rankedResults, searchStats, opts) {
     : {
         ...(searchStats?.grepMatches != null ? { grepMatches: searchStats.grepMatches } : {}),
         ...(searchStats?.candidatePoolSize != null ? { candidatePoolSize: searchStats.candidatePoolSize } : {}),
-        results: rankedResults,
+        results: workingResults,
       };
-  const allocations = allocateBudget(tokenBudget, rankedResults.length, subMode, budgetContext);
+  const allocations = allocateBudget(tokenBudget, workingResults.length, subMode, budgetContext);
   // Compute confidence from ranked results (Fix #4: regex selectivity included)
-  const confidenceInfo = computeConfidence(rankedResults, searchStats);
+  const confidenceInfo = computeConfidence(workingResults, searchStats);
   // Shared staleness cache — db mtime is the same for all results in one search.
   // Avoids repeated statSync calls (Fix D: perf).
@@ -1173,8 +2011,8 @@ export function packageForAgent(rankedResults, searchStats, opts) {
   let tokensUsed = 0;
   const agentResults = [];
-  for (let i = 0; i < rankedResults.length; i++) {
-    const result = rankedResults[i];
+  for (let i = 0; i < workingResults.length; i++) {
+    const result = workingResults[i];
     const allocation = allocations[i] || { presentation: 'summary', tokenCap: 0 };
     const meta = result.metadata || {};
     const filePath = meta.file || result.file;
@@ -1370,36 +2208,108 @@ export function packageForAgent(rankedResults, searchStats, opts) {
       }
     }
+    // Phase 6: Graph-neighbour reservation (top-1 only). The pack reserves
+    // 15-20% of the budget (by subMode, capped at 1000 tokens and at the
+    // remaining headroom) for a dedicated 1-hop neighbours tier, and skips
+    // the tier when fewer than 80 tokens are available. Surfaced
+    // as `agentResult.neighbors`; rendered for the agent by the CLI shim.
+    // Disabled by 'no-graph-neighbors' ablation. Always opt-OUT, never
+    // model-specific — the rendering is plain text.
+    if (i === 0
+        && !ablations.has('no-graph-neighbors')
+        && expansion.entityId
+        && codeGraphRepo) {
+      // Reserve fraction depends on subMode (15% preview, 18% full, 20% xl)
+      // and is never above 20% / 1000 toks. Full and xl reserve a larger
+      // share so the top-1 gets more neighbour evidence; the reservation is
+      // still limited to whatever headroom the budget has left.
+      const reserveFraction = subMode === 'agent_full_xl' ? 0.20
+        : subMode === 'agent_full' ? 0.18
+        : 0.15;
+      const headroom = Math.max(0, tokenBudget - tokensUsed);
+      const desired = Math.min(1000, Math.floor(tokenBudget * reserveFraction));
+      const tokenCap = Math.min(headroom, desired);
+      if (tokenCap >= 80) {
+        // Build skip set from ALL ranked locations that will be shown
+        // with code (full / preview tiers). Summary-tier rows are not
+        // skipped — they convey no code and the neighbour tier still
+        // adds value (edge type + direction). This avoids the
+        // pathological case (validation-pipeline) where every caller is
+        // already in the pack as a summary row, leaving the agent with
+        // file:line refs but no edge attribution.
+        const skipKeys = new Set();
+        for (let j = 0; j < workingResults.length; j++) {
+          const tier = allocations[j]?.presentation;
+          if (tier !== 'full' && tier !== 'preview') continue;
+          const r = workingResults[j];
+          const f = r.metadata?.file || r.file;
+          const s = r.metadata?.startLine || r.startLine;
+          const e = r.metadata?.endLine || r.endLine;
+          if (f && s != null && e != null) {
+            skipKeys.add(`${f}|${s}|${e}`);
+          }
+        }
+        skipKeys.add(`${filePath}|${expansion.startLine}|${expansion.endLine}`);
+        const neighbours = renderGraphNeighbors({
+          codeGraphRepo,
+          entity: {
+            id: expansion.entityId,
+            filePath,
+            startLine: expansion.startLine,
+            endLine: expansion.endLine,
+            name: expansion.symbol,
+            type: expansion.symbolType,
+          },
+          skipKeys,
+          tokenCap,
+          // Pass the loaded code so the neighbour tier can also surface
+          // referenced TYPE definitions (struct/enum/...) discovered by
+          // name from the body — fills the gap left by relationship-only
+          // edges (e.g. Go method receiver fields with custom types).
+          body: code,
+        });
+        if (neighbours) {
+          agentResult.neighbors = neighbours;
+          tokensUsed += neighbours.tokens;
+        }
+      }
+    }
     agentResults.push(agentResult);
   }
   const packagingMs = Math.round(performance.now() - start);
-  // Fix #7: Sufficiency signal for top-1 result
+  // Sufficiency signal for top-1. Tightened in 2026-05: requires resolution
+  // (header_resolved OR neighbors_present OR self_contained_strict) instead
+  // of the old "complete_symbol + high_confidence" rule.
   let sufficient = false;
   let sufficiencyReasons = [];
+  let unresolvedExternalCount = 0;
   if (agentResults.length > 0 && agentResults[0].code) {
     const sufficiency = computeSufficiency(agentResults[0], confidenceInfo);
     sufficient = sufficiency.sufficient;
     sufficiencyReasons = sufficiency.reasons;
+    unresolvedExternalCount = sufficiency.unresolvedExternalCount || 0;
   }
   return {
     query,
     regex,
     mode: modeOpt || searchStats?.path || 'pattern',
-    totalResults: rankedResults.length,
+    totalResults: workingResults.length,
     latencyMs: searchStats?.total_ms || 0,
     packagingMs,
     format: 'agent',
     subMode,
     tokenBudget,
+    budgetReason,
+    budgetSignals,
     tokensUsed,
     confidence: confidenceInfo.confidence,
     confidenceReason: confidenceInfo.confidenceReason,
     sufficient,
     sufficiencyReasons,
+    unresolvedExternalCount,
     results: agentResults,
   };