npm - supipowers - Versions diffs - 2.0.2 → 2.1.0 - Mend

supipowers 2.0.2 → 2.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (76) hide show

package/README.md +5 -6
package/package.json +4 -2
package/skills/harness/SKILL.md +1 -0
package/src/bootstrap.ts +5 -133
package/src/config/defaults.ts +5 -5
package/src/config/loader.ts +1 -0
package/src/config/schema.ts +2 -6
package/src/context-mode/knowledge/store.ts +381 -43
package/src/context-mode/tools.ts +41 -3
package/src/deps/registry.ts +1 -12
package/src/fix-pr/assessment.ts +1 -0
package/src/fix-pr/prompt-builder.ts +1 -0
package/src/git/commit.ts +76 -18
package/src/harness/command.ts +103 -6
package/src/harness/default-agents/docs.md +39 -0
package/src/harness/docs/config.ts +29 -0
package/src/harness/docs/glob-match.ts +27 -0
package/src/harness/docs/index-renderer.ts +82 -0
package/src/harness/docs/provenance.ts +125 -0
package/src/harness/docs/regen-decision.ts +167 -0
package/src/harness/docs/representative-files.ts +175 -0
package/src/harness/docs/source-hash.ts +106 -0
package/src/harness/docs/validator.ts +233 -0
package/src/harness/hooks/layer-context-inject.ts +35 -1
package/src/harness/hooks/register.ts +24 -3
package/src/harness/pipeline.ts +20 -5
package/src/harness/pr-comment/baseline.ts +105 -0
package/src/harness/pr-comment/ci-env.ts +120 -0
package/src/harness/pr-comment/gh-poster.ts +227 -0
package/src/harness/pr-comment/handler.ts +198 -0
package/src/harness/pr-comment/render.ts +297 -0
package/src/harness/pr-comment/status.ts +95 -0
package/src/harness/pr-comment/types.ts +73 -0
package/src/harness/pr-comment/workflow-summary.ts +47 -0
package/src/harness/project-paths.ts +95 -0
package/src/harness/stages/design.ts +1 -0
package/src/harness/stages/discover.ts +1 -13
package/src/harness/stages/docs.ts +708 -0
package/src/harness/stages/implement-apply.ts +877 -0
package/src/harness/stages/implement.ts +64 -51
package/src/harness/stages/plan.ts +25 -16
package/src/harness/stages/validate.ts +370 -0
package/src/harness/storage.ts +142 -0
package/src/harness/tools.ts +130 -0
package/src/mempalace/bridge.ts +207 -41
package/src/mempalace/config.ts +10 -4
package/src/mempalace/format.ts +122 -6
package/src/mempalace/hooks.ts +204 -56
package/src/mempalace/installer-helper.ts +18 -4
package/src/mempalace/python/mempalace_bridge.py +128 -3
package/src/mempalace/runtime.ts +53 -16
package/src/mempalace/schema.ts +151 -30
package/src/mempalace/session-summary.ts +5 -0
package/src/mempalace/tool.ts +17 -4
package/src/mempalace/upstream-limits.ts +69 -0
package/src/planning/approval-flow.ts +25 -2
package/src/planning/planning-ask-tool.ts +34 -4
package/src/planning/system-prompt.ts +1 -1
package/src/tool-catalog/active-tool-controller.ts +0 -22
package/src/tool-catalog/active-tool-planner.ts +0 -26
package/src/tool-catalog/tool-groups.ts +1 -9
package/src/types.ts +87 -8
package/src/ui-design/session.ts +114 -8
package/src/utils/executable.ts +10 -1
package/src/workspace/state-paths.ts +1 -1
package/src/commands/mcp.ts +0 -814
package/src/mcp/activation.ts +0 -77
package/src/mcp/config.ts +0 -223
package/src/mcp/docs.ts +0 -154
package/src/mcp/gateway.ts +0 -103
package/src/mcp/lifecycle.ts +0 -79
package/src/mcp/manager-tool.ts +0 -104
package/src/mcp/mcpc.ts +0 -113
package/src/mcp/registry.ts +0 -98
package/src/mcp/triggers.ts +0 -62
package/src/mcp/types.ts +0 -95

package/src/context-mode/knowledge/store.ts CHANGED Viewed

@@ -11,6 +11,8 @@ export interface SearchOptions {
   includeAllSessions?: boolean;
 }
+export type SearchMatchLayer = "porter" | "trigram" | "rrf" | "rrf-fuzzy";
 export interface SearchResult {
   title: string;
   body: string;
@@ -19,6 +21,12 @@ export interface SearchResult {
   score: number;
   ownerScope: KnowledgeOwnerScope;
   ownerId: string;
+  /** Which layer of the fallback chain surfaced this row. Optional for backward compat. */
+  matchLayer?: SearchMatchLayer;
+}
+interface RankedSearchResult extends SearchResult {
+  chunkId: number;
 }
 export interface QueryGroupedResults {
@@ -37,7 +45,7 @@ export interface KnowledgeClearResult {
   urlCacheDeleted: number;
 }
-const SCHEMA_VERSION = 2;
+const SCHEMA_VERSION = 3;
 const SCHEMA = `
 CREATE TABLE IF NOT EXISTS content_chunks (
@@ -58,12 +66,26 @@ CREATE VIRTUAL TABLE IF NOT EXISTS content_chunks_fts USING fts5(
   tokenize='porter'
 );
+CREATE VIRTUAL TABLE IF NOT EXISTS content_chunks_trigram USING fts5(
+  title,
+  body,
+  content='content_chunks',
+  content_rowid='id',
+  tokenize='trigram'
+);
+CREATE TABLE IF NOT EXISTS vocabulary (
+  word TEXT PRIMARY KEY
+);
 CREATE TRIGGER IF NOT EXISTS content_chunks_ai AFTER INSERT ON content_chunks BEGIN
   INSERT INTO content_chunks_fts(rowid, title, body) VALUES (new.id, new.title, new.body);
+  INSERT INTO content_chunks_trigram(rowid, title, body) VALUES (new.id, new.title, new.body);
 END;
 CREATE TRIGGER IF NOT EXISTS content_chunks_ad AFTER DELETE ON content_chunks BEGIN
   INSERT INTO content_chunks_fts(content_chunks_fts, rowid, title, body) VALUES ('delete', old.id, old.title, old.body);
+  INSERT INTO content_chunks_trigram(content_chunks_trigram, rowid, title, body) VALUES ('delete', old.id, old.title, old.body);
 END;
 CREATE INDEX IF NOT EXISTS idx_content_chunks_owner ON content_chunks(owner_scope, owner_id);
@@ -106,7 +128,50 @@ export class KnowledgeStore {
     this.#ensureDeleteJournalMode();
     this.#migrate();
     this._db.exec(SCHEMA);
+    this.#rebuildFtsIfNeeded();
+    this.#backfillVocabularyIfNeeded();
+  }
+  /**
+   * Rebuild both FTS5 indexes when either one's row count differs from the
+   * number of rows in `content_chunks`. Does nothing for an empty store.
+   *
+   * NOTE(review): both FTS tables are declared with `content='content_chunks'`
+   * (external content). Confirm that `#countRows` measures rows that are
+   * actually indexed rather than rows read through from the content table;
+   * otherwise this guard can never observe a mismatch.
+   */
+  #rebuildFtsIfNeeded(): void {
+    const chunkCount = this._db.prepare("SELECT COUNT(*) AS cnt FROM content_chunks").get() as { cnt: number };
+    // Nothing to index yet, so there is nothing to rebuild.
+    if (chunkCount.cnt === 0) return;
+    const ftsCount = this.#countRows("content_chunks_fts");
+    const trigramCount = this.#countRows("content_chunks_trigram");
+    // Both indexes already agree with the content table: skip the rebuild.
+    if (ftsCount === chunkCount.cnt && trigramCount === chunkCount.cnt) return;
     this._db.exec("INSERT INTO content_chunks_fts(content_chunks_fts) VALUES('rebuild')");
+    this._db.exec("INSERT INTO content_chunks_trigram(content_chunks_trigram) VALUES('rebuild')");
+  }
+  /**
+   * Count the documents that are actually present in an FTS5 index.
+   *
+   * Both FTS tables are external-content tables (`content='content_chunks'`).
+   * A plain `SELECT COUNT(*)` against such a table is answered by scanning the
+   * content table, so it always equals the `content_chunks` count even when
+   * the index itself is empty (for example a trigram table that was just
+   * created on a migrated store). The `<table>_docsize` shadow table holds one
+   * row per indexed document and therefore reflects the real index state.
+   *
+   * @param table Name of the FTS5 virtual table to inspect.
+   * @returns Number of documents currently indexed in `table`.
+   */
+  #countRows(table: "content_chunks_fts" | "content_chunks_trigram"): number {
+    const row = this._db.prepare(`SELECT COUNT(*) AS cnt FROM ${table}_docsize`).get() as { cnt: number };
+    return row.cnt;
+  }
+  /**
+   * Populate `vocabulary` from existing chunks when it is empty but the store
+   * is not. Runs once on the first init() after a v2 → v3 migration; a no-op
+   * for fresh stores (no chunks) and for already-populated stores.
+   *
+   * NOTE(review): rows are streamed from an open SELECT cursor while INSERTs
+   * run on the same connection inside the transaction. Confirm the SQLite
+   * driver in use permits writes during an active `iterate()`.
+   */
+  #backfillVocabularyIfNeeded(): void {
+    const vocabCount = this._db.prepare("SELECT COUNT(*) AS cnt FROM vocabulary").get() as { cnt: number };
+    // Any existing vocabulary row means the backfill (or normal indexing) already ran.
+    if (vocabCount.cnt > 0) return;
+    const chunkCount = this._db.prepare("SELECT COUNT(*) AS cnt FROM content_chunks").get() as { cnt: number };
+    if (chunkCount.cnt === 0) return;
+    // OR IGNORE: `word` is the primary key, so repeated words are skipped silently.
+    const ins = this._db.prepare("INSERT OR IGNORE INTO vocabulary (word) VALUES (?)");
+    const rows = this._db
+      .prepare("SELECT title, body FROM content_chunks")
+      .iterate() as IterableIterator<{ title: string; body: string }>;
+    // One transaction for the whole backfill instead of one per inserted word.
+    this._db.transaction(() => {
+      for (const row of rows) {
+        // Title and body are tokenized together, the same way the indexing path does it.
+        for (const word of extractVocabWords(`${row.title}\n${row.body}`)) {
+          ins.run(word);
+        }
+      }
+    })();
   }
   #ensureDeleteJournalMode(): void {
@@ -176,6 +241,15 @@ export class KnowledgeStore {
       `);
     }
+    if (user_version < 3) {
+      // v2 → v3: the INSERT/DELETE triggers now also fan out to
+      // `content_chunks_trigram`. Drop the legacy single-table triggers so the
+      // idempotent CREATE TRIGGER IF NOT EXISTS in `SCHEMA` reinstalls the
+      // multi-table versions. Trigram + vocab backfill happen in init().
+      this._db.exec(`DROP TRIGGER IF EXISTS content_chunks_ai;`);
+      this._db.exec(`DROP TRIGGER IF EXISTS content_chunks_ad;`);
+    }
     this._db.exec(`PRAGMA user_version = ${SCHEMA_VERSION}`);
   }
@@ -193,6 +267,7 @@ export class KnowledgeStore {
       `INSERT INTO content_chunks (source, title, body, content_type, owner_scope, owner_id)
        VALUES (?, ?, ?, ?, ?, ?)`,
     );
+    const vocabIns = this._db.prepare("INSERT OR IGNORE INTO vocabulary (word) VALUES (?)");
     this._db.transaction(() => {
       del.run(source, resolvedOwner.ownerScope, resolvedOwner.ownerId, resolvedOwner.ownerScope);
@@ -205,6 +280,9 @@ export class KnowledgeStore {
           resolvedOwner.ownerScope,
           resolvedOwner.ownerId,
         );
+        for (const word of extractVocabWords(`${chunk.title}\n${chunk.body}`)) {
+          vocabIns.run(word);
+        }
       }
     })();
   }
@@ -216,53 +294,126 @@ export class KnowledgeStore {
     const results: QueryGroupedResults[] = [];
     for (const query of queries) {
-      const sanitized = sanitizeFtsQuery(query);
-      if (!sanitized) {
+      const tokens = tokenizeQuery(query);
+      if (tokens.length === 0) {
         results.push({ query, results: [] });
         continue;
       }
-      let sql = `
-        SELECT c.title, c.body, c.source, c.content_type AS contentType,
-               c.owner_scope AS ownerScope,
-               c.owner_id AS ownerId,
-               bm25(content_chunks_fts, 5.0, 1.0) AS score
-        FROM content_chunks_fts f
-        JOIN content_chunks c ON c.id = f.rowid
-        WHERE content_chunks_fts MATCH ?
-      `;
-      const params: (string | number)[] = [sanitized];
-      if (options?.source) {
-        sql += " AND c.source LIKE '%' || ? || '%'";
-        params.push(options.source);
-      }
-      if (options?.contentType) {
-        sql += " AND c.content_type = ?";
-        params.push(options.contentType);
-      }
+      const fetchLimit = Math.max(limit * 2, 10);
+      const porterRows = this.#runFts("content_chunks_fts", buildOrQuery(tokens), fetchLimit, options);
+      const trigramRows = this.#runFts("content_chunks_trigram", buildOrQuery(tokens.filter(t => t.length >= 3)), fetchLimit, options);
-      const visibility = buildVisibilityClause(options);
-      if (visibility) {
-        sql += ` AND ${visibility.sql}`;
-        params.push(...visibility.params);
-      }
-      sql += " ORDER BY score LIMIT ?";
-      params.push(limit);
+      let fused = rrfFuse(porterRows, trigramRows, limit, "rrf");
-      try {
-        const rows = this._db.prepare(sql).all(...params) as SearchResult[];
-        results.push({ query, results: rows });
-      } catch {
-        // FTS5 query syntax error — return empty for this query
-        results.push({ query, results: [] });
+      if (fused.length === 0) {
+        const corrected = this.#fuzzyCorrectTokens(tokens);
+        if (corrected && corrected.join(" ") !== tokens.join(" ")) {
+          const porter2 = this.#runFts("content_chunks_fts", buildOrQuery(corrected), fetchLimit, options);
+          const trigram2 = this.#runFts("content_chunks_trigram", buildOrQuery(corrected.filter(t => t.length >= 3)), fetchLimit, options);
+          fused = rrfFuse(porter2, trigram2, limit, "rrf-fuzzy");
+        }
       }
+      const reranked = applyProximityReranking(fused, tokens);
+      results.push({ query, results: reranked });
     }
     return results;
   }
+  /**
+   * Run one FTS5 MATCH query against `table` with the standard source /
+   * contentType / visibility filters. Returns empty on FTS5 syntax errors so
+   * a single bad token in a multi-query call cannot break sibling queries.
+   *
+   * @param table     FTS5 virtual table to query (porter or trigram index).
+   * @param matchExpr FTS5 MATCH expression; an empty string short-circuits to `[]`.
+   * @param limit     Maximum number of rows to return.
+   * @param options   Optional source / contentType / visibility filters.
+   * @returns Rows ordered by ascending `score` (the bm25() value), each
+   *          carrying the `content_chunks` row id as `chunkId`. Any error
+   *          thrown while preparing or running the statement yields `[]`.
+   */
+  #runFts(
+    table: "content_chunks_fts" | "content_chunks_trigram",
+    matchExpr: string,
+    limit: number,
+    options: SearchOptions | undefined,
+  ): RankedSearchResult[] {
+    if (!matchExpr) return [];
+    // `table` is interpolated into the SQL text; it is restricted to the two
+    // literal table names by its type. All user-supplied values are bound.
+    const sql: string[] = [
+      `SELECT c.id AS chunkId, c.title, c.body, c.source, c.content_type AS contentType,`,
+      `       c.owner_scope AS ownerScope,`,
+      `       c.owner_id AS ownerId,`,
+      // bm25() column weights: 5.0 for the first indexed column, 1.0 for the second.
+      `       bm25(${table}, 5.0, 1.0) AS score`,
+      `FROM ${table} f`,
+      `JOIN content_chunks c ON c.id = f.rowid`,
+      `WHERE ${table} MATCH ?`,
+    ];
+    // `params` must stay in the same order as the `?` placeholders appended below.
+    const params: (string | number)[] = [matchExpr];
+    if (options?.source) {
+      // Substring match on the source, not an exact comparison.
+      sql.push("AND c.source LIKE '%' || ? || '%'");
+      params.push(options.source);
+    }
+    if (options?.contentType) {
+      sql.push("AND c.content_type = ?");
+      params.push(options.contentType);
+    }
+    const visibility = buildVisibilityClause(options);
+    if (visibility) {
+      sql.push(`AND ${visibility.sql}`);
+      params.push(...visibility.params);
+    }
+    sql.push("ORDER BY score LIMIT ?");
+    params.push(limit);
+    try {
+      return this._db.prepare(sql.join("\n")).all(...params) as RankedSearchResult[];
+    } catch {
+      // Deliberate best-effort: a failing query contributes no rows.
+      return [];
+    }
+  }
+  /**
+   * Try to repair each token via Levenshtein lookup against `vocabulary`.
+   * Returns null when nothing was corrected (caller skips fuzzy retry).
+   *
+   * Tokens shorter than 3 characters, tokens found verbatim in the
+   * vocabulary, and tokens with no candidate inside the edit-distance budget
+   * are passed through unchanged.
+   *
+   * NOTE(review): the length window is computed from the JS string length
+   * (UTF-16 code units) but applied with SQL `length(word)`; confirm the two
+   * agree for the scripts this store is expected to hold.
+   *
+   * @param tokens Query tokens as produced by the tokenizer.
+   * @returns A same-length array with corrected tokens, or `null` when no
+   *          token was changed.
+   */
+  #fuzzyCorrectTokens(tokens: string[]): string[] | null {
+    // Prepared once, executed once per token with that token's length window.
+    const candidatesByLen = this._db.prepare(
+      "SELECT word FROM vocabulary WHERE length(word) BETWEEN ? AND ?",
+    );
+    const corrected: string[] = [];
+    let changed = false;
+    for (const token of tokens) {
+      const lower = token.toLowerCase();
+      if (lower.length < 3) {
+        corrected.push(token);
+        continue;
+      }
+      const maxDist = maxEditDistance(lower.length);
+      // A word further than maxDist away in length cannot be within maxDist edits.
+      const candidates = candidatesByLen.all(lower.length - maxDist, lower.length + maxDist) as Array<{ word: string }>;
+      let best: string | null = null;
+      // Starts one above the budget so only candidates within budget can win.
+      let bestDist = maxDist + 1;
+      let exact = false;
+      for (const { word } of candidates) {
+        // The token is already a known word: leave it alone.
+        if (word === lower) { exact = true; break; }
+        const dist = levenshtein(lower, word);
+        // Strict `<`: on a tie the candidate seen first is kept.
+        if (dist < bestDist) {
+          bestDist = dist;
+          best = word;
+        }
+      }
+      if (exact) {
+        corrected.push(token);
+        continue;
+      }
+      if (best && bestDist <= maxDist) {
+        corrected.push(best);
+        changed = true;
+      } else {
+        corrected.push(token);
+      }
+    }
+    return changed ? corrected : null;
+  }
   purge(): number {
     const row = this._db.prepare("SELECT COUNT(*) AS cnt FROM content_chunks").get() as {
       cnt: number;
@@ -270,6 +421,8 @@ export class KnowledgeStore {
     const count = row.cnt;
     this._db.exec("DELETE FROM content_chunks");
     this._db.exec("INSERT INTO content_chunks_fts(content_chunks_fts) VALUES('rebuild')");
+    this._db.exec("INSERT INTO content_chunks_trigram(content_chunks_trigram) VALUES('rebuild')");
+    this._db.exec("DELETE FROM vocabulary");
     this._db.exec("DELETE FROM url_cache");
     return count;
   }
@@ -325,6 +478,7 @@ export class KnowledgeStore {
       "DELETE FROM url_cache WHERE owner_scope = 'session' AND owner_id = ?",
     ).run(ownerId);
     this._db.exec("INSERT INTO content_chunks_fts(content_chunks_fts) VALUES('rebuild')");
+    this._db.exec("INSERT INTO content_chunks_trigram(content_chunks_trigram) VALUES('rebuild')");
     return { chunksDeleted: chunks.cnt, urlCacheDeleted: urls.cnt };
   }
@@ -338,6 +492,8 @@ export class KnowledgeStore {
     this._db.exec("DELETE FROM content_chunks");
     this._db.exec("DELETE FROM url_cache");
     this._db.exec("INSERT INTO content_chunks_fts(content_chunks_fts) VALUES('rebuild')");
+    this._db.exec("INSERT INTO content_chunks_trigram(content_chunks_trigram) VALUES('rebuild')");
+    this._db.exec("DELETE FROM vocabulary");
     return { chunksDeleted: chunks.cnt, urlCacheDeleted: urls.cnt };
   }
@@ -420,12 +576,194 @@ function addColumnIfMissing(db: Database, table: string, column: string, definit
   db.exec(`ALTER TABLE ${table} ADD COLUMN ${column} ${definition}`);
 }
-/** Strip FTS5 special operators to prevent syntax errors. Keep alphanumeric + spaces. */
-function sanitizeFtsQuery(query: string): string {
-  // Remove characters that have special meaning in FTS5: ^, *, ", (, ), {, }, +, -
-  // Keep words separated by spaces for implicit AND matching
+// ── Tokenization ─────────────────────────────────────────────
+/** Common English stopwords and noise terms — kept out of the vocabulary
+ *  table so fuzzy correction does not snap rare typos to "the" or "fix". */
+const STOPWORDS = new Set<string>([
+  "the", "and", "for", "are", "but", "not", "you", "all", "can", "had",
+  "her", "was", "one", "our", "out", "has", "his", "how", "its", "may",
+  "new", "now", "old", "see", "way", "who", "did", "get", "got", "let",
+  "say", "she", "too", "use", "will", "with", "this", "that", "from",
+  "they", "been", "have", "many", "some", "them", "than", "each", "make",
+  "like", "just", "over", "such", "take", "into", "year", "your", "good",
+  "could", "would", "about", "which", "their", "there", "other", "after",
+  "should", "through", "also", "more", "most", "only", "very", "when",
+  "what", "then", "these", "those", "being", "does", "done", "both",
+  "same", "still", "while", "where", "here", "were", "much",
+  "update", "updates", "updated", "deps", "dev", "tests", "test",
+  "add", "added", "fix", "fixed", "run", "running", "using",
+]);
+/** FTS5 operators we strip from queries to avoid syntax errors. */
+const FTS5_OPERATORS = new Set(["AND", "OR", "NOT", "NEAR"]);
+/**
+ * Split a user query into FTS5-safe tokens.
+ *
+ * - Unicode-letters, digits, and underscore are token chars (so snake_case
+ *   stays joined for trigram matching — the porter tokenizer will resplit
+ *   on underscore at index-time, which is what we want).
+ * - Bare FTS5 operators (`AND`, `OR`, `NOT`, `NEAR`) are dropped.
+ * - Returns lowercase tokens with no quoting; caller picks AND/OR shape.
+ */
+function tokenizeQuery(query: string): string[] {
   return query
-    .replace(/[^\p{L}\p{N}\s]/gu, " ")
-    .replace(/\s+/g, " ")
-    .trim();
+    .replace(/[^\p{L}\p{N}_\s]/gu, " ")
+    .split(/\s+/)
+    .filter((w) => w.length > 0 && !FTS5_OPERATORS.has(w.toUpperCase()))
+    .map((w) => w.toLowerCase());
+}
+/**
+ * Render tokens as an FTS5 disjunction: each token is wrapped in double
+ * quotes (embedded double quotes are removed first) and the pieces are
+ * joined with " OR ". Tokens that end up empty are dropped; when no usable
+ * token remains the result is the empty string.
+ */
+function buildOrQuery(tokens: string[]): string {
+  const quoted: string[] = [];
+  for (const token of tokens) {
+    const bare = token.replace(/"/g, "");
+    if (bare.length > 0) quoted.push(`"${bare}"`);
+  }
+  return quoted.join(" OR ");
+}
+/**
+ * Collect the distinct words of `text` that belong in the vocabulary table:
+ * lowercased, at least 3 characters, containing at least one letter or
+ * digit, and not a stopword.
+ *
+ * Hyphens and underscores are kept inside a word ("well-known",
+ * "snake_case"), but leading and trailing hyphen runs are stripped so that
+ * CLI flags ("--verbose") are stored as the word a query token can actually
+ * produce, and pure punctuation runs ("---", "___") are not stored at all.
+ *
+ * @param text Raw text to scan (typically a chunk's title and body).
+ * @returns The set of vocabulary words found in `text`.
+ */
+function extractVocabWords(text: string): Set<string> {
+  const seen = new Set<string>();
+  for (const piece of text.toLowerCase().split(/[^\p{L}\p{N}_-]+/u)) {
+    // Leading/trailing hyphens are markup (flags, rules, list bullets), not part of the word.
+    const word = piece.replace(/^-+|-+$/g, "");
+    if (word.length < 3) continue;
+    // Reject runs made only of `_` / `-`; they can never match a query token.
+    if (!/[\p{L}\p{N}]/u.test(word)) continue;
+    if (STOPWORDS.has(word)) continue;
+    seen.add(word);
+  }
+  return seen;
+}
+// ── Fuzzy correction ─────────────────────────────────────────
+/**
+ * Typo budget for fuzzy matching, scaled by word length:
+ * up to 4 characters → 1 edit, 5–12 characters → 2 edits, longer → 3 edits.
+ */
+function maxEditDistance(wordLength: number): number {
+  return wordLength <= 4 ? 1 : wordLength <= 12 ? 2 : 3;
+}
+/**
+ * Levenshtein edit distance between `a` and `b` (insert, delete and
+ * substitute each cost 1), compared per UTF-16 code unit. Uses two rolling
+ * rows of the dynamic-programming table instead of the full matrix.
+ */
+function levenshtein(a: string, b: string): number {
+  if (a.length === 0) return b.length;
+  if (b.length === 0) return a.length;
+  const width = b.length + 1;
+  // `above` is the finished row for the previous prefix of `a`.
+  let above = new Array<number>(width);
+  let row = new Array<number>(width);
+  for (let j = 0; j < width; j++) above[j] = j;
+  for (let i = 1; i <= a.length; i++) {
+    const unit = a[i - 1];
+    row[0] = i;
+    for (let j = 1; j < width; j++) {
+      if (unit === b[j - 1]) {
+        row[j] = above[j - 1];
+      } else {
+        row[j] = 1 + Math.min(above[j], row[j - 1], above[j - 1]);
+      }
+    }
+    // The row just filled becomes the "previous" row; the old one is reused.
+    [above, row] = [row, above];
+  }
+  return above[b.length];
+}
+// ── Reciprocal Rank Fusion (Cormack et al. 2009) ────────────
+/**
+ * Fuse two BM25-ranked result lists into one ranking with Reciprocal Rank
+ * Fusion (K = 60). A row at 0-based index `i` of a list contributes
+ * 1 / (K + i + 1) to the total of its chunk id, so a chunk present in both
+ * lists accumulates both contributions.
+ *
+ * The `limit` highest totals survive. Each returned `score` is the NEGATED
+ * total: a stronger match has a more negative `score`, so callers that sort
+ * ascending by `score` still get best-first order.
+ *
+ * @param porter  Rows from the porter index, best first.
+ * @param trigram Rows from the trigram index, best first.
+ * @param limit   Maximum number of fused rows to return.
+ * @param layer   Value written to `matchLayer` on every returned row.
+ * @returns Fused rows, best first, without the internal `chunkId` field.
+ */
+function rrfFuse(
+  porter: RankedSearchResult[],
+  trigram: RankedSearchResult[],
+  limit: number,
+  layer: SearchMatchLayer,
+): SearchResult[] {
+  const K = 60;
+  const fused = new Map<number, { result: RankedSearchResult; score: number }>();
+  // Both lists are folded in the same way. Porter goes first so that a chunk
+  // found by both indexes keeps its porter row as the representative.
+  for (const ranked of [porter, trigram]) {
+    ranked.forEach((row, index) => {
+      const contribution = 1 / (K + index + 1);
+      const entry = fused.get(row.chunkId);
+      if (entry) entry.score += contribution;
+      else fused.set(row.chunkId, { result: row, score: contribution });
+    });
+  }
+  return Array.from(fused.values())
+    .sort((a, b) => b.score - a.score)
+    .slice(0, limit)
+    .map(({ result, score }) => {
+      // `chunkId` is an internal fusion key and is not part of SearchResult.
+      const { chunkId: _chunkId, ...publicResult } = result;
+      return { ...publicResult, score: -score, matchLayer: layer };
+    });
+}
+// ── Proximity reranking ─────────────────────────────────────
+/**
+ * Collect every index at which `term` occurs in `text`, in ascending order.
+ * Occurrences may overlap (the search resumes one character after each hit).
+ * An empty `term` yields no positions.
+ */
+function findAllPositions(text: string, term: string): number[] {
+  const hits: number[] = [];
+  if (term.length === 0) return hits;
+  for (let at = text.indexOf(term); at !== -1; at = text.indexOf(term, at + 1)) {
+    hits.push(at);
+  }
+  return hits;
+}
+/**
+ * Find the minimum span (window size in chars) covering one position from
+ * each list. Sweep-line: advance the pointer at the current minimum.
+ *
+ * @param positionLists One list of positions per term; lists need not be sorted.
+ * @returns The smallest `max - min` over all ways of picking one position
+ *          per list; `0` for a single non-empty list; `Infinity` when there
+ *          are no lists or when any list is empty (no window can cover a
+ *          term that never occurs).
+ */
+function findMinSpan(positionLists: number[][]): number {
+  if (positionLists.length === 0) return Infinity;
+  // An empty list would otherwise be read as `undefined` and silently
+  // ignored by the comparisons below, producing a span that does not
+  // actually cover every term.
+  if (positionLists.some((list) => list.length === 0)) return Infinity;
+  if (positionLists.length === 1) return 0;
+  const sorted = positionLists.map((p) => [...p].sort((a, b) => a - b));
+  const ptrs = new Array<number>(sorted.length).fill(0);
+  let minSpan = Infinity;
+  while (true) {
+    let curMin = Infinity;
+    let curMax = -Infinity;
+    let minIdx = 0;
+    for (let i = 0; i < sorted.length; i++) {
+      const val = sorted[i][ptrs[i]];
+      if (val < curMin) { curMin = val; minIdx = i; }
+      if (val > curMax) curMax = val;
+    }
+    const span = curMax - curMin;
+    if (span < minSpan) minSpan = span;
+    // Only moving the smallest element forward can shrink the window.
+    ptrs[minIdx]++;
+    // Once the list holding the minimum is exhausted no better window exists.
+    if (ptrs[minIdx] >= sorted[minIdx].length) break;
+  }
+  return minSpan;
+}
+/**
+ * Rerank fused results for multi-term queries so rows whose terms occur
+ * close together in the body come first. Terms shorter than 2 characters
+ * are ignored; with fewer than two usable terms the input array is returned
+ * as-is. A row missing any term gets boost 0; otherwise the boost is
+ * 1 / (1 + minSpan / bodyLength). Ties on boost fall back to ascending `score`.
+ */
+function applyProximityReranking(results: SearchResult[], tokens: string[]): SearchResult[] {
+  const terms = tokens.filter((t) => t.length >= 2);
+  if (terms.length < 2) return results;
+  const scored = results.map((result) => {
+    const haystack = result.body.toLowerCase();
+    const positions = terms.map((term) => findAllPositions(haystack, term));
+    const allPresent = positions.every((list) => list.length > 0);
+    const boost = allPresent
+      ? 1 / (1 + findMinSpan(positions) / Math.max(haystack.length, 1))
+      : 0;
+    return { result, boost };
+  });
+  scored.sort((a, b) => b.boost - a.boost || a.result.score - b.result.score);
+  return scored.map((entry) => entry.result);
 }

package/src/context-mode/tools.ts CHANGED Viewed

@@ -303,12 +303,30 @@ const AUTO_INDEX_MAX_FILE_BYTES = 256 * 1024;
 const AUTO_INDEX_MAX_DEPTH = 8;
 const AUTO_INDEX_MIN_TERM_LEN = 3;
-/** Sessions for which we have already attempted bootstrap. Prevents repeat scans. */
+/**
+ * Sessions for which bootstrap should NOT run again. A `sessionKey` lands
+ * here when bootstrap was either successful (chunks indexed) or definitively
+ * barren (no scannable files in the cwd at all) — neither warrants a retry.
+ */
 const _autoIndexAttempted = new Set<string>();
+/**
+ * Per-session memoization of failed bootstrap scans, keyed by the query-term
+ * fingerprint. A scan that walked files but produced zero indexed chunks is
+ * not retried for the same fingerprint, but a different fingerprint (i.e. a
+ * reformulated query) is allowed through.
+ */
+const _autoIndexNoMatchByQuery = new Map<string, Set<string>>();
 /** Reset auto-index attempt tracking. Test-only. */
 export function _resetAutoIndexAttempts(): void {
   _autoIndexAttempted.clear();
+  // Also forget every per-session set of query fingerprints that scanned
+  // files but indexed nothing, so a later identical query may scan again.
+  _autoIndexNoMatchByQuery.clear();
+}
+/**
+ * Build the fingerprint that gates retries of no-match bootstrap scans: the
+ * index terms extracted from `queries`, sorted and joined with "|", so the
+ * order in which terms appear does not change the fingerprint.
+ */
+function autoIndexQueryFingerprint(queries: string[]): string {
+  // Copy before sorting so the array returned by extractIndexTerms is not mutated.
+  const terms = [...extractIndexTerms(queries)];
+  terms.sort();
+  return terms.join("|");
 }
 /** Drop bootstrap-attempted entries that belong to a closed session. */
@@ -318,6 +336,9 @@ export function _forgetAutoIndexSession(ownerId: string): void {
   for (const key of _autoIndexAttempted) {
     if (key.startsWith(prefix)) _autoIndexAttempted.delete(key);
   }
+  for (const key of [..._autoIndexNoMatchByQuery.keys()]) {
+    if (key.startsWith(prefix)) _autoIndexNoMatchByQuery.delete(key);
+  }
 }
 function extractIndexTerms(queries: string[]): string[] {
@@ -736,15 +757,17 @@ export function registerContextModeTools(
       const allEmpty = results.every((g) => g.results.length === 0);
       const sessionKey = `${owner.ownerId}|${source ?? ""}`;
+      const queryFingerprint = autoIndexQueryFingerprint(queries);
+      const failedFingerprints = _autoIndexNoMatchByQuery.get(sessionKey);
       const canBootstrap =
         allEmpty &&
         Array.isArray(queries) &&
         queries.length > 0 &&
         !source &&
-        !_autoIndexAttempted.has(sessionKey);
+        !_autoIndexAttempted.has(sessionKey) &&
+        !(failedFingerprints?.has(queryFingerprint) ?? false);
       if (canBootstrap) {
-        _autoIndexAttempted.add(sessionKey);
         const stats = store.getStats();
         if (stats.totalChunks === 0) {
           const cwd = typeof ctx?.cwd === "string" && ctx.cwd.length > 0 ? ctx.cwd : process.cwd();
@@ -755,15 +778,30 @@ export function registerContextModeTools(
             bootstrap = { chunksIndexed: 0, filesIndexed: 0, filesScanned: 0 };
           }
           if (bootstrap.chunksIndexed > 0) {
+            _autoIndexAttempted.add(sessionKey);
             results = store.search(queries, { source, contentType, limit, owner });
             bootstrapNote =
               `[auto-indexed ${bootstrap.filesIndexed} files (${bootstrap.chunksIndexed} chunks) ` +
               `from ${bootstrap.filesScanned} scanned to bootstrap the empty knowledge store]\n\n`;
           } else if (bootstrap.filesScanned > 0) {
+            // Scan ran but nothing matched this query fingerprint. Memoize by
+            // fingerprint so a reformulated query still gets a fresh scan.
+            let set = _autoIndexNoMatchByQuery.get(sessionKey);
+            if (!set) {
+              set = new Set<string>();
+              _autoIndexNoMatchByQuery.set(sessionKey, set);
+            }
+            set.add(queryFingerprint);
             bootstrapNote =
               `[scanned ${bootstrap.filesScanned} files but none matched the query terms; ` +
               `use ctx_batch_execute or ctx_index to index relevant content explicitly]\n\n`;
+          } else {
+            // No scannable files at all — cwd is barren. Don't retry, period.
+            _autoIndexAttempted.add(sessionKey);
           }
+        } else {
+          // Store had chunks but the query still missed; record nothing here —
+          // the search-side fallback already exhausted its options.
         }
       }

package/src/deps/registry.ts CHANGED Viewed

@@ -10,7 +10,7 @@ export interface Dependency {
   name: string;
   binary: string;
   required: boolean;
-  category: "core" | "mcp" | "lsp" | "testing";
+  category: "core" | "lsp" | "testing";
   description: string;
   checkFn: (exec: ExecFn) => Promise<{ installed: boolean; version?: string }>;
   installCmd: string | null;
@@ -83,16 +83,6 @@ export const DEPENDENCIES: Dependency[] = [
     installCmd: null,
     url: "https://bun.sh",
   },
-  {
-    name: "mcpc",
-    binary: "mcpc",
-    required: false,
-    category: "mcp",
-    description: "MCP client CLI for server management",
-    checkFn: (exec) => checkBinary(exec, "mcpc"),
-    installCmd: "npm install -g @apify/mcpc",
-    url: "https://github.com/apify/mcpc",
-  },
   {
     name: "TypeScript LSP",
     binary: "typescript-language-server",
@@ -244,7 +234,6 @@ export function formatReport(
   // Object.keys preserves insertion order for string keys in all major engines (V8/JSC/SM).
   const categoryLabels: Record<Dependency["category"], string> = {
     core: "Core",
-    mcp: "MCP",
     lsp: "Language Servers",
     testing: "Testing",
   };

package/src/fix-pr/assessment.ts CHANGED Viewed

@@ -55,6 +55,7 @@ function buildAssessmentPrompt(args: BuildAssessmentPromptArgs): string {
     "",
     "Rules:",
     "- Read the referenced code before assigning a verdict.",
+    `- If a comment's diffHunk lacks enough context, read \`pr://${args.repo}/${args.prNumber}/diff/all\`; the changed-file list is \`pr://${args.repo}/${args.prNumber}/diff\`. Use these only for verdict assessment and do not edit during assessment.`,
     "- Do not perform any code edits. This is a pure assessment pass.",
     "- One assessment per comment. `commentId` ties back to the PR comment id.",
     "",

package/src/fix-pr/prompt-builder.ts CHANGED Viewed

@@ -84,6 +84,7 @@ export function buildFixPrOrchestratorPrompt(options: FixPrPromptOptions): strin
     `- Session dir: \`${sessionDir}\``,
     `- Iteration: ${iteration} of ${maxIter}`,
     `- Selected target: ${selectedTargetLabel}`,
+    `- Full PR diff: \`pr://${repo}/${prNumber}/diff/all\`; changed-file list: \`pr://${repo}/${prNumber}/diff\``,
     `- Comment reply policy: ${config.commentPolicy}`,
     `- Reviewer: ${reviewer.type}${reviewer.triggerMethod ? ` (trigger: ${reviewer.triggerMethod})` : ""}`,
     deferredCommentsSummary