@loreai/core 0.16.0 → 0.17.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (155)
  1. package/README.md +11 -0
  2. package/dist/bun/agents-file.d.ts +13 -1
  3. package/dist/bun/agents-file.d.ts.map +1 -1
  4. package/dist/bun/config.d.ts +20 -1
  5. package/dist/bun/config.d.ts.map +1 -1
  6. package/dist/bun/data.d.ts +174 -0
  7. package/dist/bun/data.d.ts.map +1 -0
  8. package/dist/bun/db.d.ts +65 -0
  9. package/dist/bun/db.d.ts.map +1 -1
  10. package/dist/bun/distillation.d.ts +49 -6
  11. package/dist/bun/distillation.d.ts.map +1 -1
  12. package/dist/bun/embedding-vendor.d.ts +66 -0
  13. package/dist/bun/embedding-vendor.d.ts.map +1 -0
  14. package/dist/bun/embedding-worker-types.d.ts +66 -0
  15. package/dist/bun/embedding-worker-types.d.ts.map +1 -0
  16. package/dist/bun/embedding-worker.d.ts +16 -0
  17. package/dist/bun/embedding-worker.d.ts.map +1 -0
  18. package/dist/bun/embedding-worker.js +100 -0
  19. package/dist/bun/embedding-worker.js.map +7 -0
  20. package/dist/bun/embedding.d.ts +91 -8
  21. package/dist/bun/embedding.d.ts.map +1 -1
  22. package/dist/bun/git.d.ts +47 -0
  23. package/dist/bun/git.d.ts.map +1 -0
  24. package/dist/bun/gradient.d.ts +19 -1
  25. package/dist/bun/gradient.d.ts.map +1 -1
  26. package/dist/bun/index.d.ts +9 -6
  27. package/dist/bun/index.d.ts.map +1 -1
  28. package/dist/bun/index.js +13029 -10885
  29. package/dist/bun/index.js.map +4 -4
  30. package/dist/bun/lat-reader.d.ts +1 -1
  31. package/dist/bun/lat-reader.d.ts.map +1 -1
  32. package/dist/bun/ltm.d.ts.map +1 -1
  33. package/dist/bun/markdown.d.ts +11 -0
  34. package/dist/bun/markdown.d.ts.map +1 -1
  35. package/dist/bun/prompt.d.ts +1 -1
  36. package/dist/bun/prompt.d.ts.map +1 -1
  37. package/dist/bun/recall.d.ts +53 -0
  38. package/dist/bun/recall.d.ts.map +1 -1
  39. package/dist/bun/search.d.ts +29 -0
  40. package/dist/bun/search.d.ts.map +1 -1
  41. package/dist/bun/temporal.d.ts +2 -0
  42. package/dist/bun/temporal.d.ts.map +1 -1
  43. package/dist/bun/types.d.ts +15 -0
  44. package/dist/bun/types.d.ts.map +1 -1
  45. package/dist/bun/worker-model.d.ts +12 -9
  46. package/dist/bun/worker-model.d.ts.map +1 -1
  47. package/dist/node/agents-file.d.ts +13 -1
  48. package/dist/node/agents-file.d.ts.map +1 -1
  49. package/dist/node/config.d.ts +20 -1
  50. package/dist/node/config.d.ts.map +1 -1
  51. package/dist/node/data.d.ts +174 -0
  52. package/dist/node/data.d.ts.map +1 -0
  53. package/dist/node/db.d.ts +65 -0
  54. package/dist/node/db.d.ts.map +1 -1
  55. package/dist/node/distillation.d.ts +49 -6
  56. package/dist/node/distillation.d.ts.map +1 -1
  57. package/dist/node/embedding-vendor.d.ts +66 -0
  58. package/dist/node/embedding-vendor.d.ts.map +1 -0
  59. package/dist/node/embedding-worker-types.d.ts +66 -0
  60. package/dist/node/embedding-worker-types.d.ts.map +1 -0
  61. package/dist/node/embedding-worker.d.ts +16 -0
  62. package/dist/node/embedding-worker.d.ts.map +1 -0
  63. package/dist/node/embedding-worker.js +100 -0
  64. package/dist/node/embedding-worker.js.map +7 -0
  65. package/dist/node/embedding.d.ts +91 -8
  66. package/dist/node/embedding.d.ts.map +1 -1
  67. package/dist/node/git.d.ts +47 -0
  68. package/dist/node/git.d.ts.map +1 -0
  69. package/dist/node/gradient.d.ts +19 -1
  70. package/dist/node/gradient.d.ts.map +1 -1
  71. package/dist/node/index.d.ts +9 -6
  72. package/dist/node/index.d.ts.map +1 -1
  73. package/dist/node/index.js +13029 -10885
  74. package/dist/node/index.js.map +4 -4
  75. package/dist/node/lat-reader.d.ts +1 -1
  76. package/dist/node/lat-reader.d.ts.map +1 -1
  77. package/dist/node/ltm.d.ts.map +1 -1
  78. package/dist/node/markdown.d.ts +11 -0
  79. package/dist/node/markdown.d.ts.map +1 -1
  80. package/dist/node/prompt.d.ts +1 -1
  81. package/dist/node/prompt.d.ts.map +1 -1
  82. package/dist/node/recall.d.ts +53 -0
  83. package/dist/node/recall.d.ts.map +1 -1
  84. package/dist/node/search.d.ts +29 -0
  85. package/dist/node/search.d.ts.map +1 -1
  86. package/dist/node/temporal.d.ts +2 -0
  87. package/dist/node/temporal.d.ts.map +1 -1
  88. package/dist/node/types.d.ts +15 -0
  89. package/dist/node/types.d.ts.map +1 -1
  90. package/dist/node/worker-model.d.ts +12 -9
  91. package/dist/node/worker-model.d.ts.map +1 -1
  92. package/dist/types/agents-file.d.ts +13 -1
  93. package/dist/types/agents-file.d.ts.map +1 -1
  94. package/dist/types/config.d.ts +20 -1
  95. package/dist/types/config.d.ts.map +1 -1
  96. package/dist/types/data.d.ts +174 -0
  97. package/dist/types/data.d.ts.map +1 -0
  98. package/dist/types/db.d.ts +65 -0
  99. package/dist/types/db.d.ts.map +1 -1
  100. package/dist/types/distillation.d.ts +49 -6
  101. package/dist/types/distillation.d.ts.map +1 -1
  102. package/dist/types/embedding-vendor.d.ts +66 -0
  103. package/dist/types/embedding-vendor.d.ts.map +1 -0
  104. package/dist/types/embedding-worker-types.d.ts +66 -0
  105. package/dist/types/embedding-worker-types.d.ts.map +1 -0
  106. package/dist/types/embedding-worker.d.ts +16 -0
  107. package/dist/types/embedding-worker.d.ts.map +1 -0
  108. package/dist/types/embedding.d.ts +91 -8
  109. package/dist/types/embedding.d.ts.map +1 -1
  110. package/dist/types/git.d.ts +47 -0
  111. package/dist/types/git.d.ts.map +1 -0
  112. package/dist/types/gradient.d.ts +19 -1
  113. package/dist/types/gradient.d.ts.map +1 -1
  114. package/dist/types/index.d.ts +9 -6
  115. package/dist/types/index.d.ts.map +1 -1
  116. package/dist/types/lat-reader.d.ts +1 -1
  117. package/dist/types/lat-reader.d.ts.map +1 -1
  118. package/dist/types/ltm.d.ts.map +1 -1
  119. package/dist/types/markdown.d.ts +11 -0
  120. package/dist/types/markdown.d.ts.map +1 -1
  121. package/dist/types/prompt.d.ts +1 -1
  122. package/dist/types/prompt.d.ts.map +1 -1
  123. package/dist/types/recall.d.ts +53 -0
  124. package/dist/types/recall.d.ts.map +1 -1
  125. package/dist/types/search.d.ts +29 -0
  126. package/dist/types/search.d.ts.map +1 -1
  127. package/dist/types/temporal.d.ts +2 -0
  128. package/dist/types/temporal.d.ts.map +1 -1
  129. package/dist/types/types.d.ts +15 -0
  130. package/dist/types/types.d.ts.map +1 -1
  131. package/dist/types/worker-model.d.ts +12 -9
  132. package/dist/types/worker-model.d.ts.map +1 -1
  133. package/package.json +5 -2
  134. package/src/agents-file.ts +87 -4
  135. package/src/config.ts +68 -5
  136. package/src/curator.ts +2 -2
  137. package/src/data.ts +768 -0
  138. package/src/db.ts +386 -7
  139. package/src/distillation.ts +178 -35
  140. package/src/embedding-vendor.ts +102 -0
  141. package/src/embedding-worker-types.ts +82 -0
  142. package/src/embedding-worker.ts +185 -0
  143. package/src/embedding.ts +607 -61
  144. package/src/git.ts +144 -0
  145. package/src/gradient.ts +174 -17
  146. package/src/index.ts +20 -0
  147. package/src/lat-reader.ts +5 -11
  148. package/src/ltm.ts +17 -44
  149. package/src/markdown.ts +15 -0
  150. package/src/prompt.ts +1 -2
  151. package/src/recall.ts +401 -70
  152. package/src/search.ts +71 -1
  153. package/src/temporal.ts +42 -35
  154. package/src/types.ts +15 -0
  155. package/src/worker-model.ts +14 -9
package/src/recall.ts CHANGED
@@ -23,10 +23,10 @@ import {
23
23
  expandQuery,
24
24
  filterTerms,
25
25
  ftsQuery,
26
- ftsQueryOr,
27
26
  reciprocalRankFusion,
27
+ runRelaxedSearch,
28
28
  } from "./search";
29
- import { h, inline, lip, liph, p, root, serialize, t, ul } from "./markdown";
29
+ import { inline } from "./markdown";
30
30
 
31
31
  // ---------------------------------------------------------------------------
32
32
  // Types
@@ -49,6 +49,8 @@ export type RecallInput = {
49
49
  query: string;
50
50
  /** Narrow the search surface. Defaults to `"all"`. */
51
51
  scope?: RecallScope;
52
+ /** Fetch full content of a specific result by its source-prefixed ID (e.g. "k:xxx", "d:xxx"). */
53
+ id?: string;
52
54
  /** Project root — used by all scoring paths. */
53
55
  projectPath: string;
54
56
  /** Current session ID — required when `scope === "session"`. */
@@ -64,7 +66,7 @@ export type RecallInput = {
64
66
  /** Result of a full recall run — markdown-formatted string for the LLM. */
65
67
  export type RecallResult = string;
66
68
 
67
- type TaggedResult =
69
+ export type TaggedResult =
68
70
  | { source: "knowledge"; item: ltm.ScoredKnowledgeEntry }
69
71
  | {
70
72
  source: "cross-knowledge";
@@ -75,6 +77,8 @@ type TaggedResult =
75
77
  | { source: "temporal"; item: temporal.ScoredTemporalMessage }
76
78
  | { source: "lat-section"; item: latReader.ScoredLatSection };
77
79
 
80
+ export type ScoredTaggedResult = { item: TaggedResult; score: number };
81
+
78
82
  // ---------------------------------------------------------------------------
79
83
  // Tagged result helpers (used by exact-match boost + formatting)
80
84
  // ---------------------------------------------------------------------------
@@ -149,8 +153,6 @@ function searchDistillationsScored(input: {
149
153
  }): ScoredDistillation[] {
150
154
  const pid = ensureProject(input.projectPath);
151
155
  const limit = input.limit ?? 10;
152
- const q = ftsQuery(input.query);
153
- if (q === EMPTY_QUERY) return [];
154
156
 
155
157
  const ftsSQL = input.sessionID
156
158
  ? `SELECT d.id, d.observations, d.generation, d.created_at, d.session_id, d.c_norm, rank
@@ -165,21 +167,14 @@ function searchDistillationsScored(input: {
165
167
  WHERE distillation_fts MATCH ?
166
168
  AND d.project_id = ?
167
169
  ORDER BY rank LIMIT ?`;
168
- const params = input.sessionID
169
- ? [q, pid, input.sessionID, limit]
170
- : [q, pid, limit];
171
170
 
172
171
  try {
173
- const results = db().query(ftsSQL).all(...params) as ScoredDistillation[];
174
- if (results.length) return results;
175
-
176
- // AND returned nothing — try OR fallback
177
- const qOr = ftsQueryOr(input.query);
178
- if (qOr === EMPTY_QUERY) return [];
179
- const paramsOr = input.sessionID
180
- ? [qOr, pid, input.sessionID, limit]
181
- : [qOr, pid, limit];
182
- return db().query(ftsSQL).all(...paramsOr) as ScoredDistillation[];
172
+ return runRelaxedSearch(input.query, (matchExpr) => {
173
+ const params = input.sessionID
174
+ ? [matchExpr, pid, input.sessionID, limit]
175
+ : [matchExpr, pid, limit];
176
+ return db().query(ftsSQL).all(...params) as ScoredDistillation[];
177
+ });
183
178
  } catch {
184
179
  // FTS5 failed — fall back to LIKE search with synthetic rank
185
180
  return searchDistillationsLike({
@@ -195,69 +190,264 @@ function searchDistillationsScored(input: {
195
190
  // Result formatting
196
191
  // ---------------------------------------------------------------------------
197
192
 
193
+ /** Default formatting config used when no overrides are provided. */
194
+ const DEFAULT_FORMAT_CONFIG = {
195
+ charBudget: 8000,
196
+ relevanceFloor: 0.15,
197
+ maxResults: 15,
198
+ };
199
+
200
+ type FormatConfig = typeof DEFAULT_FORMAT_CONFIG;
201
+
202
+ /**
203
+ * Truncate text at a sentence boundary within maxChars.
204
+ *
205
+ * Walks backwards from the budget limit looking for sentence-ending
206
+ * punctuation (. ! ?) followed by whitespace or end-of-string.
207
+ * Only searches the back half of the budget to avoid cutting too short.
208
+ * Falls back to word boundary if no sentence end is found.
209
+ */
210
+ function truncateAtSentence(text: string, maxChars: number): string {
211
+ if (text.length <= maxChars) return text;
212
+
213
+ // Search backwards from maxChars for a sentence boundary
214
+ const minPos = Math.floor(maxChars * 0.5);
215
+ for (let i = maxChars - 1; i >= minPos; i--) {
216
+ if (
217
+ (text[i] === "." || text[i] === "!" || text[i] === "?") &&
218
+ (i + 1 >= text.length || /\s/.test(text[i + 1]))
219
+ ) {
220
+ return text.slice(0, i + 1);
221
+ }
222
+ }
223
+
224
+ // No sentence boundary — fall back to word boundary
225
+ const slice = text.slice(0, maxChars);
226
+ const lastSpace = slice.lastIndexOf(" ");
227
+ if (lastSpace > minPos) return text.slice(0, lastSpace) + "...";
228
+ return slice + "...";
229
+ }
230
+
231
+ /** Source-type weights for budget allocation. Higher = more space. */
232
+ const SOURCE_WEIGHT: Record<TaggedResult["source"], number> = {
233
+ knowledge: 1.0,
234
+ "cross-knowledge": 1.0,
235
+ "lat-section": 0.9,
236
+ distillation: 0.8,
237
+ temporal: 0.5,
238
+ };
239
+
240
+ /** Tier multipliers for budget allocation. */
241
+ const TIER_MULTIPLIERS = [3.0, 1.5, 0.7] as const;
242
+
243
+ /** Human-readable tier labels. */
244
+ const TIER_NAMES = ["Strong Matches", "Supporting", "Peripheral"] as const;
245
+
246
+ /** Source display order within a tier. */
247
+ const SOURCE_ORDER: Record<TaggedResult["source"], number> = {
248
+ knowledge: 0,
249
+ "cross-knowledge": 1,
250
+ "lat-section": 2,
251
+ distillation: 3,
252
+ temporal: 4,
253
+ };
254
+
255
+ /** Human-readable source group labels for sub-headers. */
256
+ const SOURCE_LABELS: Record<TaggedResult["source"], string> = {
257
+ knowledge: "Knowledge",
258
+ "cross-knowledge": "Cross-Project",
259
+ "lat-section": "Reference",
260
+ distillation: "Distilled",
261
+ temporal: "Conversation",
262
+ };
263
+
264
+ /** Format a relative age string from a timestamp. */
265
+ function relativeAge(createdAt: number): string {
266
+ const diffMs = Date.now() - createdAt;
267
+ const mins = Math.floor(diffMs / 60_000);
268
+ if (mins < 60) return `${mins}m ago`;
269
+ const hours = Math.floor(mins / 60);
270
+ if (hours < 24) return `${hours}h ago`;
271
+ const days = Math.floor(hours / 24);
272
+ return `${days}d ago`;
273
+ }
274
+
275
+ type TieredResult = ScoredTaggedResult & {
276
+ tier: 0 | 1 | 2;
277
+ charBudget: number;
278
+ };
279
+
198
280
  function formatFusedResults(
199
- results: Array<{ item: TaggedResult; score: number }>,
200
- maxResults: number,
281
+ results: ScoredTaggedResult[],
282
+ config: FormatConfig,
201
283
  ): string {
202
284
  if (!results.length) return "No results found for this query.";
203
285
 
204
- const items = results.slice(0, maxResults).map(({ item: tagged }) => {
205
- switch (tagged.source) {
206
- case "knowledge": {
207
- const k = tagged.item;
208
- return liph(
209
- t(
210
- `**[knowledge/${k.category}]** ${inline(k.title)}: ${inline(k.content)}`,
211
- ),
212
- );
213
- }
214
- case "cross-knowledge": {
215
- const k = tagged.item;
216
- return liph(
217
- t(
218
- `**[knowledge/${k.category} from: ${tagged.projectLabel}]** ${inline(k.title)}: ${inline(k.content)}`,
219
- ),
220
- );
221
- }
222
- case "distillation": {
223
- const d = tagged.item;
224
- const preview =
225
- d.observations.length > 500
226
- ? d.observations.slice(0, 500) + "..."
227
- : d.observations;
228
- return lip(`**[distilled]** ${inline(preview)}`);
229
- }
230
- case "temporal": {
231
- const m = tagged.item;
232
- const preview =
233
- m.content.length > 500 ? m.content.slice(0, 500) + "..." : m.content;
234
- return lip(
235
- `**[temporal/${m.role}]** (session: ${m.session_id.slice(0, 8)}...) ${inline(preview)}`,
236
- );
237
- }
238
- case "lat-section": {
239
- const s = tagged.item;
240
- const preview = s.first_paragraph
241
- ? inline(s.first_paragraph)
242
- : inline(
243
- s.content.length > 300 ? s.content.slice(0, 300) + "..." : s.content,
244
- );
245
- return liph(
246
- t(`**[lat.md/${s.file}]** ${inline(s.heading)}: ${preview}`),
247
- );
286
+ const totalFound = results.length;
287
+ const topScore = results[0].score;
288
+ const scoreFloor = topScore * config.relevanceFloor;
289
+
290
+ // Step 1: Score-based cutoff + hard cap. Always keep at least 3.
291
+ let kept = results.filter((r) => r.score >= scoreFloor);
292
+ kept = kept.slice(0, config.maxResults);
293
+ if (kept.length < 3) kept = results.slice(0, Math.min(3, results.length));
294
+
295
+ // Step 2: Assign tiers based on relative score.
296
+ const tiered: TieredResult[] = kept.map((r) => ({
297
+ ...r,
298
+ tier:
299
+ r.score >= topScore * 0.6 ? 0 : r.score >= topScore * 0.3 ? 1 : 2,
300
+ charBudget: 0, // computed next
301
+ }));
302
+
303
+ // Step 3: Compute per-result char budgets proportional to weight.
304
+ const rawWeights = tiered.map(
305
+ (r) => SOURCE_WEIGHT[r.item.source] * TIER_MULTIPLIERS[r.tier],
306
+ );
307
+ const totalWeight = rawWeights.reduce((a, b) => a + b, 0);
308
+ for (let i = 0; i < tiered.length; i++) {
309
+ tiered[i].charBudget = Math.max(
310
+ 80,
311
+ Math.min(
312
+ 1200,
313
+ Math.floor((config.charBudget * rawWeights[i]) / totalWeight),
314
+ ),
315
+ );
316
+ }
317
+
318
+ // Step 4+5: Build markdown output grouped by tier, then by source.
319
+ const lowScore = kept[kept.length - 1].score;
320
+ const lines: string[] = [];
321
+
322
+ lines.push(`## Recall Results`);
323
+ lines.push(``);
324
+ lines.push(
325
+ `Found ${totalFound} results, showing top ${kept.length} (score range: ${topScore.toFixed(3)}–${lowScore.toFixed(3)}).`,
326
+ );
327
+
328
+ for (const tierIdx of [0, 1, 2] as const) {
329
+ const tierResults = tiered.filter((r) => r.tier === tierIdx);
330
+ if (!tierResults.length) continue;
331
+
332
+ // Sort by source order within tier
333
+ tierResults.sort(
334
+ (a, b) => SOURCE_ORDER[a.item.source] - SOURCE_ORDER[b.item.source],
335
+ );
336
+
337
+ lines.push(``);
338
+ lines.push(`### ${TIER_NAMES[tierIdx]}`);
339
+
340
+ // Group by source type for sub-headers
341
+ let currentSource: TaggedResult["source"] | null = null;
342
+
343
+ for (const r of tierResults) {
344
+ if (r.item.source !== currentSource) {
345
+ currentSource = r.item.source;
346
+ lines.push(``);
347
+ lines.push(`#### ${SOURCE_LABELS[currentSource]}`);
248
348
  }
349
+
350
+ const line = renderResultLine(r.item, r.charBudget);
351
+ lines.push(line);
249
352
  }
250
- });
353
+ }
354
+
355
+ // Footer
356
+ const anyTruncated = tiered.some(
357
+ (r) => getFullContentLength(r.item) > r.charBudget,
358
+ );
359
+ lines.push(``);
360
+ lines.push(`---`);
361
+ if (anyTruncated) {
362
+ lines.push(
363
+ `*${kept.length} of ${totalFound} results shown. Use recall with id parameter to see full content of truncated results.*`,
364
+ );
365
+ } else {
366
+ lines.push(`*${kept.length} of ${totalFound} results shown.*`);
367
+ }
251
368
 
252
- return serialize(root(h(2, "Recall Results"), ul(items)));
369
+ return lines.join("\n");
370
+ }
371
+
372
+ /** Get the full content length of a tagged result (before truncation). */
373
+ function getFullContentLength(tagged: TaggedResult): number {
374
+ switch (tagged.source) {
375
+ case "knowledge":
376
+ case "cross-knowledge":
377
+ return tagged.item.title.length + tagged.item.content.length + 4; // **: :
378
+ case "distillation":
379
+ return tagged.item.observations.length;
380
+ case "temporal":
381
+ return tagged.item.content.length;
382
+ case "lat-section":
383
+ return tagged.item.heading.length + tagged.item.content.length;
384
+ }
385
+ }
386
+
387
+ /** Render a single result as a markdown list item line. */
388
+ function renderResultLine(tagged: TaggedResult, charBudget: number): string {
389
+ const id = taggedResultKey(tagged);
390
+
391
+ switch (tagged.source) {
392
+ case "knowledge": {
393
+ const k = tagged.item;
394
+ const titlePart = `**${inline(k.title)}**: `;
395
+ const contentBudget = Math.max(40, charBudget - titlePart.length);
396
+ const content = truncateAtSentence(inline(k.content), contentBudget);
397
+ const wasTruncated = inline(k.content).length > contentBudget;
398
+ return `- ${titlePart}${content}${wasTruncated ? ` (${id})` : ""}`;
399
+ }
400
+ case "cross-knowledge": {
401
+ const k = tagged.item;
402
+ const titlePart = `**${inline(k.title)}** (from: ${tagged.projectLabel}): `;
403
+ const contentBudget = Math.max(40, charBudget - titlePart.length);
404
+ const content = truncateAtSentence(inline(k.content), contentBudget);
405
+ const wasTruncated = inline(k.content).length > contentBudget;
406
+ return `- ${titlePart}${content}${wasTruncated ? ` (${id})` : ""}`;
407
+ }
408
+ case "distillation": {
409
+ const d = tagged.item;
410
+ const fullText = inline(d.observations);
411
+ const content = truncateAtSentence(fullText, charBudget);
412
+ const wasTruncated = fullText.length > charBudget;
413
+ return `- ${content}${wasTruncated ? ` (${id})` : ""}`;
414
+ }
415
+ case "temporal": {
416
+ const m = tagged.item;
417
+ const prefix = `(${m.role}, ${relativeAge(m.created_at)}) `;
418
+ const contentBudget = Math.max(40, charBudget - prefix.length);
419
+ const fullText = inline(m.content);
420
+ const content = truncateAtSentence(fullText, contentBudget);
421
+ const wasTruncated = fullText.length > contentBudget;
422
+ return `- ${prefix}${content}${wasTruncated ? ` (${id})` : ""}`;
423
+ }
424
+ case "lat-section": {
425
+ const s = tagged.item;
426
+ const heading = `**${inline(s.file)} \u00A7 ${inline(s.heading)}**: `;
427
+ const contentBudget = Math.max(40, charBudget - heading.length);
428
+ const fullText = s.first_paragraph
429
+ ? inline(s.first_paragraph)
430
+ : inline(s.content);
431
+ const content = truncateAtSentence(fullText, contentBudget);
432
+ const wasTruncated = fullText.length > contentBudget;
433
+ return `- ${heading}${content}${wasTruncated ? ` (${id})` : ""}`;
434
+ }
435
+ }
253
436
  }
254
437
 
255
438
  // ---------------------------------------------------------------------------
256
439
  // Main entry point
257
440
  // ---------------------------------------------------------------------------
258
441
 
259
- /** Full recall run: search every relevant source, fuse with RRF, format as markdown. */
260
- export async function runRecall(input: RecallInput): Promise<RecallResult> {
442
+ /**
443
+ * Search every relevant source, fuse with RRF, and return raw scored results.
444
+ *
445
+ * This is the search+fusion core shared by `runRecall()` (LLM-formatted) and
446
+ * direct consumers like the web UI that need access to the raw result items.
447
+ */
448
+ export async function searchRecall(
449
+ input: RecallInput,
450
+ ): Promise<ScoredTaggedResult[]> {
261
451
  const {
262
452
  query,
263
453
  scope = "all",
@@ -272,7 +462,7 @@ export async function runRecall(input: RecallInput): Promise<RecallResult> {
272
462
 
273
463
  // Short-circuit vague queries — stopwords-only would match everything.
274
464
  if (ftsQuery(query) === EMPTY_QUERY) {
275
- return "Query too vague — try using specific keywords, file names, or technical terms.";
465
+ return [];
276
466
  }
277
467
 
278
468
  // Optional query expansion: generate alternative phrasings via LLM.
@@ -431,6 +621,36 @@ export async function runRecall(input: RecallInput): Promise<RecallResult> {
431
621
  });
432
622
  }
433
623
  }
624
+
625
+ // Temporal vector search (undistilled messages only)
626
+ if (scope !== "knowledge") {
627
+ const pid = ensureProject(projectPath);
628
+ const temporalVectorHits = embedding.vectorSearchTemporal(
629
+ queryVec,
630
+ pid,
631
+ limit,
632
+ );
633
+ const temporalVectorTagged: TaggedResult[] = temporalVectorHits
634
+ .map((hit): TaggedResult | null => {
635
+ const row = db()
636
+ .query(
637
+ "SELECT id, project_id, session_id, role, content, tokens, distilled, created_at, metadata FROM temporal_messages WHERE id = ?",
638
+ )
639
+ .get(hit.id) as temporal.TemporalMessage | null;
640
+ if (!row) return null;
641
+ return {
642
+ source: "temporal",
643
+ item: { ...row, rank: -hit.similarity },
644
+ };
645
+ })
646
+ .filter((r): r is TaggedResult => r !== null);
647
+ if (temporalVectorTagged.length) {
648
+ allRrfLists.push({
649
+ items: temporalVectorTagged,
650
+ key: (r) => `t:${r.item.id}`,
651
+ });
652
+ }
653
+ }
434
654
  } catch (err) {
435
655
  log.info("recall: vector search failed:", err);
436
656
  }
@@ -567,7 +787,117 @@ export async function runRecall(input: RecallInput): Promise<RecallResult> {
567
787
  }
568
788
 
569
789
  const fused = reciprocalRankFusion<TaggedResult>(allRrfLists);
570
- return formatFusedResults(fused, 20);
790
+
791
+ // Cap output: return at most 3x the per-source limit. With 7+ RRF sources
792
+ // each contributing up to `limit` items, uncapped output can be huge (89+
793
+ // results for broad OR fallbacks). The top-scoring items after RRF fusion
794
+ // are the ones that appeared in multiple lists — capping preserves those
795
+ // while dropping the long tail of single-list noise.
796
+ const maxResults = limit * 3;
797
+ return fused.slice(0, maxResults);
798
+ }
799
+
800
+ // ---------------------------------------------------------------------------
801
+ // Recall by ID — fetch full untruncated content of a specific result
802
+ // ---------------------------------------------------------------------------
803
+
804
+ /**
805
+ * Fetch the full content of a single result by its source-prefixed ID.
806
+ *
807
+ * IDs use the format `prefix:uuid` where prefix is one of:
808
+ * k: (knowledge), xk: (cross-knowledge), d: (distillation),
809
+ * t: (temporal), lat: (lat-section).
810
+ */
811
+ export function recallById(id: string): string {
812
+ const colonIdx = id.indexOf(":");
813
+ if (colonIdx < 1) return `No entry found for id: ${id}`;
814
+
815
+ const prefix = id.slice(0, colonIdx);
816
+ const rawId = id.slice(colonIdx + 1);
817
+
818
+ switch (prefix) {
819
+ case "k":
820
+ case "xk": {
821
+ const entry = ltm.get(rawId);
822
+ if (!entry) return `No entry found for id: ${id}`;
823
+ return [
824
+ `## Recall Detail: ${id}`,
825
+ ``,
826
+ `#### Knowledge`,
827
+ `- **${inline(entry.title)}** (${entry.category}): ${inline(entry.content)}`,
828
+ ].join("\n");
829
+ }
830
+ case "d": {
831
+ const row = db()
832
+ .query(
833
+ "SELECT id, observations, generation, created_at, session_id, c_norm FROM distillations WHERE id = ?",
834
+ )
835
+ .get(rawId) as Distillation | null;
836
+ if (!row) return `No entry found for id: ${id}`;
837
+ return [
838
+ `## Recall Detail: ${id}`,
839
+ ``,
840
+ `#### Distilled`,
841
+ `${inline(row.observations)}`,
842
+ ].join("\n");
843
+ }
844
+ case "t": {
845
+ const row = db()
846
+ .query(
847
+ "SELECT id, project_id, session_id, role, content, tokens, distilled, created_at, metadata FROM temporal_messages WHERE id = ?",
848
+ )
849
+ .get(rawId) as temporal.TemporalMessage | null;
850
+ if (!row) return `No entry found for id: ${id}`;
851
+ return [
852
+ `## Recall Detail: ${id}`,
853
+ ``,
854
+ `#### Conversation`,
855
+ `(${row.role}, ${relativeAge(row.created_at)}, session: ${row.session_id.slice(0, 8)})`,
856
+ ``,
857
+ `${inline(row.content)}`,
858
+ ].join("\n");
859
+ }
860
+ case "lat": {
861
+ const row = db()
862
+ .query(
863
+ "SELECT id, project_id, file, heading, depth, content, content_hash, first_paragraph, updated_at FROM lat_sections WHERE id = ?",
864
+ )
865
+ .get(rawId) as latReader.LatSection | null;
866
+ if (!row) return `No entry found for id: ${id}`;
867
+ return [
868
+ `## Recall Detail: ${id}`,
869
+ ``,
870
+ `#### Reference`,
871
+ `**${inline(row.file)} \u00A7 ${inline(row.heading)}**`,
872
+ ``,
873
+ `${inline(row.content)}`,
874
+ ].join("\n");
875
+ }
876
+ default:
877
+ return `Unknown source prefix "${prefix}" in id: ${id}`;
878
+ }
879
+ }
880
+
881
+ /** Full recall run: search every relevant source, fuse with RRF, format as markdown. */
882
+ export async function runRecall(input: RecallInput): Promise<RecallResult> {
883
+ // ID-based detail retrieval — bypass search entirely.
884
+ if (input.id) {
885
+ return recallById(input.id);
886
+ }
887
+
888
+ // Short-circuit vague queries — stopwords-only would match everything.
889
+ if (ftsQuery(input.query) === EMPTY_QUERY) {
890
+ return "Query too vague — try using specific keywords, file names, or technical terms.";
891
+ }
892
+
893
+ const fused = await searchRecall(input);
894
+ const recallCfg = input.searchConfig?.recall;
895
+ return formatFusedResults(fused, {
896
+ charBudget: recallCfg?.charBudget ?? DEFAULT_FORMAT_CONFIG.charBudget,
897
+ relevanceFloor:
898
+ recallCfg?.relevanceFloor ?? DEFAULT_FORMAT_CONFIG.relevanceFloor,
899
+ maxResults: recallCfg?.maxResults ?? DEFAULT_FORMAT_CONFIG.maxResults,
900
+ });
571
901
  }
572
902
 
573
903
  /** Standard tool description reused verbatim by each host adapter. */
@@ -579,4 +909,5 @@ export const RECALL_PARAM_DESCRIPTIONS = {
579
909
  query: "What to search for — be specific. Include keywords, file names, or concepts.",
580
910
  scope:
581
911
  "Search scope: 'all' (default) searches everything, 'session' searches current session only, 'project' searches all sessions in this project, 'knowledge' searches only long-term knowledge.",
912
+ id: "Fetch full content of a specific result by its source-prefixed ID (e.g. 'k:abc123', 'd:abc123'). IDs are shown on truncated results in recall output. When id is provided, query is ignored.",
582
913
  };
package/src/search.ts CHANGED
@@ -173,6 +173,76 @@ export function ftsQueryOr(raw: string): string {
173
173
  return terms.map((w) => `${w}*`).join(" OR ");
174
174
  }
175
175
 
176
+ /**
177
+ * Build a cascade of progressively relaxed FTS5 queries.
178
+ *
179
+ * For N terms, produces up to (N - minTerms) queries, each dropping one more
180
+ * term (least significant first — shortest terms dropped first as a rough
181
+ * proxy for specificity). The final entry is always the full OR query.
182
+ *
183
+ * Example for 6 terms with minTerms=3:
184
+ * [0] 5-of-6 AND (drop shortest term)
185
+ * [1] 4-of-6 AND
186
+ * [2] 3-of-6 AND
187
+ * [3] full OR (all 6 terms)
188
+ *
189
+ * For ≤ minTerms terms, returns just the OR query (no intermediate steps).
190
+ * Callers should try each query in order, stopping at the first that returns
191
+ * results. This avoids the AND→OR cliff that produces massive low-quality
192
+ * result sets.
193
+ */
194
+ export function ftsQueryRelaxed(raw: string, minTerms = 3): string[] {
195
+ const terms = filterTerms(raw);
196
+ if (!terms.length) return [EMPTY_QUERY];
197
+
198
+ const orQuery = terms.map((w) => `${w}*`).join(" OR ");
199
+
200
+ // Not enough terms for progressive relaxation — just OR.
201
+ if (terms.length <= minTerms) return [orQuery];
202
+
203
+ // Sort by length ascending — shortest (least specific) terms dropped first.
204
+ const ranked = [...terms].sort((a, b) => a.length - b.length);
205
+
206
+ const cascade: string[] = [];
207
+ for (let drop = 1; drop <= terms.length - minTerms; drop++) {
208
+ const kept = ranked.slice(drop);
209
+ cascade.push(kept.map((w) => `${w}*`).join(" "));
210
+ }
211
+ cascade.push(orQuery);
212
+ return cascade;
213
+ }
214
+
215
+ /**
216
+ * Run a search function through the relaxed cascade, stopping at the first
217
+ * query that produces results. Falls back through progressively looser AND
218
+ * queries before trying full OR.
219
+ *
220
+ * @param raw The original query string
221
+ * @param runner A function that takes an FTS5 MATCH expression and returns results
222
+ * @returns The results from the first cascade step that produced matches
223
+ */
224
+ export function runRelaxedSearch<T>(
225
+ raw: string,
226
+ runner: (matchExpr: string) => T[],
227
+ ): T[] {
228
+ // First try exact AND (all terms)
229
+ const q = ftsQuery(raw);
230
+ if (q === EMPTY_QUERY) return [];
231
+
232
+ const andResults = runner(q);
233
+ if (andResults.length) return andResults;
234
+
235
+ // Try progressively relaxed queries
236
+ const cascade = ftsQueryRelaxed(raw);
237
+ for (const relaxed of cascade) {
238
+ if (relaxed === EMPTY_QUERY) continue;
239
+ const results = runner(relaxed);
240
+ if (results.length) return results;
241
+ }
242
+
243
+ return [];
244
+ }
245
+
176
246
  // ---------------------------------------------------------------------------
177
247
  // Term extraction (Phase 3)
178
248
  // ---------------------------------------------------------------------------
@@ -335,7 +405,7 @@ export async function expandQuery(
335
405
  llm.prompt(
336
406
  QUERY_EXPANSION_SYSTEM,
337
407
  `Input: "${query}"`,
338
- { model, workerID: "lore-query-expand", thinking: false, urgent: true, sessionID },
408
+ { model, workerID: "lore-query-expand", thinking: false, urgent: true, sessionID, maxTokens: 256 },
339
409
  ),
340
410
  new Promise<null>((resolve) => setTimeout(() => resolve(null), TIMEOUT_MS)),
341
411
  ]);