npm - @loreai/core - Versions diffs - 0.0.1 → 0.10.0 - Mend

@loreai/core 0.0.1 → 0.10.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (147) hide show

package/LICENSE +21 -0
package/README.md +26 -5
package/dist/bun/agents-file.d.ts +59 -0
package/dist/bun/agents-file.d.ts.map +1 -0
package/dist/bun/config.d.ts +58 -0
package/dist/bun/config.d.ts.map +1 -0
package/dist/bun/curator.d.ts +35 -0
package/dist/bun/curator.d.ts.map +1 -0
package/dist/bun/db/driver.bun.d.ts +5 -0
package/dist/bun/db/driver.bun.d.ts.map +1 -0
package/dist/bun/db/driver.node.d.ts +15 -0
package/dist/bun/db/driver.node.d.ts.map +1 -0
package/dist/bun/db.d.ts +22 -0
package/dist/bun/db.d.ts.map +1 -0
package/dist/bun/distillation.d.ts +32 -0
package/dist/bun/distillation.d.ts.map +1 -0
package/dist/bun/embedding.d.ts +90 -0
package/dist/bun/embedding.d.ts.map +1 -0
package/dist/bun/gradient.d.ts +73 -0
package/dist/bun/gradient.d.ts.map +1 -0
package/dist/bun/index.d.ts +19 -0
package/dist/bun/index.d.ts.map +1 -0
package/dist/bun/index.js +28236 -0
package/dist/bun/index.js.map +7 -0
package/dist/bun/lat-reader.d.ts +69 -0
package/dist/bun/lat-reader.d.ts.map +1 -0
package/dist/bun/log.d.ts +17 -0
package/dist/bun/log.d.ts.map +1 -0
package/dist/bun/ltm.d.ts +138 -0
package/dist/bun/ltm.d.ts.map +1 -0
package/dist/bun/markdown.d.ts +37 -0
package/dist/bun/markdown.d.ts.map +1 -0
package/dist/bun/prompt.d.ts +47 -0
package/dist/bun/prompt.d.ts.map +1 -0
package/dist/bun/recall.d.ts +41 -0
package/dist/bun/recall.d.ts.map +1 -0
package/dist/bun/search.d.ts +113 -0
package/dist/bun/search.d.ts.map +1 -0
package/dist/bun/temporal.d.ts +66 -0
package/dist/bun/temporal.d.ts.map +1 -0
package/dist/bun/types.d.ts +180 -0
package/dist/bun/types.d.ts.map +1 -0
package/dist/bun/worker.d.ts +6 -0
package/dist/bun/worker.d.ts.map +1 -0
package/dist/node/agents-file.d.ts +59 -0
package/dist/node/agents-file.d.ts.map +1 -0
package/dist/node/config.d.ts +58 -0
package/dist/node/config.d.ts.map +1 -0
package/dist/node/curator.d.ts +35 -0
package/dist/node/curator.d.ts.map +1 -0
package/dist/node/db/driver.bun.d.ts +5 -0
package/dist/node/db/driver.bun.d.ts.map +1 -0
package/dist/node/db/driver.node.d.ts +15 -0
package/dist/node/db/driver.node.d.ts.map +1 -0
package/dist/node/db.d.ts +22 -0
package/dist/node/db.d.ts.map +1 -0
package/dist/node/distillation.d.ts +32 -0
package/dist/node/distillation.d.ts.map +1 -0
package/dist/node/embedding.d.ts +90 -0
package/dist/node/embedding.d.ts.map +1 -0
package/dist/node/gradient.d.ts +73 -0
package/dist/node/gradient.d.ts.map +1 -0
package/dist/node/index.d.ts +19 -0
package/dist/node/index.d.ts.map +1 -0
package/dist/node/index.js +28253 -0
package/dist/node/index.js.map +7 -0
package/dist/node/lat-reader.d.ts +69 -0
package/dist/node/lat-reader.d.ts.map +1 -0
package/dist/node/log.d.ts +17 -0
package/dist/node/log.d.ts.map +1 -0
package/dist/node/ltm.d.ts +138 -0
package/dist/node/ltm.d.ts.map +1 -0
package/dist/node/markdown.d.ts +37 -0
package/dist/node/markdown.d.ts.map +1 -0
package/dist/node/prompt.d.ts +47 -0
package/dist/node/prompt.d.ts.map +1 -0
package/dist/node/recall.d.ts +41 -0
package/dist/node/recall.d.ts.map +1 -0
package/dist/node/search.d.ts +113 -0
package/dist/node/search.d.ts.map +1 -0
package/dist/node/temporal.d.ts +66 -0
package/dist/node/temporal.d.ts.map +1 -0
package/dist/node/types.d.ts +180 -0
package/dist/node/types.d.ts.map +1 -0
package/dist/node/worker.d.ts +6 -0
package/dist/node/worker.d.ts.map +1 -0
package/dist/types/agents-file.d.ts +59 -0
package/dist/types/agents-file.d.ts.map +1 -0
package/dist/types/config.d.ts +58 -0
package/dist/types/config.d.ts.map +1 -0
package/dist/types/curator.d.ts +35 -0
package/dist/types/curator.d.ts.map +1 -0
package/dist/types/db/driver.bun.d.ts +5 -0
package/dist/types/db/driver.bun.d.ts.map +1 -0
package/dist/types/db/driver.node.d.ts +15 -0
package/dist/types/db/driver.node.d.ts.map +1 -0
package/dist/types/db.d.ts +22 -0
package/dist/types/db.d.ts.map +1 -0
package/dist/types/distillation.d.ts +32 -0
package/dist/types/distillation.d.ts.map +1 -0
package/dist/types/embedding.d.ts +90 -0
package/dist/types/embedding.d.ts.map +1 -0
package/dist/types/gradient.d.ts +73 -0
package/dist/types/gradient.d.ts.map +1 -0
package/dist/types/index.d.ts +19 -0
package/dist/types/index.d.ts.map +1 -0
package/dist/types/lat-reader.d.ts +69 -0
package/dist/types/lat-reader.d.ts.map +1 -0
package/dist/types/log.d.ts +17 -0
package/dist/types/log.d.ts.map +1 -0
package/dist/types/ltm.d.ts +138 -0
package/dist/types/ltm.d.ts.map +1 -0
package/dist/types/markdown.d.ts +37 -0
package/dist/types/markdown.d.ts.map +1 -0
package/dist/types/prompt.d.ts +47 -0
package/dist/types/prompt.d.ts.map +1 -0
package/dist/types/recall.d.ts +41 -0
package/dist/types/recall.d.ts.map +1 -0
package/dist/types/search.d.ts +113 -0
package/dist/types/search.d.ts.map +1 -0
package/dist/types/temporal.d.ts +66 -0
package/dist/types/temporal.d.ts.map +1 -0
package/dist/types/types.d.ts +180 -0
package/dist/types/types.d.ts.map +1 -0
package/dist/types/worker.d.ts +6 -0
package/dist/types/worker.d.ts.map +1 -0
package/package.json +48 -5
package/src/agents-file.ts +406 -0
package/src/config.ts +132 -0
package/src/curator.ts +220 -0
package/src/db/driver.bun.ts +18 -0
package/src/db/driver.node.ts +54 -0
package/src/db.ts +433 -0
package/src/distillation.ts +433 -0
package/src/embedding.ts +528 -0
package/src/gradient.ts +1387 -0
package/src/index.ts +109 -0
package/src/lat-reader.ts +374 -0
package/src/log.ts +27 -0
package/src/ltm.ts +861 -0
package/src/markdown.ts +129 -0
package/src/prompt.ts +454 -0
package/src/recall.ts +446 -0
package/src/search.ts +330 -0
package/src/temporal.ts +379 -0
package/src/types.ts +199 -0
package/src/worker.ts +26 -0

package/src/markdown.ts ADDED Viewed

@@ -0,0 +1,129 @@
+import { remark } from "remark";
+import type {
+  Root,
+  Heading,
+  List,
+  ListItem,
+  Paragraph,
+  Text,
+  Strong,
+  BlockContent,
+  PhrasingContent,
+} from "mdast";
+// Shared remark processor used by serialize, normalize and unescapeMarkdown.
+// Reuse a single processor — remark freezes on first use anyway
+const processor = remark();
+/**
+ * Turn an mdast tree into its markdown source text.
+ *
+ * Escaping is left to the serializer: characters in text nodes that would be
+ * structurally ambiguous (code fences, headings, list markers, thematic
+ * breaks, etc.) are escaped automatically, so callers never pre-escape.
+ *
+ * @param tree - Root node of the tree to serialize.
+ * @returns The markdown string produced by the shared processor.
+ */
+export function serialize(tree: Root): string {
+  const markdown = processor.stringify(tree);
+  return markdown;
+}
+/**
+ * Swap every unpaired UTF-16 surrogate for U+FFFD (replacement character).
+ *
+ * A surrogate is unpaired when it is a high surrogate (U+D800-U+DBFF) with no
+ * low surrogate (U+DC00-U+DFFF) right after it, or a low surrogate with no
+ * high surrogate right before it. Such code units are technically invalid in
+ * UTF-8/JSON. They can appear in tool outputs (binary file contents, command
+ * output) and survive through SQLite storage into recall results; when the
+ * string is later serialized to JSON for the LLM API, the API rejects it with
+ * "no low surrogate in string".
+ *
+ * @param value - Text that may contain lone surrogates.
+ * @returns The same text with each lone surrogate replaced; valid pairs and
+ *   all other characters are left untouched.
+ */
+export function sanitizeSurrogates(value: string): string {
+  // First alternative: high surrogate not followed by a low surrogate.
+  // Second alternative: low surrogate not preceded by a high surrogate.
+  const unpairedSurrogate =
+    // eslint-disable-next-line no-control-regex
+    /[\uD800-\uDBFF](?![\uDC00-\uDFFF])|(?<![\uD800-\uDBFF])[\uDC00-\uDFFF]/g;
+  const replacementCharacter = "\uFFFD";
+  return value.replace(unpairedSurrogate, replacementCharacter);
+}
+/**
+ * Flatten LLM-generated text to a single line before it goes into a text node.
+ *
+ * Embedded blank lines cause list items to become "spread" (loose), which then
+ * breaks the surrounding markdown structure on re-parse. Every run of
+ * whitespace that contains a line break is therefore replaced with one space,
+ * and the result is trimmed. A lone carriage return counts as a line break
+ * too: markdown treats CR, LF and CRLF alike as line endings, so CR-only text
+ * (e.g. progress-style command output) must be collapsed as well.
+ * Unpaired surrogates are sanitized first to prevent JSON serialization
+ * failures.
+ *
+ * @param value - Raw text, possibly multi-line.
+ * @returns Single-line, trimmed text with unpaired surrogates replaced.
+ */
+export function inline(value: string): string {
+  // [\r\n] rather than \n alone so that "a\r\rb" cannot smuggle a blank line.
+  return sanitizeSurrogates(value).replace(/\s*[\r\n]\s*/g, " ").trim();
+}
+/**
+ * Normalize arbitrary markdown via a parse → stringify roundtrip.
+ *
+ * Used for content we don't control (e.g. existing text parts in Layer 4
+ * after tool parts are stripped out), where we can't build from AST.
+ * The roundtrip runs twice: remark's asterisk/underscore escaping can
+ * introduce new sequences on the first pass that the second pass then
+ * stabilizes.
+ *
+ * @param md - Markdown source to normalize.
+ * @returns The markdown after two parse/stringify passes.
+ */
+export function normalize(md: string): string {
+  const passes = 2;
+  let current = md;
+  for (let pass = 0; pass < passes; pass++) {
+    current = processor.stringify(processor.parse(current));
+  }
+  return current;
+}
+/**
+ * Unescape a markdown-serialized inline string back to plain text.
+ *
+ * remark's serializer escapes special characters with backslashes
+ * (e.g. `<` → `\<`, `*` → `\*`, `\` → `\\`). Content read back from an
+ * AGENTS.md file must be unescaped so it round-trips cleanly — otherwise
+ * each export/import cycle doubles the escapes. The string is parsed with
+ * remark's own parser and the text values are read from the resulting tree.
+ *
+ * Only the first top-level node is inspected, and only when it is a
+ * paragraph: its direct text children are collected, together with the
+ * direct text children of any `strong` or `emphasis` child. Every other
+ * node type is ignored.
+ *
+ * @param md - Markdown-escaped inline text.
+ * @returns The concatenated text values, or `md` unchanged when nothing was
+ *   collected (no leading paragraph, or an empty result).
+ */
+export function unescapeMarkdown(md: string): string {
+  const first = processor.parse(md).children[0];
+  if (!first || first.type !== "paragraph") return md;
+  const collected: string[] = [];
+  for (const node of first.children) {
+    switch (node.type) {
+      case "text":
+        collected.push(node.value);
+        break;
+      case "strong":
+      case "emphasis":
+        // One level only: nested formatting inside these is not descended into.
+        for (const inner of node.children) {
+          if (inner.type === "text") collected.push(inner.value);
+        }
+        break;
+    }
+  }
+  return collected.join("") || md;
+}
+// --- Node builders ---
+// Small factories that return plain mdast node objects.
+/** Heading of the given depth wrapping a single text node. */
+export function h(depth: 1 | 2 | 3 | 4 | 5 | 6, value: string): Heading {
+  const heading: Heading = { type: "heading", depth, children: [t(value)] };
+  return heading;
+}
+/** Paragraph wrapping a single text node. */
+export function p(value: string): Paragraph {
+  const paragraph: Paragraph = { type: "paragraph", children: [t(value)] };
+  return paragraph;
+}
+/** Unordered, non-spread list made of the given items. */
+export function ul(items: ListItem[]): List {
+  const list: List = {
+    type: "list",
+    ordered: false,
+    spread: false,
+    children: items,
+  };
+  return list;
+}
+/** Non-spread list item holding the given block children. */
+export function li(...children: BlockContent[]): ListItem {
+  const item: ListItem = { type: "listItem", spread: false, children };
+  return item;
+}
+/** List item containing a single paragraph (the common case for facts/entries). */
+export function lip(value: string): ListItem {
+  const paragraph = p(value);
+  return li(paragraph);
+}
+/** List item with inline phrasing content — e.g. **bold**: text */
+export function liph(...children: PhrasingContent[]): ListItem {
+  const paragraph: Paragraph = { type: "paragraph", children };
+  return li(paragraph);
+}
+/** Text node carrying `value`. */
+export function t(value: string): Text {
+  const text: Text = { type: "text", value };
+  return text;
+}
+/** Strong (bold) node wrapping a single text node. */
+export function strong(value: string): Strong {
+  const bold: Strong = { type: "strong", children: [t(value)] };
+  return bold;
+}
+/** Root node holding the given top-level children. */
+export function root(...children: Root["children"]): Root {
+  const tree: Root = { type: "root", children };
+  return tree;
+}

package/src/prompt.ts ADDED Viewed

@@ -0,0 +1,454 @@
+import type { Root } from "mdast";
+import { serialize, inline, h, ul, liph, strong, t, root } from "./markdown";
+// All prompts are locked down — they are our core value offering.
+// Do not make these configurable.
+/**
+ * System prompt for the distillation ("memory observer") pass.
+ *
+ * Instructs the model to turn a conversation into a dense, dated event log:
+ * priority-tagged (🔴/🟡/🟢) observation lines with (HH:MM) timestamps,
+ * optional "(meaning DATE)" / "(estimated DATE)" annotations and
+ * [entity-type] tags, returned inside a single <observations> block.
+ */
+export const DISTILLATION_SYSTEM = `You are a memory observer. Your observations will be the ONLY information an AI assistant has about past interactions. Produce a dense, dated event log — not a summary.
+CRITICAL: DISTINGUISH USER ASSERTIONS FROM QUESTIONS
+When the user TELLS you something about themselves, mark it as an assertion (🔴):
+- "I have two kids" → 🔴 (14:30) User stated has two kids
+- "I work at Acme Corp" → 🔴 (14:31) User stated works at Acme Corp
+When the user ASKS about something, mark it as a question (🟡):
+- "Can you help me with X?" → 🟡 (15:00) User asked for help with X
+User assertions are AUTHORITATIVE — the user is the source of truth about their own life.
+TEMPORAL ANCHORING — CRITICAL FOR TEMPORAL REASONING:
+Each observation has up to two timestamps:
+1. BEGINNING: The time the statement was made — ALWAYS include this as (HH:MM)
+2. END: The referenced date, if the content refers to a different time — add as "(meaning DATE)" or "(estimated DATE)"
+ONLY add "(meaning DATE)" when you can derive an actual date:
+- "last week", "yesterday", "next month" → compute and add the date
+- "recently", "a while ago", "soon" → too vague, omit the end date
+ALWAYS put the date annotation at the END of the observation line.
+GOOD: (09:15) User will visit parents this weekend. (meaning Jun 17-18, 2025)
+GOOD: (09:15) User's friend had a birthday party last month. (estimated May 2025)
+GOOD: (09:15) User prefers hiking in the mountains.
+BAD: (09:15) User prefers hiking. (meaning Jun 15, 2025)  ← no time reference, don't add date
+If an observation contains MULTIPLE events, split into SEPARATE lines, each with its own date.
+STATE CHANGES — make supersession explicit:
+- "User will use X (replacing Y)" — not just "User will use X"
+- "User moved to Berlin (no longer in London)"
+DETAILS TO ALWAYS PRESERVE:
+- Names, handles, usernames (@username, "Dr. Smith")
+- Numbers, counts, quantities (4 items, 3 sessions, $120)
+- Measurements, percentages (5kg, 20% improvement, 85% accuracy)
+- Sequences and orderings (steps 1-5, lucky numbers: 7 14 23)
+- Prices, dates, times, durations
+- Locations and distinguishing attributes
+- User's specific role (presenter, volunteer, organizer — not just "attended")
+- Exact phrasing when unusual ("movement session" for exercise)
+EXACT NUMBERS — NEVER APPROXIMATE:
+When the conversation states a specific count, record that EXACT number — do not round, estimate, or substitute a count you see later. If the same quantity appears with different values at different times, record each with its timestamp.
+BAD: All existing entries bulk-updated to cross_project=1 (50 entries)  ← wrong: mixed up with a later count
+GOOD: 43 knowledge entries bulk-updated to cross_project=1 via SQL UPDATE  ← exact number from the operation
+BAD: ~130 test failures
+GOOD: 131 test failures (1902 pass, 131 fail, 1 error across 100 files)  ← preserve exact counts
+BUG FIXES AND CODE CHANGES — HIGH PRIORITY:
+Every bug fix, code change, or technical decision is important regardless of where it appears in the conversation. Early-session fixes are just as valuable as later ones.
+For each fix, record:
+- The specific bug/problem (what went wrong)
+- The root cause (why it went wrong)
+- The fix applied (what changed, with file paths and line numbers)
+- The outcome (tests pass, deployed, etc.)
+BAD: 🟡 Fixed an FTS5 search bug
+GOOD: 🟡 FTS5 was doing exact term matching instead of prefix matching in ltm.ts. Fix: added ftsQuery() function that appends * to each search term for prefix matching. Committed as [hash].
+ASSISTANT-GENERATED CONTENT — THIS IS CRITICAL:
+When the assistant produces lists, recommendations, explanations, recipes, schedules, creative content, or any structured output — record EVERY ITEM with its distinguishing details. The user WILL ask about specific items later.
+BAD: 🟡 Assistant recommended 5 dessert spots in Orlando.
+GOOD: 🟡 Assistant recommended dessert spots: Sugar Factory (Icon Park, giant milkshakes), Wondermade (Sanford, gourmet marshmallows), Gideon's Bakehouse (Disney Springs, cookies), Farris & Foster's (unique flavors), Kilwins (handmade fudge)
+BAD: 🟡 Assistant listed work-from-home jobs for seniors.
+GOOD: 🟡 Assistant listed 10 WFH jobs for seniors: 1. Virtual assistant, 2. Online tutor, 3. Freelance writer, 4. Social media manager, 5. Customer service rep, 6. Bookkeeper, 7. Transcriptionist, 8. Web designer, 9. Data entry, 10. Consultant
+BAD: 🟡 Assistant explained refining processes.
+GOOD: 🟡 Assistant explained Lake Charles refinery processes: atmospheric distillation, fluid catalytic cracking (FCC), alkylation, hydrotreating
+Rules for assistant content:
+- Record EACH item in a list with at least one distinguishing attribute
+- For numbered lists, preserve the EXACT ordering (1st, 2nd, 3rd...)
+- For recipes: preserve specific quantities, ratios, temperatures, times
+- For recommendations: preserve names, locations, prices, key features
+- For creative content (songs, stories, poems): preserve titles, key phrases, character names, structural details
+- For technical explanations: preserve specific values, percentages, formulas, tool/library names
+- Ordered lists must keep their numbering — users ask "what was the 7th item?"
+- Use 🟡 priority but NEVER skip assistant-generated details to save space
+ENUMERATABLE ENTITIES — always flag for cross-session aggregation:
+When the user mentions attending events, buying things, meeting people, completing tasks — mark with entity type so these can be aggregated across sessions:
+🔴 [event-attended] User attended Rachel+Mike's wedding (vineyard in Napa, Aug 12, 2023)
+🔴 [item-purchased] User bought Sony WH-1000XM5 headphones ($280, replaced old Bose)
+This makes it possible to answer "how many weddings did I attend?" by aggregating across sessions.
+PRIORITY LEVELS:
+- 🔴 High: user assertions, stated facts, preferences, goals, enumeratable entities
+- 🟡 Medium: questions asked, context, assistant-generated content with full detail
+- 🟢 Low: minor conversational context, greetings, acknowledgments
+OUTPUT FORMAT — output ONLY observations, no preamble:
+<observations>
+Date: Jan 15, 2026
+* 🔴 (09:15) User stated has two kids: Emma (12) and Jake (9)
+* 🔴 (09:16) User's anniversary is March 15
+* 🟡 (09:20) User asked how to optimize database queries
+* 🔴 [event-attended] (10:00) User attended company holiday party as a presenter (gave talk on microservices)
+* 🔴 (11:30) User will visit parents this weekend. (meaning Jan 17-18, 2026)
+* 🟡 (14:00) Agent debugging auth issue — found missing null check in auth.ts:45, applied fix, tests pass
+* 🟡 (14:30) Assistant recommended 5 hotels: 1. Grand Plaza (near station, $180), 2. Seaside Inn (pet-friendly, $120), 3. Mountain Lodge (pool, free breakfast, $95), 4. Harbor View (historic, walkable, $150), 5. Zen Garden (quietest, spa, $200)
+* 🔴 (15:00) User switched from Python to TypeScript for the project (no longer using Python)
+</observations>`;
+/**
+ * Build the user message for a distillation pass.
+ *
+ * @param input - `priorObservations`: observations already recorded; when
+ *   present and non-empty they are quoted with a "do NOT repeat" note,
+ *   otherwise the message says the session is just beginning. `date` and
+ *   `messages` are inserted verbatim.
+ * @returns The assembled prompt text, one section per line.
+ */
+export function distillationUser(input: {
+  priorObservations?: string;
+  date: string;
+  messages: string;
+}): string {
+  let context = "This is the beginning of the session.";
+  if (input.priorObservations) {
+    context = `Previous observations (do NOT repeat these — your new observations will be appended):\n${input.priorObservations}\n\n---`;
+  }
+  const lines = [
+    context,
+    `Session date: ${input.date}`,
+    "Conversation to observe:",
+    `${input.messages}`,
+    "Extract new observations. Output ONLY an <observations> block.",
+  ];
+  return lines.join("\n");
+}
+// System prompt for the meta-distillation ("memory reflector") pass, which
+// consolidates several observation segments into one sectioned working context.
+// Meta-distillation prompt using a context-distillation objective: instead of
+// reorganizing observations into another event log (which Eyuboglu et al. 2025
+// showed is a memorization objective that fails to generalize), produce a
+// structured working context optimized for diverse downstream queries.
+// This mirrors the Self-Study approach from "Cartridges" (Eyuboglu et al.,
+// 2025) where diverse seed prompt types ensure the compressed representation
+// supports varied information needs, not just chronological recall.
+// Reference: https://arxiv.org/abs/2501.17390
+export const RECURSIVE_SYSTEM = `You are a memory reflector. You are given a set of observations from multiple conversation segments. Your job is to consolidate them into a structured working context that will become the agent's entire memory going forward.
+IMPORTANT: Your reflections ARE the entirety of the assistant's memory. Any information you omit is permanently forgotten. Do not leave out anything important.
+STRUCTURE your output into these sections — each section supports a different type of downstream query:
+### Current State
+What is in progress right now? Active branches, open files, current task, blockers.
+This section answers: "What was I working on?"
+### Key Decisions
+What was decided and why? Include the alternatives considered and rationale.
+This section answers: "Why did we choose approach X?" and "What alternatives were rejected?"
+### Technical Changes
+Bugs found, root causes, fixes applied, files modified, tests added/fixed.
+Preserve exact file paths, line numbers, error messages, and commit references.
+This section answers: "What bugs were fixed?" and "What files were changed?"
+### Session Timeline
+Condensed chronological events with timestamps. Older events compressed more aggressively; recent events retain detail. This section answers: "When did X happen?" and "What was the sequence of events?"
+CONSOLIDATION RULES:
+- Preserve ALL dates and timestamps — temporal context is critical
+- Combine related items (e.g., "agent called view tool 5 times on file x" → single line)
+- Merge duplicate facts, keeping the most specific version
+- Drop observations superseded by later info (if value changed, keep only final value)
+- When consolidating, USER ASSERTIONS take precedence over questions about the same topic
+- Preserve all enumeratable entities [entity-type] — these are needed for aggregation questions
+- For enumeratable entities spanning multiple segments, create an explicit aggregation:
+  🔴 [event-attended] User attended 3 weddings total: Rachel+Mike (vineyard, Aug 2023), Emily+Sarah (garden, Sep 2023), Jen+Tom (Oct 8, 2023)
+EXACT NUMBERS: When two segments report different numbers for what seems like the same thing, keep the number from the earlier/original observation — it's likely the correct one from the actual event. Later references may be from memory or approximation.
+EARLY-SESSION CONTENT: Bug fixes, code changes, and decisions from the start of a session are just as important as later work. Never drop them just because the segment is short or old. If the first segment contains a specific bug fix with file paths and root cause, it MUST survive into the reflection.
+Output ONLY an <observations> block with the consolidated observations.`;
+/**
+ * Build the user message for the meta-distillation pass.
+ *
+ * Each distillation becomes a "Segment N:" section (N starts at 1, in array
+ * order) and the sections are separated by a "---" rule.
+ *
+ * @param distillations - Observation segments in the order they are passed.
+ * @returns The heading line followed by the joined segments.
+ */
+export function recursiveUser(
+  distillations: Array<{ observations: string }>,
+): string {
+  const toSegment = (segment: { observations: string }, index: number) =>
+    `Segment ${index + 1}:\n${segment.observations}`;
+  const separator = "\n\n---\n\n";
+  const body = distillations.map(toSegment).join(separator);
+  return `Observation segments to consolidate (chronological order):\n${body}`;
+}
+/**
+ * System prompt for the long-term memory curator pass.
+ *
+ * Asks the model to extract durable, codebase-specific knowledge from a
+ * conversation and to answer with a bare JSON array of "create", "update"
+ * and "delete" operations (or an empty array when nothing qualifies).
+ */
+export const CURATOR_SYSTEM = `You are a long-term memory curator. Your job is to extract durable knowledge from a conversation that should persist across sessions.
+Focus ONLY on knowledge that helps a coding agent work effectively on THIS codebase:
+- Architectural decisions and their rationale (why something was built a certain way)
+- Non-obvious implementation patterns and conventions specific to the project
+- Recurring gotchas, constraints, or traps in the codebase
+- Environment/tooling setup details that affect development
+- Important relationships between components that aren't obvious from reading the code
+- User preferences and working style specific to how they use this project
+Do NOT extract:
+- Task-specific details (file currently being edited, current bug being fixed)
+- Temporary state (current branch, in-progress work)
+- Information that will change frequently
+- Ecosystem descriptions, product announcements, or marketing content
+- Business strategy, roadmap, or organizational information
+- Information that's readily available in public documentation or READMEs
+- Knowledge about unrelated projects or repositories unless explicitly cross-project
+- Restatements of what the code obviously does (e.g. "the auth module handles authentication")
+BREVITY IS CRITICAL — each entry must be concise:
+- content MUST be under 150 words (~600 characters). Capture ONE specific actionable
+  insight in 2-3 sentences. Prefer terse technical language.
+- Each "gotcha": one specific trap + its fix in 1-2 sentences
+- Each "architecture": one design decision and its key constraint
+- Focus on the actionable insight, not the full story behind it
+- If a pattern requires more detail, split into multiple focused entries (each under 150 words)
+- Omit code examples unless a single short snippet is essential
+- Never include full file contents, large diffs, or complete command outputs
+PREFER UPDATES OVER CREATES:
+- Before creating a new entry, always check if an existing entry covers the same system
+  or component. Update the existing entry rather than creating a new one.
+- When updating, REPLACE the full content with a concise rewrite — do not append to
+  the existing content or repeat what was already there.
+- If multiple existing entries cover the same system from different angles (e.g. different
+  bugs in the same module), consolidate them: update one with merged insights, delete the
+  rest. Fewer, denser entries are better than many scattered ones.
+CROSS-REFERENCES between entries:
+- When an entry relates to another entry, reference it with [[entry-uuid]] using the entry's ID
+  from the existing entries list. This creates navigable links between entries.
+- Only reference entries you can see in the existing entries list — don't guess IDs.
+- Example: "Uses the gradient system [[019c904b-791e-772a-ab2b-93ac892a960c]] for context management."
+crossProject flag:
+- Default is true — most useful knowledge is worth sharing across projects
+- Set crossProject to false for things that are meaningless outside this specific repo (e.g. a config path, a project-local naming convention that conflicts with your usual style)
+Produce a JSON array of operations:
+[
+  {
+    "op": "create",
+    "category": "decision" | "pattern" | "preference" | "architecture" | "gotcha",
+    "title": "Short descriptive title",
+    "content": "Concise knowledge entry — under 150 words",
+    "scope": "project" | "global",
+    "crossProject": true
+  },
+  {
+    "op": "update",
+    "id": "existing-entry-id",
+    "content": "Updated content — under 150 words",
+    "confidence": 0.0-1.0
+  },
+  {
+    "op": "delete",
+    "id": "existing-entry-id",
+    "reason": "Why this is no longer relevant"
+  }
+]
+If nothing warrants extraction, return an empty array: []
+Output ONLY valid JSON. No markdown fences, no explanation, no preamble.`;
+/**
+ * Build the user message for the curator pass.
+ *
+ * The message lists the existing knowledge entries (one "- [id] (category)
+ * title: content" bullet each, or a "No existing knowledge entries." line when
+ * the list is empty), then the conversation text, then a fixed block of
+ * reminders about preferring updates and keeping entries short.
+ *
+ * @param input - `messages`: conversation text, inserted verbatim.
+ *   `existing`: entries the model may update or delete.
+ * @returns The assembled prompt text.
+ */
+export function curatorUser(input: {
+  messages: string;
+  existing: Array<{
+    id: string;
+    category: string;
+    title: string;
+    content: string;
+  }>;
+}): string {
+  const total = input.existing.length;
+  let knowledge = "No existing knowledge entries.";
+  if (total) {
+    const bullets = input.existing
+      .map((entry) => `- [${entry.id}] (${entry.category}) ${entry.title}: ${entry.content}`)
+      .join("\n");
+    knowledge = `Existing knowledge entries (${total} total — you may update or delete these):\n${bullets}`;
+  }
+  return `${knowledge}
+---
+Recent conversation to extract knowledge from:
+${input.messages}
+---
+IMPORTANT:
+1. Prefer updating existing entries over creating new ones. If a new insight refines or
+   extends an existing entry on the same topic, update that entry — don't create a new one.
+2. When updating, REPLACE the content with a complete rewrite — never append.
+3. If entries cover the same system from different angles, merge them: update one, delete the rest.
+4. Only create a new entry for genuinely distinct knowledge with no existing home.
+5. Keep all entries under 150 words. If an existing entry is too long, use an update op to trim it.`;
+}
+/**
+ * System prompt for the consolidation pass.
+ * Unlike the normal curator (which extracts from conversation), consolidation
+ * reviews the FULL entry corpus and aggressively merges/trims/deletes to reduce
+ * entry count while preserving the most actionable knowledge.
+ *
+ * The prompt restricts the model to "update" and "delete" ops (no "create")
+ * and asks for a bare JSON array as the only output.
+ */
+export const CONSOLIDATION_SYSTEM = `You are a long-term memory curator performing a consolidation pass. The knowledge base has grown too large and needs to be trimmed.
+Your goal: reduce the entry count to the target maximum while preserving the most valuable knowledge.
+CONSOLIDATION RULES:
+1. MERGE related entries — if multiple entries describe the same system, module, or concept
+   from different angles (e.g. several bug fixes in the same component), merge them into
+   ONE concise entry. Use an "update" op for the surviving entry and "delete" ops for the rest.
+2. TRIM verbose entries — any entry over 150 words must be trimmed to its essential insight.
+   Use an "update" op with the rewritten content.
+3. DELETE low-value entries:
+   - Stale entries about bugs that have been fixed and no longer need gotcha warnings
+   - Entries whose knowledge is fully subsumed by another entry
+   - Entries about one-off incidents with no recurring applicability
+   - General advice available in any documentation
+4. PRESERVE:
+   - Entries describing non-obvious design decisions specific to this codebase
+   - Entries about recurring traps that a developer would hit again
+   - Entries that capture a hard-won gotcha with a concrete fix
+OUTPUT: A JSON array of "update" and "delete" ops only. No "create" ops — you are not
+extracting new knowledge, only consolidating existing knowledge.
+- "update": Replace content with a concise rewrite (under 150 words). Use to merge survivors or trim verbose entries.
+- "delete": Remove entries that are merged, stale, or low-value.
+Output ONLY valid JSON. No markdown fences, no explanation, no preamble.`;
+/**
+ * Build the user message for the consolidation pass.
+ *
+ * @param input - `entries`: the knowledge entries to review, rendered one
+ *   "- [id] (category) title: content" bullet each. `targetMax`: the entry
+ *   count the model is asked to get down to; it appears in both the first and
+ *   the last line.
+ * @returns A three-part message: summary line, bullet list, instruction.
+ */
+export function consolidationUser(input: {
+  entries: Array<{
+    id: string;
+    category: string;
+    title: string;
+    content: string;
+  }>;
+  targetMax: number;
+}): string {
+  const bullets: string[] = input.entries.map(
+    (entry) => `- [${entry.id}] (${entry.category}) ${entry.title}: ${entry.content}`,
+  );
+  const summary = `Current knowledge entries (${input.entries.length} total, target max: ${input.targetMax}):`;
+  const instruction = `Produce update/delete ops to reduce entry count to at most ${input.targetMax}. Prioritize merging related entries and trimming verbose ones over outright deletion.`;
+  return [summary, bullets.join("\n"), instruction].join("\n");
+}
+/**
+ * Format distillations for injection into the message context.
+ *
+ * Observations are plain event-log text, so they are inserted as-is (trimmed)
+ * under markdown headers: entries with `generation > 0` go under "Earlier
+ * Work (summarized)", entries with `generation === 0` under "Recent Work
+ * (distilled)". A sub-header is emitted only when its group is non-empty, and
+ * all parts are separated by blank lines.
+ *
+ * @param distillations - Observation texts with their generation number.
+ * @returns The formatted section, or "" when the input is empty.
+ */
+export function formatDistillations(
+  distillations: Array<{
+    observations: string;
+    generation: number;
+  }>,
+): string {
+  if (distillations.length === 0) return "";
+  const parts: string[] = ["## Session History"];
+  const appendGroup = (
+    title: string,
+    belongs: (generation: number) => boolean,
+  ): void => {
+    const bodies = distillations
+      .filter((entry) => belongs(entry.generation))
+      .map((entry) => entry.observations.trim());
+    if (bodies.length) parts.push(title, ...bodies);
+  };
+  appendGroup("### Earlier Work (summarized)", (generation) => generation > 0);
+  appendGroup("### Recent Work (distilled)", (generation) => generation === 0);
+  return parts.join("\n\n");
+}
+/**
+ * Rough token estimate for a piece of text.
+ *
+ * Uses ~3 chars per token — validated as best heuristic against real API
+ * data — and rounds up.
+ *
+ * @param text - Text to measure (by `length`, i.e. UTF-16 code units).
+ * @returns Estimated token count; 0 for the empty string.
+ */
+function estimateTokens(text: string): number {
+  const charsPerToken = 3;
+  const estimate = text.length / charsPerToken;
+  return Math.ceil(estimate);
+}
+/**
+ * Render knowledge entries as a "Long-term Knowledge" markdown section, with
+ * one sub-heading and bullet list per category.
+ *
+ * Each bullet is "**title**: content"; title and content are passed through
+ * `inline` so they stay on one line. Categories appear in the order in which
+ * they are first seen, with the first letter upper-cased.
+ *
+ * @param entries - Entries to render. The budget logic assumes they arrive
+ *   sorted by descending confidence (see the comment in the body).
+ * @param maxTokens - Optional token budget. When given, entries are taken in
+ *   order and any entry that would push the estimated total over the budget is
+ *   skipped; later, smaller entries may still be included.
+ * @returns The serialized markdown, or "" when there are no entries or none
+ *   fits the budget.
+ */
+export function formatKnowledge(
+  entries: Array<{ category: string; title: string; content: string }>,
+  maxTokens?: number,
+): string {
+  if (!entries.length) return "";
+  // Apply token budget: walk the entries in order (already sorted by
+  // confidence DESC from the DB query) and keep each one that still fits.
+  // Overhead accounts for the section heading and per-entry markdown
+  // scaffolding.
+  let included = entries;
+  if (maxTokens !== undefined) {
+    const HEADER_OVERHEAD = 50; // "## Long-term Knowledge\n### Category\n"
+    let used = HEADER_OVERHEAD;
+    const fitting: typeof entries = [];
+    for (const e of entries) {
+      const cost = estimateTokens(e.title + e.content) + 10; // per-entry bullet overhead
+      if (used + cost > maxTokens) continue; // skip; keep trying smaller entries
+      fitting.push(e);
+      used += cost;
+    }
+    included = fitting;
+    if (!included.length) return "";
+  }
+  // A Map rather than a plain object: with `{}` a category named like an
+  // Object.prototype member ("constructor", "toString", "__proto__") resolves
+  // to the inherited value instead of undefined, and the push below throws.
+  const grouped = new Map<string, Array<{ title: string; content: string }>>();
+  for (const e of included) {
+    let group = grouped.get(e.category);
+    if (group === undefined) {
+      group = [];
+      grouped.set(e.category, group);
+    }
+    group.push(e);
+  }
+  const children: Root["children"] = [h(2, "Long-term Knowledge")];
+  for (const [category, items] of grouped) {
+    children.push(h(3, category.charAt(0).toUpperCase() + category.slice(1)));
+    children.push(
+      ul(
+        items.map((i) =>
+          liph(strong(inline(i.title)), t(": " + inline(i.content))),
+        ),
+      ),
+    );
+  }
+  return serialize(root(...children));
+}
+// ---------------------------------------------------------------------------
+// Query expansion (Phase 4)
+// ---------------------------------------------------------------------------
+/**
+ * System prompt for search query expansion.
+ *
+ * Asks the model for 2–3 alternative queries for a code knowledge base,
+ * returned as a bare JSON array of strings with no surrounding text.
+ */
+export const QUERY_EXPANSION_SYSTEM = `You are a search query expander for a code knowledge base. Given a search query, generate 2–3 alternative queries that would help find relevant results. Focus on:
+- Synonyms and related technical terms
+- Different phrasings of the same concept
+- Broader or narrower scopes
+Return ONLY a JSON array of strings. No explanation, no markdown.
+Example:
+Input: "SQLite FTS5 ranking"
+Output: ["full text search scoring SQLite", "BM25 relevance ranking database", "FTS5 match order by rank"]`;