npm - @agentmemory/agentmemory - Versions diffs - 0.7.0 → 0.7.3 - Mend

@agentmemory/agentmemory 0.7.0 → 0.7.3

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (218) hide show

package/AGENTS.md +2 -2
package/README.md +76 -82
package/dist/cli.mjs +99 -32
package/dist/cli.mjs.map +1 -1
package/dist/index.mjs +4 -2
package/dist/index.mjs.map +1 -1
package/dist/{src-QxitMPfJ.mjs → src-sYZDDbiA.mjs} +5 -3
package/dist/src-sYZDDbiA.mjs.map +1 -0
package/dist/standalone.mjs +1 -1
package/dist/standalone.mjs.map +1 -1
package/package.json +11 -1
package/plugin/.claude-plugin/plugin.json +1 -1
package/plugin/scripts/notification.d.mts +1 -0
package/plugin/scripts/notification.mjs.map +1 -0
package/plugin/scripts/post-tool-failure.d.mts +1 -0
package/plugin/scripts/post-tool-failure.mjs.map +1 -0
package/plugin/scripts/post-tool-use.d.mts +1 -0
package/plugin/scripts/post-tool-use.mjs.map +1 -0
package/plugin/scripts/pre-compact.d.mts +1 -0
package/plugin/scripts/pre-compact.mjs.map +1 -0
package/plugin/scripts/pre-tool-use.d.mts +1 -0
package/plugin/scripts/pre-tool-use.mjs.map +1 -0
package/plugin/scripts/prompt-submit.d.mts +1 -0
package/plugin/scripts/prompt-submit.mjs.map +1 -0
package/plugin/scripts/session-end.d.mts +1 -0
package/plugin/scripts/session-end.mjs.map +1 -0
package/plugin/scripts/session-start.d.mts +1 -0
package/plugin/scripts/session-start.mjs.map +1 -0
package/plugin/scripts/stop.d.mts +1 -0
package/plugin/scripts/stop.mjs.map +1 -0
package/plugin/scripts/subagent-start.d.mts +1 -0
package/plugin/scripts/subagent-start.mjs.map +1 -0
package/plugin/scripts/subagent-stop.d.mts +1 -0
package/plugin/scripts/subagent-stop.mjs.map +1 -0
package/plugin/scripts/task-completed.d.mts +1 -0
package/plugin/scripts/task-completed.mjs.map +1 -0
package/.claude-plugin/marketplace.json +0 -14
package/.github/workflows/ci.yml +0 -22
package/.github/workflows/publish.yml +0 -28
package/assets/banner.png +0 -0
package/assets/demo.gif +0 -0
package/assets/demo.mp4 +0 -0
package/benchmark/QUALITY.md +0 -73
package/benchmark/REAL-EMBEDDINGS.md +0 -67
package/benchmark/SCALE.md +0 -110
package/benchmark/dataset.ts +0 -293
package/benchmark/quality-eval.ts +0 -643
package/benchmark/real-embeddings-eval.ts +0 -405
package/benchmark/scale-eval.ts +0 -398
package/dist/src-QxitMPfJ.mjs.map +0 -1
package/src/auth.ts +0 -12
package/src/cli.ts +0 -159
package/src/config.ts +0 -221
package/src/eval/metrics-store.ts +0 -65
package/src/eval/quality.ts +0 -51
package/src/eval/schemas.ts +0 -124
package/src/eval/self-correct.ts +0 -28
package/src/eval/validator.ts +0 -31
package/src/functions/actions.ts +0 -288
package/src/functions/audit.ts +0 -61
package/src/functions/auto-forget.ts +0 -169
package/src/functions/branch-aware.ts +0 -169
package/src/functions/cascade.ts +0 -80
package/src/functions/checkpoints.ts +0 -209
package/src/functions/claude-bridge.ts +0 -161
package/src/functions/compress.ts +0 -194
package/src/functions/consolidate.ts +0 -212
package/src/functions/consolidation-pipeline.ts +0 -258
package/src/functions/context.ts +0 -169
package/src/functions/crystallize.ts +0 -293
package/src/functions/dedup.ts +0 -57
package/src/functions/diagnostics.ts +0 -785
package/src/functions/enrich.ts +0 -132
package/src/functions/evict.ts +0 -163
package/src/functions/export-import.ts +0 -508
package/src/functions/facets.ts +0 -248
package/src/functions/file-index.ts +0 -106
package/src/functions/flow-compress.ts +0 -214
package/src/functions/frontier.ts +0 -196
package/src/functions/governance.ts +0 -131
package/src/functions/graph-retrieval.ts +0 -277
package/src/functions/graph.ts +0 -275
package/src/functions/leases.ts +0 -216
package/src/functions/lessons.ts +0 -253
package/src/functions/mesh.ts +0 -434
package/src/functions/migrate.ts +0 -165
package/src/functions/observe.ts +0 -144
package/src/functions/obsidian-export.ts +0 -310
package/src/functions/patterns.ts +0 -138
package/src/functions/privacy.ts +0 -39
package/src/functions/profile.ts +0 -155
package/src/functions/query-expansion.ts +0 -186
package/src/functions/relations.ts +0 -237
package/src/functions/remember.ts +0 -162
package/src/functions/retention.ts +0 -235
package/src/functions/routines.ts +0 -289
package/src/functions/search.ts +0 -80
package/src/functions/sentinels.ts +0 -417
package/src/functions/signals.ts +0 -186
package/src/functions/sketches.ts +0 -274
package/src/functions/sliding-window.ts +0 -257
package/src/functions/smart-search.ts +0 -115
package/src/functions/snapshot.ts +0 -219
package/src/functions/summarize.ts +0 -155
package/src/functions/team.ts +0 -147
package/src/functions/temporal-graph.ts +0 -476
package/src/functions/timeline.ts +0 -138
package/src/functions/verify.ts +0 -117
package/src/health/monitor.ts +0 -110
package/src/health/thresholds.ts +0 -73
package/src/hooks/notification.ts +0 -52
package/src/hooks/post-tool-failure.ts +0 -58
package/src/hooks/post-tool-use.ts +0 -62
package/src/hooks/pre-compact.ts +0 -60
package/src/hooks/pre-tool-use.ts +0 -72
package/src/hooks/prompt-submit.ts +0 -46
package/src/hooks/session-end.ts +0 -71
package/src/hooks/session-start.ts +0 -48
package/src/hooks/stop.ts +0 -39
package/src/hooks/subagent-start.ts +0 -49
package/src/hooks/subagent-stop.ts +0 -54
package/src/hooks/task-completed.ts +0 -54
package/src/index.ts +0 -342
package/src/mcp/in-memory-kv.ts +0 -61
package/src/mcp/server.ts +0 -1455
package/src/mcp/standalone.ts +0 -177
package/src/mcp/tools-registry.ts +0 -769
package/src/mcp/transport.ts +0 -91
package/src/prompts/compression.ts +0 -67
package/src/prompts/consolidation.ts +0 -48
package/src/prompts/graph-extraction.ts +0 -35
package/src/prompts/summary.ts +0 -38
package/src/prompts/xml.ts +0 -26
package/src/providers/agent-sdk.ts +0 -34
package/src/providers/anthropic.ts +0 -35
package/src/providers/circuit-breaker.ts +0 -82
package/src/providers/embedding/cohere.ts +0 -46
package/src/providers/embedding/gemini.ts +0 -54
package/src/providers/embedding/index.ts +0 -39
package/src/providers/embedding/local.ts +0 -52
package/src/providers/embedding/openai.ts +0 -45
package/src/providers/embedding/openrouter.ts +0 -51
package/src/providers/embedding/voyage.ts +0 -46
package/src/providers/fallback-chain.ts +0 -31
package/src/providers/index.ts +0 -84
package/src/providers/openrouter.ts +0 -71
package/src/providers/resilient.ts +0 -37
package/src/state/hybrid-search.ts +0 -295
package/src/state/index-persistence.ts +0 -63
package/src/state/keyed-mutex.ts +0 -18
package/src/state/kv.ts +0 -33
package/src/state/schema.ts +0 -71
package/src/state/search-index.ts +0 -245
package/src/state/stemmer.ts +0 -104
package/src/state/synonyms.ts +0 -63
package/src/state/vector-index.ts +0 -130
package/src/telemetry/setup.ts +0 -116
package/src/triggers/api.ts +0 -1904
package/src/triggers/events.ts +0 -71
package/src/types.ts +0 -769
package/src/version.ts +0 -1
package/src/viewer/index.html +0 -2497
package/src/viewer/server.ts +0 -207
package/src/xenova.d.ts +0 -3
package/test/actions.test.ts +0 -490
package/test/audit.test.ts +0 -108
package/test/auto-forget.test.ts +0 -188
package/test/cascade.test.ts +0 -277
package/test/checkpoints.test.ts +0 -493
package/test/circuit-breaker.test.ts +0 -107
package/test/claude-bridge.test.ts +0 -178
package/test/confidence.test.ts +0 -247
package/test/consistency.test.ts +0 -61
package/test/consolidation-pipeline.test.ts +0 -251
package/test/crystallize.test.ts +0 -521
package/test/diagnostics.test.ts +0 -638
package/test/embedding-provider.test.ts +0 -49
package/test/enrich.test.ts +0 -209
package/test/eval.test.ts +0 -300
package/test/export-import.test.ts +0 -251
package/test/facets.test.ts +0 -448
package/test/fallback-chain.test.ts +0 -93
package/test/frontier.test.ts +0 -485
package/test/governance.test.ts +0 -147
package/test/graph-retrieval.test.ts +0 -186
package/test/graph.test.ts +0 -160
package/test/helpers/mocks.ts +0 -40
package/test/hybrid-search.test.ts +0 -145
package/test/index-persistence.test.ts +0 -124
package/test/integration.test.ts +0 -265
package/test/leases.test.ts +0 -399
package/test/mcp-prompts.test.ts +0 -218
package/test/mcp-resources.test.ts +0 -286
package/test/mcp-standalone.test.ts +0 -113
package/test/mesh.test.ts +0 -700
package/test/privacy.test.ts +0 -87
package/test/profile.test.ts +0 -161
package/test/query-expansion.test.ts +0 -154
package/test/relations.test.ts +0 -198
package/test/retention.test.ts +0 -245
package/test/routines.test.ts +0 -497
package/test/schema-fingerprint.test.ts +0 -81
package/test/schema.test.ts +0 -42
package/test/search-index.test.ts +0 -128
package/test/sentinels.test.ts +0 -626
package/test/signals.test.ts +0 -410
package/test/sketches.test.ts +0 -549
package/test/sliding-window.test.ts +0 -199
package/test/smart-search.test.ts +0 -169
package/test/snapshot.test.ts +0 -165
package/test/team.test.ts +0 -156
package/test/temporal-graph.test.ts +0 -378
package/test/timeline.test.ts +0 -148
package/test/vector-index.test.ts +0 -79
package/test/verify.test.ts +0 -209
package/test/xml.test.ts +0 -65
package/tsconfig.json +0 -22
package/tsdown.config.ts +0 -62

package/benchmark/scale-eval.ts DELETED Viewed

@@ -1,398 +0,0 @@
-import { SearchIndex } from "../src/state/search-index.js";
-import { VectorIndex } from "../src/state/vector-index.js";
-import { HybridSearch } from "../src/state/hybrid-search.js";
-import type { CompressedObservation } from "../src/types.js";
-import { generateScaleDataset, generateDataset } from "./dataset.js";
-import { writeFileSync } from "node:fs";
-function mockKV() {
-  const store = new Map<string, Map<string, unknown>>();
-  return {
-    get: async <T>(scope: string, key: string): Promise<T | null> =>
-      (store.get(scope)?.get(key) as T) ?? null,
-    set: async <T>(scope: string, key: string, data: T): Promise<T> => {
-      if (!store.has(scope)) store.set(scope, new Map());
-      store.get(scope)!.set(key, data);
-      return data;
-    },
-    delete: async (scope: string, key: string): Promise<void> => {
-      store.get(scope)?.delete(key);
-    },
-    list: async <T>(scope: string): Promise<T[]> => {
-      const entries = store.get(scope);
-      return entries ? (Array.from(entries.values()) as T[]) : [];
-    },
-  };
-}
-function deterministicEmbedding(text: string, dims = 384): Float32Array {
-  const arr = new Float32Array(dims);
-  const words = text.toLowerCase().split(/\W+/).filter(w => w.length > 2);
-  for (const word of words) {
-    for (let i = 0; i < word.length; i++) {
-      const idx = (word.charCodeAt(i) * 31 + i * 17) % dims;
-      arr[idx] += 1;
-      const idx2 = (word.charCodeAt(i) * 37 + i * 13 + word.length * 7) % dims;
-      arr[idx2] += 0.5;
-    }
-  }
-  const norm = Math.sqrt(arr.reduce((s, v) => s + v * v, 0));
-  if (norm > 0) for (let i = 0; i < dims; i++) arr[i] /= norm;
-  return arr;
-}
-function estimateTokens(text: string): number {
-  return Math.ceil(text.length / 4);
-}
-interface ScaleResult {
-  scale: number;
-  sessions: number;
-  index_build_ms: number;
-  index_build_per_doc_ms: number;
-  bm25_search_ms: number;
-  hybrid_search_ms: number;
-  index_size_kb: number;
-  vector_size_kb: number;
-  heap_mb: number;
-  builtin_tokens: number;
-  builtin_200line_tokens: number;
-  agentmemory_tokens: number;
-  token_savings_pct: number;
-  builtin_unreachable_pct: number;
-}
-interface CrossSessionResult {
-  query: string;
-  target_session: string;
-  current_session: string;
-  sessions_apart: number;
-  bm25_found: boolean;
-  bm25_rank: number;
-  hybrid_found: boolean;
-  hybrid_rank: number;
-  builtin_found: boolean;
-  latency_ms: number;
-}
-const SEARCH_QUERIES = [
-  "authentication middleware JWT",
-  "PostgreSQL connection pooling",
-  "Kubernetes pod crash",
-  "rate limiting API",
-  "Playwright E2E tests",
-  "Docker multi-stage build",
-  "Redis caching layer",
-  "CI/CD GitHub Actions",
-  "Prisma migration drift",
-  "monitoring Datadog alerts",
-];
-async function benchmarkScale(counts: number[]): Promise<ScaleResult[]> {
-  const results: ScaleResult[] = [];
-  for (const count of counts) {
-    console.log(`  Scale: ${count.toLocaleString()} observations...`);
-    const observations = generateScaleDataset(count);
-    const sessionCount = new Set(observations.map(o => o.sessionId)).size;
-    const heapBefore = process.memoryUsage().heapUsed;
-    const buildStart = performance.now();
-    const bm25 = new SearchIndex();
-    const vector = new VectorIndex();
-    const kv = mockKV();
-    const dims = 384;
-    for (const obs of observations) {
-      bm25.add(obs);
-      const text = [obs.title, obs.narrative, ...obs.concepts].join(" ");
-      vector.add(obs.id, obs.sessionId, deterministicEmbedding(text, dims));
-      await kv.set(`mem:obs:${obs.sessionId}`, obs.id, obs);
-    }
-    const buildMs = performance.now() - buildStart;
-    const heapAfter = process.memoryUsage().heapUsed;
-    const mockEmbed: any = {
-      name: "deterministic", dimensions: dims,
-      embed: async (t: string) => deterministicEmbedding(t, dims),
-      embedBatch: async (ts: string[]) => ts.map(t => deterministicEmbedding(t, dims)),
-    };
-    const hybrid = new HybridSearch(bm25, vector, mockEmbed, kv as never, 0.4, 0.6, 0);
-    let bm25Total = 0;
-    let hybridTotal = 0;
-    const iters = 20;
-    for (let i = 0; i < iters; i++) {
-      const q = SEARCH_QUERIES[i % SEARCH_QUERIES.length];
-      const s1 = performance.now();
-      bm25.search(q, 10);
-      bm25Total += performance.now() - s1;
-      const s2 = performance.now();
-      await hybrid.search(q, 10);
-      hybridTotal += performance.now() - s2;
-    }
-    const bm25Ser = bm25.serialize();
-    const vecSer = vector.serialize();
-    const allText = observations.map(o =>
-      `- ${o.title}: ${o.narrative.slice(0, 80)}... [${o.concepts.slice(0, 3).join(", ")}]`
-    ).join("\n");
-    const builtinTokens = estimateTokens(allText);
-    const truncatedText = observations.slice(0, 200).map(o =>
-      `- ${o.title}: ${o.narrative.slice(0, 60)}... [${o.concepts.slice(0, 3).join(", ")}]`
-    ).join("\n");
-    const builtin200Tokens = estimateTokens(truncatedText);
-    let totalResultTokens = 0;
-    for (let i = 0; i < iters; i++) {
-      const q = SEARCH_QUERIES[i % SEARCH_QUERIES.length];
-      const results = await hybrid.search(q, 10);
-      totalResultTokens += estimateTokens(JSON.stringify(results.map(r => r.observation)));
-    }
-    const agentmemoryTokens = Math.round(totalResultTokens / iters);
-    results.push({
-      scale: count,
-      sessions: sessionCount,
-      index_build_ms: Math.round(buildMs),
-      index_build_per_doc_ms: +(buildMs / count).toFixed(3),
-      bm25_search_ms: +(bm25Total / iters).toFixed(3),
-      hybrid_search_ms: +(hybridTotal / iters).toFixed(3),
-      index_size_kb: Math.round(Buffer.byteLength(bm25Ser, "utf-8") / 1024),
-      vector_size_kb: Math.round(Buffer.byteLength(vecSer, "utf-8") / 1024),
-      heap_mb: Math.round((heapAfter - heapBefore) / 1024 / 1024),
-      builtin_tokens: builtinTokens,
-      builtin_200line_tokens: builtin200Tokens,
-      agentmemory_tokens: agentmemoryTokens,
-      token_savings_pct: Math.round((1 - agentmemoryTokens / builtinTokens) * 100),
-      builtin_unreachable_pct: count <= 200 ? 0 : Math.round((1 - 200 / count) * 100),
-    });
-  }
-  return results;
-}
-async function benchmarkCrossSession(): Promise<CrossSessionResult[]> {
-  const { observations } = generateDataset();
-  const results: CrossSessionResult[] = [];
-  const bm25 = new SearchIndex();
-  const kv = mockKV();
-  const vector = new VectorIndex();
-  const dims = 384;
-  for (const obs of observations) {
-    bm25.add(obs);
-    const text = [obs.title, obs.narrative, ...obs.concepts].join(" ");
-    vector.add(obs.id, obs.sessionId, deterministicEmbedding(text, dims));
-    await kv.set(`mem:obs:${obs.sessionId}`, obs.id, obs);
-  }
-  const mockEmbed: any = {
-    name: "deterministic", dimensions: dims,
-    embed: async (t: string) => deterministicEmbedding(t, dims),
-    embedBatch: async (ts: string[]) => ts.map(t => deterministicEmbedding(t, dims)),
-  };
-  const hybrid = new HybridSearch(bm25, vector, mockEmbed, kv as never, 0.4, 0.6, 0);
-  const crossQueries: Array<{
-    query: string;
-    targetConcepts: string[];
-    targetSessionRange: [number, number];
-    currentSession: number;
-  }> = [
-    { query: "How did we set up OAuth providers?", targetConcepts: ["oauth", "nextauth"], targetSessionRange: [5, 9], currentSession: 29 },
-    { query: "What was the N+1 query fix?", targetConcepts: ["n+1", "eager-loading"], targetSessionRange: [10, 14], currentSession: 28 },
-    { query: "PostgreSQL full-text search setup", targetConcepts: ["full-text-search", "tsvector"], targetSessionRange: [10, 14], currentSession: 27 },
-    { query: "bcrypt password hashing configuration", targetConcepts: ["bcrypt", "password-hashing"], targetSessionRange: [5, 9], currentSession: 25 },
-    { query: "Vitest unit testing setup", targetConcepts: ["vitest", "unit-testing"], targetSessionRange: [20, 24], currentSession: 29 },
-    { query: "webhook retry exponential backoff", targetConcepts: ["webhooks", "exponential-backoff"], targetSessionRange: [15, 19], currentSession: 29 },
-    { query: "ESLint flat config migration", targetConcepts: ["eslint", "linting"], targetSessionRange: [0, 4], currentSession: 29 },
-    { query: "Kubernetes HPA autoscaling configuration", targetConcepts: ["hpa", "autoscaling", "kubernetes"], targetSessionRange: [25, 29], currentSession: 29 },
-    { query: "Prisma database seed script", targetConcepts: ["seeding", "faker", "prisma"], targetSessionRange: [10, 14], currentSession: 26 },
-    { query: "API cursor-based pagination", targetConcepts: ["cursor-based", "pagination"], targetSessionRange: [15, 19], currentSession: 29 },
-    { query: "CSRF protection double-submit cookie", targetConcepts: ["csrf", "cookies"], targetSessionRange: [5, 9], currentSession: 29 },
-    { query: "blue-green deployment rollback", targetConcepts: ["blue-green", "rollback", "zero-downtime"], targetSessionRange: [25, 29], currentSession: 29 },
-  ];
-  for (const cq of crossQueries) {
-    const targetObs = observations.filter(o =>
-      o.concepts.some(c => cq.targetConcepts.includes(c))
-    );
-    const targetIds = new Set(targetObs.map(o => o.id));
-    const start = performance.now();
-    const bm25Results = bm25.search(cq.query, 20);
-    const hybridResults = await hybrid.search(cq.query, 20);
-    const latency = performance.now() - start;
-    const bm25Rank = bm25Results.findIndex(r => targetIds.has(r.obsId));
-    const hybridRank = hybridResults.findIndex(r => targetIds.has(r.observation.id));
-    const builtinLines = 200;
-    const visibleObs = observations.slice(0, builtinLines);
-    const builtinFound = visibleObs.some(o => targetIds.has(o.id));
-    const sessionsApart = cq.currentSession - cq.targetSessionRange[0];
-    results.push({
-      query: cq.query,
-      target_session: `ses_${cq.targetSessionRange[0].toString().padStart(3, "0")}-${cq.targetSessionRange[1].toString().padStart(3, "0")}`,
-      current_session: `ses_${cq.currentSession.toString().padStart(3, "0")}`,
-      sessions_apart: sessionsApart,
-      bm25_found: bm25Rank >= 0,
-      bm25_rank: bm25Rank >= 0 ? bm25Rank + 1 : -1,
-      hybrid_found: hybridRank >= 0,
-      hybrid_rank: hybridRank >= 0 ? hybridRank + 1 : -1,
-      builtin_found: builtinFound,
-      latency_ms: latency,
-    });
-  }
-  return results;
-}
-function generateReport(scale: ScaleResult[], cross: CrossSessionResult[]): string {
-  const lines: string[] = [];
-  const w = (s: string) => lines.push(s);
-  w("# agentmemory v0.6.0 — Scale & Cross-Session Evaluation");
-  w("");
-  w(`**Date:** ${new Date().toISOString()}`);
-  w(`**Platform:** ${process.platform} ${process.arch}, Node ${process.version}`);
-  w("");
-  w("## 1. Scale: agentmemory vs Built-in Memory");
-  w("");
-  w("Every built-in agent memory (CLAUDE.md, .cursorrules, Cline's memory-bank) loads ALL memory into context every session. agentmemory searches and returns only relevant results.");
-  w("");
-  w("| Observations | Sessions | Index Build | BM25 Search | Hybrid Search | Heap | Context Tokens (built-in) | Context Tokens (agentmemory) | Savings | Built-in Unreachable |");
-  w("|-------------|----------|------------|-------------|---------------|------|--------------------------|-----------------------------|---------|--------------------|");
-  for (const r of scale) {
-    w(`| ${r.scale.toLocaleString()} | ${r.sessions} | ${r.index_build_ms}ms | ${r.bm25_search_ms}ms | ${r.hybrid_search_ms}ms | ${r.heap_mb}MB | ${r.builtin_tokens.toLocaleString()} | ${r.agentmemory_tokens.toLocaleString()} | ${r.token_savings_pct}% | ${r.builtin_unreachable_pct}% |`);
-  }
-  w("");
-  w("### What the numbers mean");
-  w("");
-  w("**Context Tokens (built-in):** How many tokens Claude Code/Cursor/Cline would consume loading ALL memory into the context window. At 5,000 observations, this is ~250K tokens — exceeding most context windows entirely.");
-  w("");
-  w("**Context Tokens (agentmemory):** How many tokens the top-10 search results consume. Stays constant regardless of corpus size.");
-  w("");
-  w("**Built-in Unreachable:** Percentage of memories that built-in systems CANNOT access because they exceed the 200-line MEMORY.md cap or context window limits. At 1,000 observations, 80% of your project history is invisible.");
-  w("");
-  w("### Storage Costs");
-  w("");
-  w("| Observations | BM25 Index | Vector Index (d=384) | Total Storage |");
-  w("|-------------|-----------|---------------------|---------------|");
-  for (const r of scale) {
-    const total = r.index_size_kb + r.vector_size_kb;
-    w(`| ${r.scale.toLocaleString()} | ${r.index_size_kb.toLocaleString()} KB | ${r.vector_size_kb.toLocaleString()} KB | ${(total / 1024).toFixed(1)} MB |`);
-  }
-  w("");
-  w("## 2. Cross-Session Retrieval");
-  w("");
-  w("Can the system find relevant information from past sessions? This is impossible for built-in memory once observations exceed the line/context cap.");
-  w("");
-  w("| Query | Target Session | Gap | BM25 Found | BM25 Rank | Hybrid Found | Hybrid Rank | Built-in Visible |");
-  w("|-------|---------------|-----|-----------|-----------|-------------|-------------|-----------------|");
-  for (const r of cross) {
-    w(`| ${r.query.slice(0, 40)}${r.query.length > 40 ? "..." : ""} | ${r.target_session} | ${r.sessions_apart} | ${r.bm25_found ? "Yes" : "No"} | ${r.bm25_rank > 0 ? `#${r.bm25_rank}` : "-"} | ${r.hybrid_found ? "Yes" : "No"} | ${r.hybrid_rank > 0 ? `#${r.hybrid_rank}` : "-"} | ${r.builtin_found ? "Yes" : "No"} |`);
-  }
-  const bm25Found = cross.filter(r => r.bm25_found).length;
-  const hybridFound = cross.filter(r => r.hybrid_found).length;
-  const builtinFound = cross.filter(r => r.builtin_found).length;
-  w("");
-  w(`**Summary:** agentmemory BM25 found ${bm25Found}/${cross.length} cross-session queries. Hybrid found ${hybridFound}/${cross.length}. Built-in memory (200-line cap) could only reach ${builtinFound}/${cross.length}.`);
-  w("");
-  w("## 3. The Context Window Problem");
-  w("");
-  w("```");
-  w("Agent context window: ~200K tokens");
-  w("System prompt + tools:  ~20K tokens");
-  w("User conversation:      ~30K tokens");
-  w("Available for memory:  ~150K tokens");
-  w("");
-  w("At 50 tokens/observation:");
-  w("  200 observations  =  10,000 tokens  (fits, but 200-line cap hits first)");
-  w("  1,000 observations =  50,000 tokens  (33% of available budget)");
-  w("  5,000 observations = 250,000 tokens  (EXCEEDS total context window)");
-  w("");
-  w("agentmemory top-10 results:");
-  w(`  Any corpus size     =  ~${scale[0]?.agentmemory_tokens.toLocaleString() || "500"} tokens  (0.3% of budget)`);
-  w("```");
-  w("");
-  w("## 4. What Built-in Memory Cannot Do");
-  w("");
-  w("| Capability | Built-in (CLAUDE.md) | agentmemory |");
-  w("|-----------|---------------------|-------------|");
-  w("| Semantic search | No (keyword grep only) | BM25 + vector + graph |");
-  w("| Scale beyond 200 lines | No (hard cap) | Unlimited |");
-  w("| Cross-session recall | Only if in 200-line window | Full corpus search |");
-  w("| Cross-agent sharing | No (per-agent files) | MCP + REST API |");
-  w("| Multi-agent coordination | No | Leases, signals, actions |");
-  w("| Temporal queries | No | Point-in-time graph |");
-  w("| Memory lifecycle | No (manual pruning) | Ebbinghaus decay + eviction |");
-  w("| Knowledge graph | No | Entity extraction + traversal |");
-  w("| Query expansion | No | LLM-generated reformulations |");
-  w("| Retention scoring | No | Time-frequency decay model |");
-  w("| Real-time dashboard | No (read files manually) | Viewer on :3113 |");
-  w("| Concurrent access | No (file lock) | Keyed mutex + KV store |");
-  w("");
-  w("## 5. When to Use What");
-  w("");
-  w("**Use built-in memory (CLAUDE.md) when:**");
-  w("- You have < 200 items to remember");
-  w("- Single agent, single project");
-  w("- Preferences and quick facts only");
-  w("- Zero setup is the priority");
-  w("");
-  w("**Use agentmemory when:**");
-  w("- Project history exceeds 200 observations");
-  w("- You need to recall specific incidents from weeks ago");
-  w("- Multiple agents work on the same codebase");
-  w("- You want semantic search (\"how does auth work?\") not just keyword matching");
-  w("- You need to track memory quality, decay, and lifecycle");
-  w("- You want a shared memory layer across Claude Code, Cursor, Windsurf, etc.");
-  w("");
-  w("Built-in memory is your sticky notes. agentmemory is the searchable database behind them.");
-  w("");
-  w("---");
-  w(`*Scale tests: ${scale.length} corpus sizes. Cross-session tests: ${cross.length} queries targeting specific past sessions.*`);
-  return lines.join("\n");
-}
-async function main() {
-  console.log("=== agentmemory Scale & Cross-Session Evaluation ===\n");
-  console.log("1. Scale benchmarks...");
-  const scaleResults = await benchmarkScale([240, 1_000, 5_000, 10_000, 50_000]);
-  console.log("\n2. Cross-session retrieval...");
-  const crossResults = await benchmarkCrossSession();
-  console.log("");
-  const report = generateReport(scaleResults, crossResults);
-  writeFileSync("benchmark/SCALE.md", report);
-  console.log(report);
-  console.log(`\nReport written to benchmark/SCALE.md`);
-}
-main().catch(console.error);