npm - @teammates/recall - Versions diffs - 0.6.1 → 0.6.3 - Mend

@teammates/recall 0.6.1 → 0.6.3

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (15)

package/dist/cli.js +23 -23
package/dist/index.d.ts +1 -1
package/dist/query-expansion.js +136 -15
package/package.json +1 -1
package/src/cli.test.ts +324 -324
package/src/cli.ts +407 -407
package/src/embeddings.ts +56 -56
package/src/index.ts +11 -11
package/src/indexer.test.ts +337 -337
package/src/indexer.ts +260 -260
package/src/memory-index.ts +3 -1
package/src/query-expansion.test.ts +9 -3
package/src/query-expansion.ts +136 -15
package/src/search.test.ts +3 -9
package/src/search.ts +244 -244

package/src/query-expansion.ts CHANGED Viewed

@@ -7,21 +7,142 @@
 /** Common English stopwords to filter from queries. */
 const STOPWORDS = new Set([
-  "a", "an", "the", "and", "or", "but", "in", "on", "at", "to", "for",
-  "of", "with", "by", "from", "is", "are", "was", "were", "be", "been",
-  "being", "have", "has", "had", "do", "does", "did", "will", "would",
-  "could", "should", "may", "might", "shall", "can", "need", "must",
-  "it", "its", "this", "that", "these", "those", "i", "you", "he", "she",
-  "we", "they", "me", "him", "her", "us", "them", "my", "your", "his",
-  "our", "their", "what", "which", "who", "whom", "where", "when", "how",
-  "why", "if", "then", "so", "not", "no", "just", "also", "very", "too",
-  "some", "any", "all", "each", "every", "both", "few", "more", "most",
-  "other", "into", "over", "after", "before", "between", "through",
-  "about", "up", "out", "off", "down", "here", "there", "again", "once",
-  "let", "lets", "let's", "get", "got", "go", "going", "make", "made",
-  "take", "took", "come", "came", "see", "saw", "know", "knew", "think",
-  "thought", "say", "said", "tell", "told", "ask", "asked", "want",
-  "wanted", "like", "look", "use", "used", "find", "give", "work",
+  "a",
+  "an",
+  "the",
+  "and",
+  "or",
+  "but",
+  "in",
+  "on",
+  "at",
+  "to",
+  "for",
+  "of",
+  "with",
+  "by",
+  "from",
+  "is",
+  "are",
+  "was",
+  "were",
+  "be",
+  "been",
+  "being",
+  "have",
+  "has",
+  "had",
+  "do",
+  "does",
+  "did",
+  "will",
+  "would",
+  "could",
+  "should",
+  "may",
+  "might",
+  "shall",
+  "can",
+  "need",
+  "must",
+  "it",
+  "its",
+  "this",
+  "that",
+  "these",
+  "those",
+  "i",
+  "you",
+  "he",
+  "she",
+  "we",
+  "they",
+  "me",
+  "him",
+  "her",
+  "us",
+  "them",
+  "my",
+  "your",
+  "his",
+  "our",
+  "their",
+  "what",
+  "which",
+  "who",
+  "whom",
+  "where",
+  "when",
+  "how",
+  "why",
+  "if",
+  "then",
+  "so",
+  "not",
+  "no",
+  "just",
+  "also",
+  "very",
+  "too",
+  "some",
+  "any",
+  "all",
+  "each",
+  "every",
+  "both",
+  "few",
+  "more",
+  "most",
+  "other",
+  "into",
+  "over",
+  "after",
+  "before",
+  "between",
+  "through",
+  "about",
+  "up",
+  "out",
+  "off",
+  "down",
+  "here",
+  "there",
+  "again",
+  "once",
+  "let",
+  "lets",
+  "let's",
+  "get",
+  "got",
+  "go",
+  "going",
+  "make",
+  "made",
+  "take",
+  "took",
+  "come",
+  "came",
+  "see",
+  "saw",
+  "know",
+  "knew",
+  "think",
+  "thought",
+  "say",
+  "said",
+  "tell",
+  "told",
+  "ask",
+  "asked",
+  "want",
+  "wanted",
+  "like",
+  "look",
+  "use",
+  "used",
+  "find",
+  "give",
+  "work",
 ]);
 /**

package/src/search.test.ts CHANGED Viewed

@@ -3,8 +3,8 @@ import { tmpdir } from "node:os";
 import { join } from "node:path";
 import { afterEach, beforeEach, describe, expect, it, vi } from "vitest";
 import { Indexer } from "./indexer.js";
-import { classifyUri, multiSearch, search } from "./search.js";
 import type { SearchResult } from "./search.js";
+import { classifyUri, multiSearch, search } from "./search.js";
 // Deterministic stub embeddings based on text content
 function stubCreateEmbeddings(inputs: string | string[]) {
@@ -138,10 +138,7 @@ describe("search", () => {
       join(weeklyDir, "2026-W11.md"),
       "# Week 11\nWorked on indexer.",
     );
-    await writeFile(
-      join(weeklyDir, "2026-W09.md"),
-      "# Week 9\nOld stuff.",
-    );
+    await writeFile(join(weeklyDir, "2026-W09.md"), "# Week 9\nOld stuff.");
     const results = await search("anything", {
       teammatesDir: testDir,
@@ -162,10 +159,7 @@ describe("search", () => {
     const weeklyDir = join(beacon, "memory", "weekly");
     await mkdir(weeklyDir, { recursive: true });
     await writeFile(join(beacon, "SOUL.md"), "# Beacon");
-    await writeFile(
-      join(weeklyDir, "2026-W11.md"),
-      "# Week 11\nContent here.",
-    );
+    await writeFile(join(weeklyDir, "2026-W11.md"), "# Week 11\nContent here.");
     const results = await search("anything", {
       teammatesDir: testDir,

package/src/search.ts CHANGED Viewed

@@ -1,244 +1,244 @@
-import * as fs from "node:fs/promises";
-import * as path from "node:path";
-import { LocalDocumentIndex } from "vectra";
-import { LocalEmbeddings } from "./embeddings.js";
-import { Indexer } from "./indexer.js";
-export interface SearchOptions {
-  /** Path to the .teammates directory */
-  teammatesDir: string;
-  /** Teammate name to search (searches all if omitted) */
-  teammate?: string;
-  /** Max results per teammate (default: 5) */
-  maxResults?: number;
-  /** Max chunks per document (default: 3) */
-  maxChunks?: number;
-  /** Max tokens per section (default: 500) */
-  maxTokens?: number;
-  /** Embedding model name */
-  model?: string;
-  /** Skip auto-sync before searching (default: false) */
-  skipSync?: boolean;
-  /** Number of recent weekly summaries to always include (default: 2) */
-  recencyDepth?: number;
-  /** Relevance boost multiplier for typed memories over episodic summaries (default: 1.2) */
-  typedMemoryBoost?: number;
-}
-/** Options for multi-query search with deduplication. */
-export interface MultiSearchOptions extends SearchOptions {
-  /** Additional queries beyond the primary (keyword-focused, conversation-derived, etc.) */
-  additionalQueries?: string[];
-  /** Pre-matched memory catalog results to merge into the final set */
-  catalogMatches?: SearchResult[];
-}
-export interface SearchResult {
-  teammate: string;
-  uri: string;
-  text: string;
-  score: number;
-  /** Content type: "typed_memory", "weekly", "monthly", or "other" */
-  contentType?: string;
-}
-/**
- * Classify a URI into a content type for priority scoring.
- */
-export function classifyUri(uri: string): string {
-  if (uri.includes("/memory/weekly/")) return "weekly";
-  if (uri.includes("/memory/monthly/")) return "monthly";
-  // Typed memories are in memory/ but not daily logs (YYYY-MM-DD) and not in subdirs
-  const memoryMatch = uri.match(/\/memory\/([^/]+)\.md$/);
-  if (memoryMatch) {
-    const stem = memoryMatch[1];
-    if (/^\d{4}-\d{2}-\d{2}$/.test(stem)) return "daily";
-    return "typed_memory";
-  }
-  return "other";
-}
-/**
- * Search teammate memories using multi-pass retrieval.
- *
- * Pass 1 (Recency): Always returns the N most recent weekly summaries.
- * Pass 2 (Semantic): Query-driven search across all indexed content.
- * Results are merged, deduped, and typed memories get a relevance boost.
- */
-export async function search(
-  query: string,
-  options: SearchOptions,
-): Promise<SearchResult[]> {
-  const embeddings = new LocalEmbeddings(options.model);
-  const indexer = new Indexer({
-    teammatesDir: options.teammatesDir,
-    model: options.model,
-  });
-  const maxResults = options.maxResults ?? 5;
-  const maxChunks = options.maxChunks ?? 3;
-  const maxTokens = options.maxTokens ?? 500;
-  const recencyDepth = options.recencyDepth ?? 2;
-  const typedMemoryBoost = options.typedMemoryBoost ?? 1.2;
-  // Auto-sync: upsert any new/changed files before searching
-  if (!options.skipSync) {
-    if (options.teammate) {
-      await indexer.syncTeammate(options.teammate);
-    } else {
-      await indexer.syncAll();
-    }
-  }
-  // Determine which teammates to search
-  let teammates: string[];
-  if (options.teammate) {
-    teammates = [options.teammate];
-  } else {
-    teammates = await indexer.discoverTeammates();
-  }
-  const allResults: SearchResult[] = [];
-  const seenUris = new Set<string>();
-  // ── Pass 1: Recency (recent weekly summaries, always included) ───
-  for (const teammate of teammates) {
-    const weeklyDir = path.join(
-      options.teammatesDir,
-      teammate,
-      "memory",
-      "weekly",
-    );
-    try {
-      const entries = await fs.readdir(weeklyDir);
-      const weeklyFiles = entries
-        .filter((e) => e.endsWith(".md"))
-        .sort()
-        .reverse()
-        .slice(0, recencyDepth);
-      for (const file of weeklyFiles) {
-        const uri = `${teammate}/memory/weekly/${file}`;
-        const text = await fs.readFile(path.join(weeklyDir, file), "utf-8");
-        if (text.trim().length === 0) continue;
-        seenUris.add(uri);
-        allResults.push({
-          teammate,
-          uri,
-          text: text.slice(0, maxTokens * 4), // rough token estimate
-          score: 0.9, // high base score for recency results
-          contentType: "weekly",
-        });
-      }
-    } catch {
-      // No weekly/ directory for this teammate
-    }
-  }
-  // ── Pass 2: Semantic (query-driven across all indexed content) ───
-  for (const teammate of teammates) {
-    const indexPath = indexer.indexPath(teammate);
-    try {
-      await fs.access(indexPath);
-    } catch {
-      continue;
-    }
-    const index = new LocalDocumentIndex({
-      folderPath: indexPath,
-      embeddings,
-    });
-    if (!(await index.isIndexCreated())) continue;
-    const docs = await index.queryDocuments(query, {
-      maxDocuments: maxResults,
-      maxChunks,
-    });
-    for (const doc of docs) {
-      if (seenUris.has(doc.uri)) continue; // dedup with recency pass
-      seenUris.add(doc.uri);
-      const sections = await doc.renderSections(maxTokens, 1);
-      const contentType = classifyUri(doc.uri);
-      for (const section of sections) {
-        let score = section.score;
-        // Apply type-based priority boost for typed memories
-        if (contentType === "typed_memory") {
-          score *= typedMemoryBoost;
-        }
-        allResults.push({
-          teammate,
-          uri: doc.uri,
-          text: section.text,
-          score,
-          contentType,
-        });
-      }
-    }
-  }
-  // Sort by score descending, return top results
-  allResults.sort((a, b) => b.score - a.score);
-  return allResults.slice(0, maxResults + recencyDepth); // allow extra slots for recency results
-}
-/**
- * Multi-query search with deduplication and catalog merge.
- *
- * Fires the primary query plus any additional queries (keyword-focused,
- * conversation-derived) and merges results. Catalog matches (from frontmatter
- * text matching) are also merged. Deduplication is by URI — when the same
- * URI appears from multiple queries, the highest score wins.
- */
-export async function multiSearch(
-  primaryQuery: string,
-  options: MultiSearchOptions,
-): Promise<SearchResult[]> {
-  const additionalQueries = options.additionalQueries ?? [];
-  const catalogMatches = options.catalogMatches ?? [];
-  const maxResults = options.maxResults ?? 5;
-  const recencyDepth = options.recencyDepth ?? 2;
-  // Fire all queries — primary gets full treatment (recency pass + semantic)
-  // Additional queries get semantic only (skipRecency to avoid duplicate weeklies)
-  const primaryResults = await search(primaryQuery, options);
-  // Collect all results keyed by URI, keeping highest score
-  const bestByUri = new Map<string, SearchResult>();
-  for (const r of primaryResults) {
-    const existing = bestByUri.get(r.uri);
-    if (!existing || r.score > existing.score) {
-      bestByUri.set(r.uri, r);
-    }
-  }
-  // Fire additional queries (reuse same search options minus recency to avoid dupes)
-  for (const query of additionalQueries) {
-    const results = await search(query, {
-      ...options,
-      recencyDepth: 0, // primary already got the weekly summaries
-    });
-    for (const r of results) {
-      const existing = bestByUri.get(r.uri);
-      if (!existing || r.score > existing.score) {
-        bestByUri.set(r.uri, r);
-      }
-    }
-  }
-  // Merge catalog matches (frontmatter text-matched results)
-  for (const r of catalogMatches) {
-    const existing = bestByUri.get(r.uri);
-    if (!existing || r.score > existing.score) {
-      bestByUri.set(r.uri, r);
-    }
-  }
-  // Sort by score descending, return top results
-  const merged = [...bestByUri.values()];
-  merged.sort((a, b) => b.score - a.score);
-  return merged.slice(0, maxResults + recencyDepth);
-}
+import * as fs from "node:fs/promises";
+import * as path from "node:path";
+import { LocalDocumentIndex } from "vectra";
+import { LocalEmbeddings } from "./embeddings.js";
+import { Indexer } from "./indexer.js";
+export interface SearchOptions {
+  /** Path to the .teammates directory */
+  teammatesDir: string;
+  /** Teammate name to search (searches all if omitted) */
+  teammate?: string;
+  /** Max documents queried per teammate; the returned list is capped at maxResults + recencyDepth overall (default: 5) */
+  maxResults?: number;
+  /** Max chunks per document (default: 3) */
+  maxChunks?: number;
+  /** Max tokens per rendered section; recency-pass text is cut to maxTokens * 4 characters as a rough estimate (default: 500) */
+  maxTokens?: number;
+  /** Embedding model name */
+  model?: string;
+  /** Skip auto-sync before searching (default: false) */
+  skipSync?: boolean;
+  /** Number of recent weekly summaries per teammate added by the recency pass; 0 disables that pass (default: 2) */
+  recencyDepth?: number;
+  /** Score multiplier applied to results classified as "typed_memory" (default: 1.2) */
+  typedMemoryBoost?: number;
+}
+/** Options for multiSearch: everything in SearchOptions plus extra queries and catalog matches to merge. */
+export interface MultiSearchOptions extends SearchOptions {
+  /** Additional queries beyond the primary (keyword-focused, conversation-derived, etc.); each runs with recencyDepth forced to 0 */
+  additionalQueries?: string[];
+  /** Pre-matched memory catalog results to merge into the final set (deduplicated by URI, highest score wins) */
+  catalogMatches?: SearchResult[];
+}
+export interface SearchResult {
+  teammate: string;
+  uri: string;
+  text: string;
+  score: number;
+  /** Content type as produced by classifyUri: "typed_memory", "weekly", "monthly", "daily", or "other" */
+  contentType?: string;
+}
+/**
+ * Classify a URI into a content type ("weekly", "monthly", "daily", "typed_memory", or "other") for priority scoring.
+ */
+export function classifyUri(uri: string): string {
+  if (uri.includes("/memory/weekly/")) return "weekly";
+  if (uri.includes("/memory/monthly/")) return "monthly";
+  // A .md file directly under memory/ (no subdirectory): a YYYY-MM-DD stem is a daily log, any other stem is a typed memory
+  const memoryMatch = uri.match(/\/memory\/([^/]+)\.md$/);
+  if (memoryMatch) {
+    const stem = memoryMatch[1];
+    if (/^\d{4}-\d{2}-\d{2}$/.test(stem)) return "daily";
+    return "typed_memory";
+  }
+  return "other";
+}
+/**
+ * Search teammate memories using multi-pass retrieval.
+ *
+ * Pass 1 (Recency): Adds the N most recent non-empty weekly summaries per teammate at a fixed score of 0.9.
+ * Pass 2 (Semantic): Query-driven search across all indexed content, skipping URIs already added by pass 1.
+ * Results are merged, typed memories get a relevance boost, and the list is sorted by score and cut to maxResults + recencyDepth.
+ */
+export async function search(
+  query: string,
+  options: SearchOptions,
+): Promise<SearchResult[]> {
+  const embeddings = new LocalEmbeddings(options.model);
+  const indexer = new Indexer({
+    teammatesDir: options.teammatesDir,
+    model: options.model,
+  });
+  const maxResults = options.maxResults ?? 5;
+  const maxChunks = options.maxChunks ?? 3;
+  const maxTokens = options.maxTokens ?? 500;
+  const recencyDepth = options.recencyDepth ?? 2;
+  const typedMemoryBoost = options.typedMemoryBoost ?? 1.2;
+  // Auto-sync: upsert any new/changed files before searching
+  if (!options.skipSync) {
+    if (options.teammate) {
+      await indexer.syncTeammate(options.teammate);
+    } else {
+      await indexer.syncAll();
+    }
+  }
+  // Determine which teammates to search
+  let teammates: string[];
+  if (options.teammate) {
+    teammates = [options.teammate];
+  } else {
+    teammates = await indexer.discoverTeammates();
+  }
+  const allResults: SearchResult[] = [];
+  const seenUris = new Set<string>();
+  // ── Pass 1: Recency (recent weekly summaries; NOTE(review): the final sort + slice can still drop them) ───
+  for (const teammate of teammates) {
+    const weeklyDir = path.join(
+      options.teammatesDir,
+      teammate,
+      "memory",
+      "weekly",
+    );
+    try {
+      const entries = await fs.readdir(weeklyDir);
+      const weeklyFiles = entries
+        .filter((e) => e.endsWith(".md"))
+        .sort()
+        .reverse()
+        .slice(0, recencyDepth);
+      for (const file of weeklyFiles) {
+        const uri = `${teammate}/memory/weekly/${file}`;
+        const text = await fs.readFile(path.join(weeklyDir, file), "utf-8");
+        if (text.trim().length === 0) continue;
+        seenUris.add(uri);
+        allResults.push({
+          teammate,
+          uri,
+          text: text.slice(0, maxTokens * 4), // rough token estimate
+          score: 0.9, // high base score for recency results
+          contentType: "weekly",
+        });
+      }
+    } catch {
+      // Most likely no weekly/ directory for this teammate; any readdir/readFile error is ignored here
+    }
+  }
+  // ── Pass 2: Semantic (query-driven across all indexed content) ───
+  for (const teammate of teammates) {
+    const indexPath = indexer.indexPath(teammate);
+    try {
+      await fs.access(indexPath);
+    } catch {
+      continue; // index path not accessible: skip this teammate
+    }
+    const index = new LocalDocumentIndex({
+      folderPath: indexPath,
+      embeddings,
+    });
+    if (!(await index.isIndexCreated())) continue;
+    const docs = await index.queryDocuments(query, {
+      maxDocuments: maxResults,
+      maxChunks,
+    });
+    for (const doc of docs) {
+      if (seenUris.has(doc.uri)) continue; // dedup with recency pass (assumes index URIs use the same "<teammate>/memory/..." form — TODO confirm)
+      seenUris.add(doc.uri);
+      const sections = await doc.renderSections(maxTokens, 1);
+      const contentType = classifyUri(doc.uri);
+      for (const section of sections) {
+        let score = section.score;
+        // Apply type-based priority boost for typed memories
+        if (contentType === "typed_memory") {
+          score *= typedMemoryBoost;
+        }
+        allResults.push({
+          teammate,
+          uri: doc.uri,
+          text: section.text,
+          score,
+          contentType,
+        });
+      }
+    }
+  }
+  // Sort by score descending, return top results
+  allResults.sort((a, b) => b.score - a.score);
+  return allResults.slice(0, maxResults + recencyDepth); // allow extra slots for recency results
+}
+/**
+ * Multi-query search with deduplication and catalog merge.
+ *
+ * Fires the primary query plus any additional queries (keyword-focused,
+ * conversation-derived) and merges results. Catalog matches (from frontmatter
+ * text matching) are also merged. Deduplication is by URI — when the same
+ * URI appears from multiple queries, the highest score wins; the merged list is sorted by score and cut to maxResults + recencyDepth.
+ */
+export async function multiSearch(
+  primaryQuery: string,
+  options: MultiSearchOptions,
+): Promise<SearchResult[]> {
+  const additionalQueries = options.additionalQueries ?? [];
+  const catalogMatches = options.catalogMatches ?? [];
+  const maxResults = options.maxResults ?? 5;
+  const recencyDepth = options.recencyDepth ?? 2;
+  // Fire all queries — primary gets full treatment (recency pass + semantic)
+  // Additional queries get semantic only (recencyDepth: 0 to avoid duplicate weeklies)
+  const primaryResults = await search(primaryQuery, options);
+  // Collect all results keyed by URI, keeping highest score
+  const bestByUri = new Map<string, SearchResult>();
+  for (const r of primaryResults) {
+    const existing = bestByUri.get(r.uri);
+    if (!existing || r.score > existing.score) {
+      bestByUri.set(r.uri, r);
+    }
+  }
+  // Fire additional queries (same options minus recency to avoid dupes; each call re-runs auto-sync unless skipSync is set)
+  for (const query of additionalQueries) {
+    const results = await search(query, {
+      ...options,
+      recencyDepth: 0, // primary already got the weekly summaries
+    });
+    for (const r of results) {
+      const existing = bestByUri.get(r.uri);
+      if (!existing || r.score > existing.score) {
+        bestByUri.set(r.uri, r);
+      }
+    }
+  }
+  // Merge catalog matches (frontmatter text-matched results)
+  for (const r of catalogMatches) {
+    const existing = bestByUri.get(r.uri);
+    if (!existing || r.score > existing.score) {
+      bestByUri.set(r.uri, r);
+    }
+  }
+  // Sort by score descending, return top results
+  const merged = [...bestByUri.values()];
+  merged.sort((a, b) => b.score - a.score);
+  return merged.slice(0, maxResults + recencyDepth);
+}