npm - @twelvehart/supermemory-runtime - Versions diffs - 1.0.0-next.0 - Mend

@twelvehart/supermemory-runtime 1.0.0-next.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (156) hide show

package/.env.example +57 -0
package/README.md +374 -0
package/dist/index.js +189 -0
package/dist/mcp/index.js +1132 -0
package/docker-compose.prod.yml +91 -0
package/docker-compose.yml +358 -0
package/drizzle/0000_dapper_the_professor.sql +159 -0
package/drizzle/0001_api_keys.sql +51 -0
package/drizzle/meta/0000_snapshot.json +1532 -0
package/drizzle/meta/_journal.json +13 -0
package/drizzle.config.ts +20 -0
package/package.json +114 -0
package/scripts/add-extraction-job.ts +122 -0
package/scripts/benchmark-pgvector.ts +122 -0
package/scripts/bootstrap.sh +209 -0
package/scripts/check-runtime-pack.ts +111 -0
package/scripts/claude-mcp-config.ts +336 -0
package/scripts/docker-entrypoint.sh +183 -0
package/scripts/doctor.ts +377 -0
package/scripts/init-db.sql +33 -0
package/scripts/install.sh +1110 -0
package/scripts/mcp-setup.ts +271 -0
package/scripts/migrations/001_create_pgvector_extension.sql +31 -0
package/scripts/migrations/002_create_memory_embeddings_table.sql +75 -0
package/scripts/migrations/003_create_hnsw_index.sql +94 -0
package/scripts/migrations/004_create_memory_embeddings_standalone.sql +70 -0
package/scripts/migrations/005_create_chunks_table.sql +95 -0
package/scripts/migrations/006_create_processing_queue.sql +45 -0
package/scripts/migrations/generate_test_data.sql +42 -0
package/scripts/migrations/phase1_comprehensive_test.sql +204 -0
package/scripts/migrations/run_migrations.sh +286 -0
package/scripts/migrations/test_hnsw_index.sql +255 -0
package/scripts/pre-commit-secrets +282 -0
package/scripts/run-extraction-worker.ts +46 -0
package/scripts/run-phase1-tests.sh +291 -0
package/scripts/setup.ts +222 -0
package/scripts/smoke-install.sh +12 -0
package/scripts/test-health-endpoint.sh +328 -0
package/src/api/index.ts +2 -0
package/src/api/middleware/auth.ts +80 -0
package/src/api/middleware/csrf.ts +308 -0
package/src/api/middleware/errorHandler.ts +166 -0
package/src/api/middleware/rateLimit.ts +360 -0
package/src/api/middleware/validation.ts +514 -0
package/src/api/routes/documents.ts +286 -0
package/src/api/routes/profiles.ts +237 -0
package/src/api/routes/search.ts +71 -0
package/src/api/stores/index.ts +58 -0
package/src/config/bootstrap-env.ts +3 -0
package/src/config/env.ts +71 -0
package/src/config/feature-flags.ts +25 -0
package/src/config/index.ts +140 -0
package/src/config/secrets.config.ts +291 -0
package/src/db/client.ts +92 -0
package/src/db/index.ts +73 -0
package/src/db/postgres.ts +72 -0
package/src/db/schema/chunks.schema.ts +31 -0
package/src/db/schema/containers.schema.ts +46 -0
package/src/db/schema/documents.schema.ts +49 -0
package/src/db/schema/embeddings.schema.ts +32 -0
package/src/db/schema/index.ts +11 -0
package/src/db/schema/memories.schema.ts +72 -0
package/src/db/schema/profiles.schema.ts +34 -0
package/src/db/schema/queue.schema.ts +59 -0
package/src/db/schema/relationships.schema.ts +42 -0
package/src/db/schema.ts +223 -0
package/src/db/worker-connection.ts +47 -0
package/src/index.ts +235 -0
package/src/mcp/CLAUDE.md +1 -0
package/src/mcp/index.ts +1380 -0
package/src/mcp/legacyState.ts +22 -0
package/src/mcp/rateLimit.ts +358 -0
package/src/mcp/resources.ts +309 -0
package/src/mcp/results.ts +104 -0
package/src/mcp/tools.ts +401 -0
package/src/queues/config.ts +119 -0
package/src/queues/index.ts +289 -0
package/src/sdk/client.ts +225 -0
package/src/sdk/errors.ts +266 -0
package/src/sdk/http.ts +560 -0
package/src/sdk/index.ts +244 -0
package/src/sdk/resources/base.ts +65 -0
package/src/sdk/resources/connections.ts +204 -0
package/src/sdk/resources/documents.ts +163 -0
package/src/sdk/resources/index.ts +10 -0
package/src/sdk/resources/memories.ts +150 -0
package/src/sdk/resources/search.ts +60 -0
package/src/sdk/resources/settings.ts +36 -0
package/src/sdk/types.ts +674 -0
package/src/services/chunking/index.ts +451 -0
package/src/services/chunking.service.ts +650 -0
package/src/services/csrf.service.ts +252 -0
package/src/services/documents.repository.ts +219 -0
package/src/services/documents.service.ts +191 -0
package/src/services/embedding.service.ts +404 -0
package/src/services/extraction.service.ts +300 -0
package/src/services/extractors/code.extractor.ts +451 -0
package/src/services/extractors/index.ts +9 -0
package/src/services/extractors/markdown.extractor.ts +461 -0
package/src/services/extractors/pdf.extractor.ts +315 -0
package/src/services/extractors/text.extractor.ts +118 -0
package/src/services/extractors/url.extractor.ts +243 -0
package/src/services/index.ts +235 -0
package/src/services/ingestion.service.ts +177 -0
package/src/services/llm/anthropic.ts +400 -0
package/src/services/llm/base.ts +460 -0
package/src/services/llm/contradiction-detector.service.ts +526 -0
package/src/services/llm/heuristics.ts +148 -0
package/src/services/llm/index.ts +309 -0
package/src/services/llm/memory-classifier.service.ts +383 -0
package/src/services/llm/memory-extension-detector.service.ts +523 -0
package/src/services/llm/mock.ts +470 -0
package/src/services/llm/openai.ts +398 -0
package/src/services/llm/prompts.ts +438 -0
package/src/services/llm/types.ts +373 -0
package/src/services/memory.repository.ts +1769 -0
package/src/services/memory.service.ts +1338 -0
package/src/services/memory.types.ts +234 -0
package/src/services/persistence/index.ts +295 -0
package/src/services/pipeline.service.ts +509 -0
package/src/services/profile.repository.ts +436 -0
package/src/services/profile.service.ts +560 -0
package/src/services/profile.types.ts +270 -0
package/src/services/relationships/detector.ts +1128 -0
package/src/services/relationships/index.ts +268 -0
package/src/services/relationships/memory-integration.ts +459 -0
package/src/services/relationships/strategies.ts +132 -0
package/src/services/relationships/types.ts +370 -0
package/src/services/search.service.ts +761 -0
package/src/services/search.types.ts +220 -0
package/src/services/secrets.service.ts +384 -0
package/src/services/vectorstore/base.ts +327 -0
package/src/services/vectorstore/index.ts +444 -0
package/src/services/vectorstore/memory.ts +286 -0
package/src/services/vectorstore/migration.ts +295 -0
package/src/services/vectorstore/mock.ts +403 -0
package/src/services/vectorstore/pgvector.ts +695 -0
package/src/services/vectorstore/types.ts +247 -0
package/src/startup.ts +389 -0
package/src/types/api.types.ts +193 -0
package/src/types/document.types.ts +103 -0
package/src/types/index.ts +241 -0
package/src/types/profile.base.ts +133 -0
package/src/utils/errors.ts +447 -0
package/src/utils/id.ts +15 -0
package/src/utils/index.ts +101 -0
package/src/utils/logger.ts +313 -0
package/src/utils/sanitization.ts +501 -0
package/src/utils/secret-validation.ts +273 -0
package/src/utils/synonyms.ts +188 -0
package/src/utils/validation.ts +581 -0
package/src/workers/chunking.worker.ts +242 -0
package/src/workers/embedding.worker.ts +358 -0
package/src/workers/extraction.worker.ts +346 -0
package/src/workers/indexing.worker.ts +505 -0
package/tsconfig.json +38 -0

package/src/services/llm/prompts.ts ADDED Viewed

@@ -0,0 +1,438 @@
+/**
+ * LLM Prompts for Memory Extraction and Relationship Detection
+ *
+ * Contains carefully crafted prompts with few-shot examples for accurate
+ * memory extraction and classification.
+ */
+import type { MemoryType } from '../../types/index.js'
+// ============================================================================
+// Memory Extraction Prompts
+// ============================================================================
+/**
+ * System prompt for memory extraction.
+ *
+ * Tells the model to emit standalone memories, each with a type, a confidence
+ * score in the 0.0-1.0 range, extracted entities, and keywords.
+ *
+ * The seven memory types listed in this prompt are the same seven strings that
+ * `parseExtractionResponse` accepts in its `validTypes` list; a memory whose
+ * type is not in that list is dropped by the parser, so keep the two in sync
+ * when adding or removing a type.
+ */
+export const MEMORY_EXTRACTION_SYSTEM_PROMPT = `You are an expert memory extraction system. Your task is to extract discrete, standalone facts, preferences, skills, and episodic memories from text content.
+For each extracted memory, you must:
+1. Create a clear, standalone statement that makes sense without context
+2. Classify it into the correct type
+3. Assign a confidence score (0.0-1.0) based on clarity and reliability
+4. Extract relevant entities (people, places, organizations, dates)
+5. Identify key keywords
+Memory Types:
+- fact: Objective information, statements of truth, definitions
+- event: Time-bound occurrences, meetings, experiences
+- preference: Personal likes, dislikes, preferences, opinions
+- skill: Abilities, capabilities, expertise, knowledge areas
+- relationship: Interpersonal connections, social bonds
+- context: Current situations, states, or ongoing activities
+- note: General notes, reminders, todos
+Guidelines:
+- Each memory should be self-contained and understandable alone
+- Be precise and avoid vague statements
+- Include relevant context in the memory itself
+- Higher confidence for explicit statements, lower for inferences
+- Extract multiple memories from complex sentences`
+/**
+ * Few-shot examples for memory extraction.
+ *
+ * Contains three input/output pairs. Each output is a JSON object with a
+ * `memories` array whose items carry `content`, `type`, `confidence`,
+ * `entities`, and `keywords` - the same shape that `generateExtractionPrompt`
+ * asks the model to return.
+ *
+ * NOTE(review): this file does not show where the constant is consumed;
+ * presumably it is appended to the system prompt by the LLM provider code -
+ * confirm at the call site before changing the leading newline.
+ */
+export const MEMORY_EXTRACTION_EXAMPLES = `
+Example 1:
+Input: "I've been using TypeScript for 3 years now and really prefer it over plain JavaScript. Currently working on a React project for my company Acme Inc."
+Output:
+{
+  "memories": [
+    {
+      "content": "Has been using TypeScript for 3 years",
+      "type": "skill",
+      "confidence": 0.95,
+      "entities": [{"name": "TypeScript", "type": "concept"}],
+      "keywords": ["typescript", "programming", "experience"]
+    },
+    {
+      "content": "Prefers TypeScript over plain JavaScript for development",
+      "type": "preference",
+      "confidence": 0.90,
+      "entities": [{"name": "TypeScript", "type": "concept"}, {"name": "JavaScript", "type": "concept"}],
+      "keywords": ["typescript", "javascript", "preference"]
+    },
+    {
+      "content": "Currently working on a React project",
+      "type": "context",
+      "confidence": 0.85,
+      "entities": [{"name": "React", "type": "concept"}],
+      "keywords": ["react", "project", "current"]
+    },
+    {
+      "content": "Works for Acme Inc.",
+      "type": "relationship",
+      "confidence": 0.90,
+      "entities": [{"name": "Acme Inc.", "type": "organization"}],
+      "keywords": ["employment", "company", "work"]
+    }
+  ]
+}
+Example 2:
+Input: "Note: Remember to update the API docs before the Friday release. The authentication endpoint was changed last week."
+Output:
+{
+  "memories": [
+    {
+      "content": "Need to update API docs before Friday release",
+      "type": "note",
+      "confidence": 0.85,
+      "entities": [],
+      "keywords": ["api", "documentation", "release", "friday"]
+    },
+    {
+      "content": "Authentication endpoint was modified recently",
+      "type": "event",
+      "confidence": 0.90,
+      "entities": [],
+      "keywords": ["authentication", "endpoint", "change", "api"]
+    }
+  ]
+}
+Example 3:
+Input: "Dr. Sarah Chen, my mentor at Stanford, taught me that clean code is more important than clever code."
+Output:
+{
+  "memories": [
+    {
+      "content": "Dr. Sarah Chen is a mentor",
+      "type": "relationship",
+      "confidence": 0.95,
+      "entities": [{"name": "Dr. Sarah Chen", "type": "person"}, {"name": "Stanford", "type": "organization"}],
+      "keywords": ["mentor", "relationship"]
+    },
+    {
+      "content": "Believes clean code is more important than clever code",
+      "type": "preference",
+      "confidence": 0.85,
+      "entities": [],
+      "keywords": ["clean code", "programming", "philosophy"]
+    },
+    {
+      "content": "Has connection to Stanford",
+      "type": "relationship",
+      "confidence": 0.80,
+      "entities": [{"name": "Stanford", "type": "organization"}],
+      "keywords": ["stanford", "education"]
+    }
+  ]
+}`
+/**
+ * Build the user message that asks the model to extract memories from `text`.
+ *
+ * The message is assembled in a fixed order: instruction header, optional hint
+ * lines, the text wrapped in triple double-quotes, and the required JSON shape.
+ *
+ * @param text - Content to analyze; interpolated verbatim between the `"""` delimiters.
+ * @param options - Optional hints. Each hint adds one line only when its value
+ *   is truthy, so `0` and `''` behave the same as "not provided".
+ * @returns The complete prompt string.
+ */
+export function generateExtractionPrompt(
+  text: string,
+  options?: {
+    containerTag?: string
+    context?: string
+    maxMemories?: number
+    minConfidence?: number
+  }
+): string {
+  // Collect the pieces in order and join once at the end.
+  const segments: string[] = [
+    `Extract memories from the following text. Return a JSON object with a "memories" array.\n\n`,
+  ]
+  if (options?.containerTag) segments.push(`Container/Category: ${options.containerTag}\n`)
+  if (options?.context) segments.push(`Additional Context: ${options.context}\n`)
+  if (options?.maxMemories) segments.push(`Maximum memories to extract: ${options.maxMemories}\n`)
+  if (options?.minConfidence) segments.push(`Minimum confidence threshold: ${options.minConfidence}\n`)
+  segments.push(`\nText to analyze:\n"""\n${text}\n"""\n\n`)
+  // Response contract; the field names match what parseExtractionResponse reads.
+  segments.push(`Respond with ONLY a valid JSON object in this exact format:
+{
+  "memories": [
+    {
+      "content": "string - standalone statement",
+      "type": "fact|event|preference|skill|relationship|context|note",
+      "confidence": 0.0-1.0,
+      "entities": [{"name": "string", "type": "person|place|organization|date|concept|other"}],
+      "keywords": ["string"]
+    }
+  ]
+}`)
+  return segments.join('')
+}
+// ============================================================================
+// Relationship Detection Prompts
+// ============================================================================
+/**
+ * System prompt for relationship detection.
+ *
+ * Defines six relationship types between a NEW memory and EXISTING memories.
+ * These are the same six strings that `parseRelationshipResponse` accepts in
+ * its `validTypes` list; relationships with any other type are dropped there.
+ *
+ * The "confidence >= 0.6" guideline is an instruction to the model only:
+ * `parseRelationshipResponse` clamps confidence to [0, 1] but does not filter
+ * on a minimum value.
+ */
+export const RELATIONSHIP_DETECTION_SYSTEM_PROMPT = `You are an expert at detecting semantic relationships between pieces of information.
+Given a NEW memory and a list of EXISTING memories, determine what relationships exist.
+Relationship Types:
+- updates: NEW contradicts or corrects OLD, making OLD outdated
+- extends: NEW adds detail or elaboration to OLD without contradicting
+- derives: NEW is a logical consequence or inference from OLD
+- contradicts: NEW directly conflicts with OLD (both may be valid from different times)
+- related: NEW is semantically similar or topically connected to OLD
+- supersedes: NEW completely replaces OLD (OLD should be archived)
+Guidelines:
+- Only identify relationships with confidence >= 0.6
+- "updates" and "supersedes" should mark the old memory for supersession
+- "contradicts" does NOT mean the old memory should be removed (both may be valid)
+- Consider temporal context when detecting updates
+- Be conservative - prefer no relationship over a weak one`
+/**
+ * Few-shot examples for relationship detection.
+ *
+ * Contains two examples. Each pairs a NEW memory and a list of EXISTING
+ * memories with an output object holding a `relationships` array and a
+ * `supersededMemoryIds` array - the same shape that
+ * `generateRelationshipPrompt` asks the model to return.
+ *
+ * NOTE(review): Example 2 lists "old4" in `supersededMemoryIds` although its
+ * relationship type is "derives". RELATIONSHIP_DETECTION_SYSTEM_PROMPT says
+ * only "updates" and "supersedes" should mark the old memory for
+ * supersession, so the example and the guideline disagree - confirm which
+ * behavior is intended before relying on either.
+ */
+export const RELATIONSHIP_DETECTION_EXAMPLES = `
+Example 1:
+NEW Memory: { "id": "new1", "content": "Uses Python 3.11 for all projects", "type": "preference" }
+EXISTING Memories: [
+  { "id": "old1", "content": "Prefers Python 3.9", "type": "preference" },
+  { "id": "old2", "content": "Expert in Python programming", "type": "skill" }
+]
+Output:
+{
+  "relationships": [
+    {
+      "sourceMemoryId": "new1",
+      "targetMemoryId": "old1",
+      "type": "updates",
+      "confidence": 0.90,
+      "reason": "New version preference supersedes old version preference"
+    },
+    {
+      "sourceMemoryId": "new1",
+      "targetMemoryId": "old2",
+      "type": "related",
+      "confidence": 0.75,
+      "reason": "Both relate to Python programming"
+    }
+  ],
+  "supersededMemoryIds": ["old1"]
+}
+Example 2:
+NEW Memory: { "id": "new2", "content": "The API now supports batch operations", "type": "fact" }
+EXISTING Memories: [
+  { "id": "old3", "content": "The API only supports single-item operations", "type": "fact" },
+  { "id": "old4", "content": "Working on adding batch support to the API", "type": "context" }
+]
+Output:
+{
+  "relationships": [
+    {
+      "sourceMemoryId": "new2",
+      "targetMemoryId": "old3",
+      "type": "supersedes",
+      "confidence": 0.95,
+      "reason": "New capability statement makes old limitation statement obsolete"
+    },
+    {
+      "sourceMemoryId": "new2",
+      "targetMemoryId": "old4",
+      "type": "derives",
+      "confidence": 0.85,
+      "reason": "Batch support being complete is a result of the work mentioned"
+    }
+  ],
+  "supersededMemoryIds": ["old3", "old4"]
+}`
+/**
+ * Build the user message that asks the model how a NEW memory relates to a
+ * list of EXISTING memories.
+ *
+ * Both inputs are serialized with `JSON.stringify(value, null, 2)` and placed
+ * under labelled headings, followed by optional constraint lines and the
+ * required JSON response shape.
+ *
+ * @param newMemory - The memory being added.
+ * @param existingMemories - Candidate memories to compare against.
+ * @param options - Optional constraints. Each adds one line only when its
+ *   value is truthy, so `0` behaves the same as "not provided".
+ * @returns The complete prompt string.
+ */
+export function generateRelationshipPrompt(
+  newMemory: { id: string; content: string; type: MemoryType },
+  existingMemories: Array<{ id: string; content: string; type: MemoryType }>,
+  options?: {
+    maxRelationships?: number
+    minConfidence?: number
+  }
+): string {
+  const newMemoryJson = JSON.stringify(newMemory, null, 2)
+  const existingMemoriesJson = JSON.stringify(existingMemories, null, 2)
+  // Constraint lines collapse to an empty string when the option is absent or falsy.
+  const confidenceLine = options?.minConfidence
+    ? `Only include relationships with confidence >= ${options.minConfidence}\n`
+    : ''
+  const limitLine = options?.maxRelationships ? `Return at most ${options.maxRelationships} relationships\n` : ''
+  // Response contract; the field names match what parseRelationshipResponse reads.
+  const responseFormat = `\nRespond with ONLY a valid JSON object in this exact format:
+{
+  "relationships": [
+    {
+      "sourceMemoryId": "string - always the NEW memory id",
+      "targetMemoryId": "string - an EXISTING memory id",
+      "type": "updates|extends|derives|contradicts|related|supersedes",
+      "confidence": 0.0-1.0,
+      "reason": "string - brief explanation"
+    }
+  ],
+  "supersededMemoryIds": ["string - ids of memories that should be marked as outdated"]
+}`
+  return (
+    `Analyze the relationship between the NEW memory and EXISTING memories.\n\n` +
+    `NEW Memory:\n${newMemoryJson}\n\n` +
+    `EXISTING Memories:\n${existingMemoriesJson}\n\n` +
+    confidenceLine +
+    limitLine +
+    responseFormat
+  )
+}
+// ============================================================================
+// Response Parsing
+// ============================================================================
+/**
+ * Normalize an LLM response into a string that is ready for `JSON.parse`.
+ *
+ * Resolution order:
+ * 1. If the trimmed response already parses as JSON, it is returned unchanged.
+ *    This keeps backticks or braces inside string values (for example a memory
+ *    whose content quotes a Markdown code fence) from being mistaken for wrappers.
+ * 2. Otherwise, the non-empty contents of the first Markdown code fence
+ *    (optionally tagged `json`) are returned.
+ * 3. Otherwise, the span from the first `{` to the last `}` is returned.
+ * 4. Otherwise, the trimmed response is returned as-is.
+ *
+ * @param response - Raw text returned by the model.
+ * @returns The best JSON candidate, trimmed. Steps 2-4 do not validate the
+ *   result, so callers must still guard their own `JSON.parse`.
+ */
+export function normalizeJsonResponse(response: string): string {
+  const trimmed = response.trim()
+  // Fast path: bare, valid JSON needs no unwrapping and must not be run through the fence heuristics.
+  try {
+    JSON.parse(trimmed)
+    return trimmed
+  } catch {
+    // Not bare JSON; fall through to the unwrapping heuristics below.
+  }
+  // Prefer fenced JSON blocks when present (allows explanatory prose around JSON).
+  const fencedMatch = trimmed.match(/```(?:json)?\s*([\s\S]*?)\s*```/i)
+  if (fencedMatch?.[1]) {
+    return fencedMatch[1].trim()
+  }
+  // Fallback: extract the outermost JSON object if surrounded by extra text.
+  const firstBrace = trimmed.indexOf('{')
+  const lastBrace = trimmed.lastIndexOf('}')
+  if (firstBrace !== -1 && lastBrace > firstBrace) {
+    return trimmed.slice(firstBrace, lastBrace + 1).trim()
+  }
+  return trimmed
+}
+/**
+ * Parse and validate an extraction response from the LLM.
+ *
+ * The raw text is first passed through `normalizeJsonResponse`, then parsed.
+ * Memories are kept only when `content` is a string that is non-empty after
+ * trimming and `type` is one of the seven known memory types; everything else
+ * is silently dropped. For the memories that are kept:
+ * - `content` is trimmed,
+ * - `confidence` is clamped to [0, 1], defaulting to 0.5 when it is not a number,
+ * - `entities` keeps only objects whose `name` and `type` are both strings,
+ * - `keywords` keeps only strings.
+ *
+ * @param response - Raw text returned by the model.
+ * @returns The validated memories (possibly an empty array).
+ * @throws Error prefixed with "Failed to parse extraction response: " when the
+ *   text is not valid JSON or has no top-level `memories` array.
+ */
+export function parseExtractionResponse(response: string): {
+  memories: Array<{
+    content: string
+    type: MemoryType
+    confidence: number
+    entities: Array<{ name: string; type: string }>
+    keywords: string[]
+  }>
+} {
+  const cleaned = normalizeJsonResponse(response)
+  try {
+    const parsed: unknown = JSON.parse(cleaned)
+    // Optional chaining covers a top-level `null`, which would otherwise surface as an opaque TypeError.
+    const rawMemories = (parsed as { memories?: unknown } | null)?.memories
+    if (!Array.isArray(rawMemories)) {
+      throw new Error('Response missing memories array')
+    }
+    // Validate and clean each memory
+    const validTypes: MemoryType[] = ['fact', 'event', 'preference', 'skill', 'relationship', 'context', 'note']
+    // The declared return type promises string fields, so check the values and not just key presence.
+    const isEntity = (e: unknown): e is { name: string; type: string } => {
+      if (!e || typeof e !== 'object') return false
+      const entity = e as Record<string, unknown>
+      return typeof entity.name === 'string' && typeof entity.type === 'string'
+    }
+    const memories = rawMemories
+      .filter((m: unknown) => {
+        if (!m || typeof m !== 'object') return false
+        const mem = m as Record<string, unknown>
+        return (
+          typeof mem.content === 'string' &&
+          // Content is trimmed below, so test the trimmed length to reject whitespace-only memories.
+          mem.content.trim().length > 0 &&
+          typeof mem.type === 'string' &&
+          validTypes.includes(mem.type as MemoryType)
+        )
+      })
+      .map((m: Record<string, unknown>) => ({
+        content: String(m.content).trim(),
+        type: m.type as MemoryType,
+        confidence: typeof m.confidence === 'number' ? Math.max(0, Math.min(1, m.confidence)) : 0.5,
+        entities: Array.isArray(m.entities) ? m.entities.filter(isEntity) : [],
+        keywords: Array.isArray(m.keywords) ? m.keywords.filter((k: unknown): k is string => typeof k === 'string') : [],
+      }))
+    return { memories }
+  } catch (error) {
+    throw new Error(`Failed to parse extraction response: ${error instanceof Error ? error.message : String(error)}`)
+  }
+}
+/**
+ * Parse and validate a relationship-detection response from the LLM.
+ *
+ * The raw text is passed through `normalizeJsonResponse` and parsed. A
+ * relationship is kept only when `sourceMemoryId`, `targetMemoryId`, and
+ * `type` are strings and `type` is one of the six known relationship types.
+ * `confidence` is clamped to [0, 1] (0.5 when it is not a number) and a
+ * missing `reason` becomes 'No reason provided'. A missing or non-array
+ * `relationships` / `supersededMemoryIds` field yields an empty array rather
+ * than an error.
+ *
+ * @param response - Raw text returned by the model.
+ * @returns The validated relationships and the string ids listed as superseded.
+ * @throws Error prefixed with "Failed to parse relationship response: " when
+ *   parsing or field access fails.
+ */
+export function parseRelationshipResponse(response: string): {
+  relationships: Array<{
+    sourceMemoryId: string
+    targetMemoryId: string
+    type: string
+    confidence: number
+    reason: string
+  }>
+  supersededMemoryIds: string[]
+} {
+  const cleaned = normalizeJsonResponse(response)
+  try {
+    const payload = JSON.parse(cleaned)
+    const allowedTypes = ['updates', 'extends', 'derives', 'contradicts', 'related', 'supersedes']
+    const relationships: Array<{
+      sourceMemoryId: string
+      targetMemoryId: string
+      type: string
+      confidence: number
+      reason: string
+    }> = []
+    const rawRelationships = payload.relationships
+    if (Array.isArray(rawRelationships)) {
+      for (const candidate of rawRelationships) {
+        // Skip anything that is not a plain object with the three required string fields.
+        if (!candidate || typeof candidate !== 'object') continue
+        const { sourceMemoryId, targetMemoryId, type, confidence, reason } = candidate as Record<string, unknown>
+        if (typeof sourceMemoryId !== 'string' || typeof targetMemoryId !== 'string') continue
+        if (typeof type !== 'string' || !allowedTypes.includes(type)) continue
+        relationships.push({
+          sourceMemoryId,
+          targetMemoryId,
+          type,
+          confidence: typeof confidence === 'number' ? Math.max(0, Math.min(1, confidence)) : 0.5,
+          reason: typeof reason === 'string' ? reason : 'No reason provided',
+        })
+      }
+    }
+    const rawSuperseded = payload.supersededMemoryIds
+    const supersededMemoryIds: string[] = Array.isArray(rawSuperseded)
+      ? rawSuperseded.filter((id: unknown) => typeof id === 'string')
+      : []
+    return { relationships, supersededMemoryIds }
+  } catch (error) {
+    throw new Error(`Failed to parse relationship response: ${error instanceof Error ? error.message : String(error)}`)
+  }
+}