npm - audrey - Versions diffs - 0.17.0 → 0.20.0 - Mend

audrey 0.17.0 → 0.20.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (191)

package/README.md +129 -374
package/dist/mcp-server/config.d.ts +20 -0
package/dist/mcp-server/config.d.ts.map +1 -0
package/dist/mcp-server/config.js +125 -0
package/dist/mcp-server/config.js.map +1 -0
package/dist/mcp-server/index.d.ts +100 -0
package/dist/mcp-server/index.d.ts.map +1 -0
package/dist/mcp-server/index.js +1113 -0
package/dist/mcp-server/index.js.map +1 -0
package/dist/src/adaptive.d.ts +7 -0
package/dist/src/adaptive.d.ts.map +1 -0
package/dist/src/adaptive.js +49 -0
package/dist/src/adaptive.js.map +1 -0
package/dist/src/affect.d.ts +19 -0
package/dist/src/affect.d.ts.map +1 -0
package/dist/src/affect.js +72 -0
package/dist/src/affect.js.map +1 -0
package/dist/src/audrey.d.ts +140 -0
package/dist/src/audrey.d.ts.map +1 -0
package/dist/src/audrey.js +564 -0
package/dist/src/audrey.js.map +1 -0
package/dist/src/capsule.d.ts +68 -0
package/dist/src/capsule.d.ts.map +1 -0
package/dist/src/capsule.js +311 -0
package/dist/src/capsule.js.map +1 -0
package/dist/src/causal.d.ts +28 -0
package/dist/src/causal.d.ts.map +1 -0
package/dist/src/causal.js +65 -0
package/dist/src/causal.js.map +1 -0
package/dist/src/confidence.d.ts +12 -0
package/dist/src/confidence.d.ts.map +1 -0
package/dist/src/confidence.js +63 -0
package/dist/src/confidence.js.map +1 -0
package/dist/src/consolidate.d.ts +8 -0
package/dist/src/consolidate.d.ts.map +1 -0
package/dist/src/consolidate.js +218 -0
package/dist/src/consolidate.js.map +1 -0
package/dist/src/context.d.ts +3 -0
package/dist/src/context.d.ts.map +1 -0
package/dist/src/context.js +19 -0
package/dist/src/context.js.map +1 -0
package/dist/src/db.d.ts +12 -0
package/dist/src/db.d.ts.map +1 -0
package/dist/src/db.js +380 -0
package/dist/src/db.js.map +1 -0
package/dist/src/decay.d.ts +7 -0
package/dist/src/decay.d.ts.map +1 -0
package/dist/src/decay.js +68 -0
package/dist/src/decay.js.map +1 -0
package/dist/src/embedding.d.ts +57 -0
package/dist/src/embedding.d.ts.map +1 -0
package/dist/src/embedding.js +254 -0
package/dist/src/embedding.js.map +1 -0
package/dist/src/encode.d.ts +15 -0
package/dist/src/encode.d.ts.map +1 -0
package/dist/src/encode.js +36 -0
package/dist/src/encode.js.map +1 -0
package/dist/src/events.d.ts +69 -0
package/dist/src/events.d.ts.map +1 -0
package/dist/src/events.js +149 -0
package/dist/src/events.js.map +1 -0
package/dist/src/export.d.ts +3 -0
package/dist/src/export.d.ts.map +1 -0
package/dist/src/export.js +46 -0
package/dist/src/export.js.map +1 -0
package/dist/src/forget.d.ts +11 -0
package/dist/src/forget.d.ts.map +1 -0
package/dist/src/forget.js +105 -0
package/dist/src/forget.js.map +1 -0
package/dist/src/fts.d.ts +34 -0
package/dist/src/fts.d.ts.map +1 -0
package/dist/src/fts.js +117 -0
package/dist/src/fts.js.map +1 -0
package/dist/src/hybrid-recall.d.ts +37 -0
package/dist/src/hybrid-recall.d.ts.map +1 -0
package/dist/src/hybrid-recall.js +213 -0
package/dist/src/hybrid-recall.js.map +1 -0
package/dist/src/import.d.ts +4 -0
package/dist/src/import.d.ts.map +1 -0
package/dist/src/import.js +127 -0
package/dist/src/import.js.map +1 -0
package/dist/src/index.d.ts +22 -0
package/dist/src/index.d.ts.map +1 -0
package/{src → dist/src}/index.js +5 -13
package/dist/src/index.js.map +1 -0
package/dist/src/interference.d.ts +13 -0
package/dist/src/interference.d.ts.map +1 -0
package/dist/src/interference.js +45 -0
package/dist/src/interference.js.map +1 -0
package/dist/src/introspect.d.ts +4 -0
package/dist/src/introspect.d.ts.map +1 -0
package/dist/src/introspect.js +40 -0
package/dist/src/introspect.js.map +1 -0
package/dist/src/llm.d.ts +38 -0
package/dist/src/llm.d.ts.map +1 -0
package/dist/src/llm.js +167 -0
package/dist/src/llm.js.map +1 -0
package/dist/src/migrate.d.ts +6 -0
package/dist/src/migrate.d.ts.map +1 -0
package/dist/src/migrate.js +51 -0
package/dist/src/migrate.js.map +1 -0
package/dist/src/promote.d.ts +40 -0
package/dist/src/promote.d.ts.map +1 -0
package/dist/src/promote.js +200 -0
package/dist/src/promote.js.map +1 -0
package/dist/src/prompts.d.ts +16 -0
package/dist/src/prompts.d.ts.map +1 -0
package/{src → dist/src}/prompts.js +172 -203
package/dist/src/prompts.js.map +1 -0
package/dist/src/recall.d.ts +9 -0
package/dist/src/recall.d.ts.map +1 -0
package/dist/src/recall.js +432 -0
package/dist/src/recall.js.map +1 -0
package/dist/src/redact.d.ts +27 -0
package/dist/src/redact.d.ts.map +1 -0
package/dist/src/redact.js +228 -0
package/dist/src/redact.js.map +1 -0
package/dist/src/rollback.d.ts +8 -0
package/dist/src/rollback.d.ts.map +1 -0
package/dist/src/rollback.js +33 -0
package/dist/src/rollback.js.map +1 -0
package/dist/src/routes.d.ts +7 -0
package/dist/src/routes.d.ts.map +1 -0
package/dist/src/routes.js +226 -0
package/dist/src/routes.js.map +1 -0
package/dist/src/rules-compiler.d.ts +20 -0
package/dist/src/rules-compiler.d.ts.map +1 -0
package/dist/src/rules-compiler.js +143 -0
package/dist/src/rules-compiler.js.map +1 -0
package/dist/src/server.d.ts +12 -0
package/dist/src/server.d.ts.map +1 -0
package/dist/src/server.js +22 -0
package/dist/src/server.js.map +1 -0
package/dist/src/tool-trace.d.ts +37 -0
package/dist/src/tool-trace.d.ts.map +1 -0
package/dist/src/tool-trace.js +142 -0
package/dist/src/tool-trace.js.map +1 -0
package/dist/src/types.d.ts +446 -0
package/dist/src/types.d.ts.map +1 -0
package/dist/src/types.js +6 -0
package/dist/src/types.js.map +1 -0
package/dist/src/ulid.d.ts +3 -0
package/dist/src/ulid.d.ts.map +1 -0
package/dist/src/ulid.js +11 -0
package/dist/src/ulid.js.map +1 -0
package/dist/src/utils.d.ts +10 -0
package/dist/src/utils.d.ts.map +1 -0
package/dist/src/utils.js +41 -0
package/dist/src/utils.js.map +1 -0
package/dist/src/validate.d.ts +22 -0
package/dist/src/validate.d.ts.map +1 -0
package/dist/src/validate.js +109 -0
package/dist/src/validate.js.map +1 -0
package/docs/production-readiness.md +28 -0
package/examples/fintech-ops-demo.js +1 -1
package/examples/healthcare-ops-demo.js +1 -1
package/examples/stripe-demo.js +1 -1
package/package.json +34 -13
package/benchmarks/baselines.js +0 -169
package/benchmarks/cases.js +0 -421
package/benchmarks/reference-results.js +0 -70
package/benchmarks/report.js +0 -255
package/benchmarks/run.js +0 -514
package/mcp-server/config.js +0 -133
package/mcp-server/index.js +0 -1265
package/mcp-server/serve.js +0 -482
package/src/adaptive.js +0 -53
package/src/affect.js +0 -64
package/src/audrey.js +0 -642
package/src/causal.js +0 -95
package/src/confidence.js +0 -120
package/src/consolidate.js +0 -281
package/src/context.js +0 -15
package/src/db.js +0 -391
package/src/decay.js +0 -84
package/src/embedding.js +0 -260
package/src/encode.js +0 -69
package/src/export.js +0 -67
package/src/forget.js +0 -111
package/src/fts.js +0 -134
package/src/import.js +0 -273
package/src/interference.js +0 -51
package/src/introspect.js +0 -48
package/src/llm.js +0 -249
package/src/migrate.js +0 -58
package/src/recall.js +0 -573
package/src/rollback.js +0 -42
package/src/ulid.js +0 -18
package/src/utils.js +0 -63
package/src/validate.js +0 -172
package/types/index.d.ts +0 -434

package/README.md CHANGED

@@ -4,472 +4,227 @@
 [![npm version](https://img.shields.io/npm/v/audrey.svg)](https://www.npmjs.com/package/audrey)
 [![License: MIT](https://img.shields.io/badge/license-MIT-blue.svg)](LICENSE)
-Persistent memory for Claude Code and AI agents. Two commands, every session remembers.
+Audrey is a persistent memory and continuity engine for Claude Code and AI agents.
-```bash
-npx audrey install          # 13 MCP memory tools
-npx audrey hooks install    # automatic memory in every session
-```
+It gives an agent a local memory store, durable recall, consolidation, contradiction handling, a REST sidecar, MCP tools, and benchmark gates without adding external infrastructure.
-That's it. Claude Code now wakes up knowing what happened yesterday, recalls relevant context per-prompt, and consolidates learnings when the session ends. No cloud, no config files, no infrastructure — one SQLite file.
+Requires Node.js 20+.
-Audrey also works as a standalone SDK, MCP server, and REST API for any AI agent framework.
+## Quick Start
-> **On `/dream`** — Anthropic recently shipped `/dream` for Claude Code memory maintenance. Audrey predates it and goes further: episodic-to-semantic consolidation, contradiction detection, confidence decay, emotional affect, causal reasoning, and source reliability weighting. `/dream` is a maintenance pass. Audrey is a cognitive memory architecture.
+### Claude Code
-## Why Audrey
+```bash
+npx audrey init
+npx audrey doctor
+```
-Most AI memory tools are storage wrappers. They save facts, retrieve facts, and keep everything forever. That leaves real production problems unsolved:
+This uses the default `local-offline` preset:
-- Old information stays weighted like new information.
-- Raw events never become reusable operating knowledge.
-- Conflicting facts quietly coexist.
-- Model-generated mistakes can get reinforced into false "truth."
+- registers Audrey with Claude Code
+- installs hooks for automatic recall and reflection
+- uses local embeddings by default
+- stores memory in one local SQLite-backed data directory
-Audrey models memory as a working system instead of a filing cabinet.
+### REST or Docker Sidecar
-| Brain Structure | Audrey Component | What It Does |
-|---|---|---|
-| Hippocampus | Episodic Memory | Fast capture of raw events and observations |
-| Neocortex | Semantic Memory | Consolidated principles and patterns |
-| Cerebellum | Procedural Memory | Learned workflows and conditional behaviors |
-| Sleep Replay | Dream Cycle | Consolidates episodes into principles and applies decay |
-| Prefrontal Cortex | Validation Engine | Truth-checking and contradiction detection |
-| Amygdala | Affect System | Emotional encoding, arousal-salience coupling, and mood-congruent recall |
-## What You Get
-- Local SQLite-backed memory with `sqlite-vec`
-- MCP server for Claude Code with 13 memory tools
-- **Claude Code hooks integration** — automatic memory in every session (`npx audrey hooks install`)
-- JavaScript SDK for direct application use
-- **Git-friendly versioning** via JSON snapshots (`npx audrey snapshot` / `restore`)
-- **REST API server** - any language, any framework (`npx audrey serve`)
-- Health checks via `npx audrey status --json`
-- Benchmark harness with retrieval and lifecycle-operation tracks via `npm run bench:memory`
-- Regression gate for benchmark quality via `npm run bench:memory:check`
-- Optional local embeddings and optional hosted LLM providers
-- Strongest production fit today in financial services ops and healthcare ops
-## Install
-### MCP Server for Claude Code
+```bash
+npx audrey init sidecar-prod
+docker compose up -d --build
+```
+Then verify:
 ```bash
-npx audrey install          # Register 13 MCP memory tools
-npx audrey hooks install    # Wire automatic memory into session lifecycle
+npx audrey doctor
+curl http://localhost:3487/health
 ```
-Audrey auto-detects providers from your environment:
+## Why Audrey
-- `GOOGLE_API_KEY` or `GEMINI_API_KEY` -> Gemini embeddings (3072d)
-- no embedding key -> local embeddings (384d, MiniLM, offline-capable)
-- `AUDREY_EMBEDDING_PROVIDER=openai` -> explicit OpenAI embeddings (1536d)
-- `ANTHROPIC_API_KEY` -> LLM-powered consolidation, contradiction detection, and reflection
+- Local-first: memory lives in SQLite with `sqlite-vec`, not a hosted vector database.
+- Practical: MCP, CLI, REST, JavaScript, Python, and Docker are all first-class.
+- Durable: snapshot, restore, health checks, benchmark gates, and graceful shutdown are built in.
+- Structured: Audrey does more than save notes. It consolidates, decays, tracks contradictions, and supports procedural memory.
-Quick checks:
+## What Ships
-```bash
-npx audrey status
-npx audrey status --json
-npx audrey status --json --fail-on-unhealthy
-```
+- Claude Code MCP server with 13 memory tools
+- Automatic hook-based recall and reflection for Claude Code sessions
+- JavaScript SDK
+- Python SDK packaged as `audrey-memory`
+- REST API for sidecar deployment
+- Docker and Compose deployment path
+- Snapshot and restore for portable memory state
+- Machine-readable health and benchmark gates
+- Local benchmark harness with retrieval and lifecycle-operation tracks
+## Setup Presets
-### SDK
+`npx audrey init` supports four named presets:
+| Preset | Best For | Behavior |
+|---|---|---|
+| `local-offline` | Claude Code on one machine | Local embeddings, MCP install, hooks install |
+| `hosted-fast` | Claude Code with provider keys already present | Auto-picks hosted providers from env, MCP install, hooks install |
+| `ci-mock` | CI and smoke tests | Mock embedding + LLM providers, no Claude-specific setup |
+| `sidecar-prod` | REST API and Docker deployment | Sidecar-oriented defaults, no Claude-specific setup |
+Useful checks:
 ```bash
-npm install audrey
+npx audrey doctor
+npx audrey status
+npx audrey status --json --fail-on-unhealthy
 ```
-Zero external infrastructure. One SQLite file.
+## Use Audrey From Code
-## Quick Start
+### JavaScript
 ```js
 import { Audrey } from 'audrey';
 const brain = new Audrey({
-  dataDir: './agent-memory',
+  dataDir: './audrey-data',
   agent: 'support-agent',
   embedding: { provider: 'local', dimensions: 384 },
 });
 await brain.encode({
-  content: 'Stripe API returned 429 above 100 req/s',
+  content: 'Stripe returns HTTP 429 above 100 req/s',
   source: 'direct-observation',
   tags: ['stripe', 'rate-limit'],
-  context: { task: 'debugging', domain: 'payments' },
-  affect: { valence: -0.4, arousal: 0.7, label: 'frustration' },
-});
-const memories = await brain.recall('stripe rate limits', {
-  limit: 5,
-  context: { task: 'debugging', domain: 'payments' },
 });
-const dream = await brain.dream();
-const briefing = await brain.greeting({ context: 'debugging stripe' });
+const memories = await brain.recall('stripe rate limit');
 await brain.waitForIdle();
 brain.close();
 ```
-## MCP Tools
-Every Claude Code session gets these tools after `npx audrey install`:
-- `memory_encode`
-- `memory_recall`
-- `memory_consolidate`
-- `memory_dream`
-- `memory_introspect`
-- `memory_resolve_truth`
-- `memory_export`
-- `memory_import`
-- `memory_forget`
-- `memory_decay`
-- `memory_status`
-- `memory_reflect`
-- `memory_greeting`
-## CLI
-```bash
-# Setup
-npx audrey install              # Register MCP server with Claude Code
-npx audrey uninstall            # Remove MCP server registration
-npx audrey hooks install        # Wire Audrey into Claude Code hooks (automatic memory)
-npx audrey hooks uninstall      # Remove Audrey hooks
-# Health and monitoring
-npx audrey status               # Human-readable health report
-npx audrey status --json        # Machine-readable health output
-npx audrey status --json --fail-on-unhealthy  # CI gate
-# Session lifecycle (used by hooks automatically)
-npx audrey greeting             # Load identity, principles, mood
-npx audrey greeting "auth"      # With context-aware recall
-npx audrey recall "query"       # Semantic memory search (returns hook-compatible JSON)
-npx audrey reflect              # Consolidate learnings from stdin conversation + dream
-# Maintenance
-npx audrey dream                # Full consolidation + decay cycle
-npx audrey reembed              # Re-embed all memories after provider/dimension change
-# Versioning
-npx audrey snapshot             # Export memories to timestamped JSON file
-npx audrey snapshot backup.json # Export to specific file
-npx audrey restore backup.json  # Restore from snapshot (re-embeds with current provider)
-npx audrey restore backup.json --force  # Overwrite existing memories
-# REST API server
-npx audrey serve                # Start HTTP server on port 3487
-npx audrey serve 8080           # Custom port
-```
-## Hooks Integration
-Audrey integrates directly into Claude Code's hook lifecycle for automatic, zero-config memory in every session:
-```bash
-npx audrey hooks install
-```
-This configures four hooks in `~/.claude/settings.json`:
-| Hook Event | Command | What Happens |
-|---|---|---|
-| **SessionStart** | `npx audrey greeting` | Loads identity, learned principles, current mood, and recent memories |
-| **UserPromptSubmit** | `npx audrey recall` | Semantic search on every prompt — injects relevant memories as context |
-| **Stop** | `npx audrey reflect` | Extracts lasting learnings from the conversation, then runs a dream cycle |
-| **PostCompact** | `npx audrey greeting` | Re-injects critical memories after context window compaction |
-With hooks installed, Claude Code sessions automatically wake up with context, recall relevant memories per-prompt, and consolidate learnings when the session ends. No manual tool calls needed.
-## REST API Server
-Turn Audrey into an HTTP service that any language or framework can use:
+### Python
 ```bash
-npx audrey serve           # Start on port 3487
-npx audrey serve 8080      # Custom port
-AUDREY_API_KEY=secret npx audrey serve  # With Bearer token auth
+pip install audrey-memory
 ```
-Endpoints:
+```python
+from audrey_memory import Audrey
-| Method | Path | Description |
-|--------|------|-------------|
-| `GET` | `/health` | Liveness probe |
-| `GET` | `/status` | Memory stats (introspect) |
-| `POST` | `/encode` | Store a memory (`{ content, source, tags?, context?, affect? }`) |
-| `POST` | `/recall` | Semantic search (`{ query, limit?, context? }`) |
-| `POST` | `/dream` | Full consolidation + decay cycle |
-| `POST` | `/consolidate` | Run consolidation only |
-| `POST` | `/forget` | Forget by `{ id }` or `{ query }` |
-| `POST` | `/snapshot` | Export all memories as JSON |
-| `POST` | `/restore` | Wipe and reimport from snapshot |
+brain = Audrey(
+    base_url="http://127.0.0.1:3487",
+    api_key="secret",
+    agent="support-agent",
+)
-Example from any language:
-```bash
-# Store a memory
-curl -X POST http://localhost:3487/encode \
-  -H "Content-Type: application/json" \
-  -d '{"content": "The deploy failed due to OOM", "source": "direct-observation"}'
-# Search memories
-curl -X POST http://localhost:3487/recall \
-  -H "Content-Type: application/json" \
-  -d '{"query": "deploy failures", "limit": 5}'
+memory_id = brain.encode(
+    "Stripe returns HTTP 429 above 100 req/s",
+    source="direct-observation",
+)
+results = brain.recall("stripe rate limit", limit=5)
+brain.close()
 ```
-## Versioning
-Audrey stores memories in SQLite with WAL mode, which isn't git-friendly. Instead, use JSON snapshots:
+## Key Commands
 ```bash
-# Save a checkpoint
-npx audrey snapshot
-# Commit it
-git add audrey-snapshot-*.json && git commit -m "memory checkpoint"
-# Restore on another machine or after a reset
-npx audrey restore audrey-snapshot-2026-03-24_15-30-00.json
-```
-Snapshots are human-readable, diffable, and provider-agnostic. Embeddings are re-generated on import, so you can switch providers (e.g., local to Gemini) and restore seamlessly.
-## Production Fit
-Audrey is strongest today in workflows where memory must stay local, reviewable, and durable:
-- **Financial services operations**: payments ops, fraud and dispute workflows, KYC/KYB review, internal policy assistants
-- **Healthcare operations**: care coordination, prior-auth workflows, intake and referral routing, internal staff knowledge assistants
-Audrey is a memory layer, not a compliance boundary. For regulated environments, pair it with application-level access control, encryption, retention, audit logging, and data-minimization rules.
-Production guide: [docs/production-readiness.md](docs/production-readiness.md)
-Industry demos:
-- [examples/fintech-ops-demo.js](examples/fintech-ops-demo.js)
-- [examples/healthcare-ops-demo.js](examples/healthcare-ops-demo.js)
-## Core Concepts
-### Memory Types
-- **Episodic**: raw events and observations
-- **Semantic**: consolidated principles
-- **Procedural**: reusable workflows and actions
-- **Causal**: relationships that explain why something happened
-### Confidence
-Audrey scores memories using source reliability, evidence agreement, recency decay, and retrieval reinforcement. That helps keep direct observations above guesses and keeps stale or weakly supported knowledge from dominating recall.
-### Dream Cycle
-`brain.dream()` runs the full maintenance path:
-1. Consolidate related episodes into principles.
-2. Apply decay so low-value memories lose weight over time.
-3. Report memory health and current stats.
-### Contradiction Handling
-When evidence conflicts, Audrey tracks the contradiction instead of silently picking a winner. Resolutions can stay open, be marked resolved, or become context-dependent.
-## Configuration
-```js
-const brain = new Audrey({
-  dataDir: './audrey-data',
-  agent: 'my-agent',
-  embedding: {
-    provider: 'local', // mock | local | gemini | openai
-    dimensions: 384,
-    device: 'gpu',
-  },
-  llm: {
-    provider: 'anthropic', // mock | anthropic | openai
-    apiKey: process.env.ANTHROPIC_API_KEY,
-  },
-  consolidation: {
-    minEpisodes: 3,
-  },
-  context: {
-    enabled: true,
-    weight: 0.3,
-  },
-  affect: {
-    enabled: true,
-    weight: 0.2,
-  },
-  decay: {
-    dormantThreshold: 0.1,
-  },
-});
-```
-## Operations
+# Setup
+npx audrey init
+npx audrey init hosted-fast
+npx audrey init ci-mock
+npx audrey init sidecar-prod
-Recommended production workflow:
+# Claude Code integration
+npx audrey install
+npx audrey hooks install
+npx audrey hooks uninstall
+npx audrey uninstall
-```bash
-# Health checks
+# Health and maintenance
+npx audrey doctor
 npx audrey status
-npx audrey status --json --fail-on-unhealthy
-# Scheduled maintenance
 npx audrey dream
-# Repair vector/index drift after provider or dimension changes
 npx audrey reembed
-# Version control your memories
+# Versioning
 npx audrey snapshot
-npx audrey restore <file> --force
-# Run the benchmark harness
-npm run bench:memory
+npx audrey restore backup.json --force
-# Fail CI if Audrey drops below benchmark guardrails
-npm run bench:memory:check
+# Sidecar
+npx audrey serve
+docker compose up -d --build
 ```
-## Benchmarking
-Audrey now ships with a memory benchmark harness built for three purposes:
+## Benchmarks
-- measure Audrey against naive local baselines on LongMemEval-style memory abilities plus privacy and abstention checks
-- measure Audrey on lifecycle operations that other memory systems usually hand-wave: update, overwrite, delete, merge, and abstain
-- keep Audrey grounded against published LoCoMo results from leading memory systems
-Run it with:
+Audrey ships with a benchmark harness and release gate:
 ```bash
 npm run bench:memory
+npm run bench:memory:check
 ```
-Artifacts land in `benchmarks/output/` as JSON, SVG charts, and an HTML report.
+The benchmark suite measures:
-For CI and release gates:
+- retrieval behavior
+- update and overwrite behavior
+- delete and abstain behavior
+- semantic and procedural merge behavior
-```bash
-npm run bench:memory:check
-```
+Current repo snapshot:
-That command fails if Audrey drops below its minimum local score, local pass rate, or required margin over the strongest naive baseline.
+![Audrey local benchmark](docs/assets/benchmarks/local-benchmark.svg)
-For track-specific runs:
+For detailed methodology, published comparison anchors, and generated reports, see [docs/benchmarking.md](docs/benchmarking.md).
-```bash
-npm run bench:memory:retrieval
-npm run bench:memory:operations
-```
+## Production
-For committed GitHub-friendly charts:
+Audrey is strongest in workflows where memory must stay local, reviewable, and durable. It already fits well as a sidecar for internal agents in operational domains like financial services and healthcare operations, but it is a memory layer, not a compliance boundary.
-```bash
-npm run bench:memory:readme-assets
-```
+Production guide: [docs/production-readiness.md](docs/production-readiness.md)
-### README Snapshot
+Examples:
-Local Audrey-vs-baseline results:
+- [examples/fintech-ops-demo.js](examples/fintech-ops-demo.js)
+- [examples/healthcare-ops-demo.js](examples/healthcare-ops-demo.js)
+- [examples/stripe-demo.js](examples/stripe-demo.js)
-![Audrey local memory benchmark](docs/assets/benchmarks/local-benchmark.svg)
+## Environment
-Lifecycle operations benchmark:
+Starter config:
-![Audrey memory operations benchmark](docs/assets/benchmarks/operations-benchmark.svg)
+- [.env.example](.env.example)
+- [.env.docker.example](.env.docker.example)
-Published comparison anchors from current LLM memory systems:
+Key environment variables:
-![Published LLM memory benchmark comparison](docs/assets/benchmarks/published-memory-standards.svg)
+- `AUDREY_DATA_DIR`
+- `AUDREY_EMBEDDING_PROVIDER`
+- `AUDREY_LLM_PROVIDER`
+- `AUDREY_DEVICE`
+- `AUDREY_API_KEY`
+- `AUDREY_HOST`
+- `AUDREY_PORT`
-**Current deterministic CI snapshot** (`node benchmarks/run.js --provider mock --dimensions 64`):
+## Documentation
-| Local track | Audrey | Best Baseline |
-|---|---|---|
-| Combined local benchmark | **100.0%** | 41.7% |
-| Retrieval capabilities | **100.0%** | 56.3% |
-| Memory operations | **100.0%** | 25.0% |
-Retrieval-family breakdown:
-| Category | Audrey | Vector Only | Best Baseline |
-|---|---|---|---|
-| Information Extraction | 100% | 100% | 100% |
-| Knowledge Updates | 100% | 50% | 50% |
-| Multi-Session Reasoning | 100% | 100% | 100% |
-| Temporal Reasoning | 100% | 100% | 100% |
-| Abstention | 100% | 50% | 50% |
-| Conflict Resolution | 100% | 50% | 50% |
-| Procedural Learning | 100% | 0% | 0% |
-| Privacy | 100% | 0% | 0% |
-Operation-family breakdown:
-| Operation | Audrey | Vector Only | Best Baseline |
-|---|---|---|---|
-| Update / Overwrite | 100% | 50% | 50% |
-| Delete + Abstain | 100% | 0% | 50% |
-| Semantic Merge | 100% | 0% | 0% |
-| Procedural Merge | 100% | 0% | 0% |
-Published comparison anchors from the field (different benchmarks and conditions - included for field context, not direct comparison):
-| System | Benchmark | Score | What it represents |
-|---|---|---|---|
-| **Audrey** | Internal retrieval + operations benchmark | **100.0%** | Update, overwrite, delete, merge, abstention, consolidation, privacy |
-| MIRIX | Published LoCoMo | 85.4% | Typed multimodal memory |
-| Letta Filesystem | Published LoCoMo | 74.0% | Context-engineering |
-| Mem0 Graph Memory | Published LoCoMo | 68.5% | Graph memory |
-| Mem0 | Published LoCoMo | 66.9% | Production baseline |
-Primary comparison sources:
-- [MIRIX paper](https://arxiv.org/abs/2507.07957)
-- [Mem0 paper](https://arxiv.org/abs/2504.19413)
-- [Letta benchmark write-up](https://www.letta.com/blog/benchmarking-ai-agent-memory)
-- [LongMemEval paper](https://arxiv.org/abs/2410.10813)
-Benchmark guide: [docs/benchmarking.md](docs/benchmarking.md)
-## Repository
-- Contributing guide: [CONTRIBUTING.md](CONTRIBUTING.md)
-- Security policy: [SECURITY.md](SECURITY.md)
-- CI workflow: [.github/workflows/ci.yml](.github/workflows/ci.yml)
-- Benchmarking guide: [docs/benchmarking.md](docs/benchmarking.md)
+- [docs/benchmarking.md](docs/benchmarking.md)
+- [docs/production-readiness.md](docs/production-readiness.md)
+- [CONTRIBUTING.md](CONTRIBUTING.md)
+- [SECURITY.md](SECURITY.md)
 ## Development
 ```bash
 npm ci
 npm test
-npm run pack:check
-npm run bench:memory
-npm run bench:memory:retrieval
-npm run bench:memory:operations
 npm run bench:memory:check
-npm run bench:memory:readme-assets
+npm run pack:check
+python -m unittest discover -s python/tests -v
+python -m build --no-isolation python
 ```
-Current validated baseline:
-- `npm test`
-- `npm run pack:check`
-- `npm run bench:memory`
-- `npm run bench:memory:retrieval`
-- `npm run bench:memory:operations`
-- `npm run bench:memory:check`
-- `npm run bench:memory:readme-assets`
 ## License
 MIT. See [LICENSE](LICENSE).

package/dist/mcp-server/config.d.ts ADDED

@@ -0,0 +1,20 @@
+import type { AudreyConfig, EmbeddingConfig, LLMConfig } from '../src/types.js';
+export declare const VERSION = "0.20.0";
+export declare const SERVER_NAME = "audrey-memory";
+export declare const DEFAULT_DATA_DIR: string;
+export declare const MCP_ENTRYPOINT: string;
+export declare function resolveDataDir(env?: Record<string, string | undefined>): string;
+/**
+ * Resolves which embedding provider to use.
+ * Priority: explicit config -> gemini (if GOOGLE_API_KEY exists) -> local
+ * OpenAI is NEVER auto-selected -- must be set explicitly via AUDREY_EMBEDDING_PROVIDER=openai.
+ */
+export declare function resolveEmbeddingProvider(env: Record<string, string | undefined>, explicit?: string | undefined): EmbeddingConfig & {
+    dimensions: number;
+};
+export declare function resolveLLMProvider(env: Record<string, string | undefined>, explicit?: string | undefined): (LLMConfig & {
+    apiKey?: string;
+}) | null;
+export declare function buildAudreyConfig(): AudreyConfig;
+export declare function buildInstallArgs(env?: Record<string, string | undefined>): string[];
+//# sourceMappingURL=config.d.ts.map

package/dist/mcp-server/config.d.ts.map ADDED

@@ -0,0 +1 @@

+ {"version":3,"file":"config.d.ts","sourceRoot":"","sources":["../../mcp-server/config.ts"],"names":[],"mappings":"AAGA,OAAO,KAAK,EAAE,YAAY,EAAE,eAAe,EAAE,SAAS,EAAE,MAAM,iBAAiB,CAAC;AAEhF,eAAO,MAAM,OAAO,WAAW,CAAC;AAChC,eAAO,MAAM,WAAW,kBAAkB,CAAC;AAC3C,eAAO,MAAM,gBAAgB,QAAqC,CAAC;AACnE,eAAO,MAAM,cAAc,QAAwD,CAAC;AAyBpF,wBAAgB,cAAc,CAAC,GAAG,GAAE,MAAM,CAAC,MAAM,EAAE,MAAM,GAAG,SAAS,CAAe,GAAG,MAAM,CAE5F;AAED;;;;GAIG;AACH,wBAAgB,wBAAwB,CACtC,GAAG,EAAE,MAAM,CAAC,MAAM,EAAE,MAAM,GAAG,SAAS,CAAC,EACvC,QAAQ,GAAE,MAAM,GAAG,SAA4C,GAC9D,eAAe,GAAG;IAAE,UAAU,EAAE,MAAM,CAAA;CAAE,CAkB1C;AAED,wBAAgB,kBAAkB,CAChC,GAAG,EAAE,MAAM,CAAC,MAAM,EAAE,MAAM,GAAG,SAAS,CAAC,EACvC,QAAQ,GAAE,MAAM,GAAG,SAAsC,GACxD,CAAC,SAAS,GAAG;IAAE,MAAM,CAAC,EAAE,MAAM,CAAA;CAAE,CAAC,GAAG,IAAI,CAoB1C;AAED,wBAAgB,iBAAiB,IAAI,YAAY,CAehD;AAED,wBAAgB,gBAAgB,CAAC,GAAG,GAAE,MAAM,CAAC,MAAM,EAAE,MAAM,GAAG,SAAS,CAAe,GAAG,MAAM,EAAE,CAoChG"}