npm - bikky - Versions diffs - 0.3.12 → 0.4.0 - Mend

bikky 0.3.12 → 0.4.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (67) hide show

package/CONTRIBUTING.md +206 -0
package/README.md +116 -154
package/dist/config.d.ts +49 -1
package/dist/config.d.ts.map +1 -1
package/dist/config.js +125 -4
package/dist/config.js.map +1 -1
package/dist/daemon/extraction.d.ts.map +1 -1
package/dist/daemon/extraction.js +24 -19
package/dist/daemon/extraction.js.map +1 -1
package/dist/daemon/loop.d.ts.map +1 -1
package/dist/daemon/loop.js +15 -1
package/dist/daemon/loop.js.map +1 -1
package/dist/daemon/qdrant.d.ts.map +1 -1
package/dist/daemon/qdrant.js +0 -1
package/dist/daemon/qdrant.js.map +1 -1
package/dist/lib/qdrant-pool.d.ts +57 -0
package/dist/lib/qdrant-pool.d.ts.map +1 -0
package/dist/lib/qdrant-pool.js +104 -0
package/dist/lib/qdrant-pool.js.map +1 -0
package/dist/mcp/api.d.ts +56 -19
package/dist/mcp/api.d.ts.map +1 -1
package/dist/mcp/api.js +133 -72
package/dist/mcp/api.js.map +1 -1
package/dist/mcp/helpers.d.ts +0 -1
package/dist/mcp/helpers.d.ts.map +1 -1
package/dist/mcp/helpers.js +2 -15
package/dist/mcp/helpers.js.map +1 -1
package/dist/mcp/helpers.test.js +3 -21
package/dist/mcp/helpers.test.js.map +1 -1
package/dist/mcp/index.d.ts.map +1 -1
package/dist/mcp/index.js +29 -14
package/dist/mcp/index.js.map +1 -1
package/dist/mcp/tools.d.ts +0 -7
package/dist/mcp/tools.d.ts.map +1 -1
package/dist/mcp/tools.js +337 -219
package/dist/mcp/tools.js.map +1 -1
package/dist/mcp/types.d.ts +0 -3
package/dist/mcp/types.d.ts.map +1 -1
package/dist/routing.d.ts +53 -0
package/dist/routing.d.ts.map +1 -0
package/dist/routing.js +129 -0
package/dist/routing.js.map +1 -0
package/dist/routing.test.d.ts +2 -0
package/dist/routing.test.d.ts.map +1 -0
package/dist/routing.test.js +79 -0
package/dist/routing.test.js.map +1 -0
package/docs/config/fully-hosted.md +57 -0
package/docs/config/hosted-models.md +50 -0
package/docs/config/hosted-qdrant-local-models.md +39 -0
package/docs/config/local.md +34 -0
package/docs/configuration.md +374 -0
package/docs/screenshots/dashboard.png +0 -0
package/docs/screenshots/graph.png +0 -0
package/docs/screenshots/memory.png +0 -0
package/package.json +7 -4
package/dist/mcp/api.test.d.ts +0 -6
package/dist/mcp/api.test.d.ts.map +0 -1
package/dist/mcp/api.test.js +0 -130
package/dist/mcp/api.test.js.map +0 -1
package/dist/mcp/tools.integration.itest.d.ts +0 -23
package/dist/mcp/tools.integration.itest.d.ts.map +0 -1
package/dist/mcp/tools.integration.itest.js +0 -171
package/dist/mcp/tools.integration.itest.js.map +0 -1
package/dist/mcp/tools.test.d.ts +0 -16
package/dist/mcp/tools.test.d.ts.map +0 -1
package/dist/mcp/tools.test.js +0 -908
package/dist/mcp/tools.test.js.map +0 -1

package/CONTRIBUTING.md ADDED Viewed

@@ -0,0 +1,206 @@
+# Contributing to bikky
+Thanks for your interest in bikky! We welcome PRs of all sizes — from typo fixes to new daemon features. This document covers the practical bits: how the repo is laid out, how to run the tests, and what we look for in a contribution.
+## Repository layout
+bikky is a small monorepo:
+```
+.
+├── src/                  # Core CLI + MCP server + daemon (published as `bikky`)
+│   ├── cli/              # `bikky <subcommand>` entrypoints
+│   ├── daemon/           # Background workers: extraction, consolidation, staleness, …
+│   ├── mcp/              # MCP server (the surface AI agents call into)
+│   ├── prompts/          # Versioned LLM prompt registry
+│   └── llm/              # Provider adapters (OpenAI, Bedrock, Ollama, Portkey)
+│       ├── embedding/    #   embedding registry + providers
+│       └── inference/    #   chat-completion registry + providers
+└── packages/
+    └── ui/               # Local web UI (`bikky-ui`) — Hono server + React frontend
+        ├── src/lib/      #   - config, qdrant client, embeddings
+        ├── src/routes/   #   - REST API routes
+        └── app/          #   - React/Vite frontend
+```
+## Setup
+```bash
+git clone https://github.com/bikky-dev/bikky.git
+cd bikky
+npm install
+cd packages/ui && npm install && cd ../..
+```
+## Running the tests
+We use the Node.js built-in test runner ([`node:test`](https://nodejs.org/api/test.html)) — no Jest, no Vitest, no extra dependencies.
+```bash
+# Core (CLI, daemon, MCP server) — 300+ tests
+npm test
+# UI server + libraries — 50+ tests
+cd packages/ui && npm test
+```
+Both packages compile TypeScript into `dist/` first and then run the compiled `*.test.js` files. The UI test suite uses `--test-isolation=process --test-concurrency=1` because several tests share `~/.bikky/config.json` on the developer's machine; running the test files one at a time, each in its own process, avoids flakiness.
+> **Note on `~/.bikky/config.json`** — UI tests back up your real config in `before()` and restore it in `after()`. If a test crashes mid-run the file *should* survive, but if you ever see odd behaviour after a failed test run, just delete the file and re-run `bikky setup`.
+### What we test
+We aim for **focused, fast unit tests** that lock in behaviour without being a maintenance tax:
+- Pure functions (filter builders, hashers, parsers) — exhaustive cases.
+- Stateful modules (config loaders, lifecycle/PID, daemons) — happy path + a couple of failure modes.
+- Network clients (Qdrant, embeddings, LLM providers) — mock `globalThis.fetch` and assert on the request, never call a real backend.
+- HTTP routes (Hono) — exercise via `app.fetch(new Request(...))` against the real router with mocked underlying calls.
+We deliberately **do not** test:
+- LLM prompt quality or extraction accuracy. Those live in the separate [`bikky-evals`](https://github.com/bikky-dev/bikky-evals) repo, which uses DeepEval for prompt-level scoring.
+- Implementation details (private function internals, exact log strings) — these change often and tests that pin them slow contributors down.
+- The React frontend — the testable surface there is small; we rely on type-checking and manual smoke tests.
+### Adding a new test
+Tests live alongside the source as `*.test.ts`:
+```
+src/foo.ts       # source
+src/foo.test.ts  # tests
+```
+Use the [`node:test`](https://nodejs.org/api/test.html) `describe/it/before/after` API and `node:assert/strict`. For mocking, prefer **dependency injection** (e.g. the `StaleDeps` pattern in `src/daemon/staleness.ts`) over module mocking — it keeps tests deterministic and the production code easier to reason about.
+Good references for new tests:
+| Pattern                          | Reference                              |
+|----------------------------------|----------------------------------------|
+| Filesystem with backup/restore   | `src/lifecycle.test.ts`                |
+| Temp dir with `mkdtemp`          | `src/logger.test.ts`                   |
+| Env-based path override          | `src/llm/telemetry.test.ts`            |
+| Dependency injection for daemons | `src/daemon/staleness.test.ts`         |
+| Mocking `globalThis.fetch`       | `src/mcp/api.test.ts`, `packages/ui/src/lib/qdrant.test.ts` |
+| Hono route via `app.fetch`       | `packages/ui/src/routes/memory.test.ts` |
+### Integration tests (opt-in, real Qdrant)
+The default `npm test` mocks every external call. We also ship one **opt-in** end-to-end smoke test that talks to a real Qdrant instance (Cloud, local Docker, or self-hosted) and a real embedding provider — it's the only thing that catches filter-shape rejections, payload-index mismatches, and vector-dimension drift, and that shows whether the dedup similarity thresholds (`THRESHOLD_DUPLICATE`, `THRESHOLD_RELATED`) actually correspond to near-duplicates against your embedding model.
+```bash
+# Uses your existing ~/.bikky/config.json + QDRANT_URL (and QDRANT_API_KEY if your Qdrant requires it).
+BIKKY_INTEGRATION=1 npm run test:integration
+```
+What it does:
+1. Creates a throwaway collection named `bikky-it-<short-uuid>` with the real payload indexes.
+2. Exercises `memory_store` (insert, exact-dup, near-duplicate paraphrase), `memory_recall`, `memory_entity`, and `memory_forget` against live Qdrant + your real embeddings.
+3. Drops the collection in `after()` regardless of pass/fail.
+Cost is negligible — a handful of small embedding calls per run (≈ $0.0001 on OpenAI's `text-embedding-3-small`, free on Ollama). Files end in `.itest.ts` so the default `*.test.js` glob never picks them up.
+If the near-duplicate paraphrase doesn't reinforce on your embedding model, the test does not fail outright; instead it logs the actual similarity score so you can re-tune `THRESHOLD_DUPLICATE`.
+## Adding an embedding or LLM provider
+The most common contribution is **adding a new embedding or LLM provider**. Each provider is a single file. The registry dispatches by `provider.name`, so no central edits are required beyond adding one import line to the barrel.
+### Embedding provider
+1. Create `src/llm/embedding/providers/<name>.ts`:
+   ```ts
+   import {
+     registerEmbeddingProvider,
+     type EmbeddingProvider,
+     type ResolvedEmbeddingConfig,
+   } from "../registry.js";
+   export const myProvider: EmbeddingProvider = {
+     name: "myprovider",
+     label: "My Provider",
+     browserCompatible: true, // false if it needs a server-only SDK
+     defaults: {
+       model: "default-model",
+       dimensions: 1024,
+       baseUrl: "https://api.example.com", // omit if SDK-only
+     },
+     async embed(text, cfg) {
+       // cfg.{model,baseUrl,apiKey,extra} are pre-resolved
+       const resp = await fetch(`${cfg.baseUrl}/v1/embeddings`, { /* … */ });
+       // throw on programmer error; return number[] on success
+       return [/* embedding vector */];
+     },
+   };
+   registerEmbeddingProvider(myProvider);
+   ```
+2. Add a side-effect import in `src/llm/embedding/providers/index.ts`:
+   ```ts
+   import "./myprovider.js";
+   ```
+3. Add a small unit test next to your provider (`<name>.test.ts`). Mock
+   `globalThis.fetch` (see `ollama.test.ts` for the pattern). Cover at minimum:
+   - success path (verifies URL, headers, body shape)
+   - non-OK response handling
+   - any provider-specific behaviour (auth, extra headers, fallback fields)
+4. If your provider is browser-friendly, mirror it under
+   `packages/ui/src/lib/embedding/providers/<name>.ts` so the UI can use it.
+5. Configure it in `~/.bikky/config.json`:
+   ```json
+   {
+     "embedding": {
+       "provider": "myprovider",
+       "model": "my-model",
+       "api_key": "…",
+       "extra": { "any-key": "any-value" }
+     }
+   }
+   ```
+   Or via env: `BIKKY_EMBEDDING_EXTRA_<KEY>=value` flows into `extra`.
+### Inference (LLM) provider
+Same pattern, under `src/llm/inference/providers/`. The interface is
+`InferenceProvider` (see `src/llm/inference/types.ts`), the key method is
+`chat(opts, cfg, log)`, and providers should **return `null`** on recoverable
+errors (HTTP error, missing key, network failure) so the orchestrator can fall
+back to `cfg.fallback` if configured. Throw only for programmer errors.
+Configure a fallback chain via `llm.fallback_provider` in config (or
+`LLM_FALLBACK_PROVIDER` env).
+## Submitting changes
+1. **Open an issue first** for non-trivial changes so we can align on the approach.
+2. **Branch** from `main` (`git checkout -b your-feature-name`).
+3. **Run the tests** in both packages before pushing.
+4. **Open a PR** referencing the issue (`Closes #123`). CI will re-run tests on push.
+5. We aim to review within a few business days — ping the issue if it goes quiet.
+## Style
+- TypeScript strict mode is on; no `any` unless interfacing with external SDK types (use a focused local interface to constrain the surface area).
+- We prefer small, pure functions and clear module boundaries to elaborate abstractions.
+- Tests live next to the source they cover (`foo.ts` + `foo.test.ts`).
+- Providers must not call `process.exit`, log to stdout, or modify global state beyond their own module-scope cache.
+- Heavy SDKs (e.g. `@aws-sdk/*`) **must be `await import(...)`-loaded inside the provider's `embed`/`chat`** so users on lighter providers don't pay the bundle cost.
+- Comments explain *why*, not *what* — the code shows the *what*.
+## License
+By contributing, you agree that your contributions will be licensed under the project's [AGPL-3.0-or-later](LICENSE) license.
+## Code of conduct
+Be kind. We follow the [Contributor Covenant](https://www.contributor-covenant.org/version/2/1/code_of_conduct/).

package/README.md CHANGED Viewed

@@ -1,196 +1,177 @@
 <h1 align="center">bikky</h1>
-<p align="center"><b>Persistent memory for AI coding agents — for teams, and for solo power users.</b></p>
+<p align="center"><b>Persistent memory for AI coding agents — built for teams and multi-agent engineering workflows.</b></p>
-bikky gives AI coding agents (GitHub Copilot, Claude Code, Cursor, and other MCP clients) long-term memory that persists across sessions, across tools, and across your whole team. Whether you're a team that wants every engineer's agent to start from the same knowledge base, or a solo power dev running a dozen agentic sessions a day, bikky captures what's learned *during* sessions so future sessions start smarter.
+bikky gives AI coding agents (GitHub Copilot, Claude Code, Cursor, and other MCP clients) long-term memory that persists across sessions, across tools, and across your whole team. When multiple engineers, agents, or repos need to build on the same knowledge base, bikky captures what's learned *during* sessions so future sessions start smarter.
 ### Who it's for
-| | |
-|---|---|
-| 👥 **Teams & software factories** | What one engineer's agent learns today, every agent on the team can recall tomorrow. Shared memory turns institutional knowledge into something queryable instead of tribal — onboarding accelerates, conventions stop drifting, and the same lesson never gets re-learned twice. |
-| 🧑‍💻 **Solo AI power devs** | You run multiple Cursor / Claude Code / Copilot sessions every day and you're tired of re-explaining the codebase, the conventions, and last week's decisions to each new agent. bikky remembers across every session and every tool. |
+- 👥 **Teams & software factories** — What one engineer's agent learns today, every agent on the team can recall tomorrow. Shared memory turns institutional knowledge into something queryable instead of tribal — onboarding accelerates, conventions stop drifting, and the same lesson never gets re-learned twice.
+- 🤖 **Multi-agent engineering workflows** — Multiple Cursor / Claude Code / Copilot sessions can share codebase context, conventions, and recent decisions instead of re-learning them from scratch.
 <p align="center">
-  <img src="https://cdn.jsdelivr.net/npm/bikky@latest/docs/diagrams/team-memory.svg" alt="Memory — facts flow from individual sessions into a self-curating knowledge store, shared across your team (or kept just for you)" width="720" />
+  <img src="https://cdn.jsdelivr.net/npm/bikky@latest/docs/diagrams/team-memory.svg" alt="Memory — facts flow from individual sessions into a self-curating knowledge store shared across your team" width="720" />
 </p>
-<p align="center"><i>Knowledge flows from every session into a store that curates itself over time — deduplicating, distilling, and decaying stale facts — so every future session starts smarter. Share the workspace across a team, or keep it solo.</i></p>
+<p align="center"><i>Knowledge flows from every session into a store that curates itself over time — deduplicating, distilling, and decaying stale facts — so every future session starts smarter across the team.</i></p>
 ---
 ### The problem
-The most valuable things you and your agents learn — why a config value exists, which deploy step matters, what broke last quarter, the convention you settled on yesterday — happen *during* sessions. And then they vanish when the session closes. Whether you're a team — where knowledge lives in heads, chat threads, and closed PRs, and every new engineer's agent has to learn it from scratch — or a solo power dev juggling dozens of agentic sessions a day across multiple tools that don't remember each other, it's the same wall. Hand-written docs drift the moment they're published.
+The most valuable things you and your agents learn — why a config value exists, which deploy step matters, what broke last quarter, the convention you settled on yesterday — happen *during* sessions. And then they vanish when the session closes. Across teams, repos, and tools, knowledge still lives in heads, chat threads, and closed PRs, and every new agent session has to learn it from scratch. Hand-written docs drift the moment they're published.
 ### How bikky solves it
-| | |
-|---|---|
-| **Capture** | Facts are extracted automatically from session transcripts — no manual docs to write |
-| **Recall** | Every new session — yours or a teammate's — recalls from the same store via semantic search |
-| **Curate** | Deduplication, confidence decay, contradiction detection, and distillation run autonomously |
-| **Compound** | Session 50 is dramatically better than session 1 — accumulated memory, not better prompts |
+bikky gives your agent memory tools and runs a small background service after `bikky setup`. You keep working normally; bikky captures useful facts, organizes them, recalls them in future sessions, and keeps the store tidy over time.
+- **Capture** — Facts are extracted automatically from session transcripts; no manual docs to write.
+- **Classify** — Memories are grouped as **engineering**, **product**, **human**, or **system** so they stay easy to browse and filter.
+- **Recall** — Every new session, yours or a teammate's, recalls from the same store via semantic search.
+- **Curate** — bikky merges duplicates, fades stale facts, resolves contradictions, distills recurring patterns, and builds an entity graph over time.
+- **Compound** — Session 50 is dramatically better than session 1 because memory accumulates.
+- **Route** — Optionally keep team, client, or environment-specific memory in separate Qdrant destinations from one install. See [separate memory stores](#optional-separate-memory-stores).
+Subtypes keep recall precise without making setup harder:
+- **Engineering** — codebase maps, architecture decisions, infra topology, access patterns, operational procedures, troubleshooting gotchas, and conventions.
+- **Product** — domain rules, product decisions, requirements, user workflows, roadmap items, success metrics, and market insights.
+- **Human** — preferences, person profiles, ownership notes, working agreements, and activity events.
+- **System** — session indexes, episodes, workstreams, and feedback signals.
 ---
 ## Quick start
-The fastest way to try bikky: **100% local, free, no accounts** — Qdrant in Docker, embeddings via Ollama.
+This is the fastest path to a working memory store: Qdrant runs locally, while hosted embeddings and LLM calls provide strong extraction and recall quality without running local models.
 ```bash
 # 1. Pull and run Qdrant (vector store)
 docker run -d --name qdrant -p 6333:6333 -v qdrant_storage:/qdrant/storage qdrant/qdrant
-# 2. Install Ollama (https://ollama.com) and pull the default embedding model
-ollama pull qwen3-embedding:0.6b
-# 3. Install and start bikky
+# 2. Install bikky
 npm install -g bikky
-echo '{ "qdrant_url": "http://localhost:6333" }' > ~/.bikky/config.json
+mkdir -p ~/.bikky
+# Replace sk-... below with your hosted model API key.
+cat > ~/.bikky/config.json <<'JSON'
+{
+  "qdrant_url": "http://localhost:6333",
+  "qdrant_api_key": "",
+  "embedding": {
+    "provider": "openai",
+    "model": "text-embedding-3-small",
+    "dimensions": 1536,
+    "api_key": "sk-..."
+  },
+  "llm": {
+    "provider": "openai",
+    "model": "gpt-4.1-mini",
+    "api_key": "sk-..."
+  }
+}
+JSON
+# qdrant_api_key is optional; leave it empty or omit it for local Qdrant.
+# Prefer env vars? Omit api_key above and set OPENAI_API_KEY instead.
+# 3. Register bikky with your editor and start the background service
 bikky setup            # writes MCP config for Copilot + Claude Code, then starts the daemon
 ```
-Restart your editor — the memory tools (`memory_store`, `memory_recall`, …) appear automatically.
+Restart your editor. The memory tools appear automatically in supported MCP clients.
 ```bash
-bikky status           # validate config, Qdrant, embeddings, daemon, and UI health
+bikky status           # confirms Qdrant, embeddings, daemon, and UI health
 ```
-That's the whole thing. From here you can swap any piece (hosted Qdrant, OpenAI / Bedrock embeddings, a hosted LLM for richer daemon distillation) — see **Setup** below.
+That's it. You can keep Qdrant local forever, or move the vector store to Qdrant Cloud later for a shared team setup.
+For other deployment shapes — fully hosted, 100% local, or hosted Qdrant with local models — see [Setup options](#setup-options).
 ---
-## Setup
+## Setup options
-### Prerequisites
+bikky supports four common setup shapes. Pick based on where you want Qdrant to run and where model calls should happen.
-| | Required | Options |
-|---|---|---|
-| **Node.js** | ≥ 20 | `nvm install 20` or your package manager |
-| **Vector store** | Qdrant | **Local Docker** (free, recommended for dev) · **[Qdrant Cloud](https://cloud.qdrant.io)** (free tier, 1 GB) · **Self-hosted** anywhere reachable |
-| **Embeddings** | One provider | **[Ollama](https://ollama.com)** local (free, default) · **OpenAI** · **AWS Bedrock** · **[Portkey](https://portkey.ai)** gateway |
-| **LLM** *(optional)* | Used by the daemon for distillation & extraction | Same provider list as embeddings — leave on Ollama for a fully-local stack |
-| **Docker** *(optional)* | Only if you run Qdrant locally | Docker Desktop, OrbStack, colima, etc. |
+### What you need
-### Install
+| Component               | Required                       | Options                                                                                  |
+| ----------------------- | ------------------------------ | ---------------------------------------------------------------------------------------- |
+| **Node.js**             | ≥ 20                           | `nvm install 20` or your package manager                                                 |
+| **Vector store**        | Qdrant                         | Local Docker · [Qdrant Cloud](https://cloud.qdrant.io) · Self-hosted                     |
+| **Embeddings**          | One provider                   | OpenAI · Ollama · Bedrock · Portkey                                                     |
+| **LLM**                 | One provider                   | OpenAI · Ollama · Bedrock · Portkey                                                     |
+| **Docker** *(optional)* | Only if you run Qdrant locally | Docker Desktop, OrbStack, colima, etc.                                                   |
-```bash
-npm install -g bikky          # CLI + MCP server + daemon
-npm install -g bikky-ui       # optional web dashboard
-```
+Both `embedding.provider` and `llm.provider` accept the same values: `ollama`, `openai`, `bedrock`, or `portkey`.
-### Pick your stack
+> ⚠️ **Qdrant Cloud free tier does not include automatic backups.** Deleted collections cannot be recovered. If your memory data is valuable, use a paid Qdrant Cloud plan (which includes daily backups), run Qdrant locally with your own backup strategy, or periodically export snapshots via the [Qdrant snapshots API](https://qdrant.tech/documentation/concepts/snapshots/).
-- **Fully local & free** — Qdrant in Docker + Ollama. Best for solo dev, no data leaves your machine. (See Quick start.)
-- **Hosted Qdrant + local Ollama** — Qdrant Cloud free tier for shared/team memory; embeddings still local.
-- **Fully hosted** — Qdrant Cloud + OpenAI / Bedrock / Portkey for embeddings and LLM. Best for teams that want a single shared memory across many machines.
+### Choose a setup
-### Configure
+| Setup                            | Best for                                                       | Config                                                                    |
+| -------------------------------- | -------------------------------------------------------------- | ------------------------------------------------------------------------- |
+| **Fully hosted**                 | Best performance and teams; managed vector storage and models  | [Fully hosted config][fully-hosted-config]                              |
+| **Local Qdrant + hosted models** | Local vector storage with hosted extraction and embedding      | [Hosted models config][hosted-models-config]                            |
+| **Local and free**               | Local evaluation; quality depends on local models              | [Local config guide][local-config]                                      |
+| **Hosted Qdrant + local Ollama** | Shared vector storage while keeping model calls local          | [Hosted Qdrant + local models][hosted-qdrant-local-models-config]       |
-Three ways to provide credentials, pick one:
+### Configuration basics
-```bash
-# A) Let your agent do it
-> "Call configure_credentials with my Qdrant URL (and API key if needed)"
+Pick the setup guide above for the copy-paste config. All setup shapes use the same three building blocks:
-# B) Config file (~/.bikky/config.json)
-echo '{ "qdrant_url": "http://localhost:6333" }' > ~/.bikky/config.json
+- **Qdrant** — where vectors and memory payloads are stored.
+- **Embeddings** — how facts become searchable vectors.
+- **LLM** — how session transcripts are extracted, curated, and distilled.
-# C) Environment variables
-export QDRANT_URL="http://localhost:6333"
-# export QDRANT_API_KEY="…"   # only for Qdrant Cloud / authenticated self-hosted
-```
+Config lives at `~/.bikky/config.json`, or at `BIKKY_HOME/config.json` when `BIKKY_HOME` is set. You can keep credentials out of the file with environment variables such as `QDRANT_URL`, `QDRANT_API_KEY`, and provider API keys.
-> 💡 **Tip:** Set `BIKKY_HOME` to relocate the config dir (defaults to `~/.bikky/`). Useful for tests, multiple profiles, or sandboxed setups.
+For hosted models, custom providers, multiple profiles, or advanced tuning, use the full configuration guide.
-> 📖 **Full configuration reference** — providers, models, daemon settings, env vars, copy-paste examples for every stack: **[docs/configuration.md](docs/configuration.md)**
+> 📖 **Full configuration guide:** [docs/configuration.md][configuration-guide]
 >
-> 🛠 Want to add a new embedding or LLM provider (Vertex, OpenRouter, etc.)? See **[CONTRIBUTING.md](CONTRIBUTING.md)** — it's a single-file change.
----
-## How it works
-<p align="center">
-  <img src="https://cdn.jsdelivr.net/npm/bikky@latest/docs/diagrams/architecture.svg" alt="Architecture" width="600" />
-</p>
-**MCP Server** — tools your agent calls directly:
-`memory_store` · `memory_recall` · `memory_entity` · `memory_relations` · `memory_forget` · `memory_verify` · `memory_heartbeat` · `memory_review` · `configure_credentials` · `verify_connection`
-**Daemon** — background process that passively watches session logs, extracts structured facts, writes lightweight session indexes, captures coherent episode summaries, updates current-state workstream summaries, infers entity relationships from recently changed facts, and runs the consolidation pipeline. Lifecycle memory is daemon-owned so agents do not need to remember summary/distillation tool calls.
----
-## Memory ontology
-bikky separates what a memory is about from where it came from. New captures use four top-level categories, concrete subtypes, small object kinds, activity domains, and provenance fields:
-```text
-Workspace
-  Domain
-    Project / repo / surface
-      Workstream
-        Episodes
-          Facts, decisions, preferences, activity events, operational notes
-        Current-state summaries
-          What matters now, open questions, blockers
-    Cross-cutting memory
-      Durable patterns, entity relationships, telemetry
+> 🛠 Want to add a new embedding or LLM provider (Vertex, OpenRouter, etc.)? See **[CONTRIBUTING.md][contributing]** — it's a single-file change.
+#### Optional: separate memory stores
+Most installs use one Qdrant destination. If you need clean separation later, replace the single `qdrant_url` / `collection` fields with named `destinations[]`:
+```jsonc
+{
+  "destinations": [
+    {
+      "name": "platform",
+      "qdrant_url": "https://platform.cloud.qdrant.io:6333",
+      "qdrant_api_key": "...",
+      "collection": "bikky-platform",
+      "default": true
+    },
+    {
+      "name": "client-a",
+      "qdrant_url": "https://client-a.cloud.qdrant.io:6333",
+      "qdrant_api_key": "...",
+      "collection": "bikky-client-a"
+    }
+  ]
+}
 ```
-This gives each memory enough context to be recalled precisely without forcing every note into a rigid project hierarchy.
-`category` is the broad subject area:
-| Category | Captures |
-|----------|----------|
-| `engineering` | Codebase maps, architecture decisions, infrastructure topology, access patterns, operational procedures, troubleshooting gotchas, and engineering conventions |
-| `product` | Domain rules, product decisions, requirements, user workflows, roadmap items, success metrics, and market insight |
-| `human` | Preferences, person profiles, ownership notes, working agreements, and durable actor-action activity events |
-| `system` | Bikky lifecycle memory: session indexes, episodes, workstreams, recall/feedback/outcome telemetry, and aggregate rollups |
-`memory_subtype` is the precise capture shape inside a category:
-| Category | Subtypes |
-|----------|----------|
-| `engineering` | `codebase_map`, `architecture_decision`, `infra_topology`, `access_pattern`, `operational_procedure`, `troubleshooting_gotcha`, `convention` |
-| `product` | `domain_rule`, `product_decision`, `product_requirement`, `user_workflow`, `roadmap_item`, `success_metric`, `market_insight` |
-| `human` | `preference`, `person_profile`, `ownership_note`, `working_agreement`, `activity_event` |
-| `system` | `session_index`, `episode`, `workstream`, `recall_event`, `feedback_event`, `outcome_event`, `aggregate_rollup` |
-`domain` is an activity/knowledge profile. The initial canonical domains are:
-| Domain | Purpose |
-|--------|---------|
-| `software_engineering` | Default for coding-agent captures: repos, code, infrastructure, releases, incidents |
-| `product_strategy` | Roadmap, positioning, experiments, customer insight, product decisions |
-| `business_operations` | Company processes, vendors, compliance, obligations, recurring workflows |
-| `research` | Source-backed investigation, hypotheses, contradictions, synthesis |
-| `personal_productivity` | Individual goals, routines, preferences, projects, habits |
-`kind` stays small (`fact`, `summary`, `distilled`, `relation`, `telemetry`). `source` is the creator class (`agent`, `system`, `user`, or `docs`). `actor_id` records the stable person or agent associated with a capture/action, and `workspace_id` scopes shared team memory. Legacy stored categories are read through compatibility aliases; this release does not migrate existing stored memories in place.
+That is enough for explicit selection in the UI and tools. Add routing rules only when you want automatic placement by cwd, entity, content, or metadata. Existing single-Qdrant configs continue to work.
----
-## Self-curation
-Raw fact accumulation creates noise. bikky keeps the knowledge store clean automatically:
+> 📖 **Details:** [multi-destination configuration](docs/configuration.md#multi-destination-routing)
-- **Deduplication** — content hash + vector similarity merges near-identical facts
-- **Ontology scope fields** — optional `workspace_id`, repo, workstream, and episode metadata make recall more precise
-- **Confidence decay** — old facts lose weight and surface for review
-- **Contradiction detection** — conflicting facts are resolved, not silently stacked
-- **Distillation** — recurring patterns across sessions consolidate into higher-level insights
-- **Entity graph** — relationships between concepts are inferred incrementally for richer recall
+[fully-hosted-config]: https://cdn.jsdelivr.net/npm/bikky@latest/docs/config/fully-hosted.md
+[hosted-models-config]: https://cdn.jsdelivr.net/npm/bikky@latest/docs/config/hosted-models.md
+[local-config]: https://cdn.jsdelivr.net/npm/bikky@latest/docs/config/local.md
+[hosted-qdrant-local-models-config]: https://cdn.jsdelivr.net/npm/bikky@latest/docs/config/hosted-qdrant-local-models.md
+[configuration-guide]: https://cdn.jsdelivr.net/npm/bikky@latest/docs/configuration.md
+[contributing]: https://cdn.jsdelivr.net/npm/bikky@latest/CONTRIBUTING.md
 ---
 ## Web UI
-[`bikky-ui`](packages/ui) is a local dashboard for browsing and managing your team's memory — facts, entities, quality metrics, aggregate impact insights, and the relationship graph.
+[`bikky-ui`](https://www.npmjs.com/package/bikky-ui) is a local dashboard for browsing and managing your team's memory — facts, entities, quality metrics, aggregate impact insights, and the relationship graph.
 ```bash
 npx bikky-ui          # one-shot — no install needed
@@ -200,17 +181,17 @@ bikky-ui              # opens http://localhost:1422
 ```
 <p align="center">
-  <img src="https://cdn.jsdelivr.net/npm/bikky@latest/docs/screenshots/dashboard.png" alt="Dashboard — overview stats, category breakdown, recent facts" width="720" />
+  <img src="docs/screenshots/dashboard.png" alt="Dashboard — overview stats, category breakdown, recent facts" width="720" />
 </p>
 <p align="center"><i>Dashboard — memory stats, category breakdown, and recent facts at a glance</i></p>
 <p align="center">
-  <img src="https://cdn.jsdelivr.net/npm/bikky@latest/docs/screenshots/memory.png" alt="Memory browser — search, filter, and browse all stored facts" width="720" />
+  <img src="docs/screenshots/memory.png" alt="Memory browser — search, filter, and browse all stored facts" width="720" />
 </p>
 <p align="center"><i>Memory browser — search, filter by category/kind/source, and browse all stored facts</i></p>
 <p align="center">
-  <img src="https://cdn.jsdelivr.net/npm/bikky@latest/docs/screenshots/graph.png" alt="Entity graph — interactive visualization of entity relationships" width="720" />
+  <img src="docs/screenshots/graph.png" alt="Entity graph — interactive visualization of entity relationships" width="720" />
 </p>
 <p align="center"><i>Entity graph — interactive visualization of how concepts, people, and services relate</i></p>
@@ -229,26 +210,7 @@ bikky ui        # launch the local web dashboard
 bikky render    # render a prompt to JSON (for eval harnesses & debugging)
 ```
-`bikky status` is the first thing to run when setup feels wrong. It validates the
-config file, highlights env vars that override it, checks Qdrant reachability and
-payload-index readiness without mutating the collection, runs a live embedding
-smoke check, validates the configured LLM provider name without sending a chat
-request, and reports daemon maintenance plus UI health. Use `bikky status --json` for automation,
-`--no-live` to skip the embedding call, and `--no-ui` to skip the local UI probe.
-### `bikky render` — inspect prompts
-Render any of bikky's prompts to JSON without booting the MCP server. Useful for
-external evaluation harnesses, prompt debugging, and reproducing model calls.
-```bash
-bikky render --list                                    # list available prompts
-echo '{"transcript":"..."}' | bikky render extraction  # via stdin
-bikky render extraction --input case.json              # via file
-```
-Output: a JSON object with `promptName`, `messages`, `temperature`,
-`max_tokens`, and `response_format` — exactly what bikky sends to the LLM.
+`bikky status` is the first thing to run when setup feels wrong. It checks the config, Qdrant, embeddings, background daemon, and local UI health, then tells you what needs attention. Use `bikky status --json` for automation.
 ## License

package/dist/config.d.ts CHANGED Viewed

@@ -76,11 +76,48 @@ export interface WatcherConfig {
         path: string;
     };
 }
+/**
+ * Match rules for one Qdrant routing target (a destination's `match` block).
+ * Each rule is a list of regex strings; `metadata` keeps one list per key.
+ * OR semantics within a destination's match block, first-match-wins across
+ * destinations.
+ */
+export interface DestinationMatch {
+    /** Match against `process.cwd()`. */
+    cwd?: string[];
+    /** Match against any of the input `entities`. */
+    entity?: string[];
+    /** Match against the input `content`. */
+    content?: string[];
+    /** Per-key match against the input `metadata`. */
+    metadata?: Record<string, string[]>;
+}
+/**
+ * One Qdrant routing target: a named connection (URL, API key, collection)
+ * plus the optional rules that route memory operations to it.
+ */
+export interface Destination {
+    /** Stable, unique name. Used as the `destination` override on tool calls. */
+    name: string;
+    /** URL of this destination's Qdrant instance. */
+    qdrant_url: string;
+    /** API key for this destination; `null` presumably means no key is sent (TODO confirm). */
+    qdrant_api_key: string | null;
+    /** Name of the Qdrant collection used by this destination. */
+    collection: string;
+    /** Marks this destination as the fallback when no rule matches. */
+    default?: boolean;
+    /** Routing rules. Omit for a destination that is only reachable by override. */
+    match?: DestinationMatch;
+}
 export interface BikkyConfig {
+    /**
+     * Top-level Qdrant fields. When `destinations` is empty, a single default
+     * destination is synthesized from these — keeps single-Qdrant configs
+     * working without changes.
+     */
     qdrant_url: string | null;
     qdrant_api_key: string | null;
     collection: string;
-    default_workspace: string | null;
+    /**
+     * One or more Qdrant routing targets. Memory operations resolve to a
+     * destination via override → cwd/entity/content/metadata regex match →
+     * default flag → first entry.
+     */
+    destinations: Destination[];
     aws_profile: string | null;
     embedding: EmbeddingConfig;
     llm: LLMConfig;
@@ -107,6 +144,17 @@ export declare function validateConfigObject(raw: unknown): ConfigIssue[];
 export declare function inspectConfigFile(configPath?: string): ConfigFileDiagnostics;
 export declare function getActiveConfigEnvOverrides(env?: NodeJS.ProcessEnv): string[];
 export declare function loadConfig(): BikkyConfig;
+/**
+ * Resolve the effective list of destinations from the loaded config.
+ *
+ * - If `destinations` is non-empty, return as-is.
+ * - Otherwise synthesize a single fallback destination from the top-level
+ *   `qdrant_url` / `qdrant_api_key` / `collection` so existing single-Qdrant
+ *   configs keep working without changes.
+ * - If neither is configured, returns an empty array — callers should treat
+ *   that as "Qdrant not configured" the same way they did before.
+ *
+ * @param config - Config to resolve from. Optional; presumably falls back to
+ *   the loaded config when omitted (TODO confirm against the implementation).
+ * @returns The destinations to use, or an empty array when Qdrant is not
+ *   configured.
+ */
+export declare function getEffectiveDestinations(config?: BikkyConfig): Destination[];
 /** Save config to disk (used by setup command). */
 export declare function saveConfig(config: BikkyConfig): void;
 /** Reset cached config (for testing). */