@andespindola/brainlink 0.1.0-beta.10 → 0.1.0-beta.101

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (52) hide show
  1. package/AGENTS.md +8 -5
  2. package/CHANGELOG.md +26 -2
  3. package/CONTRIBUTING.md +2 -2
  4. package/COPYRIGHT.md +5 -0
  5. package/README.md +138 -16
  6. package/SECURITY.md +1 -1
  7. package/dist/application/analyze-vault.js +1 -9
  8. package/dist/application/build-context.js +56 -1
  9. package/dist/application/dedupe-notes.js +226 -0
  10. package/dist/application/frontend/client-css.js +93 -45
  11. package/dist/application/frontend/client-html.js +34 -25
  12. package/dist/application/frontend/client-js.js +3153 -140
  13. package/dist/application/frontend/client-worker-js.js +66 -0
  14. package/dist/application/get-graph-layout.js +17 -5
  15. package/dist/application/get-graph-node.js +3 -3
  16. package/dist/application/get-graph-summary.js +3 -3
  17. package/dist/application/get-graph.js +3 -3
  18. package/dist/application/import-legacy-sqlite.js +296 -0
  19. package/dist/application/index-vault.js +252 -19
  20. package/dist/application/list-agents.js +3 -3
  21. package/dist/application/list-links.js +5 -5
  22. package/dist/application/offline-pack-backup.js +44 -0
  23. package/dist/application/search-graph-node-ids.js +3 -3
  24. package/dist/application/search-knowledge.js +25 -10
  25. package/dist/application/server/routes.js +76 -1
  26. package/dist/application/start-server.js +75 -4
  27. package/dist/application/watch-vault.js +23 -2
  28. package/dist/benchmarks/large-vault.js +1 -1
  29. package/dist/cli/commands/agent-commands.js +7 -0
  30. package/dist/cli/commands/write-commands.js +818 -8
  31. package/dist/domain/context.js +53 -11
  32. package/dist/domain/graph-layout.js +47 -2
  33. package/dist/domain/middle-out.js +18 -0
  34. package/dist/infrastructure/config.js +38 -0
  35. package/dist/infrastructure/file-index.js +358 -0
  36. package/dist/infrastructure/file-system-vault.js +15 -0
  37. package/dist/infrastructure/index-state.js +56 -0
  38. package/dist/infrastructure/private-pack-codec.js +134 -0
  39. package/dist/infrastructure/search-packs.js +452 -0
  40. package/dist/mcp/server.js +11 -1
  41. package/dist/mcp/tools.js +62 -0
  42. package/docs/AGENT_USAGE.md +97 -16
  43. package/docs/ARCHITECTURE.md +23 -26
  44. package/docs/QUICKSTART.md +7 -0
  45. package/package.json +6 -4
  46. package/dist/infrastructure/sqlite/document-writer.js +0 -51
  47. package/dist/infrastructure/sqlite/graph-reader.js +0 -267
  48. package/dist/infrastructure/sqlite/recovery.js +0 -83
  49. package/dist/infrastructure/sqlite/schema.js +0 -114
  50. package/dist/infrastructure/sqlite/search-reader.js +0 -188
  51. package/dist/infrastructure/sqlite/types.js +0 -1
  52. package/dist/infrastructure/sqlite-index.js +0 -38
package/AGENTS.md CHANGED
@@ -6,19 +6,19 @@ This file tells coding agents and AI assistants how to use this repository.
6
6
 
7
7
  Brainlink is a local-first knowledge memory for agents.
8
8
 
9
- It reads a Markdown vault, extracts `[[wiki links]]` and `#tags`, builds a local SQLite full-text index, and returns compact context packages that agents can inject into prompts.
9
+ It reads a Markdown vault, extracts `[[wiki links]]` and `#tags`, builds a local file index at `.brainlink/index.json`, and returns compact context packages that agents can inject into prompts.
10
10
 
11
11
  ## Source Of Truth
12
12
 
13
13
  Markdown files are the source of truth.
14
14
 
15
- The SQLite database at `.brainlink/brainlink.db` is a derived index. It can be deleted and rebuilt with:
15
+ The JSON index at `.brainlink/index.json` is derived. It can be deleted and rebuilt with:
16
16
 
17
17
  ```bash
18
18
  npm run dev -- index --vault ./vault
19
19
  ```
20
20
 
21
- Do not store permanent knowledge only in SQLite.
21
+ Do not store permanent knowledge only in index artifacts.
22
22
 
23
23
  By default, the installed Brainlink CLI uses `$HOME/.brainlink/vault` as its vault. Passing `--vault` or setting `vault` in `brainlink.config.json` intentionally selects a custom vault such as `./vault`.
24
24
 
@@ -83,6 +83,9 @@ Use watch mode while editing notes:
83
83
  ```bash
84
84
  npm run dev -- server --vault ./vault --watch
85
85
  npm run dev -- watch --vault ./vault
86
+ npm run dev -- bench --vault ./vault
87
+ npm run dev -- bench --vault ./vault --watch
88
+ npm run dev -- pack-backup --vault ./vault
86
89
  ```
87
90
 
88
91
  Start MCP over stdio:
@@ -107,10 +110,10 @@ npm run dev -- doctor --vault ./vault
107
110
 
108
111
  - Keep domain rules in `src/domain`.
109
112
  - Keep use cases in `src/application`.
110
- - Keep filesystem and SQLite details in `src/infrastructure`.
113
+ - Keep filesystem and index details in `src/infrastructure`.
111
114
  - Keep CLI concerns in `src/cli`.
112
115
  - Prefer pure functions for parsing, ranking, formatting, and transformation.
113
- - Do not make SQLite the canonical storage layer.
116
+ - Do not make index artifacts the canonical storage layer.
114
117
  - Do not add comments with emojis.
115
118
  - Keep JSON output backwards compatible where possible.
116
119
 
package/CHANGELOG.md CHANGED
@@ -22,6 +22,30 @@
22
22
  - Added short-lived hybrid search cache with automatic invalidation on index changes.
23
23
  - Added `stats --extended` observability output with storage, quality and latency probes.
24
24
  - Added `docs/QUICKSTART.md` and aligned README/agent docs with the latest CLI/MCP flows.
25
+ - Added middle-out context assembly so chunk selection expands around the strongest note chunk.
26
+ - Added compressed-space pack prefiltering (token bloom index) before `.blpk` decryption and scan.
27
+ - Improved graph UI auto-fit and viewport recovery so loaded nodes are re-centered when zoom/pan drifts to empty canvas.
28
+ - Added cross-platform native desktop GUI auto-open for `blink server` (macOS Swift/WebKit, Windows PowerShell WinForms, Linux Python GTK/WebKit2), with app-window/browser fallback.
29
+ - Changed Linux default UI launch to app-window/browser for lighter startup; Linux native GUI is now opt-in via `BRAINLINK_LINUX_NATIVE_GUI=1`.
30
+ - Added native GUI parent-process monitoring so GUI windows close automatically when `blink server` stops.
31
+ - Improved non-mac browser detection fallback to try installed Edge/Chrome/Firefox/Chromium candidates before system default open.
32
+ - Improved graph filter rendering to keep hub anchor nodes visible (`Memory Hub`/`MOC`/high-degree fallback) for coherent relationship context.
33
+ - Fixed graph modal content loading by correcting agent query parameter composition for `/api/graph-node` and `/api/graph-filter` requests.
34
+ - Improved 50k+ graph rendering performance with viewport-aware spatial node culling, cached render visibility, and node-adjacent edge selection to avoid full graph scans every frame.
35
+ - Added incremental vault indexing with file snapshots to reuse unchanged documents/chunks/embeddings, plus adaptive search-pack rebuild thresholds to avoid full re-compression on small edits.
36
+ - Reduced large-graph HTTP payload size with compact `/api/graph-layout` encoding for high-node vaults and capped transmitted edges to improve UI load responsiveness.
37
+ - Added aggressive graph LOD clustering when zoomed out, dynamic per-zoom edge render budgets, and a dedicated frontend worker for off-main-thread graph filter matching.
38
+ - Improved Linux browser fallback launch stability by auto-applying Chromium compatibility flags (`--ozone-platform=x11`, `--disable-gpu`, `--disable-features=Vulkan,VaapiVideoDecoder`, `--disable-background-networking`) for app-window/browser modes.
39
+ - Improved massive-graph UI responsiveness with stricter render budgets, adaptive heavy-graph frame throttling, reduced interaction hit-test frequency, and URL-first agent selection on initial graph load.
40
+ - Improved 50k+ graph LOD behavior so zoomed-out views render lightweight cluster overviews and progressively reveal nodes/edges only as zoom increases.
41
+ - Added `blink bench` with realtime index phase telemetry and per-run compressed-pack analysis (input/output bytes, ratio, saved space, rebuild reason and duration), including continuous watch mode.
42
+ - Added tunable single-stage search-pack compression settings (`searchPack.rowChunkSize`, `searchPack.compressionLevel`, `searchPack.useDictionary`).
43
+ - Added benchmark guardrails for compression savings and latency regression (`searchPack.guardrailMinSavingsPercent`, `searchPack.guardrailMaxLatencyRegressionPercent`), reported in `blink bench`.
44
+ - Added `blink pack-backup` for offline second-stage compression backups of encrypted `.blpk` packs, outside the online query path.
45
+ - Hardened Linux browser launch flags for Ubuntu 26 Chromium/Wayland compatibility (`--disable-vulkan`, `--use-gl=swiftshader`, `--ozone-platform-hint=x11`).
46
+ - Improved pack resilience by auto-repairing missing search-pack manifests from existing `.blpk` files, avoiding unnecessary full repacks on small incremental updates.
47
+ - Updated Linux graph auto-open behavior to prioritize the system default browser (`xdg-open`) before explicit browser fallbacks.
48
+ - Removed implicit Chromium dependency in Linux auto-open flow; app-window launch is now opt-in (`BRAINLINK_LINUX_APP_WINDOW=1`).
25
49
 
26
50
  ## 0.1.0-beta.3
27
51
 
@@ -49,8 +73,8 @@
49
73
  ## 0.1.0-alpha.0
50
74
 
51
75
  - Added local-first Markdown vault indexing.
52
- - Added SQLite FTS, local semantic retrieval, wiki links, backlinks and graph retrieval.
53
- - Added SQLite semantic bucket indexing to narrow vector candidates for larger vaults.
76
+ - Added local full-text indexing, local semantic retrieval, wiki links, backlinks and graph retrieval.
77
+ - Added semantic candidate bucket indexing to narrow vector candidates for larger vaults.
54
78
  - Optimized title/link resolution with precomputed agent-scoped title maps.
55
79
  - Added CLI, JSON output, HTTP API and graph UI.
56
80
  - Added vault diagnostics: stats, broken links, orphans, validation and doctor.
package/CONTRIBUTING.md CHANGED
@@ -22,7 +22,7 @@ npm run pack:smoke
22
22
  ## Design Rules
23
23
 
24
24
  - Markdown files are the source of truth.
25
- - SQLite is a derived index and must remain rebuildable.
25
+ - Local index artifacts are derived and must remain rebuildable.
26
26
  - Domain parsing, graph analysis and layout should stay pure and testable.
27
- - CLI, HTTP, filesystem and SQLite code are adapters around application use cases.
27
+ - CLI, HTTP, filesystem and index code are adapters around application use cases.
28
28
  - MCP integration should live outside this package by wrapping the CLI with `--json`.
package/COPYRIGHT.md ADDED
@@ -0,0 +1,5 @@
1
+ Copyright (c) 2026 Substructa
2
+
3
+ This project is licensed under the MIT License.
4
+
5
+ See [LICENSE](./LICENSE) for full terms.
package/README.md CHANGED
@@ -52,12 +52,15 @@ LLMs do not have infinite context. Brainlink gives agents an external memory lay
52
52
  1. Durable knowledge is written as Markdown.
53
53
  2. Notes are connected with `[[wiki links]]`.
54
54
  3. Concepts are classified with `#tags`.
55
- 4. Brainlink builds a local SQLite index with FTS records and local embeddings.
55
+ 4. Brainlink builds a local JSON index (`.brainlink/index.json`) and private encrypted search packs.
56
56
  5. Agents query the index before responding.
57
57
  6. Brainlink returns compact, source-backed context.
58
58
 
59
- Markdown is the source of truth. `.brainlink/brainlink.db` is only a rebuildable index.
60
- Brainlink now keeps an automatic rollback snapshot at `.brainlink/brainlink.db.backup`. If the main SQLite file is corrupted, Brainlink automatically restores from snapshot (or recreates a clean index when no snapshot exists).
59
+ Markdown is the source of truth. `.brainlink/index.json` is a rebuildable index artifact.
60
+ After each index run, Brainlink also writes private encrypted search packs at `.brainlink/search-packs/*.blpk` to preserve fast retrieval and portable recovery.
61
+ Online retrieval always uses a single compression stage per pack; optional second-stage compression is reserved for offline backup artifacts only.
62
+ Pack decryption uses a Brainlink key from `$BRAINLINK_HOME/keys` or from `BRAINLINK_SEARCH_PACK_KEY` when explicitly configured.
63
+ Legacy `.jsonl.gz` packs are upgraded to `.blpk` automatically on first search/context access.
61
64
 
62
65
  ## Features
63
66
 
@@ -65,8 +68,12 @@ Brainlink now keeps an automatic rollback snapshot at `.brainlink/brainlink.db.b
65
68
  - Obsidian-compatible `[[wiki links]]` and `#tags`.
66
69
  - Weighted graph edges so agents can rank relationship importance and priority.
67
70
  - Backlinks, broken-link reports, orphan detection and validation.
68
- - Full-text, semantic and hybrid retrieval modes.
69
- - SQLite-backed semantic candidate buckets for larger vaults.
71
+ - Full-text, semantic and hybrid retrieval on a local file index.
72
+ - Middle-out context assembly around the strongest chunk per document.
73
+ - In-process index and context caching with automatic invalidation on index updates.
74
+ - Compressed-space prefiltering for `.blpk` packs before decryption and scan.
75
+ - Incremental indexing that reprocesses only changed markdown files and reuses existing chunks/embeddings for unchanged notes.
76
+ - Adaptive compressed-pack rebuild policy to keep indexing fast during small edit batches.
70
77
  - Agent namespaces under `agents/<agent-id>/`.
71
78
  - S3-compatible bucket vaults through `s3://bucket/prefix` URIs.
72
79
  - CLI with machine-readable `--json` output.
@@ -74,6 +81,17 @@ Brainlink now keeps an automatic rollback snapshot at `.brainlink/brainlink.db.b
74
81
  - Built-in MCP stdio server for agent tool integration.
75
82
  - Local HTTP API.
76
83
  - Realtime graph UI with agent selector and colored knowledge groups.
84
+ - Graph renderer optimized for large datasets with viewport-driven node culling and edge lookup by visible nodes.
85
+ - Canvas graph rendering uses the same batched node and edge pipeline for every graph size, reducing per-frame draw calls while keeping selected and hovered items highlighted.
86
+ - WebGL acceleration is used when available for dense node and edge drawing, with Canvas 2D preserved as the interaction and fallback layer.
87
+ - Graph zoom-out renders hierarchical ecosystem subgraphs only above 1000 notes: the memory hub stays centered, 1000-note groups stay as compact sand-like points, and focused groups gradually expand into smaller graph meshes before individual notes are rendered.
88
+ - Large graph layout API automatically uses compact payload encoding with link-coverage-aware edge selection to reduce initial client load without hiding major relationships.
89
+ - Large-segment layout spacing now grows logarithmically to keep initial visual density consistent between medium and very large vaults (for example, ~1k vs ~50k notes).
90
+ - Graph coordinates are visually compacted across graph sizes so reset starts from a stable macro mass and zoom-in progressively expands toward local detail.
91
+ - Zoomed-out graph LOD renders nested subgraphs and progressively expands only the focused cluster as zoom increases, including very large vaults.
92
+ - Graph reset starts in macro "galaxy" overview mode and progressively reveals nearby nodes as zoom increases, including smaller vaults.
93
+ - Graph filtering runs in a dedicated browser worker to keep the UI thread responsive when working with heavy datasets.
94
+ - Edge rendering budgets adapt to zoom level to prevent frame spikes on large graph panoramas.
77
95
 
78
96
  ## Install
79
97
 
@@ -283,7 +301,7 @@ export BRAINLINK_S3_FORCE_PATH_STYLE=1
283
301
 
284
302
  Bucket vaults mirror Markdown into a local cache under
285
303
  `$BRAINLINK_HOME/bucket-cache`. The bucket remains canonical; the local
286
- `.brainlink/brainlink.db` stays a disposable index. Run `index` after remote
304
+ `.brainlink/index.json` stays a disposable index artifact. Run `index` after remote
287
305
  bucket changes before relying on `search`, `context`, graph or validation
288
306
  commands. Watch mode is only supported for local filesystem vaults.
289
307
 
@@ -299,7 +317,7 @@ vault/
299
317
  research-agent/
300
318
  source-review-policy.md
301
319
  .brainlink/
302
- brainlink.db
320
+ index.json
303
321
  ```
304
322
 
305
323
  Permanent data:
@@ -309,7 +327,7 @@ Permanent data:
309
327
 
310
328
  Rebuildable data:
311
329
 
312
- - `.brainlink/brainlink.db`
330
+ - `.brainlink/index.json`
313
331
  - full-text records
314
332
  - local embedding vectors
315
333
  - local embedding buckets
@@ -393,6 +411,7 @@ blink agent upgrade
393
411
  ```
394
412
 
395
413
  This configures `~/.codex/config.toml` with Brainlink MCP (`brainlink-mcp`) so Brainlink is available by default in agent sessions.
414
+ `agent install` and `agent upgrade` also apply the MCP `fully-auto` bootstrap policy by default (`enforceBootstrap`, `enforceContextFirst`, `autoBootstrapOnRead`, `autoBootstrapOnStartup` all enabled).
396
415
 
397
416
  If you are inside this repository and want plugin gallery setup too:
398
417
 
@@ -512,6 +531,8 @@ Available tools:
512
531
  - `brainlink_recommendations`: return an automatic action plan so agents can run Brainlink in the recommended order.
513
532
  - `brainlink_context`: read indexed context for a task or question.
514
533
  - `brainlink_search`: search indexed notes.
534
+ - `brainlink_dedupe`: detect duplicate candidates using exact hash + semantic similarity scores.
535
+ - `brainlink_resolve_duplicate`: resolve duplicate pairs (`merge`, `link`, `ignore`) with connectivity-safe fallback edges.
515
536
  - `brainlink_add_note`: write durable Markdown memory and reindex.
516
537
  - `brainlink_add_file`: ingest a local file as a note and reindex.
517
538
  - `brainlink_index`: rebuild the vault index.
@@ -550,6 +571,17 @@ blink server --host 127.0.0.1 --port 4321 --watch
550
571
  ```
551
572
 
552
573
  By default, the server uses `$HOME/.brainlink/vault`. Pass `--vault ./vault` only when you want to inspect a custom vault.
574
+ By default, `blink server` tries to open the graph in a native desktop GUI window:
575
+ - macOS: Swift + WebKit
576
+ - Windows: PowerShell WinForms WebBrowser
577
+ - Linux: optional Python GTK + WebKit2 (requires `python3` + `gi` + `WebKit2`)
578
+
579
+ On Linux, native GUI is disabled by default for better startup performance. Enable it with `BRAINLINK_LINUX_NATIVE_GUI=1`.
580
+ If native GUI launch is unavailable on your system, it falls back to dedicated app-window mode and then to the default browser.
581
+ For Chromium-family browsers on Linux (`chromium`, `chromium-browser`, `google-chrome`, `microsoft-edge`, `brave-browser`), Brainlink now auto-applies compatibility flags during launch (`--ozone-platform=x11`, `--ozone-platform-hint=x11`, `--disable-gpu`, `--disable-vulkan`, `--use-gl=swiftshader`, `--disable-features=Vulkan,VaapiVideoDecoder`, `--disable-background-networking`) to avoid common Wayland/Vulkan/VAAPI startup issues.
582
+ On Linux, Brainlink opens the graph through the system default browser first (`xdg-open`), then `$BROWSER`/detected browsers as fallback. Chromium-family app-window mode is optional via `BRAINLINK_LINUX_APP_WINDOW=1`.
583
+ Use `--no-open` to keep it headless.
584
+ When native GUI is used, the GUI window automatically closes when the `blink server` process stops.
553
585
 
554
586
  The graph UI shows:
555
587
 
@@ -557,12 +589,21 @@ The graph UI shows:
557
589
  - `[[wiki links]]` as weighted edges
558
590
  - details opened on node click (tags, outgoing links, backlinks, full Markdown content)
559
591
  - neutral graph nodes with segment/group metadata
560
- - agent selector for isolated views
592
+ - agent selector (id-only labels) for isolated views
561
593
  - graph filter matches title, path, tags and note content
594
+ - graph filter keeps hub context nodes visible (`Memory Hub`/`MOC`/high-degree fallback) to preserve relationship readability
562
595
  - realtime refresh while `--watch` is enabled
563
596
  - graph controls for zoom in, zoom out, fit visible nodes and reset-to-fit-all
564
- - wheel zoom anchored to cursor position for faster navigation in large graphs
597
+ - wheel zoom (including `cmd+scroll` and `ctrl+scroll`) anchored to cursor position for faster navigation in large graphs
598
+ - zoom-out floor for large and massive graphs, plus a reset macro floor tied to hub-neighbor distance, so the initial macro view stays close to the first particle layers instead of zooming out too far
599
+ - keyboard shortcuts: `+` zoom in, `-` zoom out, `0` reset fit
600
+ - double-click on canvas zooms in at cursor position
565
601
  - floating graph totals (notes, links, tags) below the Brainlink title
602
+ - graph rendering safeguards (batched canvas drawing across graph sizes, edge draw caps, lower redraw rate, zoom-aware interaction)
603
+ - WebGL node and edge acceleration when supported, falling back to Canvas 2D without changing graph behavior
604
+ - compact macro-to-micro density progression so reset keeps the graph mass oriented and zoom-in separates local neighborhoods progressively
605
+ - graph camera treats hub-centered navigation as structural only when the hub is dominant; diffuse stress graphs reset and zoom around the full graph mass
606
+ - graph LOD progression: graphs up to 1000 notes render directly. Larger graphs use one recursive model: each visible level targets up to 999 non-hub nodes and starts from a memory-hub-centered mesh, and each supernode can expand into another same-shape subgraph level (again up to 999 children) with latent fade-in, aggregated real links and local sibling mesh links, so org-heavy and stress-50k follow the same structure at different depths. For massive graphs, the first expansion starts much deeper in zoom, low-size child levels use slower easing, and expansion is additionally gated by focus readiness (screen-space isolation of the focused parent), so child levels open only when that subgraph is truly centered and separated in view.
566
607
 
567
608
  The server indexes before starting by default. Use `--no-index` to skip that step:
568
609
 
@@ -664,6 +705,18 @@ blink migrate-vault --from ~/.brainlink/vault --to ./team-vault --report ./migra
664
705
  Runs explicit markdown migration between vaults while preserving conflicts as `.conflict-<timestamp>` files.
665
706
  Use `--dry-run` to preview `copied`, `conflicted` and `unchanged` counts before writing.
666
707
 
708
+ ### `db-import`
709
+
710
+ ```bash
711
+ blink db-import --vault ./team-vault
712
+ blink db-import --vault ./team-vault --db ./legacy/brainlink.db
713
+ blink db-import --vault ./team-vault --db ./legacy/brainlink.db --table legacy_notes --dry-run
714
+ ```
715
+
716
+ Imports durable memory from a legacy SQLite database into Markdown notes (`agents/<agent-id>/*.md`) and reindexes by default.
717
+ When `--db` is omitted, Brainlink auto-detects common legacy paths such as `<vault>/.brainlink/brainlink.db`.
718
+ Use `--agent <id>` to force all imported rows into one namespace, `--limit` for incremental imports, `--dry-run` to preview without writing files, and `--no-index` to defer reindexing.
719
+
667
720
  ### `init`
668
721
 
669
722
  ```bash
@@ -688,6 +741,28 @@ blink add "Note Title" --vault ./vault --content-file ./notes.md --no-auto-index
688
741
 
689
742
  Creates a Markdown note under `agents/<agent-id>/`. Common secret patterns are blocked by default; use `--allow-sensitive` only for an intentionally protected vault.
690
743
  To avoid disconnected memory, Brainlink auto-adds a fallback wiki edge when a note is written without links, creating agent hub notes when needed.
744
+ `add` also returns `possibleDuplicates` (exact hash + semantic candidates) so agents can resolve duplicate memory right after writes.
745
+
746
+ ### `dedupe`
747
+
748
+ ```bash
749
+ blink dedupe --vault ./vault --json
750
+ blink dedupe --vault ./vault --agent coding-agent --limit 20 --min-score 0.92 --json
751
+ blink dedupe --vault ./vault --no-semantic --json
752
+ ```
753
+
754
+ Detects `possibleDuplicate` pairs using exact content hashes and optional semantic similarity.
755
+
756
+ ### `dedupe-resolve`
757
+
758
+ ```bash
759
+ blink dedupe-resolve --vault ./vault --left agents/shared/a.md --right agents/shared/b.md --action merge --json
760
+ blink dedupe-resolve --vault ./vault --left agents/shared/a.md --right agents/shared/b.md --action link --json
761
+ blink dedupe-resolve --vault ./vault --left agents/shared/a.md --right agents/shared/b.md --action ignore --json
762
+ ```
763
+
764
+ Resolves a duplicate pair with `merge`, `link` or `ignore`.
765
+ When the action is not `merge`, Brainlink still creates a low-priority related edge (`#related-to`) so notes remain connected.
691
766
 
692
767
  ### `index`
693
768
 
@@ -698,6 +773,38 @@ blink index --vault ./vault
698
773
 
699
774
  Rebuilds the local index from Markdown files.
700
775
 
776
+ ### `bench`
777
+
778
+ ```bash
779
+ blink bench --vault ./vault
780
+ blink bench --vault ./vault --watch
781
+ blink bench --vault ./vault --watch --debounce 500
782
+ blink bench --vault ./vault --json
783
+ ```
784
+
785
+ Runs indexing with realtime phase telemetry (`start`, `scan`, `parse`, `embed`, `persist`, `packs`, `complete`) and prints a benchmark summary at the end of each run.
786
+
787
+ The summary includes compression behavior for `.blpk` packs when a rebuild happens:
788
+ - pack rebuild reason
789
+ - pack count and pack build duration
790
+ - uncompressed input bytes vs compressed output bytes
791
+ - saved percentage
792
+ - objective guardrails (minimum savings and maximum latency regression thresholds)
793
+
794
+ Use `--watch` to keep benchmarking incremental reindex runs after Markdown changes (local filesystem vaults only).
795
+ When `.brainlink/search-packs/manifest.json` is missing but `.blpk` files exist, Brainlink repairs the manifest first and avoids an unnecessary full pack rebuild on small edits.
796
+
797
+ ### `pack-backup`
798
+
799
+ ```bash
800
+ blink pack-backup --vault ./vault
801
+ blink pack-backup --vault ./vault --output ./vault/.brainlink/backups/custom.blpkbak.gz
802
+ blink pack-backup --vault ./vault --json
803
+ ```
804
+
805
+ Creates an offline backup artifact of encrypted search packs with a second compression pass.
806
+ This is intentionally outside the online retrieval path (`index`, `search`, `context`).
807
+
701
808
  ### `agents`
702
809
 
703
810
  ```bash
@@ -720,11 +827,12 @@ If `--mode` or `--limit` is omitted, Brainlink resolves values from the current
720
827
 
721
828
  Modes:
722
829
 
723
- - `hybrid`: default; combines SQLite FTS with local embedding similarity.
724
- - `fts`: exact lexical retrieval through SQLite FTS.
830
+ - `hybrid`: default; combines lexical matching with local embedding similarity.
831
+ - `fts`: exact lexical retrieval from the file index.
725
832
  - `semantic`: local deterministic embedding similarity only.
726
833
 
727
834
  Hybrid results are cached in-memory for a short TTL and invalidated automatically when the local index file changes.
835
+ Context selection uses a middle-out strategy: it starts from the strongest chunk in a note and expands to neighboring chunks while respecting token budget.
728
836
 
729
837
  ### `context`
730
838
 
@@ -735,6 +843,7 @@ blink context "question" --vault ./vault --agent coding-agent --mode hybrid --js
735
843
  ```
736
844
 
737
845
  Builds a compact context package for an agent.
846
+ Repeated calls with the same vault, agent, query, mode and token/limit settings are served from a short in-memory cache while the index is unchanged.
738
847
 
739
848
  ### `links`
740
849
 
@@ -819,9 +928,15 @@ Watches Markdown files and rebuilds the index when notes change.
819
928
  ```bash
820
929
  blink server --watch
821
930
  blink server --vault ./vault --watch
931
+ blink server --vault ./vault --watch --no-open
822
932
  ```
823
933
 
824
934
  Starts the local read-only graph UI and HTTP API.
935
+ By default, it tries to open a native desktop GUI window for the graph URL.
936
+ On Linux, native GUI is disabled by default; enable it with `BRAINLINK_LINUX_NATIVE_GUI=1`.
937
+ If native GUI launch is unavailable, it falls back to dedicated app-window mode and then to the default browser.
938
+ When fallback opens Chromium-family browsers on Linux, Brainlink automatically uses compatibility launch flags for stable rendering on Ubuntu/Wayland setups.
939
+ Use `--no-open` to skip that behavior.
825
940
 
826
941
  The HTTP server only binds to loopback hosts such as `127.0.0.1`, `localhost` or `::1`.
827
942
 
@@ -862,6 +977,13 @@ If no `vault` is configured and no `--vault` flag is passed, Brainlink uses `$HO
862
977
  "embeddingProvider": "local",
863
978
  "defaultSearchMode": "hybrid",
864
979
  "chunkSize": 1200,
980
+ "searchPack": {
981
+ "rowChunkSize": 5000,
982
+ "compressionLevel": 5,
983
+ "useDictionary": true,
984
+ "guardrailMinSavingsPercent": 8,
985
+ "guardrailMaxLatencyRegressionPercent": 5
986
+ },
865
987
  "agentProfiles": {
866
988
  "coding-agent": {
867
989
  "defaultSearchMode": "semantic",
@@ -973,7 +1095,7 @@ src/
973
1095
  application/ use cases
974
1096
  cli/ command-line adapter
975
1097
  domain/ pure knowledge rules
976
- infrastructure/ filesystem and SQLite adapters
1098
+ infrastructure/ filesystem and index adapters
977
1099
  ```
978
1100
 
979
1101
  Detailed notes:
@@ -985,7 +1107,6 @@ Detailed notes:
985
1107
  ## Current Limits
986
1108
 
987
1109
  - Semantic search uses deterministic local embeddings, not a remote model provider.
988
- - Semantic search uses SQLite embedding buckets to narrow candidates before cosine scoring.
989
1110
  - `embeddingProvider` currently supports `local` and `none`.
990
1111
  - Link resolution is title-based inside each agent namespace, with `shared` as fallback.
991
1112
  - HTTP API is local and unauthenticated.
@@ -996,7 +1117,7 @@ Detailed notes:
996
1117
  The `0.1.0-beta` line is intended to stabilize the local-first memory loop:
997
1118
 
998
1119
  - Markdown as durable memory.
999
- - SQLite FTS plus local embeddings and semantic buckets as rebuildable retrieval index.
1120
+ - Rebuildable file index plus local embeddings and encrypted pack exports.
1000
1121
  - CLI as the primary agent interface.
1001
1122
  - HTTP graph API and frontend as inspection tools.
1002
1123
  - Agent namespaces to avoid context mixing.
@@ -1012,7 +1133,7 @@ Brainlink is local-first by default.
1012
1133
  - Brainlink HTTP is localhost-only and refuses non-loopback hosts.
1013
1134
  - Brainlink blocks common secret patterns by default when adding notes. Use `--allow-sensitive` only for intentional, protected vaults.
1014
1135
  - Do not store secrets, credentials, API keys or regulated personal data unless the vault is protected by your own storage controls.
1015
- - Treat `.brainlink/brainlink.db` as disposable derived data.
1136
+ - Treat `.brainlink/index.json` and `.brainlink/search-packs/` as disposable derived artifacts.
1016
1137
 
1017
1138
  See [SECURITY.md](SECURITY.md).
1018
1139
 
@@ -1023,6 +1144,7 @@ See [CONTRIBUTING.md](CONTRIBUTING.md).
1023
1144
  ## License
1024
1145
 
1025
1146
  MIT. See [LICENSE](LICENSE).
1147
+ Copyright (c) 2026 Substructa. See [COPYRIGHT.md](COPYRIGHT.md).
1026
1148
 
1027
1149
  ### Memory Optimization Loop (1-7)
1028
1150
 
package/SECURITY.md CHANGED
@@ -7,7 +7,7 @@ Brainlink is local-first.
7
7
  - The HTTP server binds to `127.0.0.1` by default.
8
8
  - The HTTP server always refuses non-loopback hosts.
9
9
  - The HTTP server is read-only and does not expose note creation, indexing or update routes.
10
- - The SQLite database is a derived local index.
10
+ - Local index artifacts (`.brainlink/index.json` and `.brainlink/search-packs/`) are derived data.
11
11
  - Markdown files are user-owned source data.
12
12
  - Brainlink-created Markdown files use `0600` permissions.
13
13
  - Brainlink-created directories and `.brainlink` use `0700` permissions.
@@ -1,7 +1,5 @@
1
1
  import { stat } from 'node:fs/promises';
2
- import { existsSync } from 'node:fs';
3
2
  import { performance } from 'node:perf_hooks';
4
- import { join } from 'node:path';
5
3
  import { validateGraph, getBrokenLinks, getOrphanNodes, getVaultStats } from '../domain/graph-analysis.js';
6
4
  import { ensureVault, listVaultFiles, readMarkdownFiles } from '../infrastructure/file-system-vault.js';
7
5
  import { resolveAgentRuntimeDefaults } from '../infrastructure/config.js';
@@ -96,17 +94,11 @@ export const doctorVault = async (vaultPath) => {
96
94
  const files = await readMarkdownFiles(absoluteVaultPath);
97
95
  const graph = await getGraphSummary(absoluteVaultPath);
98
96
  const validation = validateGraph(graph);
99
- const backupPath = join(absoluteVaultPath, '.brainlink', 'brainlink.db.backup');
100
- const hasBackup = existsSync(backupPath);
101
- const backupReady = graph.nodes.length === 0 || hasBackup;
102
97
  const checks = [
103
98
  createCheck('vault', true, `Vault ready at ${absoluteVaultPath}`),
104
99
  createCheck('markdown-files', files.length > 0, `${files.length} markdown files found`),
105
100
  createCheck('index', graph.nodes.length > 0, `${graph.nodes.length} indexed documents found`),
106
- createCheck('broken-links', validation.brokenLinks.length === 0, `${validation.brokenLinks.length} broken links found`),
107
- createCheck('index-backup', backupReady, backupReady
108
- ? (hasBackup ? 'SQLite recovery snapshot is available' : 'No index yet. Snapshot will be created after first indexing run')
109
- : 'Recovery snapshot missing. Run blink index to create a rollback snapshot')
101
+ createCheck('broken-links', validation.brokenLinks.length === 0, `${validation.brokenLinks.length} broken links found`)
110
102
  ];
111
103
  const recommendations = files.length === 0 && graph.nodes.length === 0
112
104
  ? [
@@ -1,13 +1,68 @@
1
+ import { stat } from 'node:fs/promises';
1
2
  import { formatContextPackage, selectContextSections } from '../domain/context.js';
3
+ import { indexStoragePath } from '../infrastructure/file-index.js';
2
4
  import { searchKnowledge } from './search-knowledge.js';
5
+ const contextCacheTtlMs = 45_000;
6
+ const contextCacheMaxEntries = 200;
7
+ const contextCache = new Map();
8
+ const readIndexMtimeMs = async (vaultPath) => {
9
+ try {
10
+ return (await stat(indexStoragePath(vaultPath))).mtimeMs;
11
+ }
12
+ catch {
13
+ return 0;
14
+ }
15
+ };
16
+ const toCacheKey = (vaultPath, query, limit, maxTokens, agentId, mode) => JSON.stringify({
17
+ vaultPath,
18
+ query: query.trim().toLowerCase(),
19
+ limit,
20
+ maxTokens,
21
+ agentId: agentId?.trim().toLowerCase() ?? '*',
22
+ mode: mode ?? 'default'
23
+ });
24
+ const contextCacheGet = (key, indexMtimeMs) => {
25
+ const entry = contextCache.get(key);
26
+ if (!entry) {
27
+ return undefined;
28
+ }
29
+ const fresh = Date.now() - entry.createdAt <= contextCacheTtlMs && entry.indexMtimeMs === indexMtimeMs;
30
+ if (!fresh) {
31
+ contextCache.delete(key);
32
+ return undefined;
33
+ }
34
+ return entry.context;
35
+ };
36
+ const contextCacheSet = (entry) => {
37
+ contextCache.set(entry.key, entry);
38
+ if (contextCache.size <= contextCacheMaxEntries) {
39
+ return;
40
+ }
41
+ const overflow = contextCache.size - contextCacheMaxEntries;
42
+ const keys = Array.from(contextCache.keys()).slice(0, overflow);
43
+ keys.forEach((key) => contextCache.delete(key));
44
+ };
3
45
  export const buildContextPackage = async (vaultPath, query, limit, maxTokens, agentId, mode) => {
46
+ const cacheKey = toCacheKey(vaultPath, query, limit, maxTokens, agentId, mode);
47
+ const indexMtimeMs = await readIndexMtimeMs(vaultPath);
48
+ const cached = contextCacheGet(cacheKey, indexMtimeMs);
49
+ if (cached) {
50
+ return cached;
51
+ }
4
52
  const results = await searchKnowledge(vaultPath, query, limit, agentId, mode);
5
53
  const sections = selectContextSections(results, maxTokens);
6
- return {
54
+ const context = {
7
55
  query,
8
56
  sections,
9
57
  content: formatContextPackage(query, sections)
10
58
  };
59
+ contextCacheSet({
60
+ key: cacheKey,
61
+ createdAt: Date.now(),
62
+ indexMtimeMs,
63
+ context
64
+ });
65
+ return context;
11
66
  };
12
67
  export const buildContext = async (vaultPath, query, limit, maxTokens, agentId, mode) => {
13
68
  const contextPackage = await buildContextPackage(vaultPath, query, limit, maxTokens, agentId, mode);