nlm-memory 0.4.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/.agents/plugins/marketplace.json +20 -0
- package/.github/workflows/ci.yml +30 -0
- package/LICENSE +151 -0
- package/README.md +119 -0
- package/dist/cli/classify-parity.d.ts +48 -0
- package/dist/cli/classify-parity.js +182 -0
- package/dist/cli/classify-parity.js.map +1 -0
- package/dist/cli/launchctl-helpers.d.ts +26 -0
- package/dist/cli/launchctl-helpers.js +42 -0
- package/dist/cli/launchctl-helpers.js.map +1 -0
- package/dist/cli/nlm.d.ts +25 -0
- package/dist/cli/nlm.js +832 -0
- package/dist/cli/nlm.js.map +1 -0
- package/dist/core/actions/actions-log.d.ts +40 -0
- package/dist/core/actions/actions-log.js +72 -0
- package/dist/core/actions/actions-log.js.map +1 -0
- package/dist/core/actions/overlay.d.ts +30 -0
- package/dist/core/actions/overlay.js +101 -0
- package/dist/core/actions/overlay.js.map +1 -0
- package/dist/core/adapters/aider.d.ts +33 -0
- package/dist/core/adapters/aider.js +167 -0
- package/dist/core/adapters/aider.js.map +1 -0
- package/dist/core/adapters/claude-code.d.ts +32 -0
- package/dist/core/adapters/claude-code.js +270 -0
- package/dist/core/adapters/claude-code.js.map +1 -0
- package/dist/core/adapters/common.d.ts +20 -0
- package/dist/core/adapters/common.js +60 -0
- package/dist/core/adapters/common.js.map +1 -0
- package/dist/core/adapters/from-source.d.ts +11 -0
- package/dist/core/adapters/from-source.js +55 -0
- package/dist/core/adapters/from-source.js.map +1 -0
- package/dist/core/adapters/hermes-agent.d.ts +34 -0
- package/dist/core/adapters/hermes-agent.js +192 -0
- package/dist/core/adapters/hermes-agent.js.map +1 -0
- package/dist/core/adapters/hermes.d.ts +31 -0
- package/dist/core/adapters/hermes.js +247 -0
- package/dist/core/adapters/hermes.js.map +1 -0
- package/dist/core/adapters/jsonl-generic.d.ts +56 -0
- package/dist/core/adapters/jsonl-generic.js +185 -0
- package/dist/core/adapters/jsonl-generic.js.map +1 -0
- package/dist/core/adapters/opencode.d.ts +36 -0
- package/dist/core/adapters/opencode.js +213 -0
- package/dist/core/adapters/opencode.js.map +1 -0
- package/dist/core/adapters/pi.d.ts +32 -0
- package/dist/core/adapters/pi.js +233 -0
- package/dist/core/adapters/pi.js.map +1 -0
- package/dist/core/classifier/prompt.d.ts +60 -0
- package/dist/core/classifier/prompt.js +178 -0
- package/dist/core/classifier/prompt.js.map +1 -0
- package/dist/core/dataset/build-dataset.d.ts +87 -0
- package/dist/core/dataset/build-dataset.js +335 -0
- package/dist/core/dataset/build-dataset.js.map +1 -0
- package/dist/core/embedding/chunk-body.d.ts +30 -0
- package/dist/core/embedding/chunk-body.js +60 -0
- package/dist/core/embedding/chunk-body.js.map +1 -0
- package/dist/core/embedding/embed-backfill.d.ts +36 -0
- package/dist/core/embedding/embed-backfill.js +168 -0
- package/dist/core/embedding/embed-backfill.js.map +1 -0
- package/dist/core/embedding/embed-normalize.d.ts +28 -0
- package/dist/core/embedding/embed-normalize.js +98 -0
- package/dist/core/embedding/embed-normalize.js.map +1 -0
- package/dist/core/facts/backfill-facts.d.ts +58 -0
- package/dist/core/facts/backfill-facts.js +169 -0
- package/dist/core/facts/backfill-facts.js.map +1 -0
- package/dist/core/facts/extract-facts.d.ts +20 -0
- package/dist/core/facts/extract-facts.js +37 -0
- package/dist/core/facts/extract-facts.js.map +1 -0
- package/dist/core/hook/citation-detect.d.ts +32 -0
- package/dist/core/hook/citation-detect.js +105 -0
- package/dist/core/hook/citation-detect.js.map +1 -0
- package/dist/core/hook/cite-memo.d.ts +20 -0
- package/dist/core/hook/cite-memo.js +68 -0
- package/dist/core/hook/cite-memo.js.map +1 -0
- package/dist/core/hook/claude-settings.d.ts +34 -0
- package/dist/core/hook/claude-settings.js +117 -0
- package/dist/core/hook/claude-settings.js.map +1 -0
- package/dist/core/hook/gate.d.ts +11 -0
- package/dist/core/hook/gate.js +19 -0
- package/dist/core/hook/gate.js.map +1 -0
- package/dist/core/hook/hook-log.d.ts +25 -0
- package/dist/core/hook/hook-log.js +28 -0
- package/dist/core/hook/hook-log.js.map +1 -0
- package/dist/core/hook/memo-sweep.d.ts +55 -0
- package/dist/core/hook/memo-sweep.js +134 -0
- package/dist/core/hook/memo-sweep.js.map +1 -0
- package/dist/core/hook/memo.d.ts +20 -0
- package/dist/core/hook/memo.js +66 -0
- package/dist/core/hook/memo.js.map +1 -0
- package/dist/core/hook/pointer-block.d.ts +14 -0
- package/dist/core/hook/pointer-block.js +19 -0
- package/dist/core/hook/pointer-block.js.map +1 -0
- package/dist/core/hook/select.d.ts +21 -0
- package/dist/core/hook/select.js +15 -0
- package/dist/core/hook/select.js.map +1 -0
- package/dist/core/hook/transcript.d.ts +31 -0
- package/dist/core/hook/transcript.js +103 -0
- package/dist/core/hook/transcript.js.map +1 -0
- package/dist/core/ingest/ingest-session.d.ts +40 -0
- package/dist/core/ingest/ingest-session.js +71 -0
- package/dist/core/ingest/ingest-session.js.map +1 -0
- package/dist/core/providers/provider-models.d.ts +24 -0
- package/dist/core/providers/provider-models.js +72 -0
- package/dist/core/providers/provider-models.js.map +1 -0
- package/dist/core/providers/provider-registry.d.ts +62 -0
- package/dist/core/providers/provider-registry.js +143 -0
- package/dist/core/providers/provider-registry.js.map +1 -0
- package/dist/core/recall/citation-log.d.ts +28 -0
- package/dist/core/recall/citation-log.js +90 -0
- package/dist/core/recall/citation-log.js.map +1 -0
- package/dist/core/recall/filter.d.ts +11 -0
- package/dist/core/recall/filter.js +20 -0
- package/dist/core/recall/filter.js.map +1 -0
- package/dist/core/recall/index.d.ts +6 -0
- package/dist/core/recall/index.js +5 -0
- package/dist/core/recall/index.js.map +1 -0
- package/dist/core/recall/match-fields.d.ts +10 -0
- package/dist/core/recall/match-fields.js +37 -0
- package/dist/core/recall/match-fields.js.map +1 -0
- package/dist/core/recall/query-log.d.ts +36 -0
- package/dist/core/recall/query-log.js +112 -0
- package/dist/core/recall/query-log.js.map +1 -0
- package/dist/core/recall/query-shape.d.ts +22 -0
- package/dist/core/recall/query-shape.js +64 -0
- package/dist/core/recall/query-shape.js.map +1 -0
- package/dist/core/recall/recall-service.d.ts +19 -0
- package/dist/core/recall/recall-service.js +252 -0
- package/dist/core/recall/recall-service.js.map +1 -0
- package/dist/core/recall/recent-log.d.ts +16 -0
- package/dist/core/recall/recent-log.js +46 -0
- package/dist/core/recall/recent-log.js.map +1 -0
- package/dist/core/recall/tokenize.d.ts +7 -0
- package/dist/core/recall/tokenize.js +18 -0
- package/dist/core/recall/tokenize.js.map +1 -0
- package/dist/core/recall/useful-scan.d.ts +52 -0
- package/dist/core/recall/useful-scan.js +300 -0
- package/dist/core/recall/useful-scan.js.map +1 -0
- package/dist/core/recall-facts/fact-query-log.d.ts +42 -0
- package/dist/core/recall-facts/fact-query-log.js +115 -0
- package/dist/core/recall-facts/fact-query-log.js.map +1 -0
- package/dist/core/recall-facts/fact-recall-service.d.ts +34 -0
- package/dist/core/recall-facts/fact-recall-service.js +246 -0
- package/dist/core/recall-facts/fact-recall-service.js.map +1 -0
- package/dist/core/scheduler/scan-once.d.ts +32 -0
- package/dist/core/scheduler/scan-once.js +100 -0
- package/dist/core/scheduler/scan-once.js.map +1 -0
- package/dist/core/scheduler/scheduler.d.ts +59 -0
- package/dist/core/scheduler/scheduler.js +158 -0
- package/dist/core/scheduler/scheduler.js.map +1 -0
- package/dist/core/sources/source-registry.d.ts +68 -0
- package/dist/core/sources/source-registry.js +208 -0
- package/dist/core/sources/source-registry.js.map +1 -0
- package/dist/core/storage/db-restore.d.ts +53 -0
- package/dist/core/storage/db-restore.js +113 -0
- package/dist/core/storage/db-restore.js.map +1 -0
- package/dist/core/storage/live-status.d.ts +15 -0
- package/dist/core/storage/live-status.js +43 -0
- package/dist/core/storage/live-status.js.map +1 -0
- package/dist/core/storage/migrate.d.ts +14 -0
- package/dist/core/storage/migrate.js +52 -0
- package/dist/core/storage/migrate.js.map +1 -0
- package/dist/core/storage/sqlite-fact-store.d.ts +50 -0
- package/dist/core/storage/sqlite-fact-store.js +256 -0
- package/dist/core/storage/sqlite-fact-store.js.map +1 -0
- package/dist/core/storage/sqlite-session-store.d.ts +152 -0
- package/dist/core/storage/sqlite-session-store.js +587 -0
- package/dist/core/storage/sqlite-session-store.js.map +1 -0
- package/dist/hook/pre-compact-hook.d.ts +26 -0
- package/dist/hook/pre-compact-hook.js +94 -0
- package/dist/hook/pre-compact-hook.js.map +1 -0
- package/dist/hook/prompt-recall-hook.d.ts +23 -0
- package/dist/hook/prompt-recall-hook.js +141 -0
- package/dist/hook/prompt-recall-hook.js.map +1 -0
- package/dist/hook/session-end-hook.d.ts +18 -0
- package/dist/hook/session-end-hook.js +67 -0
- package/dist/hook/session-end-hook.js.map +1 -0
- package/dist/hook/session-start-hook.d.ts +25 -0
- package/dist/hook/session-start-hook.js +129 -0
- package/dist/hook/session-start-hook.js.map +1 -0
- package/dist/hook/stop-hook.d.ts +38 -0
- package/dist/hook/stop-hook.js +171 -0
- package/dist/hook/stop-hook.js.map +1 -0
- package/dist/hook/subagent-start-hook.d.ts +30 -0
- package/dist/hook/subagent-start-hook.js +108 -0
- package/dist/hook/subagent-start-hook.js.map +1 -0
- package/dist/http/app.d.ts +65 -0
- package/dist/http/app.js +1009 -0
- package/dist/http/app.js.map +1 -0
- package/dist/install/claude-code.d.ts +57 -0
- package/dist/install/claude-code.js +76 -0
- package/dist/install/claude-code.js.map +1 -0
- package/dist/install/codex.d.ts +82 -0
- package/dist/install/codex.js +277 -0
- package/dist/install/codex.js.map +1 -0
- package/dist/install/hermes-agent.d.ts +35 -0
- package/dist/install/hermes-agent.js +48 -0
- package/dist/install/hermes-agent.js.map +1 -0
- package/dist/install/hermes.d.ts +29 -0
- package/dist/install/hermes.js +52 -0
- package/dist/install/hermes.js.map +1 -0
- package/dist/install/ollama.d.ts +54 -0
- package/dist/install/ollama.js +178 -0
- package/dist/install/ollama.js.map +1 -0
- package/dist/install/setup.d.ts +37 -0
- package/dist/install/setup.js +339 -0
- package/dist/install/setup.js.map +1 -0
- package/dist/llm/classifier-box.d.ts +29 -0
- package/dist/llm/classifier-box.js +43 -0
- package/dist/llm/classifier-box.js.map +1 -0
- package/dist/llm/deepseek-client.d.ts +40 -0
- package/dist/llm/deepseek-client.js +114 -0
- package/dist/llm/deepseek-client.js.map +1 -0
- package/dist/llm/env-autoload.d.ts +8 -0
- package/dist/llm/env-autoload.js +54 -0
- package/dist/llm/env-autoload.js.map +1 -0
- package/dist/llm/ollama-client.d.ts +47 -0
- package/dist/llm/ollama-client.js +156 -0
- package/dist/llm/ollama-client.js.map +1 -0
- package/dist/mcp/server.d.ts +64 -0
- package/dist/mcp/server.js +430 -0
- package/dist/mcp/server.js.map +1 -0
- package/dist/ports/fact-store.d.ts +82 -0
- package/dist/ports/fact-store.js +16 -0
- package/dist/ports/fact-store.js.map +1 -0
- package/dist/ports/llm-client.d.ts +42 -0
- package/dist/ports/llm-client.js +14 -0
- package/dist/ports/llm-client.js.map +1 -0
- package/dist/ports/logger.d.ts +13 -0
- package/dist/ports/logger.js +8 -0
- package/dist/ports/logger.js.map +1 -0
- package/dist/ports/session-store.d.ts +29 -0
- package/dist/ports/session-store.js +9 -0
- package/dist/ports/session-store.js.map +1 -0
- package/dist/ports/transcript-adapter.d.ts +48 -0
- package/dist/ports/transcript-adapter.js +15 -0
- package/dist/ports/transcript-adapter.js.map +1 -0
- package/dist/shared/types.d.ts +129 -0
- package/dist/shared/types.js +6 -0
- package/dist/shared/types.js.map +1 -0
- package/dist/ui/assets/index-BA6IpU8g.css +1 -0
- package/dist/ui/assets/index-B_qIVV0k.js +69 -0
- package/dist/ui/index.html +13 -0
- package/docs/methodology/re-derivation-rate.md +112 -0
- package/docs/methodology/useful-hit-rate.md +79 -0
- package/docs/plans/2026-05-20-fts5-lexical-recall.md +1088 -0
- package/docs/plans/2026-05-20-recall-daemon-wedge-fix.md +662 -0
- package/docs/plans/2026-05-20-recall-hook-design.md +131 -0
- package/docs/plans/2026-05-20-recall-hook-implementation.md +1222 -0
- package/docs/plans/desktop-product.md +69 -0
- package/docs/plans/factstore-design.md +236 -0
- package/logs/CHANGELOG/CHANGELOG-2026.md +1389 -0
- package/logs/CHANGELOG/CHANGELOG.md +320 -0
- package/migrations/000_initial_schema.sql +174 -0
- package/migrations/001_entity_type_rename.sql +17 -0
- package/migrations/002_adapter_state_extend.sql +12 -0
- package/migrations/003_session_embeddings.sql +11 -0
- package/migrations/004_facts.sql +46 -0
- package/migrations/005_sources.sql +31 -0
- package/migrations/006_providers.sql +33 -0
- package/migrations/007_source_tokens.sql +17 -0
- package/migrations/008_fts_rebuild.sql +9 -0
- package/migrations/009_session_embedding_chunks.sql +46 -0
- package/migrations/010_sources_opencode.sql +30 -0
- package/migrations/011_sources_hermes_agent.sql +30 -0
- package/migrations/012_sources_aider.sql +30 -0
- package/migrations/013_adapter_state_failure_count.sql +12 -0
- package/package.json +56 -0
- package/plugin/.codex-plugin/plugin.json +22 -0
- package/plugin/.mcp.json +8 -0
- package/plugin/README.md +51 -0
- package/plugin/hooks/hooks.json +25 -0
- package/plugin/scripts/prompt-recall-hook.mjs +202 -0
- package/plugin/scripts/stop-hook.mjs +306 -0
- package/plugin-hermes-agent/README.md +49 -0
- package/plugin-hermes-agent/__init__.py +75 -0
- package/plugin-hermes-agent/plugin.yaml +15 -0
- package/scripts/backfill-citations.mjs +0 -0
- package/scripts/build-codex-plugin.mjs +61 -0
- package/scripts/deepseek-probe.mjs +67 -0
- package/scripts/extract-triples.mjs +207 -0
- package/scripts/longmemeval/embedding-cache.ts +77 -0
- package/scripts/longmemeval/fetch-dataset.sh +25 -0
- package/scripts/longmemeval/run-harness.ts +315 -0
- package/scripts/longmemeval/scorer.ts +99 -0
- package/scripts/longmemeval/tsconfig.json +9 -0
- package/scripts/longmemeval/types.ts +35 -0
- package/scripts/nlm-daily-digest.py +239 -0
- package/scripts/nlm-daily-digest.sh +28 -0
- package/src/cli/classify-parity.ts +257 -0
- package/src/cli/launchctl-helpers.ts +49 -0
- package/src/cli/nlm.ts +885 -0
- package/src/core/actions/actions-log.ts +118 -0
- package/src/core/actions/overlay.ts +117 -0
- package/src/core/adapters/aider.ts +205 -0
- package/src/core/adapters/claude-code.ts +293 -0
- package/src/core/adapters/common.ts +54 -0
- package/src/core/adapters/from-source.ts +57 -0
- package/src/core/adapters/hermes-agent.ts +240 -0
- package/src/core/adapters/hermes.ts +277 -0
- package/src/core/adapters/jsonl-generic.ts +208 -0
- package/src/core/adapters/opencode.ts +281 -0
- package/src/core/adapters/pi.ts +264 -0
- package/src/core/classifier/prompt.ts +200 -0
- package/src/core/dataset/build-dataset.ts +463 -0
- package/src/core/embedding/chunk-body.ts +76 -0
- package/src/core/embedding/embed-backfill.ts +210 -0
- package/src/core/embedding/embed-normalize.ts +135 -0
- package/src/core/facts/backfill-facts.ts +254 -0
- package/src/core/facts/extract-facts.ts +50 -0
- package/src/core/hook/citation-detect.ts +124 -0
- package/src/core/hook/cite-memo.ts +68 -0
- package/src/core/hook/claude-settings.ts +166 -0
- package/src/core/hook/gate.ts +25 -0
- package/src/core/hook/hook-log.ts +41 -0
- package/src/core/hook/memo-sweep.ts +164 -0
- package/src/core/hook/memo.ts +67 -0
- package/src/core/hook/pointer-block.ts +26 -0
- package/src/core/hook/select.ts +32 -0
- package/src/core/hook/transcript.ts +121 -0
- package/src/core/ingest/ingest-session.ts +111 -0
- package/src/core/providers/provider-models.ts +100 -0
- package/src/core/providers/provider-registry.ts +196 -0
- package/src/core/recall/citation-log.ts +108 -0
- package/src/core/recall/filter.ts +27 -0
- package/src/core/recall/index.ts +6 -0
- package/src/core/recall/match-fields.ts +40 -0
- package/src/core/recall/query-log.ts +149 -0
- package/src/core/recall/query-shape.ts +66 -0
- package/src/core/recall/recall-service.ts +320 -0
- package/src/core/recall/recent-log.ts +59 -0
- package/src/core/recall/tokenize.ts +18 -0
- package/src/core/recall/useful-scan.ts +336 -0
- package/src/core/recall-facts/fact-query-log.ts +150 -0
- package/src/core/recall-facts/fact-recall-service.ts +327 -0
- package/src/core/scheduler/scan-once.ts +142 -0
- package/src/core/scheduler/scheduler.ts +225 -0
- package/src/core/sources/source-registry.ts +260 -0
- package/src/core/storage/db-restore.ts +133 -0
- package/src/core/storage/live-status.ts +45 -0
- package/src/core/storage/migrate.ts +72 -0
- package/src/core/storage/sqlite-fact-store.ts +304 -0
- package/src/core/storage/sqlite-session-store.ts +765 -0
- package/src/hook/prompt-recall-hook.ts +174 -0
- package/src/hook/session-end-hook.ts +81 -0
- package/src/hook/session-start-hook.ts +165 -0
- package/src/hook/stop-hook.ts +236 -0
- package/src/http/app.ts +1114 -0
- package/src/install/claude-code.ts +128 -0
- package/src/install/codex.ts +367 -0
- package/src/install/hermes-agent.ts +76 -0
- package/src/install/hermes.ts +78 -0
- package/src/install/ollama.ts +208 -0
- package/src/install/setup.ts +368 -0
- package/src/llm/classifier-box.ts +64 -0
- package/src/llm/deepseek-client.ts +150 -0
- package/src/llm/env-autoload.ts +55 -0
- package/src/llm/ollama-client.ts +189 -0
- package/src/mcp/server.ts +534 -0
- package/src/ports/fact-store.ts +102 -0
- package/src/ports/llm-client.ts +52 -0
- package/src/ports/logger.ts +16 -0
- package/src/ports/session-store.ts +45 -0
- package/src/ports/transcript-adapter.ts +55 -0
- package/src/shared/types.ts +145 -0
- package/src/ui/App.tsx +58 -0
- package/src/ui/components/PromoteOpenButton.tsx +65 -0
- package/src/ui/components/SessionDrawer.tsx +136 -0
- package/src/ui/components/SideNav.tsx +162 -0
- package/src/ui/components/Skeleton.tsx +107 -0
- package/src/ui/index.html +13 -0
- package/src/ui/lib/actions.ts +30 -0
- package/src/ui/lib/api.ts +92 -0
- package/src/ui/lib/dataset.ts +141 -0
- package/src/ui/lib/registries.ts +155 -0
- package/src/ui/lib/view-settings.ts +41 -0
- package/src/ui/main.tsx +15 -0
- package/src/ui/pages/Live.tsx +229 -0
- package/src/ui/pages/Pulse.tsx +415 -0
- package/src/ui/pages/Recall.tsx +190 -0
- package/src/ui/pages/River.tsx +308 -0
- package/src/ui/pages/Search.tsx +93 -0
- package/src/ui/pages/Stub.tsx +9 -0
- package/src/ui/pages/Thread.tsx +262 -0
- package/src/ui/pages/settings/Classifier.tsx +227 -0
- package/src/ui/pages/settings/Data.tsx +190 -0
- package/src/ui/pages/settings/Index.tsx +65 -0
- package/src/ui/pages/settings/Labels.tsx +224 -0
- package/src/ui/pages/settings/Providers.tsx +305 -0
- package/src/ui/pages/settings/SettingsSubnav.tsx +28 -0
- package/src/ui/pages/settings/Sources.tsx +326 -0
- package/src/ui/pages/settings/Views.tsx +96 -0
- package/src/ui/styles.css +1766 -0
- package/src/ui/tsconfig.json +21 -0
- package/src/ui/vite.config.ts +19 -0
- package/tests/fixtures/claude_code/short_session.jsonl +2 -0
- package/tests/fixtures/claude_code/standard_iso.jsonl +4 -0
- package/tests/fixtures/claude_code/tool_heavy.jsonl +8 -0
- package/tests/fixtures/claude_code/with_subagent.jsonl +7 -0
- package/tests/fixtures/facts.ts +17 -0
- package/tests/fixtures/golden-corpus.ts +85 -0
- package/tests/fixtures/hermes/paired_request_dump.json +24 -0
- package/tests/fixtures/hermes/paired_session.json +23 -0
- package/tests/fixtures/hermes/request_dump.json +28 -0
- package/tests/fixtures/hermes/session_iso.json +38 -0
- package/tests/fixtures/hermes/session_unix.json +38 -0
- package/tests/fixtures/hermes/system_only.json +18 -0
- package/tests/fixtures/pi/error-connection-abort.jsonl +8 -0
- package/tests/fixtures/pi/short-successful.jsonl +5 -0
- package/tests/fixtures/pi/with-custom-message.jsonl +6 -0
- package/tests/fixtures/sessions.ts +22 -0
- package/tests/integration/backfill-facts.test.ts +362 -0
- package/tests/integration/citation-explicit.test.ts +111 -0
- package/tests/integration/cite-event.test.ts +169 -0
- package/tests/integration/cite-memo.test.ts +87 -0
- package/tests/integration/db-restore.test.ts +153 -0
- package/tests/integration/embed-backfill.test.ts +176 -0
- package/tests/integration/fact-supersedence.test.ts +313 -0
- package/tests/integration/fts-index.test.ts +60 -0
- package/tests/integration/getbyids-sqlite.test.ts +60 -0
- package/tests/integration/hermes-agent-hooks.test.ts +248 -0
- package/tests/integration/hook-claude-settings.test.ts +205 -0
- package/tests/integration/hook-log.test.ts +54 -0
- package/tests/integration/hook-memo.test.ts +68 -0
- package/tests/integration/hook-pre-compact.test.ts +105 -0
- package/tests/integration/hook-subagent-start.test.ts +102 -0
- package/tests/integration/http.test.ts +401 -0
- package/tests/integration/keyword-search-fts.test.ts +66 -0
- package/tests/integration/mcp-recall-logging.test.ts +88 -0
- package/tests/integration/mcp.test.ts +248 -0
- package/tests/integration/memo-sweep.test.ts +91 -0
- package/tests/integration/prompt-recall-hook.test.ts +88 -0
- package/tests/integration/provider-registry.test.ts +107 -0
- package/tests/integration/recall-golden.test.ts +59 -0
- package/tests/integration/recall-sqlite.test.ts +169 -0
- package/tests/integration/scheduler.test.ts +391 -0
- package/tests/integration/session-end-hook.test.ts +48 -0
- package/tests/integration/session-start-hook.test.ts +126 -0
- package/tests/integration/source-registry.test.ts +120 -0
- package/tests/integration/sqlite-fact-store.test.ts +346 -0
- package/tests/integration/stop-hook.test.ts +560 -0
- package/tests/integration/wal-checkpoint.test.ts +49 -0
- package/tests/unit/cli/launchctl-helpers.test.ts +60 -0
- package/tests/unit/core/adapters/aider.test.ts +230 -0
- package/tests/unit/core/adapters/claude-code.test.ts +118 -0
- package/tests/unit/core/adapters/hermes-agent.test.ts +329 -0
- package/tests/unit/core/adapters/hermes.test.ts +81 -0
- package/tests/unit/core/adapters/jsonl-generic.test.ts +142 -0
- package/tests/unit/core/adapters/opencode.test.ts +354 -0
- package/tests/unit/core/adapters/pi.test.ts +110 -0
- package/tests/unit/core/classifier/prompt.test.ts +126 -0
- package/tests/unit/core/embedding/chunk-body.test.ts +100 -0
- package/tests/unit/core/facts/extract-facts.test.ts +117 -0
- package/tests/unit/core/filter.test.ts +40 -0
- package/tests/unit/core/hook/citation-detect-cite-session.test.ts +96 -0
- package/tests/unit/core/hook/citation-detect.test.ts +124 -0
- package/tests/unit/core/hook/gate.test.ts +29 -0
- package/tests/unit/core/hook/pointer-block.test.ts +22 -0
- package/tests/unit/core/hook/select.test.ts +66 -0
- package/tests/unit/core/match-fields.test.ts +39 -0
- package/tests/unit/core/mcp-cite-session.test.ts +51 -0
- package/tests/unit/core/providers/provider-models.test.ts +101 -0
- package/tests/unit/core/query-shape.test.ts +92 -0
- package/tests/unit/core/recall-facts/fact-recall-service.test.ts +258 -0
- package/tests/unit/core/recall-service.test.ts +200 -0
- package/tests/unit/core/storage/live-status.test.ts +54 -0
- package/tests/unit/core/tokenize.test.ts +32 -0
- package/tests/unit/core/useful-scan.test.ts +537 -0
- package/tests/unit/llm/embed.test.ts +93 -0
- package/tests/unit/llm/ollama-client.test.ts +124 -0
- package/tests/unit/scripts/longmemeval-scorer.test.ts +114 -0
- package/tsconfig.json +31 -0
- package/tsconfig.test.json +11 -0
- package/vitest.config.ts +22 -0
|
@@ -0,0 +1,87 @@
|
|
|
1
|
+
import { mkdtempSync, readdirSync, rmSync, writeFileSync } from "node:fs";
|
|
2
|
+
import { tmpdir } from "node:os";
|
|
3
|
+
import { join } from "node:path";
|
|
4
|
+
import { afterEach, beforeEach, describe, expect, it } from "vitest";
|
|
5
|
+
import {
|
|
6
|
+
clearCited,
|
|
7
|
+
loadCited,
|
|
8
|
+
recordCited,
|
|
9
|
+
} from "../../src/core/hook/cite-memo.js";
|
|
10
|
+
|
|
11
|
+
/**
 * Integration tests for the per-conversation "cited" memo.
 *
 * Every test runs against a fresh temporary directory that is exposed to the
 * module under test through the `NLM_HOOK_STATE_DIR` environment variable.
 * The variable's previous value is restored afterwards so the suite does not
 * leak environment changes into whatever runs next in the same process.
 */
describe("cite-memo", () => {
  let tmp: string;
  let previousStateDir: string | undefined;

  beforeEach(() => {
    previousStateDir = process.env["NLM_HOOK_STATE_DIR"];
    tmp = mkdtempSync(join(tmpdir(), "nlm-cite-memo-"));
    process.env["NLM_HOOK_STATE_DIR"] = tmp;
  });

  afterEach(() => {
    // Restore rather than blindly delete: the variable may have been set
    // before this suite started.
    if (previousStateDir === undefined) {
      delete process.env["NLM_HOOK_STATE_DIR"];
    } else {
      process.env["NLM_HOOK_STATE_DIR"] = previousStateDir;
    }
    rmSync(tmp, { recursive: true, force: true });
  });

  it("loadCited returns empty set when no memo file exists", () => {
    expect(loadCited("conv-x").size).toBe(0);
  });

  it("recordCited persists ids; loadCited returns them on next call", () => {
    recordCited("conv-x", ["cc_a", "cc_b"]);
    expect(loadCited("conv-x")).toEqual(new Set(["cc_a", "cc_b"]));
  });

  it("recordCited unions across calls (does not overwrite)", () => {
    recordCited("conv-x", ["cc_a"]);
    recordCited("conv-x", ["cc_b", "cc_a"]);
    expect(loadCited("conv-x")).toEqual(new Set(["cc_a", "cc_b"]));
  });

  it("recordCited with empty list is a no-op (no file created)", () => {
    recordCited("conv-empty", []);
    expect(readdirSync(tmp).filter((f) => f.startsWith("conv-empty"))).toEqual([]);
  });

  it("clearCited removes the file and returns true; second call returns false", () => {
    recordCited("conv-x", ["cc_a"]);
    expect(clearCited("conv-x")).toBe(true);
    expect(clearCited("conv-x")).toBe(false);
    expect(loadCited("conv-x").size).toBe(0);
  });

  it("uses .cited.json filename suffix — parallel to surfaced memo's .json", () => {
    recordCited("conv-x", ["cc_a"]);
    const files = readdirSync(tmp);
    expect(files).toContain("conv-x.cited.json");
  });

  it("treats corrupt JSON as empty without throwing", () => {
    writeFileSync(join(tmp, "conv-bad.cited.json"), "not json", "utf8");
    expect(loadCited("conv-bad").size).toBe(0);
  });

  it("treats non-array JSON as empty without throwing", () => {
    writeFileSync(
      join(tmp, "conv-obj.cited.json"),
      JSON.stringify({ cc_a: 1 }),
      "utf8",
    );
    expect(loadCited("conv-obj").size).toBe(0);
  });

  it("filters out non-string entries from the persisted array", () => {
    writeFileSync(
      join(tmp, "conv-mixed.cited.json"),
      JSON.stringify(["cc_a", 42, null, "cc_b"]),
      "utf8",
    );
    expect(loadCited("conv-mixed")).toEqual(new Set(["cc_a", "cc_b"]));
  });

  it("sanitizes unsafe conversation IDs so the path stays inside the state dir", () => {
    // Nest the state dir one level below `tmp`. If the "../" segment were
    // honoured, the memo would be written into `tmp` itself, where the escape
    // is observable (and still removed by afterEach).
    const stateDir = mkdtempSync(join(tmp, "state-"));
    process.env["NLM_HOOK_STATE_DIR"] = stateDir;

    recordCited("../escape/attempt", ["cc_a"]);

    // The memo was written directly inside the state dir...
    expect(readdirSync(stateDir).some((f) => f.endsWith(".cited.json"))).toBe(true);
    // ...and nothing was created next to it. (readdirSync never lists "." or
    // "..", so checking for those names would prove nothing.)
    expect(readdirSync(tmp).map((f) => join(tmp, f))).toEqual([stateDir]);
  });
});
|
|
@@ -0,0 +1,153 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Backup + restore integration. Real SQLite stores, VACUUM INTO snapshot,
|
|
3
|
+
* candidate validation, staged restore, and boot-time promotion.
|
|
4
|
+
*/
|
|
5
|
+
|
|
6
|
+
import { existsSync, mkdtempSync, readdirSync, rmSync, statSync, writeFileSync } from "node:fs";
|
|
7
|
+
import { tmpdir } from "node:os";
|
|
8
|
+
import { join, resolve } from "node:path";
|
|
9
|
+
import { afterEach, beforeEach, describe, expect, it } from "vitest";
|
|
10
|
+
import type Database from "better-sqlite3";
|
|
11
|
+
import { SqliteSessionStore } from "../../src/core/storage/sqlite-session-store.js";
|
|
12
|
+
import {
|
|
13
|
+
PENDING_SUFFIX,
|
|
14
|
+
applyPendingRestore,
|
|
15
|
+
snapshotScratchPath,
|
|
16
|
+
stageRestore,
|
|
17
|
+
validateRestoreCandidate,
|
|
18
|
+
vacuumSnapshot,
|
|
19
|
+
} from "../../src/core/storage/db-restore.js";
|
|
20
|
+
|
|
21
|
+
const MIGRATIONS_DIR = resolve(__dirname, "../../migrations");
|
|
22
|
+
|
|
23
|
+
/**
 * Inserts one enabled `webhook` row into the `sources` table so that two
 * otherwise identical databases can be told apart by the row's name.
 *
 * @param db - Open database handle the row is written to.
 * @param name - Value bound to the `name` column.
 * @param runtimeLabel - Value bound to the `runtime_label` column.
 */
function insertMarkerSource(db: Database.Database, name: string, runtimeLabel: string): void {
  const columnsClause =
    "INSERT INTO sources (kind, name, path_or_url, runtime_label, parse_config, enabled) ";
  const valuesClause = "VALUES ('webhook', ?, NULL, ?, '{}', 1)";

  // Only the two caller-supplied values are bound; everything else is fixed.
  const insertStatement = db.prepare(columnsClause + valuesClause);
  insertStatement.run(name, runtimeLabel);
}
|
|
29
|
+
|
|
30
|
+
describe("db-restore", () => {
|
|
31
|
+
let tmp: string;
|
|
32
|
+
let dbPath: string;
|
|
33
|
+
|
|
34
|
+
beforeEach(() => {
|
|
35
|
+
tmp = mkdtempSync(join(tmpdir(), "nlm-restore-"));
|
|
36
|
+
dbPath = join(tmp, "canonical.sqlite");
|
|
37
|
+
});
|
|
38
|
+
|
|
39
|
+
afterEach(() => {
|
|
40
|
+
rmSync(tmp, { recursive: true, force: true });
|
|
41
|
+
});
|
|
42
|
+
|
|
43
|
+
/**
 * Builds a `SqliteSessionStore` for the database file at `path`, pointing it
 * at the shared migrations directory used by this test file.
 *
 * @param path - Location of the SQLite database file.
 * @returns The newly constructed store.
 */
function freshStore(path: string): SqliteSessionStore {
  const storeOptions = { dbPath: path, migrationsDir: MIGRATIONS_DIR };
  return new SqliteSessionStore(storeOptions);
}
|
|
46
|
+
|
|
47
|
+
it("vacuumSnapshot writes a valid standalone copy", () => {
|
|
48
|
+
const store = freshStore(dbPath);
|
|
49
|
+
const snap = snapshotScratchPath(dbPath);
|
|
50
|
+
const bytes = vacuumSnapshot(store.rawDb(), snap);
|
|
51
|
+
store.close();
|
|
52
|
+
|
|
53
|
+
expect(bytes).toBeGreaterThan(0);
|
|
54
|
+
expect(statSync(snap).size).toBe(bytes);
|
|
55
|
+
expect(validateRestoreCandidate(snap).ok).toBe(true);
|
|
56
|
+
rmSync(snap, { force: true });
|
|
57
|
+
});
|
|
58
|
+
|
|
59
|
+
it("validateRestoreCandidate rejects a non-SQLite file", () => {
|
|
60
|
+
const junk = join(tmp, "junk.sqlite");
|
|
61
|
+
writeFileSync(junk, "this is not a database");
|
|
62
|
+
const result = validateRestoreCandidate(junk);
|
|
63
|
+
expect(result.ok).toBe(false);
|
|
64
|
+
expect(result.error).toBeTruthy();
|
|
65
|
+
});
|
|
66
|
+
|
|
67
|
+
it("validateRestoreCandidate rejects a SQLite file lacking nlm tables", () => {
|
|
68
|
+
const bare = join(tmp, "bare.sqlite");
|
|
69
|
+
const store = freshStore(bare);
|
|
70
|
+
store.rawDb().prepare("DROP TABLE sessions").run();
|
|
71
|
+
store.close();
|
|
72
|
+
const result = validateRestoreCandidate(bare);
|
|
73
|
+
expect(result.ok).toBe(false);
|
|
74
|
+
expect(result.error).toMatch(/sessions/);
|
|
75
|
+
});
|
|
76
|
+
|
|
77
|
+
it("validateRestoreCandidate reports session count and schema version", () => {
|
|
78
|
+
const store = freshStore(dbPath);
|
|
79
|
+
const snap = snapshotScratchPath(dbPath);
|
|
80
|
+
vacuumSnapshot(store.rawDb(), snap);
|
|
81
|
+
store.close();
|
|
82
|
+
|
|
83
|
+
const result = validateRestoreCandidate(snap);
|
|
84
|
+
expect(result.ok).toBe(true);
|
|
85
|
+
expect(result.sessions).toBe(0);
|
|
86
|
+
expect(result.schemaVersion).toBeGreaterThanOrEqual(0);
|
|
87
|
+
rmSync(snap, { force: true });
|
|
88
|
+
});
|
|
89
|
+
|
|
90
|
+
it("stageRestore parks a valid candidate at the pending path", () => {
|
|
91
|
+
const store = freshStore(dbPath);
|
|
92
|
+
const snap = snapshotScratchPath(dbPath);
|
|
93
|
+
vacuumSnapshot(store.rawDb(), snap);
|
|
94
|
+
store.close();
|
|
95
|
+
|
|
96
|
+
const result = stageRestore(dbPath, snap);
|
|
97
|
+
expect(result.ok).toBe(true);
|
|
98
|
+
expect(existsSync(dbPath + PENDING_SUFFIX)).toBe(true);
|
|
99
|
+
expect(existsSync(snap)).toBe(false); // candidate was renamed, not copied
|
|
100
|
+
});
|
|
101
|
+
|
|
102
|
+
it("stageRestore removes the candidate when validation fails", () => {
  // A plain-text file posing as a database.
  const bogusPath = join(tmp, "junk.sqlite");
  writeFileSync(bogusPath, "not a database");

  const outcome = stageRestore(dbPath, bogusPath);

  expect(outcome.ok).toBe(false);
  // The rejected candidate is deleted and nothing is left at the pending path.
  expect(existsSync(bogusPath)).toBe(false);
  const pendingPath = dbPath + PENDING_SUFFIX;
  expect(existsSync(pendingPath)).toBe(false);
});
|
|
110
|
+
|
|
111
|
+
it("applyPendingRestore is a no-op when nothing is staged", () => {
  // Create the store and close it again; stageRestore is never called here.
  const liveStore = freshStore(dbPath);
  liveStore.close();

  const outcome = applyPendingRestore(dbPath);

  expect(outcome.applied).toBe(false);
});
|
|
116
|
+
|
|
117
|
+
it("applyPendingRestore promotes the staged DB and archives the current one", () => {
  // Live DB: tagged with its own marker source so the two stores can be told apart.
  const liveStore = freshStore(dbPath);
  insertMarkerSource(liveStore.rawDb(), "marker-current", "current");
  liveStore.close();

  // Replacement DB: built at a separate path and tagged with a different marker.
  const replacementPath = join(tmp, "staged-src.sqlite");
  const replacementStore = freshStore(replacementPath);
  insertMarkerSource(replacementStore.rawDb(), "marker-staged", "staged");
  const candidatePath = snapshotScratchPath(dbPath);
  vacuumSnapshot(replacementStore.rawDb(), candidatePath);
  replacementStore.close();

  const staging = stageRestore(dbPath, candidatePath);
  expect(staging.ok).toBe(true);

  const outcome = applyPendingRestore(dbPath);
  expect(outcome.applied).toBe(true);
  expect(outcome.archivedTo).toBeTruthy();
  expect(existsSync(outcome.archivedTo!)).toBe(true);
  // The pending file is gone once the restore has been applied.
  expect(existsSync(dbPath + PENDING_SUFFIX)).toBe(false);

  // Reopening the DB path must show the replacement's marker, not the old one.
  const promotedStore = freshStore(dbPath);
  const sourceRows = promotedStore
    .rawDb()
    .prepare<[], { name: string }>("SELECT name FROM sources")
    .all();
  const sourceNames = sourceRows.map((row) => row.name);
  promotedStore.close();
  expect(sourceNames).toContain("marker-staged");
  expect(sourceNames).not.toContain("marker-current");

  // Exactly one pre-restore archive should exist in the temp directory.
  const archiveFiles = readdirSync(tmp).filter((entry) => entry.includes(".pre-restore-"));
  expect(archiveFiles.length).toBe(1);
});
|
|
153
|
+
});
|
|
@@ -0,0 +1,176 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Integration tests for embed-backfill + embed-normalize against a real
|
|
3
|
+
* SQLite + sqlite-vec store. No network: a deterministic fake LLMClient
|
|
4
|
+
* stands in for Ollama.
|
|
5
|
+
*/
|
|
6
|
+
|
|
7
|
+
import { mkdtempSync, rmSync, existsSync } from "node:fs";
|
|
8
|
+
import { tmpdir } from "node:os";
|
|
9
|
+
import { join, resolve } from "node:path";
|
|
10
|
+
import { afterEach, beforeEach, describe, expect, it } from "vitest";
|
|
11
|
+
import Database from "better-sqlite3";
|
|
12
|
+
import * as sqliteVec from "sqlite-vec";
|
|
13
|
+
import { SqliteSessionStore } from "../../src/core/storage/sqlite-session-store.js";
|
|
14
|
+
import { reembedCorpus } from "../../src/core/embedding/embed-backfill.js";
|
|
15
|
+
import { normalizeEmbeddings } from "../../src/core/embedding/embed-normalize.js";
|
|
16
|
+
import type { EmbedResult, LLMClient } from "../../src/ports/llm-client.js";
|
|
17
|
+
import type { Session } from "../../src/shared/types.js";
|
|
18
|
+
import { makeSession } from "../fixtures/sessions.js";
|
|
19
|
+
|
|
20
|
+
// Migrations directory, resolved two levels above this test file's directory;
// passed as `migrationsDir` to every SqliteSessionStore created in this file.
const MIGRATIONS_DIR = resolve(__dirname, "../../migrations");
|
|
21
|
+
|
|
22
|
+
/**
 * Builds a 768-element vector whose only non-zero component is the first one,
 * then scales it to unit length.
 *
 * Because a single component carries all the magnitude, any finite non-zero
 * `value` collapses to +1 or -1 in slot 0 after scaling. A zero `value` yields
 * the all-zero vector (the norm falls back to 1 to avoid dividing by zero).
 *
 * @param value - Number placed in slot 0 before normalization.
 * @returns A new normalized Float32Array of length 768.
 */
function unitWithLeading(value: number): Float32Array {
  const raw = new Float32Array(768);
  raw[0] = value;

  // Euclidean norm; `|| 1` covers a zero (or NaN) norm.
  const squaredSum = raw.reduce((acc, component) => acc + component ** 2, 0);
  const norm = Math.sqrt(squaredSum) || 1;

  return raw.map((component) => component / norm);
}
|
|
32
|
+
|
|
33
|
+
/**
 * Network-free LLMClient used by the tests in this file.
 *
 * `calls` counts how many times `embed` has been invoked so tests can assert
 * on the number of embedding requests.
 */
class DeterministicEmbedder implements LLMClient {
  calls = 0;

  /**
   * Returns a stable unit-length vector tagged with model "fake".
   *
   * The call counter is passed to unitWithLeading as the leading value, but
   * normalization cancels it out, so every call produces the same vector
   * (1 in slot 0, zeros elsewhere).
   */
  async embed(): Promise<EmbedResult> {
    const callNumber = ++this.calls;
    const vector = unitWithLeading(callNumber);
    return { vector, model: "fake" };
  }

  /** Classification is never exercised by these tests; always rejects. */
  async classify(): Promise<never> {
    throw new Error("not used");
  }
}
|
|
44
|
+
|
|
45
|
+
// Three fixture sessions as (id, label, body) rows; the reembedCorpus suite
// inserts them into the store in its beforeEach.
const seed: ReadonlyArray<Session> = (
  [
    ["s_a", "Hono setup", "wired Hono routes"],
    ["s_b", "pgvector plan", "drafted pgvector swap"],
    ["s_c", "tx tax county", "ingested county directory"],
  ] as const
).map(([id, label, body]) => makeSession({ id, label, body }));
|
|
50
|
+
|
|
51
|
+
describe("reembedCorpus", () => {
  let tmp: string;
  let dbPath: string;
  let statePath: string;

  // Every test starts from its own temp directory containing a store that
  // holds the `seed` sessions, each with one placeholder embedding.
  beforeEach(() => {
    tmp = mkdtempSync(join(tmpdir(), "nlm-emb-"));
    dbPath = join(tmp, "canonical.sqlite");
    statePath = join(tmp, "state.json");

    const seededStore = new SqliteSessionStore({ dbPath, migrationsDir: MIGRATIONS_DIR });
    seed.forEach((session) => {
      seededStore.insertSessionForTest(session);
      // Non-normalized vector, so the backfill has something to replace.
      seededStore.insertEmbeddingForTest(session.id, new Float32Array(768).fill(0.5));
    });
    seededStore.close();
  });

  afterEach(() => {
    rmSync(tmp, { recursive: true, force: true });
  });

  it("replaces every embedding and writes a state file", async () => {
    const embedder = new DeterministicEmbedder();

    const report = await reembedCorpus({ dbPath, embedder, statePath });

    expect(report.dbMissing).toBe(false);
    expect(report.total).toBe(3);
    expect(report.succeeded).toBe(3);
    expect(report.failed).toBe(0);
    expect(report.skippedAlreadyDone).toBe(0);
    // One embed call per seeded session.
    expect(embedder.calls).toBe(3);
    expect(existsSync(statePath)).toBe(true);
  });

  it("is resumable — second run skips ids already in state", async () => {
    // First pass processes everything and records progress at statePath.
    const firstPass = new DeterministicEmbedder();
    await reembedCorpus({ dbPath, embedder: firstPass, statePath });

    // Second pass reuses the same state file and must not embed anything.
    const secondPass = new DeterministicEmbedder();
    const report = await reembedCorpus({ dbPath, embedder: secondPass, statePath });

    expect(report.skippedAlreadyDone).toBe(3);
    expect(report.succeeded).toBe(0);
    expect(secondPass.calls).toBe(0);
  });

  it("respects --limit", async () => {
    const embedder = new DeterministicEmbedder();

    const report = await reembedCorpus({ dbPath, embedder, statePath, limit: 2 });

    expect(report.total).toBe(2);
    expect(report.succeeded).toBe(2);
  });
});
|
|
100
|
+
|
|
101
|
+
describe("normalizeEmbeddings", () => {
  let tmp: string;
  let dbPath: string;

  // Opens the DB, reads the stored embedding blob for one session, and closes
  // the connection again.
  const readEmbeddingBlob = (sessionId: string): Buffer => {
    const conn = new Database(dbPath);
    sqliteVec.load(conn);
    const blob = conn
      .prepare<[string], { embedding: Buffer }>(
        "SELECT embedding FROM session_embeddings WHERE session_id = ?",
      )
      .get(sessionId)!.embedding;
    conn.close();
    return blob;
  };

  beforeEach(() => {
    tmp = mkdtempSync(join(tmpdir(), "nlm-norm-"));
    dbPath = join(tmp, "canonical.sqlite");

    const sessionStore = new SqliteSessionStore({ dbPath, migrationsDir: MIGRATIONS_DIR });
    for (const id of ["raw", "already", "zero"]) {
      sessionStore.insertSessionForTest(makeSession({ id }));
    }
    sessionStore.close();

    // embed-normalize works on the legacy session_embeddings table, which
    // migration 003 still creates (kept for rollback safety after the chunk +
    // max-pool migration). The session store's helpers now write to
    // session_embedding_chunks, so the rows are seeded here with raw SQL.
    const conn = new Database(dbPath);
    sqliteVec.load(conn);
    const insertRow = conn.prepare(
      "INSERT INTO session_embeddings (session_id, embedding) VALUES (?, ?)",
    );
    const asBlob = (vec: Float32Array): Buffer =>
      Buffer.from(vec.buffer, vec.byteOffset, vec.byteLength);

    // "already" is a unit vector: a single component set to 1.0.
    const unitVector = new Float32Array(768);
    unitVector[0] = 1;

    const fixtures: ReadonlyArray<readonly [string, Float32Array]> = [
      // "raw" is non-unit: ||v|| = sqrt(768 * 0.25) ≈ 13.86.
      ["raw", new Float32Array(768).fill(0.5)],
      ["already", unitVector],
      // "zero" is the all-zero vector.
      ["zero", new Float32Array(768)],
    ];
    for (const [sessionId, vec] of fixtures) {
      insertRow.run(sessionId, asBlob(vec));
    }
    conn.close();
  });

  afterEach(() => {
    rmSync(tmp, { recursive: true, force: true });
  });

  it("rewrites only the non-unit non-zero row", () => {
    const report = normalizeEmbeddings({ dbPath });

    expect(report.total).toBe(3);
    expect(report.rewritten).toBe(1);
    expect(report.alreadyNormalized).toBe(1);
    expect(report.zeroVector).toBe(1);
  });

  it("dry-run reports the same counts without writing", () => {
    const blobBefore = readEmbeddingBlob("raw");

    const report = normalizeEmbeddings({ dbPath, dryRun: true });
    expect(report.rewritten).toBe(1);
    expect(report.dryRun).toBe(true);

    // The stored bytes for "raw" must be untouched by a dry run.
    const blobAfter = readEmbeddingBlob("raw");
    expect(blobAfter.equals(blobBefore)).toBe(true);
  });

  it("is idempotent — second run rewrites nothing", () => {
    normalizeEmbeddings({ dbPath });

    const secondReport = normalizeEmbeddings({ dbPath });

    expect(secondReport.rewritten).toBe(0);
    expect(secondReport.alreadyNormalized).toBe(2); // raw is now unit too
  });
});
|