nlm-memory 0.4.2 → 0.5.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (285) hide show
  1. package/README.md +72 -34
  2. package/dist/cli/nlm.js +223 -33
  3. package/dist/cli/nlm.js.map +1 -1
  4. package/dist/core/adapters/cursor.d.ts +45 -0
  5. package/dist/core/adapters/cursor.js +397 -0
  6. package/dist/core/adapters/cursor.js.map +1 -0
  7. package/dist/core/adapters/from-source.js +10 -0
  8. package/dist/core/adapters/from-source.js.map +1 -1
  9. package/dist/core/adapters/windsurf.d.ts +44 -0
  10. package/dist/core/adapters/windsurf.js +299 -0
  11. package/dist/core/adapters/windsurf.js.map +1 -0
  12. package/dist/core/hook/claude-settings.d.ts +12 -5
  13. package/dist/core/hook/claude-settings.js +21 -6
  14. package/dist/core/hook/claude-settings.js.map +1 -1
  15. package/dist/core/sources/source-registry.d.ts +1 -1
  16. package/dist/core/sources/source-registry.js +18 -0
  17. package/dist/core/sources/source-registry.js.map +1 -1
  18. package/dist/core/storage/sqlite-session-store.d.ts +2 -0
  19. package/dist/core/storage/sqlite-session-store.js +38 -2
  20. package/dist/core/storage/sqlite-session-store.js.map +1 -1
  21. package/dist/hook/hook-auth.d.ts +13 -0
  22. package/dist/hook/hook-auth.js +19 -0
  23. package/dist/hook/hook-auth.js.map +1 -0
  24. package/dist/hook/prompt-recall-hook.js +7 -1
  25. package/dist/hook/prompt-recall-hook.js.map +1 -1
  26. package/dist/hook/session-start-hook.js +4 -1
  27. package/dist/hook/session-start-hook.js.map +1 -1
  28. package/dist/hook/stop-hook.js +4 -1
  29. package/dist/hook/stop-hook.js.map +1 -1
  30. package/dist/http/app.d.ts +2 -0
  31. package/dist/http/app.js +76 -1
  32. package/dist/http/app.js.map +1 -1
  33. package/dist/install/claude-code.js +1 -1
  34. package/dist/install/claude-code.js.map +1 -1
  35. package/dist/install/cursor.d.ts +25 -0
  36. package/dist/install/cursor.js +43 -0
  37. package/dist/install/cursor.js.map +1 -0
  38. package/dist/install/nlm-dir-perms.d.ts +19 -0
  39. package/dist/install/nlm-dir-perms.js +43 -0
  40. package/dist/install/nlm-dir-perms.js.map +1 -0
  41. package/dist/install/ollama.d.ts +18 -1
  42. package/dist/install/ollama.js +62 -7
  43. package/dist/install/ollama.js.map +1 -1
  44. package/dist/install/setup.d.ts +4 -0
  45. package/dist/install/setup.js +141 -18
  46. package/dist/install/setup.js.map +1 -1
  47. package/dist/install/windsurf.d.ts +25 -0
  48. package/dist/install/windsurf.js +43 -0
  49. package/dist/install/windsurf.js.map +1 -0
  50. package/dist/mcp/server.js +20 -1
  51. package/dist/mcp/server.js.map +1 -1
  52. package/dist/shared/types.d.ts +4 -0
  53. package/dist/ui/assets/{index-BA6IpU8g.css → index-Beo8psd-.css} +1 -1
  54. package/dist/ui/assets/index-CSPTTeeM.js +69 -0
  55. package/dist/ui/index.html +2 -2
  56. package/package.json +26 -1
  57. package/plugin/scripts/prompt-recall-hook.mjs +55 -4
  58. package/plugin/scripts/stop-hook.mjs +57 -6
  59. package/.agents/plugins/marketplace.json +0 -20
  60. package/.github/workflows/ci.yml +0 -30
  61. package/dist/ui/assets/index-B_qIVV0k.js +0 -69
  62. package/docs/methodology/re-derivation-rate.md +0 -112
  63. package/docs/methodology/useful-hit-rate.md +0 -79
  64. package/docs/plans/2026-05-20-fts5-lexical-recall.md +0 -1088
  65. package/docs/plans/2026-05-20-recall-daemon-wedge-fix.md +0 -662
  66. package/docs/plans/2026-05-20-recall-hook-design.md +0 -131
  67. package/docs/plans/2026-05-20-recall-hook-implementation.md +0 -1222
  68. package/docs/plans/desktop-product.md +0 -69
  69. package/docs/plans/factstore-design.md +0 -236
  70. package/logs/CHANGELOG/CHANGELOG-2026.md +0 -1389
  71. package/logs/CHANGELOG/CHANGELOG.md +0 -337
  72. package/migrations/000_initial_schema.sql +0 -174
  73. package/migrations/001_entity_type_rename.sql +0 -17
  74. package/migrations/002_adapter_state_extend.sql +0 -12
  75. package/migrations/003_session_embeddings.sql +0 -11
  76. package/migrations/004_facts.sql +0 -46
  77. package/migrations/005_sources.sql +0 -31
  78. package/migrations/006_providers.sql +0 -33
  79. package/migrations/007_source_tokens.sql +0 -17
  80. package/migrations/008_fts_rebuild.sql +0 -9
  81. package/migrations/009_session_embedding_chunks.sql +0 -46
  82. package/migrations/010_sources_opencode.sql +0 -30
  83. package/migrations/011_sources_hermes_agent.sql +0 -30
  84. package/migrations/012_sources_aider.sql +0 -30
  85. package/migrations/013_adapter_state_failure_count.sql +0 -12
  86. package/plugin-hermes-agent/README.md +0 -49
  87. package/plugin-hermes-agent/__init__.py +0 -75
  88. package/plugin-hermes-agent/plugin.yaml +0 -15
  89. package/scripts/backfill-citations.mjs +0 -0
  90. package/scripts/build-codex-plugin.mjs +0 -61
  91. package/scripts/deepseek-probe.mjs +0 -67
  92. package/scripts/extract-triples.mjs +0 -207
  93. package/scripts/longmemeval/embedding-cache.ts +0 -77
  94. package/scripts/longmemeval/fetch-dataset.sh +0 -25
  95. package/scripts/longmemeval/run-harness.ts +0 -315
  96. package/scripts/longmemeval/scorer.ts +0 -99
  97. package/scripts/longmemeval/tsconfig.json +0 -9
  98. package/scripts/longmemeval/types.ts +0 -35
  99. package/scripts/nlm-daily-digest.py +0 -239
  100. package/scripts/nlm-daily-digest.sh +0 -28
  101. package/src/cli/classify-parity.ts +0 -257
  102. package/src/cli/launchctl-helpers.ts +0 -49
  103. package/src/cli/nlm.ts +0 -885
  104. package/src/core/actions/actions-log.ts +0 -118
  105. package/src/core/actions/overlay.ts +0 -117
  106. package/src/core/adapters/aider.ts +0 -205
  107. package/src/core/adapters/claude-code.ts +0 -293
  108. package/src/core/adapters/common.ts +0 -54
  109. package/src/core/adapters/from-source.ts +0 -57
  110. package/src/core/adapters/hermes-agent.ts +0 -240
  111. package/src/core/adapters/hermes.ts +0 -277
  112. package/src/core/adapters/jsonl-generic.ts +0 -208
  113. package/src/core/adapters/opencode.ts +0 -281
  114. package/src/core/adapters/pi.ts +0 -264
  115. package/src/core/classifier/prompt.ts +0 -200
  116. package/src/core/dataset/build-dataset.ts +0 -463
  117. package/src/core/embedding/chunk-body.ts +0 -76
  118. package/src/core/embedding/embed-backfill.ts +0 -210
  119. package/src/core/embedding/embed-normalize.ts +0 -135
  120. package/src/core/facts/backfill-facts.ts +0 -254
  121. package/src/core/facts/extract-facts.ts +0 -50
  122. package/src/core/hook/citation-detect.ts +0 -124
  123. package/src/core/hook/cite-memo.ts +0 -68
  124. package/src/core/hook/claude-settings.ts +0 -166
  125. package/src/core/hook/gate.ts +0 -25
  126. package/src/core/hook/hook-log.ts +0 -41
  127. package/src/core/hook/memo-sweep.ts +0 -164
  128. package/src/core/hook/memo.ts +0 -67
  129. package/src/core/hook/pointer-block.ts +0 -26
  130. package/src/core/hook/select.ts +0 -32
  131. package/src/core/hook/transcript.ts +0 -121
  132. package/src/core/ingest/ingest-session.ts +0 -111
  133. package/src/core/providers/provider-models.ts +0 -100
  134. package/src/core/providers/provider-registry.ts +0 -196
  135. package/src/core/recall/citation-log.ts +0 -108
  136. package/src/core/recall/filter.ts +0 -27
  137. package/src/core/recall/index.ts +0 -6
  138. package/src/core/recall/match-fields.ts +0 -40
  139. package/src/core/recall/query-log.ts +0 -149
  140. package/src/core/recall/query-shape.ts +0 -66
  141. package/src/core/recall/recall-service.ts +0 -320
  142. package/src/core/recall/recent-log.ts +0 -59
  143. package/src/core/recall/tokenize.ts +0 -18
  144. package/src/core/recall/useful-scan.ts +0 -336
  145. package/src/core/recall-facts/fact-query-log.ts +0 -150
  146. package/src/core/recall-facts/fact-recall-service.ts +0 -327
  147. package/src/core/scheduler/scan-once.ts +0 -142
  148. package/src/core/scheduler/scheduler.ts +0 -225
  149. package/src/core/sources/source-registry.ts +0 -260
  150. package/src/core/storage/db-restore.ts +0 -133
  151. package/src/core/storage/live-status.ts +0 -45
  152. package/src/core/storage/migrate.ts +0 -72
  153. package/src/core/storage/sqlite-fact-store.ts +0 -304
  154. package/src/core/storage/sqlite-session-store.ts +0 -765
  155. package/src/hook/prompt-recall-hook.ts +0 -174
  156. package/src/hook/session-end-hook.ts +0 -81
  157. package/src/hook/session-start-hook.ts +0 -165
  158. package/src/hook/stop-hook.ts +0 -236
  159. package/src/http/app.ts +0 -1137
  160. package/src/install/claude-code.ts +0 -128
  161. package/src/install/codex.ts +0 -367
  162. package/src/install/hermes-agent.ts +0 -76
  163. package/src/install/hermes.ts +0 -78
  164. package/src/install/ollama.ts +0 -211
  165. package/src/install/setup.ts +0 -368
  166. package/src/llm/classifier-box.ts +0 -64
  167. package/src/llm/deepseek-client.ts +0 -150
  168. package/src/llm/env-autoload.ts +0 -55
  169. package/src/llm/ollama-client.ts +0 -189
  170. package/src/mcp/server.ts +0 -534
  171. package/src/ports/fact-store.ts +0 -102
  172. package/src/ports/llm-client.ts +0 -52
  173. package/src/ports/logger.ts +0 -16
  174. package/src/ports/session-store.ts +0 -45
  175. package/src/ports/transcript-adapter.ts +0 -55
  176. package/src/shared/types.ts +0 -145
  177. package/src/ui/App.tsx +0 -58
  178. package/src/ui/components/PromoteOpenButton.tsx +0 -65
  179. package/src/ui/components/SessionDrawer.tsx +0 -136
  180. package/src/ui/components/SideNav.tsx +0 -162
  181. package/src/ui/components/Skeleton.tsx +0 -107
  182. package/src/ui/index.html +0 -13
  183. package/src/ui/lib/actions.ts +0 -30
  184. package/src/ui/lib/api.ts +0 -92
  185. package/src/ui/lib/dataset.ts +0 -141
  186. package/src/ui/lib/registries.ts +0 -155
  187. package/src/ui/lib/view-settings.ts +0 -41
  188. package/src/ui/main.tsx +0 -15
  189. package/src/ui/pages/Live.tsx +0 -229
  190. package/src/ui/pages/Pulse.tsx +0 -415
  191. package/src/ui/pages/Recall.tsx +0 -190
  192. package/src/ui/pages/River.tsx +0 -308
  193. package/src/ui/pages/Search.tsx +0 -93
  194. package/src/ui/pages/Stub.tsx +0 -9
  195. package/src/ui/pages/Thread.tsx +0 -262
  196. package/src/ui/pages/settings/Classifier.tsx +0 -227
  197. package/src/ui/pages/settings/Data.tsx +0 -190
  198. package/src/ui/pages/settings/Index.tsx +0 -65
  199. package/src/ui/pages/settings/Labels.tsx +0 -224
  200. package/src/ui/pages/settings/Providers.tsx +0 -305
  201. package/src/ui/pages/settings/SettingsSubnav.tsx +0 -28
  202. package/src/ui/pages/settings/Sources.tsx +0 -326
  203. package/src/ui/pages/settings/Views.tsx +0 -96
  204. package/src/ui/styles.css +0 -1766
  205. package/src/ui/tsconfig.json +0 -21
  206. package/src/ui/vite.config.ts +0 -19
  207. package/tests/fixtures/claude_code/short_session.jsonl +0 -2
  208. package/tests/fixtures/claude_code/standard_iso.jsonl +0 -4
  209. package/tests/fixtures/claude_code/tool_heavy.jsonl +0 -8
  210. package/tests/fixtures/claude_code/with_subagent.jsonl +0 -7
  211. package/tests/fixtures/facts.ts +0 -17
  212. package/tests/fixtures/golden-corpus.ts +0 -85
  213. package/tests/fixtures/hermes/paired_request_dump.json +0 -24
  214. package/tests/fixtures/hermes/paired_session.json +0 -23
  215. package/tests/fixtures/hermes/request_dump.json +0 -28
  216. package/tests/fixtures/hermes/session_iso.json +0 -38
  217. package/tests/fixtures/hermes/session_unix.json +0 -38
  218. package/tests/fixtures/hermes/system_only.json +0 -18
  219. package/tests/fixtures/pi/error-connection-abort.jsonl +0 -8
  220. package/tests/fixtures/pi/short-successful.jsonl +0 -5
  221. package/tests/fixtures/pi/with-custom-message.jsonl +0 -6
  222. package/tests/fixtures/sessions.ts +0 -22
  223. package/tests/integration/backfill-facts.test.ts +0 -362
  224. package/tests/integration/citation-explicit.test.ts +0 -111
  225. package/tests/integration/cite-event.test.ts +0 -169
  226. package/tests/integration/cite-memo.test.ts +0 -87
  227. package/tests/integration/db-restore.test.ts +0 -153
  228. package/tests/integration/embed-backfill.test.ts +0 -176
  229. package/tests/integration/fact-supersedence.test.ts +0 -313
  230. package/tests/integration/fts-index.test.ts +0 -60
  231. package/tests/integration/getbyids-sqlite.test.ts +0 -60
  232. package/tests/integration/hermes-agent-hooks.test.ts +0 -248
  233. package/tests/integration/hook-claude-settings.test.ts +0 -205
  234. package/tests/integration/hook-log.test.ts +0 -54
  235. package/tests/integration/hook-memo.test.ts +0 -68
  236. package/tests/integration/hook-pre-compact.test.ts +0 -105
  237. package/tests/integration/hook-subagent-start.test.ts +0 -102
  238. package/tests/integration/http.test.ts +0 -401
  239. package/tests/integration/keyword-search-fts.test.ts +0 -66
  240. package/tests/integration/mcp-recall-logging.test.ts +0 -88
  241. package/tests/integration/mcp.test.ts +0 -248
  242. package/tests/integration/memo-sweep.test.ts +0 -91
  243. package/tests/integration/prompt-recall-hook.test.ts +0 -88
  244. package/tests/integration/provider-registry.test.ts +0 -107
  245. package/tests/integration/recall-golden.test.ts +0 -59
  246. package/tests/integration/recall-sqlite.test.ts +0 -169
  247. package/tests/integration/scheduler.test.ts +0 -391
  248. package/tests/integration/session-end-hook.test.ts +0 -48
  249. package/tests/integration/session-start-hook.test.ts +0 -126
  250. package/tests/integration/source-registry.test.ts +0 -120
  251. package/tests/integration/sqlite-fact-store.test.ts +0 -346
  252. package/tests/integration/stop-hook.test.ts +0 -560
  253. package/tests/integration/wal-checkpoint.test.ts +0 -49
  254. package/tests/unit/cli/launchctl-helpers.test.ts +0 -60
  255. package/tests/unit/core/adapters/aider.test.ts +0 -230
  256. package/tests/unit/core/adapters/claude-code.test.ts +0 -118
  257. package/tests/unit/core/adapters/hermes-agent.test.ts +0 -329
  258. package/tests/unit/core/adapters/hermes.test.ts +0 -81
  259. package/tests/unit/core/adapters/jsonl-generic.test.ts +0 -142
  260. package/tests/unit/core/adapters/opencode.test.ts +0 -354
  261. package/tests/unit/core/adapters/pi.test.ts +0 -110
  262. package/tests/unit/core/classifier/prompt.test.ts +0 -126
  263. package/tests/unit/core/embedding/chunk-body.test.ts +0 -100
  264. package/tests/unit/core/facts/extract-facts.test.ts +0 -117
  265. package/tests/unit/core/filter.test.ts +0 -40
  266. package/tests/unit/core/hook/citation-detect-cite-session.test.ts +0 -96
  267. package/tests/unit/core/hook/citation-detect.test.ts +0 -124
  268. package/tests/unit/core/hook/gate.test.ts +0 -29
  269. package/tests/unit/core/hook/pointer-block.test.ts +0 -22
  270. package/tests/unit/core/hook/select.test.ts +0 -66
  271. package/tests/unit/core/match-fields.test.ts +0 -39
  272. package/tests/unit/core/mcp-cite-session.test.ts +0 -51
  273. package/tests/unit/core/providers/provider-models.test.ts +0 -101
  274. package/tests/unit/core/query-shape.test.ts +0 -92
  275. package/tests/unit/core/recall-facts/fact-recall-service.test.ts +0 -258
  276. package/tests/unit/core/recall-service.test.ts +0 -200
  277. package/tests/unit/core/storage/live-status.test.ts +0 -54
  278. package/tests/unit/core/tokenize.test.ts +0 -32
  279. package/tests/unit/core/useful-scan.test.ts +0 -537
  280. package/tests/unit/llm/embed.test.ts +0 -93
  281. package/tests/unit/llm/ollama-client.test.ts +0 -124
  282. package/tests/unit/scripts/longmemeval-scorer.test.ts +0 -114
  283. package/tsconfig.json +0 -31
  284. package/tsconfig.test.json +0 -11
  285. package/vitest.config.ts +0 -22
package/src/mcp/server.ts DELETED
@@ -1,534 +0,0 @@
1
- /**
2
- * MCP adapter. Binds the `recall_sessions` and `get_session` tools directly
3
- * to RecallService and SessionStore — no HTTP hop, no localhost loopback.
4
- *
5
- * The Python daemon's MCP server proxied through HTTP. This server runs in
6
- * the same process as the rest of nlm-memory, so a tool call is a function
7
- * call. Lower latency, simpler stack traces, one fewer thing to keep alive.
8
- *
9
- * Layering: this module knows about the inner ring (RecallService,
10
- * SessionStore); core/ does not know this module exists.
11
- */
12
-
13
- import { McpServer } from "@modelcontextprotocol/sdk/server/mcp.js";
14
- import { encode as toonEncode } from "@toon-format/toon";
15
- import { z } from "zod";
16
- import { logQuery } from "@core/recall/query-log.js";
17
- import { logFactQuery } from "@core/recall-facts/fact-query-log.js";
18
- import { appendCitation } from "@core/recall/citation-log.js";
19
- import type { FactRecallService } from "@core/recall-facts/fact-recall-service.js";
20
- import type { RecallService } from "@core/recall/recall-service.js";
21
- import type { FactStore } from "@ports/fact-store.js";
22
- import type { SessionStore } from "@ports/session-store.js";
23
- import type {
24
- FactKind,
25
- FactRecallQuery,
26
- RecallKindFilter,
27
- RecallMode,
28
- RecallQuery,
29
- } from "@shared/types.js";
30
-
31
- const CHARACTER_LIMIT = 25_000;
32
- const DEFAULT_LIMIT = 10;
33
- const SERVER_NAME = "nlm-memory-mcp-server";
34
- const SERVER_VERSION = "0.4.0";
35
-
36
- /** TOON encoding cuts token usage on large recall payloads. Opt in via
37
- * NLM_FORMAT=toon in the MCP server's env (see .mcp.json). Defaults to JSON. */
38
- const USE_TOON = process.env.NLM_FORMAT === "toon";
39
-
40
- export interface McpDeps {
41
- readonly recall: RecallService;
42
- readonly store: SessionStore;
43
- /** Optional — when absent, fact tools are not registered. */
44
- readonly factRecall?: FactRecallService;
45
- readonly factStore?: FactStore;
46
- }
47
-
48
- export interface ToolResult {
49
- content: { type: "text"; text: string }[];
50
- isError?: boolean;
51
- }
52
-
53
- function format(data: unknown): string {
54
- if (USE_TOON) {
55
- try {
56
- return toonEncode(data);
57
- } catch {
58
- return JSON.stringify(data, null, 2);
59
- }
60
- }
61
- return JSON.stringify(data, null, 2);
62
- }
63
-
64
- function truncate(data: unknown): string {
65
- const str = format(data);
66
- if (str.length <= CHARACTER_LIMIT) return str;
67
- return format({
68
- truncated: true,
69
- truncation_message:
70
- "Response too large. Lower limit or fetch fewer fields via get_session.",
71
- });
72
- }
73
-
74
- function ok(data: unknown): ToolResult {
75
- return { content: [{ type: "text", text: truncate(data) }] };
76
- }
77
-
78
- function err(error: unknown): ToolResult {
79
- const message = error instanceof Error ? error.message : String(error);
80
- return {
81
- isError: true,
82
- content: [{ type: "text", text: `Error: ${message}` }],
83
- };
84
- }
85
-
86
- // Pure handler functions — exported so tests can exercise them without an
87
- // MCP transport. The McpServer wrapper below just registers these.
88
-
89
- export interface RecallToolInput {
90
- query: string | undefined;
91
- entity: string | undefined;
92
- kind: RecallKindFilter | undefined;
93
- mode: RecallMode | undefined;
94
- limit: number | undefined;
95
- }
96
-
97
- export async function recallSessionsHandler(
98
- deps: McpDeps,
99
- input: Partial<RecallToolInput>,
100
- ): Promise<ToolResult> {
101
- try {
102
- const query: RecallQuery = {
103
- query: input.query ?? "",
104
- mode: input.mode ?? "hybrid",
105
- limit: input.limit ?? DEFAULT_LIMIT,
106
- ...(input.entity !== undefined ? { entity: input.entity } : {}),
107
- ...(input.kind !== undefined ? { kind: input.kind } : {}),
108
- };
109
- const result = await deps.recall.search(query);
110
- // Telemetry — the MCP path is the real agent-usage path; without this it
111
- // is invisible to query_log.jsonl and the Recall page. Fire-and-forget,
112
- // mirrors the HTTP /api/recall handler.
113
- void logQuery({
114
- source: "mcp",
115
- query: input.query ?? null,
116
- entity: input.entity ?? null,
117
- kind: input.kind ?? null,
118
- mode: input.mode ?? "hybrid",
119
- limit: input.limit ?? DEFAULT_LIMIT,
120
- nResults: result.total,
121
- returnedIds: result.results.map((r) => r.id),
122
- });
123
- return ok(result);
124
- } catch (e) {
125
- return err(e);
126
- }
127
- }
128
-
129
- export async function getSessionHandler(
130
- deps: McpDeps,
131
- input: { id: string },
132
- ): Promise<ToolResult> {
133
- try {
134
- const session = await deps.store.getById(input.id);
135
- if (!session) {
136
- return err(new Error(`session ${input.id} not found`));
137
- }
138
- return ok(session);
139
- } catch (e) {
140
- return err(e);
141
- }
142
- }
143
-
144
- export interface RecallFactsInput {
145
- query: string | undefined;
146
- subject: string | undefined;
147
- predicate: string | undefined;
148
- kind: FactKind | undefined;
149
- mode: RecallMode | undefined;
150
- includeSuperseded: boolean | undefined;
151
- minConfidence: number | undefined;
152
- limit: number | undefined;
153
- }
154
-
155
- export async function recallFactsHandler(
156
- deps: McpDeps,
157
- input: Partial<RecallFactsInput>,
158
- ): Promise<ToolResult> {
159
- if (!deps.factRecall) {
160
- return err(new Error("fact recall not wired in this deployment"));
161
- }
162
- try {
163
- const query: FactRecallQuery = {
164
- query: input.query ?? "",
165
- mode: input.mode ?? "hybrid",
166
- limit: input.limit ?? DEFAULT_LIMIT,
167
- ...(input.subject !== undefined ? { subject: input.subject } : {}),
168
- ...(input.predicate !== undefined ? { predicate: input.predicate } : {}),
169
- ...(input.kind !== undefined ? { kind: input.kind } : {}),
170
- ...(input.includeSuperseded !== undefined
171
- ? { includeSuperseded: input.includeSuperseded }
172
- : {}),
173
- ...(input.minConfidence !== undefined
174
- ? { minConfidence: input.minConfidence }
175
- : {}),
176
- };
177
- const result = await deps.factRecall.search(query);
178
- // Telemetry — see recallSessionsHandler. Fire-and-forget.
179
- void logFactQuery({
180
- source: "mcp",
181
- query: input.query ?? null,
182
- subject: input.subject ?? null,
183
- predicate: input.predicate ?? null,
184
- kind: input.kind ?? null,
185
- mode: input.mode ?? "hybrid",
186
- limit: input.limit ?? DEFAULT_LIMIT,
187
- nResults: result.total,
188
- returnedIds: result.results.map((r) => r.id),
189
- });
190
- return ok(result);
191
- } catch (e) {
192
- return err(e);
193
- }
194
- }
195
-
196
- export async function getFactHistoryHandler(
197
- deps: McpDeps,
198
- input: { subject: string; predicate: string | undefined },
199
- ): Promise<ToolResult> {
200
- if (!deps.factStore) {
201
- return err(new Error("fact store not wired in this deployment"));
202
- }
203
- try {
204
- const chains = await deps.factStore.getHistory(input.subject, input.predicate);
205
- return ok({ subject: input.subject, predicate: input.predicate ?? null, chains });
206
- } catch (e) {
207
- return err(e);
208
- }
209
- }
210
-
211
- const CITE_SESSION_DESCRIPTION = `Log that you used a previously-surfaced session in your response. Pass the session ID. This lets NLM learn which surfaced sessions are actually useful, training a per-operator reranker over time. Call after writing your response, with one cite per surfaced session you actually drew from.`;
212
-
213
- const RECALL_DESCRIPTION = `Search prior AI sessions across every runtime the user has connected (Claude Code,
214
- Hermes, pi, Codex, Gemini, Aider). Local-first, fast (~200-400ms warm), idempotent,
215
- safe to call eagerly. No rate limit; no cost per call.
216
-
217
- CALL THIS FIRST — before answering — whenever the user prompt contains any of:
218
-
219
- Decision / position questions
220
- "what did we decide about X" · "did we figure out X" · "what's our take on X"
221
- "have we tried X" · "where did we land on X" · "what was the conclusion"
222
-
223
- Status / open-thread questions
224
- "what's still open on X" · "where did we leave X" · "what's blocked on X"
225
- "what's the state of X" · "is X done"
226
-
227
- History / continuity questions
228
- "have I worked on X" · "when did we last X" · "did we already do X"
229
- "have I talked to <person>" · "what's the history with X"
230
-
231
- Implicit references to prior context (the dangerous case — easy to miss)
232
- "that pgvector thing" · "the X discussion" · "our auth approach"
233
- "the one we built for <client>" · "the issue we hit last week"
234
-
235
- Not calling when the user references past work is the failure mode this tool exists
236
- to prevent: re-derivation of already-solved problems, contradicting prior decisions,
237
- re-litigating resolved open questions, ignoring the user's accumulated context.
238
-
239
- Returns ranked session digests (id, label, summary, entities, decisions, open
240
- questions). Call get_session for the full body when a digest looks relevant.
241
-
242
- Skip ONLY when the request is purely forward-looking with no plausible prior
243
- context — drafting wholly new content, naming something new, brainstorming
244
- greenfield ideas. When in doubt, call.
245
-
246
- When you reference a returned session in your response, call \`cite_session(id)\` to log it so the recall layer can learn what is useful.
247
-
248
- Args:
249
- - query: keyword(s) to search. Token-weighted match against label, decisions,
250
- open questions, and summary. Optional if entity or kind is provided.
251
- - entity: filter to sessions tagged with this entity. Optional.
252
- - kind: "decision" or "open" — restrict to sessions containing that marker
253
- kind. Omit for any. Optional.
254
- - mode: "hybrid" (default — keyword BM25 + semantic embeddings), "keyword", or
255
- "semantic". Optional.
256
- - limit: max results (1-100, default 10).`;
257
-
258
- const GET_SESSION_DESCRIPTION = `Fetch one full session by its canonical ID, including the conversational body.
259
-
260
- Call this AFTER recall_sessions when a returned digest looks relevant and the
261
- summary alone isn't enough to answer — e.g. you need the exact wording of a
262
- decision, the full reasoning behind a pivot, the specific commands that were
263
- run, or any quote you intend to reference verbatim.
264
-
265
- The recall_sessions digest is optimized for ranking and scanning; the full body
266
- contains the actual conversation transcript that produced the decision.
267
-
268
- Args:
269
- - id: Canonical session ID returned by recall_sessions (e.g. "cc_abc123",
270
- "sess_pgvector"). Pass the id field from the recall_sessions result.`;
271
-
272
- const RECALL_FACTS_DESCRIPTION = `Look up specific (subject, predicate, value) facts the user has established in
273
- prior sessions — model aliases, framework choices, endpoints, ports, hosts,
274
- deadlines, pricing, owners, dependencies, etc.
275
-
276
- CALL THIS when the user asks for a concrete value rather than a prose summary:
277
-
278
- "what port is X on" · "what model does Y use" · "what's the endpoint for Z"
279
- "what framework did we pick for X" · "who owns the X project"
280
- "when's the X deadline" · "what did we set X to" · "where does X live"
281
- "what version of X are we on" · "what's our X account"
282
-
283
- Prefer this over recall_sessions when the user wants the *answer*, not the
284
- *conversation* — facts return the exact value with provenance (source session
285
- + source quote), no scanning required. recall_sessions is the right tool when
286
- the user wants context, reasoning, or the full discussion.
287
-
288
- Returns matching Fact records ordered by recency. Superseded facts are excluded
289
- by default; call get_fact_history to walk the chain of how a value evolved
290
- ("when did X flip from Fastify to Hono?").
291
-
292
- Examples:
293
- recall_facts(subject="mac-pro-llm-host", predicate="model")
294
- → the model alias currently exposed on the Mac Pro LLM endpoint
295
- recall_facts(subject="nlm-memory-ts", predicate="framework")
296
- → the web framework picked for nlm-memory-ts
297
- recall_facts(subject="goat-home-services")
298
- → all known facts about the GOAT engagement
299
- recall_facts(query="routing", kind="decision")
300
- → recent decision-kind facts mentioning routing
301
-
302
- Args:
303
- - query: free-text search against fact values. Optional if subject /
304
- predicate / kind is set.
305
- - subject: exact-match normalized (lowercase-kebab) entity or topic name.
306
- - predicate: exact-match predicate from the closed vocabulary (framework,
307
- endpoint, model, port, host, owner, pricing, cost, deadline,
308
- status, stack, runtime, library, version, dependency, schema,
309
- integration, deployment, repo, branch, commit, description,
310
- decided-on, assumption, blocker).
311
- - kind: "decision" | "open" | "attribute". Optional.
312
- - mode: "hybrid" (default — keyword BM25 + semantic embeddings), "keyword",
313
- or "semantic".
314
- - includeSuperseded: true to include outdated facts. Default false.
315
- - minConfidence: lower bound on classifier confidence. Default 0.6.
316
- - limit: max results (1-100, default 10).`;
317
-
318
- const GET_FACT_HISTORY_DESCRIPTION = `Walk the supersedence chain for a (subject, predicate) pair to see how a value
319
- changed over time. Call this when the user asks about evolution, history of a
320
- choice, or wants to understand a prior decision that's since changed:
321
-
322
- "when did we switch from X to Y" · "what did we use before X"
323
- "wasn't X different a month ago" · "history of <X choice>"
324
- "why did we change from X to Y"
325
-
326
- This is the editable-timeline feature: NLM preserves rejected/replaced decisions
327
- as superseded entries rather than deleting them, so the reasoning trail survives.
328
-
329
- Returns chains ordered newest → oldest. The head is the current value; subsequent
330
- entries are predecessors, each linked forward via supersededBy.
331
-
332
- Args:
333
- - subject: normalized (lowercase-kebab) entity or topic name.
334
- - predicate: optional — narrow to a single (subject, predicate) chain. When
335
- omitted, returns one chain per predicate for this subject.`;
336
-
337
- // Minimum length for a session ID to be treated as valid.
338
- const MIN_CITE_ID_LEN = 6;
339
-
340
- export interface CiteSessionInput {
341
- readonly id: string;
342
- readonly conversation_id?: string | undefined;
343
- readonly reason?: string | undefined;
344
- }
345
-
346
- export async function citeSessionHandler(
347
- input: CiteSessionInput,
348
- ): Promise<ToolResult> {
349
- if (!input.id || input.id.length < MIN_CITE_ID_LEN) {
350
- return err(new Error(`id must be at least ${MIN_CITE_ID_LEN} characters`));
351
- }
352
- try {
353
- await appendCitation({
354
- conversationId: input.conversation_id ?? "mcp_tool",
355
- citedId: input.id,
356
- kind: "tool_use",
357
- ...(input.reason !== undefined ? { responsePreview: input.reason } : {}),
358
- });
359
- return ok({ logged: true, id: input.id });
360
- } catch (e) {
361
- return err(e);
362
- }
363
- }
364
-
365
/**
 * Builds the MCP server and registers the NLM tools on it.
 *
 * Always registered, in this order: `recall_sessions`, `get_session`, and
 * (last) `cite_session`. The fact tools `recall_facts` and `get_fact_history`
 * are registered between them only when both `deps.factRecall` and
 * `deps.factStore` are present.
 *
 * @param deps - Dependencies handed through to the individual tool handlers.
 * @returns The configured server instance.
 */
export function createMcpServer(deps: McpDeps): McpServer {
  // Fresh objects/schemas are produced per tool so no instance is shared between registrations.
  const readOnlyAnnotations = () => ({
    readOnlyHint: true,
    destructiveHint: false,
    idempotentHint: true,
    openWorldHint: true,
  });

  const optionalText = (description: string) =>
    z.string().optional().describe(description);

  const searchModeSchema = () =>
    z
      .enum(["keyword", "semantic", "hybrid"])
      .optional()
      .describe("Search mode. Defaults to hybrid (keyword BM25 + semantic embeddings).");

  const resultLimitSchema = () =>
    z
      .number()
      .int()
      .min(1)
      .max(100)
      .default(DEFAULT_LIMIT)
      .describe("Max results to return.");

  const server = new McpServer({ name: SERVER_NAME, version: SERVER_VERSION });

  // --- Session tools -------------------------------------------------------
  server.registerTool(
    "recall_sessions",
    {
      title: "Recall Sessions from NLM",
      description: RECALL_DESCRIPTION,
      inputSchema: {
        query: z
          .string()
          .default("")
          .describe("Keyword(s) to search. Optional if entity or kind is set."),
        entity: optionalText("Filter to sessions tagged with this entity name."),
        kind: z
          .enum(["decision", "open"])
          .optional()
          .describe("Filter to sessions with a decision or open marker."),
        mode: searchModeSchema(),
        limit: resultLimitSchema(),
      },
      annotations: readOnlyAnnotations(),
    },
    async (args) => recallSessionsHandler(deps, args) as never,
  );

  server.registerTool(
    "get_session",
    {
      title: "Get Full NLM Session",
      description: GET_SESSION_DESCRIPTION,
      inputSchema: {
        id: z.string().min(1).describe("Canonical session ID."),
      },
      annotations: readOnlyAnnotations(),
    },
    async (args) => getSessionHandler(deps, args) as never,
  );

  // --- Fact tools (only when the fact subsystem is wired in) ---------------
  if (deps.factRecall && deps.factStore) {
    server.registerTool(
      "recall_facts",
      {
        title: "Recall Facts from NLM",
        description: RECALL_FACTS_DESCRIPTION,
        inputSchema: {
          query: z
            .string()
            .default("")
            .describe("Free-text search against fact values. Optional if subject/predicate/kind set."),
          subject: optionalText("Exact-match normalized entity/topic (lowercase-kebab)."),
          predicate: optionalText("Exact-match predicate from the closed vocabulary."),
          kind: z
            .enum(["decision", "open", "attribute"])
            .optional()
            .describe("Filter to a single fact kind."),
          mode: searchModeSchema(),
          includeSuperseded: z
            .boolean()
            .optional()
            .describe("Include outdated facts. Default false."),
          minConfidence: z
            .number()
            .min(0)
            .max(1)
            .optional()
            .describe("Lower bound on classifier confidence. Default 0.6."),
          limit: resultLimitSchema(),
        },
        annotations: readOnlyAnnotations(),
      },
      async (args) => recallFactsHandler(deps, args) as never,
    );

    server.registerTool(
      "get_fact_history",
      {
        title: "Get Fact Supersedence History",
        description: GET_FACT_HISTORY_DESCRIPTION,
        inputSchema: {
          subject: z.string().min(1).describe("Normalized entity/topic name."),
          predicate: optionalText("Narrow to one (subject, predicate) chain."),
        },
        annotations: readOnlyAnnotations(),
      },
      async (args) => getFactHistoryHandler(deps, args) as never,
    );
  }

  // --- Citation tool: the only registration that is not marked read-only ---
  server.registerTool(
    "cite_session",
    {
      title: "Cite NLM Session",
      description: CITE_SESSION_DESCRIPTION,
      inputSchema: {
        id: z
          .string()
          .min(MIN_CITE_ID_LEN)
          .describe("Session ID returned by recall_sessions that you referenced in your response."),
        conversation_id: optionalText(
          "Current conversation ID. Optional — NLM infers from context when absent.",
        ),
        reason: optionalText(
          "Why this session was useful. Optional but encouraged — articulating the reason is a weak training signal.",
        ),
      },
      annotations: {
        readOnlyHint: false,
        destructiveHint: false,
        idempotentHint: false,
        openWorldHint: false,
      },
    },
    async (args) => citeSessionHandler(args) as never,
  );

  return server;
}
@@ -1,102 +0,0 @@
1
- /**
2
- * FactStore — the only way core/ reads or writes the fact corpus.
3
- *
4
- * Companion to SessionStore. Sessions are the operator-recall unit; facts are
5
- * the agent-recall projection — normalized (subject, predicate, value) triples
6
- * derived from sessions, supersedence-aware. See
7
- * docs/plans/factstore-design.md.
8
- *
9
- * Phase B.1 ships the storage port + adapter only. No extraction wired yet
10
- * (B.2), no recall service (B.3), no MCP surface (B.3), no supersedence
11
- * autodetect (B.4). The surface here is the minimum needed by future phases:
12
- * insert one or many, look up by id, look up current (non-superseded) facts
13
- * by subject and optional predicate, mark a fact superseded.
14
- */
15
-
16
- import type { Fact, FactHistoryChain, FactKind } from "@shared/types.js";
17
-
18
/**
 * Query accepted by `FactStore.list`.
 */
export interface FactQuery {
  /** Subject whose facts are listed (the only required field). */
  readonly subject: string;

  /** Optional predicate to narrow the listing. */
  readonly predicate?: string;

  /** When omitted, `FactStore.list` returns current (non-superseded) facts only. */
  readonly includeSuperseded?: boolean;

  /** Maximum number of facts; `FactStore.list` documents a default of 50. */
  readonly limit?: number;
}
24
-
25
/**
 * One hit returned by `FactStore.semanticSearch`.
 */
export interface FactSemanticNeighbor {
  /** Id of the neighbouring fact. */
  readonly factId: string;

  /** Distance from the query vector (L2, per the `semanticSearch` contract). */
  readonly distance: number;
}
29
-
30
/**
 * Storage-layer pre-filter for `FactStore.listForRecall`; it is applied
 * before keyword scoring runs. Every field is optional.
 */
export interface FactListFilter {
  /** Restrict to a single subject. */
  readonly subject?: string;

  /** Restrict to a single predicate. */
  readonly predicate?: string;

  /** Restrict to a single fact kind. */
  readonly kind?: FactKind;

  /** Whether superseded facts are included in the result. */
  readonly includeSuperseded?: boolean;

  /** Confidence filter — presumably a lower bound; confirm against the adapter. */
  readonly minConfidence?: number;

  /** Maximum number of facts to return. */
  readonly limit?: number;
}
39
-
40
/**
 * Storage port for the fact corpus: inserts, lookups, supersedence marking,
 * recall pre-filtering, vector search, and history inspection.
 */
export interface FactStore {
  /** Inserts one fact atomically. A duplicate id makes the call throw. */
  insert(fact: Fact): Promise<void>;

  /** Inserts a batch inside a single transaction. Throws if any id is a duplicate. */
  insertMany(facts: readonly Fact[]): Promise<void>;

  /** Looks a fact up by id; resolves to `null` rather than a fact when there is no result. */
  getById(id: string): Promise<Fact | null>;

  /**
   * Exact-match fetch of the current (non-superseded) fact for one
   * subject + predicate pair, or `null` when there is none. Described as the
   * hot path for deterministic supersedence during ingest (Phase B.4).
   */
  findCurrent(subject: string, predicate: string): Promise<Fact | null>;

  /**
   * Lists facts matching `query`, newest first (`created_at` descending).
   * By default only current (non-superseded) facts are returned, capped at 50.
   */
  list(query: FactQuery): Promise<readonly Fact[]>;

  /**
   * Lists every fact attributable to one session. Consumers: the UI's
   * fact-count badge on a session digest, and tests.
   */
  listBySession(sessionId: string): Promise<readonly Fact[]>;

  /**
   * Marks `oldId` as superseded by `newId`; both facts must exist. Passing
   * `null` for `newId` reverses the marking (Phase C operator-undo affordance).
   */
  markSuperseded(oldId: string, newId: string | null): Promise<void>;

  /**
   * Pre-filtered listing for FactRecallService. Subject, predicate, kind,
   * confidence, and superseded filters are applied at the SQL layer, before
   * keyword scoring happens in core. The only ordering promised is
   * `created_at DESC`.
   */
  listForRecall(filter: FactListFilter): Promise<readonly Fact[]>;

  /**
   * sqlite-vec KNN search over fact_embeddings. Yields at most `limit`
   * nearest neighbours measured by L2 distance; converting to cosine and
   * blending with keyword scores is left to the calling service.
   */
  semanticSearch(
    queryVector: Float32Array,
    limit: number,
  ): Promise<readonly FactSemanticNeighbor[]>;

  /**
   * Inspects supersedence chains for a subject. With `predicate`, the result
   * is a single chain (or an empty array when nothing matches); without it,
   * one chain per distinct predicate. Chains run newest → oldest by
   * `created_at`.
   */
  getHistory(
    subject: string,
    predicate?: string,
  ): Promise<readonly FactHistoryChain[]>;
}
@@ -1,52 +0,0 @@
1
- /**
2
- * LLMClient — outbound LLM calls (embedding + classification).
3
- *
4
- * Implementations: OllamaClient (default, local), AnthropicClient, OpenAIClient.
5
- * core/ only sees this interface; it never imports an HTTP client.
6
- */
7
-
8
/**
 * Outcome of a single `LLMClient.embed` call.
 */
export interface EmbedResult {
  /** The embedding itself. */
  readonly vector: Float32Array;

  /** Model identifier reported alongside the vector. */
  readonly model: string;
}
12
-
13
/** Tells `LLMClient.embed` whether the text is a search query or a document. */
export type EmbeddingKind =
  | "query"
  | "document";
14
-
15
/**
 * A fact exactly as the classifier emitted it.
 *
 * It carries no id, source_session_id, or created_at — extractFacts() adds
 * those at ingest time.
 *
 * Per the prompt contract the classifier already returns `subject` and
 * `predicate` normalized (lowercased, trimmed). The coercer normalizes them
 * again anyway, because LLM output cannot be trusted.
 */
export interface ExtractedFact {
  /** Category of the fact. */
  readonly kind: "decision" | "open" | "attribute";

  /** Entity or topic the fact is about. */
  readonly subject: string;

  /** Relation between the subject and the value. */
  readonly predicate: string;

  /** The asserted value. */
  readonly value: string;

  /** Optional quote — presumably the supporting transcript excerpt; confirm with the classifier prompt. */
  readonly sourceQuote?: string;
}
30
-
31
/**
 * Structured output of `LLMClient.classify` for one transcript.
 */
export interface ClassifyResult {
  /** Short label for the transcript. */
  readonly label: string;

  /** Summary text. */
  readonly summary: string;

  /** Entity names found in the transcript. */
  readonly entities: readonly string[];

  /** Decision strings. */
  readonly decisions: readonly string[];

  /** Open-item strings. */
  readonly open: readonly string[];

  /** Classifier confidence — range not visible here; presumably 0..1, confirm with the implementations. */
  readonly confidence: number;

  /** Raw facts extracted alongside the summary. */
  readonly facts: readonly ExtractedFact[];
}
40
-
41
/**
 * Raised when an LLM provider cannot be reached.
 *
 * The message is always `LLM unreachable: <provider>` and `name` is set to
 * "LLMUnreachableError" so the error can be recognised after serialization.
 */
export class LLMUnreachableError extends Error {
  /**
   * @param provider - Provider name, embedded verbatim in the message.
   * @param cause - Optional underlying failure, exposed as `cause`.
   */
  constructor(provider: string, cause?: unknown) {
    super(`LLM unreachable: ${provider}`);
    this.name = "LLMUnreachableError";
    // Attach `cause` only when one was supplied. Assigning unconditionally
    // leaves an own enumerable `cause: undefined` on every cause-less error,
    // which pollutes inspected/serialized output and makes `"cause" in err`
    // true even though there is nothing to report.
    if (cause !== undefined) {
      this.cause = cause;
    }
  }
}
48
-
49
/**
 * Port for outbound LLM calls: embedding and transcript classification.
 */
export interface LLMClient {
  /**
   * Embeds `text`.
   *
   * @param text - Text to embed.
   * @param kind - Whether the text is a query or a document.
   */
  embed(text: string, kind: EmbeddingKind): Promise<EmbedResult>;

  /**
   * Classifies a transcript.
   *
   * @param transcript - Transcript text to classify.
   */
  classify(transcript: string): Promise<ClassifyResult>;
}
@@ -1,16 +0,0 @@
1
- /**
2
- * StructuredLogger — sole logging seam for core/.
3
- *
4
- * Outer layers wire a concrete logger (console, pino, file-append). Tests
5
- * substitute a recording logger. core/ never calls console.log directly.
6
- */
7
-
8
/** Severity levels accepted by `StructuredLogger.log`. */
export type LogLevel =
  | "debug"
  | "info"
  | "warn"
  | "error";
9
-
10
/**
 * Flat bag of structured fields attached to a log entry. Values are limited
 * to primitives (string, number, boolean), `null`, or `undefined`.
 */
export interface LogFields {
  readonly [key: string]: string | number | boolean | null | undefined;
}
13
-
14
/**
 * Logging port: a single method that receives a level, a message, and
 * optional structured fields.
 */
export interface StructuredLogger {
  /**
   * Emits one log entry.
   *
   * @param level - Severity of the entry.
   * @param message - Human-readable message.
   * @param fields - Optional structured context.
   */
  log(level: LogLevel, message: string, fields?: LogFields): void;
}