nlm-memory 0.5.0 → 0.5.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (257)
  1. package/README.md +89 -34
  2. package/dist/cli/digest.d.ts +20 -0
  3. package/dist/cli/digest.js +142 -0
  4. package/dist/cli/digest.js.map +1 -0
  5. package/dist/cli/nlm.d.ts +1 -0
  6. package/dist/cli/nlm.js +25 -1
  7. package/dist/cli/nlm.js.map +1 -1
  8. package/dist/core/digest/compose.d.ts +38 -0
  9. package/dist/core/digest/compose.js +93 -0
  10. package/dist/core/digest/compose.js.map +1 -0
  11. package/dist/core/digest/hook-liveness.d.ts +32 -0
  12. package/dist/core/digest/hook-liveness.js +54 -0
  13. package/dist/core/digest/hook-liveness.js.map +1 -0
  14. package/dist/http/app.js +2 -1
  15. package/dist/http/app.js.map +1 -1
  16. package/dist/mcp/server.js +20 -1
  17. package/dist/mcp/server.js.map +1 -1
  18. package/dist/ui/assets/{index-C8cpwbYJ.css → index-Beo8psd-.css} +1 -1
  19. package/dist/ui/assets/{index-CB50QnL-.js → index-CSPTTeeM.js} +8 -8
  20. package/dist/ui/index.html +2 -2
  21. package/package.json +26 -1
  22. package/.agents/plugins/marketplace.json +0 -20
  23. package/.github/workflows/ci.yml +0 -30
  24. package/docs/methodology/re-derivation-rate.md +0 -112
  25. package/docs/methodology/useful-hit-rate.md +0 -79
  26. package/docs/plans/2026-05-20-fts5-lexical-recall.md +0 -1088
  27. package/docs/plans/2026-05-20-recall-daemon-wedge-fix.md +0 -662
  28. package/docs/plans/2026-05-20-recall-hook-design.md +0 -131
  29. package/docs/plans/2026-05-20-recall-hook-implementation.md +0 -1222
  30. package/docs/plans/desktop-product.md +0 -69
  31. package/docs/plans/factstore-design.md +0 -236
  32. package/logs/CHANGELOG/CHANGELOG-2026.md +0 -1575
  33. package/logs/CHANGELOG/CHANGELOG.md +0 -209
  34. package/migrations/000_initial_schema.sql +0 -174
  35. package/migrations/001_entity_type_rename.sql +0 -17
  36. package/migrations/002_adapter_state_extend.sql +0 -12
  37. package/migrations/003_session_embeddings.sql +0 -11
  38. package/migrations/004_facts.sql +0 -46
  39. package/migrations/005_sources.sql +0 -31
  40. package/migrations/006_providers.sql +0 -33
  41. package/migrations/007_source_tokens.sql +0 -17
  42. package/migrations/008_fts_rebuild.sql +0 -9
  43. package/migrations/009_session_embedding_chunks.sql +0 -46
  44. package/migrations/010_sources_opencode.sql +0 -30
  45. package/migrations/011_sources_hermes_agent.sql +0 -30
  46. package/migrations/012_sources_aider.sql +0 -30
  47. package/migrations/013_adapter_state_failure_count.sql +0 -12
  48. package/migrations/014_sources_cursor.sql +0 -30
  49. package/migrations/015_sources_windsurf.sql +0 -30
  50. package/plugin-hermes-agent/README.md +0 -49
  51. package/plugin-hermes-agent/__init__.py +0 -75
  52. package/plugin-hermes-agent/plugin.yaml +0 -15
  53. package/scripts/backfill-citations.mjs +0 -0
  54. package/scripts/build-codex-plugin.mjs +0 -61
  55. package/scripts/deepseek-probe.mjs +0 -67
  56. package/scripts/extract-triples.mjs +0 -207
  57. package/scripts/longmemeval/embedding-cache.ts +0 -77
  58. package/scripts/longmemeval/fetch-dataset.sh +0 -25
  59. package/scripts/longmemeval/run-harness.ts +0 -315
  60. package/scripts/longmemeval/scorer.ts +0 -99
  61. package/scripts/longmemeval/tsconfig.json +0 -9
  62. package/scripts/longmemeval/types.ts +0 -35
  63. package/scripts/nlm-daily-digest.py +0 -239
  64. package/scripts/nlm-daily-digest.sh +0 -28
  65. package/src/cli/classify-parity.ts +0 -257
  66. package/src/cli/launchctl-helpers.ts +0 -49
  67. package/src/cli/nlm.ts +0 -1078
  68. package/src/core/actions/actions-log.ts +0 -118
  69. package/src/core/actions/overlay.ts +0 -117
  70. package/src/core/adapters/aider.ts +0 -205
  71. package/src/core/adapters/claude-code.ts +0 -293
  72. package/src/core/adapters/common.ts +0 -54
  73. package/src/core/adapters/cursor.ts +0 -486
  74. package/src/core/adapters/from-source.ts +0 -67
  75. package/src/core/adapters/hermes-agent.ts +0 -240
  76. package/src/core/adapters/hermes.ts +0 -277
  77. package/src/core/adapters/jsonl-generic.ts +0 -208
  78. package/src/core/adapters/opencode.ts +0 -281
  79. package/src/core/adapters/pi.ts +0 -264
  80. package/src/core/adapters/windsurf.ts +0 -386
  81. package/src/core/classifier/prompt.ts +0 -200
  82. package/src/core/dataset/build-dataset.ts +0 -463
  83. package/src/core/embedding/chunk-body.ts +0 -76
  84. package/src/core/embedding/embed-backfill.ts +0 -210
  85. package/src/core/embedding/embed-normalize.ts +0 -135
  86. package/src/core/facts/backfill-facts.ts +0 -254
  87. package/src/core/facts/extract-facts.ts +0 -50
  88. package/src/core/hook/citation-detect.ts +0 -124
  89. package/src/core/hook/cite-memo.ts +0 -68
  90. package/src/core/hook/claude-settings.ts +0 -187
  91. package/src/core/hook/gate.ts +0 -25
  92. package/src/core/hook/hook-log.ts +0 -41
  93. package/src/core/hook/memo-sweep.ts +0 -164
  94. package/src/core/hook/memo.ts +0 -67
  95. package/src/core/hook/pointer-block.ts +0 -26
  96. package/src/core/hook/select.ts +0 -32
  97. package/src/core/hook/transcript.ts +0 -121
  98. package/src/core/ingest/ingest-session.ts +0 -111
  99. package/src/core/providers/provider-models.ts +0 -100
  100. package/src/core/providers/provider-registry.ts +0 -196
  101. package/src/core/recall/citation-log.ts +0 -108
  102. package/src/core/recall/filter.ts +0 -27
  103. package/src/core/recall/index.ts +0 -6
  104. package/src/core/recall/match-fields.ts +0 -40
  105. package/src/core/recall/query-log.ts +0 -149
  106. package/src/core/recall/query-shape.ts +0 -66
  107. package/src/core/recall/recall-service.ts +0 -320
  108. package/src/core/recall/recent-log.ts +0 -59
  109. package/src/core/recall/tokenize.ts +0 -18
  110. package/src/core/recall/useful-scan.ts +0 -336
  111. package/src/core/recall-facts/fact-query-log.ts +0 -150
  112. package/src/core/recall-facts/fact-recall-service.ts +0 -327
  113. package/src/core/scheduler/scan-once.ts +0 -142
  114. package/src/core/scheduler/scheduler.ts +0 -225
  115. package/src/core/sources/source-registry.ts +0 -278
  116. package/src/core/storage/db-restore.ts +0 -133
  117. package/src/core/storage/live-status.ts +0 -45
  118. package/src/core/storage/migrate.ts +0 -72
  119. package/src/core/storage/sqlite-fact-store.ts +0 -304
  120. package/src/core/storage/sqlite-session-store.ts +0 -810
  121. package/src/hook/hook-auth.ts +0 -18
  122. package/src/hook/prompt-recall-hook.ts +0 -180
  123. package/src/hook/session-end-hook.ts +0 -81
  124. package/src/hook/session-start-hook.ts +0 -168
  125. package/src/hook/stop-hook.ts +0 -239
  126. package/src/http/app.ts +0 -1215
  127. package/src/install/claude-code.ts +0 -128
  128. package/src/install/codex.ts +0 -367
  129. package/src/install/cursor.ts +0 -68
  130. package/src/install/hermes-agent.ts +0 -76
  131. package/src/install/hermes.ts +0 -78
  132. package/src/install/nlm-dir-perms.ts +0 -55
  133. package/src/install/ollama.ts +0 -284
  134. package/src/install/setup.ts +0 -489
  135. package/src/install/windsurf.ts +0 -68
  136. package/src/llm/classifier-box.ts +0 -64
  137. package/src/llm/deepseek-client.ts +0 -150
  138. package/src/llm/env-autoload.ts +0 -55
  139. package/src/llm/ollama-client.ts +0 -189
  140. package/src/mcp/server.ts +0 -534
  141. package/src/ports/fact-store.ts +0 -102
  142. package/src/ports/llm-client.ts +0 -52
  143. package/src/ports/logger.ts +0 -16
  144. package/src/ports/session-store.ts +0 -45
  145. package/src/ports/transcript-adapter.ts +0 -55
  146. package/src/shared/types.ts +0 -149
  147. package/src/ui/App.tsx +0 -58
  148. package/src/ui/components/PromoteOpenButton.tsx +0 -65
  149. package/src/ui/components/SessionDrawer.tsx +0 -199
  150. package/src/ui/components/SideNav.tsx +0 -162
  151. package/src/ui/components/Skeleton.tsx +0 -107
  152. package/src/ui/index.html +0 -13
  153. package/src/ui/lib/actions.ts +0 -30
  154. package/src/ui/lib/api.ts +0 -92
  155. package/src/ui/lib/dataset.ts +0 -141
  156. package/src/ui/lib/registries.ts +0 -155
  157. package/src/ui/lib/view-settings.ts +0 -41
  158. package/src/ui/main.tsx +0 -15
  159. package/src/ui/pages/Live.tsx +0 -229
  160. package/src/ui/pages/Pulse.tsx +0 -415
  161. package/src/ui/pages/Recall.tsx +0 -190
  162. package/src/ui/pages/River.tsx +0 -354
  163. package/src/ui/pages/Search.tsx +0 -386
  164. package/src/ui/pages/Stub.tsx +0 -9
  165. package/src/ui/pages/Thread.tsx +0 -473
  166. package/src/ui/pages/settings/Classifier.tsx +0 -227
  167. package/src/ui/pages/settings/Data.tsx +0 -190
  168. package/src/ui/pages/settings/Index.tsx +0 -65
  169. package/src/ui/pages/settings/Labels.tsx +0 -224
  170. package/src/ui/pages/settings/Providers.tsx +0 -305
  171. package/src/ui/pages/settings/SettingsSubnav.tsx +0 -28
  172. package/src/ui/pages/settings/Sources.tsx +0 -326
  173. package/src/ui/pages/settings/Views.tsx +0 -96
  174. package/src/ui/styles.css +0 -1890
  175. package/src/ui/tsconfig.json +0 -21
  176. package/src/ui/vite.config.ts +0 -19
  177. package/tests/fixtures/claude_code/short_session.jsonl +0 -2
  178. package/tests/fixtures/claude_code/standard_iso.jsonl +0 -4
  179. package/tests/fixtures/claude_code/tool_heavy.jsonl +0 -8
  180. package/tests/fixtures/claude_code/with_subagent.jsonl +0 -7
  181. package/tests/fixtures/facts.ts +0 -17
  182. package/tests/fixtures/golden-corpus.ts +0 -85
  183. package/tests/fixtures/hermes/paired_request_dump.json +0 -24
  184. package/tests/fixtures/hermes/paired_session.json +0 -23
  185. package/tests/fixtures/hermes/request_dump.json +0 -28
  186. package/tests/fixtures/hermes/session_iso.json +0 -38
  187. package/tests/fixtures/hermes/session_unix.json +0 -38
  188. package/tests/fixtures/hermes/system_only.json +0 -18
  189. package/tests/fixtures/pi/error-connection-abort.jsonl +0 -8
  190. package/tests/fixtures/pi/short-successful.jsonl +0 -5
  191. package/tests/fixtures/pi/with-custom-message.jsonl +0 -6
  192. package/tests/fixtures/sessions.ts +0 -22
  193. package/tests/integration/backfill-facts.test.ts +0 -362
  194. package/tests/integration/citation-explicit.test.ts +0 -111
  195. package/tests/integration/cite-event.test.ts +0 -169
  196. package/tests/integration/cite-memo.test.ts +0 -87
  197. package/tests/integration/db-restore.test.ts +0 -153
  198. package/tests/integration/embed-backfill.test.ts +0 -176
  199. package/tests/integration/fact-supersedence.test.ts +0 -313
  200. package/tests/integration/fts-index.test.ts +0 -60
  201. package/tests/integration/getbyids-sqlite.test.ts +0 -100
  202. package/tests/integration/hermes-agent-hooks.test.ts +0 -248
  203. package/tests/integration/hook-claude-settings.test.ts +0 -218
  204. package/tests/integration/hook-log.test.ts +0 -54
  205. package/tests/integration/hook-memo.test.ts +0 -68
  206. package/tests/integration/hook-pre-compact.test.ts +0 -105
  207. package/tests/integration/hook-subagent-start.test.ts +0 -102
  208. package/tests/integration/http.test.ts +0 -401
  209. package/tests/integration/keyword-search-fts.test.ts +0 -66
  210. package/tests/integration/mcp-recall-logging.test.ts +0 -88
  211. package/tests/integration/mcp.test.ts +0 -260
  212. package/tests/integration/memo-sweep.test.ts +0 -91
  213. package/tests/integration/prompt-recall-hook.test.ts +0 -88
  214. package/tests/integration/provider-registry.test.ts +0 -107
  215. package/tests/integration/recall-golden.test.ts +0 -59
  216. package/tests/integration/recall-sqlite.test.ts +0 -169
  217. package/tests/integration/scheduler.test.ts +0 -391
  218. package/tests/integration/session-end-hook.test.ts +0 -48
  219. package/tests/integration/session-start-hook.test.ts +0 -126
  220. package/tests/integration/source-registry.test.ts +0 -122
  221. package/tests/integration/sqlite-fact-store.test.ts +0 -346
  222. package/tests/integration/stop-hook.test.ts +0 -560
  223. package/tests/integration/wal-checkpoint.test.ts +0 -49
  224. package/tests/unit/cli/launchctl-helpers.test.ts +0 -60
  225. package/tests/unit/core/adapters/aider.test.ts +0 -230
  226. package/tests/unit/core/adapters/claude-code.test.ts +0 -118
  227. package/tests/unit/core/adapters/cursor.test.ts +0 -485
  228. package/tests/unit/core/adapters/hermes-agent.test.ts +0 -329
  229. package/tests/unit/core/adapters/hermes.test.ts +0 -81
  230. package/tests/unit/core/adapters/jsonl-generic.test.ts +0 -142
  231. package/tests/unit/core/adapters/opencode.test.ts +0 -354
  232. package/tests/unit/core/adapters/pi.test.ts +0 -110
  233. package/tests/unit/core/adapters/windsurf.test.ts +0 -416
  234. package/tests/unit/core/classifier/prompt.test.ts +0 -126
  235. package/tests/unit/core/embedding/chunk-body.test.ts +0 -100
  236. package/tests/unit/core/facts/extract-facts.test.ts +0 -117
  237. package/tests/unit/core/filter.test.ts +0 -40
  238. package/tests/unit/core/hook/citation-detect-cite-session.test.ts +0 -96
  239. package/tests/unit/core/hook/citation-detect.test.ts +0 -124
  240. package/tests/unit/core/hook/gate.test.ts +0 -29
  241. package/tests/unit/core/hook/pointer-block.test.ts +0 -22
  242. package/tests/unit/core/hook/select.test.ts +0 -66
  243. package/tests/unit/core/match-fields.test.ts +0 -39
  244. package/tests/unit/core/mcp-cite-session.test.ts +0 -51
  245. package/tests/unit/core/providers/provider-models.test.ts +0 -101
  246. package/tests/unit/core/query-shape.test.ts +0 -92
  247. package/tests/unit/core/recall-facts/fact-recall-service.test.ts +0 -258
  248. package/tests/unit/core/recall-service.test.ts +0 -200
  249. package/tests/unit/core/storage/live-status.test.ts +0 -54
  250. package/tests/unit/core/tokenize.test.ts +0 -32
  251. package/tests/unit/core/useful-scan.test.ts +0 -537
  252. package/tests/unit/llm/embed.test.ts +0 -93
  253. package/tests/unit/llm/ollama-client.test.ts +0 -124
  254. package/tests/unit/scripts/longmemeval-scorer.test.ts +0 -114
  255. package/tsconfig.json +0 -31
  256. package/tsconfig.test.json +0 -11
  257. package/vitest.config.ts +0 -22
package/src/mcp/server.ts DELETED
@@ -1,534 +0,0 @@
1
- /**
2
- * MCP adapter. Binds the `recall_sessions` and `get_session` tools directly
3
- * to RecallService and SessionStore — no HTTP hop, no localhost loopback.
4
- *
5
- * The Python daemon's MCP server proxied through HTTP. This server runs in
6
- * the same process as the rest of nlm-memory, so a tool call is a function
7
- * call. Lower latency, simpler stack traces, one fewer thing to keep alive.
8
- *
9
- * Layering: this module knows about the inner ring (RecallService,
10
- * SessionStore); core/ does not know this module exists.
11
- */
12
-
13
- import { McpServer } from "@modelcontextprotocol/sdk/server/mcp.js";
14
- import { encode as toonEncode } from "@toon-format/toon";
15
- import { z } from "zod";
16
- import { logQuery } from "@core/recall/query-log.js";
17
- import { logFactQuery } from "@core/recall-facts/fact-query-log.js";
18
- import { appendCitation } from "@core/recall/citation-log.js";
19
- import type { FactRecallService } from "@core/recall-facts/fact-recall-service.js";
20
- import type { RecallService } from "@core/recall/recall-service.js";
21
- import type { FactStore } from "@ports/fact-store.js";
22
- import type { SessionStore } from "@ports/session-store.js";
23
- import type {
24
- FactKind,
25
- FactRecallQuery,
26
- RecallKindFilter,
27
- RecallMode,
28
- RecallQuery,
29
- } from "@shared/types.js";
30
-
31
- const CHARACTER_LIMIT = 25_000;
32
- const DEFAULT_LIMIT = 10;
33
- const SERVER_NAME = "nlm-memory-mcp-server";
34
- const SERVER_VERSION = "0.4.0";
35
-
36
- /** TOON encoding cuts token usage on large recall payloads. Opt in via
37
- * NLM_FORMAT=toon in the MCP server's env (see .mcp.json). Defaults to JSON. */
38
- const USE_TOON = process.env.NLM_FORMAT === "toon";
39
-
40
- export interface McpDeps {
41
- readonly recall: RecallService;
42
- readonly store: SessionStore;
43
- /** Optional — when absent, fact tools are not registered. */
44
- readonly factRecall?: FactRecallService;
45
- readonly factStore?: FactStore;
46
- }
47
-
48
- export interface ToolResult {
49
- content: { type: "text"; text: string }[];
50
- isError?: boolean;
51
- }
52
-
53
- function format(data: unknown): string {
54
- if (USE_TOON) {
55
- try {
56
- return toonEncode(data);
57
- } catch {
58
- return JSON.stringify(data, null, 2);
59
- }
60
- }
61
- return JSON.stringify(data, null, 2);
62
- }
63
-
64
- function truncate(data: unknown): string {
65
- const str = format(data);
66
- if (str.length <= CHARACTER_LIMIT) return str;
67
- return format({
68
- truncated: true,
69
- truncation_message:
70
- "Response too large. Lower limit or fetch fewer fields via get_session.",
71
- });
72
- }
73
-
74
- function ok(data: unknown): ToolResult {
75
- return { content: [{ type: "text", text: truncate(data) }] };
76
- }
77
-
78
- function err(error: unknown): ToolResult {
79
- const message = error instanceof Error ? error.message : String(error);
80
- return {
81
- isError: true,
82
- content: [{ type: "text", text: `Error: ${message}` }],
83
- };
84
- }
85
-
86
- // Pure handler functions — exported so tests can exercise them without an
87
- // MCP transport. The McpServer wrapper below just registers these.
88
-
89
- export interface RecallToolInput {
90
- query: string | undefined;
91
- entity: string | undefined;
92
- kind: RecallKindFilter | undefined;
93
- mode: RecallMode | undefined;
94
- limit: number | undefined;
95
- }
96
-
97
- export async function recallSessionsHandler(
98
- deps: McpDeps,
99
- input: Partial<RecallToolInput>,
100
- ): Promise<ToolResult> {
101
- try {
102
- const query: RecallQuery = {
103
- query: input.query ?? "",
104
- mode: input.mode ?? "hybrid",
105
- limit: input.limit ?? DEFAULT_LIMIT,
106
- ...(input.entity !== undefined ? { entity: input.entity } : {}),
107
- ...(input.kind !== undefined ? { kind: input.kind } : {}),
108
- };
109
- const result = await deps.recall.search(query);
110
- // Telemetry — the MCP path is the real agent-usage path; without this it
111
- // is invisible to query_log.jsonl and the Recall page. Fire-and-forget,
112
- // mirrors the HTTP /api/recall handler.
113
- void logQuery({
114
- source: "mcp",
115
- query: input.query ?? null,
116
- entity: input.entity ?? null,
117
- kind: input.kind ?? null,
118
- mode: input.mode ?? "hybrid",
119
- limit: input.limit ?? DEFAULT_LIMIT,
120
- nResults: result.total,
121
- returnedIds: result.results.map((r) => r.id),
122
- });
123
- return ok(result);
124
- } catch (e) {
125
- return err(e);
126
- }
127
- }
128
-
129
- export async function getSessionHandler(
130
- deps: McpDeps,
131
- input: { id: string },
132
- ): Promise<ToolResult> {
133
- try {
134
- const session = await deps.store.getById(input.id);
135
- if (!session) {
136
- return err(new Error(`session ${input.id} not found`));
137
- }
138
- return ok(session);
139
- } catch (e) {
140
- return err(e);
141
- }
142
- }
143
-
144
- export interface RecallFactsInput {
145
- query: string | undefined;
146
- subject: string | undefined;
147
- predicate: string | undefined;
148
- kind: FactKind | undefined;
149
- mode: RecallMode | undefined;
150
- includeSuperseded: boolean | undefined;
151
- minConfidence: number | undefined;
152
- limit: number | undefined;
153
- }
154
-
155
- export async function recallFactsHandler(
156
- deps: McpDeps,
157
- input: Partial<RecallFactsInput>,
158
- ): Promise<ToolResult> {
159
- if (!deps.factRecall) {
160
- return err(new Error("fact recall not wired in this deployment"));
161
- }
162
- try {
163
- const query: FactRecallQuery = {
164
- query: input.query ?? "",
165
- mode: input.mode ?? "hybrid",
166
- limit: input.limit ?? DEFAULT_LIMIT,
167
- ...(input.subject !== undefined ? { subject: input.subject } : {}),
168
- ...(input.predicate !== undefined ? { predicate: input.predicate } : {}),
169
- ...(input.kind !== undefined ? { kind: input.kind } : {}),
170
- ...(input.includeSuperseded !== undefined
171
- ? { includeSuperseded: input.includeSuperseded }
172
- : {}),
173
- ...(input.minConfidence !== undefined
174
- ? { minConfidence: input.minConfidence }
175
- : {}),
176
- };
177
- const result = await deps.factRecall.search(query);
178
- // Telemetry — see recallSessionsHandler. Fire-and-forget.
179
- void logFactQuery({
180
- source: "mcp",
181
- query: input.query ?? null,
182
- subject: input.subject ?? null,
183
- predicate: input.predicate ?? null,
184
- kind: input.kind ?? null,
185
- mode: input.mode ?? "hybrid",
186
- limit: input.limit ?? DEFAULT_LIMIT,
187
- nResults: result.total,
188
- returnedIds: result.results.map((r) => r.id),
189
- });
190
- return ok(result);
191
- } catch (e) {
192
- return err(e);
193
- }
194
- }
195
-
196
- export async function getFactHistoryHandler(
197
- deps: McpDeps,
198
- input: { subject: string; predicate: string | undefined },
199
- ): Promise<ToolResult> {
200
- if (!deps.factStore) {
201
- return err(new Error("fact store not wired in this deployment"));
202
- }
203
- try {
204
- const chains = await deps.factStore.getHistory(input.subject, input.predicate);
205
- return ok({ subject: input.subject, predicate: input.predicate ?? null, chains });
206
- } catch (e) {
207
- return err(e);
208
- }
209
- }
210
-
211
- const CITE_SESSION_DESCRIPTION = `Log that you used a previously-surfaced session in your response. Pass the session ID. This lets NLM learn which surfaced sessions are actually useful, training a per-operator reranker over time. Call after writing your response, with one cite per surfaced session you actually drew from.`;
212
-
213
- const RECALL_DESCRIPTION = `Search prior AI sessions across every runtime the user has connected (Claude Code,
214
- Hermes, pi, Codex, Gemini, Aider). Local-first, fast (~200-400ms warm), idempotent,
215
- safe to call eagerly. No rate limit; no cost per call.
216
-
217
- CALL THIS FIRST — before answering — whenever the user prompt contains any of:
218
-
219
- Decision / position questions
220
- "what did we decide about X" · "did we figure out X" · "what's our take on X"
221
- "have we tried X" · "where did we land on X" · "what was the conclusion"
222
-
223
- Status / open-thread questions
224
- "what's still open on X" · "where did we leave X" · "what's blocked on X"
225
- "what's the state of X" · "is X done"
226
-
227
- History / continuity questions
228
- "have I worked on X" · "when did we last X" · "did we already do X"
229
- "have I talked to <person>" · "what's the history with X"
230
-
231
- Implicit references to prior context (the dangerous case — easy to miss)
232
- "that pgvector thing" · "the X discussion" · "our auth approach"
233
- "the one we built for <client>" · "the issue we hit last week"
234
-
235
- Not calling when the user references past work is the failure mode this tool exists
236
- to prevent: re-derivation of already-solved problems, contradicting prior decisions,
237
- re-litigating resolved open questions, ignoring the user's accumulated context.
238
-
239
- Returns ranked session digests (id, label, summary, entities, decisions, open
240
- questions). Call get_session for the full body when a digest looks relevant.
241
-
242
- Skip ONLY when the request is purely forward-looking with no plausible prior
243
- context — drafting wholly new content, naming something new, brainstorming
244
- greenfield ideas. When in doubt, call.
245
-
246
- When you reference a returned session in your response, call \`cite_session(id)\` to log it so the recall layer can learn what is useful.
247
-
248
- Args:
249
- - query: keyword(s) to search. Token-weighted match against label, decisions,
250
- open questions, and summary. Optional if entity or kind is provided.
251
- - entity: filter to sessions tagged with this entity. Optional.
252
- - kind: "decision" or "open" — restrict to sessions containing that marker
253
- kind. Omit for any. Optional.
254
- - mode: "hybrid" (default — keyword BM25 + semantic embeddings), "keyword", or
255
- "semantic". Optional.
256
- - limit: max results (1-100, default 10).`;
257
-
258
- const GET_SESSION_DESCRIPTION = `Fetch one full session by its canonical ID, including the conversational body.
259
-
260
- Call this AFTER recall_sessions when a returned digest looks relevant and the
261
- summary alone isn't enough to answer — e.g. you need the exact wording of a
262
- decision, the full reasoning behind a pivot, the specific commands that were
263
- run, or any quote you intend to reference verbatim.
264
-
265
- The recall_sessions digest is optimized for ranking and scanning; the full body
266
- contains the actual conversation transcript that produced the decision.
267
-
268
- Args:
269
- - id: Canonical session ID returned by recall_sessions (e.g. "cc_abc123",
270
- "sess_pgvector"). Pass the id field from the recall_sessions result.`;
271
-
272
- const RECALL_FACTS_DESCRIPTION = `Look up specific (subject, predicate, value) facts the user has established in
273
- prior sessions — model aliases, framework choices, endpoints, ports, hosts,
274
- deadlines, pricing, owners, dependencies, etc.
275
-
276
- CALL THIS when the user asks for a concrete value rather than a prose summary:
277
-
278
- "what port is X on" · "what model does Y use" · "what's the endpoint for Z"
279
- "what framework did we pick for X" · "who owns the X project"
280
- "when's the X deadline" · "what did we set X to" · "where does X live"
281
- "what version of X are we on" · "what's our X account"
282
-
283
- Prefer this over recall_sessions when the user wants the *answer*, not the
284
- *conversation* — facts return the exact value with provenance (source session
285
- + source quote), no scanning required. recall_sessions is the right tool when
286
- the user wants context, reasoning, or the full discussion.
287
-
288
- Returns matching Fact records ordered by recency. Superseded facts are excluded
289
- by default; call get_fact_history to walk the chain of how a value evolved
290
- ("when did X flip from Fastify to Hono?").
291
-
292
- Examples:
293
- recall_facts(subject="mac-pro-llm-host", predicate="model")
294
- → the model alias currently exposed on the Mac Pro LLM endpoint
295
- recall_facts(subject="nlm-memory-ts", predicate="framework")
296
- → the web framework picked for nlm-memory-ts
297
- recall_facts(subject="goat-home-services")
298
- → all known facts about the GOAT engagement
299
- recall_facts(query="routing", kind="decision")
300
- → recent decision-kind facts mentioning routing
301
-
302
- Args:
303
- - query: free-text search against fact values. Optional if subject /
304
- predicate / kind is set.
305
- - subject: exact-match normalized (lowercase-kebab) entity or topic name.
306
- - predicate: exact-match predicate from the closed vocabulary (framework,
307
- endpoint, model, port, host, owner, pricing, cost, deadline,
308
- status, stack, runtime, library, version, dependency, schema,
309
- integration, deployment, repo, branch, commit, description,
310
- decided-on, assumption, blocker).
311
- - kind: "decision" | "open" | "attribute". Optional.
312
- - mode: "hybrid" (default — keyword BM25 + semantic embeddings), "keyword",
313
- or "semantic".
314
- - includeSuperseded: true to include outdated facts. Default false.
315
- - minConfidence: lower bound on classifier confidence. Default 0.6.
316
- - limit: max results (1-100, default 10).`;
317
-
318
- const GET_FACT_HISTORY_DESCRIPTION = `Walk the supersedence chain for a (subject, predicate) pair to see how a value
319
- changed over time. Call this when the user asks about evolution, history of a
320
- choice, or wants to understand a prior decision that's since changed:
321
-
322
- "when did we switch from X to Y" · "what did we use before X"
323
- "wasn't X different a month ago" · "history of <X choice>"
324
- "why did we change from X to Y"
325
-
326
- This is the editable-timeline feature: NLM preserves rejected/replaced decisions
327
- as superseded entries rather than deleting them, so the reasoning trail survives.
328
-
329
- Returns chains ordered newest → oldest. The head is the current value; subsequent
330
- entries are predecessors, each linked forward via supersededBy.
331
-
332
- Args:
333
- - subject: normalized (lowercase-kebab) entity or topic name.
334
- - predicate: optional — narrow to a single (subject, predicate) chain. When
335
- omitted, returns one chain per predicate for this subject.`;
336
-
337
- // Minimum length for a session ID to be treated as valid.
338
- const MIN_CITE_ID_LEN = 6;
339
-
340
- export interface CiteSessionInput {
341
- readonly id: string;
342
- readonly conversation_id?: string | undefined;
343
- readonly reason?: string | undefined;
344
- }
345
-
346
- export async function citeSessionHandler(
347
- input: CiteSessionInput,
348
- ): Promise<ToolResult> {
349
- if (!input.id || input.id.length < MIN_CITE_ID_LEN) {
350
- return err(new Error(`id must be at least ${MIN_CITE_ID_LEN} characters`));
351
- }
352
- try {
353
- await appendCitation({
354
- conversationId: input.conversation_id ?? "mcp_tool",
355
- citedId: input.id,
356
- kind: "tool_use",
357
- ...(input.reason !== undefined ? { responsePreview: input.reason } : {}),
358
- });
359
- return ok({ logged: true, id: input.id });
360
- } catch (e) {
361
- return err(e);
362
- }
363
- }
364
-
365
- export function createMcpServer(deps: McpDeps): McpServer {
366
- const server = new McpServer({
367
- name: SERVER_NAME,
368
- version: SERVER_VERSION,
369
- });
370
-
371
- server.registerTool(
372
- "recall_sessions",
373
- {
374
- title: "Recall Sessions from NLM",
375
- description: RECALL_DESCRIPTION,
376
- inputSchema: {
377
- query: z
378
- .string()
379
- .default("")
380
- .describe("Keyword(s) to search. Optional if entity or kind is set."),
381
- entity: z
382
- .string()
383
- .optional()
384
- .describe("Filter to sessions tagged with this entity name."),
385
- kind: z
386
- .enum(["decision", "open"])
387
- .optional()
388
- .describe("Filter to sessions with a decision or open marker."),
389
- mode: z
390
- .enum(["keyword", "semantic", "hybrid"])
391
- .optional()
392
- .describe("Search mode. Defaults to hybrid (keyword BM25 + semantic embeddings)."),
393
- limit: z
394
- .number()
395
- .int()
396
- .min(1)
397
- .max(100)
398
- .default(DEFAULT_LIMIT)
399
- .describe("Max results to return."),
400
- },
401
- annotations: {
402
- readOnlyHint: true,
403
- destructiveHint: false,
404
- idempotentHint: true,
405
- openWorldHint: true,
406
- },
407
- },
408
- async (args) => recallSessionsHandler(deps, args) as never,
409
- );
410
-
411
- server.registerTool(
412
- "get_session",
413
- {
414
- title: "Get Full NLM Session",
415
- description: GET_SESSION_DESCRIPTION,
416
- inputSchema: {
417
- id: z.string().min(1).describe("Canonical session ID."),
418
- },
419
- annotations: {
420
- readOnlyHint: true,
421
- destructiveHint: false,
422
- idempotentHint: true,
423
- openWorldHint: true,
424
- },
425
- },
426
- async (args) => getSessionHandler(deps, args) as never,
427
- );
428
-
429
- if (deps.factRecall && deps.factStore) {
430
- server.registerTool(
431
- "recall_facts",
432
- {
433
- title: "Recall Facts from NLM",
434
- description: RECALL_FACTS_DESCRIPTION,
435
- inputSchema: {
436
- query: z
437
- .string()
438
- .default("")
439
- .describe("Free-text search against fact values. Optional if subject/predicate/kind set."),
440
- subject: z
441
- .string()
442
- .optional()
443
- .describe("Exact-match normalized entity/topic (lowercase-kebab)."),
444
- predicate: z
445
- .string()
446
- .optional()
447
- .describe("Exact-match predicate from the closed vocabulary."),
448
- kind: z
449
- .enum(["decision", "open", "attribute"])
450
- .optional()
451
- .describe("Filter to a single fact kind."),
452
- mode: z
453
- .enum(["keyword", "semantic", "hybrid"])
454
- .optional()
455
- .describe("Search mode. Defaults to hybrid (keyword BM25 + semantic embeddings)."),
456
- includeSuperseded: z
457
- .boolean()
458
- .optional()
459
- .describe("Include outdated facts. Default false."),
460
- minConfidence: z
461
- .number()
462
- .min(0)
463
- .max(1)
464
- .optional()
465
- .describe("Lower bound on classifier confidence. Default 0.6."),
466
- limit: z
467
- .number()
468
- .int()
469
- .min(1)
470
- .max(100)
471
- .default(DEFAULT_LIMIT)
472
- .describe("Max results to return."),
473
- },
474
- annotations: {
475
- readOnlyHint: true,
476
- destructiveHint: false,
477
- idempotentHint: true,
478
- openWorldHint: true,
479
- },
480
- },
481
- async (args) => recallFactsHandler(deps, args) as never,
482
- );
483
-
484
- server.registerTool(
485
- "get_fact_history",
486
- {
487
- title: "Get Fact Supersedence History",
488
- description: GET_FACT_HISTORY_DESCRIPTION,
489
- inputSchema: {
490
- subject: z.string().min(1).describe("Normalized entity/topic name."),
491
- predicate: z
492
- .string()
493
- .optional()
494
- .describe("Narrow to one (subject, predicate) chain."),
495
- },
496
- annotations: {
497
- readOnlyHint: true,
498
- destructiveHint: false,
499
- idempotentHint: true,
500
- openWorldHint: true,
501
- },
502
- },
503
- async (args) => getFactHistoryHandler(deps, args) as never,
504
- );
505
- }
506
-
507
- server.registerTool(
508
- "cite_session",
509
- {
510
- title: "Cite NLM Session",
511
- description: CITE_SESSION_DESCRIPTION,
512
- inputSchema: {
513
- id: z.string().min(MIN_CITE_ID_LEN).describe("Session ID returned by recall_sessions that you referenced in your response."),
514
- conversation_id: z
515
- .string()
516
- .optional()
517
- .describe("Current conversation ID. Optional — NLM infers from context when absent."),
518
- reason: z
519
- .string()
520
- .optional()
521
- .describe("Why this session was useful. Optional but encouraged — articulating the reason is a weak training signal."),
522
- },
523
- annotations: {
524
- readOnlyHint: false,
525
- destructiveHint: false,
526
- idempotentHint: false,
527
- openWorldHint: false,
528
- },
529
- },
530
- async (args) => citeSessionHandler(args) as never,
531
- );
532
-
533
- return server;
534
- }
@@ -1,102 +0,0 @@
1
- /**
2
- * FactStore — the only way core/ reads or writes the fact corpus.
3
- *
4
- * Companion to SessionStore. Sessions are the operator-recall unit; facts are
5
- * the agent-recall projection — normalized (subject, predicate, value) triples
6
- * derived from sessions, supersedence-aware. See
7
- * docs/plans/factstore-design.md.
8
- *
9
- * Phase B.1 ships the storage port + adapter only. No extraction wired yet
10
- * (B.2), no recall service (B.3), no MCP surface (B.3), no supersedence
11
- * autodetect (B.4). The surface here is the minimum needed by future phases:
12
- * insert one or many, look up by id, look up current (non-superseded) facts
13
- * by subject and optional predicate, mark a fact superseded.
14
- */
15
-
16
- import type { Fact, FactHistoryChain, FactKind } from "@shared/types.js";
17
-
18
- export interface FactQuery {
19
- readonly subject: string;
20
- readonly predicate?: string;
21
- readonly includeSuperseded?: boolean;
22
- readonly limit?: number;
23
- }
24
-
25
- export interface FactSemanticNeighbor {
26
- readonly factId: string;
27
- readonly distance: number;
28
- }
29
-
30
- /** Pre-filter applied at the storage layer before keyword scoring runs. */
31
- export interface FactListFilter {
32
- readonly subject?: string;
33
- readonly predicate?: string;
34
- readonly kind?: FactKind;
35
- readonly includeSuperseded?: boolean;
36
- readonly minConfidence?: number;
37
- readonly limit?: number;
38
- }
39
-
40
- export interface FactStore {
41
- /** Atomically insert a single fact. Throws on duplicate id. */
42
- insert(fact: Fact): Promise<void>;
43
-
44
- /** Atomically insert many facts as one transaction. Throws on any duplicate id. */
45
- insertMany(facts: ReadonlyArray<Fact>): Promise<void>;
46
-
47
- getById(id: string): Promise<Fact | null>;
48
-
49
- /**
50
- * Exact-match lookup of the current (non-superseded) fact for a
51
- * subject+predicate pair. Returns null if none exists. This is the hot
52
- * path for deterministic supersedence on ingest (Phase B.4).
53
- */
54
- findCurrent(subject: string, predicate: string): Promise<Fact | null>;
55
-
56
- /**
57
- * List facts matching the query. Defaults: current (non-superseded) only,
58
- * limit 50. Ordered by created_at descending.
59
- */
60
- list(query: FactQuery): Promise<ReadonlyArray<Fact>>;
61
-
62
- /**
63
- * List all facts attributable to a single session. Used by the UI to show
64
- * a fact-count badge on a session digest, and by tests.
65
- */
66
- listBySession(sessionId: string): Promise<ReadonlyArray<Fact>>;
67
-
68
- /**
69
- * Mark `oldId` as superseded by `newId`. Both facts must exist. Reversible
70
- * by passing null as newId (Phase C operator-undo affordance).
71
- */
72
- markSuperseded(oldId: string, newId: string | null): Promise<void>;
73
-
74
- /**
75
- * Pre-filtered fact list used by FactRecallService. Applies subject /
76
- * predicate / kind / confidence / superseded filters at the SQL layer
77
- * before keyword scoring runs in core. No ordering guarantee beyond
78
- * `created_at DESC`.
79
- */
80
- listForRecall(filter: FactListFilter): Promise<ReadonlyArray<Fact>>;
81
-
82
- /**
83
- * sqlite-vec KNN over fact_embeddings. Returns up to `limit` nearest
84
- * neighbors by L2 distance. The service converts distance to cosine and
85
- * blends with keyword scores.
86
- */
87
- semanticSearch(
88
- queryVector: Float32Array,
89
- limit: number,
90
- ): Promise<ReadonlyArray<FactSemanticNeighbor>>;
91
-
92
- /**
93
- * Supersedence chain inspection. When `predicate` is provided, returns a
94
- * single chain (or empty array if no facts match). When omitted, returns
95
- * one chain per distinct predicate for that subject. Each chain orders
96
- * newest → oldest by created_at.
97
- */
98
- getHistory(
99
- subject: string,
100
- predicate?: string,
101
- ): Promise<ReadonlyArray<FactHistoryChain>>;
102
- }
@@ -1,52 +0,0 @@
1
- /**
2
- * LLMClient — outbound LLM calls (embedding + classification).
3
- *
4
- * Implementations: OllamaClient (default, local), AnthropicClient, OpenAIClient.
5
- * core/ only sees this interface; it never imports an HTTP client.
6
- */
7
-
8
- export interface EmbedResult {
9
- readonly vector: Float32Array;
10
- readonly model: string;
11
- }
12
-
13
- export type EmbeddingKind = "query" | "document";
14
-
15
- /**
16
- * Raw fact extracted by the classifier. No id, no source_session_id, no
17
- * created_at yet — those get filled in at ingest time by extractFacts().
18
- *
19
- * `subject` and `predicate` come from the classifier already normalized
20
- * (lowercased, trimmed) per the prompt contract, but the coercer re-normalizes
21
- * defensively because LLM output is not trustworthy.
22
- */
23
- export interface ExtractedFact {
24
- readonly kind: "decision" | "open" | "attribute";
25
- readonly subject: string;
26
- readonly predicate: string;
27
- readonly value: string;
28
- readonly sourceQuote?: string;
29
- }
30
-
31
- export interface ClassifyResult {
32
- readonly label: string;
33
- readonly summary: string;
34
- readonly entities: ReadonlyArray<string>;
35
- readonly decisions: ReadonlyArray<string>;
36
- readonly open: ReadonlyArray<string>;
37
- readonly confidence: number;
38
- readonly facts: ReadonlyArray<ExtractedFact>;
39
- }
40
-
41
- export class LLMUnreachableError extends Error {
42
- constructor(provider: string, cause?: unknown) {
43
- super(`LLM unreachable: ${provider}`);
44
- this.name = "LLMUnreachableError";
45
- this.cause = cause;
46
- }
47
- }
48
-
49
- export interface LLMClient {
50
- embed(text: string, kind: EmbeddingKind): Promise<EmbedResult>;
51
- classify(transcript: string): Promise<ClassifyResult>;
52
- }
@@ -1,16 +0,0 @@
1
- /**
2
- * StructuredLogger — sole logging seam for core/.
3
- *
4
- * Outer layers wire a concrete logger (console, pino, file-append). Tests
5
- * substitute a recording logger. core/ never calls console.log directly.
6
- */
7
-
8
- export type LogLevel = "debug" | "info" | "warn" | "error";
9
-
10
- export interface LogFields {
11
- readonly [key: string]: string | number | boolean | null | undefined;
12
- }
13
-
14
- export interface StructuredLogger {
15
- log(level: LogLevel, message: string, fields?: LogFields): void;
16
- }