nlm-memory 0.5.0 → 0.5.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (247)
  1. package/README.md +72 -34
  2. package/dist/cli/nlm.js +2 -1
  3. package/dist/cli/nlm.js.map +1 -1
  4. package/dist/http/app.js +2 -1
  5. package/dist/http/app.js.map +1 -1
  6. package/dist/mcp/server.js +20 -1
  7. package/dist/mcp/server.js.map +1 -1
  8. package/dist/ui/assets/{index-C8cpwbYJ.css → index-Beo8psd-.css} +1 -1
  9. package/dist/ui/assets/{index-CB50QnL-.js → index-CSPTTeeM.js} +8 -8
  10. package/dist/ui/index.html +2 -2
  11. package/package.json +26 -1
  12. package/.agents/plugins/marketplace.json +0 -20
  13. package/.github/workflows/ci.yml +0 -30
  14. package/docs/methodology/re-derivation-rate.md +0 -112
  15. package/docs/methodology/useful-hit-rate.md +0 -79
  16. package/docs/plans/2026-05-20-fts5-lexical-recall.md +0 -1088
  17. package/docs/plans/2026-05-20-recall-daemon-wedge-fix.md +0 -662
  18. package/docs/plans/2026-05-20-recall-hook-design.md +0 -131
  19. package/docs/plans/2026-05-20-recall-hook-implementation.md +0 -1222
  20. package/docs/plans/desktop-product.md +0 -69
  21. package/docs/plans/factstore-design.md +0 -236
  22. package/logs/CHANGELOG/CHANGELOG-2026.md +0 -1575
  23. package/logs/CHANGELOG/CHANGELOG.md +0 -209
  24. package/migrations/000_initial_schema.sql +0 -174
  25. package/migrations/001_entity_type_rename.sql +0 -17
  26. package/migrations/002_adapter_state_extend.sql +0 -12
  27. package/migrations/003_session_embeddings.sql +0 -11
  28. package/migrations/004_facts.sql +0 -46
  29. package/migrations/005_sources.sql +0 -31
  30. package/migrations/006_providers.sql +0 -33
  31. package/migrations/007_source_tokens.sql +0 -17
  32. package/migrations/008_fts_rebuild.sql +0 -9
  33. package/migrations/009_session_embedding_chunks.sql +0 -46
  34. package/migrations/010_sources_opencode.sql +0 -30
  35. package/migrations/011_sources_hermes_agent.sql +0 -30
  36. package/migrations/012_sources_aider.sql +0 -30
  37. package/migrations/013_adapter_state_failure_count.sql +0 -12
  38. package/migrations/014_sources_cursor.sql +0 -30
  39. package/migrations/015_sources_windsurf.sql +0 -30
  40. package/plugin-hermes-agent/README.md +0 -49
  41. package/plugin-hermes-agent/__init__.py +0 -75
  42. package/plugin-hermes-agent/plugin.yaml +0 -15
  43. package/scripts/backfill-citations.mjs +0 -0
  44. package/scripts/build-codex-plugin.mjs +0 -61
  45. package/scripts/deepseek-probe.mjs +0 -67
  46. package/scripts/extract-triples.mjs +0 -207
  47. package/scripts/longmemeval/embedding-cache.ts +0 -77
  48. package/scripts/longmemeval/fetch-dataset.sh +0 -25
  49. package/scripts/longmemeval/run-harness.ts +0 -315
  50. package/scripts/longmemeval/scorer.ts +0 -99
  51. package/scripts/longmemeval/tsconfig.json +0 -9
  52. package/scripts/longmemeval/types.ts +0 -35
  53. package/scripts/nlm-daily-digest.py +0 -239
  54. package/scripts/nlm-daily-digest.sh +0 -28
  55. package/src/cli/classify-parity.ts +0 -257
  56. package/src/cli/launchctl-helpers.ts +0 -49
  57. package/src/cli/nlm.ts +0 -1078
  58. package/src/core/actions/actions-log.ts +0 -118
  59. package/src/core/actions/overlay.ts +0 -117
  60. package/src/core/adapters/aider.ts +0 -205
  61. package/src/core/adapters/claude-code.ts +0 -293
  62. package/src/core/adapters/common.ts +0 -54
  63. package/src/core/adapters/cursor.ts +0 -486
  64. package/src/core/adapters/from-source.ts +0 -67
  65. package/src/core/adapters/hermes-agent.ts +0 -240
  66. package/src/core/adapters/hermes.ts +0 -277
  67. package/src/core/adapters/jsonl-generic.ts +0 -208
  68. package/src/core/adapters/opencode.ts +0 -281
  69. package/src/core/adapters/pi.ts +0 -264
  70. package/src/core/adapters/windsurf.ts +0 -386
  71. package/src/core/classifier/prompt.ts +0 -200
  72. package/src/core/dataset/build-dataset.ts +0 -463
  73. package/src/core/embedding/chunk-body.ts +0 -76
  74. package/src/core/embedding/embed-backfill.ts +0 -210
  75. package/src/core/embedding/embed-normalize.ts +0 -135
  76. package/src/core/facts/backfill-facts.ts +0 -254
  77. package/src/core/facts/extract-facts.ts +0 -50
  78. package/src/core/hook/citation-detect.ts +0 -124
  79. package/src/core/hook/cite-memo.ts +0 -68
  80. package/src/core/hook/claude-settings.ts +0 -187
  81. package/src/core/hook/gate.ts +0 -25
  82. package/src/core/hook/hook-log.ts +0 -41
  83. package/src/core/hook/memo-sweep.ts +0 -164
  84. package/src/core/hook/memo.ts +0 -67
  85. package/src/core/hook/pointer-block.ts +0 -26
  86. package/src/core/hook/select.ts +0 -32
  87. package/src/core/hook/transcript.ts +0 -121
  88. package/src/core/ingest/ingest-session.ts +0 -111
  89. package/src/core/providers/provider-models.ts +0 -100
  90. package/src/core/providers/provider-registry.ts +0 -196
  91. package/src/core/recall/citation-log.ts +0 -108
  92. package/src/core/recall/filter.ts +0 -27
  93. package/src/core/recall/index.ts +0 -6
  94. package/src/core/recall/match-fields.ts +0 -40
  95. package/src/core/recall/query-log.ts +0 -149
  96. package/src/core/recall/query-shape.ts +0 -66
  97. package/src/core/recall/recall-service.ts +0 -320
  98. package/src/core/recall/recent-log.ts +0 -59
  99. package/src/core/recall/tokenize.ts +0 -18
  100. package/src/core/recall/useful-scan.ts +0 -336
  101. package/src/core/recall-facts/fact-query-log.ts +0 -150
  102. package/src/core/recall-facts/fact-recall-service.ts +0 -327
  103. package/src/core/scheduler/scan-once.ts +0 -142
  104. package/src/core/scheduler/scheduler.ts +0 -225
  105. package/src/core/sources/source-registry.ts +0 -278
  106. package/src/core/storage/db-restore.ts +0 -133
  107. package/src/core/storage/live-status.ts +0 -45
  108. package/src/core/storage/migrate.ts +0 -72
  109. package/src/core/storage/sqlite-fact-store.ts +0 -304
  110. package/src/core/storage/sqlite-session-store.ts +0 -810
  111. package/src/hook/hook-auth.ts +0 -18
  112. package/src/hook/prompt-recall-hook.ts +0 -180
  113. package/src/hook/session-end-hook.ts +0 -81
  114. package/src/hook/session-start-hook.ts +0 -168
  115. package/src/hook/stop-hook.ts +0 -239
  116. package/src/http/app.ts +0 -1215
  117. package/src/install/claude-code.ts +0 -128
  118. package/src/install/codex.ts +0 -367
  119. package/src/install/cursor.ts +0 -68
  120. package/src/install/hermes-agent.ts +0 -76
  121. package/src/install/hermes.ts +0 -78
  122. package/src/install/nlm-dir-perms.ts +0 -55
  123. package/src/install/ollama.ts +0 -284
  124. package/src/install/setup.ts +0 -489
  125. package/src/install/windsurf.ts +0 -68
  126. package/src/llm/classifier-box.ts +0 -64
  127. package/src/llm/deepseek-client.ts +0 -150
  128. package/src/llm/env-autoload.ts +0 -55
  129. package/src/llm/ollama-client.ts +0 -189
  130. package/src/mcp/server.ts +0 -534
  131. package/src/ports/fact-store.ts +0 -102
  132. package/src/ports/llm-client.ts +0 -52
  133. package/src/ports/logger.ts +0 -16
  134. package/src/ports/session-store.ts +0 -45
  135. package/src/ports/transcript-adapter.ts +0 -55
  136. package/src/shared/types.ts +0 -149
  137. package/src/ui/App.tsx +0 -58
  138. package/src/ui/components/PromoteOpenButton.tsx +0 -65
  139. package/src/ui/components/SessionDrawer.tsx +0 -199
  140. package/src/ui/components/SideNav.tsx +0 -162
  141. package/src/ui/components/Skeleton.tsx +0 -107
  142. package/src/ui/index.html +0 -13
  143. package/src/ui/lib/actions.ts +0 -30
  144. package/src/ui/lib/api.ts +0 -92
  145. package/src/ui/lib/dataset.ts +0 -141
  146. package/src/ui/lib/registries.ts +0 -155
  147. package/src/ui/lib/view-settings.ts +0 -41
  148. package/src/ui/main.tsx +0 -15
  149. package/src/ui/pages/Live.tsx +0 -229
  150. package/src/ui/pages/Pulse.tsx +0 -415
  151. package/src/ui/pages/Recall.tsx +0 -190
  152. package/src/ui/pages/River.tsx +0 -354
  153. package/src/ui/pages/Search.tsx +0 -386
  154. package/src/ui/pages/Stub.tsx +0 -9
  155. package/src/ui/pages/Thread.tsx +0 -473
  156. package/src/ui/pages/settings/Classifier.tsx +0 -227
  157. package/src/ui/pages/settings/Data.tsx +0 -190
  158. package/src/ui/pages/settings/Index.tsx +0 -65
  159. package/src/ui/pages/settings/Labels.tsx +0 -224
  160. package/src/ui/pages/settings/Providers.tsx +0 -305
  161. package/src/ui/pages/settings/SettingsSubnav.tsx +0 -28
  162. package/src/ui/pages/settings/Sources.tsx +0 -326
  163. package/src/ui/pages/settings/Views.tsx +0 -96
  164. package/src/ui/styles.css +0 -1890
  165. package/src/ui/tsconfig.json +0 -21
  166. package/src/ui/vite.config.ts +0 -19
  167. package/tests/fixtures/claude_code/short_session.jsonl +0 -2
  168. package/tests/fixtures/claude_code/standard_iso.jsonl +0 -4
  169. package/tests/fixtures/claude_code/tool_heavy.jsonl +0 -8
  170. package/tests/fixtures/claude_code/with_subagent.jsonl +0 -7
  171. package/tests/fixtures/facts.ts +0 -17
  172. package/tests/fixtures/golden-corpus.ts +0 -85
  173. package/tests/fixtures/hermes/paired_request_dump.json +0 -24
  174. package/tests/fixtures/hermes/paired_session.json +0 -23
  175. package/tests/fixtures/hermes/request_dump.json +0 -28
  176. package/tests/fixtures/hermes/session_iso.json +0 -38
  177. package/tests/fixtures/hermes/session_unix.json +0 -38
  178. package/tests/fixtures/hermes/system_only.json +0 -18
  179. package/tests/fixtures/pi/error-connection-abort.jsonl +0 -8
  180. package/tests/fixtures/pi/short-successful.jsonl +0 -5
  181. package/tests/fixtures/pi/with-custom-message.jsonl +0 -6
  182. package/tests/fixtures/sessions.ts +0 -22
  183. package/tests/integration/backfill-facts.test.ts +0 -362
  184. package/tests/integration/citation-explicit.test.ts +0 -111
  185. package/tests/integration/cite-event.test.ts +0 -169
  186. package/tests/integration/cite-memo.test.ts +0 -87
  187. package/tests/integration/db-restore.test.ts +0 -153
  188. package/tests/integration/embed-backfill.test.ts +0 -176
  189. package/tests/integration/fact-supersedence.test.ts +0 -313
  190. package/tests/integration/fts-index.test.ts +0 -60
  191. package/tests/integration/getbyids-sqlite.test.ts +0 -100
  192. package/tests/integration/hermes-agent-hooks.test.ts +0 -248
  193. package/tests/integration/hook-claude-settings.test.ts +0 -218
  194. package/tests/integration/hook-log.test.ts +0 -54
  195. package/tests/integration/hook-memo.test.ts +0 -68
  196. package/tests/integration/hook-pre-compact.test.ts +0 -105
  197. package/tests/integration/hook-subagent-start.test.ts +0 -102
  198. package/tests/integration/http.test.ts +0 -401
  199. package/tests/integration/keyword-search-fts.test.ts +0 -66
  200. package/tests/integration/mcp-recall-logging.test.ts +0 -88
  201. package/tests/integration/mcp.test.ts +0 -260
  202. package/tests/integration/memo-sweep.test.ts +0 -91
  203. package/tests/integration/prompt-recall-hook.test.ts +0 -88
  204. package/tests/integration/provider-registry.test.ts +0 -107
  205. package/tests/integration/recall-golden.test.ts +0 -59
  206. package/tests/integration/recall-sqlite.test.ts +0 -169
  207. package/tests/integration/scheduler.test.ts +0 -391
  208. package/tests/integration/session-end-hook.test.ts +0 -48
  209. package/tests/integration/session-start-hook.test.ts +0 -126
  210. package/tests/integration/source-registry.test.ts +0 -122
  211. package/tests/integration/sqlite-fact-store.test.ts +0 -346
  212. package/tests/integration/stop-hook.test.ts +0 -560
  213. package/tests/integration/wal-checkpoint.test.ts +0 -49
  214. package/tests/unit/cli/launchctl-helpers.test.ts +0 -60
  215. package/tests/unit/core/adapters/aider.test.ts +0 -230
  216. package/tests/unit/core/adapters/claude-code.test.ts +0 -118
  217. package/tests/unit/core/adapters/cursor.test.ts +0 -485
  218. package/tests/unit/core/adapters/hermes-agent.test.ts +0 -329
  219. package/tests/unit/core/adapters/hermes.test.ts +0 -81
  220. package/tests/unit/core/adapters/jsonl-generic.test.ts +0 -142
  221. package/tests/unit/core/adapters/opencode.test.ts +0 -354
  222. package/tests/unit/core/adapters/pi.test.ts +0 -110
  223. package/tests/unit/core/adapters/windsurf.test.ts +0 -416
  224. package/tests/unit/core/classifier/prompt.test.ts +0 -126
  225. package/tests/unit/core/embedding/chunk-body.test.ts +0 -100
  226. package/tests/unit/core/facts/extract-facts.test.ts +0 -117
  227. package/tests/unit/core/filter.test.ts +0 -40
  228. package/tests/unit/core/hook/citation-detect-cite-session.test.ts +0 -96
  229. package/tests/unit/core/hook/citation-detect.test.ts +0 -124
  230. package/tests/unit/core/hook/gate.test.ts +0 -29
  231. package/tests/unit/core/hook/pointer-block.test.ts +0 -22
  232. package/tests/unit/core/hook/select.test.ts +0 -66
  233. package/tests/unit/core/match-fields.test.ts +0 -39
  234. package/tests/unit/core/mcp-cite-session.test.ts +0 -51
  235. package/tests/unit/core/providers/provider-models.test.ts +0 -101
  236. package/tests/unit/core/query-shape.test.ts +0 -92
  237. package/tests/unit/core/recall-facts/fact-recall-service.test.ts +0 -258
  238. package/tests/unit/core/recall-service.test.ts +0 -200
  239. package/tests/unit/core/storage/live-status.test.ts +0 -54
  240. package/tests/unit/core/tokenize.test.ts +0 -32
  241. package/tests/unit/core/useful-scan.test.ts +0 -537
  242. package/tests/unit/llm/embed.test.ts +0 -93
  243. package/tests/unit/llm/ollama-client.test.ts +0 -124
  244. package/tests/unit/scripts/longmemeval-scorer.test.ts +0 -114
  245. package/tsconfig.json +0 -31
  246. package/tsconfig.test.json +0 -11
  247. package/vitest.config.ts +0 -22
package/src/mcp/server.ts DELETED
@@ -1,534 +0,0 @@
1
- /**
2
- * MCP adapter. Binds the `recall_sessions` and `get_session` tools directly
3
- * to RecallService and SessionStore — no HTTP hop, no localhost loopback.
4
- *
5
- * The Python daemon's MCP server proxied through HTTP. This server runs in
6
- * the same process as the rest of nlm-memory, so a tool call is a function
7
- * call. Lower latency, simpler stack traces, one fewer thing to keep alive.
8
- *
9
- * Layering: this module knows about the inner ring (RecallService,
10
- * SessionStore); core/ does not know this module exists.
11
- */
12
-
13
- import { McpServer } from "@modelcontextprotocol/sdk/server/mcp.js";
14
- import { encode as toonEncode } from "@toon-format/toon";
15
- import { z } from "zod";
16
- import { logQuery } from "@core/recall/query-log.js";
17
- import { logFactQuery } from "@core/recall-facts/fact-query-log.js";
18
- import { appendCitation } from "@core/recall/citation-log.js";
19
- import type { FactRecallService } from "@core/recall-facts/fact-recall-service.js";
20
- import type { RecallService } from "@core/recall/recall-service.js";
21
- import type { FactStore } from "@ports/fact-store.js";
22
- import type { SessionStore } from "@ports/session-store.js";
23
- import type {
24
- FactKind,
25
- FactRecallQuery,
26
- RecallKindFilter,
27
- RecallMode,
28
- RecallQuery,
29
- } from "@shared/types.js";
30
-
31
- const CHARACTER_LIMIT = 25_000;
32
- const DEFAULT_LIMIT = 10;
33
- const SERVER_NAME = "nlm-memory-mcp-server";
34
- const SERVER_VERSION = "0.4.0";
35
-
36
- /** TOON encoding cuts token usage on large recall payloads. Opt in via
37
- * NLM_FORMAT=toon in the MCP server's env (see .mcp.json). Defaults to JSON. */
38
- const USE_TOON = process.env.NLM_FORMAT === "toon";
39
-
40
- export interface McpDeps {
41
- readonly recall: RecallService;
42
- readonly store: SessionStore;
43
- /** Optional — when absent, fact tools are not registered. */
44
- readonly factRecall?: FactRecallService;
45
- readonly factStore?: FactStore;
46
- }
47
-
48
- export interface ToolResult {
49
- content: { type: "text"; text: string }[];
50
- isError?: boolean;
51
- }
52
-
53
- function format(data: unknown): string {
54
- if (USE_TOON) {
55
- try {
56
- return toonEncode(data);
57
- } catch {
58
- return JSON.stringify(data, null, 2);
59
- }
60
- }
61
- return JSON.stringify(data, null, 2);
62
- }
63
-
64
- function truncate(data: unknown): string {
65
- const str = format(data);
66
- if (str.length <= CHARACTER_LIMIT) return str;
67
- return format({
68
- truncated: true,
69
- truncation_message:
70
- "Response too large. Lower limit or fetch fewer fields via get_session.",
71
- });
72
- }
73
-
74
- function ok(data: unknown): ToolResult {
75
- return { content: [{ type: "text", text: truncate(data) }] };
76
- }
77
-
78
- function err(error: unknown): ToolResult {
79
- const message = error instanceof Error ? error.message : String(error);
80
- return {
81
- isError: true,
82
- content: [{ type: "text", text: `Error: ${message}` }],
83
- };
84
- }
85
-
86
- // Pure handler functions — exported so tests can exercise them without an
87
- // MCP transport. The McpServer wrapper below just registers these.
88
-
89
- export interface RecallToolInput {
90
- query: string | undefined;
91
- entity: string | undefined;
92
- kind: RecallKindFilter | undefined;
93
- mode: RecallMode | undefined;
94
- limit: number | undefined;
95
- }
96
-
97
- export async function recallSessionsHandler(
98
- deps: McpDeps,
99
- input: Partial<RecallToolInput>,
100
- ): Promise<ToolResult> {
101
- try {
102
- const query: RecallQuery = {
103
- query: input.query ?? "",
104
- mode: input.mode ?? "hybrid",
105
- limit: input.limit ?? DEFAULT_LIMIT,
106
- ...(input.entity !== undefined ? { entity: input.entity } : {}),
107
- ...(input.kind !== undefined ? { kind: input.kind } : {}),
108
- };
109
- const result = await deps.recall.search(query);
110
- // Telemetry — the MCP path is the real agent-usage path; without this it
111
- // is invisible to query_log.jsonl and the Recall page. Fire-and-forget,
112
- // mirrors the HTTP /api/recall handler.
113
- void logQuery({
114
- source: "mcp",
115
- query: input.query ?? null,
116
- entity: input.entity ?? null,
117
- kind: input.kind ?? null,
118
- mode: input.mode ?? "hybrid",
119
- limit: input.limit ?? DEFAULT_LIMIT,
120
- nResults: result.total,
121
- returnedIds: result.results.map((r) => r.id),
122
- });
123
- return ok(result);
124
- } catch (e) {
125
- return err(e);
126
- }
127
- }
128
-
129
- export async function getSessionHandler(
130
- deps: McpDeps,
131
- input: { id: string },
132
- ): Promise<ToolResult> {
133
- try {
134
- const session = await deps.store.getById(input.id);
135
- if (!session) {
136
- return err(new Error(`session ${input.id} not found`));
137
- }
138
- return ok(session);
139
- } catch (e) {
140
- return err(e);
141
- }
142
- }
143
-
144
- export interface RecallFactsInput {
145
- query: string | undefined;
146
- subject: string | undefined;
147
- predicate: string | undefined;
148
- kind: FactKind | undefined;
149
- mode: RecallMode | undefined;
150
- includeSuperseded: boolean | undefined;
151
- minConfidence: number | undefined;
152
- limit: number | undefined;
153
- }
154
-
155
- export async function recallFactsHandler(
156
- deps: McpDeps,
157
- input: Partial<RecallFactsInput>,
158
- ): Promise<ToolResult> {
159
- if (!deps.factRecall) {
160
- return err(new Error("fact recall not wired in this deployment"));
161
- }
162
- try {
163
- const query: FactRecallQuery = {
164
- query: input.query ?? "",
165
- mode: input.mode ?? "hybrid",
166
- limit: input.limit ?? DEFAULT_LIMIT,
167
- ...(input.subject !== undefined ? { subject: input.subject } : {}),
168
- ...(input.predicate !== undefined ? { predicate: input.predicate } : {}),
169
- ...(input.kind !== undefined ? { kind: input.kind } : {}),
170
- ...(input.includeSuperseded !== undefined
171
- ? { includeSuperseded: input.includeSuperseded }
172
- : {}),
173
- ...(input.minConfidence !== undefined
174
- ? { minConfidence: input.minConfidence }
175
- : {}),
176
- };
177
- const result = await deps.factRecall.search(query);
178
- // Telemetry — see recallSessionsHandler. Fire-and-forget.
179
- void logFactQuery({
180
- source: "mcp",
181
- query: input.query ?? null,
182
- subject: input.subject ?? null,
183
- predicate: input.predicate ?? null,
184
- kind: input.kind ?? null,
185
- mode: input.mode ?? "hybrid",
186
- limit: input.limit ?? DEFAULT_LIMIT,
187
- nResults: result.total,
188
- returnedIds: result.results.map((r) => r.id),
189
- });
190
- return ok(result);
191
- } catch (e) {
192
- return err(e);
193
- }
194
- }
195
-
196
- export async function getFactHistoryHandler(
197
- deps: McpDeps,
198
- input: { subject: string; predicate: string | undefined },
199
- ): Promise<ToolResult> {
200
- if (!deps.factStore) {
201
- return err(new Error("fact store not wired in this deployment"));
202
- }
203
- try {
204
- const chains = await deps.factStore.getHistory(input.subject, input.predicate);
205
- return ok({ subject: input.subject, predicate: input.predicate ?? null, chains });
206
- } catch (e) {
207
- return err(e);
208
- }
209
- }
210
-
211
- const CITE_SESSION_DESCRIPTION = `Log that you used a previously-surfaced session in your response. Pass the session ID. This lets NLM learn which surfaced sessions are actually useful, training a per-operator reranker over time. Call after writing your response, with one cite per surfaced session you actually drew from.`;
212
-
213
- const RECALL_DESCRIPTION = `Search prior AI sessions across every runtime the user has connected (Claude Code,
214
- Hermes, pi, Codex, Gemini, Aider). Local-first, fast (~200-400ms warm), idempotent,
215
- safe to call eagerly. No rate limit; no cost per call.
216
-
217
- CALL THIS FIRST — before answering — whenever the user prompt contains any of:
218
-
219
- Decision / position questions
220
- "what did we decide about X" · "did we figure out X" · "what's our take on X"
221
- "have we tried X" · "where did we land on X" · "what was the conclusion"
222
-
223
- Status / open-thread questions
224
- "what's still open on X" · "where did we leave X" · "what's blocked on X"
225
- "what's the state of X" · "is X done"
226
-
227
- History / continuity questions
228
- "have I worked on X" · "when did we last X" · "did we already do X"
229
- "have I talked to <person>" · "what's the history with X"
230
-
231
- Implicit references to prior context (the dangerous case — easy to miss)
232
- "that pgvector thing" · "the X discussion" · "our auth approach"
233
- "the one we built for <client>" · "the issue we hit last week"
234
-
235
- Not calling when the user references past work is the failure mode this tool exists
236
- to prevent: re-derivation of already-solved problems, contradicting prior decisions,
237
- re-litigating resolved open questions, ignoring the user's accumulated context.
238
-
239
- Returns ranked session digests (id, label, summary, entities, decisions, open
240
- questions). Call get_session for the full body when a digest looks relevant.
241
-
242
- Skip ONLY when the request is purely forward-looking with no plausible prior
243
- context — drafting wholly new content, naming something new, brainstorming
244
- greenfield ideas. When in doubt, call.
245
-
246
- When you reference a returned session in your response, call \`cite_session(id)\` to log it so the recall layer can learn what is useful.
247
-
248
- Args:
249
- - query: keyword(s) to search. Token-weighted match against label, decisions,
250
- open questions, and summary. Optional if entity or kind is provided.
251
- - entity: filter to sessions tagged with this entity. Optional.
252
- - kind: "decision" or "open" — restrict to sessions containing that marker
253
- kind. Omit for any. Optional.
254
- - mode: "hybrid" (default — keyword BM25 + semantic embeddings), "keyword", or
255
- "semantic". Optional.
256
- - limit: max results (1-100, default 10).`;
257
-
258
- const GET_SESSION_DESCRIPTION = `Fetch one full session by its canonical ID, including the conversational body.
259
-
260
- Call this AFTER recall_sessions when a returned digest looks relevant and the
261
- summary alone isn't enough to answer — e.g. you need the exact wording of a
262
- decision, the full reasoning behind a pivot, the specific commands that were
263
- run, or any quote you intend to reference verbatim.
264
-
265
- The recall_sessions digest is optimized for ranking and scanning; the full body
266
- contains the actual conversation transcript that produced the decision.
267
-
268
- Args:
269
- - id: Canonical session ID returned by recall_sessions (e.g. "cc_abc123",
270
- "sess_pgvector"). Pass the id field from the recall_sessions result.`;
271
-
272
- const RECALL_FACTS_DESCRIPTION = `Look up specific (subject, predicate, value) facts the user has established in
273
- prior sessions — model aliases, framework choices, endpoints, ports, hosts,
274
- deadlines, pricing, owners, dependencies, etc.
275
-
276
- CALL THIS when the user asks for a concrete value rather than a prose summary:
277
-
278
- "what port is X on" · "what model does Y use" · "what's the endpoint for Z"
279
- "what framework did we pick for X" · "who owns the X project"
280
- "when's the X deadline" · "what did we set X to" · "where does X live"
281
- "what version of X are we on" · "what's our X account"
282
-
283
- Prefer this over recall_sessions when the user wants the *answer*, not the
284
- *conversation* — facts return the exact value with provenance (source session
285
- + source quote), no scanning required. recall_sessions is the right tool when
286
- the user wants context, reasoning, or the full discussion.
287
-
288
- Returns matching Fact records ordered by recency. Superseded facts are excluded
289
- by default; call get_fact_history to walk the chain of how a value evolved
290
- ("when did X flip from Fastify to Hono?").
291
-
292
- Examples:
293
- recall_facts(subject="mac-pro-llm-host", predicate="model")
294
- → the model alias currently exposed on the Mac Pro LLM endpoint
295
- recall_facts(subject="nlm-memory-ts", predicate="framework")
296
- → the web framework picked for nlm-memory-ts
297
- recall_facts(subject="goat-home-services")
298
- → all known facts about the GOAT engagement
299
- recall_facts(query="routing", kind="decision")
300
- → recent decision-kind facts mentioning routing
301
-
302
- Args:
303
- - query: free-text search against fact values. Optional if subject /
304
- predicate / kind is set.
305
- - subject: exact-match normalized (lowercase-kebab) entity or topic name.
306
- - predicate: exact-match predicate from the closed vocabulary (framework,
307
- endpoint, model, port, host, owner, pricing, cost, deadline,
308
- status, stack, runtime, library, version, dependency, schema,
309
- integration, deployment, repo, branch, commit, description,
310
- decided-on, assumption, blocker).
311
- - kind: "decision" | "open" | "attribute". Optional.
312
- - mode: "hybrid" (default — keyword BM25 + semantic embeddings), "keyword",
313
- or "semantic".
314
- - includeSuperseded: true to include outdated facts. Default false.
315
- - minConfidence: lower bound on classifier confidence. Default 0.6.
316
- - limit: max results (1-100, default 10).`;
317
-
318
- const GET_FACT_HISTORY_DESCRIPTION = `Walk the supersedence chain for a (subject, predicate) pair to see how a value
319
- changed over time. Call this when the user asks about evolution, history of a
320
- choice, or wants to understand a prior decision that's since changed:
321
-
322
- "when did we switch from X to Y" · "what did we use before X"
323
- "wasn't X different a month ago" · "history of <X choice>"
324
- "why did we change from X to Y"
325
-
326
- This is the editable-timeline feature: NLM preserves rejected/replaced decisions
327
- as superseded entries rather than deleting them, so the reasoning trail survives.
328
-
329
- Returns chains ordered newest → oldest. The head is the current value; subsequent
330
- entries are predecessors, each linked forward via supersededBy.
331
-
332
- Args:
333
- - subject: normalized (lowercase-kebab) entity or topic name.
334
- - predicate: optional — narrow to a single (subject, predicate) chain. When
335
- omitted, returns one chain per predicate for this subject.`;
336
-
337
- // Minimum length for a session ID to be treated as valid.
338
- const MIN_CITE_ID_LEN = 6;
339
-
340
- export interface CiteSessionInput {
341
- readonly id: string;
342
- readonly conversation_id?: string | undefined;
343
- readonly reason?: string | undefined;
344
- }
345
-
346
- export async function citeSessionHandler(
347
- input: CiteSessionInput,
348
- ): Promise<ToolResult> {
349
- if (!input.id || input.id.length < MIN_CITE_ID_LEN) {
350
- return err(new Error(`id must be at least ${MIN_CITE_ID_LEN} characters`));
351
- }
352
- try {
353
- await appendCitation({
354
- conversationId: input.conversation_id ?? "mcp_tool",
355
- citedId: input.id,
356
- kind: "tool_use",
357
- ...(input.reason !== undefined ? { responsePreview: input.reason } : {}),
358
- });
359
- return ok({ logged: true, id: input.id });
360
- } catch (e) {
361
- return err(e);
362
- }
363
- }
364
-
365
- export function createMcpServer(deps: McpDeps): McpServer {
366
- const server = new McpServer({
367
- name: SERVER_NAME,
368
- version: SERVER_VERSION,
369
- });
370
-
371
- server.registerTool(
372
- "recall_sessions",
373
- {
374
- title: "Recall Sessions from NLM",
375
- description: RECALL_DESCRIPTION,
376
- inputSchema: {
377
- query: z
378
- .string()
379
- .default("")
380
- .describe("Keyword(s) to search. Optional if entity or kind is set."),
381
- entity: z
382
- .string()
383
- .optional()
384
- .describe("Filter to sessions tagged with this entity name."),
385
- kind: z
386
- .enum(["decision", "open"])
387
- .optional()
388
- .describe("Filter to sessions with a decision or open marker."),
389
- mode: z
390
- .enum(["keyword", "semantic", "hybrid"])
391
- .optional()
392
- .describe("Search mode. Defaults to hybrid (keyword BM25 + semantic embeddings)."),
393
- limit: z
394
- .number()
395
- .int()
396
- .min(1)
397
- .max(100)
398
- .default(DEFAULT_LIMIT)
399
- .describe("Max results to return."),
400
- },
401
- annotations: {
402
- readOnlyHint: true,
403
- destructiveHint: false,
404
- idempotentHint: true,
405
- openWorldHint: true,
406
- },
407
- },
408
- async (args) => recallSessionsHandler(deps, args) as never,
409
- );
410
-
411
- server.registerTool(
412
- "get_session",
413
- {
414
- title: "Get Full NLM Session",
415
- description: GET_SESSION_DESCRIPTION,
416
- inputSchema: {
417
- id: z.string().min(1).describe("Canonical session ID."),
418
- },
419
- annotations: {
420
- readOnlyHint: true,
421
- destructiveHint: false,
422
- idempotentHint: true,
423
- openWorldHint: true,
424
- },
425
- },
426
- async (args) => getSessionHandler(deps, args) as never,
427
- );
428
-
429
- if (deps.factRecall && deps.factStore) {
430
- server.registerTool(
431
- "recall_facts",
432
- {
433
- title: "Recall Facts from NLM",
434
- description: RECALL_FACTS_DESCRIPTION,
435
- inputSchema: {
436
- query: z
437
- .string()
438
- .default("")
439
- .describe("Free-text search against fact values. Optional if subject/predicate/kind set."),
440
- subject: z
441
- .string()
442
- .optional()
443
- .describe("Exact-match normalized entity/topic (lowercase-kebab)."),
444
- predicate: z
445
- .string()
446
- .optional()
447
- .describe("Exact-match predicate from the closed vocabulary."),
448
- kind: z
449
- .enum(["decision", "open", "attribute"])
450
- .optional()
451
- .describe("Filter to a single fact kind."),
452
- mode: z
453
- .enum(["keyword", "semantic", "hybrid"])
454
- .optional()
455
- .describe("Search mode. Defaults to hybrid (keyword BM25 + semantic embeddings)."),
456
- includeSuperseded: z
457
- .boolean()
458
- .optional()
459
- .describe("Include outdated facts. Default false."),
460
- minConfidence: z
461
- .number()
462
- .min(0)
463
- .max(1)
464
- .optional()
465
- .describe("Lower bound on classifier confidence. Default 0.6."),
466
- limit: z
467
- .number()
468
- .int()
469
- .min(1)
470
- .max(100)
471
- .default(DEFAULT_LIMIT)
472
- .describe("Max results to return."),
473
- },
474
- annotations: {
475
- readOnlyHint: true,
476
- destructiveHint: false,
477
- idempotentHint: true,
478
- openWorldHint: true,
479
- },
480
- },
481
- async (args) => recallFactsHandler(deps, args) as never,
482
- );
483
-
484
- server.registerTool(
485
- "get_fact_history",
486
- {
487
- title: "Get Fact Supersedence History",
488
- description: GET_FACT_HISTORY_DESCRIPTION,
489
- inputSchema: {
490
- subject: z.string().min(1).describe("Normalized entity/topic name."),
491
- predicate: z
492
- .string()
493
- .optional()
494
- .describe("Narrow to one (subject, predicate) chain."),
495
- },
496
- annotations: {
497
- readOnlyHint: true,
498
- destructiveHint: false,
499
- idempotentHint: true,
500
- openWorldHint: true,
501
- },
502
- },
503
- async (args) => getFactHistoryHandler(deps, args) as never,
504
- );
505
- }
506
-
507
- server.registerTool(
508
- "cite_session",
509
- {
510
- title: "Cite NLM Session",
511
- description: CITE_SESSION_DESCRIPTION,
512
- inputSchema: {
513
- id: z.string().min(MIN_CITE_ID_LEN).describe("Session ID returned by recall_sessions that you referenced in your response."),
514
- conversation_id: z
515
- .string()
516
- .optional()
517
- .describe("Current conversation ID. Optional — NLM infers from context when absent."),
518
- reason: z
519
- .string()
520
- .optional()
521
- .describe("Why this session was useful. Optional but encouraged — articulating the reason is a weak training signal."),
522
- },
523
- annotations: {
524
- readOnlyHint: false,
525
- destructiveHint: false,
526
- idempotentHint: false,
527
- openWorldHint: false,
528
- },
529
- },
530
- async (args) => citeSessionHandler(args) as never,
531
- );
532
-
533
- return server;
534
- }
@@ -1,102 +0,0 @@
1
- /**
2
- * FactStore — the only way core/ reads or writes the fact corpus.
3
- *
4
- * Companion to SessionStore. Sessions are the operator-recall unit; facts are
5
- * the agent-recall projection — normalized (subject, predicate, value) triples
6
- * derived from sessions, supersedence-aware. See
7
- * docs/plans/factstore-design.md.
8
- *
9
- * Phase B.1 ships the storage port + adapter only. No extraction wired yet
10
- * (B.2), no recall service (B.3), no MCP surface (B.3), no supersedence
11
- * autodetect (B.4). The surface here is the minimum needed by future phases:
12
- * insert one or many, look up by id, look up current (non-superseded) facts
13
- * by subject and optional predicate, mark a fact superseded.
14
- */
15
-
16
- import type { Fact, FactHistoryChain, FactKind } from "@shared/types.js";
17
-
18
- export interface FactQuery {
19
- readonly subject: string;
20
- readonly predicate?: string;
21
- readonly includeSuperseded?: boolean;
22
- readonly limit?: number;
23
- }
24
-
25
- export interface FactSemanticNeighbor {
26
- readonly factId: string;
27
- readonly distance: number;
28
- }
29
-
30
- /** Pre-filter applied at the storage layer before keyword scoring runs. */
31
- export interface FactListFilter {
32
- readonly subject?: string;
33
- readonly predicate?: string;
34
- readonly kind?: FactKind;
35
- readonly includeSuperseded?: boolean;
36
- readonly minConfidence?: number;
37
- readonly limit?: number;
38
- }
39
-
40
- export interface FactStore {
41
- /** Atomically insert a single fact. Throws on duplicate id. */
42
- insert(fact: Fact): Promise<void>;
43
-
44
- /** Atomically insert many facts as one transaction. Throws on any duplicate id. */
45
- insertMany(facts: ReadonlyArray<Fact>): Promise<void>;
46
-
47
- getById(id: string): Promise<Fact | null>;
48
-
49
- /**
50
- * Exact-match lookup of the current (non-superseded) fact for a
51
- * subject+predicate pair. Returns null if none exists. This is the hot
52
- * path for deterministic supersedence on ingest (Phase B.4).
53
- */
54
- findCurrent(subject: string, predicate: string): Promise<Fact | null>;
55
-
56
- /**
57
- * List facts matching the query. Defaults: current (non-superseded) only,
58
- * limit 50. Ordered by created_at descending.
59
- */
60
- list(query: FactQuery): Promise<ReadonlyArray<Fact>>;
61
-
62
- /**
63
- * List all facts attributable to a single session. Used by the UI to show
64
- * a fact-count badge on a session digest, and by tests.
65
- */
66
- listBySession(sessionId: string): Promise<ReadonlyArray<Fact>>;
67
-
68
- /**
69
- * Mark `oldId` as superseded by `newId`. Both facts must exist. Reversible
70
- * by passing null as newId (Phase C operator-undo affordance).
71
- */
72
- markSuperseded(oldId: string, newId: string | null): Promise<void>;
73
-
74
- /**
75
- * Pre-filtered fact list used by FactRecallService. Applies subject /
76
- * predicate / kind / confidence / superseded filters at the SQL layer
77
- * before keyword scoring runs in core. No ordering guarantee beyond
78
- * `created_at DESC`.
79
- */
80
- listForRecall(filter: FactListFilter): Promise<ReadonlyArray<Fact>>;
81
-
82
- /**
83
- * sqlite-vec KNN over fact_embeddings. Returns up to `limit` nearest
84
- * neighbors by L2 distance. The service converts distance to cosine and
85
- * blends with keyword scores.
86
- */
87
- semanticSearch(
88
- queryVector: Float32Array,
89
- limit: number,
90
- ): Promise<ReadonlyArray<FactSemanticNeighbor>>;
91
-
92
- /**
93
- * Supersedence chain inspection. When `predicate` is provided, returns a
94
- * single chain (or empty array if no facts match). When omitted, returns
95
- * one chain per distinct predicate for that subject. Each chain orders
96
- * newest → oldest by created_at.
97
- */
98
- getHistory(
99
- subject: string,
100
- predicate?: string,
101
- ): Promise<ReadonlyArray<FactHistoryChain>>;
102
- }
@@ -1,52 +0,0 @@
1
- /**
2
- * LLMClient — outbound LLM calls (embedding + classification).
3
- *
4
- * Implementations: OllamaClient (default, local), AnthropicClient, OpenAIClient.
5
- * core/ only sees this interface; it never imports an HTTP client.
6
- */
7
-
8
- export interface EmbedResult {
9
- readonly vector: Float32Array;
10
- readonly model: string;
11
- }
12
-
13
- export type EmbeddingKind = "query" | "document";
14
-
15
- /**
16
- * Raw fact extracted by the classifier. No id, no source_session_id, no
17
- * created_at yet — those get filled in at ingest time by extractFacts().
18
- *
19
- * `subject` and `predicate` come from the classifier already normalized
20
- * (lowercased, trimmed) per the prompt contract, but the coercer re-normalizes
21
- * defensively because LLM output is not trustworthy.
22
- */
23
- export interface ExtractedFact {
24
- readonly kind: "decision" | "open" | "attribute";
25
- readonly subject: string;
26
- readonly predicate: string;
27
- readonly value: string;
28
- readonly sourceQuote?: string;
29
- }
30
-
31
- export interface ClassifyResult {
32
- readonly label: string;
33
- readonly summary: string;
34
- readonly entities: ReadonlyArray<string>;
35
- readonly decisions: ReadonlyArray<string>;
36
- readonly open: ReadonlyArray<string>;
37
- readonly confidence: number;
38
- readonly facts: ReadonlyArray<ExtractedFact>;
39
- }
40
-
41
- export class LLMUnreachableError extends Error {
42
- constructor(provider: string, cause?: unknown) {
43
- super(`LLM unreachable: ${provider}`);
44
- this.name = "LLMUnreachableError";
45
- this.cause = cause;
46
- }
47
- }
48
-
49
- export interface LLMClient {
50
- embed(text: string, kind: EmbeddingKind): Promise<EmbedResult>;
51
- classify(transcript: string): Promise<ClassifyResult>;
52
- }
@@ -1,16 +0,0 @@
1
- /**
2
- * StructuredLogger — sole logging seam for core/.
3
- *
4
- * Outer layers wire a concrete logger (console, pino, file-append). Tests
5
- * substitute a recording logger. core/ never calls console.log directly.
6
- */
7
-
8
- export type LogLevel = "debug" | "info" | "warn" | "error";
9
-
10
- export interface LogFields {
11
- readonly [key: string]: string | number | boolean | null | undefined;
12
- }
13
-
14
- export interface StructuredLogger {
15
- log(level: LogLevel, message: string, fields?: LogFields): void;
16
- }