nlm-memory 0.4.2 → 0.5.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (285) hide show
  1. package/README.md +72 -34
  2. package/dist/cli/nlm.js +223 -33
  3. package/dist/cli/nlm.js.map +1 -1
  4. package/dist/core/adapters/cursor.d.ts +45 -0
  5. package/dist/core/adapters/cursor.js +397 -0
  6. package/dist/core/adapters/cursor.js.map +1 -0
  7. package/dist/core/adapters/from-source.js +10 -0
  8. package/dist/core/adapters/from-source.js.map +1 -1
  9. package/dist/core/adapters/windsurf.d.ts +44 -0
  10. package/dist/core/adapters/windsurf.js +299 -0
  11. package/dist/core/adapters/windsurf.js.map +1 -0
  12. package/dist/core/hook/claude-settings.d.ts +12 -5
  13. package/dist/core/hook/claude-settings.js +21 -6
  14. package/dist/core/hook/claude-settings.js.map +1 -1
  15. package/dist/core/sources/source-registry.d.ts +1 -1
  16. package/dist/core/sources/source-registry.js +18 -0
  17. package/dist/core/sources/source-registry.js.map +1 -1
  18. package/dist/core/storage/sqlite-session-store.d.ts +2 -0
  19. package/dist/core/storage/sqlite-session-store.js +38 -2
  20. package/dist/core/storage/sqlite-session-store.js.map +1 -1
  21. package/dist/hook/hook-auth.d.ts +13 -0
  22. package/dist/hook/hook-auth.js +19 -0
  23. package/dist/hook/hook-auth.js.map +1 -0
  24. package/dist/hook/prompt-recall-hook.js +7 -1
  25. package/dist/hook/prompt-recall-hook.js.map +1 -1
  26. package/dist/hook/session-start-hook.js +4 -1
  27. package/dist/hook/session-start-hook.js.map +1 -1
  28. package/dist/hook/stop-hook.js +4 -1
  29. package/dist/hook/stop-hook.js.map +1 -1
  30. package/dist/http/app.d.ts +2 -0
  31. package/dist/http/app.js +76 -1
  32. package/dist/http/app.js.map +1 -1
  33. package/dist/install/claude-code.js +1 -1
  34. package/dist/install/claude-code.js.map +1 -1
  35. package/dist/install/cursor.d.ts +25 -0
  36. package/dist/install/cursor.js +43 -0
  37. package/dist/install/cursor.js.map +1 -0
  38. package/dist/install/nlm-dir-perms.d.ts +19 -0
  39. package/dist/install/nlm-dir-perms.js +43 -0
  40. package/dist/install/nlm-dir-perms.js.map +1 -0
  41. package/dist/install/ollama.d.ts +18 -1
  42. package/dist/install/ollama.js +62 -7
  43. package/dist/install/ollama.js.map +1 -1
  44. package/dist/install/setup.d.ts +4 -0
  45. package/dist/install/setup.js +141 -18
  46. package/dist/install/setup.js.map +1 -1
  47. package/dist/install/windsurf.d.ts +25 -0
  48. package/dist/install/windsurf.js +43 -0
  49. package/dist/install/windsurf.js.map +1 -0
  50. package/dist/mcp/server.js +20 -1
  51. package/dist/mcp/server.js.map +1 -1
  52. package/dist/shared/types.d.ts +4 -0
  53. package/dist/ui/assets/{index-BA6IpU8g.css → index-Beo8psd-.css} +1 -1
  54. package/dist/ui/assets/index-CSPTTeeM.js +69 -0
  55. package/dist/ui/index.html +2 -2
  56. package/package.json +26 -1
  57. package/plugin/scripts/prompt-recall-hook.mjs +55 -4
  58. package/plugin/scripts/stop-hook.mjs +57 -6
  59. package/.agents/plugins/marketplace.json +0 -20
  60. package/.github/workflows/ci.yml +0 -30
  61. package/dist/ui/assets/index-B_qIVV0k.js +0 -69
  62. package/docs/methodology/re-derivation-rate.md +0 -112
  63. package/docs/methodology/useful-hit-rate.md +0 -79
  64. package/docs/plans/2026-05-20-fts5-lexical-recall.md +0 -1088
  65. package/docs/plans/2026-05-20-recall-daemon-wedge-fix.md +0 -662
  66. package/docs/plans/2026-05-20-recall-hook-design.md +0 -131
  67. package/docs/plans/2026-05-20-recall-hook-implementation.md +0 -1222
  68. package/docs/plans/desktop-product.md +0 -69
  69. package/docs/plans/factstore-design.md +0 -236
  70. package/logs/CHANGELOG/CHANGELOG-2026.md +0 -1389
  71. package/logs/CHANGELOG/CHANGELOG.md +0 -337
  72. package/migrations/000_initial_schema.sql +0 -174
  73. package/migrations/001_entity_type_rename.sql +0 -17
  74. package/migrations/002_adapter_state_extend.sql +0 -12
  75. package/migrations/003_session_embeddings.sql +0 -11
  76. package/migrations/004_facts.sql +0 -46
  77. package/migrations/005_sources.sql +0 -31
  78. package/migrations/006_providers.sql +0 -33
  79. package/migrations/007_source_tokens.sql +0 -17
  80. package/migrations/008_fts_rebuild.sql +0 -9
  81. package/migrations/009_session_embedding_chunks.sql +0 -46
  82. package/migrations/010_sources_opencode.sql +0 -30
  83. package/migrations/011_sources_hermes_agent.sql +0 -30
  84. package/migrations/012_sources_aider.sql +0 -30
  85. package/migrations/013_adapter_state_failure_count.sql +0 -12
  86. package/plugin-hermes-agent/README.md +0 -49
  87. package/plugin-hermes-agent/__init__.py +0 -75
  88. package/plugin-hermes-agent/plugin.yaml +0 -15
  89. package/scripts/backfill-citations.mjs +0 -0
  90. package/scripts/build-codex-plugin.mjs +0 -61
  91. package/scripts/deepseek-probe.mjs +0 -67
  92. package/scripts/extract-triples.mjs +0 -207
  93. package/scripts/longmemeval/embedding-cache.ts +0 -77
  94. package/scripts/longmemeval/fetch-dataset.sh +0 -25
  95. package/scripts/longmemeval/run-harness.ts +0 -315
  96. package/scripts/longmemeval/scorer.ts +0 -99
  97. package/scripts/longmemeval/tsconfig.json +0 -9
  98. package/scripts/longmemeval/types.ts +0 -35
  99. package/scripts/nlm-daily-digest.py +0 -239
  100. package/scripts/nlm-daily-digest.sh +0 -28
  101. package/src/cli/classify-parity.ts +0 -257
  102. package/src/cli/launchctl-helpers.ts +0 -49
  103. package/src/cli/nlm.ts +0 -885
  104. package/src/core/actions/actions-log.ts +0 -118
  105. package/src/core/actions/overlay.ts +0 -117
  106. package/src/core/adapters/aider.ts +0 -205
  107. package/src/core/adapters/claude-code.ts +0 -293
  108. package/src/core/adapters/common.ts +0 -54
  109. package/src/core/adapters/from-source.ts +0 -57
  110. package/src/core/adapters/hermes-agent.ts +0 -240
  111. package/src/core/adapters/hermes.ts +0 -277
  112. package/src/core/adapters/jsonl-generic.ts +0 -208
  113. package/src/core/adapters/opencode.ts +0 -281
  114. package/src/core/adapters/pi.ts +0 -264
  115. package/src/core/classifier/prompt.ts +0 -200
  116. package/src/core/dataset/build-dataset.ts +0 -463
  117. package/src/core/embedding/chunk-body.ts +0 -76
  118. package/src/core/embedding/embed-backfill.ts +0 -210
  119. package/src/core/embedding/embed-normalize.ts +0 -135
  120. package/src/core/facts/backfill-facts.ts +0 -254
  121. package/src/core/facts/extract-facts.ts +0 -50
  122. package/src/core/hook/citation-detect.ts +0 -124
  123. package/src/core/hook/cite-memo.ts +0 -68
  124. package/src/core/hook/claude-settings.ts +0 -166
  125. package/src/core/hook/gate.ts +0 -25
  126. package/src/core/hook/hook-log.ts +0 -41
  127. package/src/core/hook/memo-sweep.ts +0 -164
  128. package/src/core/hook/memo.ts +0 -67
  129. package/src/core/hook/pointer-block.ts +0 -26
  130. package/src/core/hook/select.ts +0 -32
  131. package/src/core/hook/transcript.ts +0 -121
  132. package/src/core/ingest/ingest-session.ts +0 -111
  133. package/src/core/providers/provider-models.ts +0 -100
  134. package/src/core/providers/provider-registry.ts +0 -196
  135. package/src/core/recall/citation-log.ts +0 -108
  136. package/src/core/recall/filter.ts +0 -27
  137. package/src/core/recall/index.ts +0 -6
  138. package/src/core/recall/match-fields.ts +0 -40
  139. package/src/core/recall/query-log.ts +0 -149
  140. package/src/core/recall/query-shape.ts +0 -66
  141. package/src/core/recall/recall-service.ts +0 -320
  142. package/src/core/recall/recent-log.ts +0 -59
  143. package/src/core/recall/tokenize.ts +0 -18
  144. package/src/core/recall/useful-scan.ts +0 -336
  145. package/src/core/recall-facts/fact-query-log.ts +0 -150
  146. package/src/core/recall-facts/fact-recall-service.ts +0 -327
  147. package/src/core/scheduler/scan-once.ts +0 -142
  148. package/src/core/scheduler/scheduler.ts +0 -225
  149. package/src/core/sources/source-registry.ts +0 -260
  150. package/src/core/storage/db-restore.ts +0 -133
  151. package/src/core/storage/live-status.ts +0 -45
  152. package/src/core/storage/migrate.ts +0 -72
  153. package/src/core/storage/sqlite-fact-store.ts +0 -304
  154. package/src/core/storage/sqlite-session-store.ts +0 -765
  155. package/src/hook/prompt-recall-hook.ts +0 -174
  156. package/src/hook/session-end-hook.ts +0 -81
  157. package/src/hook/session-start-hook.ts +0 -165
  158. package/src/hook/stop-hook.ts +0 -236
  159. package/src/http/app.ts +0 -1137
  160. package/src/install/claude-code.ts +0 -128
  161. package/src/install/codex.ts +0 -367
  162. package/src/install/hermes-agent.ts +0 -76
  163. package/src/install/hermes.ts +0 -78
  164. package/src/install/ollama.ts +0 -211
  165. package/src/install/setup.ts +0 -368
  166. package/src/llm/classifier-box.ts +0 -64
  167. package/src/llm/deepseek-client.ts +0 -150
  168. package/src/llm/env-autoload.ts +0 -55
  169. package/src/llm/ollama-client.ts +0 -189
  170. package/src/mcp/server.ts +0 -534
  171. package/src/ports/fact-store.ts +0 -102
  172. package/src/ports/llm-client.ts +0 -52
  173. package/src/ports/logger.ts +0 -16
  174. package/src/ports/session-store.ts +0 -45
  175. package/src/ports/transcript-adapter.ts +0 -55
  176. package/src/shared/types.ts +0 -145
  177. package/src/ui/App.tsx +0 -58
  178. package/src/ui/components/PromoteOpenButton.tsx +0 -65
  179. package/src/ui/components/SessionDrawer.tsx +0 -136
  180. package/src/ui/components/SideNav.tsx +0 -162
  181. package/src/ui/components/Skeleton.tsx +0 -107
  182. package/src/ui/index.html +0 -13
  183. package/src/ui/lib/actions.ts +0 -30
  184. package/src/ui/lib/api.ts +0 -92
  185. package/src/ui/lib/dataset.ts +0 -141
  186. package/src/ui/lib/registries.ts +0 -155
  187. package/src/ui/lib/view-settings.ts +0 -41
  188. package/src/ui/main.tsx +0 -15
  189. package/src/ui/pages/Live.tsx +0 -229
  190. package/src/ui/pages/Pulse.tsx +0 -415
  191. package/src/ui/pages/Recall.tsx +0 -190
  192. package/src/ui/pages/River.tsx +0 -308
  193. package/src/ui/pages/Search.tsx +0 -93
  194. package/src/ui/pages/Stub.tsx +0 -9
  195. package/src/ui/pages/Thread.tsx +0 -262
  196. package/src/ui/pages/settings/Classifier.tsx +0 -227
  197. package/src/ui/pages/settings/Data.tsx +0 -190
  198. package/src/ui/pages/settings/Index.tsx +0 -65
  199. package/src/ui/pages/settings/Labels.tsx +0 -224
  200. package/src/ui/pages/settings/Providers.tsx +0 -305
  201. package/src/ui/pages/settings/SettingsSubnav.tsx +0 -28
  202. package/src/ui/pages/settings/Sources.tsx +0 -326
  203. package/src/ui/pages/settings/Views.tsx +0 -96
  204. package/src/ui/styles.css +0 -1766
  205. package/src/ui/tsconfig.json +0 -21
  206. package/src/ui/vite.config.ts +0 -19
  207. package/tests/fixtures/claude_code/short_session.jsonl +0 -2
  208. package/tests/fixtures/claude_code/standard_iso.jsonl +0 -4
  209. package/tests/fixtures/claude_code/tool_heavy.jsonl +0 -8
  210. package/tests/fixtures/claude_code/with_subagent.jsonl +0 -7
  211. package/tests/fixtures/facts.ts +0 -17
  212. package/tests/fixtures/golden-corpus.ts +0 -85
  213. package/tests/fixtures/hermes/paired_request_dump.json +0 -24
  214. package/tests/fixtures/hermes/paired_session.json +0 -23
  215. package/tests/fixtures/hermes/request_dump.json +0 -28
  216. package/tests/fixtures/hermes/session_iso.json +0 -38
  217. package/tests/fixtures/hermes/session_unix.json +0 -38
  218. package/tests/fixtures/hermes/system_only.json +0 -18
  219. package/tests/fixtures/pi/error-connection-abort.jsonl +0 -8
  220. package/tests/fixtures/pi/short-successful.jsonl +0 -5
  221. package/tests/fixtures/pi/with-custom-message.jsonl +0 -6
  222. package/tests/fixtures/sessions.ts +0 -22
  223. package/tests/integration/backfill-facts.test.ts +0 -362
  224. package/tests/integration/citation-explicit.test.ts +0 -111
  225. package/tests/integration/cite-event.test.ts +0 -169
  226. package/tests/integration/cite-memo.test.ts +0 -87
  227. package/tests/integration/db-restore.test.ts +0 -153
  228. package/tests/integration/embed-backfill.test.ts +0 -176
  229. package/tests/integration/fact-supersedence.test.ts +0 -313
  230. package/tests/integration/fts-index.test.ts +0 -60
  231. package/tests/integration/getbyids-sqlite.test.ts +0 -60
  232. package/tests/integration/hermes-agent-hooks.test.ts +0 -248
  233. package/tests/integration/hook-claude-settings.test.ts +0 -205
  234. package/tests/integration/hook-log.test.ts +0 -54
  235. package/tests/integration/hook-memo.test.ts +0 -68
  236. package/tests/integration/hook-pre-compact.test.ts +0 -105
  237. package/tests/integration/hook-subagent-start.test.ts +0 -102
  238. package/tests/integration/http.test.ts +0 -401
  239. package/tests/integration/keyword-search-fts.test.ts +0 -66
  240. package/tests/integration/mcp-recall-logging.test.ts +0 -88
  241. package/tests/integration/mcp.test.ts +0 -248
  242. package/tests/integration/memo-sweep.test.ts +0 -91
  243. package/tests/integration/prompt-recall-hook.test.ts +0 -88
  244. package/tests/integration/provider-registry.test.ts +0 -107
  245. package/tests/integration/recall-golden.test.ts +0 -59
  246. package/tests/integration/recall-sqlite.test.ts +0 -169
  247. package/tests/integration/scheduler.test.ts +0 -391
  248. package/tests/integration/session-end-hook.test.ts +0 -48
  249. package/tests/integration/session-start-hook.test.ts +0 -126
  250. package/tests/integration/source-registry.test.ts +0 -120
  251. package/tests/integration/sqlite-fact-store.test.ts +0 -346
  252. package/tests/integration/stop-hook.test.ts +0 -560
  253. package/tests/integration/wal-checkpoint.test.ts +0 -49
  254. package/tests/unit/cli/launchctl-helpers.test.ts +0 -60
  255. package/tests/unit/core/adapters/aider.test.ts +0 -230
  256. package/tests/unit/core/adapters/claude-code.test.ts +0 -118
  257. package/tests/unit/core/adapters/hermes-agent.test.ts +0 -329
  258. package/tests/unit/core/adapters/hermes.test.ts +0 -81
  259. package/tests/unit/core/adapters/jsonl-generic.test.ts +0 -142
  260. package/tests/unit/core/adapters/opencode.test.ts +0 -354
  261. package/tests/unit/core/adapters/pi.test.ts +0 -110
  262. package/tests/unit/core/classifier/prompt.test.ts +0 -126
  263. package/tests/unit/core/embedding/chunk-body.test.ts +0 -100
  264. package/tests/unit/core/facts/extract-facts.test.ts +0 -117
  265. package/tests/unit/core/filter.test.ts +0 -40
  266. package/tests/unit/core/hook/citation-detect-cite-session.test.ts +0 -96
  267. package/tests/unit/core/hook/citation-detect.test.ts +0 -124
  268. package/tests/unit/core/hook/gate.test.ts +0 -29
  269. package/tests/unit/core/hook/pointer-block.test.ts +0 -22
  270. package/tests/unit/core/hook/select.test.ts +0 -66
  271. package/tests/unit/core/match-fields.test.ts +0 -39
  272. package/tests/unit/core/mcp-cite-session.test.ts +0 -51
  273. package/tests/unit/core/providers/provider-models.test.ts +0 -101
  274. package/tests/unit/core/query-shape.test.ts +0 -92
  275. package/tests/unit/core/recall-facts/fact-recall-service.test.ts +0 -258
  276. package/tests/unit/core/recall-service.test.ts +0 -200
  277. package/tests/unit/core/storage/live-status.test.ts +0 -54
  278. package/tests/unit/core/tokenize.test.ts +0 -32
  279. package/tests/unit/core/useful-scan.test.ts +0 -537
  280. package/tests/unit/llm/embed.test.ts +0 -93
  281. package/tests/unit/llm/ollama-client.test.ts +0 -124
  282. package/tests/unit/scripts/longmemeval-scorer.test.ts +0 -114
  283. package/tsconfig.json +0 -31
  284. package/tsconfig.test.json +0 -11
  285. package/vitest.config.ts +0 -22
@@ -1,150 +0,0 @@
1
- /**
2
- * DeepSeekClient — LLMClient backed by DeepSeek's OpenAI-compatible chat API.
3
- *
4
- * Use case (per Python notes confirmed 2026-05-07 / 2026-05-13):
5
- * • v4-flash handles inputs up to ~60K chars reliably; we cap at 30K to
6
- * stay well inside the deterministic zone.
7
- * • ~$0.002/session at typical sizes — full backfill of ~1,200 sessions
8
- * ≈ $2.50.
9
- * • Strong extraction quality (12+ entities, accurate decisions,
10
- * 0.9 confidence) where phi4-mini struggles or times out.
11
- *
12
- * Same prompt module as OllamaClient — only the transport differs. Same
13
- * error semantics: LLMUnreachableError for network/HTTP, ClassifierSchemaError
14
- * for unparseable / shape-wrong output. Reads DEEPSEEK_API_KEY at construct
15
- * time unless an explicit key is passed.
16
- *
17
- * Embedding is not supported by DeepSeek's API — `embed()` throws. Wire a
18
- * separate embedder (OllamaClient) for semantic recall.
19
- */
20
-
21
- import type {
22
- ClassifyResult,
23
- EmbedResult,
24
- EmbeddingKind,
25
- LLMClient,
26
- } from "@ports/llm-client.js";
27
- import { LLMUnreachableError } from "@ports/llm-client.js";
28
- import {
29
- CLASSIFIER_SYSTEM_PROMPT,
30
- buildUserPrompt,
31
- coerceClassifyResult,
32
- stripJsonFences,
33
- validateClassifierJson,
34
- } from "@core/classifier/prompt.js";
35
- import { ClassifierSchemaError } from "./ollama-client.js";
36
-
37
- export type FetchImpl = typeof fetch;
38
-
39
- export interface DeepSeekClientOptions {
40
- readonly apiKey?: string;
41
- readonly baseUrl?: string;
42
- readonly classifyModel?: string;
43
- readonly classifyTimeoutMs?: number;
44
- readonly maxTranscriptChars?: number;
45
- readonly fetchImpl?: FetchImpl;
46
- }
47
-
48
- interface ChatResponse {
49
- readonly choices?: ReadonlyArray<{ readonly message?: { readonly content?: string } }>;
50
- }
51
-
52
- export class DeepSeekClient implements LLMClient {
53
- private readonly apiKey: string;
54
- private readonly baseUrl: string;
55
- private readonly classifyModel: string;
56
- private readonly classifyTimeoutMs: number;
57
- private readonly maxTranscriptChars: number;
58
- private readonly fetchImpl: FetchImpl;
59
-
60
- constructor(opts: DeepSeekClientOptions = {}) {
61
- const key = opts.apiKey ?? process.env["DEEPSEEK_API_KEY"];
62
- if (!key) {
63
- throw new Error(
64
- "DEEPSEEK_API_KEY not set. Export it, place it in ~/.nlm/.env, or pass apiKey explicitly.",
65
- );
66
- }
67
- this.apiKey = key;
68
- this.baseUrl = (opts.baseUrl ?? "https://api.deepseek.com/v1").replace(/\/+$/, "");
69
- this.classifyModel = opts.classifyModel ?? "deepseek-v4-flash";
70
- this.classifyTimeoutMs = opts.classifyTimeoutMs ?? 180_000;
71
- this.maxTranscriptChars = opts.maxTranscriptChars ?? 30_000;
72
- this.fetchImpl = opts.fetchImpl ?? fetch;
73
- }
74
-
75
- async embed(_text: string, _kind: EmbeddingKind): Promise<EmbedResult> {
76
- throw new Error(
77
- "DeepSeekClient.embed not supported — DeepSeek's API has no embeddings endpoint. Wire OllamaClient for embeddings.",
78
- );
79
- }
80
-
81
- async classify(transcript: string, priorContext: string = ""): Promise<ClassifyResult> {
82
- const controller = new AbortController();
83
- const timer = setTimeout(() => controller.abort(), this.classifyTimeoutMs);
84
- try {
85
- // DeepSeek's reliable zone is ≤30K, wider than the prompt module's
86
- // 15K default. We pre-truncate to our wider cap to feed the model more
87
- // context than Ollama can handle, then buildUserPrompt's own truncation
88
- // is a no-op.
89
- const sized =
90
- transcript.length <= this.maxTranscriptChars
91
- ? transcript
92
- : transcript.slice(0, this.maxTranscriptChars / 2 - 40) +
93
- "\n\n[... transcript truncated; below is the closing portion ...]\n\n" +
94
- transcript.slice(transcript.length - this.maxTranscriptChars / 2 + 40);
95
- const userPrompt = buildUserPrompt(sized, priorContext);
96
-
97
- const res = await this.fetchImpl(`${this.baseUrl}/chat/completions`, {
98
- method: "POST",
99
- headers: {
100
- "Content-Type": "application/json",
101
- Authorization: `Bearer ${this.apiKey}`,
102
- },
103
- body: JSON.stringify({
104
- model: this.classifyModel,
105
- messages: [
106
- { role: "system", content: CLASSIFIER_SYSTEM_PROMPT },
107
- { role: "user", content: userPrompt },
108
- ],
109
- response_format: { type: "json_object" },
110
- temperature: 0.1,
111
- // 8192 covers reasoning + JSON output. deepseek-v4-flash is a
112
- // reasoning model — its hidden chain-of-thought counts against
113
- // max_tokens but never reaches `content`. At 1024 the reasoning
114
- // consumed the entire budget and the JSON output came back empty
115
- // (finish_reason: length, content: ""). Backfill verified ~72% of
116
- // real claude-code sessions hit that mode at 1024. Real-world
117
- // observed reasoning_tokens: ~900-1100; JSON body adds 200-1000
118
- // depending on facts/entity counts. 8192 leaves headroom.
119
- max_tokens: 8192,
120
- stream: false,
121
- }),
122
- signal: controller.signal,
123
- });
124
- if (!res.ok) {
125
- throw new LLMUnreachableError(
126
- "deepseek",
127
- `status ${res.status}: ${await res.text().catch(() => "")}`,
128
- );
129
- }
130
- const data = (await res.json()) as ChatResponse;
131
- const rawContent = data.choices?.[0]?.message?.content?.trim() ?? "";
132
- const content = stripJsonFences(rawContent);
133
- let parsed: unknown;
134
- try {
135
- parsed = JSON.parse(content);
136
- } catch {
137
- throw new ClassifierSchemaError("deepseek returned non-JSON content");
138
- }
139
- if (!validateClassifierJson(parsed)) {
140
- throw new ClassifierSchemaError("deepseek response missing required keys");
141
- }
142
- return coerceClassifyResult(parsed);
143
- } catch (e) {
144
- if (e instanceof LLMUnreachableError || e instanceof ClassifierSchemaError) throw e;
145
- throw new LLMUnreachableError("deepseek", e);
146
- } finally {
147
- clearTimeout(timer);
148
- }
149
- }
150
- }
@@ -1,55 +0,0 @@
1
- /**
2
- * Mirror of `classifier.autoload_env` from the Python daemon. Reads KEY=VALUE
3
- * pairs from a small list of likely .env locations into process.env. Existing
4
- * env vars are NOT overridden.
5
- *
6
- * Returns the list of paths actually loaded. Safe to call multiple times.
7
- */
8
-
9
- import { readFileSync, existsSync } from "node:fs";
10
- import { homedir } from "node:os";
11
- import { resolve } from "node:path";
12
-
13
- const DEFAULT_SEARCH_PATHS = [
14
- "~/.nlm/.env",
15
- "./.env",
16
- "../.env",
17
- "../../.env",
18
- ];
19
-
20
- function expandHome(p: string): string {
21
- if (p.startsWith("~/")) return resolve(homedir(), p.slice(2));
22
- return p;
23
- }
24
-
25
- export function autoloadEnv(extraPaths: ReadonlyArray<string> = []): string[] {
26
- const loaded: string[] = [];
27
- const paths = [...DEFAULT_SEARCH_PATHS, ...extraPaths];
28
- for (const raw of paths) {
29
- const path = expandHome(raw);
30
- if (!existsSync(path)) continue;
31
- try {
32
- const content = readFileSync(path, "utf8");
33
- for (const line of content.split("\n")) {
34
- const trimmed = line.trim();
35
- if (!trimmed || trimmed.startsWith("#") || !trimmed.includes("=")) continue;
36
- const eq = trimmed.indexOf("=");
37
- const key = trimmed.slice(0, eq).trim();
38
- let value = trimmed.slice(eq + 1).trim();
39
- if (
40
- (value.startsWith('"') && value.endsWith('"')) ||
41
- (value.startsWith("'") && value.endsWith("'"))
42
- ) {
43
- value = value.slice(1, -1);
44
- }
45
- if (key && process.env[key] === undefined) {
46
- process.env[key] = value;
47
- }
48
- }
49
- loaded.push(path);
50
- } catch {
51
- continue;
52
- }
53
- }
54
- return loaded;
55
- }
@@ -1,189 +0,0 @@
1
- /**
2
- * OllamaClient — LLMClient backed by a local Ollama HTTP endpoint.
3
- *
4
- * embed() → POST /api/embeddings (nomic-embed-text by default)
5
- * classify() → POST /api/chat (phi4-mini by default, format=json)
6
- *
7
- * Network/HTTP failure maps to LLMUnreachableError so RecallService can
8
- * degrade to keyword mode without crashing. Classification parse failures
9
- * throw ClassifierSchemaError (caller's choice whether to retry or route to inbox).
10
- *
11
- * Layering: this file lives in the outer ring. core/ depends on LLMClient,
12
- * not on this concrete class. Tests can substitute a fake client.
13
- */
14
-
15
- import type {
16
- ClassifyResult,
17
- EmbedResult,
18
- EmbeddingKind,
19
- LLMClient,
20
- } from "@ports/llm-client.js";
21
- import { LLMUnreachableError } from "@ports/llm-client.js";
22
- import {
23
- CLASSIFIER_SYSTEM_PROMPT,
24
- buildUserPrompt,
25
- coerceClassifyResult,
26
- stripJsonFences,
27
- validateClassifierJson,
28
- } from "@core/classifier/prompt.js";
29
-
30
- export type FetchImpl = typeof fetch;
31
-
32
- // Tried raising 8000 → 28000 on 2026-05-25 to recover the answer-tail of
33
- // long gold sessions (median LongMemEval-S gold body is 14,294 chars). The
34
- // Ollama /api/embeddings endpoint returned 500 on 54% of those large
35
- // inputs despite nomic-embed-text's nominal 8192-token context — semantic
36
- // R@5 collapsed from 87.2% → 15.8%. Reverted. Real fix is chunk + max-pool
37
- // (each body split into ≤8K-char chunks, store all vectors, score against
38
- // max cosine at query time) so coverage doesn't depend on a single embed
39
- // call. Filed as #174.
40
- const MAX_EMBED_CHARS = 8_000;
41
-
42
- const EMBED_PREFIXES: Record<EmbeddingKind, string> = {
43
- query: "search_query: ",
44
- document: "search_document: ",
45
- };
46
-
47
- export function l2Normalize(vec: Float32Array): Float32Array {
48
- let sumSq = 0;
49
- for (let i = 0; i < vec.length; i++) {
50
- const v = vec[i] ?? 0;
51
- sumSq += v * v;
52
- }
53
- if (sumSq === 0) return vec;
54
- const norm = Math.sqrt(sumSq);
55
- const out = new Float32Array(vec.length);
56
- for (let i = 0; i < vec.length; i++) {
57
- out[i] = (vec[i] ?? 0) / norm;
58
- }
59
- return out;
60
- }
61
-
62
- export interface OllamaClientOptions {
63
- readonly baseUrl?: string;
64
- readonly embedModel?: string;
65
- readonly classifyModel?: string;
66
- readonly timeoutMs?: number;
67
- readonly classifyTimeoutMs?: number;
68
- /** Inject a fake fetch for tests. Defaults to global fetch. */
69
- readonly fetchImpl?: FetchImpl;
70
- }
71
-
72
- interface EmbeddingsResponse {
73
- readonly embedding?: ReadonlyArray<number>;
74
- }
75
-
76
- interface ChatResponse {
77
- readonly message?: { readonly content?: string };
78
- }
79
-
80
- export class OllamaClient implements LLMClient {
81
- private readonly baseUrl: string;
82
- private readonly embedModel: string;
83
- private readonly classifyModel: string;
84
- private readonly timeoutMs: number;
85
- private readonly classifyTimeoutMs: number;
86
- private readonly fetchImpl: FetchImpl;
87
-
88
- constructor(opts: OllamaClientOptions = {}) {
89
- this.baseUrl = (opts.baseUrl ?? "http://localhost:11434").replace(/\/+$/, "");
90
- this.embedModel = opts.embedModel ?? "nomic-embed-text";
91
- this.classifyModel = opts.classifyModel ?? "phi4-mini:latest";
92
- this.timeoutMs = opts.timeoutMs ?? 10_000;
93
- this.classifyTimeoutMs = opts.classifyTimeoutMs ?? 180_000;
94
- this.fetchImpl = opts.fetchImpl ?? fetch;
95
- }
96
-
97
- async embed(text: string, kind: EmbeddingKind): Promise<EmbedResult> {
98
- // nomic-embed-text v1.5 is an asymmetric retrieval model. The
99
- // search_query:/search_document: prefix is part of the training
100
- // contract; omitting it or using the wrong one degrades retrieval
101
- // quality measurably. MAX_EMBED_CHARS matches the Python ceiling.
102
- const truncated = text.slice(0, MAX_EMBED_CHARS);
103
- const prompt = `${EMBED_PREFIXES[kind]}${truncated}`;
104
-
105
- const controller = new AbortController();
106
- const timer = setTimeout(() => controller.abort(), this.timeoutMs);
107
- try {
108
- const res = await this.fetchImpl(`${this.baseUrl}/api/embeddings`, {
109
- method: "POST",
110
- headers: { "Content-Type": "application/json" },
111
- body: JSON.stringify({ model: this.embedModel, prompt }),
112
- signal: controller.signal,
113
- });
114
- if (!res.ok) {
115
- throw new LLMUnreachableError("ollama", `status ${res.status}`);
116
- }
117
- const data = (await res.json()) as EmbeddingsResponse;
118
- if (!data.embedding || data.embedding.length === 0) {
119
- throw new LLMUnreachableError("ollama", "empty embedding");
120
- }
121
- const raw = new Float32Array(data.embedding);
122
- return { vector: l2Normalize(raw), model: this.embedModel };
123
- } catch (e) {
124
- if (e instanceof LLMUnreachableError) throw e;
125
- throw new LLMUnreachableError("ollama", e);
126
- } finally {
127
- clearTimeout(timer);
128
- }
129
- }
130
-
131
- /**
132
- * Send a transcript through the Ollama classifier with the shared system
133
- * prompt. Returns a ClassifyResult on success, or throws on network failure
134
- * (LLMUnreachableError) or schema-invalid output (ClassifierSchemaError). The Python
135
- * counterpart returned None on parse failure; we throw a typed error so
136
- * callers explicitly handle retry / inbox routing rather than swallowing
137
- * silent nulls.
138
- */
139
- async classify(transcript: string, priorContext: string = ""): Promise<ClassifyResult> {
140
- const controller = new AbortController();
141
- const timer = setTimeout(() => controller.abort(), this.classifyTimeoutMs);
142
- try {
143
- const userPrompt = buildUserPrompt(transcript, priorContext);
144
- const res = await this.fetchImpl(`${this.baseUrl}/api/chat`, {
145
- method: "POST",
146
- headers: { "Content-Type": "application/json" },
147
- body: JSON.stringify({
148
- model: this.classifyModel,
149
- messages: [
150
- { role: "system", content: CLASSIFIER_SYSTEM_PROMPT },
151
- { role: "user", content: userPrompt },
152
- ],
153
- stream: false,
154
- format: "json",
155
- options: { temperature: 0.1 },
156
- }),
157
- signal: controller.signal,
158
- });
159
- if (!res.ok) {
160
- throw new LLMUnreachableError("ollama", `status ${res.status}`);
161
- }
162
- const data = (await res.json()) as ChatResponse;
163
- const rawContent = data.message?.content?.trim() ?? "";
164
- const content = stripJsonFences(rawContent);
165
- let parsed: unknown;
166
- try {
167
- parsed = JSON.parse(content);
168
- } catch {
169
- throw new ClassifierSchemaError("ollama returned non-JSON content");
170
- }
171
- if (!validateClassifierJson(parsed)) {
172
- throw new ClassifierSchemaError("ollama response missing required keys");
173
- }
174
- return coerceClassifyResult(parsed);
175
- } catch (e) {
176
- if (e instanceof LLMUnreachableError || e instanceof ClassifierSchemaError) throw e;
177
- throw new LLMUnreachableError("ollama", e);
178
- } finally {
179
- clearTimeout(timer);
180
- }
181
- }
182
- }
183
-
184
- export class ClassifierSchemaError extends Error {
185
- constructor(message: string) {
186
- super(message);
187
- this.name = "ClassifierSchemaError";
188
- }
189
- }