nlm-memory 0.4.2 → 0.5.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (285) hide show
  1. package/README.md +72 -34
  2. package/dist/cli/nlm.js +223 -33
  3. package/dist/cli/nlm.js.map +1 -1
  4. package/dist/core/adapters/cursor.d.ts +45 -0
  5. package/dist/core/adapters/cursor.js +397 -0
  6. package/dist/core/adapters/cursor.js.map +1 -0
  7. package/dist/core/adapters/from-source.js +10 -0
  8. package/dist/core/adapters/from-source.js.map +1 -1
  9. package/dist/core/adapters/windsurf.d.ts +44 -0
  10. package/dist/core/adapters/windsurf.js +299 -0
  11. package/dist/core/adapters/windsurf.js.map +1 -0
  12. package/dist/core/hook/claude-settings.d.ts +12 -5
  13. package/dist/core/hook/claude-settings.js +21 -6
  14. package/dist/core/hook/claude-settings.js.map +1 -1
  15. package/dist/core/sources/source-registry.d.ts +1 -1
  16. package/dist/core/sources/source-registry.js +18 -0
  17. package/dist/core/sources/source-registry.js.map +1 -1
  18. package/dist/core/storage/sqlite-session-store.d.ts +2 -0
  19. package/dist/core/storage/sqlite-session-store.js +38 -2
  20. package/dist/core/storage/sqlite-session-store.js.map +1 -1
  21. package/dist/hook/hook-auth.d.ts +13 -0
  22. package/dist/hook/hook-auth.js +19 -0
  23. package/dist/hook/hook-auth.js.map +1 -0
  24. package/dist/hook/prompt-recall-hook.js +7 -1
  25. package/dist/hook/prompt-recall-hook.js.map +1 -1
  26. package/dist/hook/session-start-hook.js +4 -1
  27. package/dist/hook/session-start-hook.js.map +1 -1
  28. package/dist/hook/stop-hook.js +4 -1
  29. package/dist/hook/stop-hook.js.map +1 -1
  30. package/dist/http/app.d.ts +2 -0
  31. package/dist/http/app.js +76 -1
  32. package/dist/http/app.js.map +1 -1
  33. package/dist/install/claude-code.js +1 -1
  34. package/dist/install/claude-code.js.map +1 -1
  35. package/dist/install/cursor.d.ts +25 -0
  36. package/dist/install/cursor.js +43 -0
  37. package/dist/install/cursor.js.map +1 -0
  38. package/dist/install/nlm-dir-perms.d.ts +19 -0
  39. package/dist/install/nlm-dir-perms.js +43 -0
  40. package/dist/install/nlm-dir-perms.js.map +1 -0
  41. package/dist/install/ollama.d.ts +18 -1
  42. package/dist/install/ollama.js +62 -7
  43. package/dist/install/ollama.js.map +1 -1
  44. package/dist/install/setup.d.ts +4 -0
  45. package/dist/install/setup.js +141 -18
  46. package/dist/install/setup.js.map +1 -1
  47. package/dist/install/windsurf.d.ts +25 -0
  48. package/dist/install/windsurf.js +43 -0
  49. package/dist/install/windsurf.js.map +1 -0
  50. package/dist/mcp/server.js +20 -1
  51. package/dist/mcp/server.js.map +1 -1
  52. package/dist/shared/types.d.ts +4 -0
  53. package/dist/ui/assets/{index-BA6IpU8g.css → index-Beo8psd-.css} +1 -1
  54. package/dist/ui/assets/index-CSPTTeeM.js +69 -0
  55. package/dist/ui/index.html +2 -2
  56. package/package.json +26 -1
  57. package/plugin/scripts/prompt-recall-hook.mjs +55 -4
  58. package/plugin/scripts/stop-hook.mjs +57 -6
  59. package/.agents/plugins/marketplace.json +0 -20
  60. package/.github/workflows/ci.yml +0 -30
  61. package/dist/ui/assets/index-B_qIVV0k.js +0 -69
  62. package/docs/methodology/re-derivation-rate.md +0 -112
  63. package/docs/methodology/useful-hit-rate.md +0 -79
  64. package/docs/plans/2026-05-20-fts5-lexical-recall.md +0 -1088
  65. package/docs/plans/2026-05-20-recall-daemon-wedge-fix.md +0 -662
  66. package/docs/plans/2026-05-20-recall-hook-design.md +0 -131
  67. package/docs/plans/2026-05-20-recall-hook-implementation.md +0 -1222
  68. package/docs/plans/desktop-product.md +0 -69
  69. package/docs/plans/factstore-design.md +0 -236
  70. package/logs/CHANGELOG/CHANGELOG-2026.md +0 -1389
  71. package/logs/CHANGELOG/CHANGELOG.md +0 -337
  72. package/migrations/000_initial_schema.sql +0 -174
  73. package/migrations/001_entity_type_rename.sql +0 -17
  74. package/migrations/002_adapter_state_extend.sql +0 -12
  75. package/migrations/003_session_embeddings.sql +0 -11
  76. package/migrations/004_facts.sql +0 -46
  77. package/migrations/005_sources.sql +0 -31
  78. package/migrations/006_providers.sql +0 -33
  79. package/migrations/007_source_tokens.sql +0 -17
  80. package/migrations/008_fts_rebuild.sql +0 -9
  81. package/migrations/009_session_embedding_chunks.sql +0 -46
  82. package/migrations/010_sources_opencode.sql +0 -30
  83. package/migrations/011_sources_hermes_agent.sql +0 -30
  84. package/migrations/012_sources_aider.sql +0 -30
  85. package/migrations/013_adapter_state_failure_count.sql +0 -12
  86. package/plugin-hermes-agent/README.md +0 -49
  87. package/plugin-hermes-agent/__init__.py +0 -75
  88. package/plugin-hermes-agent/plugin.yaml +0 -15
  89. package/scripts/backfill-citations.mjs +0 -0
  90. package/scripts/build-codex-plugin.mjs +0 -61
  91. package/scripts/deepseek-probe.mjs +0 -67
  92. package/scripts/extract-triples.mjs +0 -207
  93. package/scripts/longmemeval/embedding-cache.ts +0 -77
  94. package/scripts/longmemeval/fetch-dataset.sh +0 -25
  95. package/scripts/longmemeval/run-harness.ts +0 -315
  96. package/scripts/longmemeval/scorer.ts +0 -99
  97. package/scripts/longmemeval/tsconfig.json +0 -9
  98. package/scripts/longmemeval/types.ts +0 -35
  99. package/scripts/nlm-daily-digest.py +0 -239
  100. package/scripts/nlm-daily-digest.sh +0 -28
  101. package/src/cli/classify-parity.ts +0 -257
  102. package/src/cli/launchctl-helpers.ts +0 -49
  103. package/src/cli/nlm.ts +0 -885
  104. package/src/core/actions/actions-log.ts +0 -118
  105. package/src/core/actions/overlay.ts +0 -117
  106. package/src/core/adapters/aider.ts +0 -205
  107. package/src/core/adapters/claude-code.ts +0 -293
  108. package/src/core/adapters/common.ts +0 -54
  109. package/src/core/adapters/from-source.ts +0 -57
  110. package/src/core/adapters/hermes-agent.ts +0 -240
  111. package/src/core/adapters/hermes.ts +0 -277
  112. package/src/core/adapters/jsonl-generic.ts +0 -208
  113. package/src/core/adapters/opencode.ts +0 -281
  114. package/src/core/adapters/pi.ts +0 -264
  115. package/src/core/classifier/prompt.ts +0 -200
  116. package/src/core/dataset/build-dataset.ts +0 -463
  117. package/src/core/embedding/chunk-body.ts +0 -76
  118. package/src/core/embedding/embed-backfill.ts +0 -210
  119. package/src/core/embedding/embed-normalize.ts +0 -135
  120. package/src/core/facts/backfill-facts.ts +0 -254
  121. package/src/core/facts/extract-facts.ts +0 -50
  122. package/src/core/hook/citation-detect.ts +0 -124
  123. package/src/core/hook/cite-memo.ts +0 -68
  124. package/src/core/hook/claude-settings.ts +0 -166
  125. package/src/core/hook/gate.ts +0 -25
  126. package/src/core/hook/hook-log.ts +0 -41
  127. package/src/core/hook/memo-sweep.ts +0 -164
  128. package/src/core/hook/memo.ts +0 -67
  129. package/src/core/hook/pointer-block.ts +0 -26
  130. package/src/core/hook/select.ts +0 -32
  131. package/src/core/hook/transcript.ts +0 -121
  132. package/src/core/ingest/ingest-session.ts +0 -111
  133. package/src/core/providers/provider-models.ts +0 -100
  134. package/src/core/providers/provider-registry.ts +0 -196
  135. package/src/core/recall/citation-log.ts +0 -108
  136. package/src/core/recall/filter.ts +0 -27
  137. package/src/core/recall/index.ts +0 -6
  138. package/src/core/recall/match-fields.ts +0 -40
  139. package/src/core/recall/query-log.ts +0 -149
  140. package/src/core/recall/query-shape.ts +0 -66
  141. package/src/core/recall/recall-service.ts +0 -320
  142. package/src/core/recall/recent-log.ts +0 -59
  143. package/src/core/recall/tokenize.ts +0 -18
  144. package/src/core/recall/useful-scan.ts +0 -336
  145. package/src/core/recall-facts/fact-query-log.ts +0 -150
  146. package/src/core/recall-facts/fact-recall-service.ts +0 -327
  147. package/src/core/scheduler/scan-once.ts +0 -142
  148. package/src/core/scheduler/scheduler.ts +0 -225
  149. package/src/core/sources/source-registry.ts +0 -260
  150. package/src/core/storage/db-restore.ts +0 -133
  151. package/src/core/storage/live-status.ts +0 -45
  152. package/src/core/storage/migrate.ts +0 -72
  153. package/src/core/storage/sqlite-fact-store.ts +0 -304
  154. package/src/core/storage/sqlite-session-store.ts +0 -765
  155. package/src/hook/prompt-recall-hook.ts +0 -174
  156. package/src/hook/session-end-hook.ts +0 -81
  157. package/src/hook/session-start-hook.ts +0 -165
  158. package/src/hook/stop-hook.ts +0 -236
  159. package/src/http/app.ts +0 -1137
  160. package/src/install/claude-code.ts +0 -128
  161. package/src/install/codex.ts +0 -367
  162. package/src/install/hermes-agent.ts +0 -76
  163. package/src/install/hermes.ts +0 -78
  164. package/src/install/ollama.ts +0 -211
  165. package/src/install/setup.ts +0 -368
  166. package/src/llm/classifier-box.ts +0 -64
  167. package/src/llm/deepseek-client.ts +0 -150
  168. package/src/llm/env-autoload.ts +0 -55
  169. package/src/llm/ollama-client.ts +0 -189
  170. package/src/mcp/server.ts +0 -534
  171. package/src/ports/fact-store.ts +0 -102
  172. package/src/ports/llm-client.ts +0 -52
  173. package/src/ports/logger.ts +0 -16
  174. package/src/ports/session-store.ts +0 -45
  175. package/src/ports/transcript-adapter.ts +0 -55
  176. package/src/shared/types.ts +0 -145
  177. package/src/ui/App.tsx +0 -58
  178. package/src/ui/components/PromoteOpenButton.tsx +0 -65
  179. package/src/ui/components/SessionDrawer.tsx +0 -136
  180. package/src/ui/components/SideNav.tsx +0 -162
  181. package/src/ui/components/Skeleton.tsx +0 -107
  182. package/src/ui/index.html +0 -13
  183. package/src/ui/lib/actions.ts +0 -30
  184. package/src/ui/lib/api.ts +0 -92
  185. package/src/ui/lib/dataset.ts +0 -141
  186. package/src/ui/lib/registries.ts +0 -155
  187. package/src/ui/lib/view-settings.ts +0 -41
  188. package/src/ui/main.tsx +0 -15
  189. package/src/ui/pages/Live.tsx +0 -229
  190. package/src/ui/pages/Pulse.tsx +0 -415
  191. package/src/ui/pages/Recall.tsx +0 -190
  192. package/src/ui/pages/River.tsx +0 -308
  193. package/src/ui/pages/Search.tsx +0 -93
  194. package/src/ui/pages/Stub.tsx +0 -9
  195. package/src/ui/pages/Thread.tsx +0 -262
  196. package/src/ui/pages/settings/Classifier.tsx +0 -227
  197. package/src/ui/pages/settings/Data.tsx +0 -190
  198. package/src/ui/pages/settings/Index.tsx +0 -65
  199. package/src/ui/pages/settings/Labels.tsx +0 -224
  200. package/src/ui/pages/settings/Providers.tsx +0 -305
  201. package/src/ui/pages/settings/SettingsSubnav.tsx +0 -28
  202. package/src/ui/pages/settings/Sources.tsx +0 -326
  203. package/src/ui/pages/settings/Views.tsx +0 -96
  204. package/src/ui/styles.css +0 -1766
  205. package/src/ui/tsconfig.json +0 -21
  206. package/src/ui/vite.config.ts +0 -19
  207. package/tests/fixtures/claude_code/short_session.jsonl +0 -2
  208. package/tests/fixtures/claude_code/standard_iso.jsonl +0 -4
  209. package/tests/fixtures/claude_code/tool_heavy.jsonl +0 -8
  210. package/tests/fixtures/claude_code/with_subagent.jsonl +0 -7
  211. package/tests/fixtures/facts.ts +0 -17
  212. package/tests/fixtures/golden-corpus.ts +0 -85
  213. package/tests/fixtures/hermes/paired_request_dump.json +0 -24
  214. package/tests/fixtures/hermes/paired_session.json +0 -23
  215. package/tests/fixtures/hermes/request_dump.json +0 -28
  216. package/tests/fixtures/hermes/session_iso.json +0 -38
  217. package/tests/fixtures/hermes/session_unix.json +0 -38
  218. package/tests/fixtures/hermes/system_only.json +0 -18
  219. package/tests/fixtures/pi/error-connection-abort.jsonl +0 -8
  220. package/tests/fixtures/pi/short-successful.jsonl +0 -5
  221. package/tests/fixtures/pi/with-custom-message.jsonl +0 -6
  222. package/tests/fixtures/sessions.ts +0 -22
  223. package/tests/integration/backfill-facts.test.ts +0 -362
  224. package/tests/integration/citation-explicit.test.ts +0 -111
  225. package/tests/integration/cite-event.test.ts +0 -169
  226. package/tests/integration/cite-memo.test.ts +0 -87
  227. package/tests/integration/db-restore.test.ts +0 -153
  228. package/tests/integration/embed-backfill.test.ts +0 -176
  229. package/tests/integration/fact-supersedence.test.ts +0 -313
  230. package/tests/integration/fts-index.test.ts +0 -60
  231. package/tests/integration/getbyids-sqlite.test.ts +0 -60
  232. package/tests/integration/hermes-agent-hooks.test.ts +0 -248
  233. package/tests/integration/hook-claude-settings.test.ts +0 -205
  234. package/tests/integration/hook-log.test.ts +0 -54
  235. package/tests/integration/hook-memo.test.ts +0 -68
  236. package/tests/integration/hook-pre-compact.test.ts +0 -105
  237. package/tests/integration/hook-subagent-start.test.ts +0 -102
  238. package/tests/integration/http.test.ts +0 -401
  239. package/tests/integration/keyword-search-fts.test.ts +0 -66
  240. package/tests/integration/mcp-recall-logging.test.ts +0 -88
  241. package/tests/integration/mcp.test.ts +0 -248
  242. package/tests/integration/memo-sweep.test.ts +0 -91
  243. package/tests/integration/prompt-recall-hook.test.ts +0 -88
  244. package/tests/integration/provider-registry.test.ts +0 -107
  245. package/tests/integration/recall-golden.test.ts +0 -59
  246. package/tests/integration/recall-sqlite.test.ts +0 -169
  247. package/tests/integration/scheduler.test.ts +0 -391
  248. package/tests/integration/session-end-hook.test.ts +0 -48
  249. package/tests/integration/session-start-hook.test.ts +0 -126
  250. package/tests/integration/source-registry.test.ts +0 -120
  251. package/tests/integration/sqlite-fact-store.test.ts +0 -346
  252. package/tests/integration/stop-hook.test.ts +0 -560
  253. package/tests/integration/wal-checkpoint.test.ts +0 -49
  254. package/tests/unit/cli/launchctl-helpers.test.ts +0 -60
  255. package/tests/unit/core/adapters/aider.test.ts +0 -230
  256. package/tests/unit/core/adapters/claude-code.test.ts +0 -118
  257. package/tests/unit/core/adapters/hermes-agent.test.ts +0 -329
  258. package/tests/unit/core/adapters/hermes.test.ts +0 -81
  259. package/tests/unit/core/adapters/jsonl-generic.test.ts +0 -142
  260. package/tests/unit/core/adapters/opencode.test.ts +0 -354
  261. package/tests/unit/core/adapters/pi.test.ts +0 -110
  262. package/tests/unit/core/classifier/prompt.test.ts +0 -126
  263. package/tests/unit/core/embedding/chunk-body.test.ts +0 -100
  264. package/tests/unit/core/facts/extract-facts.test.ts +0 -117
  265. package/tests/unit/core/filter.test.ts +0 -40
  266. package/tests/unit/core/hook/citation-detect-cite-session.test.ts +0 -96
  267. package/tests/unit/core/hook/citation-detect.test.ts +0 -124
  268. package/tests/unit/core/hook/gate.test.ts +0 -29
  269. package/tests/unit/core/hook/pointer-block.test.ts +0 -22
  270. package/tests/unit/core/hook/select.test.ts +0 -66
  271. package/tests/unit/core/match-fields.test.ts +0 -39
  272. package/tests/unit/core/mcp-cite-session.test.ts +0 -51
  273. package/tests/unit/core/providers/provider-models.test.ts +0 -101
  274. package/tests/unit/core/query-shape.test.ts +0 -92
  275. package/tests/unit/core/recall-facts/fact-recall-service.test.ts +0 -258
  276. package/tests/unit/core/recall-service.test.ts +0 -200
  277. package/tests/unit/core/storage/live-status.test.ts +0 -54
  278. package/tests/unit/core/tokenize.test.ts +0 -32
  279. package/tests/unit/core/useful-scan.test.ts +0 -537
  280. package/tests/unit/llm/embed.test.ts +0 -93
  281. package/tests/unit/llm/ollama-client.test.ts +0 -124
  282. package/tests/unit/scripts/longmemeval-scorer.test.ts +0 -114
  283. package/tsconfig.json +0 -31
  284. package/tsconfig.test.json +0 -11
  285. package/vitest.config.ts +0 -22
@@ -1,537 +0,0 @@
1
- import { describe, expect, it } from "vitest";
2
- import { mkdirSync, writeFileSync } from "node:fs";
3
- import { join } from "node:path";
4
- import { tmpdir } from "node:os";
5
- import {
6
- isProbe,
7
- extractAssistantTurnsAfter,
8
- findMatchedId,
9
- scanUsefulHits,
10
- readUsefulHitRate,
11
- } from "../../../src/core/recall/useful-scan.js";
12
-
13
- // ── isProbe ──────────────────────────────────────────────────────────────────
14
-
15
- describe("isProbe", () => {
16
- it("returns true for probe patterns", () => {
17
- expect(isProbe("concurrency probe round 2")).toBe(true);
18
- expect(isProbe("test probe")).toBe(true);
19
- expect(isProbe("path test for the hook")).toBe(true);
20
- expect(isProbe("recall test")).toBe(true);
21
- expect(isProbe("smoke test run")).toBe(true);
22
- expect(isProbe("cutover validation")).toBe(true);
23
- });
24
-
25
- it("returns false for normal prompts", () => {
26
- expect(isProbe("what did we decide about pgvector")).toBe(false);
27
- expect(isProbe("how should we implement the recall hook")).toBe(false);
28
- expect(isProbe("review the PR")).toBe(false);
29
- });
30
-
31
- it("is case-insensitive", () => {
32
- expect(isProbe("SMOKE TEST")).toBe(true);
33
- expect(isProbe("Concurrency Probe")).toBe(true);
34
- });
35
- });
36
-
37
- // ── extractAssistantTurnsAfter ───────────────────────────────────────────────
38
-
39
- function makeTranscript(
40
- lines: Array<{ type: string; timestamp: string; content?: string | Array<Record<string, unknown>> }>,
41
- ): string {
42
- return lines
43
- .map((l) => {
44
- const msg =
45
- l.type === "assistant"
46
- ? {
47
- type: "assistant",
48
- timestamp: l.timestamp,
49
- message: { content: l.content ?? "" },
50
- }
51
- : { type: l.type, timestamp: l.timestamp };
52
- return JSON.stringify(msg);
53
- })
54
- .join("\n");
55
- }
56
-
57
- describe("extractAssistantTurnsAfter", () => {
58
- it("returns empty for a missing file", () => {
59
- expect(extractAssistantTurnsAfter("/tmp/nlm-nonexistent-transcript.jsonl", 0, 3)).toEqual([]);
60
- });
61
-
62
- it("returns empty when no assistant turns exist after the cutoff", () => {
63
- const dir = tmpdir();
64
- const path = join(dir, `transcript-past-${Date.now()}.jsonl`);
65
- writeFileSync(
66
- path,
67
- makeTranscript([
68
- { type: "user", timestamp: "2026-01-01T00:00:00.000Z" },
69
- { type: "assistant", timestamp: "2026-01-01T00:00:01.000Z", content: "answer" },
70
- ]),
71
- );
72
- // cutoff is after the assistant turn
73
- const cutoff = Date.parse("2026-01-01T00:00:02.000Z");
74
- expect(extractAssistantTurnsAfter(path, cutoff, 3)).toEqual([]);
75
- });
76
-
77
- it("returns up to `limit` assistant turns at or after the cutoff", () => {
78
- const dir = tmpdir();
79
- const path = join(dir, `transcript-limit-${Date.now()}.jsonl`);
80
- const ts = "2026-05-01T10:00:00.000Z";
81
- writeFileSync(
82
- path,
83
- makeTranscript([
84
- { type: "user", timestamp: "2026-05-01T09:59:59.000Z" },
85
- { type: "assistant", timestamp: ts, content: "turn-1" },
86
- { type: "user", timestamp: "2026-05-01T10:00:01.000Z" },
87
- { type: "assistant", timestamp: "2026-05-01T10:00:02.000Z", content: "turn-2" },
88
- { type: "user", timestamp: "2026-05-01T10:00:03.000Z" },
89
- { type: "assistant", timestamp: "2026-05-01T10:00:04.000Z", content: "turn-3" },
90
- { type: "user", timestamp: "2026-05-01T10:00:05.000Z" },
91
- { type: "assistant", timestamp: "2026-05-01T10:00:06.000Z", content: "turn-4" },
92
- ]),
93
- );
94
- const cutoff = Date.parse(ts);
95
- const turns = extractAssistantTurnsAfter(path, cutoff, 3);
96
- expect(turns).toHaveLength(3);
97
- expect(turns[0]).toContain("turn-1");
98
- expect(turns[1]).toContain("turn-2");
99
- expect(turns[2]).toContain("turn-3");
100
- });
101
-
102
- it("extracts text from content-array turns (text + tool_use)", () => {
103
- const dir = tmpdir();
104
- const path = join(dir, `transcript-blocks-${Date.now()}.jsonl`);
105
- const ts = "2026-05-01T10:00:00.000Z";
106
- const content: Array<Record<string, unknown>> = [
107
- { type: "text", text: "I looked it up." },
108
- { type: "tool_use", name: "mcp__nlm-memory__get_session", input: { id: "cc_sub_abc123" } },
109
- ];
110
- writeFileSync(
111
- path,
112
- JSON.stringify({ type: "assistant", timestamp: ts, message: { content } }) + "\n",
113
- );
114
- const turns = extractAssistantTurnsAfter(path, Date.parse(ts), 3);
115
- expect(turns).toHaveLength(1);
116
- expect(turns[0]).toContain("I looked it up.");
117
- expect(turns[0]).toContain("cc_sub_abc123");
118
- });
119
-
120
- it("skips malformed JSON lines without throwing", () => {
121
- const dir = tmpdir();
122
- const path = join(dir, `transcript-malformed-${Date.now()}.jsonl`);
123
- const ts = "2026-05-01T10:00:00.000Z";
124
- writeFileSync(
125
- path,
126
- "not json\n" +
127
- JSON.stringify({ type: "assistant", timestamp: ts, message: { content: "ok" } }) +
128
- "\n",
129
- );
130
- const turns = extractAssistantTurnsAfter(path, Date.parse(ts), 3);
131
- expect(turns).toHaveLength(1);
132
- expect(turns[0]).toContain("ok");
133
- });
134
- });
135
-
136
- // ── findMatchedId ────────────────────────────────────────────────────────────
137
-
138
- describe("findMatchedId", () => {
139
- it("returns the first matching ID", () => {
140
- expect(findMatchedId(["cc_sub_abc", "cc_sub_def"], ["context cc_sub_abc here"])).toBe(
141
- "cc_sub_abc",
142
- );
143
- });
144
-
145
- it("returns null when no ID appears", () => {
146
- expect(findMatchedId(["cc_sub_abc"], ["completely unrelated text"])).toBeNull();
147
- });
148
-
149
- it("matches IDs inside tool_use serialized JSON", () => {
150
- const turns = [JSON.stringify({ id: "cc_sub_xyz123" })];
151
- expect(findMatchedId(["cc_sub_xyz123"], turns)).toBe("cc_sub_xyz123");
152
- });
153
-
154
- it("returns null for empty ids list", () => {
155
- expect(findMatchedId([], ["some text"])).toBeNull();
156
- });
157
-
158
- it("returns null for empty turns list", () => {
159
- expect(findMatchedId(["cc_sub_abc"], [])).toBeNull();
160
- });
161
- });
162
-
163
- // ── scanUsefulHits ───────────────────────────────────────────────────────────
164
-
165
- function setupScanDirs(): { root: string; hookLogPath: string; usefulHitLogPath: string; transcriptsDir: string } {
166
- const root = join(tmpdir(), `nlm-scan-test-${Date.now()}-${Math.random().toString(36).slice(2)}`);
167
- mkdirSync(root, { recursive: true });
168
- const hookLogPath = join(root, "hook-log.jsonl");
169
- const usefulHitLogPath = join(root, "useful-hit-log.jsonl");
170
- const transcriptsDir = join(root, "projects");
171
- mkdirSync(transcriptsDir, { recursive: true });
172
- return { root, hookLogPath, usefulHitLogPath, transcriptsDir };
173
- }
174
-
175
- function writeTranscript(transcriptsDir: string, conversationId: string, content: string): void {
176
- const projectDir = join(transcriptsDir, "test-project");
177
- mkdirSync(projectDir, { recursive: true });
178
- writeFileSync(join(projectDir, `${conversationId}.jsonl`), content);
179
- }
180
-
181
- describe("scanUsefulHits", () => {
182
- it("returns zero totals when hook log is absent", async () => {
183
- const { root, hookLogPath, usefulHitLogPath, transcriptsDir } = setupScanDirs();
184
- const result = await scanUsefulHits({
185
- days: 1,
186
- hookLogPath,
187
- usefulHitLogPath,
188
- transcriptsDir,
189
- dryRun: true,
190
- });
191
- expect(result).toEqual({ total: 0, measurable: 0, useful: 0, appended: 0 });
192
- // suppress unused warning
193
- void root;
194
- });
195
-
196
- it("counts a useful hit when the ID appears in the next assistant turn", async () => {
197
- const { hookLogPath, usefulHitLogPath, transcriptsDir } = setupScanDirs();
198
- const convId = "test-conv-useful-hit";
199
- const hookTs = new Date().toISOString();
200
- const afterTs = new Date(Date.parse(hookTs) + 1000).toISOString();
201
-
202
- // Hook log entry with wouldInject
203
- writeFileSync(
204
- hookLogPath,
205
- JSON.stringify({
206
- ts: hookTs,
207
- conversationId: convId,
208
- promptPreview: "what did we decide about the schema",
209
- gate: "evaluate",
210
- hits: [{ id: "cc_sub_abc123def456", score: 1.2 }],
211
- wouldInject: ["cc_sub_abc123def456"],
212
- estTokens: 50,
213
- mode: "shadow",
214
- }) + "\n",
215
- );
216
-
217
- // Transcript with the ID appearing in the assistant turn after the hook
218
- writeTranscript(
219
- transcriptsDir,
220
- convId,
221
- JSON.stringify({ type: "user", timestamp: hookTs }) +
222
- "\n" +
223
- JSON.stringify({
224
- type: "assistant",
225
- timestamp: afterTs,
226
- message: { content: "Per cc_sub_abc123def456 we chose the new schema." },
227
- }) +
228
- "\n",
229
- );
230
-
231
- const result = await scanUsefulHits({
232
- days: 1,
233
- hookLogPath,
234
- usefulHitLogPath,
235
- transcriptsDir,
236
- });
237
-
238
- expect(result.total).toBe(1);
239
- expect(result.measurable).toBe(1);
240
- expect(result.useful).toBe(1);
241
- expect(result.appended).toBe(1);
242
- });
243
-
244
- it("records useful=false when the ID does not appear in subsequent turns", async () => {
245
- const { hookLogPath, usefulHitLogPath, transcriptsDir } = setupScanDirs();
246
- const convId = "test-conv-not-useful";
247
- const hookTs = new Date().toISOString();
248
- const afterTs = new Date(Date.parse(hookTs) + 1000).toISOString();
249
-
250
- writeFileSync(
251
- hookLogPath,
252
- JSON.stringify({
253
- ts: hookTs,
254
- conversationId: convId,
255
- promptPreview: "explain this code",
256
- gate: "evaluate",
257
- hits: [{ id: "cc_sub_zzz999", score: 0.8 }],
258
- wouldInject: ["cc_sub_zzz999"],
259
- estTokens: 30,
260
- mode: "shadow",
261
- }) + "\n",
262
- );
263
-
264
- writeTranscript(
265
- transcriptsDir,
266
- convId,
267
- JSON.stringify({ type: "user", timestamp: hookTs }) +
268
- "\n" +
269
- JSON.stringify({
270
- type: "assistant",
271
- timestamp: afterTs,
272
- message: { content: "Here is the explanation." },
273
- }) +
274
- "\n",
275
- );
276
-
277
- const result = await scanUsefulHits({
278
- days: 1,
279
- hookLogPath,
280
- usefulHitLogPath,
281
- transcriptsDir,
282
- });
283
-
284
- expect(result.useful).toBe(0);
285
- expect(result.measurable).toBe(1);
286
-
287
- // Verify the written entry has useful=false
288
- const { readFileSync } = await import("node:fs");
289
- const written = JSON.parse(readFileSync(usefulHitLogPath, "utf8").trim()) as Record<string, unknown>;
290
- expect(written["useful"]).toBe(false);
291
- expect(written["matchedId"]).toBeNull();
292
- });
293
-
294
- it("records useful=null when no transcript is found", async () => {
295
- const { hookLogPath, usefulHitLogPath, transcriptsDir } = setupScanDirs();
296
- const hookTs = new Date().toISOString();
297
-
298
- writeFileSync(
299
- hookLogPath,
300
- JSON.stringify({
301
- ts: hookTs,
302
- conversationId: "missing-conv-id-xyz",
303
- promptPreview: "what is the error",
304
- gate: "evaluate",
305
- hits: [{ id: "cc_sub_missing", score: 1.0 }],
306
- wouldInject: ["cc_sub_missing"],
307
- estTokens: 20,
308
- mode: "shadow",
309
- }) + "\n",
310
- );
311
-
312
- const result = await scanUsefulHits({
313
- days: 1,
314
- hookLogPath,
315
- usefulHitLogPath,
316
- transcriptsDir,
317
- });
318
-
319
- expect(result.measurable).toBe(0);
320
- expect(result.useful).toBe(0);
321
-
322
- const { readFileSync } = await import("node:fs");
323
- const written = JSON.parse(readFileSync(usefulHitLogPath, "utf8").trim()) as Record<string, unknown>;
324
- expect(written["useful"]).toBeNull();
325
- });
326
-
327
- it("skips probe entries", async () => {
328
- const { hookLogPath, usefulHitLogPath, transcriptsDir } = setupScanDirs();
329
- const hookTs = new Date().toISOString();
330
-
331
- writeFileSync(
332
- hookLogPath,
333
- JSON.stringify({
334
- ts: hookTs,
335
- conversationId: "probe-conv",
336
- promptPreview: "recall test round 3",
337
- gate: "evaluate",
338
- hits: [{ id: "cc_sub_probe", score: 1.0 }],
339
- wouldInject: ["cc_sub_probe"],
340
- estTokens: 10,
341
- mode: "shadow",
342
- }) + "\n",
343
- );
344
-
345
- const result = await scanUsefulHits({
346
- days: 1,
347
- hookLogPath,
348
- usefulHitLogPath,
349
- transcriptsDir,
350
- });
351
-
352
- expect(result.total).toBe(0);
353
- });
354
-
355
- it("skips entries with empty wouldInject", async () => {
356
- const { hookLogPath, usefulHitLogPath, transcriptsDir } = setupScanDirs();
357
- const hookTs = new Date().toISOString();
358
-
359
- writeFileSync(
360
- hookLogPath,
361
- JSON.stringify({
362
- ts: hookTs,
363
- conversationId: "conv-no-inject",
364
- promptPreview: "what is the status",
365
- gate: "generative",
366
- hits: [],
367
- wouldInject: [],
368
- estTokens: 0,
369
- mode: "shadow",
370
- }) + "\n",
371
- );
372
-
373
- const result = await scanUsefulHits({
374
- days: 1,
375
- hookLogPath,
376
- usefulHitLogPath,
377
- transcriptsDir,
378
- });
379
-
380
- expect(result.total).toBe(0);
381
- });
382
-
383
- it("skips stop-hook entries (kind field present)", async () => {
384
- const { hookLogPath, usefulHitLogPath, transcriptsDir } = setupScanDirs();
385
- const hookTs = new Date().toISOString();
386
-
387
- writeFileSync(
388
- hookLogPath,
389
- JSON.stringify({
390
- ts: hookTs,
391
- kind: "stop",
392
- conversationId: "conv-stop",
393
- surfacedCount: 2,
394
- citedIds: ["cc_sub_abc"],
395
- citationKinds: ["tool_use"],
396
- skipped: false,
397
- mode: "shadow",
398
- }) + "\n",
399
- );
400
-
401
- const result = await scanUsefulHits({
402
- days: 1,
403
- hookLogPath,
404
- usefulHitLogPath,
405
- transcriptsDir,
406
- });
407
-
408
- expect(result.total).toBe(0);
409
- });
410
-
411
- it("skips already-scanned entries on a second run", async () => {
412
- const { hookLogPath, usefulHitLogPath, transcriptsDir } = setupScanDirs();
413
- const convId = "conv-dedup";
414
- const hookTs = new Date().toISOString();
415
- const afterTs = new Date(Date.parse(hookTs) + 1000).toISOString();
416
-
417
- writeFileSync(
418
- hookLogPath,
419
- JSON.stringify({
420
- ts: hookTs,
421
- conversationId: convId,
422
- promptPreview: "help with recall",
423
- gate: "evaluate",
424
- hits: [{ id: "cc_sub_dedup123", score: 1.1 }],
425
- wouldInject: ["cc_sub_dedup123"],
426
- estTokens: 40,
427
- mode: "shadow",
428
- }) + "\n",
429
- );
430
-
431
- writeTranscript(
432
- transcriptsDir,
433
- convId,
434
- JSON.stringify({ type: "user", timestamp: hookTs }) +
435
- "\n" +
436
- JSON.stringify({
437
- type: "assistant",
438
- timestamp: afterTs,
439
- message: { content: "Used cc_sub_dedup123 for the answer." },
440
- }) +
441
- "\n",
442
- );
443
-
444
- const first = await scanUsefulHits({ days: 1, hookLogPath, usefulHitLogPath, transcriptsDir });
445
- expect(first.appended).toBe(1);
446
-
447
- const second = await scanUsefulHits({ days: 1, hookLogPath, usefulHitLogPath, transcriptsDir });
448
- expect(second.appended).toBe(0);
449
- expect(second.total).toBe(1);
450
- });
451
-
452
- it("does not write when dryRun=true", async () => {
453
- const { hookLogPath, usefulHitLogPath, transcriptsDir } = setupScanDirs();
454
- const hookTs = new Date().toISOString();
455
-
456
- writeFileSync(
457
- hookLogPath,
458
- JSON.stringify({
459
- ts: hookTs,
460
- conversationId: "dry-conv",
461
- promptPreview: "explain the bug",
462
- gate: "evaluate",
463
- hits: [{ id: "cc_sub_dry", score: 1.0 }],
464
- wouldInject: ["cc_sub_dry"],
465
- estTokens: 20,
466
- mode: "shadow",
467
- }) + "\n",
468
- );
469
-
470
- const result = await scanUsefulHits({
471
- days: 1,
472
- hookLogPath,
473
- usefulHitLogPath,
474
- transcriptsDir,
475
- dryRun: true,
476
- });
477
-
478
- expect(result.appended).toBe(0);
479
- expect(result.total).toBe(1);
480
- const { existsSync } = await import("node:fs");
481
- expect(existsSync(usefulHitLogPath)).toBe(false);
482
- });
483
- });
484
-
485
- // ── readUsefulHitRate ────────────────────────────────────────────────────────
486
-
487
- describe("readUsefulHitRate", () => {
488
- it("returns null when the log file is absent", async () => {
489
- const path = join(tmpdir(), `nlm-no-useful-${Date.now()}.jsonl`);
490
- expect(await readUsefulHitRate(path, 1)).toBeNull();
491
- });
492
-
493
- it("returns null when all entries have useful=null (unmeasurable)", async () => {
494
- const path = join(tmpdir(), `nlm-useful-null-${Date.now()}.jsonl`);
495
- const ts = new Date().toISOString();
496
- writeFileSync(
497
- path,
498
- JSON.stringify({ ts, conversationId: "x", useful: null, returnedIds: [], source: "hook", matchedId: null, scannedAt: ts }) + "\n",
499
- );
500
- expect(await readUsefulHitRate(path, 1)).toBeNull();
501
- });
502
-
503
- it("computes the rate correctly from measurable entries", async () => {
504
- const path = join(tmpdir(), `nlm-useful-rate-${Date.now()}.jsonl`);
505
- const ts = new Date().toISOString();
506
- writeFileSync(
507
- path,
508
- [
509
- { ts, conversationId: "a", useful: true, returnedIds: ["cc_sub_1"], source: "hook", matchedId: "cc_sub_1", scannedAt: ts },
510
- { ts, conversationId: "b", useful: false, returnedIds: ["cc_sub_2"], source: "hook", matchedId: null, scannedAt: ts },
511
- { ts, conversationId: "c", useful: true, returnedIds: ["cc_sub_3"], source: "hook", matchedId: "cc_sub_3", scannedAt: ts },
512
- { ts, conversationId: "d", useful: null, returnedIds: ["cc_sub_4"], source: "hook", matchedId: null, scannedAt: ts },
513
- ]
514
- .map((e) => JSON.stringify(e))
515
- .join("\n") + "\n",
516
- );
517
- // 2 useful out of 3 measurable = 0.667
518
- expect(await readUsefulHitRate(path, 1)).toBeCloseTo(0.667, 2);
519
- });
520
-
521
- it("excludes entries outside the window", async () => {
522
- const path = join(tmpdir(), `nlm-useful-window-${Date.now()}.jsonl`);
523
- const old = new Date(Date.now() - 3 * 24 * 60 * 60 * 1000).toISOString();
524
- const recent = new Date().toISOString();
525
- writeFileSync(
526
- path,
527
- [
528
- { ts: old, conversationId: "old", useful: true, returnedIds: [], source: "hook", matchedId: "x", scannedAt: old },
529
- { ts: recent, conversationId: "new", useful: false, returnedIds: [], source: "hook", matchedId: null, scannedAt: recent },
530
- ]
531
- .map((e) => JSON.stringify(e))
532
- .join("\n") + "\n",
533
- );
534
- // Only the recent entry is in the 1-day window: 0/1 = 0.0
535
- expect(await readUsefulHitRate(path, 1)).toBe(0);
536
- });
537
- });
@@ -1,93 +0,0 @@
1
- /**
2
- * Unit tests for OllamaClient.embed: nomic prefix scheme, L2 normalization,
3
- * 8K char truncation. These guard the nomic-embed-text v1.5 contract.
4
- */
5
-
6
- import { describe, expect, it } from "vitest";
7
- import { OllamaClient, l2Normalize } from "../../../src/llm/ollama-client.js";
8
-
9
- type FakeFetch = typeof fetch;
10
-
11
- function jsonResponse(body: unknown): Response {
12
- return new Response(JSON.stringify(body), {
13
- status: 200,
14
- headers: { "content-type": "application/json" },
15
- });
16
- }
17
-
18
- function makeFetch(reply: (req: { url: string; body: unknown }) => Response): FakeFetch {
19
- return (async (input: string | URL | Request, init?: RequestInit) => {
20
- const url = typeof input === "string" ? input : input.toString();
21
- const body = init?.body ? JSON.parse(init.body.toString()) : null;
22
- return reply({ url, body });
23
- }) as FakeFetch;
24
- }
25
-
26
- describe("OllamaClient.embed prefix scheme", () => {
27
- it("prefixes a query call with 'search_query: '", async () => {
28
- let prompt = "";
29
- const fetchImpl = makeFetch(({ body }) => {
30
- prompt = (body as { prompt: string }).prompt;
31
- return jsonResponse({ embedding: [1, 0, 0] });
32
- });
33
- const client = new OllamaClient({ fetchImpl });
34
- await client.embed("what did we decide about pgvector", "query");
35
- expect(prompt.startsWith("search_query: ")).toBe(true);
36
- expect(prompt).toContain("pgvector");
37
- });
38
-
39
- it("prefixes a document call with 'search_document: '", async () => {
40
- let prompt = "";
41
- const fetchImpl = makeFetch(({ body }) => {
42
- prompt = (body as { prompt: string }).prompt;
43
- return jsonResponse({ embedding: [1, 0, 0] });
44
- });
45
- const client = new OllamaClient({ fetchImpl });
46
- await client.embed("session body text", "document");
47
- expect(prompt.startsWith("search_document: ")).toBe(true);
48
- });
49
-
50
- it("truncates text to MAX_EMBED_CHARS (8000) before prefixing", async () => {
51
- let prompt = "";
52
- const fetchImpl = makeFetch(({ body }) => {
53
- prompt = (body as { prompt: string }).prompt;
54
- return jsonResponse({ embedding: [1, 0, 0] });
55
- });
56
- const client = new OllamaClient({ fetchImpl });
57
- const big = "x".repeat(10_000);
58
- await client.embed(big, "document");
59
- // prompt = "search_document: " + truncated → prefix is 17 chars, body capped at 8000.
60
- // Briefly raised to 28000 on 2026-05-25 then reverted same day; nomic-
61
- // embed-text via Ollama 500s on inputs near the nominal 8192-token
62
- // context. Real fix is chunk + max-pool (filed as #174).
63
- expect(prompt.length).toBe(17 + 8_000);
64
- });
65
-
66
- it("L2-normalizes the returned vector", async () => {
67
- const fetchImpl = makeFetch(() => jsonResponse({ embedding: [3, 4, 0] }));
68
- const client = new OllamaClient({ fetchImpl });
69
- const { vector } = await client.embed("anything", "document");
70
- // raw norm = 5; normalized should be [0.6, 0.8, 0]
71
- expect(vector[0]).toBeCloseTo(0.6, 6);
72
- expect(vector[1]).toBeCloseTo(0.8, 6);
73
- expect(vector[2]).toBe(0);
74
- let norm = 0;
75
- for (const v of vector) norm += v * v;
76
- expect(Math.sqrt(norm)).toBeCloseTo(1, 6);
77
- });
78
- });
79
-
80
- describe("l2Normalize", () => {
81
- it("returns a unit vector for a non-zero input", () => {
82
- const out = l2Normalize(new Float32Array([3, 4, 0]));
83
- let sum = 0;
84
- for (const v of out) sum += v * v;
85
- expect(Math.sqrt(sum)).toBeCloseTo(1, 6);
86
- });
87
-
88
- it("returns the zero vector unchanged", () => {
89
- const zero = new Float32Array([0, 0, 0]);
90
- const out = l2Normalize(zero);
91
- expect(Array.from(out)).toEqual([0, 0, 0]);
92
- });
93
- });