nlm-memory 0.4.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (472) hide show
  1. package/.agents/plugins/marketplace.json +20 -0
  2. package/.github/workflows/ci.yml +30 -0
  3. package/LICENSE +151 -0
  4. package/README.md +119 -0
  5. package/dist/cli/classify-parity.d.ts +48 -0
  6. package/dist/cli/classify-parity.js +182 -0
  7. package/dist/cli/classify-parity.js.map +1 -0
  8. package/dist/cli/launchctl-helpers.d.ts +26 -0
  9. package/dist/cli/launchctl-helpers.js +42 -0
  10. package/dist/cli/launchctl-helpers.js.map +1 -0
  11. package/dist/cli/nlm.d.ts +25 -0
  12. package/dist/cli/nlm.js +832 -0
  13. package/dist/cli/nlm.js.map +1 -0
  14. package/dist/core/actions/actions-log.d.ts +40 -0
  15. package/dist/core/actions/actions-log.js +72 -0
  16. package/dist/core/actions/actions-log.js.map +1 -0
  17. package/dist/core/actions/overlay.d.ts +30 -0
  18. package/dist/core/actions/overlay.js +101 -0
  19. package/dist/core/actions/overlay.js.map +1 -0
  20. package/dist/core/adapters/aider.d.ts +33 -0
  21. package/dist/core/adapters/aider.js +167 -0
  22. package/dist/core/adapters/aider.js.map +1 -0
  23. package/dist/core/adapters/claude-code.d.ts +32 -0
  24. package/dist/core/adapters/claude-code.js +270 -0
  25. package/dist/core/adapters/claude-code.js.map +1 -0
  26. package/dist/core/adapters/common.d.ts +20 -0
  27. package/dist/core/adapters/common.js +60 -0
  28. package/dist/core/adapters/common.js.map +1 -0
  29. package/dist/core/adapters/from-source.d.ts +11 -0
  30. package/dist/core/adapters/from-source.js +55 -0
  31. package/dist/core/adapters/from-source.js.map +1 -0
  32. package/dist/core/adapters/hermes-agent.d.ts +34 -0
  33. package/dist/core/adapters/hermes-agent.js +192 -0
  34. package/dist/core/adapters/hermes-agent.js.map +1 -0
  35. package/dist/core/adapters/hermes.d.ts +31 -0
  36. package/dist/core/adapters/hermes.js +247 -0
  37. package/dist/core/adapters/hermes.js.map +1 -0
  38. package/dist/core/adapters/jsonl-generic.d.ts +56 -0
  39. package/dist/core/adapters/jsonl-generic.js +185 -0
  40. package/dist/core/adapters/jsonl-generic.js.map +1 -0
  41. package/dist/core/adapters/opencode.d.ts +36 -0
  42. package/dist/core/adapters/opencode.js +213 -0
  43. package/dist/core/adapters/opencode.js.map +1 -0
  44. package/dist/core/adapters/pi.d.ts +32 -0
  45. package/dist/core/adapters/pi.js +233 -0
  46. package/dist/core/adapters/pi.js.map +1 -0
  47. package/dist/core/classifier/prompt.d.ts +60 -0
  48. package/dist/core/classifier/prompt.js +178 -0
  49. package/dist/core/classifier/prompt.js.map +1 -0
  50. package/dist/core/dataset/build-dataset.d.ts +87 -0
  51. package/dist/core/dataset/build-dataset.js +335 -0
  52. package/dist/core/dataset/build-dataset.js.map +1 -0
  53. package/dist/core/embedding/chunk-body.d.ts +30 -0
  54. package/dist/core/embedding/chunk-body.js +60 -0
  55. package/dist/core/embedding/chunk-body.js.map +1 -0
  56. package/dist/core/embedding/embed-backfill.d.ts +36 -0
  57. package/dist/core/embedding/embed-backfill.js +168 -0
  58. package/dist/core/embedding/embed-backfill.js.map +1 -0
  59. package/dist/core/embedding/embed-normalize.d.ts +28 -0
  60. package/dist/core/embedding/embed-normalize.js +98 -0
  61. package/dist/core/embedding/embed-normalize.js.map +1 -0
  62. package/dist/core/facts/backfill-facts.d.ts +58 -0
  63. package/dist/core/facts/backfill-facts.js +169 -0
  64. package/dist/core/facts/backfill-facts.js.map +1 -0
  65. package/dist/core/facts/extract-facts.d.ts +20 -0
  66. package/dist/core/facts/extract-facts.js +37 -0
  67. package/dist/core/facts/extract-facts.js.map +1 -0
  68. package/dist/core/hook/citation-detect.d.ts +32 -0
  69. package/dist/core/hook/citation-detect.js +105 -0
  70. package/dist/core/hook/citation-detect.js.map +1 -0
  71. package/dist/core/hook/cite-memo.d.ts +20 -0
  72. package/dist/core/hook/cite-memo.js +68 -0
  73. package/dist/core/hook/cite-memo.js.map +1 -0
  74. package/dist/core/hook/claude-settings.d.ts +34 -0
  75. package/dist/core/hook/claude-settings.js +117 -0
  76. package/dist/core/hook/claude-settings.js.map +1 -0
  77. package/dist/core/hook/gate.d.ts +11 -0
  78. package/dist/core/hook/gate.js +19 -0
  79. package/dist/core/hook/gate.js.map +1 -0
  80. package/dist/core/hook/hook-log.d.ts +25 -0
  81. package/dist/core/hook/hook-log.js +28 -0
  82. package/dist/core/hook/hook-log.js.map +1 -0
  83. package/dist/core/hook/memo-sweep.d.ts +55 -0
  84. package/dist/core/hook/memo-sweep.js +134 -0
  85. package/dist/core/hook/memo-sweep.js.map +1 -0
  86. package/dist/core/hook/memo.d.ts +20 -0
  87. package/dist/core/hook/memo.js +66 -0
  88. package/dist/core/hook/memo.js.map +1 -0
  89. package/dist/core/hook/pointer-block.d.ts +14 -0
  90. package/dist/core/hook/pointer-block.js +19 -0
  91. package/dist/core/hook/pointer-block.js.map +1 -0
  92. package/dist/core/hook/select.d.ts +21 -0
  93. package/dist/core/hook/select.js +15 -0
  94. package/dist/core/hook/select.js.map +1 -0
  95. package/dist/core/hook/transcript.d.ts +31 -0
  96. package/dist/core/hook/transcript.js +103 -0
  97. package/dist/core/hook/transcript.js.map +1 -0
  98. package/dist/core/ingest/ingest-session.d.ts +40 -0
  99. package/dist/core/ingest/ingest-session.js +71 -0
  100. package/dist/core/ingest/ingest-session.js.map +1 -0
  101. package/dist/core/providers/provider-models.d.ts +24 -0
  102. package/dist/core/providers/provider-models.js +72 -0
  103. package/dist/core/providers/provider-models.js.map +1 -0
  104. package/dist/core/providers/provider-registry.d.ts +62 -0
  105. package/dist/core/providers/provider-registry.js +143 -0
  106. package/dist/core/providers/provider-registry.js.map +1 -0
  107. package/dist/core/recall/citation-log.d.ts +28 -0
  108. package/dist/core/recall/citation-log.js +90 -0
  109. package/dist/core/recall/citation-log.js.map +1 -0
  110. package/dist/core/recall/filter.d.ts +11 -0
  111. package/dist/core/recall/filter.js +20 -0
  112. package/dist/core/recall/filter.js.map +1 -0
  113. package/dist/core/recall/index.d.ts +6 -0
  114. package/dist/core/recall/index.js +5 -0
  115. package/dist/core/recall/index.js.map +1 -0
  116. package/dist/core/recall/match-fields.d.ts +10 -0
  117. package/dist/core/recall/match-fields.js +37 -0
  118. package/dist/core/recall/match-fields.js.map +1 -0
  119. package/dist/core/recall/query-log.d.ts +36 -0
  120. package/dist/core/recall/query-log.js +112 -0
  121. package/dist/core/recall/query-log.js.map +1 -0
  122. package/dist/core/recall/query-shape.d.ts +22 -0
  123. package/dist/core/recall/query-shape.js +64 -0
  124. package/dist/core/recall/query-shape.js.map +1 -0
  125. package/dist/core/recall/recall-service.d.ts +19 -0
  126. package/dist/core/recall/recall-service.js +252 -0
  127. package/dist/core/recall/recall-service.js.map +1 -0
  128. package/dist/core/recall/recent-log.d.ts +16 -0
  129. package/dist/core/recall/recent-log.js +46 -0
  130. package/dist/core/recall/recent-log.js.map +1 -0
  131. package/dist/core/recall/tokenize.d.ts +7 -0
  132. package/dist/core/recall/tokenize.js +18 -0
  133. package/dist/core/recall/tokenize.js.map +1 -0
  134. package/dist/core/recall/useful-scan.d.ts +52 -0
  135. package/dist/core/recall/useful-scan.js +300 -0
  136. package/dist/core/recall/useful-scan.js.map +1 -0
  137. package/dist/core/recall-facts/fact-query-log.d.ts +42 -0
  138. package/dist/core/recall-facts/fact-query-log.js +115 -0
  139. package/dist/core/recall-facts/fact-query-log.js.map +1 -0
  140. package/dist/core/recall-facts/fact-recall-service.d.ts +34 -0
  141. package/dist/core/recall-facts/fact-recall-service.js +246 -0
  142. package/dist/core/recall-facts/fact-recall-service.js.map +1 -0
  143. package/dist/core/scheduler/scan-once.d.ts +32 -0
  144. package/dist/core/scheduler/scan-once.js +100 -0
  145. package/dist/core/scheduler/scan-once.js.map +1 -0
  146. package/dist/core/scheduler/scheduler.d.ts +59 -0
  147. package/dist/core/scheduler/scheduler.js +158 -0
  148. package/dist/core/scheduler/scheduler.js.map +1 -0
  149. package/dist/core/sources/source-registry.d.ts +68 -0
  150. package/dist/core/sources/source-registry.js +208 -0
  151. package/dist/core/sources/source-registry.js.map +1 -0
  152. package/dist/core/storage/db-restore.d.ts +53 -0
  153. package/dist/core/storage/db-restore.js +113 -0
  154. package/dist/core/storage/db-restore.js.map +1 -0
  155. package/dist/core/storage/live-status.d.ts +15 -0
  156. package/dist/core/storage/live-status.js +43 -0
  157. package/dist/core/storage/live-status.js.map +1 -0
  158. package/dist/core/storage/migrate.d.ts +14 -0
  159. package/dist/core/storage/migrate.js +52 -0
  160. package/dist/core/storage/migrate.js.map +1 -0
  161. package/dist/core/storage/sqlite-fact-store.d.ts +50 -0
  162. package/dist/core/storage/sqlite-fact-store.js +256 -0
  163. package/dist/core/storage/sqlite-fact-store.js.map +1 -0
  164. package/dist/core/storage/sqlite-session-store.d.ts +152 -0
  165. package/dist/core/storage/sqlite-session-store.js +587 -0
  166. package/dist/core/storage/sqlite-session-store.js.map +1 -0
  167. package/dist/hook/pre-compact-hook.d.ts +26 -0
  168. package/dist/hook/pre-compact-hook.js +94 -0
  169. package/dist/hook/pre-compact-hook.js.map +1 -0
  170. package/dist/hook/prompt-recall-hook.d.ts +23 -0
  171. package/dist/hook/prompt-recall-hook.js +141 -0
  172. package/dist/hook/prompt-recall-hook.js.map +1 -0
  173. package/dist/hook/session-end-hook.d.ts +18 -0
  174. package/dist/hook/session-end-hook.js +67 -0
  175. package/dist/hook/session-end-hook.js.map +1 -0
  176. package/dist/hook/session-start-hook.d.ts +25 -0
  177. package/dist/hook/session-start-hook.js +129 -0
  178. package/dist/hook/session-start-hook.js.map +1 -0
  179. package/dist/hook/stop-hook.d.ts +38 -0
  180. package/dist/hook/stop-hook.js +171 -0
  181. package/dist/hook/stop-hook.js.map +1 -0
  182. package/dist/hook/subagent-start-hook.d.ts +30 -0
  183. package/dist/hook/subagent-start-hook.js +108 -0
  184. package/dist/hook/subagent-start-hook.js.map +1 -0
  185. package/dist/http/app.d.ts +65 -0
  186. package/dist/http/app.js +1009 -0
  187. package/dist/http/app.js.map +1 -0
  188. package/dist/install/claude-code.d.ts +57 -0
  189. package/dist/install/claude-code.js +76 -0
  190. package/dist/install/claude-code.js.map +1 -0
  191. package/dist/install/codex.d.ts +82 -0
  192. package/dist/install/codex.js +277 -0
  193. package/dist/install/codex.js.map +1 -0
  194. package/dist/install/hermes-agent.d.ts +35 -0
  195. package/dist/install/hermes-agent.js +48 -0
  196. package/dist/install/hermes-agent.js.map +1 -0
  197. package/dist/install/hermes.d.ts +29 -0
  198. package/dist/install/hermes.js +52 -0
  199. package/dist/install/hermes.js.map +1 -0
  200. package/dist/install/ollama.d.ts +54 -0
  201. package/dist/install/ollama.js +178 -0
  202. package/dist/install/ollama.js.map +1 -0
  203. package/dist/install/setup.d.ts +37 -0
  204. package/dist/install/setup.js +339 -0
  205. package/dist/install/setup.js.map +1 -0
  206. package/dist/llm/classifier-box.d.ts +29 -0
  207. package/dist/llm/classifier-box.js +43 -0
  208. package/dist/llm/classifier-box.js.map +1 -0
  209. package/dist/llm/deepseek-client.d.ts +40 -0
  210. package/dist/llm/deepseek-client.js +114 -0
  211. package/dist/llm/deepseek-client.js.map +1 -0
  212. package/dist/llm/env-autoload.d.ts +8 -0
  213. package/dist/llm/env-autoload.js +54 -0
  214. package/dist/llm/env-autoload.js.map +1 -0
  215. package/dist/llm/ollama-client.d.ts +47 -0
  216. package/dist/llm/ollama-client.js +156 -0
  217. package/dist/llm/ollama-client.js.map +1 -0
  218. package/dist/mcp/server.d.ts +64 -0
  219. package/dist/mcp/server.js +430 -0
  220. package/dist/mcp/server.js.map +1 -0
  221. package/dist/ports/fact-store.d.ts +82 -0
  222. package/dist/ports/fact-store.js +16 -0
  223. package/dist/ports/fact-store.js.map +1 -0
  224. package/dist/ports/llm-client.d.ts +42 -0
  225. package/dist/ports/llm-client.js +14 -0
  226. package/dist/ports/llm-client.js.map +1 -0
  227. package/dist/ports/logger.d.ts +13 -0
  228. package/dist/ports/logger.js +8 -0
  229. package/dist/ports/logger.js.map +1 -0
  230. package/dist/ports/session-store.d.ts +29 -0
  231. package/dist/ports/session-store.js +9 -0
  232. package/dist/ports/session-store.js.map +1 -0
  233. package/dist/ports/transcript-adapter.d.ts +48 -0
  234. package/dist/ports/transcript-adapter.js +15 -0
  235. package/dist/ports/transcript-adapter.js.map +1 -0
  236. package/dist/shared/types.d.ts +129 -0
  237. package/dist/shared/types.js +6 -0
  238. package/dist/shared/types.js.map +1 -0
  239. package/dist/ui/assets/index-BA6IpU8g.css +1 -0
  240. package/dist/ui/assets/index-B_qIVV0k.js +69 -0
  241. package/dist/ui/index.html +13 -0
  242. package/docs/methodology/re-derivation-rate.md +112 -0
  243. package/docs/methodology/useful-hit-rate.md +79 -0
  244. package/docs/plans/2026-05-20-fts5-lexical-recall.md +1088 -0
  245. package/docs/plans/2026-05-20-recall-daemon-wedge-fix.md +662 -0
  246. package/docs/plans/2026-05-20-recall-hook-design.md +131 -0
  247. package/docs/plans/2026-05-20-recall-hook-implementation.md +1222 -0
  248. package/docs/plans/desktop-product.md +69 -0
  249. package/docs/plans/factstore-design.md +236 -0
  250. package/logs/CHANGELOG/CHANGELOG-2026.md +1389 -0
  251. package/logs/CHANGELOG/CHANGELOG.md +320 -0
  252. package/migrations/000_initial_schema.sql +174 -0
  253. package/migrations/001_entity_type_rename.sql +17 -0
  254. package/migrations/002_adapter_state_extend.sql +12 -0
  255. package/migrations/003_session_embeddings.sql +11 -0
  256. package/migrations/004_facts.sql +46 -0
  257. package/migrations/005_sources.sql +31 -0
  258. package/migrations/006_providers.sql +33 -0
  259. package/migrations/007_source_tokens.sql +17 -0
  260. package/migrations/008_fts_rebuild.sql +9 -0
  261. package/migrations/009_session_embedding_chunks.sql +46 -0
  262. package/migrations/010_sources_opencode.sql +30 -0
  263. package/migrations/011_sources_hermes_agent.sql +30 -0
  264. package/migrations/012_sources_aider.sql +30 -0
  265. package/migrations/013_adapter_state_failure_count.sql +12 -0
  266. package/package.json +56 -0
  267. package/plugin/.codex-plugin/plugin.json +22 -0
  268. package/plugin/.mcp.json +8 -0
  269. package/plugin/README.md +51 -0
  270. package/plugin/hooks/hooks.json +25 -0
  271. package/plugin/scripts/prompt-recall-hook.mjs +202 -0
  272. package/plugin/scripts/stop-hook.mjs +306 -0
  273. package/plugin-hermes-agent/README.md +49 -0
  274. package/plugin-hermes-agent/__init__.py +75 -0
  275. package/plugin-hermes-agent/plugin.yaml +15 -0
  276. package/scripts/backfill-citations.mjs +0 -0
  277. package/scripts/build-codex-plugin.mjs +61 -0
  278. package/scripts/deepseek-probe.mjs +67 -0
  279. package/scripts/extract-triples.mjs +207 -0
  280. package/scripts/longmemeval/embedding-cache.ts +77 -0
  281. package/scripts/longmemeval/fetch-dataset.sh +25 -0
  282. package/scripts/longmemeval/run-harness.ts +315 -0
  283. package/scripts/longmemeval/scorer.ts +99 -0
  284. package/scripts/longmemeval/tsconfig.json +9 -0
  285. package/scripts/longmemeval/types.ts +35 -0
  286. package/scripts/nlm-daily-digest.py +239 -0
  287. package/scripts/nlm-daily-digest.sh +28 -0
  288. package/src/cli/classify-parity.ts +257 -0
  289. package/src/cli/launchctl-helpers.ts +49 -0
  290. package/src/cli/nlm.ts +885 -0
  291. package/src/core/actions/actions-log.ts +118 -0
  292. package/src/core/actions/overlay.ts +117 -0
  293. package/src/core/adapters/aider.ts +205 -0
  294. package/src/core/adapters/claude-code.ts +293 -0
  295. package/src/core/adapters/common.ts +54 -0
  296. package/src/core/adapters/from-source.ts +57 -0
  297. package/src/core/adapters/hermes-agent.ts +240 -0
  298. package/src/core/adapters/hermes.ts +277 -0
  299. package/src/core/adapters/jsonl-generic.ts +208 -0
  300. package/src/core/adapters/opencode.ts +281 -0
  301. package/src/core/adapters/pi.ts +264 -0
  302. package/src/core/classifier/prompt.ts +200 -0
  303. package/src/core/dataset/build-dataset.ts +463 -0
  304. package/src/core/embedding/chunk-body.ts +76 -0
  305. package/src/core/embedding/embed-backfill.ts +210 -0
  306. package/src/core/embedding/embed-normalize.ts +135 -0
  307. package/src/core/facts/backfill-facts.ts +254 -0
  308. package/src/core/facts/extract-facts.ts +50 -0
  309. package/src/core/hook/citation-detect.ts +124 -0
  310. package/src/core/hook/cite-memo.ts +68 -0
  311. package/src/core/hook/claude-settings.ts +166 -0
  312. package/src/core/hook/gate.ts +25 -0
  313. package/src/core/hook/hook-log.ts +41 -0
  314. package/src/core/hook/memo-sweep.ts +164 -0
  315. package/src/core/hook/memo.ts +67 -0
  316. package/src/core/hook/pointer-block.ts +26 -0
  317. package/src/core/hook/select.ts +32 -0
  318. package/src/core/hook/transcript.ts +121 -0
  319. package/src/core/ingest/ingest-session.ts +111 -0
  320. package/src/core/providers/provider-models.ts +100 -0
  321. package/src/core/providers/provider-registry.ts +196 -0
  322. package/src/core/recall/citation-log.ts +108 -0
  323. package/src/core/recall/filter.ts +27 -0
  324. package/src/core/recall/index.ts +6 -0
  325. package/src/core/recall/match-fields.ts +40 -0
  326. package/src/core/recall/query-log.ts +149 -0
  327. package/src/core/recall/query-shape.ts +66 -0
  328. package/src/core/recall/recall-service.ts +320 -0
  329. package/src/core/recall/recent-log.ts +59 -0
  330. package/src/core/recall/tokenize.ts +18 -0
  331. package/src/core/recall/useful-scan.ts +336 -0
  332. package/src/core/recall-facts/fact-query-log.ts +150 -0
  333. package/src/core/recall-facts/fact-recall-service.ts +327 -0
  334. package/src/core/scheduler/scan-once.ts +142 -0
  335. package/src/core/scheduler/scheduler.ts +225 -0
  336. package/src/core/sources/source-registry.ts +260 -0
  337. package/src/core/storage/db-restore.ts +133 -0
  338. package/src/core/storage/live-status.ts +45 -0
  339. package/src/core/storage/migrate.ts +72 -0
  340. package/src/core/storage/sqlite-fact-store.ts +304 -0
  341. package/src/core/storage/sqlite-session-store.ts +765 -0
  342. package/src/hook/prompt-recall-hook.ts +174 -0
  343. package/src/hook/session-end-hook.ts +81 -0
  344. package/src/hook/session-start-hook.ts +165 -0
  345. package/src/hook/stop-hook.ts +236 -0
  346. package/src/http/app.ts +1114 -0
  347. package/src/install/claude-code.ts +128 -0
  348. package/src/install/codex.ts +367 -0
  349. package/src/install/hermes-agent.ts +76 -0
  350. package/src/install/hermes.ts +78 -0
  351. package/src/install/ollama.ts +208 -0
  352. package/src/install/setup.ts +368 -0
  353. package/src/llm/classifier-box.ts +64 -0
  354. package/src/llm/deepseek-client.ts +150 -0
  355. package/src/llm/env-autoload.ts +55 -0
  356. package/src/llm/ollama-client.ts +189 -0
  357. package/src/mcp/server.ts +534 -0
  358. package/src/ports/fact-store.ts +102 -0
  359. package/src/ports/llm-client.ts +52 -0
  360. package/src/ports/logger.ts +16 -0
  361. package/src/ports/session-store.ts +45 -0
  362. package/src/ports/transcript-adapter.ts +55 -0
  363. package/src/shared/types.ts +145 -0
  364. package/src/ui/App.tsx +58 -0
  365. package/src/ui/components/PromoteOpenButton.tsx +65 -0
  366. package/src/ui/components/SessionDrawer.tsx +136 -0
  367. package/src/ui/components/SideNav.tsx +162 -0
  368. package/src/ui/components/Skeleton.tsx +107 -0
  369. package/src/ui/index.html +13 -0
  370. package/src/ui/lib/actions.ts +30 -0
  371. package/src/ui/lib/api.ts +92 -0
  372. package/src/ui/lib/dataset.ts +141 -0
  373. package/src/ui/lib/registries.ts +155 -0
  374. package/src/ui/lib/view-settings.ts +41 -0
  375. package/src/ui/main.tsx +15 -0
  376. package/src/ui/pages/Live.tsx +229 -0
  377. package/src/ui/pages/Pulse.tsx +415 -0
  378. package/src/ui/pages/Recall.tsx +190 -0
  379. package/src/ui/pages/River.tsx +308 -0
  380. package/src/ui/pages/Search.tsx +93 -0
  381. package/src/ui/pages/Stub.tsx +9 -0
  382. package/src/ui/pages/Thread.tsx +262 -0
  383. package/src/ui/pages/settings/Classifier.tsx +227 -0
  384. package/src/ui/pages/settings/Data.tsx +190 -0
  385. package/src/ui/pages/settings/Index.tsx +65 -0
  386. package/src/ui/pages/settings/Labels.tsx +224 -0
  387. package/src/ui/pages/settings/Providers.tsx +305 -0
  388. package/src/ui/pages/settings/SettingsSubnav.tsx +28 -0
  389. package/src/ui/pages/settings/Sources.tsx +326 -0
  390. package/src/ui/pages/settings/Views.tsx +96 -0
  391. package/src/ui/styles.css +1766 -0
  392. package/src/ui/tsconfig.json +21 -0
  393. package/src/ui/vite.config.ts +19 -0
  394. package/tests/fixtures/claude_code/short_session.jsonl +2 -0
  395. package/tests/fixtures/claude_code/standard_iso.jsonl +4 -0
  396. package/tests/fixtures/claude_code/tool_heavy.jsonl +8 -0
  397. package/tests/fixtures/claude_code/with_subagent.jsonl +7 -0
  398. package/tests/fixtures/facts.ts +17 -0
  399. package/tests/fixtures/golden-corpus.ts +85 -0
  400. package/tests/fixtures/hermes/paired_request_dump.json +24 -0
  401. package/tests/fixtures/hermes/paired_session.json +23 -0
  402. package/tests/fixtures/hermes/request_dump.json +28 -0
  403. package/tests/fixtures/hermes/session_iso.json +38 -0
  404. package/tests/fixtures/hermes/session_unix.json +38 -0
  405. package/tests/fixtures/hermes/system_only.json +18 -0
  406. package/tests/fixtures/pi/error-connection-abort.jsonl +8 -0
  407. package/tests/fixtures/pi/short-successful.jsonl +5 -0
  408. package/tests/fixtures/pi/with-custom-message.jsonl +6 -0
  409. package/tests/fixtures/sessions.ts +22 -0
  410. package/tests/integration/backfill-facts.test.ts +362 -0
  411. package/tests/integration/citation-explicit.test.ts +111 -0
  412. package/tests/integration/cite-event.test.ts +169 -0
  413. package/tests/integration/cite-memo.test.ts +87 -0
  414. package/tests/integration/db-restore.test.ts +153 -0
  415. package/tests/integration/embed-backfill.test.ts +176 -0
  416. package/tests/integration/fact-supersedence.test.ts +313 -0
  417. package/tests/integration/fts-index.test.ts +60 -0
  418. package/tests/integration/getbyids-sqlite.test.ts +60 -0
  419. package/tests/integration/hermes-agent-hooks.test.ts +248 -0
  420. package/tests/integration/hook-claude-settings.test.ts +205 -0
  421. package/tests/integration/hook-log.test.ts +54 -0
  422. package/tests/integration/hook-memo.test.ts +68 -0
  423. package/tests/integration/hook-pre-compact.test.ts +105 -0
  424. package/tests/integration/hook-subagent-start.test.ts +102 -0
  425. package/tests/integration/http.test.ts +401 -0
  426. package/tests/integration/keyword-search-fts.test.ts +66 -0
  427. package/tests/integration/mcp-recall-logging.test.ts +88 -0
  428. package/tests/integration/mcp.test.ts +248 -0
  429. package/tests/integration/memo-sweep.test.ts +91 -0
  430. package/tests/integration/prompt-recall-hook.test.ts +88 -0
  431. package/tests/integration/provider-registry.test.ts +107 -0
  432. package/tests/integration/recall-golden.test.ts +59 -0
  433. package/tests/integration/recall-sqlite.test.ts +169 -0
  434. package/tests/integration/scheduler.test.ts +391 -0
  435. package/tests/integration/session-end-hook.test.ts +48 -0
  436. package/tests/integration/session-start-hook.test.ts +126 -0
  437. package/tests/integration/source-registry.test.ts +120 -0
  438. package/tests/integration/sqlite-fact-store.test.ts +346 -0
  439. package/tests/integration/stop-hook.test.ts +560 -0
  440. package/tests/integration/wal-checkpoint.test.ts +49 -0
  441. package/tests/unit/cli/launchctl-helpers.test.ts +60 -0
  442. package/tests/unit/core/adapters/aider.test.ts +230 -0
  443. package/tests/unit/core/adapters/claude-code.test.ts +118 -0
  444. package/tests/unit/core/adapters/hermes-agent.test.ts +329 -0
  445. package/tests/unit/core/adapters/hermes.test.ts +81 -0
  446. package/tests/unit/core/adapters/jsonl-generic.test.ts +142 -0
  447. package/tests/unit/core/adapters/opencode.test.ts +354 -0
  448. package/tests/unit/core/adapters/pi.test.ts +110 -0
  449. package/tests/unit/core/classifier/prompt.test.ts +126 -0
  450. package/tests/unit/core/embedding/chunk-body.test.ts +100 -0
  451. package/tests/unit/core/facts/extract-facts.test.ts +117 -0
  452. package/tests/unit/core/filter.test.ts +40 -0
  453. package/tests/unit/core/hook/citation-detect-cite-session.test.ts +96 -0
  454. package/tests/unit/core/hook/citation-detect.test.ts +124 -0
  455. package/tests/unit/core/hook/gate.test.ts +29 -0
  456. package/tests/unit/core/hook/pointer-block.test.ts +22 -0
  457. package/tests/unit/core/hook/select.test.ts +66 -0
  458. package/tests/unit/core/match-fields.test.ts +39 -0
  459. package/tests/unit/core/mcp-cite-session.test.ts +51 -0
  460. package/tests/unit/core/providers/provider-models.test.ts +101 -0
  461. package/tests/unit/core/query-shape.test.ts +92 -0
  462. package/tests/unit/core/recall-facts/fact-recall-service.test.ts +258 -0
  463. package/tests/unit/core/recall-service.test.ts +200 -0
  464. package/tests/unit/core/storage/live-status.test.ts +54 -0
  465. package/tests/unit/core/tokenize.test.ts +32 -0
  466. package/tests/unit/core/useful-scan.test.ts +537 -0
  467. package/tests/unit/llm/embed.test.ts +93 -0
  468. package/tests/unit/llm/ollama-client.test.ts +124 -0
  469. package/tests/unit/scripts/longmemeval-scorer.test.ts +114 -0
  470. package/tsconfig.json +31 -0
  471. package/tsconfig.test.json +11 -0
  472. package/vitest.config.ts +22 -0
@@ -0,0 +1,537 @@
1
+ import { describe, expect, it } from "vitest";
2
+ import { mkdirSync, writeFileSync } from "node:fs";
3
+ import { join } from "node:path";
4
+ import { tmpdir } from "node:os";
5
+ import {
6
+ isProbe,
7
+ extractAssistantTurnsAfter,
8
+ findMatchedId,
9
+ scanUsefulHits,
10
+ readUsefulHitRate,
11
+ } from "../../../src/core/recall/useful-scan.js";
12
+
13
+ // ── isProbe ──────────────────────────────────────────────────────────────────
14
+
15
// Checks that isProbe flags synthetic probe/test prompts and leaves ordinary
// prompts alone, regardless of letter case.
describe("isProbe", () => {
  it("returns true for probe patterns", () => {
    const probePrompts = [
      "concurrency probe round 2",
      "test probe",
      "path test for the hook",
      "recall test",
      "smoke test run",
      "cutover validation",
    ];
    for (const prompt of probePrompts) {
      expect(isProbe(prompt)).toBe(true);
    }
  });

  it("returns false for normal prompts", () => {
    const ordinaryPrompts = [
      "what did we decide about pgvector",
      "how should we implement the recall hook",
      "review the PR",
    ];
    for (const prompt of ordinaryPrompts) {
      expect(isProbe(prompt)).toBe(false);
    }
  });

  it("is case-insensitive", () => {
    for (const prompt of ["SMOKE TEST", "Concurrency Probe"]) {
      expect(isProbe(prompt)).toBe(true);
    }
  });
});
36
+
37
+ // ── extractAssistantTurnsAfter ───────────────────────────────────────────────
38
+
39
/**
 * Serialises transcript entries into newline-delimited JSON.
 *
 * Entries whose `type` is "assistant" are emitted with their content nested
 * under `message.content` (an empty string when `content` is null or
 * undefined). Every other entry keeps only its `type` and `timestamp`.
 *
 * @param lines - Entries to serialise, in output order.
 * @returns One JSON document per entry joined by "\n", with no trailing newline.
 */
function makeTranscript(
  lines: Array<{ type: string; timestamp: string; content?: string | Array<Record<string, unknown>> }>,
): string {
  const serialized: string[] = [];
  for (const entry of lines) {
    if (entry.type === "assistant") {
      serialized.push(
        JSON.stringify({
          type: "assistant",
          timestamp: entry.timestamp,
          message: { content: entry.content ?? "" },
        }),
      );
      continue;
    }
    // Non-assistant entries deliberately drop any content they carry.
    serialized.push(JSON.stringify({ type: entry.type, timestamp: entry.timestamp }));
  }
  return serialized.join("\n");
}
56
+
57
// Exercises extractAssistantTurnsAfter against transcript files written to
// the OS temp directory: missing file, cutoff filtering, the `limit` cap,
// content-array turns, and malformed lines.
describe("extractAssistantTurnsAfter", () => {
  it("returns empty for a missing file", () => {
    const turns = extractAssistantTurnsAfter("/tmp/nlm-nonexistent-transcript.jsonl", 0, 3);
    expect(turns).toEqual([]);
  });

  it("returns empty when no assistant turns exist after the cutoff", () => {
    const transcriptPath = join(tmpdir(), `transcript-past-${Date.now()}.jsonl`);
    const body = makeTranscript([
      { type: "user", timestamp: "2026-01-01T00:00:00.000Z" },
      { type: "assistant", timestamp: "2026-01-01T00:00:01.000Z", content: "answer" },
    ]);
    writeFileSync(transcriptPath, body);

    // The cutoff falls one second after the only assistant turn.
    const cutoffMs = Date.parse("2026-01-01T00:00:02.000Z");
    const turns = extractAssistantTurnsAfter(transcriptPath, cutoffMs, 3);
    expect(turns).toEqual([]);
  });

  it("returns up to `limit` assistant turns at or after the cutoff", () => {
    const transcriptPath = join(tmpdir(), `transcript-limit-${Date.now()}.jsonl`);
    const firstAssistantTs = "2026-05-01T10:00:00.000Z";
    const body = makeTranscript([
      { type: "user", timestamp: "2026-05-01T09:59:59.000Z" },
      { type: "assistant", timestamp: firstAssistantTs, content: "turn-1" },
      { type: "user", timestamp: "2026-05-01T10:00:01.000Z" },
      { type: "assistant", timestamp: "2026-05-01T10:00:02.000Z", content: "turn-2" },
      { type: "user", timestamp: "2026-05-01T10:00:03.000Z" },
      { type: "assistant", timestamp: "2026-05-01T10:00:04.000Z", content: "turn-3" },
      { type: "user", timestamp: "2026-05-01T10:00:05.000Z" },
      { type: "assistant", timestamp: "2026-05-01T10:00:06.000Z", content: "turn-4" },
    ]);
    writeFileSync(transcriptPath, body);

    // The cutoff equals the first assistant timestamp, so that turn is included.
    const turns = extractAssistantTurnsAfter(transcriptPath, Date.parse(firstAssistantTs), 3);
    expect(turns).toHaveLength(3);
    const expectedMarkers = ["turn-1", "turn-2", "turn-3"];
    expectedMarkers.forEach((marker, index) => {
      expect(turns[index]).toContain(marker);
    });
  });

  it("extracts text from content-array turns (text + tool_use)", () => {
    const transcriptPath = join(tmpdir(), `transcript-blocks-${Date.now()}.jsonl`);
    const assistantTs = "2026-05-01T10:00:00.000Z";
    const content: Array<Record<string, unknown>> = [
      { type: "text", text: "I looked it up." },
      { type: "tool_use", name: "mcp__nlm-memory__get_session", input: { id: "cc_sub_abc123" } },
    ];
    const record = { type: "assistant", timestamp: assistantTs, message: { content } };
    writeFileSync(transcriptPath, `${JSON.stringify(record)}\n`);

    const turns = extractAssistantTurnsAfter(transcriptPath, Date.parse(assistantTs), 3);
    expect(turns).toHaveLength(1);
    const [onlyTurn] = turns;
    expect(onlyTurn).toContain("I looked it up.");
    expect(onlyTurn).toContain("cc_sub_abc123");
  });

  it("skips malformed JSON lines without throwing", () => {
    const transcriptPath = join(tmpdir(), `transcript-malformed-${Date.now()}.jsonl`);
    const assistantTs = "2026-05-01T10:00:00.000Z";
    const validLine = JSON.stringify({
      type: "assistant",
      timestamp: assistantTs,
      message: { content: "ok" },
    });
    // The trailing empty element yields the final newline after the valid line.
    writeFileSync(transcriptPath, ["not json", validLine, ""].join("\n"));

    const turns = extractAssistantTurnsAfter(transcriptPath, Date.parse(assistantTs), 3);
    expect(turns).toHaveLength(1);
    expect(turns[0]).toContain("ok");
  });
});
135
+
136
+ // ── findMatchedId ────────────────────────────────────────────────────────────
137
+
138
// Checks how findMatchedId looks up candidate session IDs inside assistant
// turn text, including the empty-input cases.
describe("findMatchedId", () => {
  it("returns the first matching ID", () => {
    const candidateIds = ["cc_sub_abc", "cc_sub_def"];
    const turns = ["context cc_sub_abc here"];
    expect(findMatchedId(candidateIds, turns)).toBe("cc_sub_abc");
  });

  it("returns null when no ID appears", () => {
    const matched = findMatchedId(["cc_sub_abc"], ["completely unrelated text"]);
    expect(matched).toBeNull();
  });

  it("matches IDs inside tool_use serialized JSON", () => {
    const serializedToolUse = JSON.stringify({ id: "cc_sub_xyz123" });
    const matched = findMatchedId(["cc_sub_xyz123"], [serializedToolUse]);
    expect(matched).toBe("cc_sub_xyz123");
  });

  it("returns null for empty ids list", () => {
    const matched = findMatchedId([], ["some text"]);
    expect(matched).toBeNull();
  });

  it("returns null for empty turns list", () => {
    const matched = findMatchedId(["cc_sub_abc"], []);
    expect(matched).toBeNull();
  });
});
162
+
163
+ // ── scanUsefulHits ───────────────────────────────────────────────────────────
164
+
165
/**
 * Creates an isolated fixture tree under the OS temp directory for one scan test.
 *
 * The root directory and its `projects` subdirectory are created on disk; the
 * two log paths are only computed, not created.
 *
 * @returns The fixture root plus the hook-log path, useful-hit-log path and
 *          transcripts directory located inside it.
 */
function setupScanDirs(): { root: string; hookLogPath: string; usefulHitLogPath: string; transcriptsDir: string } {
  // Timestamp plus a random base-36 suffix keeps fixture roots distinct.
  const uniqueSuffix = `${Date.now()}-${Math.random().toString(36).slice(2)}`;
  const root = join(tmpdir(), `nlm-scan-test-${uniqueSuffix}`);
  mkdirSync(root, { recursive: true });

  const transcriptsDir = join(root, "projects");
  mkdirSync(transcriptsDir, { recursive: true });

  return {
    root,
    hookLogPath: join(root, "hook-log.jsonl"),
    usefulHitLogPath: join(root, "useful-hit-log.jsonl"),
    transcriptsDir,
  };
}
174
+
175
/**
 * Writes a transcript fixture to `<transcriptsDir>/test-project/<conversationId>.jsonl`,
 * creating the project directory first if it does not exist.
 *
 * @param transcriptsDir Directory that holds per-project transcript folders.
 * @param conversationId Used as the transcript file's base name.
 * @param content Text written to the file as-is.
 */
function writeTranscript(transcriptsDir: string, conversationId: string, content: string): void {
  const projectFolder = join(transcriptsDir, "test-project");
  const transcriptFile = join(projectFolder, `${conversationId}.jsonl`);

  mkdirSync(projectFolder, { recursive: true });
  writeFileSync(transcriptFile, content);
}
180
+
181
// End-to-end checks for scanUsefulHits: each test writes a hook log (and, where
// needed, a transcript) into a fresh fixture tree, runs a one-day scan, and
// inspects the returned counters and/or the useful-hit log written to disk.
describe("scanUsefulHits", () => {
  type JsonRecord = Record<string, unknown>;
  type ScanPaths = { hookLogPath: string; usefulHitLogPath: string; transcriptsDir: string };

  /** Renders records as JSONL: one JSON document per line, each newline-terminated. */
  const toJsonl = (...records: JsonRecord[]): string =>
    records.map((record) => `${JSON.stringify(record)}\n`).join("");

  /** Runs a one-day scan over the fixture paths; `extra` carries per-test options. */
  const scan = (paths: ScanPaths, extra: { dryRun?: boolean } = {}) =>
    scanUsefulHits({
      days: 1,
      hookLogPath: paths.hookLogPath,
      usefulHitLogPath: paths.usefulHitLogPath,
      transcriptsDir: paths.transcriptsDir,
      ...extra,
    });

  /** Parses the whole useful-hit log as a single JSON record. */
  const readOnlyEntry = async (logPath: string): Promise<JsonRecord> => {
    const { readFileSync } = await import("node:fs");
    return JSON.parse(readFileSync(logPath, "utf8").trim()) as JsonRecord;
  };

  it("returns zero totals when hook log is absent", async () => {
    // Nothing is written to the fixture tree, so the hook log does not exist.
    const outcome = await scan(setupScanDirs(), { dryRun: true });
    expect(outcome).toEqual({ total: 0, measurable: 0, useful: 0, appended: 0 });
  });

  it("counts a useful hit when the ID appears in the next assistant turn", async () => {
    const dirs = setupScanDirs();
    const conversationId = "test-conv-useful-hit";
    const promptAt = new Date().toISOString();
    const replyAt = new Date(Date.parse(promptAt) + 1000).toISOString();

    // One hook record that proposes injecting a single ID.
    writeFileSync(
      dirs.hookLogPath,
      toJsonl({
        ts: promptAt,
        conversationId,
        promptPreview: "what did we decide about the schema",
        gate: "evaluate",
        hits: [{ id: "cc_sub_abc123def456", score: 1.2 }],
        wouldInject: ["cc_sub_abc123def456"],
        estTokens: 50,
        mode: "shadow",
      }),
    );

    // The assistant reply, one second after the hook, mentions that ID.
    writeTranscript(
      dirs.transcriptsDir,
      conversationId,
      toJsonl(
        { type: "user", timestamp: promptAt },
        {
          type: "assistant",
          timestamp: replyAt,
          message: { content: "Per cc_sub_abc123def456 we chose the new schema." },
        },
      ),
    );

    const outcome = await scan(dirs);

    expect(outcome.total).toBe(1);
    expect(outcome.measurable).toBe(1);
    expect(outcome.useful).toBe(1);
    expect(outcome.appended).toBe(1);
  });

  it("records useful=false when the ID does not appear in subsequent turns", async () => {
    const dirs = setupScanDirs();
    const conversationId = "test-conv-not-useful";
    const promptAt = new Date().toISOString();
    const replyAt = new Date(Date.parse(promptAt) + 1000).toISOString();

    writeFileSync(
      dirs.hookLogPath,
      toJsonl({
        ts: promptAt,
        conversationId,
        promptPreview: "explain this code",
        gate: "evaluate",
        hits: [{ id: "cc_sub_zzz999", score: 0.8 }],
        wouldInject: ["cc_sub_zzz999"],
        estTokens: 30,
        mode: "shadow",
      }),
    );

    // The reply exists but never mentions the proposed ID.
    writeTranscript(
      dirs.transcriptsDir,
      conversationId,
      toJsonl(
        { type: "user", timestamp: promptAt },
        {
          type: "assistant",
          timestamp: replyAt,
          message: { content: "Here is the explanation." },
        },
      ),
    );

    const outcome = await scan(dirs);

    expect(outcome.useful).toBe(0);
    expect(outcome.measurable).toBe(1);

    // The persisted record must carry the negative verdict explicitly.
    const persisted = await readOnlyEntry(dirs.usefulHitLogPath);
    expect(persisted["useful"]).toBe(false);
    expect(persisted["matchedId"]).toBeNull();
  });

  it("records useful=null when no transcript is found", async () => {
    const dirs = setupScanDirs();
    const promptAt = new Date().toISOString();

    // No transcript is written for this conversation ID.
    writeFileSync(
      dirs.hookLogPath,
      toJsonl({
        ts: promptAt,
        conversationId: "missing-conv-id-xyz",
        promptPreview: "what is the error",
        gate: "evaluate",
        hits: [{ id: "cc_sub_missing", score: 1.0 }],
        wouldInject: ["cc_sub_missing"],
        estTokens: 20,
        mode: "shadow",
      }),
    );

    const outcome = await scan(dirs);

    expect(outcome.measurable).toBe(0);
    expect(outcome.useful).toBe(0);

    const persisted = await readOnlyEntry(dirs.usefulHitLogPath);
    expect(persisted["useful"]).toBeNull();
  });

  it("skips probe entries", async () => {
    const dirs = setupScanDirs();
    const promptAt = new Date().toISOString();

    // NOTE(review): presumably the prompt text is what marks this record as a
    // probe; confirm against the scanUsefulHits implementation.
    writeFileSync(
      dirs.hookLogPath,
      toJsonl({
        ts: promptAt,
        conversationId: "probe-conv",
        promptPreview: "recall test round 3",
        gate: "evaluate",
        hits: [{ id: "cc_sub_probe", score: 1.0 }],
        wouldInject: ["cc_sub_probe"],
        estTokens: 10,
        mode: "shadow",
      }),
    );

    const outcome = await scan(dirs);

    expect(outcome.total).toBe(0);
  });

  it("skips entries with empty wouldInject", async () => {
    const dirs = setupScanDirs();
    const promptAt = new Date().toISOString();

    writeFileSync(
      dirs.hookLogPath,
      toJsonl({
        ts: promptAt,
        conversationId: "conv-no-inject",
        promptPreview: "what is the status",
        gate: "generative",
        hits: [],
        wouldInject: [],
        estTokens: 0,
        mode: "shadow",
      }),
    );

    const outcome = await scan(dirs);

    expect(outcome.total).toBe(0);
  });

  it("skips stop-hook entries (kind field present)", async () => {
    const dirs = setupScanDirs();
    const promptAt = new Date().toISOString();

    // This record has a `kind` field and none of the prompt-hook fields.
    writeFileSync(
      dirs.hookLogPath,
      toJsonl({
        ts: promptAt,
        kind: "stop",
        conversationId: "conv-stop",
        surfacedCount: 2,
        citedIds: ["cc_sub_abc"],
        citationKinds: ["tool_use"],
        skipped: false,
        mode: "shadow",
      }),
    );

    const outcome = await scan(dirs);

    expect(outcome.total).toBe(0);
  });

  it("skips already-scanned entries on a second run", async () => {
    const dirs = setupScanDirs();
    const conversationId = "conv-dedup";
    const promptAt = new Date().toISOString();
    const replyAt = new Date(Date.parse(promptAt) + 1000).toISOString();

    writeFileSync(
      dirs.hookLogPath,
      toJsonl({
        ts: promptAt,
        conversationId,
        promptPreview: "help with recall",
        gate: "evaluate",
        hits: [{ id: "cc_sub_dedup123", score: 1.1 }],
        wouldInject: ["cc_sub_dedup123"],
        estTokens: 40,
        mode: "shadow",
      }),
    );

    writeTranscript(
      dirs.transcriptsDir,
      conversationId,
      toJsonl(
        { type: "user", timestamp: promptAt },
        {
          type: "assistant",
          timestamp: replyAt,
          message: { content: "Used cc_sub_dedup123 for the answer." },
        },
      ),
    );

    const firstRun = await scan(dirs);
    expect(firstRun.appended).toBe(1);

    // Same inputs again: the record is still counted but not appended twice.
    const secondRun = await scan(dirs);
    expect(secondRun.appended).toBe(0);
    expect(secondRun.total).toBe(1);
  });

  it("does not write when dryRun=true", async () => {
    const dirs = setupScanDirs();
    const promptAt = new Date().toISOString();

    writeFileSync(
      dirs.hookLogPath,
      toJsonl({
        ts: promptAt,
        conversationId: "dry-conv",
        promptPreview: "explain the bug",
        gate: "evaluate",
        hits: [{ id: "cc_sub_dry", score: 1.0 }],
        wouldInject: ["cc_sub_dry"],
        estTokens: 20,
        mode: "shadow",
      }),
    );

    const outcome = await scan(dirs, { dryRun: true });

    expect(outcome.appended).toBe(0);
    expect(outcome.total).toBe(1);

    // A dry run must leave no useful-hit log behind.
    const { existsSync } = await import("node:fs");
    expect(existsSync(dirs.usefulHitLogPath)).toBe(false);
  });
});
484
+
485
+ // ── readUsefulHitRate ────────────────────────────────────────────────────────
486
+
487
// Checks readUsefulHitRate(path, days) against hand-written useful-hit logs:
// missing file, unmeasurable-only records, a mixed log, and a time window.
describe("readUsefulHitRate", () => {
  /** Builds a temp-dir log path for the given label; nothing is created on disk. */
  const logPathFor = (label: string): string =>
    join(tmpdir(), `nlm-${label}-${Date.now()}.jsonl`);

  /** Shapes one useful-hit log record; `scannedAt` mirrors `ts` in every fixture here. */
  const hitEntry = (
    ts: string,
    conversationId: string,
    useful: boolean | null,
    returnedIds: string[],
    matchedId: string | null,
  ) => ({ ts, conversationId, useful, returnedIds, source: "hook", matchedId, scannedAt: ts });

  /** Writes the records to `path` as newline-terminated JSONL. */
  const writeLog = (path: string, entries: Array<Record<string, unknown>>): void => {
    writeFileSync(path, entries.map((entry) => `${JSON.stringify(entry)}\n`).join(""));
  };

  it("returns null when the log file is absent", async () => {
    const missing = logPathFor("no-useful");
    expect(await readUsefulHitRate(missing, 1)).toBeNull();
  });

  it("returns null when all entries have useful=null (unmeasurable)", async () => {
    const logFile = logPathFor("useful-null");
    const now = new Date().toISOString();
    writeLog(logFile, [hitEntry(now, "x", null, [], null)]);
    expect(await readUsefulHitRate(logFile, 1)).toBeNull();
  });

  it("computes the rate correctly from measurable entries", async () => {
    const logFile = logPathFor("useful-rate");
    const now = new Date().toISOString();
    writeLog(logFile, [
      hitEntry(now, "a", true, ["cc_sub_1"], "cc_sub_1"),
      hitEntry(now, "b", false, ["cc_sub_2"], null),
      hitEntry(now, "c", true, ["cc_sub_3"], "cc_sub_3"),
      hitEntry(now, "d", null, ["cc_sub_4"], null),
    ]);
    // Two useful out of three measurable records (the null one is ignored) = 0.667.
    expect(await readUsefulHitRate(logFile, 1)).toBeCloseTo(0.667, 2);
  });

  it("excludes entries outside the window", async () => {
    const logFile = logPathFor("useful-window");
    const threeDaysMs = 3 * 24 * 60 * 60 * 1000;
    const stale = new Date(Date.now() - threeDaysMs).toISOString();
    const fresh = new Date().toISOString();
    writeLog(logFile, [
      hitEntry(stale, "old", true, [], "x"),
      hitEntry(fresh, "new", false, [], null),
    ]);
    // With a one-day window only the fresh record counts: 0 useful of 1.
    expect(await readUsefulHitRate(logFile, 1)).toBe(0);
  });
});
@@ -0,0 +1,93 @@
1
+ /**
2
+ * Unit tests for OllamaClient.embed: nomic prefix scheme, L2 normalization,
3
+ * 8K char truncation. These guard the nomic-embed-text v1.5 contract.
4
+ */
5
+
6
+ import { describe, expect, it } from "vitest";
7
+ import { OllamaClient, l2Normalize } from "../../../src/llm/ollama-client.js";
8
+
9
+ type FakeFetch = typeof fetch;
10
+
11
/**
 * Wraps a value in a 200 response whose body is the value's JSON serialization
 * and whose content type is `application/json`.
 *
 * @param body Value to serialize with JSON.stringify.
 * @returns The response handed back by the fake transport.
 */
function jsonResponse(body: unknown): Response {
  const payload = JSON.stringify(body);
  const init: ResponseInit = {
    status: 200,
    headers: { "content-type": "application/json" },
  };
  return new Response(payload, init);
}
17
+
18
/**
 * Builds a stand-in for `fetch` that never touches the network: every call is
 * reduced to `{ url, body }` and answered by `reply`.
 *
 * @param reply Produces the response for a request, given its URL and its
 *              JSON-decoded body (`null` when the request carries no body).
 * @returns A function with the signature of the global `fetch`.
 */
function makeFetch(reply: (req: { url: string; body: unknown }) => Response): FakeFetch {
  return (async (input: string | URL | Request, init?: RequestInit) => {
    // A Request stringifies to "[object Request]", so its URL has to be read
    // from `.url`; strings and URL objects stringify to the URL itself.
    const url = input instanceof Request ? input.url : input.toString();

    // An explicit init.body takes precedence; otherwise fall back to the body
    // carried by a Request input (read from a clone so the caller's Request
    // stays unconsumed).
    let rawBody = init?.body ? init.body.toString() : "";
    if (!rawBody && input instanceof Request) {
      rawBody = await input.clone().text();
    }

    const body = rawBody ? JSON.parse(rawBody) : null;
    return reply({ url, body });
  }) as FakeFetch;
}
25
+
26
// Verifies what OllamaClient.embed sends (prompt prefix and length cap) and
// what it returns (a unit-length vector), using a fake fetch implementation.
describe("OllamaClient.embed prefix scheme", () => {
  /**
   * Creates a client backed by a fake transport that remembers the `prompt`
   * field of the most recent request and always answers with [1, 0, 0].
   */
  const recordingClient = () => {
    const seen = { prompt: "" };
    const fetchImpl = makeFetch(({ body }) => {
      seen.prompt = (body as { prompt: string }).prompt;
      return jsonResponse({ embedding: [1, 0, 0] });
    });
    return { client: new OllamaClient({ fetchImpl }), seen };
  };

  it("prefixes a query call with 'search_query: '", async () => {
    const { client, seen } = recordingClient();
    await client.embed("what did we decide about pgvector", "query");
    expect(seen.prompt.startsWith("search_query: ")).toBe(true);
    expect(seen.prompt).toContain("pgvector");
  });

  it("prefixes a document call with 'search_document: '", async () => {
    const { client, seen } = recordingClient();
    await client.embed("session body text", "document");
    expect(seen.prompt.startsWith("search_document: ")).toBe(true);
  });

  it("truncates text to MAX_EMBED_CHARS (8000) before prefixing", async () => {
    const { client, seen } = recordingClient();
    const oversized = "x".repeat(10_000);
    await client.embed(oversized, "document");
    // Expected prompt = "search_document: " (17 chars) + text capped at 8000 chars.
    // The cap was briefly raised to 28000 on 2026-05-25 and reverted the same
    // day: nomic-embed-text via Ollama 500s on inputs near the nominal
    // 8192-token context. The real fix is chunk + max-pool (filed as #174).
    expect(seen.prompt.length).toBe(17 + 8_000);
  });

  it("L2-normalizes the returned vector", async () => {
    const fetchImpl = makeFetch(() => jsonResponse({ embedding: [3, 4, 0] }));
    const client = new OllamaClient({ fetchImpl });
    const { vector } = await client.embed("anything", "document");

    // The raw vector [3, 4, 0] has norm 5, so the unit vector is [0.6, 0.8, 0].
    expect(vector[0]).toBeCloseTo(0.6, 6);
    expect(vector[1]).toBeCloseTo(0.8, 6);
    expect(vector[2]).toBe(0);

    let squaredLength = 0;
    for (const component of vector) {
      squaredLength += component * component;
    }
    expect(Math.sqrt(squaredLength)).toBeCloseTo(1, 6);
  });
});
79
+
80
// Direct checks of the l2Normalize helper on Float32Array inputs.
describe("l2Normalize", () => {
  it("returns a unit vector for a non-zero input", () => {
    const normalized = l2Normalize(new Float32Array([3, 4, 0]));

    let squaredLength = 0;
    for (const component of normalized) {
      squaredLength += component * component;
    }
    expect(Math.sqrt(squaredLength)).toBeCloseTo(1, 6);
  });

  it("returns the zero vector unchanged", () => {
    // An all-zero input must come back as all zeros.
    const normalized = l2Normalize(new Float32Array([0, 0, 0]));
    expect(Array.from(normalized)).toEqual([0, 0, 0]);
  });
});