nlm-memory 0.5.0 → 0.5.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (257) hide show
  1. package/README.md +89 -34
  2. package/dist/cli/digest.d.ts +20 -0
  3. package/dist/cli/digest.js +142 -0
  4. package/dist/cli/digest.js.map +1 -0
  5. package/dist/cli/nlm.d.ts +1 -0
  6. package/dist/cli/nlm.js +25 -1
  7. package/dist/cli/nlm.js.map +1 -1
  8. package/dist/core/digest/compose.d.ts +38 -0
  9. package/dist/core/digest/compose.js +93 -0
  10. package/dist/core/digest/compose.js.map +1 -0
  11. package/dist/core/digest/hook-liveness.d.ts +32 -0
  12. package/dist/core/digest/hook-liveness.js +54 -0
  13. package/dist/core/digest/hook-liveness.js.map +1 -0
  14. package/dist/http/app.js +2 -1
  15. package/dist/http/app.js.map +1 -1
  16. package/dist/mcp/server.js +20 -1
  17. package/dist/mcp/server.js.map +1 -1
  18. package/dist/ui/assets/{index-C8cpwbYJ.css → index-Beo8psd-.css} +1 -1
  19. package/dist/ui/assets/{index-CB50QnL-.js → index-CSPTTeeM.js} +8 -8
  20. package/dist/ui/index.html +2 -2
  21. package/package.json +26 -1
  22. package/.agents/plugins/marketplace.json +0 -20
  23. package/.github/workflows/ci.yml +0 -30
  24. package/docs/methodology/re-derivation-rate.md +0 -112
  25. package/docs/methodology/useful-hit-rate.md +0 -79
  26. package/docs/plans/2026-05-20-fts5-lexical-recall.md +0 -1088
  27. package/docs/plans/2026-05-20-recall-daemon-wedge-fix.md +0 -662
  28. package/docs/plans/2026-05-20-recall-hook-design.md +0 -131
  29. package/docs/plans/2026-05-20-recall-hook-implementation.md +0 -1222
  30. package/docs/plans/desktop-product.md +0 -69
  31. package/docs/plans/factstore-design.md +0 -236
  32. package/logs/CHANGELOG/CHANGELOG-2026.md +0 -1575
  33. package/logs/CHANGELOG/CHANGELOG.md +0 -209
  34. package/migrations/000_initial_schema.sql +0 -174
  35. package/migrations/001_entity_type_rename.sql +0 -17
  36. package/migrations/002_adapter_state_extend.sql +0 -12
  37. package/migrations/003_session_embeddings.sql +0 -11
  38. package/migrations/004_facts.sql +0 -46
  39. package/migrations/005_sources.sql +0 -31
  40. package/migrations/006_providers.sql +0 -33
  41. package/migrations/007_source_tokens.sql +0 -17
  42. package/migrations/008_fts_rebuild.sql +0 -9
  43. package/migrations/009_session_embedding_chunks.sql +0 -46
  44. package/migrations/010_sources_opencode.sql +0 -30
  45. package/migrations/011_sources_hermes_agent.sql +0 -30
  46. package/migrations/012_sources_aider.sql +0 -30
  47. package/migrations/013_adapter_state_failure_count.sql +0 -12
  48. package/migrations/014_sources_cursor.sql +0 -30
  49. package/migrations/015_sources_windsurf.sql +0 -30
  50. package/plugin-hermes-agent/README.md +0 -49
  51. package/plugin-hermes-agent/__init__.py +0 -75
  52. package/plugin-hermes-agent/plugin.yaml +0 -15
  53. package/scripts/backfill-citations.mjs +0 -0
  54. package/scripts/build-codex-plugin.mjs +0 -61
  55. package/scripts/deepseek-probe.mjs +0 -67
  56. package/scripts/extract-triples.mjs +0 -207
  57. package/scripts/longmemeval/embedding-cache.ts +0 -77
  58. package/scripts/longmemeval/fetch-dataset.sh +0 -25
  59. package/scripts/longmemeval/run-harness.ts +0 -315
  60. package/scripts/longmemeval/scorer.ts +0 -99
  61. package/scripts/longmemeval/tsconfig.json +0 -9
  62. package/scripts/longmemeval/types.ts +0 -35
  63. package/scripts/nlm-daily-digest.py +0 -239
  64. package/scripts/nlm-daily-digest.sh +0 -28
  65. package/src/cli/classify-parity.ts +0 -257
  66. package/src/cli/launchctl-helpers.ts +0 -49
  67. package/src/cli/nlm.ts +0 -1078
  68. package/src/core/actions/actions-log.ts +0 -118
  69. package/src/core/actions/overlay.ts +0 -117
  70. package/src/core/adapters/aider.ts +0 -205
  71. package/src/core/adapters/claude-code.ts +0 -293
  72. package/src/core/adapters/common.ts +0 -54
  73. package/src/core/adapters/cursor.ts +0 -486
  74. package/src/core/adapters/from-source.ts +0 -67
  75. package/src/core/adapters/hermes-agent.ts +0 -240
  76. package/src/core/adapters/hermes.ts +0 -277
  77. package/src/core/adapters/jsonl-generic.ts +0 -208
  78. package/src/core/adapters/opencode.ts +0 -281
  79. package/src/core/adapters/pi.ts +0 -264
  80. package/src/core/adapters/windsurf.ts +0 -386
  81. package/src/core/classifier/prompt.ts +0 -200
  82. package/src/core/dataset/build-dataset.ts +0 -463
  83. package/src/core/embedding/chunk-body.ts +0 -76
  84. package/src/core/embedding/embed-backfill.ts +0 -210
  85. package/src/core/embedding/embed-normalize.ts +0 -135
  86. package/src/core/facts/backfill-facts.ts +0 -254
  87. package/src/core/facts/extract-facts.ts +0 -50
  88. package/src/core/hook/citation-detect.ts +0 -124
  89. package/src/core/hook/cite-memo.ts +0 -68
  90. package/src/core/hook/claude-settings.ts +0 -187
  91. package/src/core/hook/gate.ts +0 -25
  92. package/src/core/hook/hook-log.ts +0 -41
  93. package/src/core/hook/memo-sweep.ts +0 -164
  94. package/src/core/hook/memo.ts +0 -67
  95. package/src/core/hook/pointer-block.ts +0 -26
  96. package/src/core/hook/select.ts +0 -32
  97. package/src/core/hook/transcript.ts +0 -121
  98. package/src/core/ingest/ingest-session.ts +0 -111
  99. package/src/core/providers/provider-models.ts +0 -100
  100. package/src/core/providers/provider-registry.ts +0 -196
  101. package/src/core/recall/citation-log.ts +0 -108
  102. package/src/core/recall/filter.ts +0 -27
  103. package/src/core/recall/index.ts +0 -6
  104. package/src/core/recall/match-fields.ts +0 -40
  105. package/src/core/recall/query-log.ts +0 -149
  106. package/src/core/recall/query-shape.ts +0 -66
  107. package/src/core/recall/recall-service.ts +0 -320
  108. package/src/core/recall/recent-log.ts +0 -59
  109. package/src/core/recall/tokenize.ts +0 -18
  110. package/src/core/recall/useful-scan.ts +0 -336
  111. package/src/core/recall-facts/fact-query-log.ts +0 -150
  112. package/src/core/recall-facts/fact-recall-service.ts +0 -327
  113. package/src/core/scheduler/scan-once.ts +0 -142
  114. package/src/core/scheduler/scheduler.ts +0 -225
  115. package/src/core/sources/source-registry.ts +0 -278
  116. package/src/core/storage/db-restore.ts +0 -133
  117. package/src/core/storage/live-status.ts +0 -45
  118. package/src/core/storage/migrate.ts +0 -72
  119. package/src/core/storage/sqlite-fact-store.ts +0 -304
  120. package/src/core/storage/sqlite-session-store.ts +0 -810
  121. package/src/hook/hook-auth.ts +0 -18
  122. package/src/hook/prompt-recall-hook.ts +0 -180
  123. package/src/hook/session-end-hook.ts +0 -81
  124. package/src/hook/session-start-hook.ts +0 -168
  125. package/src/hook/stop-hook.ts +0 -239
  126. package/src/http/app.ts +0 -1215
  127. package/src/install/claude-code.ts +0 -128
  128. package/src/install/codex.ts +0 -367
  129. package/src/install/cursor.ts +0 -68
  130. package/src/install/hermes-agent.ts +0 -76
  131. package/src/install/hermes.ts +0 -78
  132. package/src/install/nlm-dir-perms.ts +0 -55
  133. package/src/install/ollama.ts +0 -284
  134. package/src/install/setup.ts +0 -489
  135. package/src/install/windsurf.ts +0 -68
  136. package/src/llm/classifier-box.ts +0 -64
  137. package/src/llm/deepseek-client.ts +0 -150
  138. package/src/llm/env-autoload.ts +0 -55
  139. package/src/llm/ollama-client.ts +0 -189
  140. package/src/mcp/server.ts +0 -534
  141. package/src/ports/fact-store.ts +0 -102
  142. package/src/ports/llm-client.ts +0 -52
  143. package/src/ports/logger.ts +0 -16
  144. package/src/ports/session-store.ts +0 -45
  145. package/src/ports/transcript-adapter.ts +0 -55
  146. package/src/shared/types.ts +0 -149
  147. package/src/ui/App.tsx +0 -58
  148. package/src/ui/components/PromoteOpenButton.tsx +0 -65
  149. package/src/ui/components/SessionDrawer.tsx +0 -199
  150. package/src/ui/components/SideNav.tsx +0 -162
  151. package/src/ui/components/Skeleton.tsx +0 -107
  152. package/src/ui/index.html +0 -13
  153. package/src/ui/lib/actions.ts +0 -30
  154. package/src/ui/lib/api.ts +0 -92
  155. package/src/ui/lib/dataset.ts +0 -141
  156. package/src/ui/lib/registries.ts +0 -155
  157. package/src/ui/lib/view-settings.ts +0 -41
  158. package/src/ui/main.tsx +0 -15
  159. package/src/ui/pages/Live.tsx +0 -229
  160. package/src/ui/pages/Pulse.tsx +0 -415
  161. package/src/ui/pages/Recall.tsx +0 -190
  162. package/src/ui/pages/River.tsx +0 -354
  163. package/src/ui/pages/Search.tsx +0 -386
  164. package/src/ui/pages/Stub.tsx +0 -9
  165. package/src/ui/pages/Thread.tsx +0 -473
  166. package/src/ui/pages/settings/Classifier.tsx +0 -227
  167. package/src/ui/pages/settings/Data.tsx +0 -190
  168. package/src/ui/pages/settings/Index.tsx +0 -65
  169. package/src/ui/pages/settings/Labels.tsx +0 -224
  170. package/src/ui/pages/settings/Providers.tsx +0 -305
  171. package/src/ui/pages/settings/SettingsSubnav.tsx +0 -28
  172. package/src/ui/pages/settings/Sources.tsx +0 -326
  173. package/src/ui/pages/settings/Views.tsx +0 -96
  174. package/src/ui/styles.css +0 -1890
  175. package/src/ui/tsconfig.json +0 -21
  176. package/src/ui/vite.config.ts +0 -19
  177. package/tests/fixtures/claude_code/short_session.jsonl +0 -2
  178. package/tests/fixtures/claude_code/standard_iso.jsonl +0 -4
  179. package/tests/fixtures/claude_code/tool_heavy.jsonl +0 -8
  180. package/tests/fixtures/claude_code/with_subagent.jsonl +0 -7
  181. package/tests/fixtures/facts.ts +0 -17
  182. package/tests/fixtures/golden-corpus.ts +0 -85
  183. package/tests/fixtures/hermes/paired_request_dump.json +0 -24
  184. package/tests/fixtures/hermes/paired_session.json +0 -23
  185. package/tests/fixtures/hermes/request_dump.json +0 -28
  186. package/tests/fixtures/hermes/session_iso.json +0 -38
  187. package/tests/fixtures/hermes/session_unix.json +0 -38
  188. package/tests/fixtures/hermes/system_only.json +0 -18
  189. package/tests/fixtures/pi/error-connection-abort.jsonl +0 -8
  190. package/tests/fixtures/pi/short-successful.jsonl +0 -5
  191. package/tests/fixtures/pi/with-custom-message.jsonl +0 -6
  192. package/tests/fixtures/sessions.ts +0 -22
  193. package/tests/integration/backfill-facts.test.ts +0 -362
  194. package/tests/integration/citation-explicit.test.ts +0 -111
  195. package/tests/integration/cite-event.test.ts +0 -169
  196. package/tests/integration/cite-memo.test.ts +0 -87
  197. package/tests/integration/db-restore.test.ts +0 -153
  198. package/tests/integration/embed-backfill.test.ts +0 -176
  199. package/tests/integration/fact-supersedence.test.ts +0 -313
  200. package/tests/integration/fts-index.test.ts +0 -60
  201. package/tests/integration/getbyids-sqlite.test.ts +0 -100
  202. package/tests/integration/hermes-agent-hooks.test.ts +0 -248
  203. package/tests/integration/hook-claude-settings.test.ts +0 -218
  204. package/tests/integration/hook-log.test.ts +0 -54
  205. package/tests/integration/hook-memo.test.ts +0 -68
  206. package/tests/integration/hook-pre-compact.test.ts +0 -105
  207. package/tests/integration/hook-subagent-start.test.ts +0 -102
  208. package/tests/integration/http.test.ts +0 -401
  209. package/tests/integration/keyword-search-fts.test.ts +0 -66
  210. package/tests/integration/mcp-recall-logging.test.ts +0 -88
  211. package/tests/integration/mcp.test.ts +0 -260
  212. package/tests/integration/memo-sweep.test.ts +0 -91
  213. package/tests/integration/prompt-recall-hook.test.ts +0 -88
  214. package/tests/integration/provider-registry.test.ts +0 -107
  215. package/tests/integration/recall-golden.test.ts +0 -59
  216. package/tests/integration/recall-sqlite.test.ts +0 -169
  217. package/tests/integration/scheduler.test.ts +0 -391
  218. package/tests/integration/session-end-hook.test.ts +0 -48
  219. package/tests/integration/session-start-hook.test.ts +0 -126
  220. package/tests/integration/source-registry.test.ts +0 -122
  221. package/tests/integration/sqlite-fact-store.test.ts +0 -346
  222. package/tests/integration/stop-hook.test.ts +0 -560
  223. package/tests/integration/wal-checkpoint.test.ts +0 -49
  224. package/tests/unit/cli/launchctl-helpers.test.ts +0 -60
  225. package/tests/unit/core/adapters/aider.test.ts +0 -230
  226. package/tests/unit/core/adapters/claude-code.test.ts +0 -118
  227. package/tests/unit/core/adapters/cursor.test.ts +0 -485
  228. package/tests/unit/core/adapters/hermes-agent.test.ts +0 -329
  229. package/tests/unit/core/adapters/hermes.test.ts +0 -81
  230. package/tests/unit/core/adapters/jsonl-generic.test.ts +0 -142
  231. package/tests/unit/core/adapters/opencode.test.ts +0 -354
  232. package/tests/unit/core/adapters/pi.test.ts +0 -110
  233. package/tests/unit/core/adapters/windsurf.test.ts +0 -416
  234. package/tests/unit/core/classifier/prompt.test.ts +0 -126
  235. package/tests/unit/core/embedding/chunk-body.test.ts +0 -100
  236. package/tests/unit/core/facts/extract-facts.test.ts +0 -117
  237. package/tests/unit/core/filter.test.ts +0 -40
  238. package/tests/unit/core/hook/citation-detect-cite-session.test.ts +0 -96
  239. package/tests/unit/core/hook/citation-detect.test.ts +0 -124
  240. package/tests/unit/core/hook/gate.test.ts +0 -29
  241. package/tests/unit/core/hook/pointer-block.test.ts +0 -22
  242. package/tests/unit/core/hook/select.test.ts +0 -66
  243. package/tests/unit/core/match-fields.test.ts +0 -39
  244. package/tests/unit/core/mcp-cite-session.test.ts +0 -51
  245. package/tests/unit/core/providers/provider-models.test.ts +0 -101
  246. package/tests/unit/core/query-shape.test.ts +0 -92
  247. package/tests/unit/core/recall-facts/fact-recall-service.test.ts +0 -258
  248. package/tests/unit/core/recall-service.test.ts +0 -200
  249. package/tests/unit/core/storage/live-status.test.ts +0 -54
  250. package/tests/unit/core/tokenize.test.ts +0 -32
  251. package/tests/unit/core/useful-scan.test.ts +0 -537
  252. package/tests/unit/llm/embed.test.ts +0 -93
  253. package/tests/unit/llm/ollama-client.test.ts +0 -124
  254. package/tests/unit/scripts/longmemeval-scorer.test.ts +0 -114
  255. package/tsconfig.json +0 -31
  256. package/tsconfig.test.json +0 -11
  257. package/vitest.config.ts +0 -22
@@ -1,320 +0,0 @@
1
- /**
2
- * RecallService — the use case. Composes filters, keyword scoring, and
3
- * semantic search into a single recall operation.
4
- *
5
- * Depends only on ports (SessionStore, LLMClient). No framework imports,
6
- * no SQLite, no HTTP. Tests substitute fake adapters.
7
- */
8
-
9
- import type { LLMClient } from "@ports/llm-client.js";
10
- import { LLMUnreachableError } from "@ports/llm-client.js";
11
- import type {
12
- KeywordNeighbor,
13
- SemanticNeighbor,
14
- SessionStore,
15
- } from "@ports/session-store.js";
16
- import type {
17
- MatchField,
18
- RecallHit,
19
- RecallMode,
20
- RecallQuery,
21
- RecallResult,
22
- Session,
23
- } from "@shared/types.js";
24
- import { applyFilter } from "./filter.js";
25
- import { keywordMatchFields } from "./match-fields.js";
26
- import { detectQueryShape } from "./query-shape.js";
27
- import { tokenSet } from "./tokenize.js";
28
-
29
/** Page size applied when the caller does not pass a limit. */
const DEFAULT_LIMIT = 20;

/** Upper bound on the page size a caller may request. */
const MAX_LIMIT = 100;

/**
 * Reciprocal Rank Fusion constant (Cormack et al. 2009); 60 is the canonical
 * default from the literature. RRF fuses ranked lists from several retrievers
 * by summing 1/(k + rank) per retriever and ignores the raw scores, so it
 * copes with very different score distributions (unbounded BM25 vs cosine in
 * [-1, 1]) without any normalization step.
 */
const RRF_K = 60;

/** Multiplier applied to `limit` when requesting neighbors from the semantic leg. */
const SEMANTIC_OVERFETCH = 3;

/** Multiplier applied to `limit` when requesting neighbors from the keyword leg. */
const KEYWORD_OVERFETCH = 3;
39
-
40
/** Ports handed to the recall service at construction time. */
export interface RecallServiceDeps {
  /** Store queried for keyword/semantic neighbors and for the hit sessions. */
  readonly store: SessionStore;
  /** Client used to embed the query text for the semantic leg. */
  readonly llm: LLMClient;
}
44
-
45
/**
 * Recall use case: runs the keyword and/or semantic search legs, resolves only
 * the sessions those legs returned, applies the entity/kind filter to them and
 * shapes the result for the requested mode.
 */
export class RecallService {
  constructor(private readonly deps: RecallServiceDeps) {}

  /**
   * Execute one recall query.
   *
   * @param input - Query text plus optional mode, limit, entity and kind.
   * @returns The ranked hits (at most `limit`). `modeUnavailable` is set when
   *   the semantic leg could not run because the LLM was unreachable; in
   *   pure semantic mode the result is then empty, in hybrid mode it falls
   *   back to the keyword leg alone.
   * @throws Any error from the store or LLM other than `LLMUnreachableError`.
   */
  async search(input: RecallQuery): Promise<RecallResult> {
    const mode: RecallMode = input.mode ?? "keyword";
    const limit = clampLimit(input.limit);
    const entity = input.entity ?? null;
    const kind = input.kind ?? null;
    const wantsKeyword = mode === "keyword" || mode === "hybrid";
    const wantsSemantic = mode === "semantic" || mode === "hybrid";

    const nothing: RecallResult = {
      query: input.query,
      entity,
      kind,
      mode,
      limit,
      total: 0,
      results: [],
    };

    // Nothing to search on and nothing to filter by.
    if (!(input.query || entity || kind)) return nothing;

    // 1. Search legs — ranked neighbor IDs only, no session bodies yet.
    let kwNeighbors: ReadonlyArray<KeywordNeighbor> = [];
    if (wantsKeyword && input.query) {
      kwNeighbors = await this.deps.store.keywordSearch(
        input.query,
        limit * KEYWORD_OVERFETCH,
      );
    }

    let semNeighbors: ReadonlyArray<SemanticNeighbor> = [];
    let semError: "ollama_unreachable" | null = null;
    if (wantsSemantic && input.query) {
      [semNeighbors, semError] = await this.semanticLeg(
        input.query,
        limit * SEMANTIC_OVERFETCH,
      );
    }

    if (mode === "semantic" && semError) {
      return { ...nothing, modeUnavailable: semError };
    }

    // 2. Load just the sessions the legs pointed at. Sessions rejected by the
    //    entity/kind filter never enter `byId`, so they are skipped below.
    const hitSessions = await this.deps.store.getByIds(
      uniqueIds(kwNeighbors, semNeighbors),
    );
    const filterArgs: { entity?: string; kind?: typeof input.kind } = {};
    if (input.entity !== undefined) filterArgs.entity = input.entity;
    if (input.kind !== undefined) filterArgs.kind = input.kind;
    const byId = new Map<string, Session>();
    for (const kept of applyFilter(hitSessions, filterArgs)) {
      byId.set(kept.id, kept);
    }

    // 3. Turn neighbors into hits, keeping each leg's rank order.
    let queryTokens: Set<string>;
    if (input.query) {
      queryTokens = new Set(tokenSet(input.query));
    } else {
      queryTokens = new Set<string>();
    }

    const kwHits: KeywordHit[] = [];
    for (const neighbor of kwNeighbors) {
      const session = byId.get(neighbor.sessionId);
      if (session) {
        kwHits.push({
          session,
          score: neighbor.score,
          matchedIn: keywordMatchFields(session, queryTokens),
        });
      }
    }

    const semHits: SemanticHit[] = [];
    for (const neighbor of semNeighbors) {
      const session = byId.get(neighbor.sessionId);
      if (session) {
        semHits.push({ session, similarity: cosineFromL2(neighbor.distance) });
      }
    }

    // 4. Shape the answer for the requested mode.
    switch (mode) {
      case "keyword":
        return finalize(input.query, entity, kind, mode, limit, kwHits.map(toKeywordHit));
      case "semantic":
        return finalize(input.query, entity, kind, mode, limit, semHits.map(toSemanticHit));
      default: {
        const merged = mergeHybrid(kwHits, semHits);
        const shape = detectQueryShape(input.query);
        const ranked =
          shape.hasTemporal && shape.hasNamedEntity
            ? forceIncludeKeywordTop(merged, kwHits, limit)
            : merged;
        const result = finalize(input.query, entity, kind, mode, limit, ranked);
        return semError ? { ...result, modeUnavailable: semError } : result;
      }
    }
  }

  /**
   * Embed the query and fetch its nearest sessions.
   *
   * @returns `[neighbors, null]` on success, or `[[], "ollama_unreachable"]`
   *   when either step raised `LLMUnreachableError`. Other errors propagate.
   */
  private async semanticLeg(
    query: string,
    fetchCount: number,
  ): Promise<[ReadonlyArray<SemanticNeighbor>, "ollama_unreachable" | null]> {
    try {
      const embedding = await this.deps.llm.embed(query, "query");
      const neighbors = await this.deps.store.semanticSearch(embedding.vector, fetchCount);
      return [neighbors, null];
    } catch (err) {
      if (!(err instanceof LLMUnreachableError)) throw err;
      return [[], "ollama_unreachable"];
    }
  }
}
145
-
146
/**
 * Collect the session IDs named by either leg, without duplicates.
 * Keyword-leg IDs come first; within each leg the rank order is kept and an
 * ID keeps the position of its first occurrence.
 */
function uniqueIds(
  kw: ReadonlyArray<KeywordNeighbor>,
  sem: ReadonlyArray<SemanticNeighbor>,
): ReadonlyArray<string> {
  const inLegOrder = [...kw, ...sem].map((neighbor) => neighbor.sessionId);
  return Array.from(new Set<string>(inLegOrder));
}
155
-
156
/** A keyword-leg neighbor after its session has been resolved. */
interface KeywordHit {
  /** The resolved session. */
  readonly session: Session;
  /** Score reported by the keyword search for this session. */
  readonly score: number;
  /** Session fields in which the query tokens were found. */
  readonly matchedIn: ReadonlyArray<MatchField>;
}
161
-
162
/** A semantic-leg neighbor after its session has been resolved. */
interface SemanticHit {
  /** The resolved session. */
  readonly session: Session;
  /** Cosine similarity derived from the neighbor's L2 distance. */
  readonly similarity: number;
}
166
-
167
/**
 * Reciprocal Rank Fusion across the keyword + semantic legs.
 *
 * matchScore = Σ 1/(RRF_K + rank_i) over every retriever the session appears
 * in (ranks are 1-based). A session at rank 1 in both retrievers therefore
 * scores ~0.0328 (the maximum with two retrievers at k=60); a session at
 * rank 1 in one retriever and absent from the other scores ~0.0164.
 *
 * Rows are ordered by the UNROUNDED fused score. The reported `matchScore` is
 * rounded to four decimals for display only; ordering on the rounded value
 * would collapse distinct fused scores into ties (e.g. kw#2+sem#2 and
 * kw#3+sem#1 both display as 0.0323). Exact ties keep keyword-leg order first,
 * then semantic-only sessions in semantic-leg order.
 *
 * keywordScore and semanticScore are informational only — each leg's raw
 * value divided by that leg's maximum, with the divisor floored at 1 — so
 * the UI can show "how strong was each leg". They do not feed matchScore.
 *
 * @param kwHits - Keyword-leg hits in rank order (best first).
 * @param semHits - Semantic-leg hits in rank order (best first).
 * @returns One row per distinct session, best fused score first.
 */
function mergeHybrid(
  kwHits: ReadonlyArray<KeywordHit>,
  semHits: ReadonlyArray<SemanticHit>,
): ReadonlyArray<RecallHit> {
  // Floor of 1 keeps the divisor non-zero for empty or all-zero legs.
  const maxKw = Math.max(1, ...kwHits.map((h) => h.score));
  const maxSem = Math.max(1, ...semHits.map((h) => h.similarity));

  // id → (hit, 1-based rank) per leg.
  const kwById = new Map<string, { readonly hit: KeywordHit; readonly rank: number }>();
  kwHits.forEach((hit, i) => kwById.set(hit.session.id, { hit, rank: i + 1 }));
  const semById = new Map<string, { readonly hit: SemanticHit; readonly rank: number }>();
  semHits.forEach((hit, i) => semById.set(hit.session.id, { hit, rank: i + 1 }));

  const allIds = new Set<string>([...kwById.keys(), ...semById.keys()]);

  const scored: Array<{ readonly rrf: number; readonly row: RecallHit }> = [];
  for (const id of allIds) {
    const kw = kwById.get(id);
    const sem = semById.get(id);
    const session = kw?.hit.session ?? sem?.hit.session;
    if (session === undefined) continue; // every id comes from one of the maps

    const rrf =
      (kw ? 1 / (RRF_K + kw.rank) : 0) +
      (sem ? 1 / (RRF_K + sem.rank) : 0);
    const semanticField: ReadonlyArray<MatchField> = sem ? ["semantic"] : [];

    scored.push({
      rrf,
      row: {
        ...sessionHitFields(session),
        matchScore: round4(rrf),
        matchedIn: uniqueFields(kw?.hit.matchedIn ?? [], semanticField),
        keywordScore: kw ? round4(kw.hit.score / maxKw) : 0,
        semanticScore: sem ? round4(sem.hit.similarity / maxSem) : 0,
      },
    });
  }

  // Sort on the full-precision score; Array.prototype.sort is stable.
  scored.sort((a, b) => b.rrf - a.rrf);
  return scored.map((entry) => entry.row);
}
217
-
218
/**
 * Force-include the keyword-leg rank-1 session into the merged top-`limit`
 * result. Only invoked when the query shape (temporal + named entity)
 * indicates a Mode A pattern where pure RRF is known to demote keyword
 * winners (see query-shape.ts for diagnosis).
 *
 * If the rank-1 keyword session is already inside the first `limit` rows, or
 * is not present in `merged` at all, `merged` is returned unchanged.
 * Otherwise the session is MOVED to position `limit - 1`: the row that was
 * there slides to position `limit`, and the session no longer appears at its
 * old position, so the returned list has the same length as `merged` and
 * contains no duplicates.
 *
 * @param merged - Fused rows, best first.
 * @param kwHits - Keyword-leg hits in rank order; only the first is used.
 * @param limit - Size of the window the session must land in.
 * @returns The re-ordered rows (or `merged` itself when nothing changes).
 */
function forceIncludeKeywordTop(
  merged: ReadonlyArray<RecallHit>,
  kwHits: ReadonlyArray<KeywordHit>,
  limit: number,
): ReadonlyArray<RecallHit> {
  const leader = kwHits[0];
  if (leader === undefined || merged.length === 0) return merged;

  const topId = leader.session.id;
  const at = merged.findIndex((h) => h.id === topId);
  // Absent from the merged list, or already inside the window: nothing to do.
  if (at === -1 || at < limit) return merged;

  const forcedHit = merged[at];
  if (forcedHit === undefined) return merged;

  const slot = Math.max(0, limit - 1);
  // Remove the hit from its old position before re-inserting it, so it is
  // neither duplicated nor does it push the displaced row out of the list.
  const others = merged.filter((_, i) => i !== at);
  return [...others.slice(0, slot), forcedHit, ...others.slice(slot)];
}
241
-
242
/** Shape a keyword-leg hit as a result row; the raw keyword score becomes `matchScore`. */
function toKeywordHit(h: KeywordHit): RecallHit {
  const { session, score, matchedIn } = h;
  return { ...sessionHitFields(session), matchScore: score, matchedIn };
}
249
-
250
/** Shape a semantic-leg hit as a result row; the similarity becomes `matchScore`. */
function toSemanticHit(h: SemanticHit): RecallHit {
  const { session, similarity } = h;
  return {
    ...sessionHitFields(session),
    matchScore: similarity,
    matchedIn: ["semantic"],
  };
}
257
-
258
/**
 * Pick the session properties that every result row carries. Any other
 * property of the session is left out.
 */
function sessionHitFields(s: Session) {
  const { id, startedAt, label, summary, entities, decisions, open, status } = s;
  return { id, startedAt, label, summary, entities, decisions, open, status } as const;
}
270
-
271
/**
 * Assemble the response envelope.
 *
 * @returns The echoed query parameters, `total` = number of hits before
 *   truncation, and `results` = the first `limit` hits.
 */
function finalize(
  query: string,
  entity: string | null,
  kind: RecallResult["kind"],
  mode: RecallMode,
  limit: number,
  hits: ReadonlyArray<RecallHit>,
): RecallResult {
  const total = hits.length;
  const results = hits.slice(0, limit);
  return { query, entity, kind, mode, limit, total, results };
}
289
-
290
/**
 * Normalize a caller-supplied page size: missing → DEFAULT_LIMIT, NaN or
 * anything below 1 → 1, otherwise the integer part capped at MAX_LIMIT.
 */
function clampLimit(limit: number | undefined): number {
  const requested = limit ?? DEFAULT_LIMIT;
  const usable = !Number.isNaN(requested) && requested >= 1;
  return usable ? Math.min(MAX_LIMIT, Math.trunc(requested)) : 1;
}
295
-
296
/**
 * Convert an L2 distance into a cosine similarity, clamped to [-1, 1] and
 * rounded to four decimals.
 */
function cosineFromL2(distance: number): number {
  // session_embeddings stores unit-normalized vectors, and for unit vectors
  // cos_sim = 1 - L2^2 / 2. Mirrors recall.py:_run_semantic.
  const halfSquared = (distance * distance) / 2;
  const similarity = 1 - halfSquared;
  const clamped = Math.max(-1, Math.min(1, similarity));
  return round4(clamped);
}
302
-
303
/** Round to four decimal places using `Math.round` on the value scaled by 10 000. */
function round4(value: number): number {
  const scale = 10_000;
  const scaled = Math.round(value * scale);
  return scaled / scale;
}
306
-
307
/**
 * Concatenate two match-field lists and drop repeats, keeping each field at
 * the position of its first occurrence (`a` before `b`).
 */
function uniqueFields(
  a: ReadonlyArray<MatchField>,
  b: ReadonlyArray<MatchField>,
): ReadonlyArray<MatchField> {
  // A Set iterates in insertion order, so first occurrences win.
  return [...new Set<MatchField>([...a, ...b])];
}
@@ -1,59 +0,0 @@
1
- /**
2
- * recentLog — tail the query log for the /live observability panel.
3
- * Returns the last N entries in reverse-chronological order (most recent first).
4
- */
5
-
6
- import { readFileSync, existsSync, statSync } from "node:fs";
7
- import { homedir } from "node:os";
8
- import { join } from "node:path";
9
-
10
/** One query-log line, normalized for the /live observability panel. */
export interface RecentLogEntry {
  /** Timestamp string from the log line; empty when the line has none. */
  readonly ts: string;
  /** Origin of the query; `"unknown"` when the line has none. */
  readonly source: string;
  /** Query text, or `null` when absent. */
  readonly query: string | null;
  /** Entity filter, or `null` when absent. */
  readonly entity: string | null;
  /** Kind filter, or `null` when absent. */
  readonly kind: string | null;
  /** Recall mode; `"keyword"` when the line has none. */
  readonly mode: string;
  /** Requested page size; `0` when absent. */
  readonly limit: number;
  /** Number of results reported by the line (`n_results`); `0` when absent. */
  readonly nResults: number;
  /** Session IDs reported by the line (`returned_ids`), strings only. */
  readonly returnedIds: ReadonlyArray<string>;
}
21
-
22
/** Resolve the query-log path: `NLM_QUERY_LOG` when set, else `~/.nlm/query_log.jsonl`. */
function defaultLogPath(): string {
  return process.env["NLM_QUERY_LOG"] ?? join(homedir(), ".nlm", "query_log.jsonl");
}

/** Size, in bytes, of the window inspected at the end of the log file. */
const TAIL_BYTES = 256 * 1024;

/** Byte value of "\n". It never occurs inside a multi-byte UTF-8 sequence. */
const NEWLINE_BYTE = 0x0a;

/**
 * Parse one JSONL line into a normalized entry.
 *
 * @returns The entry, or `null` for blank lines, invalid JSON, and JSON that
 *   is not a plain object (numbers, strings, arrays, `null`).
 */
function parseLogLine(line: string): RecentLogEntry | null {
  const trimmed = line.trim();
  if (!trimmed) return null;

  let parsed: unknown;
  try {
    parsed = JSON.parse(trimmed);
  } catch {
    // Best-effort tail: a corrupt line must not hide the others.
    return null;
  }
  if (typeof parsed !== "object" || parsed === null || Array.isArray(parsed)) return null;

  const raw = parsed as Record<string, unknown>;
  const text = (key: string): string | null => {
    const value = raw[key];
    return typeof value === "string" ? value : null;
  };
  const count = (key: string): number => {
    const value = raw[key];
    return typeof value === "number" ? value : 0;
  };
  const ids: unknown = raw["returned_ids"];

  return {
    ts: text("ts") ?? "",
    source: text("source") ?? "unknown",
    query: text("query"),
    entity: text("entity"),
    kind: text("kind"),
    mode: text("mode") ?? "keyword",
    limit: count("limit"),
    nResults: count("n_results"),
    returnedIds: Array.isArray(ids)
      ? ids.filter((x): x is string => typeof x === "string")
      : [],
  };
}

/**
 * Read the most recent entries of the query log.
 *
 * Only the last `TAIL_BYTES` bytes of the file are decoded and parsed. The
 * window is cut on the raw bytes (not on the decoded string), and a first
 * line that was cut in half is discarded, so multi-byte UTF-8 content cannot
 * shift or empty the window.
 *
 * @param limit - Maximum number of entries to return; values below 1 and NaN
 *   yield an empty list, fractions are truncated.
 * @param logPath - Log file to read; defaults to `defaultLogPath()`.
 * @returns Entries sorted by `ts` descending (most recent first). A missing or
 *   empty file yields `[]`; unparseable lines are skipped.
 */
export function recentQueryLog(limit: number, logPath: string = defaultLogPath()): RecentLogEntry[] {
  if (!existsSync(logPath) || statSync(logPath).size === 0) return [];

  // No encoding → Buffer, so offsets below are byte offsets.
  const bytes = readFileSync(logPath);
  const start = Math.max(0, bytes.length - TAIL_BYTES);
  let window = bytes.subarray(start);
  if (start > 0 && bytes[start - 1] !== NEWLINE_BYTE) {
    // The window begins mid-line: skip ahead to the first complete line.
    const firstBreak = window.indexOf(NEWLINE_BYTE);
    window = firstBreak === -1 ? window.subarray(window.length) : window.subarray(firstBreak + 1);
  }

  const entries: RecentLogEntry[] = [];
  for (const line of window.toString("utf8").split("\n")) {
    const entry = parseLogLine(line);
    if (entry !== null) entries.push(entry);
  }

  entries.sort((a, b) => b.ts.localeCompare(a.ts));
  // A negative count would make slice() drop entries from the END instead.
  const cap = Number.isNaN(limit) ? 0 : Math.max(0, Math.trunc(limit));
  return entries.slice(0, cap);
}
@@ -1,18 +0,0 @@
1
- /**
2
- * Tokenizer mirrors recall.py:_TOKEN_RE. Identical regex, lowercase normalize.
3
- * Pure function. The keyword scorer's parity with the Python implementation
4
- * starts here.
5
- */
6
-
7
/** A token starts with an ASCII letter or digit and continues with letters, digits, `_`, `.` or `-`. */
const TOKEN_PATTERN = /[A-Za-z0-9][A-Za-z0-9_.-]*/g;

/**
 * Split text into lowercase tokens, in order of appearance.
 *
 * @returns The tokens; an empty list for `null`, `undefined`, empty text or
 *   text without any token.
 */
export function tokenize(text: string | null | undefined): ReadonlyArray<string> {
  const found = text ? text.match(TOKEN_PATTERN) : null;
  return (found ?? []).map((token) => token.toLowerCase());
}
15
-
16
/** The distinct lowercase tokens of `text`; empty for `null`, `undefined` or token-free text. */
export function tokenSet(text: string | null | undefined): Set<string> {
  const tokens = tokenize(text);
  return new Set<string>(tokens);
}