nlm-memory 0.5.0 → 0.5.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (247) hide show
  1. package/README.md +72 -34
  2. package/dist/cli/nlm.js +2 -1
  3. package/dist/cli/nlm.js.map +1 -1
  4. package/dist/http/app.js +2 -1
  5. package/dist/http/app.js.map +1 -1
  6. package/dist/mcp/server.js +20 -1
  7. package/dist/mcp/server.js.map +1 -1
  8. package/dist/ui/assets/{index-C8cpwbYJ.css → index-Beo8psd-.css} +1 -1
  9. package/dist/ui/assets/{index-CB50QnL-.js → index-CSPTTeeM.js} +8 -8
  10. package/dist/ui/index.html +2 -2
  11. package/package.json +26 -1
  12. package/.agents/plugins/marketplace.json +0 -20
  13. package/.github/workflows/ci.yml +0 -30
  14. package/docs/methodology/re-derivation-rate.md +0 -112
  15. package/docs/methodology/useful-hit-rate.md +0 -79
  16. package/docs/plans/2026-05-20-fts5-lexical-recall.md +0 -1088
  17. package/docs/plans/2026-05-20-recall-daemon-wedge-fix.md +0 -662
  18. package/docs/plans/2026-05-20-recall-hook-design.md +0 -131
  19. package/docs/plans/2026-05-20-recall-hook-implementation.md +0 -1222
  20. package/docs/plans/desktop-product.md +0 -69
  21. package/docs/plans/factstore-design.md +0 -236
  22. package/logs/CHANGELOG/CHANGELOG-2026.md +0 -1575
  23. package/logs/CHANGELOG/CHANGELOG.md +0 -209
  24. package/migrations/000_initial_schema.sql +0 -174
  25. package/migrations/001_entity_type_rename.sql +0 -17
  26. package/migrations/002_adapter_state_extend.sql +0 -12
  27. package/migrations/003_session_embeddings.sql +0 -11
  28. package/migrations/004_facts.sql +0 -46
  29. package/migrations/005_sources.sql +0 -31
  30. package/migrations/006_providers.sql +0 -33
  31. package/migrations/007_source_tokens.sql +0 -17
  32. package/migrations/008_fts_rebuild.sql +0 -9
  33. package/migrations/009_session_embedding_chunks.sql +0 -46
  34. package/migrations/010_sources_opencode.sql +0 -30
  35. package/migrations/011_sources_hermes_agent.sql +0 -30
  36. package/migrations/012_sources_aider.sql +0 -30
  37. package/migrations/013_adapter_state_failure_count.sql +0 -12
  38. package/migrations/014_sources_cursor.sql +0 -30
  39. package/migrations/015_sources_windsurf.sql +0 -30
  40. package/plugin-hermes-agent/README.md +0 -49
  41. package/plugin-hermes-agent/__init__.py +0 -75
  42. package/plugin-hermes-agent/plugin.yaml +0 -15
  43. package/scripts/backfill-citations.mjs +0 -0
  44. package/scripts/build-codex-plugin.mjs +0 -61
  45. package/scripts/deepseek-probe.mjs +0 -67
  46. package/scripts/extract-triples.mjs +0 -207
  47. package/scripts/longmemeval/embedding-cache.ts +0 -77
  48. package/scripts/longmemeval/fetch-dataset.sh +0 -25
  49. package/scripts/longmemeval/run-harness.ts +0 -315
  50. package/scripts/longmemeval/scorer.ts +0 -99
  51. package/scripts/longmemeval/tsconfig.json +0 -9
  52. package/scripts/longmemeval/types.ts +0 -35
  53. package/scripts/nlm-daily-digest.py +0 -239
  54. package/scripts/nlm-daily-digest.sh +0 -28
  55. package/src/cli/classify-parity.ts +0 -257
  56. package/src/cli/launchctl-helpers.ts +0 -49
  57. package/src/cli/nlm.ts +0 -1078
  58. package/src/core/actions/actions-log.ts +0 -118
  59. package/src/core/actions/overlay.ts +0 -117
  60. package/src/core/adapters/aider.ts +0 -205
  61. package/src/core/adapters/claude-code.ts +0 -293
  62. package/src/core/adapters/common.ts +0 -54
  63. package/src/core/adapters/cursor.ts +0 -486
  64. package/src/core/adapters/from-source.ts +0 -67
  65. package/src/core/adapters/hermes-agent.ts +0 -240
  66. package/src/core/adapters/hermes.ts +0 -277
  67. package/src/core/adapters/jsonl-generic.ts +0 -208
  68. package/src/core/adapters/opencode.ts +0 -281
  69. package/src/core/adapters/pi.ts +0 -264
  70. package/src/core/adapters/windsurf.ts +0 -386
  71. package/src/core/classifier/prompt.ts +0 -200
  72. package/src/core/dataset/build-dataset.ts +0 -463
  73. package/src/core/embedding/chunk-body.ts +0 -76
  74. package/src/core/embedding/embed-backfill.ts +0 -210
  75. package/src/core/embedding/embed-normalize.ts +0 -135
  76. package/src/core/facts/backfill-facts.ts +0 -254
  77. package/src/core/facts/extract-facts.ts +0 -50
  78. package/src/core/hook/citation-detect.ts +0 -124
  79. package/src/core/hook/cite-memo.ts +0 -68
  80. package/src/core/hook/claude-settings.ts +0 -187
  81. package/src/core/hook/gate.ts +0 -25
  82. package/src/core/hook/hook-log.ts +0 -41
  83. package/src/core/hook/memo-sweep.ts +0 -164
  84. package/src/core/hook/memo.ts +0 -67
  85. package/src/core/hook/pointer-block.ts +0 -26
  86. package/src/core/hook/select.ts +0 -32
  87. package/src/core/hook/transcript.ts +0 -121
  88. package/src/core/ingest/ingest-session.ts +0 -111
  89. package/src/core/providers/provider-models.ts +0 -100
  90. package/src/core/providers/provider-registry.ts +0 -196
  91. package/src/core/recall/citation-log.ts +0 -108
  92. package/src/core/recall/filter.ts +0 -27
  93. package/src/core/recall/index.ts +0 -6
  94. package/src/core/recall/match-fields.ts +0 -40
  95. package/src/core/recall/query-log.ts +0 -149
  96. package/src/core/recall/query-shape.ts +0 -66
  97. package/src/core/recall/recall-service.ts +0 -320
  98. package/src/core/recall/recent-log.ts +0 -59
  99. package/src/core/recall/tokenize.ts +0 -18
  100. package/src/core/recall/useful-scan.ts +0 -336
  101. package/src/core/recall-facts/fact-query-log.ts +0 -150
  102. package/src/core/recall-facts/fact-recall-service.ts +0 -327
  103. package/src/core/scheduler/scan-once.ts +0 -142
  104. package/src/core/scheduler/scheduler.ts +0 -225
  105. package/src/core/sources/source-registry.ts +0 -278
  106. package/src/core/storage/db-restore.ts +0 -133
  107. package/src/core/storage/live-status.ts +0 -45
  108. package/src/core/storage/migrate.ts +0 -72
  109. package/src/core/storage/sqlite-fact-store.ts +0 -304
  110. package/src/core/storage/sqlite-session-store.ts +0 -810
  111. package/src/hook/hook-auth.ts +0 -18
  112. package/src/hook/prompt-recall-hook.ts +0 -180
  113. package/src/hook/session-end-hook.ts +0 -81
  114. package/src/hook/session-start-hook.ts +0 -168
  115. package/src/hook/stop-hook.ts +0 -239
  116. package/src/http/app.ts +0 -1215
  117. package/src/install/claude-code.ts +0 -128
  118. package/src/install/codex.ts +0 -367
  119. package/src/install/cursor.ts +0 -68
  120. package/src/install/hermes-agent.ts +0 -76
  121. package/src/install/hermes.ts +0 -78
  122. package/src/install/nlm-dir-perms.ts +0 -55
  123. package/src/install/ollama.ts +0 -284
  124. package/src/install/setup.ts +0 -489
  125. package/src/install/windsurf.ts +0 -68
  126. package/src/llm/classifier-box.ts +0 -64
  127. package/src/llm/deepseek-client.ts +0 -150
  128. package/src/llm/env-autoload.ts +0 -55
  129. package/src/llm/ollama-client.ts +0 -189
  130. package/src/mcp/server.ts +0 -534
  131. package/src/ports/fact-store.ts +0 -102
  132. package/src/ports/llm-client.ts +0 -52
  133. package/src/ports/logger.ts +0 -16
  134. package/src/ports/session-store.ts +0 -45
  135. package/src/ports/transcript-adapter.ts +0 -55
  136. package/src/shared/types.ts +0 -149
  137. package/src/ui/App.tsx +0 -58
  138. package/src/ui/components/PromoteOpenButton.tsx +0 -65
  139. package/src/ui/components/SessionDrawer.tsx +0 -199
  140. package/src/ui/components/SideNav.tsx +0 -162
  141. package/src/ui/components/Skeleton.tsx +0 -107
  142. package/src/ui/index.html +0 -13
  143. package/src/ui/lib/actions.ts +0 -30
  144. package/src/ui/lib/api.ts +0 -92
  145. package/src/ui/lib/dataset.ts +0 -141
  146. package/src/ui/lib/registries.ts +0 -155
  147. package/src/ui/lib/view-settings.ts +0 -41
  148. package/src/ui/main.tsx +0 -15
  149. package/src/ui/pages/Live.tsx +0 -229
  150. package/src/ui/pages/Pulse.tsx +0 -415
  151. package/src/ui/pages/Recall.tsx +0 -190
  152. package/src/ui/pages/River.tsx +0 -354
  153. package/src/ui/pages/Search.tsx +0 -386
  154. package/src/ui/pages/Stub.tsx +0 -9
  155. package/src/ui/pages/Thread.tsx +0 -473
  156. package/src/ui/pages/settings/Classifier.tsx +0 -227
  157. package/src/ui/pages/settings/Data.tsx +0 -190
  158. package/src/ui/pages/settings/Index.tsx +0 -65
  159. package/src/ui/pages/settings/Labels.tsx +0 -224
  160. package/src/ui/pages/settings/Providers.tsx +0 -305
  161. package/src/ui/pages/settings/SettingsSubnav.tsx +0 -28
  162. package/src/ui/pages/settings/Sources.tsx +0 -326
  163. package/src/ui/pages/settings/Views.tsx +0 -96
  164. package/src/ui/styles.css +0 -1890
  165. package/src/ui/tsconfig.json +0 -21
  166. package/src/ui/vite.config.ts +0 -19
  167. package/tests/fixtures/claude_code/short_session.jsonl +0 -2
  168. package/tests/fixtures/claude_code/standard_iso.jsonl +0 -4
  169. package/tests/fixtures/claude_code/tool_heavy.jsonl +0 -8
  170. package/tests/fixtures/claude_code/with_subagent.jsonl +0 -7
  171. package/tests/fixtures/facts.ts +0 -17
  172. package/tests/fixtures/golden-corpus.ts +0 -85
  173. package/tests/fixtures/hermes/paired_request_dump.json +0 -24
  174. package/tests/fixtures/hermes/paired_session.json +0 -23
  175. package/tests/fixtures/hermes/request_dump.json +0 -28
  176. package/tests/fixtures/hermes/session_iso.json +0 -38
  177. package/tests/fixtures/hermes/session_unix.json +0 -38
  178. package/tests/fixtures/hermes/system_only.json +0 -18
  179. package/tests/fixtures/pi/error-connection-abort.jsonl +0 -8
  180. package/tests/fixtures/pi/short-successful.jsonl +0 -5
  181. package/tests/fixtures/pi/with-custom-message.jsonl +0 -6
  182. package/tests/fixtures/sessions.ts +0 -22
  183. package/tests/integration/backfill-facts.test.ts +0 -362
  184. package/tests/integration/citation-explicit.test.ts +0 -111
  185. package/tests/integration/cite-event.test.ts +0 -169
  186. package/tests/integration/cite-memo.test.ts +0 -87
  187. package/tests/integration/db-restore.test.ts +0 -153
  188. package/tests/integration/embed-backfill.test.ts +0 -176
  189. package/tests/integration/fact-supersedence.test.ts +0 -313
  190. package/tests/integration/fts-index.test.ts +0 -60
  191. package/tests/integration/getbyids-sqlite.test.ts +0 -100
  192. package/tests/integration/hermes-agent-hooks.test.ts +0 -248
  193. package/tests/integration/hook-claude-settings.test.ts +0 -218
  194. package/tests/integration/hook-log.test.ts +0 -54
  195. package/tests/integration/hook-memo.test.ts +0 -68
  196. package/tests/integration/hook-pre-compact.test.ts +0 -105
  197. package/tests/integration/hook-subagent-start.test.ts +0 -102
  198. package/tests/integration/http.test.ts +0 -401
  199. package/tests/integration/keyword-search-fts.test.ts +0 -66
  200. package/tests/integration/mcp-recall-logging.test.ts +0 -88
  201. package/tests/integration/mcp.test.ts +0 -260
  202. package/tests/integration/memo-sweep.test.ts +0 -91
  203. package/tests/integration/prompt-recall-hook.test.ts +0 -88
  204. package/tests/integration/provider-registry.test.ts +0 -107
  205. package/tests/integration/recall-golden.test.ts +0 -59
  206. package/tests/integration/recall-sqlite.test.ts +0 -169
  207. package/tests/integration/scheduler.test.ts +0 -391
  208. package/tests/integration/session-end-hook.test.ts +0 -48
  209. package/tests/integration/session-start-hook.test.ts +0 -126
  210. package/tests/integration/source-registry.test.ts +0 -122
  211. package/tests/integration/sqlite-fact-store.test.ts +0 -346
  212. package/tests/integration/stop-hook.test.ts +0 -560
  213. package/tests/integration/wal-checkpoint.test.ts +0 -49
  214. package/tests/unit/cli/launchctl-helpers.test.ts +0 -60
  215. package/tests/unit/core/adapters/aider.test.ts +0 -230
  216. package/tests/unit/core/adapters/claude-code.test.ts +0 -118
  217. package/tests/unit/core/adapters/cursor.test.ts +0 -485
  218. package/tests/unit/core/adapters/hermes-agent.test.ts +0 -329
  219. package/tests/unit/core/adapters/hermes.test.ts +0 -81
  220. package/tests/unit/core/adapters/jsonl-generic.test.ts +0 -142
  221. package/tests/unit/core/adapters/opencode.test.ts +0 -354
  222. package/tests/unit/core/adapters/pi.test.ts +0 -110
  223. package/tests/unit/core/adapters/windsurf.test.ts +0 -416
  224. package/tests/unit/core/classifier/prompt.test.ts +0 -126
  225. package/tests/unit/core/embedding/chunk-body.test.ts +0 -100
  226. package/tests/unit/core/facts/extract-facts.test.ts +0 -117
  227. package/tests/unit/core/filter.test.ts +0 -40
  228. package/tests/unit/core/hook/citation-detect-cite-session.test.ts +0 -96
  229. package/tests/unit/core/hook/citation-detect.test.ts +0 -124
  230. package/tests/unit/core/hook/gate.test.ts +0 -29
  231. package/tests/unit/core/hook/pointer-block.test.ts +0 -22
  232. package/tests/unit/core/hook/select.test.ts +0 -66
  233. package/tests/unit/core/match-fields.test.ts +0 -39
  234. package/tests/unit/core/mcp-cite-session.test.ts +0 -51
  235. package/tests/unit/core/providers/provider-models.test.ts +0 -101
  236. package/tests/unit/core/query-shape.test.ts +0 -92
  237. package/tests/unit/core/recall-facts/fact-recall-service.test.ts +0 -258
  238. package/tests/unit/core/recall-service.test.ts +0 -200
  239. package/tests/unit/core/storage/live-status.test.ts +0 -54
  240. package/tests/unit/core/tokenize.test.ts +0 -32
  241. package/tests/unit/core/useful-scan.test.ts +0 -537
  242. package/tests/unit/llm/embed.test.ts +0 -93
  243. package/tests/unit/llm/ollama-client.test.ts +0 -124
  244. package/tests/unit/scripts/longmemeval-scorer.test.ts +0 -114
  245. package/tsconfig.json +0 -31
  246. package/tsconfig.test.json +0 -11
  247. package/vitest.config.ts +0 -22
@@ -1,320 +0,0 @@
1
- /**
2
- * RecallService — the use case. Composes filters, keyword scoring, and
3
- * semantic search into a single recall operation.
4
- *
5
- * Depends only on ports (SessionStore, LLMClient). No framework imports,
6
- * no SQLite, no HTTP. Tests substitute fake adapters.
7
- */
8
-
9
- import type { LLMClient } from "@ports/llm-client.js";
10
- import { LLMUnreachableError } from "@ports/llm-client.js";
11
- import type {
12
- KeywordNeighbor,
13
- SemanticNeighbor,
14
- SessionStore,
15
- } from "@ports/session-store.js";
16
- import type {
17
- MatchField,
18
- RecallHit,
19
- RecallMode,
20
- RecallQuery,
21
- RecallResult,
22
- Session,
23
- } from "@shared/types.js";
24
- import { applyFilter } from "./filter.js";
25
- import { keywordMatchFields } from "./match-fields.js";
26
- import { detectQueryShape } from "./query-shape.js";
27
- import { tokenSet } from "./tokenize.js";
28
-
29
/** Limit used by `clampLimit` when the caller supplies none. */
const DEFAULT_LIMIT = 20;

/** Largest limit `clampLimit` will hand back. */
const MAX_LIMIT = 100;

/**
 * Reciprocal Rank Fusion constant (Cormack et al. 2009); 60 is the canonical
 * default from the literature. RRF fuses ranked lists by summing
 * 1/(k + rank) per retriever and never looks at raw scores, so it copes with
 * very different score distributions (unbounded BM25 vs cosine in [-1, 1])
 * without any normalization step.
 */
const RRF_K = 60;

/** Multiplier applied to `limit` when asking the store for semantic neighbors. */
const SEMANTIC_OVERFETCH = 3;

/** Multiplier applied to `limit` when asking the store for keyword neighbors. */
const KEYWORD_OVERFETCH = 3;
39
-
40
/** Ports handed to {@link RecallService} at construction time. */
export interface RecallServiceDeps {
  /** Client whose `embed` is called to vectorize the query for semantic/hybrid modes. */
  readonly llm: LLMClient;
  /** Store queried via `keywordSearch`, `semanticSearch` and `getByIds`. */
  readonly store: SessionStore;
}
44
-
45
/**
 * Recall use case. Runs the keyword and/or semantic search legs against the
 * store, loads only the sessions those legs returned, applies the entity/kind
 * filter to them, and shapes the outcome into a `RecallResult`.
 */
export class RecallService {
  constructor(private readonly deps: RecallServiceDeps) {}

  /**
   * Execute one recall query.
   *
   * - `mode` defaults to "keyword"; `limit` is normalized by `clampLimit`.
   * - With no query, no entity and no kind, an empty result is returned
   *   without touching the store.
   * - If the semantic leg throws `LLMUnreachableError`, semantic mode returns
   *   an empty result flagged `modeUnavailable`; hybrid mode continues with
   *   whatever the keyword leg produced and carries the same flag. Any other
   *   error propagates.
   *
   * NOTE(review): both legs only run when `query` is non-empty, so an
   * entity-only or kind-only request resolves zero sessions — confirm that
   * is intended.
   */
  async search(input: RecallQuery): Promise<RecallResult> {
    const { store, llm } = this.deps;
    const { query } = input;
    const mode: RecallMode = input.mode ?? "keyword";
    const limit = clampLimit(input.limit);
    const entity = input.entity ?? null;
    const kind = input.kind ?? null;

    const nothing: RecallResult = { query, entity, kind, mode, limit, total: 0, results: [] };
    if (!query && !entity && !kind) return nothing;

    const usesKeywordLeg = mode === "keyword" || mode === "hybrid";
    const usesSemanticLeg = mode === "semantic" || mode === "hybrid";

    // Leg 1: keyword neighbors (ids + scores only, no session bodies).
    let kwNeighbors: ReadonlyArray<KeywordNeighbor> = [];
    if (usesKeywordLeg && query) {
      kwNeighbors = await store.keywordSearch(query, limit * KEYWORD_OVERFETCH);
    }

    // Leg 2: semantic neighbors. An unreachable LLM is recorded, not thrown.
    let semNeighbors: ReadonlyArray<SemanticNeighbor> = [];
    let semError: "ollama_unreachable" | null = null;
    if (usesSemanticLeg && query) {
      try {
        const { vector } = await llm.embed(query, "query");
        semNeighbors = await store.semanticSearch(vector, limit * SEMANTIC_OVERFETCH);
      } catch (err) {
        if (!(err instanceof LLMUnreachableError)) throw err;
        semError = "ollama_unreachable";
      }
    }

    if (mode === "semantic" && semError) {
      return { ...nothing, modeUnavailable: semError };
    }

    // Resolve just the hit sessions, then filter. A session rejected by the
    // filter is missing from `byId` and is skipped when hits are built below.
    const fetched = await store.getByIds(uniqueIds(kwNeighbors, semNeighbors));
    const filterArgs: { entity?: string; kind?: typeof input.kind } = {};
    if (input.entity !== undefined) filterArgs.entity = input.entity;
    if (input.kind !== undefined) filterArgs.kind = input.kind;
    const byId = new Map<string, Session>();
    for (const s of applyFilter(fetched, filterArgs)) byId.set(s.id, s);

    const queryTokens = query ? new Set(tokenSet(query)) : new Set<string>();

    // Build hits in leg rank order.
    const kwHits = kwNeighbors.flatMap((n): KeywordHit[] => {
      const session = byId.get(n.sessionId);
      return session
        ? [{ session, score: n.score, matchedIn: keywordMatchFields(session, queryTokens) }]
        : [];
    });
    const semHits = semNeighbors.flatMap((n): SemanticHit[] => {
      const session = byId.get(n.sessionId);
      return session ? [{ session, similarity: cosineFromL2(n.distance) }] : [];
    });

    switch (mode) {
      case "keyword":
        return finalize(query, entity, kind, mode, limit, kwHits.map(toKeywordHit));
      case "semantic":
        return finalize(query, entity, kind, mode, limit, semHits.map(toSemanticHit));
      default: {
        const merged = mergeHybrid(kwHits, semHits);
        const shape = detectQueryShape(query);
        const ranked =
          shape.hasTemporal && shape.hasNamedEntity
            ? forceIncludeKeywordTop(merged, kwHits, limit)
            : merged;
        const result = finalize(query, entity, kind, mode, limit, ranked);
        return semError ? { ...result, modeUnavailable: semError } : result;
      }
    }
  }
}
145
-
146
/**
 * Collect the distinct session ids referenced by either leg, keeping
 * first-seen order (keyword neighbors first, then semantic ones).
 */
function uniqueIds(
  kw: ReadonlyArray<KeywordNeighbor>,
  sem: ReadonlyArray<SemanticNeighbor>,
): ReadonlyArray<string> {
  const inLegOrder = [...kw, ...sem].map((neighbor) => neighbor.sessionId);
  return Array.from(new Set<string>(inLegOrder));
}
155
-
156
/** A keyword-leg neighbor after its session has been resolved. */
interface KeywordHit {
  /** Raw score reported by the store's keyword search. */
  readonly score: number;
  /** Session fields in which query tokens were found. */
  readonly matchedIn: ReadonlyArray<MatchField>;
  readonly session: Session;
}

/** A semantic-leg neighbor after its session has been resolved. */
interface SemanticHit {
  /** Cosine similarity derived from the store's reported distance. */
  readonly similarity: number;
  readonly session: Session;
}
166
-
167
/**
 * Fuse the keyword and semantic legs with Reciprocal Rank Fusion.
 *
 * matchScore = Σ 1/(RRF_K + rank) over the legs a session appears in, where
 * rank is the 1-based position within that leg. With k=60, rank 1 in both
 * legs gives ~0.0328 (the two-leg maximum) and rank 1 in a single leg gives
 * ~0.0164.
 *
 * keywordScore and semanticScore are informational only: each is the leg's
 * raw value divided by that leg's largest value (the divisor is never
 * smaller than 1), or 0 when the session is absent from the leg. They do not
 * feed into matchScore.
 *
 * @returns one row per distinct session id, sorted by matchScore descending.
 */
function mergeHybrid(
  kwHits: ReadonlyArray<KeywordHit>,
  semHits: ReadonlyArray<SemanticHit>,
): ReadonlyArray<RecallHit> {
  const kwScale = kwHits.reduce((best, h) => Math.max(best, h.score), 1);
  const semScale = semHits.reduce((best, h) => Math.max(best, h.similarity), 1);

  // Per-leg lookup of hit + 1-based rank. On a repeated id the later
  // occurrence wins, while the map keeps the id's first-seen position.
  const kwById = new Map<string, { hit: KeywordHit; rank: number }>();
  kwHits.forEach((hit, i) => kwById.set(hit.session.id, { hit, rank: i + 1 }));
  const semById = new Map<string, { hit: SemanticHit; rank: number }>();
  semHits.forEach((hit, i) => semById.set(hit.session.id, { hit, rank: i + 1 }));

  const everyId = new Set<string>([...kwById.keys(), ...semById.keys()]);

  const rows = Array.from(everyId, (id): RecallHit => {
    const kw = kwById.get(id);
    const sem = semById.get(id);
    // Every id came from at least one of the two maps.
    const session = (kw ?? sem)!.hit.session;
    const fused =
      (kw !== undefined ? 1 / (RRF_K + kw.rank) : 0) +
      (sem !== undefined ? 1 / (RRF_K + sem.rank) : 0);
    return {
      ...sessionHitFields(session),
      matchScore: round4(fused),
      matchedIn: uniqueFields(
        kw?.hit.matchedIn ?? [],
        sem ? (["semantic"] as MatchField[]) : [],
      ),
      keywordScore: kw ? round4(kw.hit.score / kwScale) : 0,
      semanticScore: sem ? round4(sem.hit.similarity / semScale) : 0,
    };
  });

  rows.sort((left, right) => right.matchScore - left.matchScore);
  return rows;
}
217
-
218
/**
 * Guarantee that the keyword leg's rank-1 session is inside the first
 * `limit` entries of the merged list.
 *
 * Only invoked when the query shape (temporal + named entity) indicates a
 * pattern where pure RRF is known to demote keyword winners (see
 * query-shape.ts).
 *
 * - If there are no keyword hits, the merged list is empty, the keyword
 *   winner is not in the merged list, or it already sits within the first
 *   `limit` entries, `merged` is returned unchanged (same reference).
 * - Otherwise the winner is moved to index `limit - 1`. The hit that used to
 *   occupy that slot is pushed to just after it rather than dropped, and the
 *   winner is removed from its old position, so the result is a permutation
 *   of `merged`: same length, no duplicates.
 *
 * @param merged fused hits, best first
 * @param kwHits keyword-leg hits in rank order
 * @param limit  number of entries the caller will expose
 */
function forceIncludeKeywordTop(
  merged: ReadonlyArray<RecallHit>,
  kwHits: ReadonlyArray<KeywordHit>,
  limit: number,
): ReadonlyArray<RecallHit> {
  const winner = kwHits[0];
  if (winner === undefined || merged.length === 0) return merged;

  const topId = winner.session.id;
  const at = merged.findIndex((h) => h.id === topId);
  const forced = merged[at];
  // Not present at all, or already visible within the first `limit` entries.
  if (forced === undefined || at < limit) return merged;

  const slot = Math.max(0, limit - 1);
  const head = merged.slice(0, slot);
  // Everything from the displaced hit onward, minus the hit being promoted.
  const rest = merged.slice(slot).filter((h) => h.id !== topId);
  return [...head, forced, ...rest];
}
241
-
242
/** Shape a keyword-leg hit as a RecallHit; matchScore is the raw keyword score. */
function toKeywordHit(h: KeywordHit): RecallHit {
  const { session, score, matchedIn } = h;
  return { ...sessionHitFields(session), matchScore: score, matchedIn };
}
249
-
250
/** Shape a semantic-leg hit as a RecallHit; matchScore is the similarity. */
function toSemanticHit(h: SemanticHit): RecallHit {
  const { session, similarity } = h;
  return { ...sessionHitFields(session), matchScore: similarity, matchedIn: ["semantic"] };
}
257
-
258
/**
 * Pick the session fields that every RecallHit carries. Any other property
 * on the session is left out.
 */
function sessionHitFields(s: Session) {
  const { id, startedAt, label, summary, entities, decisions, open, status } = s;
  return { id, startedAt, label, summary, entities, decisions, open, status } as const;
}
270
-
271
/**
 * Assemble the RecallResult envelope. `total` counts every hit passed in;
 * `results` is cut down to the first `limit` of them.
 */
function finalize(
  query: string,
  entity: string | null,
  kind: RecallResult["kind"],
  mode: RecallMode,
  limit: number,
  hits: ReadonlyArray<RecallHit>,
): RecallResult {
  const total = hits.length;
  const results = hits.slice(0, limit);
  return { query, entity, kind, mode, limit, total, results };
}
289
-
290
/**
 * Normalize a caller-supplied limit: missing → DEFAULT_LIMIT; NaN or anything
 * below 1 → 1; otherwise truncated toward zero and capped at MAX_LIMIT.
 */
function clampLimit(limit: number | undefined): number {
  const requested = limit ?? DEFAULT_LIMIT;
  // `>=` is false for NaN, so NaN lands in the fallback branch too.
  const usable = requested >= 1;
  return usable ? Math.min(MAX_LIMIT, Math.trunc(requested)) : 1;
}
295
-
296
/**
 * Convert an L2 distance into cosine similarity, clamped to [-1, 1] and
 * rounded to four decimals.
 *
 * Relies on the identity cos = 1 - d²/2, which holds for unit-length vectors;
 * session_embeddings is stated to store unit-normalized vectors. Mirrors
 * recall.py:_run_semantic.
 */
function cosineFromL2(distance: number): number {
  const halfSquared = (distance * distance) / 2;
  const cosine = 1 - halfSquared;
  const clamped = cosine > 1 ? 1 : cosine < -1 ? -1 : cosine;
  return round4(clamped);
}
302
-
303
/** Round to four decimal places using `Math.round` on the scaled value. */
function round4(value: number): number {
  const scale = 10_000;
  const scaled = Math.round(value * scale);
  return scaled / scale;
}
306
-
307
/**
 * Concatenate two match-field lists and drop repeats, keeping the position
 * of each field's first occurrence.
 */
function uniqueFields(
  a: ReadonlyArray<MatchField>,
  b: ReadonlyArray<MatchField>,
): ReadonlyArray<MatchField> {
  // A Set iterates in insertion order, which is exactly first-seen order.
  return Array.from(new Set<MatchField>([...a, ...b]));
}
@@ -1,59 +0,0 @@
1
- /**
2
- * recentLog — tail the query log for the /live observability panel.
3
- * Returns up to N of the most recent entries, newest first.
4
- */
5
-
6
import { closeSync, existsSync, openSync, readFileSync, readSync, statSync } from "node:fs";
import { homedir } from "node:os";
import { join } from "node:path";
9
-
10
/**
 * One query-log line as surfaced to callers. Every field is populated even
 * when the log line lacks it or carries the wrong type; the fallback used in
 * that case is noted per field.
 */
export interface RecentLogEntry {
  /** Log key `ts`; empty string when missing. */
  readonly ts: string;
  /** Log key `source`; "unknown" when missing. */
  readonly source: string;
  /** Log key `query`; null when missing. */
  readonly query: string | null;
  /** Log key `entity`; null when missing. */
  readonly entity: string | null;
  /** Log key `kind`; null when missing. */
  readonly kind: string | null;
  /** Log key `mode`; "keyword" when missing. */
  readonly mode: string;
  /** Log key `limit`; 0 when missing. */
  readonly limit: number;
  /** Log key `n_results`; 0 when missing. */
  readonly nResults: number;
  /** Log key `returned_ids`, string members only; empty when missing. */
  readonly returnedIds: ReadonlyArray<string>;
}
21
-
22
/** Query-log location: `NLM_QUERY_LOG` when set, otherwise `~/.nlm/query_log.jsonl`. */
function defaultLogPath(): string {
  return process.env["NLM_QUERY_LOG"] ?? join(homedir(), ".nlm", "query_log.jsonl");
}

/** Upper bound on how many trailing bytes of the log are read and parsed. */
const TAIL_BYTES = 256 * 1024;

/** Byte value of "\n". */
const LINE_FEED = 0x0a;

/**
 * Read at most the last TAIL_BYTES bytes of `logPath` and return them as
 * UTF-8 text made of whole lines only.
 *
 * The window is located by BYTE offset and cut on the raw buffer before
 * decoding, so multi-byte characters cannot shift it. When the window does
 * not start at the beginning of the file, one extra leading byte is read and
 * everything through the first line feed is discarded: if that extra byte is
 * itself the line feed the window opened exactly on a line boundary and
 * nothing real is lost, otherwise the leading partial line is dropped.
 */
function readLogTail(logPath: string): string {
  const fd = openSync(logPath, "r");
  try {
    const size = statSync(logPath).size;
    const start = Math.max(0, size - TAIL_BYTES);
    const from = start > 0 ? start - 1 : 0;
    const buf = Buffer.alloc(size - from);

    // readSync may return fewer bytes than requested; loop until full or EOF.
    let filled = 0;
    while (filled < buf.length) {
      const got = readSync(fd, buf, filled, buf.length - filled, from + filled);
      if (got === 0) break;
      filled += got;
    }

    let tail = buf.subarray(0, filled);
    if (start > 0) {
      const firstBreak = tail.indexOf(LINE_FEED);
      tail = firstBreak === -1 ? tail.subarray(filled) : tail.subarray(firstBreak + 1);
    }
    return tail.toString("utf8");
  } finally {
    closeSync(fd);
  }
}

/**
 * Parse one log line. Returns null for blank lines, invalid JSON, and JSON
 * values that are not plain objects (numbers, strings, arrays, null), so
 * junk lines never surface as all-default entries.
 */
function parseLogLine(line: string): RecentLogEntry | null {
  const trimmed = line.trim();
  if (!trimmed) return null;

  let parsed: unknown;
  try {
    parsed = JSON.parse(trimmed);
  } catch {
    return null;
  }
  if (typeof parsed !== "object" || parsed === null || Array.isArray(parsed)) return null;

  const raw = parsed as Record<string, unknown>;
  const ids = raw["returned_ids"];
  return {
    ts: typeof raw["ts"] === "string" ? raw["ts"] : "",
    source: typeof raw["source"] === "string" ? raw["source"] : "unknown",
    query: typeof raw["query"] === "string" ? raw["query"] : null,
    entity: typeof raw["entity"] === "string" ? raw["entity"] : null,
    kind: typeof raw["kind"] === "string" ? raw["kind"] : null,
    mode: typeof raw["mode"] === "string" ? raw["mode"] : "keyword",
    limit: typeof raw["limit"] === "number" ? raw["limit"] : 0,
    nResults: typeof raw["n_results"] === "number" ? raw["n_results"] : 0,
    returnedIds: Array.isArray(ids)
      ? ids.filter((x): x is string => typeof x === "string")
      : [],
  };
}

/**
 * Return up to `limit` of the most recent query-log entries, newest first
 * (ordered by their `ts` string, descending).
 *
 * Only the last TAIL_BYTES bytes of the file are read. A missing file yields
 * an empty list, as does a `limit` of zero or below.
 *
 * @param limit   maximum number of entries to return
 * @param logPath log file to read; defaults to `defaultLogPath()`
 */
export function recentQueryLog(limit: number, logPath: string = defaultLogPath()): RecentLogEntry[] {
  if (!existsSync(logPath)) return [];

  const entries: RecentLogEntry[] = [];
  for (const line of readLogTail(logPath).split("\n")) {
    const entry = parseLogLine(line);
    if (entry !== null) entries.push(entry);
  }

  entries.sort((a, b) => b.ts.localeCompare(a.ts));
  return entries.slice(0, Math.max(0, limit));
}
@@ -1,18 +0,0 @@
1
- /**
2
- * Tokenizer mirrors recall.py:_TOKEN_RE. Identical regex, lowercase normalize.
3
- * Pure function. The keyword scorer's parity with the Python implementation
4
- * starts here.
5
- */
6
-
7
/**
 * A token starts with an ASCII letter or digit and continues with letters,
 * digits, underscore, dot or hyphen.
 */
const TOKEN_PATTERN = /[A-Za-z0-9][A-Za-z0-9_.-]*/g;

/**
 * Split text into lowercase tokens, in order of appearance. Null, undefined,
 * empty, or token-free input yields an empty list.
 */
export function tokenize(text: string | null | undefined): ReadonlyArray<string> {
  const found = text ? text.match(TOKEN_PATTERN) : null;
  return found === null ? [] : Array.from(found, (token) => token.toLowerCase());
}
15
-
16
/** Distinct tokens of `text`, as produced by `tokenize`. */
export function tokenSet(text: string | null | undefined): Set<string> {
  const tokens = tokenize(text);
  return new Set<string>(tokens);
}