nlm-memory 0.5.0 → 0.5.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (257)
  1. package/README.md +89 -34
  2. package/dist/cli/digest.d.ts +20 -0
  3. package/dist/cli/digest.js +142 -0
  4. package/dist/cli/digest.js.map +1 -0
  5. package/dist/cli/nlm.d.ts +1 -0
  6. package/dist/cli/nlm.js +25 -1
  7. package/dist/cli/nlm.js.map +1 -1
  8. package/dist/core/digest/compose.d.ts +38 -0
  9. package/dist/core/digest/compose.js +93 -0
  10. package/dist/core/digest/compose.js.map +1 -0
  11. package/dist/core/digest/hook-liveness.d.ts +32 -0
  12. package/dist/core/digest/hook-liveness.js +54 -0
  13. package/dist/core/digest/hook-liveness.js.map +1 -0
  14. package/dist/http/app.js +2 -1
  15. package/dist/http/app.js.map +1 -1
  16. package/dist/mcp/server.js +20 -1
  17. package/dist/mcp/server.js.map +1 -1
  18. package/dist/ui/assets/{index-C8cpwbYJ.css → index-Beo8psd-.css} +1 -1
  19. package/dist/ui/assets/{index-CB50QnL-.js → index-CSPTTeeM.js} +8 -8
  20. package/dist/ui/index.html +2 -2
  21. package/package.json +26 -1
  22. package/.agents/plugins/marketplace.json +0 -20
  23. package/.github/workflows/ci.yml +0 -30
  24. package/docs/methodology/re-derivation-rate.md +0 -112
  25. package/docs/methodology/useful-hit-rate.md +0 -79
  26. package/docs/plans/2026-05-20-fts5-lexical-recall.md +0 -1088
  27. package/docs/plans/2026-05-20-recall-daemon-wedge-fix.md +0 -662
  28. package/docs/plans/2026-05-20-recall-hook-design.md +0 -131
  29. package/docs/plans/2026-05-20-recall-hook-implementation.md +0 -1222
  30. package/docs/plans/desktop-product.md +0 -69
  31. package/docs/plans/factstore-design.md +0 -236
  32. package/logs/CHANGELOG/CHANGELOG-2026.md +0 -1575
  33. package/logs/CHANGELOG/CHANGELOG.md +0 -209
  34. package/migrations/000_initial_schema.sql +0 -174
  35. package/migrations/001_entity_type_rename.sql +0 -17
  36. package/migrations/002_adapter_state_extend.sql +0 -12
  37. package/migrations/003_session_embeddings.sql +0 -11
  38. package/migrations/004_facts.sql +0 -46
  39. package/migrations/005_sources.sql +0 -31
  40. package/migrations/006_providers.sql +0 -33
  41. package/migrations/007_source_tokens.sql +0 -17
  42. package/migrations/008_fts_rebuild.sql +0 -9
  43. package/migrations/009_session_embedding_chunks.sql +0 -46
  44. package/migrations/010_sources_opencode.sql +0 -30
  45. package/migrations/011_sources_hermes_agent.sql +0 -30
  46. package/migrations/012_sources_aider.sql +0 -30
  47. package/migrations/013_adapter_state_failure_count.sql +0 -12
  48. package/migrations/014_sources_cursor.sql +0 -30
  49. package/migrations/015_sources_windsurf.sql +0 -30
  50. package/plugin-hermes-agent/README.md +0 -49
  51. package/plugin-hermes-agent/__init__.py +0 -75
  52. package/plugin-hermes-agent/plugin.yaml +0 -15
  53. package/scripts/backfill-citations.mjs +0 -0
  54. package/scripts/build-codex-plugin.mjs +0 -61
  55. package/scripts/deepseek-probe.mjs +0 -67
  56. package/scripts/extract-triples.mjs +0 -207
  57. package/scripts/longmemeval/embedding-cache.ts +0 -77
  58. package/scripts/longmemeval/fetch-dataset.sh +0 -25
  59. package/scripts/longmemeval/run-harness.ts +0 -315
  60. package/scripts/longmemeval/scorer.ts +0 -99
  61. package/scripts/longmemeval/tsconfig.json +0 -9
  62. package/scripts/longmemeval/types.ts +0 -35
  63. package/scripts/nlm-daily-digest.py +0 -239
  64. package/scripts/nlm-daily-digest.sh +0 -28
  65. package/src/cli/classify-parity.ts +0 -257
  66. package/src/cli/launchctl-helpers.ts +0 -49
  67. package/src/cli/nlm.ts +0 -1078
  68. package/src/core/actions/actions-log.ts +0 -118
  69. package/src/core/actions/overlay.ts +0 -117
  70. package/src/core/adapters/aider.ts +0 -205
  71. package/src/core/adapters/claude-code.ts +0 -293
  72. package/src/core/adapters/common.ts +0 -54
  73. package/src/core/adapters/cursor.ts +0 -486
  74. package/src/core/adapters/from-source.ts +0 -67
  75. package/src/core/adapters/hermes-agent.ts +0 -240
  76. package/src/core/adapters/hermes.ts +0 -277
  77. package/src/core/adapters/jsonl-generic.ts +0 -208
  78. package/src/core/adapters/opencode.ts +0 -281
  79. package/src/core/adapters/pi.ts +0 -264
  80. package/src/core/adapters/windsurf.ts +0 -386
  81. package/src/core/classifier/prompt.ts +0 -200
  82. package/src/core/dataset/build-dataset.ts +0 -463
  83. package/src/core/embedding/chunk-body.ts +0 -76
  84. package/src/core/embedding/embed-backfill.ts +0 -210
  85. package/src/core/embedding/embed-normalize.ts +0 -135
  86. package/src/core/facts/backfill-facts.ts +0 -254
  87. package/src/core/facts/extract-facts.ts +0 -50
  88. package/src/core/hook/citation-detect.ts +0 -124
  89. package/src/core/hook/cite-memo.ts +0 -68
  90. package/src/core/hook/claude-settings.ts +0 -187
  91. package/src/core/hook/gate.ts +0 -25
  92. package/src/core/hook/hook-log.ts +0 -41
  93. package/src/core/hook/memo-sweep.ts +0 -164
  94. package/src/core/hook/memo.ts +0 -67
  95. package/src/core/hook/pointer-block.ts +0 -26
  96. package/src/core/hook/select.ts +0 -32
  97. package/src/core/hook/transcript.ts +0 -121
  98. package/src/core/ingest/ingest-session.ts +0 -111
  99. package/src/core/providers/provider-models.ts +0 -100
  100. package/src/core/providers/provider-registry.ts +0 -196
  101. package/src/core/recall/citation-log.ts +0 -108
  102. package/src/core/recall/filter.ts +0 -27
  103. package/src/core/recall/index.ts +0 -6
  104. package/src/core/recall/match-fields.ts +0 -40
  105. package/src/core/recall/query-log.ts +0 -149
  106. package/src/core/recall/query-shape.ts +0 -66
  107. package/src/core/recall/recall-service.ts +0 -320
  108. package/src/core/recall/recent-log.ts +0 -59
  109. package/src/core/recall/tokenize.ts +0 -18
  110. package/src/core/recall/useful-scan.ts +0 -336
  111. package/src/core/recall-facts/fact-query-log.ts +0 -150
  112. package/src/core/recall-facts/fact-recall-service.ts +0 -327
  113. package/src/core/scheduler/scan-once.ts +0 -142
  114. package/src/core/scheduler/scheduler.ts +0 -225
  115. package/src/core/sources/source-registry.ts +0 -278
  116. package/src/core/storage/db-restore.ts +0 -133
  117. package/src/core/storage/live-status.ts +0 -45
  118. package/src/core/storage/migrate.ts +0 -72
  119. package/src/core/storage/sqlite-fact-store.ts +0 -304
  120. package/src/core/storage/sqlite-session-store.ts +0 -810
  121. package/src/hook/hook-auth.ts +0 -18
  122. package/src/hook/prompt-recall-hook.ts +0 -180
  123. package/src/hook/session-end-hook.ts +0 -81
  124. package/src/hook/session-start-hook.ts +0 -168
  125. package/src/hook/stop-hook.ts +0 -239
  126. package/src/http/app.ts +0 -1215
  127. package/src/install/claude-code.ts +0 -128
  128. package/src/install/codex.ts +0 -367
  129. package/src/install/cursor.ts +0 -68
  130. package/src/install/hermes-agent.ts +0 -76
  131. package/src/install/hermes.ts +0 -78
  132. package/src/install/nlm-dir-perms.ts +0 -55
  133. package/src/install/ollama.ts +0 -284
  134. package/src/install/setup.ts +0 -489
  135. package/src/install/windsurf.ts +0 -68
  136. package/src/llm/classifier-box.ts +0 -64
  137. package/src/llm/deepseek-client.ts +0 -150
  138. package/src/llm/env-autoload.ts +0 -55
  139. package/src/llm/ollama-client.ts +0 -189
  140. package/src/mcp/server.ts +0 -534
  141. package/src/ports/fact-store.ts +0 -102
  142. package/src/ports/llm-client.ts +0 -52
  143. package/src/ports/logger.ts +0 -16
  144. package/src/ports/session-store.ts +0 -45
  145. package/src/ports/transcript-adapter.ts +0 -55
  146. package/src/shared/types.ts +0 -149
  147. package/src/ui/App.tsx +0 -58
  148. package/src/ui/components/PromoteOpenButton.tsx +0 -65
  149. package/src/ui/components/SessionDrawer.tsx +0 -199
  150. package/src/ui/components/SideNav.tsx +0 -162
  151. package/src/ui/components/Skeleton.tsx +0 -107
  152. package/src/ui/index.html +0 -13
  153. package/src/ui/lib/actions.ts +0 -30
  154. package/src/ui/lib/api.ts +0 -92
  155. package/src/ui/lib/dataset.ts +0 -141
  156. package/src/ui/lib/registries.ts +0 -155
  157. package/src/ui/lib/view-settings.ts +0 -41
  158. package/src/ui/main.tsx +0 -15
  159. package/src/ui/pages/Live.tsx +0 -229
  160. package/src/ui/pages/Pulse.tsx +0 -415
  161. package/src/ui/pages/Recall.tsx +0 -190
  162. package/src/ui/pages/River.tsx +0 -354
  163. package/src/ui/pages/Search.tsx +0 -386
  164. package/src/ui/pages/Stub.tsx +0 -9
  165. package/src/ui/pages/Thread.tsx +0 -473
  166. package/src/ui/pages/settings/Classifier.tsx +0 -227
  167. package/src/ui/pages/settings/Data.tsx +0 -190
  168. package/src/ui/pages/settings/Index.tsx +0 -65
  169. package/src/ui/pages/settings/Labels.tsx +0 -224
  170. package/src/ui/pages/settings/Providers.tsx +0 -305
  171. package/src/ui/pages/settings/SettingsSubnav.tsx +0 -28
  172. package/src/ui/pages/settings/Sources.tsx +0 -326
  173. package/src/ui/pages/settings/Views.tsx +0 -96
  174. package/src/ui/styles.css +0 -1890
  175. package/src/ui/tsconfig.json +0 -21
  176. package/src/ui/vite.config.ts +0 -19
  177. package/tests/fixtures/claude_code/short_session.jsonl +0 -2
  178. package/tests/fixtures/claude_code/standard_iso.jsonl +0 -4
  179. package/tests/fixtures/claude_code/tool_heavy.jsonl +0 -8
  180. package/tests/fixtures/claude_code/with_subagent.jsonl +0 -7
  181. package/tests/fixtures/facts.ts +0 -17
  182. package/tests/fixtures/golden-corpus.ts +0 -85
  183. package/tests/fixtures/hermes/paired_request_dump.json +0 -24
  184. package/tests/fixtures/hermes/paired_session.json +0 -23
  185. package/tests/fixtures/hermes/request_dump.json +0 -28
  186. package/tests/fixtures/hermes/session_iso.json +0 -38
  187. package/tests/fixtures/hermes/session_unix.json +0 -38
  188. package/tests/fixtures/hermes/system_only.json +0 -18
  189. package/tests/fixtures/pi/error-connection-abort.jsonl +0 -8
  190. package/tests/fixtures/pi/short-successful.jsonl +0 -5
  191. package/tests/fixtures/pi/with-custom-message.jsonl +0 -6
  192. package/tests/fixtures/sessions.ts +0 -22
  193. package/tests/integration/backfill-facts.test.ts +0 -362
  194. package/tests/integration/citation-explicit.test.ts +0 -111
  195. package/tests/integration/cite-event.test.ts +0 -169
  196. package/tests/integration/cite-memo.test.ts +0 -87
  197. package/tests/integration/db-restore.test.ts +0 -153
  198. package/tests/integration/embed-backfill.test.ts +0 -176
  199. package/tests/integration/fact-supersedence.test.ts +0 -313
  200. package/tests/integration/fts-index.test.ts +0 -60
  201. package/tests/integration/getbyids-sqlite.test.ts +0 -100
  202. package/tests/integration/hermes-agent-hooks.test.ts +0 -248
  203. package/tests/integration/hook-claude-settings.test.ts +0 -218
  204. package/tests/integration/hook-log.test.ts +0 -54
  205. package/tests/integration/hook-memo.test.ts +0 -68
  206. package/tests/integration/hook-pre-compact.test.ts +0 -105
  207. package/tests/integration/hook-subagent-start.test.ts +0 -102
  208. package/tests/integration/http.test.ts +0 -401
  209. package/tests/integration/keyword-search-fts.test.ts +0 -66
  210. package/tests/integration/mcp-recall-logging.test.ts +0 -88
  211. package/tests/integration/mcp.test.ts +0 -260
  212. package/tests/integration/memo-sweep.test.ts +0 -91
  213. package/tests/integration/prompt-recall-hook.test.ts +0 -88
  214. package/tests/integration/provider-registry.test.ts +0 -107
  215. package/tests/integration/recall-golden.test.ts +0 -59
  216. package/tests/integration/recall-sqlite.test.ts +0 -169
  217. package/tests/integration/scheduler.test.ts +0 -391
  218. package/tests/integration/session-end-hook.test.ts +0 -48
  219. package/tests/integration/session-start-hook.test.ts +0 -126
  220. package/tests/integration/source-registry.test.ts +0 -122
  221. package/tests/integration/sqlite-fact-store.test.ts +0 -346
  222. package/tests/integration/stop-hook.test.ts +0 -560
  223. package/tests/integration/wal-checkpoint.test.ts +0 -49
  224. package/tests/unit/cli/launchctl-helpers.test.ts +0 -60
  225. package/tests/unit/core/adapters/aider.test.ts +0 -230
  226. package/tests/unit/core/adapters/claude-code.test.ts +0 -118
  227. package/tests/unit/core/adapters/cursor.test.ts +0 -485
  228. package/tests/unit/core/adapters/hermes-agent.test.ts +0 -329
  229. package/tests/unit/core/adapters/hermes.test.ts +0 -81
  230. package/tests/unit/core/adapters/jsonl-generic.test.ts +0 -142
  231. package/tests/unit/core/adapters/opencode.test.ts +0 -354
  232. package/tests/unit/core/adapters/pi.test.ts +0 -110
  233. package/tests/unit/core/adapters/windsurf.test.ts +0 -416
  234. package/tests/unit/core/classifier/prompt.test.ts +0 -126
  235. package/tests/unit/core/embedding/chunk-body.test.ts +0 -100
  236. package/tests/unit/core/facts/extract-facts.test.ts +0 -117
  237. package/tests/unit/core/filter.test.ts +0 -40
  238. package/tests/unit/core/hook/citation-detect-cite-session.test.ts +0 -96
  239. package/tests/unit/core/hook/citation-detect.test.ts +0 -124
  240. package/tests/unit/core/hook/gate.test.ts +0 -29
  241. package/tests/unit/core/hook/pointer-block.test.ts +0 -22
  242. package/tests/unit/core/hook/select.test.ts +0 -66
  243. package/tests/unit/core/match-fields.test.ts +0 -39
  244. package/tests/unit/core/mcp-cite-session.test.ts +0 -51
  245. package/tests/unit/core/providers/provider-models.test.ts +0 -101
  246. package/tests/unit/core/query-shape.test.ts +0 -92
  247. package/tests/unit/core/recall-facts/fact-recall-service.test.ts +0 -258
  248. package/tests/unit/core/recall-service.test.ts +0 -200
  249. package/tests/unit/core/storage/live-status.test.ts +0 -54
  250. package/tests/unit/core/tokenize.test.ts +0 -32
  251. package/tests/unit/core/useful-scan.test.ts +0 -537
  252. package/tests/unit/llm/embed.test.ts +0 -93
  253. package/tests/unit/llm/ollama-client.test.ts +0 -124
  254. package/tests/unit/scripts/longmemeval-scorer.test.ts +0 -114
  255. package/tsconfig.json +0 -31
  256. package/tsconfig.test.json +0 -11
  257. package/vitest.config.ts +0 -22
package/tests/unit/llm/embed.test.ts DELETED
@@ -1,93 +0,0 @@
1
- /**
2
- * Unit tests for OllamaClient.embed: nomic prefix scheme, L2 normalization,
3
- * 8K char truncation. These guard the nomic-embed-text v1.5 contract.
4
- */
5
-
6
- import { describe, expect, it } from "vitest";
7
- import { OllamaClient, l2Normalize } from "../../../src/llm/ollama-client.js";
8
-
9
- type FakeFetch = typeof fetch;
10
-
11
- function jsonResponse(body: unknown): Response {
12
- return new Response(JSON.stringify(body), {
13
- status: 200,
14
- headers: { "content-type": "application/json" },
15
- });
16
- }
17
-
18
- function makeFetch(reply: (req: { url: string; body: unknown }) => Response): FakeFetch {
19
- return (async (input: string | URL | Request, init?: RequestInit) => {
20
- const url = typeof input === "string" ? input : input.toString();
21
- const body = init?.body ? JSON.parse(init.body.toString()) : null;
22
- return reply({ url, body });
23
- }) as FakeFetch;
24
- }
25
-
26
- describe("OllamaClient.embed prefix scheme", () => {
27
- it("prefixes a query call with 'search_query: '", async () => {
28
- let prompt = "";
29
- const fetchImpl = makeFetch(({ body }) => {
30
- prompt = (body as { prompt: string }).prompt;
31
- return jsonResponse({ embedding: [1, 0, 0] });
32
- });
33
- const client = new OllamaClient({ fetchImpl });
34
- await client.embed("what did we decide about pgvector", "query");
35
- expect(prompt.startsWith("search_query: ")).toBe(true);
36
- expect(prompt).toContain("pgvector");
37
- });
38
-
39
- it("prefixes a document call with 'search_document: '", async () => {
40
- let prompt = "";
41
- const fetchImpl = makeFetch(({ body }) => {
42
- prompt = (body as { prompt: string }).prompt;
43
- return jsonResponse({ embedding: [1, 0, 0] });
44
- });
45
- const client = new OllamaClient({ fetchImpl });
46
- await client.embed("session body text", "document");
47
- expect(prompt.startsWith("search_document: ")).toBe(true);
48
- });
49
-
50
- it("truncates text to MAX_EMBED_CHARS (8000) before prefixing", async () => {
51
- let prompt = "";
52
- const fetchImpl = makeFetch(({ body }) => {
53
- prompt = (body as { prompt: string }).prompt;
54
- return jsonResponse({ embedding: [1, 0, 0] });
55
- });
56
- const client = new OllamaClient({ fetchImpl });
57
- const big = "x".repeat(10_000);
58
- await client.embed(big, "document");
59
- // prompt = "search_document: " + truncated → prefix is 17 chars, body capped at 8000.
60
- // Briefly raised to 28000 on 2026-05-25 then reverted same day; nomic-
61
- // embed-text via Ollama 500s on inputs near the nominal 8192-token
62
- // context. Real fix is chunk + max-pool (filed as #174).
63
- expect(prompt.length).toBe(17 + 8_000);
64
- });
65
-
66
- it("L2-normalizes the returned vector", async () => {
67
- const fetchImpl = makeFetch(() => jsonResponse({ embedding: [3, 4, 0] }));
68
- const client = new OllamaClient({ fetchImpl });
69
- const { vector } = await client.embed("anything", "document");
70
- // raw norm = 5; normalized should be [0.6, 0.8, 0]
71
- expect(vector[0]).toBeCloseTo(0.6, 6);
72
- expect(vector[1]).toBeCloseTo(0.8, 6);
73
- expect(vector[2]).toBe(0);
74
- let norm = 0;
75
- for (const v of vector) norm += v * v;
76
- expect(Math.sqrt(norm)).toBeCloseTo(1, 6);
77
- });
78
- });
79
-
80
- describe("l2Normalize", () => {
81
- it("returns a unit vector for a non-zero input", () => {
82
- const out = l2Normalize(new Float32Array([3, 4, 0]));
83
- let sum = 0;
84
- for (const v of out) sum += v * v;
85
- expect(Math.sqrt(sum)).toBeCloseTo(1, 6);
86
- });
87
-
88
- it("returns the zero vector unchanged", () => {
89
- const zero = new Float32Array([0, 0, 0]);
90
- const out = l2Normalize(zero);
91
- expect(Array.from(out)).toEqual([0, 0, 0]);
92
- });
93
- });
package/tests/unit/llm/ollama-client.test.ts DELETED
@@ -1,124 +0,0 @@
1
- /**
2
- * Unit tests for OllamaClient.classify against an injected fake fetch.
3
- * No network. Verifies prompt construction, JSON-mode handling, schema
4
- * validation, fence stripping, and error mapping.
5
- */
6
-
7
- import { describe, expect, it } from "vitest";
8
- import { OllamaClient, ClassifierSchemaError } from "../../../src/llm/ollama-client.js";
9
- import { LLMUnreachableError } from "../../../src/ports/llm-client.js";
10
-
11
- type FakeFetch = typeof fetch;
12
-
13
- function jsonResponse(body: unknown, init: ResponseInit = {}): Response {
14
- return new Response(JSON.stringify(body), {
15
- status: init.status ?? 200,
16
- headers: { "content-type": "application/json" },
17
- });
18
- }
19
-
20
- function makeFetch(reply: (req: { url: string; body: unknown }) => Response | Promise<Response>): FakeFetch {
21
- return (async (input: string | URL | Request, init?: RequestInit) => {
22
- const url = typeof input === "string" ? input : input.toString();
23
- const body = init?.body ? JSON.parse(init.body.toString()) : null;
24
- return reply({ url, body });
25
- }) as FakeFetch;
26
- }
27
-
28
- const VALID_PAYLOAD = {
29
- label: "Phase C classifier port",
30
- summary: "Built OllamaClient.classify with JSON-mode and schema validation against the shared prompt module.",
31
- entities: ["NLM", "Ollama", "OllamaClient"],
32
- decisions: ["Map schema-invalid output to a typed ClassifierSchemaError instead of returning null"],
33
- open: ["Whether to retry once on schema failure or send to inbox immediately"],
34
- confidence: 0.85,
35
- };
36
-
37
- describe("OllamaClient.classify", () => {
38
- it("parses a valid JSON payload through the Ollama chat envelope", async () => {
39
- const fetchImpl = makeFetch(({ url, body }) => {
40
- expect(url).toContain("/api/chat");
41
- const b = body as { model: string; messages: { role: string; content: string }[]; format: string };
42
- expect(b.format).toBe("json");
43
- expect(b.messages[0]?.role).toBe("system");
44
- expect(b.messages[0]?.content).toContain("session classifier");
45
- expect(b.messages[1]?.content).toContain("TRANSCRIPT TO CLASSIFY");
46
- return jsonResponse({ message: { content: JSON.stringify(VALID_PAYLOAD) } });
47
- });
48
- const client = new OllamaClient({ fetchImpl });
49
- const result = await client.classify("user: build the classifier\nassistant: done");
50
- expect(result.label).toBe(VALID_PAYLOAD.label);
51
- expect(result.entities).toEqual(VALID_PAYLOAD.entities);
52
- expect(result.decisions).toHaveLength(1);
53
- expect(result.confidence).toBeCloseTo(0.85);
54
- });
55
-
56
- it("threads priorContext into the user prompt when supplied", async () => {
57
- let userContent = "";
58
- const fetchImpl = makeFetch(({ body }) => {
59
- const b = body as { messages: { role: string; content: string }[] };
60
- userContent = b.messages[1]?.content ?? "";
61
- return jsonResponse({ message: { content: JSON.stringify(VALID_PAYLOAD) } });
62
- });
63
- const client = new OllamaClient({ fetchImpl });
64
- await client.classify("...transcript...", "earlier session about Hono routing");
65
- expect(userContent).toContain("PRIOR CONTEXT (already filed):");
66
- expect(userContent).toContain("earlier session about Hono routing");
67
- });
68
-
69
- it("strips markdown fences before JSON parse", async () => {
70
- const fenced = "```json\n" + JSON.stringify(VALID_PAYLOAD) + "\n```";
71
- const fetchImpl = makeFetch(() =>
72
- jsonResponse({ message: { content: fenced } }),
73
- );
74
- const client = new OllamaClient({ fetchImpl });
75
- const result = await client.classify("transcript");
76
- expect(result.label).toBe(VALID_PAYLOAD.label);
77
- });
78
-
79
- it("throws ClassifierSchemaError when required keys are missing", async () => {
80
- const bad = { label: "x", summary: "y" };
81
- const fetchImpl = makeFetch(() =>
82
- jsonResponse({ message: { content: JSON.stringify(bad) } }),
83
- );
84
- const client = new OllamaClient({ fetchImpl });
85
- await expect(client.classify("transcript")).rejects.toBeInstanceOf(ClassifierSchemaError);
86
- });
87
-
88
- it("throws ClassifierSchemaError when the model returns non-JSON", async () => {
89
- const fetchImpl = makeFetch(() =>
90
- jsonResponse({ message: { content: "not even close to json" } }),
91
- );
92
- const client = new OllamaClient({ fetchImpl });
93
- await expect(client.classify("transcript")).rejects.toBeInstanceOf(ClassifierSchemaError);
94
- });
95
-
96
- it("maps non-200 HTTP responses to LLMUnreachableError", async () => {
97
- const fetchImpl = makeFetch(() =>
98
- new Response("server down", { status: 503 }),
99
- );
100
- const client = new OllamaClient({ fetchImpl });
101
- await expect(client.classify("transcript")).rejects.toBeInstanceOf(LLMUnreachableError);
102
- });
103
-
104
- it("maps network throws to LLMUnreachableError", async () => {
105
- const fetchImpl = (async () => {
106
- throw new TypeError("ECONNREFUSED");
107
- }) as FakeFetch;
108
- const client = new OllamaClient({ fetchImpl });
109
- await expect(client.classify("transcript")).rejects.toBeInstanceOf(LLMUnreachableError);
110
- });
111
-
112
- it("coerces non-string entities to strings and trims whitespace", async () => {
113
- const messy = {
114
- ...VALID_PAYLOAD,
115
- entities: [" n8n ", " ", "Qdrant", 42],
116
- };
117
- const fetchImpl = makeFetch(() =>
118
- jsonResponse({ message: { content: JSON.stringify(messy) } }),
119
- );
120
- const client = new OllamaClient({ fetchImpl });
121
- const result = await client.classify("transcript");
122
- expect(result.entities).toEqual(["n8n", "Qdrant", "42"]);
123
- });
124
- });
package/tests/unit/scripts/longmemeval-scorer.test.ts DELETED
@@ -1,114 +0,0 @@
1
- import { describe, expect, it } from "vitest";
2
- import {
3
- aggregate,
4
- scoreOne,
5
- } from "../../../scripts/longmemeval/scorer.js";
6
-
7
- describe("scoreOne", () => {
8
- it("recallAtK=1 when a gold id is in the top-k", () => {
9
- const r = scoreOne({
10
- returnedIds: ["a", "b", "gold-1", "d", "e"],
11
- goldIds: ["gold-1", "gold-2"],
12
- returnedBodies: ["", "", "", "", ""],
13
- answer: "anything",
14
- k: 5,
15
- });
16
- expect(r.recallAtK).toBe(1);
17
- });
18
-
19
- it("recallAtK=0 when no gold id appears in the top-k", () => {
20
- const r = scoreOne({
21
- returnedIds: ["a", "b", "c", "d", "e"],
22
- goldIds: ["gold-1"],
23
- returnedBodies: ["", "", "", "", ""],
24
- answer: "z",
25
- k: 5,
26
- });
27
- expect(r.recallAtK).toBe(0);
28
- });
29
-
30
- it("recallAtK respects k=3 ceiling even when gold is at position 4", () => {
31
- const r = scoreOne({
32
- returnedIds: ["a", "b", "c", "gold-1", "e"],
33
- goldIds: ["gold-1"],
34
- returnedBodies: [],
35
- answer: "z",
36
- k: 3,
37
- });
38
- expect(r.recallAtK).toBe(0);
39
- });
40
-
41
- it("sessionBodyHit=1 when answer substring appears in any returned body (case/whitespace insensitive)", () => {
42
- const r = scoreOne({
43
- returnedIds: ["a", "b"],
44
- goldIds: ["gold"],
45
- returnedBodies: [
46
- "irrelevant transcript content",
47
- "User: Where did you grow up?\nAssistant: I grew up in Austin, Texas.",
48
- ],
49
- answer: "austin texas",
50
- k: 5,
51
- });
52
- expect(r.sessionBodyHit).toBe(1);
53
- });
54
-
55
- it("sessionBodyHit=0 when answer is absent from all returned bodies", () => {
56
- const r = scoreOne({
57
- returnedIds: ["a"],
58
- goldIds: ["gold"],
59
- returnedBodies: ["nothing matches here"],
60
- answer: "Houston",
61
- k: 5,
62
- });
63
- expect(r.sessionBodyHit).toBe(0);
64
- });
65
-
66
- it("coerces a numeric answer to string and matches with word boundaries", () => {
67
- const hit = scoreOne({
68
- returnedIds: ["a"],
69
- goldIds: ["gold"],
70
- returnedBodies: ["The user mentioned 3 brothers in the conversation."],
71
- answer: 3,
72
- k: 5,
73
- });
74
- expect(hit.sessionBodyHit).toBe(1);
75
-
76
- const miss = scoreOne({
77
- returnedIds: ["a"],
78
- goldIds: ["gold"],
79
- returnedBodies: ["They paid $30 for the meal and tipped 20%."],
80
- answer: 3,
81
- k: 5,
82
- });
83
- expect(miss.sessionBodyHit).toBe(0);
84
- });
85
-
86
- it("sessionBodyHit=0 when answer is empty", () => {
87
- const r = scoreOne({
88
- returnedIds: ["a"],
89
- goldIds: ["gold"],
90
- returnedBodies: ["whatever"],
91
- answer: "",
92
- k: 5,
93
- });
94
- expect(r.sessionBodyHit).toBe(0);
95
- });
96
- });
97
-
98
- describe("aggregate", () => {
99
- it("computes mean rates rounded to 3 decimal places", () => {
100
- const a = aggregate([
101
- { recallAtK: 1, sessionBodyHit: 1 },
102
- { recallAtK: 0, sessionBodyHit: 1 },
103
- { recallAtK: 1, sessionBodyHit: 0 },
104
- ]);
105
- expect(a.n).toBe(3);
106
- expect(a.recallAtK).toBeCloseTo(0.667, 3);
107
- expect(a.sessionBodyHitRate).toBeCloseTo(0.667, 3);
108
- });
109
-
110
- it("returns zeros for empty input", () => {
111
- const a = aggregate([]);
112
- expect(a).toEqual({ n: 0, recallAtK: 0, sessionBodyHitRate: 0 });
113
- });
114
- });
package/tsconfig.json DELETED
@@ -1,31 +0,0 @@
1
- {
2
- "compilerOptions": {
3
- "target": "ES2022",
4
- "module": "NodeNext",
5
- "moduleResolution": "NodeNext",
6
- "lib": ["ES2022"],
7
- "outDir": "dist",
8
- "rootDir": "src",
9
- "strict": true,
10
- "noUncheckedIndexedAccess": true,
11
- "exactOptionalPropertyTypes": true,
12
- "noImplicitOverride": true,
13
- "noFallthroughCasesInSwitch": true,
14
- "forceConsistentCasingInFileNames": true,
15
- "esModuleInterop": true,
16
- "skipLibCheck": true,
17
- "declaration": true,
18
- "sourceMap": true,
19
- "resolveJsonModule": true,
20
- "isolatedModules": true,
21
- "verbatimModuleSyntax": true,
22
- "baseUrl": "src",
23
- "paths": {
24
- "@core/*": ["./core/*"],
25
- "@ports/*": ["./ports/*"],
26
- "@shared/*": ["./shared/*"]
27
- }
28
- },
29
- "include": ["src/**/*.ts"],
30
- "exclude": ["node_modules", "dist", "src/ui"]
31
- }
package/tsconfig.test.json DELETED
@@ -1,11 +0,0 @@
1
- {
2
- "extends": "./tsconfig.json",
3
- "compilerOptions": {
4
- "rootDir": ".",
5
- "noEmit": true,
6
- "declaration": false,
7
- "sourceMap": false
8
- },
9
- "include": ["src/**/*.ts", "tests/**/*.ts"],
10
- "exclude": ["node_modules", "dist", "src/ui"]
11
- }
package/vitest.config.ts DELETED
@@ -1,22 +0,0 @@
1
- import { defineConfig } from "vitest/config";
2
- import { fileURLToPath } from "node:url";
3
-
4
- export default defineConfig({
5
- test: {
6
- globals: false,
7
- environment: "node",
8
- include: ["tests/**/*.test.ts"],
9
- coverage: {
10
- provider: "v8",
11
- include: ["src/core/**", "src/ports/**"],
12
- reporter: ["text", "html"],
13
- },
14
- },
15
- resolve: {
16
- alias: {
17
- "@core": fileURLToPath(new URL("./src/core", import.meta.url)),
18
- "@ports": fileURLToPath(new URL("./src/ports", import.meta.url)),
19
- "@shared": fileURLToPath(new URL("./src/shared", import.meta.url)),
20
- },
21
- },
22
- });