nlm-memory 0.5.0 → 0.5.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (247)
  1. package/README.md +72 -34
  2. package/dist/cli/nlm.js +2 -1
  3. package/dist/cli/nlm.js.map +1 -1
  4. package/dist/http/app.js +2 -1
  5. package/dist/http/app.js.map +1 -1
  6. package/dist/mcp/server.js +20 -1
  7. package/dist/mcp/server.js.map +1 -1
  8. package/dist/ui/assets/{index-C8cpwbYJ.css → index-Beo8psd-.css} +1 -1
  9. package/dist/ui/assets/{index-CB50QnL-.js → index-CSPTTeeM.js} +8 -8
  10. package/dist/ui/index.html +2 -2
  11. package/package.json +26 -1
  12. package/.agents/plugins/marketplace.json +0 -20
  13. package/.github/workflows/ci.yml +0 -30
  14. package/docs/methodology/re-derivation-rate.md +0 -112
  15. package/docs/methodology/useful-hit-rate.md +0 -79
  16. package/docs/plans/2026-05-20-fts5-lexical-recall.md +0 -1088
  17. package/docs/plans/2026-05-20-recall-daemon-wedge-fix.md +0 -662
  18. package/docs/plans/2026-05-20-recall-hook-design.md +0 -131
  19. package/docs/plans/2026-05-20-recall-hook-implementation.md +0 -1222
  20. package/docs/plans/desktop-product.md +0 -69
  21. package/docs/plans/factstore-design.md +0 -236
  22. package/logs/CHANGELOG/CHANGELOG-2026.md +0 -1575
  23. package/logs/CHANGELOG/CHANGELOG.md +0 -209
  24. package/migrations/000_initial_schema.sql +0 -174
  25. package/migrations/001_entity_type_rename.sql +0 -17
  26. package/migrations/002_adapter_state_extend.sql +0 -12
  27. package/migrations/003_session_embeddings.sql +0 -11
  28. package/migrations/004_facts.sql +0 -46
  29. package/migrations/005_sources.sql +0 -31
  30. package/migrations/006_providers.sql +0 -33
  31. package/migrations/007_source_tokens.sql +0 -17
  32. package/migrations/008_fts_rebuild.sql +0 -9
  33. package/migrations/009_session_embedding_chunks.sql +0 -46
  34. package/migrations/010_sources_opencode.sql +0 -30
  35. package/migrations/011_sources_hermes_agent.sql +0 -30
  36. package/migrations/012_sources_aider.sql +0 -30
  37. package/migrations/013_adapter_state_failure_count.sql +0 -12
  38. package/migrations/014_sources_cursor.sql +0 -30
  39. package/migrations/015_sources_windsurf.sql +0 -30
  40. package/plugin-hermes-agent/README.md +0 -49
  41. package/plugin-hermes-agent/__init__.py +0 -75
  42. package/plugin-hermes-agent/plugin.yaml +0 -15
  43. package/scripts/backfill-citations.mjs +0 -0
  44. package/scripts/build-codex-plugin.mjs +0 -61
  45. package/scripts/deepseek-probe.mjs +0 -67
  46. package/scripts/extract-triples.mjs +0 -207
  47. package/scripts/longmemeval/embedding-cache.ts +0 -77
  48. package/scripts/longmemeval/fetch-dataset.sh +0 -25
  49. package/scripts/longmemeval/run-harness.ts +0 -315
  50. package/scripts/longmemeval/scorer.ts +0 -99
  51. package/scripts/longmemeval/tsconfig.json +0 -9
  52. package/scripts/longmemeval/types.ts +0 -35
  53. package/scripts/nlm-daily-digest.py +0 -239
  54. package/scripts/nlm-daily-digest.sh +0 -28
  55. package/src/cli/classify-parity.ts +0 -257
  56. package/src/cli/launchctl-helpers.ts +0 -49
  57. package/src/cli/nlm.ts +0 -1078
  58. package/src/core/actions/actions-log.ts +0 -118
  59. package/src/core/actions/overlay.ts +0 -117
  60. package/src/core/adapters/aider.ts +0 -205
  61. package/src/core/adapters/claude-code.ts +0 -293
  62. package/src/core/adapters/common.ts +0 -54
  63. package/src/core/adapters/cursor.ts +0 -486
  64. package/src/core/adapters/from-source.ts +0 -67
  65. package/src/core/adapters/hermes-agent.ts +0 -240
  66. package/src/core/adapters/hermes.ts +0 -277
  67. package/src/core/adapters/jsonl-generic.ts +0 -208
  68. package/src/core/adapters/opencode.ts +0 -281
  69. package/src/core/adapters/pi.ts +0 -264
  70. package/src/core/adapters/windsurf.ts +0 -386
  71. package/src/core/classifier/prompt.ts +0 -200
  72. package/src/core/dataset/build-dataset.ts +0 -463
  73. package/src/core/embedding/chunk-body.ts +0 -76
  74. package/src/core/embedding/embed-backfill.ts +0 -210
  75. package/src/core/embedding/embed-normalize.ts +0 -135
  76. package/src/core/facts/backfill-facts.ts +0 -254
  77. package/src/core/facts/extract-facts.ts +0 -50
  78. package/src/core/hook/citation-detect.ts +0 -124
  79. package/src/core/hook/cite-memo.ts +0 -68
  80. package/src/core/hook/claude-settings.ts +0 -187
  81. package/src/core/hook/gate.ts +0 -25
  82. package/src/core/hook/hook-log.ts +0 -41
  83. package/src/core/hook/memo-sweep.ts +0 -164
  84. package/src/core/hook/memo.ts +0 -67
  85. package/src/core/hook/pointer-block.ts +0 -26
  86. package/src/core/hook/select.ts +0 -32
  87. package/src/core/hook/transcript.ts +0 -121
  88. package/src/core/ingest/ingest-session.ts +0 -111
  89. package/src/core/providers/provider-models.ts +0 -100
  90. package/src/core/providers/provider-registry.ts +0 -196
  91. package/src/core/recall/citation-log.ts +0 -108
  92. package/src/core/recall/filter.ts +0 -27
  93. package/src/core/recall/index.ts +0 -6
  94. package/src/core/recall/match-fields.ts +0 -40
  95. package/src/core/recall/query-log.ts +0 -149
  96. package/src/core/recall/query-shape.ts +0 -66
  97. package/src/core/recall/recall-service.ts +0 -320
  98. package/src/core/recall/recent-log.ts +0 -59
  99. package/src/core/recall/tokenize.ts +0 -18
  100. package/src/core/recall/useful-scan.ts +0 -336
  101. package/src/core/recall-facts/fact-query-log.ts +0 -150
  102. package/src/core/recall-facts/fact-recall-service.ts +0 -327
  103. package/src/core/scheduler/scan-once.ts +0 -142
  104. package/src/core/scheduler/scheduler.ts +0 -225
  105. package/src/core/sources/source-registry.ts +0 -278
  106. package/src/core/storage/db-restore.ts +0 -133
  107. package/src/core/storage/live-status.ts +0 -45
  108. package/src/core/storage/migrate.ts +0 -72
  109. package/src/core/storage/sqlite-fact-store.ts +0 -304
  110. package/src/core/storage/sqlite-session-store.ts +0 -810
  111. package/src/hook/hook-auth.ts +0 -18
  112. package/src/hook/prompt-recall-hook.ts +0 -180
  113. package/src/hook/session-end-hook.ts +0 -81
  114. package/src/hook/session-start-hook.ts +0 -168
  115. package/src/hook/stop-hook.ts +0 -239
  116. package/src/http/app.ts +0 -1215
  117. package/src/install/claude-code.ts +0 -128
  118. package/src/install/codex.ts +0 -367
  119. package/src/install/cursor.ts +0 -68
  120. package/src/install/hermes-agent.ts +0 -76
  121. package/src/install/hermes.ts +0 -78
  122. package/src/install/nlm-dir-perms.ts +0 -55
  123. package/src/install/ollama.ts +0 -284
  124. package/src/install/setup.ts +0 -489
  125. package/src/install/windsurf.ts +0 -68
  126. package/src/llm/classifier-box.ts +0 -64
  127. package/src/llm/deepseek-client.ts +0 -150
  128. package/src/llm/env-autoload.ts +0 -55
  129. package/src/llm/ollama-client.ts +0 -189
  130. package/src/mcp/server.ts +0 -534
  131. package/src/ports/fact-store.ts +0 -102
  132. package/src/ports/llm-client.ts +0 -52
  133. package/src/ports/logger.ts +0 -16
  134. package/src/ports/session-store.ts +0 -45
  135. package/src/ports/transcript-adapter.ts +0 -55
  136. package/src/shared/types.ts +0 -149
  137. package/src/ui/App.tsx +0 -58
  138. package/src/ui/components/PromoteOpenButton.tsx +0 -65
  139. package/src/ui/components/SessionDrawer.tsx +0 -199
  140. package/src/ui/components/SideNav.tsx +0 -162
  141. package/src/ui/components/Skeleton.tsx +0 -107
  142. package/src/ui/index.html +0 -13
  143. package/src/ui/lib/actions.ts +0 -30
  144. package/src/ui/lib/api.ts +0 -92
  145. package/src/ui/lib/dataset.ts +0 -141
  146. package/src/ui/lib/registries.ts +0 -155
  147. package/src/ui/lib/view-settings.ts +0 -41
  148. package/src/ui/main.tsx +0 -15
  149. package/src/ui/pages/Live.tsx +0 -229
  150. package/src/ui/pages/Pulse.tsx +0 -415
  151. package/src/ui/pages/Recall.tsx +0 -190
  152. package/src/ui/pages/River.tsx +0 -354
  153. package/src/ui/pages/Search.tsx +0 -386
  154. package/src/ui/pages/Stub.tsx +0 -9
  155. package/src/ui/pages/Thread.tsx +0 -473
  156. package/src/ui/pages/settings/Classifier.tsx +0 -227
  157. package/src/ui/pages/settings/Data.tsx +0 -190
  158. package/src/ui/pages/settings/Index.tsx +0 -65
  159. package/src/ui/pages/settings/Labels.tsx +0 -224
  160. package/src/ui/pages/settings/Providers.tsx +0 -305
  161. package/src/ui/pages/settings/SettingsSubnav.tsx +0 -28
  162. package/src/ui/pages/settings/Sources.tsx +0 -326
  163. package/src/ui/pages/settings/Views.tsx +0 -96
  164. package/src/ui/styles.css +0 -1890
  165. package/src/ui/tsconfig.json +0 -21
  166. package/src/ui/vite.config.ts +0 -19
  167. package/tests/fixtures/claude_code/short_session.jsonl +0 -2
  168. package/tests/fixtures/claude_code/standard_iso.jsonl +0 -4
  169. package/tests/fixtures/claude_code/tool_heavy.jsonl +0 -8
  170. package/tests/fixtures/claude_code/with_subagent.jsonl +0 -7
  171. package/tests/fixtures/facts.ts +0 -17
  172. package/tests/fixtures/golden-corpus.ts +0 -85
  173. package/tests/fixtures/hermes/paired_request_dump.json +0 -24
  174. package/tests/fixtures/hermes/paired_session.json +0 -23
  175. package/tests/fixtures/hermes/request_dump.json +0 -28
  176. package/tests/fixtures/hermes/session_iso.json +0 -38
  177. package/tests/fixtures/hermes/session_unix.json +0 -38
  178. package/tests/fixtures/hermes/system_only.json +0 -18
  179. package/tests/fixtures/pi/error-connection-abort.jsonl +0 -8
  180. package/tests/fixtures/pi/short-successful.jsonl +0 -5
  181. package/tests/fixtures/pi/with-custom-message.jsonl +0 -6
  182. package/tests/fixtures/sessions.ts +0 -22
  183. package/tests/integration/backfill-facts.test.ts +0 -362
  184. package/tests/integration/citation-explicit.test.ts +0 -111
  185. package/tests/integration/cite-event.test.ts +0 -169
  186. package/tests/integration/cite-memo.test.ts +0 -87
  187. package/tests/integration/db-restore.test.ts +0 -153
  188. package/tests/integration/embed-backfill.test.ts +0 -176
  189. package/tests/integration/fact-supersedence.test.ts +0 -313
  190. package/tests/integration/fts-index.test.ts +0 -60
  191. package/tests/integration/getbyids-sqlite.test.ts +0 -100
  192. package/tests/integration/hermes-agent-hooks.test.ts +0 -248
  193. package/tests/integration/hook-claude-settings.test.ts +0 -218
  194. package/tests/integration/hook-log.test.ts +0 -54
  195. package/tests/integration/hook-memo.test.ts +0 -68
  196. package/tests/integration/hook-pre-compact.test.ts +0 -105
  197. package/tests/integration/hook-subagent-start.test.ts +0 -102
  198. package/tests/integration/http.test.ts +0 -401
  199. package/tests/integration/keyword-search-fts.test.ts +0 -66
  200. package/tests/integration/mcp-recall-logging.test.ts +0 -88
  201. package/tests/integration/mcp.test.ts +0 -260
  202. package/tests/integration/memo-sweep.test.ts +0 -91
  203. package/tests/integration/prompt-recall-hook.test.ts +0 -88
  204. package/tests/integration/provider-registry.test.ts +0 -107
  205. package/tests/integration/recall-golden.test.ts +0 -59
  206. package/tests/integration/recall-sqlite.test.ts +0 -169
  207. package/tests/integration/scheduler.test.ts +0 -391
  208. package/tests/integration/session-end-hook.test.ts +0 -48
  209. package/tests/integration/session-start-hook.test.ts +0 -126
  210. package/tests/integration/source-registry.test.ts +0 -122
  211. package/tests/integration/sqlite-fact-store.test.ts +0 -346
  212. package/tests/integration/stop-hook.test.ts +0 -560
  213. package/tests/integration/wal-checkpoint.test.ts +0 -49
  214. package/tests/unit/cli/launchctl-helpers.test.ts +0 -60
  215. package/tests/unit/core/adapters/aider.test.ts +0 -230
  216. package/tests/unit/core/adapters/claude-code.test.ts +0 -118
  217. package/tests/unit/core/adapters/cursor.test.ts +0 -485
  218. package/tests/unit/core/adapters/hermes-agent.test.ts +0 -329
  219. package/tests/unit/core/adapters/hermes.test.ts +0 -81
  220. package/tests/unit/core/adapters/jsonl-generic.test.ts +0 -142
  221. package/tests/unit/core/adapters/opencode.test.ts +0 -354
  222. package/tests/unit/core/adapters/pi.test.ts +0 -110
  223. package/tests/unit/core/adapters/windsurf.test.ts +0 -416
  224. package/tests/unit/core/classifier/prompt.test.ts +0 -126
  225. package/tests/unit/core/embedding/chunk-body.test.ts +0 -100
  226. package/tests/unit/core/facts/extract-facts.test.ts +0 -117
  227. package/tests/unit/core/filter.test.ts +0 -40
  228. package/tests/unit/core/hook/citation-detect-cite-session.test.ts +0 -96
  229. package/tests/unit/core/hook/citation-detect.test.ts +0 -124
  230. package/tests/unit/core/hook/gate.test.ts +0 -29
  231. package/tests/unit/core/hook/pointer-block.test.ts +0 -22
  232. package/tests/unit/core/hook/select.test.ts +0 -66
  233. package/tests/unit/core/match-fields.test.ts +0 -39
  234. package/tests/unit/core/mcp-cite-session.test.ts +0 -51
  235. package/tests/unit/core/providers/provider-models.test.ts +0 -101
  236. package/tests/unit/core/query-shape.test.ts +0 -92
  237. package/tests/unit/core/recall-facts/fact-recall-service.test.ts +0 -258
  238. package/tests/unit/core/recall-service.test.ts +0 -200
  239. package/tests/unit/core/storage/live-status.test.ts +0 -54
  240. package/tests/unit/core/tokenize.test.ts +0 -32
  241. package/tests/unit/core/useful-scan.test.ts +0 -537
  242. package/tests/unit/llm/embed.test.ts +0 -93
  243. package/tests/unit/llm/ollama-client.test.ts +0 -124
  244. package/tests/unit/scripts/longmemeval-scorer.test.ts +0 -114
  245. package/tsconfig.json +0 -31
  246. package/tsconfig.test.json +0 -11
  247. package/vitest.config.ts +0 -22
package/tests/unit/llm/embed.test.ts DELETED
@@ -1,93 +0,0 @@
1
- /**
2
- * Unit tests for OllamaClient.embed: nomic prefix scheme, L2 normalization,
3
- * 8K char truncation. These guard the nomic-embed-text v1.5 contract.
4
- */
5
-
6
- import { describe, expect, it } from "vitest";
7
- import { OllamaClient, l2Normalize } from "../../../src/llm/ollama-client.js";
8
-
9
- type FakeFetch = typeof fetch;
10
-
11
- function jsonResponse(body: unknown): Response {
12
- return new Response(JSON.stringify(body), {
13
- status: 200,
14
- headers: { "content-type": "application/json" },
15
- });
16
- }
17
-
18
- function makeFetch(reply: (req: { url: string; body: unknown }) => Response): FakeFetch {
19
- return (async (input: string | URL | Request, init?: RequestInit) => {
20
- const url = typeof input === "string" ? input : input.toString();
21
- const body = init?.body ? JSON.parse(init.body.toString()) : null;
22
- return reply({ url, body });
23
- }) as FakeFetch;
24
- }
25
-
26
- describe("OllamaClient.embed prefix scheme", () => {
27
- it("prefixes a query call with 'search_query: '", async () => {
28
- let prompt = "";
29
- const fetchImpl = makeFetch(({ body }) => {
30
- prompt = (body as { prompt: string }).prompt;
31
- return jsonResponse({ embedding: [1, 0, 0] });
32
- });
33
- const client = new OllamaClient({ fetchImpl });
34
- await client.embed("what did we decide about pgvector", "query");
35
- expect(prompt.startsWith("search_query: ")).toBe(true);
36
- expect(prompt).toContain("pgvector");
37
- });
38
-
39
- it("prefixes a document call with 'search_document: '", async () => {
40
- let prompt = "";
41
- const fetchImpl = makeFetch(({ body }) => {
42
- prompt = (body as { prompt: string }).prompt;
43
- return jsonResponse({ embedding: [1, 0, 0] });
44
- });
45
- const client = new OllamaClient({ fetchImpl });
46
- await client.embed("session body text", "document");
47
- expect(prompt.startsWith("search_document: ")).toBe(true);
48
- });
49
-
50
- it("truncates text to MAX_EMBED_CHARS (8000) before prefixing", async () => {
51
- let prompt = "";
52
- const fetchImpl = makeFetch(({ body }) => {
53
- prompt = (body as { prompt: string }).prompt;
54
- return jsonResponse({ embedding: [1, 0, 0] });
55
- });
56
- const client = new OllamaClient({ fetchImpl });
57
- const big = "x".repeat(10_000);
58
- await client.embed(big, "document");
59
- // prompt = "search_document: " + truncated → prefix is 17 chars, body capped at 8000.
60
- // Briefly raised to 28000 on 2026-05-25 then reverted same day; nomic-
61
- // embed-text via Ollama 500s on inputs near the nominal 8192-token
62
- // context. Real fix is chunk + max-pool (filed as #174).
63
- expect(prompt.length).toBe(17 + 8_000);
64
- });
65
-
66
- it("L2-normalizes the returned vector", async () => {
67
- const fetchImpl = makeFetch(() => jsonResponse({ embedding: [3, 4, 0] }));
68
- const client = new OllamaClient({ fetchImpl });
69
- const { vector } = await client.embed("anything", "document");
70
- // raw norm = 5; normalized should be [0.6, 0.8, 0]
71
- expect(vector[0]).toBeCloseTo(0.6, 6);
72
- expect(vector[1]).toBeCloseTo(0.8, 6);
73
- expect(vector[2]).toBe(0);
74
- let norm = 0;
75
- for (const v of vector) norm += v * v;
76
- expect(Math.sqrt(norm)).toBeCloseTo(1, 6);
77
- });
78
- });
79
-
80
- describe("l2Normalize", () => {
81
- it("returns a unit vector for a non-zero input", () => {
82
- const out = l2Normalize(new Float32Array([3, 4, 0]));
83
- let sum = 0;
84
- for (const v of out) sum += v * v;
85
- expect(Math.sqrt(sum)).toBeCloseTo(1, 6);
86
- });
87
-
88
- it("returns the zero vector unchanged", () => {
89
- const zero = new Float32Array([0, 0, 0]);
90
- const out = l2Normalize(zero);
91
- expect(Array.from(out)).toEqual([0, 0, 0]);
92
- });
93
- });
package/tests/unit/llm/ollama-client.test.ts DELETED
@@ -1,124 +0,0 @@
1
- /**
2
- * Unit tests for OllamaClient.classify against an injected fake fetch.
3
- * No network. Verifies prompt construction, JSON-mode handling, schema
4
- * validation, fence stripping, and error mapping.
5
- */
6
-
7
- import { describe, expect, it } from "vitest";
8
- import { OllamaClient, ClassifierSchemaError } from "../../../src/llm/ollama-client.js";
9
- import { LLMUnreachableError } from "../../../src/ports/llm-client.js";
10
-
11
- type FakeFetch = typeof fetch;
12
-
13
- function jsonResponse(body: unknown, init: ResponseInit = {}): Response {
14
- return new Response(JSON.stringify(body), {
15
- status: init.status ?? 200,
16
- headers: { "content-type": "application/json" },
17
- });
18
- }
19
-
20
- function makeFetch(reply: (req: { url: string; body: unknown }) => Response | Promise<Response>): FakeFetch {
21
- return (async (input: string | URL | Request, init?: RequestInit) => {
22
- const url = typeof input === "string" ? input : input.toString();
23
- const body = init?.body ? JSON.parse(init.body.toString()) : null;
24
- return reply({ url, body });
25
- }) as FakeFetch;
26
- }
27
-
28
- const VALID_PAYLOAD = {
29
- label: "Phase C classifier port",
30
- summary: "Built OllamaClient.classify with JSON-mode and schema validation against the shared prompt module.",
31
- entities: ["NLM", "Ollama", "OllamaClient"],
32
- decisions: ["Map schema-invalid output to a typed ClassifierSchemaError instead of returning null"],
33
- open: ["Whether to retry once on schema failure or send to inbox immediately"],
34
- confidence: 0.85,
35
- };
36
-
37
- describe("OllamaClient.classify", () => {
38
- it("parses a valid JSON payload through the Ollama chat envelope", async () => {
39
- const fetchImpl = makeFetch(({ url, body }) => {
40
- expect(url).toContain("/api/chat");
41
- const b = body as { model: string; messages: { role: string; content: string }[]; format: string };
42
- expect(b.format).toBe("json");
43
- expect(b.messages[0]?.role).toBe("system");
44
- expect(b.messages[0]?.content).toContain("session classifier");
45
- expect(b.messages[1]?.content).toContain("TRANSCRIPT TO CLASSIFY");
46
- return jsonResponse({ message: { content: JSON.stringify(VALID_PAYLOAD) } });
47
- });
48
- const client = new OllamaClient({ fetchImpl });
49
- const result = await client.classify("user: build the classifier\nassistant: done");
50
- expect(result.label).toBe(VALID_PAYLOAD.label);
51
- expect(result.entities).toEqual(VALID_PAYLOAD.entities);
52
- expect(result.decisions).toHaveLength(1);
53
- expect(result.confidence).toBeCloseTo(0.85);
54
- });
55
-
56
- it("threads priorContext into the user prompt when supplied", async () => {
57
- let userContent = "";
58
- const fetchImpl = makeFetch(({ body }) => {
59
- const b = body as { messages: { role: string; content: string }[] };
60
- userContent = b.messages[1]?.content ?? "";
61
- return jsonResponse({ message: { content: JSON.stringify(VALID_PAYLOAD) } });
62
- });
63
- const client = new OllamaClient({ fetchImpl });
64
- await client.classify("...transcript...", "earlier session about Hono routing");
65
- expect(userContent).toContain("PRIOR CONTEXT (already filed):");
66
- expect(userContent).toContain("earlier session about Hono routing");
67
- });
68
-
69
- it("strips markdown fences before JSON parse", async () => {
70
- const fenced = "```json\n" + JSON.stringify(VALID_PAYLOAD) + "\n```";
71
- const fetchImpl = makeFetch(() =>
72
- jsonResponse({ message: { content: fenced } }),
73
- );
74
- const client = new OllamaClient({ fetchImpl });
75
- const result = await client.classify("transcript");
76
- expect(result.label).toBe(VALID_PAYLOAD.label);
77
- });
78
-
79
- it("throws ClassifierSchemaError when required keys are missing", async () => {
80
- const bad = { label: "x", summary: "y" };
81
- const fetchImpl = makeFetch(() =>
82
- jsonResponse({ message: { content: JSON.stringify(bad) } }),
83
- );
84
- const client = new OllamaClient({ fetchImpl });
85
- await expect(client.classify("transcript")).rejects.toBeInstanceOf(ClassifierSchemaError);
86
- });
87
-
88
- it("throws ClassifierSchemaError when the model returns non-JSON", async () => {
89
- const fetchImpl = makeFetch(() =>
90
- jsonResponse({ message: { content: "not even close to json" } }),
91
- );
92
- const client = new OllamaClient({ fetchImpl });
93
- await expect(client.classify("transcript")).rejects.toBeInstanceOf(ClassifierSchemaError);
94
- });
95
-
96
- it("maps non-200 HTTP responses to LLMUnreachableError", async () => {
97
- const fetchImpl = makeFetch(() =>
98
- new Response("server down", { status: 503 }),
99
- );
100
- const client = new OllamaClient({ fetchImpl });
101
- await expect(client.classify("transcript")).rejects.toBeInstanceOf(LLMUnreachableError);
102
- });
103
-
104
- it("maps network throws to LLMUnreachableError", async () => {
105
- const fetchImpl = (async () => {
106
- throw new TypeError("ECONNREFUSED");
107
- }) as FakeFetch;
108
- const client = new OllamaClient({ fetchImpl });
109
- await expect(client.classify("transcript")).rejects.toBeInstanceOf(LLMUnreachableError);
110
- });
111
-
112
- it("coerces non-string entities to strings and trims whitespace", async () => {
113
- const messy = {
114
- ...VALID_PAYLOAD,
115
- entities: [" n8n ", " ", "Qdrant", 42],
116
- };
117
- const fetchImpl = makeFetch(() =>
118
- jsonResponse({ message: { content: JSON.stringify(messy) } }),
119
- );
120
- const client = new OllamaClient({ fetchImpl });
121
- const result = await client.classify("transcript");
122
- expect(result.entities).toEqual(["n8n", "Qdrant", "42"]);
123
- });
124
- });
package/tests/unit/scripts/longmemeval-scorer.test.ts DELETED
@@ -1,114 +0,0 @@
1
- import { describe, expect, it } from "vitest";
2
- import {
3
- aggregate,
4
- scoreOne,
5
- } from "../../../scripts/longmemeval/scorer.js";
6
-
7
- describe("scoreOne", () => {
8
- it("recallAtK=1 when a gold id is in the top-k", () => {
9
- const r = scoreOne({
10
- returnedIds: ["a", "b", "gold-1", "d", "e"],
11
- goldIds: ["gold-1", "gold-2"],
12
- returnedBodies: ["", "", "", "", ""],
13
- answer: "anything",
14
- k: 5,
15
- });
16
- expect(r.recallAtK).toBe(1);
17
- });
18
-
19
- it("recallAtK=0 when no gold id appears in the top-k", () => {
20
- const r = scoreOne({
21
- returnedIds: ["a", "b", "c", "d", "e"],
22
- goldIds: ["gold-1"],
23
- returnedBodies: ["", "", "", "", ""],
24
- answer: "z",
25
- k: 5,
26
- });
27
- expect(r.recallAtK).toBe(0);
28
- });
29
-
30
- it("recallAtK respects k=3 ceiling even when gold is at position 4", () => {
31
- const r = scoreOne({
32
- returnedIds: ["a", "b", "c", "gold-1", "e"],
33
- goldIds: ["gold-1"],
34
- returnedBodies: [],
35
- answer: "z",
36
- k: 3,
37
- });
38
- expect(r.recallAtK).toBe(0);
39
- });
40
-
41
- it("sessionBodyHit=1 when answer substring appears in any returned body (case/whitespace insensitive)", () => {
42
- const r = scoreOne({
43
- returnedIds: ["a", "b"],
44
- goldIds: ["gold"],
45
- returnedBodies: [
46
- "irrelevant transcript content",
47
- "User: Where did you grow up?\nAssistant: I grew up in Austin, Texas.",
48
- ],
49
- answer: "austin texas",
50
- k: 5,
51
- });
52
- expect(r.sessionBodyHit).toBe(1);
53
- });
54
-
55
- it("sessionBodyHit=0 when answer is absent from all returned bodies", () => {
56
- const r = scoreOne({
57
- returnedIds: ["a"],
58
- goldIds: ["gold"],
59
- returnedBodies: ["nothing matches here"],
60
- answer: "Houston",
61
- k: 5,
62
- });
63
- expect(r.sessionBodyHit).toBe(0);
64
- });
65
-
66
- it("coerces a numeric answer to string and matches with word boundaries", () => {
67
- const hit = scoreOne({
68
- returnedIds: ["a"],
69
- goldIds: ["gold"],
70
- returnedBodies: ["The user mentioned 3 brothers in the conversation."],
71
- answer: 3,
72
- k: 5,
73
- });
74
- expect(hit.sessionBodyHit).toBe(1);
75
-
76
- const miss = scoreOne({
77
- returnedIds: ["a"],
78
- goldIds: ["gold"],
79
- returnedBodies: ["They paid $30 for the meal and tipped 20%."],
80
- answer: 3,
81
- k: 5,
82
- });
83
- expect(miss.sessionBodyHit).toBe(0);
84
- });
85
-
86
- it("sessionBodyHit=0 when answer is empty", () => {
87
- const r = scoreOne({
88
- returnedIds: ["a"],
89
- goldIds: ["gold"],
90
- returnedBodies: ["whatever"],
91
- answer: "",
92
- k: 5,
93
- });
94
- expect(r.sessionBodyHit).toBe(0);
95
- });
96
- });
97
-
98
- describe("aggregate", () => {
99
- it("computes mean rates rounded to 3 decimal places", () => {
100
- const a = aggregate([
101
- { recallAtK: 1, sessionBodyHit: 1 },
102
- { recallAtK: 0, sessionBodyHit: 1 },
103
- { recallAtK: 1, sessionBodyHit: 0 },
104
- ]);
105
- expect(a.n).toBe(3);
106
- expect(a.recallAtK).toBeCloseTo(0.667, 3);
107
- expect(a.sessionBodyHitRate).toBeCloseTo(0.667, 3);
108
- });
109
-
110
- it("returns zeros for empty input", () => {
111
- const a = aggregate([]);
112
- expect(a).toEqual({ n: 0, recallAtK: 0, sessionBodyHitRate: 0 });
113
- });
114
- });
package/tsconfig.json DELETED
@@ -1,31 +0,0 @@
1
- {
2
- "compilerOptions": {
3
- "target": "ES2022",
4
- "module": "NodeNext",
5
- "moduleResolution": "NodeNext",
6
- "lib": ["ES2022"],
7
- "outDir": "dist",
8
- "rootDir": "src",
9
- "strict": true,
10
- "noUncheckedIndexedAccess": true,
11
- "exactOptionalPropertyTypes": true,
12
- "noImplicitOverride": true,
13
- "noFallthroughCasesInSwitch": true,
14
- "forceConsistentCasingInFileNames": true,
15
- "esModuleInterop": true,
16
- "skipLibCheck": true,
17
- "declaration": true,
18
- "sourceMap": true,
19
- "resolveJsonModule": true,
20
- "isolatedModules": true,
21
- "verbatimModuleSyntax": true,
22
- "baseUrl": "src",
23
- "paths": {
24
- "@core/*": ["./core/*"],
25
- "@ports/*": ["./ports/*"],
26
- "@shared/*": ["./shared/*"]
27
- }
28
- },
29
- "include": ["src/**/*.ts"],
30
- "exclude": ["node_modules", "dist", "src/ui"]
31
- }
package/tsconfig.test.json DELETED
@@ -1,11 +0,0 @@
1
- {
2
- "extends": "./tsconfig.json",
3
- "compilerOptions": {
4
- "rootDir": ".",
5
- "noEmit": true,
6
- "declaration": false,
7
- "sourceMap": false
8
- },
9
- "include": ["src/**/*.ts", "tests/**/*.ts"],
10
- "exclude": ["node_modules", "dist", "src/ui"]
11
- }
package/vitest.config.ts DELETED
@@ -1,22 +0,0 @@
1
- import { defineConfig } from "vitest/config";
2
- import { fileURLToPath } from "node:url";
3
-
4
- export default defineConfig({
5
- test: {
6
- globals: false,
7
- environment: "node",
8
- include: ["tests/**/*.test.ts"],
9
- coverage: {
10
- provider: "v8",
11
- include: ["src/core/**", "src/ports/**"],
12
- reporter: ["text", "html"],
13
- },
14
- },
15
- resolve: {
16
- alias: {
17
- "@core": fileURLToPath(new URL("./src/core", import.meta.url)),
18
- "@ports": fileURLToPath(new URL("./src/ports", import.meta.url)),
19
- "@shared": fileURLToPath(new URL("./src/shared", import.meta.url)),
20
- },
21
- },
22
- });