nlm-memory 0.5.0 → 0.5.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +72 -34
- package/dist/cli/nlm.js +2 -1
- package/dist/cli/nlm.js.map +1 -1
- package/dist/http/app.js +2 -1
- package/dist/http/app.js.map +1 -1
- package/dist/mcp/server.js +20 -1
- package/dist/mcp/server.js.map +1 -1
- package/dist/ui/assets/{index-C8cpwbYJ.css → index-Beo8psd-.css} +1 -1
- package/dist/ui/assets/{index-CB50QnL-.js → index-CSPTTeeM.js} +8 -8
- package/dist/ui/index.html +2 -2
- package/package.json +26 -1
- package/.agents/plugins/marketplace.json +0 -20
- package/.github/workflows/ci.yml +0 -30
- package/docs/methodology/re-derivation-rate.md +0 -112
- package/docs/methodology/useful-hit-rate.md +0 -79
- package/docs/plans/2026-05-20-fts5-lexical-recall.md +0 -1088
- package/docs/plans/2026-05-20-recall-daemon-wedge-fix.md +0 -662
- package/docs/plans/2026-05-20-recall-hook-design.md +0 -131
- package/docs/plans/2026-05-20-recall-hook-implementation.md +0 -1222
- package/docs/plans/desktop-product.md +0 -69
- package/docs/plans/factstore-design.md +0 -236
- package/logs/CHANGELOG/CHANGELOG-2026.md +0 -1575
- package/logs/CHANGELOG/CHANGELOG.md +0 -209
- package/migrations/000_initial_schema.sql +0 -174
- package/migrations/001_entity_type_rename.sql +0 -17
- package/migrations/002_adapter_state_extend.sql +0 -12
- package/migrations/003_session_embeddings.sql +0 -11
- package/migrations/004_facts.sql +0 -46
- package/migrations/005_sources.sql +0 -31
- package/migrations/006_providers.sql +0 -33
- package/migrations/007_source_tokens.sql +0 -17
- package/migrations/008_fts_rebuild.sql +0 -9
- package/migrations/009_session_embedding_chunks.sql +0 -46
- package/migrations/010_sources_opencode.sql +0 -30
- package/migrations/011_sources_hermes_agent.sql +0 -30
- package/migrations/012_sources_aider.sql +0 -30
- package/migrations/013_adapter_state_failure_count.sql +0 -12
- package/migrations/014_sources_cursor.sql +0 -30
- package/migrations/015_sources_windsurf.sql +0 -30
- package/plugin-hermes-agent/README.md +0 -49
- package/plugin-hermes-agent/__init__.py +0 -75
- package/plugin-hermes-agent/plugin.yaml +0 -15
- package/scripts/backfill-citations.mjs +0 -0
- package/scripts/build-codex-plugin.mjs +0 -61
- package/scripts/deepseek-probe.mjs +0 -67
- package/scripts/extract-triples.mjs +0 -207
- package/scripts/longmemeval/embedding-cache.ts +0 -77
- package/scripts/longmemeval/fetch-dataset.sh +0 -25
- package/scripts/longmemeval/run-harness.ts +0 -315
- package/scripts/longmemeval/scorer.ts +0 -99
- package/scripts/longmemeval/tsconfig.json +0 -9
- package/scripts/longmemeval/types.ts +0 -35
- package/scripts/nlm-daily-digest.py +0 -239
- package/scripts/nlm-daily-digest.sh +0 -28
- package/src/cli/classify-parity.ts +0 -257
- package/src/cli/launchctl-helpers.ts +0 -49
- package/src/cli/nlm.ts +0 -1078
- package/src/core/actions/actions-log.ts +0 -118
- package/src/core/actions/overlay.ts +0 -117
- package/src/core/adapters/aider.ts +0 -205
- package/src/core/adapters/claude-code.ts +0 -293
- package/src/core/adapters/common.ts +0 -54
- package/src/core/adapters/cursor.ts +0 -486
- package/src/core/adapters/from-source.ts +0 -67
- package/src/core/adapters/hermes-agent.ts +0 -240
- package/src/core/adapters/hermes.ts +0 -277
- package/src/core/adapters/jsonl-generic.ts +0 -208
- package/src/core/adapters/opencode.ts +0 -281
- package/src/core/adapters/pi.ts +0 -264
- package/src/core/adapters/windsurf.ts +0 -386
- package/src/core/classifier/prompt.ts +0 -200
- package/src/core/dataset/build-dataset.ts +0 -463
- package/src/core/embedding/chunk-body.ts +0 -76
- package/src/core/embedding/embed-backfill.ts +0 -210
- package/src/core/embedding/embed-normalize.ts +0 -135
- package/src/core/facts/backfill-facts.ts +0 -254
- package/src/core/facts/extract-facts.ts +0 -50
- package/src/core/hook/citation-detect.ts +0 -124
- package/src/core/hook/cite-memo.ts +0 -68
- package/src/core/hook/claude-settings.ts +0 -187
- package/src/core/hook/gate.ts +0 -25
- package/src/core/hook/hook-log.ts +0 -41
- package/src/core/hook/memo-sweep.ts +0 -164
- package/src/core/hook/memo.ts +0 -67
- package/src/core/hook/pointer-block.ts +0 -26
- package/src/core/hook/select.ts +0 -32
- package/src/core/hook/transcript.ts +0 -121
- package/src/core/ingest/ingest-session.ts +0 -111
- package/src/core/providers/provider-models.ts +0 -100
- package/src/core/providers/provider-registry.ts +0 -196
- package/src/core/recall/citation-log.ts +0 -108
- package/src/core/recall/filter.ts +0 -27
- package/src/core/recall/index.ts +0 -6
- package/src/core/recall/match-fields.ts +0 -40
- package/src/core/recall/query-log.ts +0 -149
- package/src/core/recall/query-shape.ts +0 -66
- package/src/core/recall/recall-service.ts +0 -320
- package/src/core/recall/recent-log.ts +0 -59
- package/src/core/recall/tokenize.ts +0 -18
- package/src/core/recall/useful-scan.ts +0 -336
- package/src/core/recall-facts/fact-query-log.ts +0 -150
- package/src/core/recall-facts/fact-recall-service.ts +0 -327
- package/src/core/scheduler/scan-once.ts +0 -142
- package/src/core/scheduler/scheduler.ts +0 -225
- package/src/core/sources/source-registry.ts +0 -278
- package/src/core/storage/db-restore.ts +0 -133
- package/src/core/storage/live-status.ts +0 -45
- package/src/core/storage/migrate.ts +0 -72
- package/src/core/storage/sqlite-fact-store.ts +0 -304
- package/src/core/storage/sqlite-session-store.ts +0 -810
- package/src/hook/hook-auth.ts +0 -18
- package/src/hook/prompt-recall-hook.ts +0 -180
- package/src/hook/session-end-hook.ts +0 -81
- package/src/hook/session-start-hook.ts +0 -168
- package/src/hook/stop-hook.ts +0 -239
- package/src/http/app.ts +0 -1215
- package/src/install/claude-code.ts +0 -128
- package/src/install/codex.ts +0 -367
- package/src/install/cursor.ts +0 -68
- package/src/install/hermes-agent.ts +0 -76
- package/src/install/hermes.ts +0 -78
- package/src/install/nlm-dir-perms.ts +0 -55
- package/src/install/ollama.ts +0 -284
- package/src/install/setup.ts +0 -489
- package/src/install/windsurf.ts +0 -68
- package/src/llm/classifier-box.ts +0 -64
- package/src/llm/deepseek-client.ts +0 -150
- package/src/llm/env-autoload.ts +0 -55
- package/src/llm/ollama-client.ts +0 -189
- package/src/mcp/server.ts +0 -534
- package/src/ports/fact-store.ts +0 -102
- package/src/ports/llm-client.ts +0 -52
- package/src/ports/logger.ts +0 -16
- package/src/ports/session-store.ts +0 -45
- package/src/ports/transcript-adapter.ts +0 -55
- package/src/shared/types.ts +0 -149
- package/src/ui/App.tsx +0 -58
- package/src/ui/components/PromoteOpenButton.tsx +0 -65
- package/src/ui/components/SessionDrawer.tsx +0 -199
- package/src/ui/components/SideNav.tsx +0 -162
- package/src/ui/components/Skeleton.tsx +0 -107
- package/src/ui/index.html +0 -13
- package/src/ui/lib/actions.ts +0 -30
- package/src/ui/lib/api.ts +0 -92
- package/src/ui/lib/dataset.ts +0 -141
- package/src/ui/lib/registries.ts +0 -155
- package/src/ui/lib/view-settings.ts +0 -41
- package/src/ui/main.tsx +0 -15
- package/src/ui/pages/Live.tsx +0 -229
- package/src/ui/pages/Pulse.tsx +0 -415
- package/src/ui/pages/Recall.tsx +0 -190
- package/src/ui/pages/River.tsx +0 -354
- package/src/ui/pages/Search.tsx +0 -386
- package/src/ui/pages/Stub.tsx +0 -9
- package/src/ui/pages/Thread.tsx +0 -473
- package/src/ui/pages/settings/Classifier.tsx +0 -227
- package/src/ui/pages/settings/Data.tsx +0 -190
- package/src/ui/pages/settings/Index.tsx +0 -65
- package/src/ui/pages/settings/Labels.tsx +0 -224
- package/src/ui/pages/settings/Providers.tsx +0 -305
- package/src/ui/pages/settings/SettingsSubnav.tsx +0 -28
- package/src/ui/pages/settings/Sources.tsx +0 -326
- package/src/ui/pages/settings/Views.tsx +0 -96
- package/src/ui/styles.css +0 -1890
- package/src/ui/tsconfig.json +0 -21
- package/src/ui/vite.config.ts +0 -19
- package/tests/fixtures/claude_code/short_session.jsonl +0 -2
- package/tests/fixtures/claude_code/standard_iso.jsonl +0 -4
- package/tests/fixtures/claude_code/tool_heavy.jsonl +0 -8
- package/tests/fixtures/claude_code/with_subagent.jsonl +0 -7
- package/tests/fixtures/facts.ts +0 -17
- package/tests/fixtures/golden-corpus.ts +0 -85
- package/tests/fixtures/hermes/paired_request_dump.json +0 -24
- package/tests/fixtures/hermes/paired_session.json +0 -23
- package/tests/fixtures/hermes/request_dump.json +0 -28
- package/tests/fixtures/hermes/session_iso.json +0 -38
- package/tests/fixtures/hermes/session_unix.json +0 -38
- package/tests/fixtures/hermes/system_only.json +0 -18
- package/tests/fixtures/pi/error-connection-abort.jsonl +0 -8
- package/tests/fixtures/pi/short-successful.jsonl +0 -5
- package/tests/fixtures/pi/with-custom-message.jsonl +0 -6
- package/tests/fixtures/sessions.ts +0 -22
- package/tests/integration/backfill-facts.test.ts +0 -362
- package/tests/integration/citation-explicit.test.ts +0 -111
- package/tests/integration/cite-event.test.ts +0 -169
- package/tests/integration/cite-memo.test.ts +0 -87
- package/tests/integration/db-restore.test.ts +0 -153
- package/tests/integration/embed-backfill.test.ts +0 -176
- package/tests/integration/fact-supersedence.test.ts +0 -313
- package/tests/integration/fts-index.test.ts +0 -60
- package/tests/integration/getbyids-sqlite.test.ts +0 -100
- package/tests/integration/hermes-agent-hooks.test.ts +0 -248
- package/tests/integration/hook-claude-settings.test.ts +0 -218
- package/tests/integration/hook-log.test.ts +0 -54
- package/tests/integration/hook-memo.test.ts +0 -68
- package/tests/integration/hook-pre-compact.test.ts +0 -105
- package/tests/integration/hook-subagent-start.test.ts +0 -102
- package/tests/integration/http.test.ts +0 -401
- package/tests/integration/keyword-search-fts.test.ts +0 -66
- package/tests/integration/mcp-recall-logging.test.ts +0 -88
- package/tests/integration/mcp.test.ts +0 -260
- package/tests/integration/memo-sweep.test.ts +0 -91
- package/tests/integration/prompt-recall-hook.test.ts +0 -88
- package/tests/integration/provider-registry.test.ts +0 -107
- package/tests/integration/recall-golden.test.ts +0 -59
- package/tests/integration/recall-sqlite.test.ts +0 -169
- package/tests/integration/scheduler.test.ts +0 -391
- package/tests/integration/session-end-hook.test.ts +0 -48
- package/tests/integration/session-start-hook.test.ts +0 -126
- package/tests/integration/source-registry.test.ts +0 -122
- package/tests/integration/sqlite-fact-store.test.ts +0 -346
- package/tests/integration/stop-hook.test.ts +0 -560
- package/tests/integration/wal-checkpoint.test.ts +0 -49
- package/tests/unit/cli/launchctl-helpers.test.ts +0 -60
- package/tests/unit/core/adapters/aider.test.ts +0 -230
- package/tests/unit/core/adapters/claude-code.test.ts +0 -118
- package/tests/unit/core/adapters/cursor.test.ts +0 -485
- package/tests/unit/core/adapters/hermes-agent.test.ts +0 -329
- package/tests/unit/core/adapters/hermes.test.ts +0 -81
- package/tests/unit/core/adapters/jsonl-generic.test.ts +0 -142
- package/tests/unit/core/adapters/opencode.test.ts +0 -354
- package/tests/unit/core/adapters/pi.test.ts +0 -110
- package/tests/unit/core/adapters/windsurf.test.ts +0 -416
- package/tests/unit/core/classifier/prompt.test.ts +0 -126
- package/tests/unit/core/embedding/chunk-body.test.ts +0 -100
- package/tests/unit/core/facts/extract-facts.test.ts +0 -117
- package/tests/unit/core/filter.test.ts +0 -40
- package/tests/unit/core/hook/citation-detect-cite-session.test.ts +0 -96
- package/tests/unit/core/hook/citation-detect.test.ts +0 -124
- package/tests/unit/core/hook/gate.test.ts +0 -29
- package/tests/unit/core/hook/pointer-block.test.ts +0 -22
- package/tests/unit/core/hook/select.test.ts +0 -66
- package/tests/unit/core/match-fields.test.ts +0 -39
- package/tests/unit/core/mcp-cite-session.test.ts +0 -51
- package/tests/unit/core/providers/provider-models.test.ts +0 -101
- package/tests/unit/core/query-shape.test.ts +0 -92
- package/tests/unit/core/recall-facts/fact-recall-service.test.ts +0 -258
- package/tests/unit/core/recall-service.test.ts +0 -200
- package/tests/unit/core/storage/live-status.test.ts +0 -54
- package/tests/unit/core/tokenize.test.ts +0 -32
- package/tests/unit/core/useful-scan.test.ts +0 -537
- package/tests/unit/llm/embed.test.ts +0 -93
- package/tests/unit/llm/ollama-client.test.ts +0 -124
- package/tests/unit/scripts/longmemeval-scorer.test.ts +0 -114
- package/tsconfig.json +0 -31
- package/tsconfig.test.json +0 -11
- package/vitest.config.ts +0 -22
|
@@ -1,93 +0,0 @@
|
|
|
1
|
-
/**
|
|
2
|
-
* Unit tests for OllamaClient.embed: nomic prefix scheme, L2 normalization,
|
|
3
|
-
* 8K char truncation. These guard the nomic-embed-text v1.5 contract.
|
|
4
|
-
*/
|
|
5
|
-
|
|
6
|
-
import { describe, expect, it } from "vitest";
|
|
7
|
-
import { OllamaClient, l2Normalize } from "../../../src/llm/ollama-client.js";
|
|
8
|
-
|
|
9
|
-
type FakeFetch = typeof fetch;
|
|
10
|
-
|
|
11
|
-
function jsonResponse(body: unknown): Response {
|
|
12
|
-
return new Response(JSON.stringify(body), {
|
|
13
|
-
status: 200,
|
|
14
|
-
headers: { "content-type": "application/json" },
|
|
15
|
-
});
|
|
16
|
-
}
|
|
17
|
-
|
|
18
|
-
function makeFetch(reply: (req: { url: string; body: unknown }) => Response): FakeFetch {
|
|
19
|
-
return (async (input: string | URL | Request, init?: RequestInit) => {
|
|
20
|
-
const url = typeof input === "string" ? input : input.toString();
|
|
21
|
-
const body = init?.body ? JSON.parse(init.body.toString()) : null;
|
|
22
|
-
return reply({ url, body });
|
|
23
|
-
}) as FakeFetch;
|
|
24
|
-
}
|
|
25
|
-
|
|
26
|
-
describe("OllamaClient.embed prefix scheme", () => {
|
|
27
|
-
it("prefixes a query call with 'search_query: '", async () => {
|
|
28
|
-
let prompt = "";
|
|
29
|
-
const fetchImpl = makeFetch(({ body }) => {
|
|
30
|
-
prompt = (body as { prompt: string }).prompt;
|
|
31
|
-
return jsonResponse({ embedding: [1, 0, 0] });
|
|
32
|
-
});
|
|
33
|
-
const client = new OllamaClient({ fetchImpl });
|
|
34
|
-
await client.embed("what did we decide about pgvector", "query");
|
|
35
|
-
expect(prompt.startsWith("search_query: ")).toBe(true);
|
|
36
|
-
expect(prompt).toContain("pgvector");
|
|
37
|
-
});
|
|
38
|
-
|
|
39
|
-
it("prefixes a document call with 'search_document: '", async () => {
|
|
40
|
-
let prompt = "";
|
|
41
|
-
const fetchImpl = makeFetch(({ body }) => {
|
|
42
|
-
prompt = (body as { prompt: string }).prompt;
|
|
43
|
-
return jsonResponse({ embedding: [1, 0, 0] });
|
|
44
|
-
});
|
|
45
|
-
const client = new OllamaClient({ fetchImpl });
|
|
46
|
-
await client.embed("session body text", "document");
|
|
47
|
-
expect(prompt.startsWith("search_document: ")).toBe(true);
|
|
48
|
-
});
|
|
49
|
-
|
|
50
|
-
it("truncates text to MAX_EMBED_CHARS (8000) before prefixing", async () => {
|
|
51
|
-
let prompt = "";
|
|
52
|
-
const fetchImpl = makeFetch(({ body }) => {
|
|
53
|
-
prompt = (body as { prompt: string }).prompt;
|
|
54
|
-
return jsonResponse({ embedding: [1, 0, 0] });
|
|
55
|
-
});
|
|
56
|
-
const client = new OllamaClient({ fetchImpl });
|
|
57
|
-
const big = "x".repeat(10_000);
|
|
58
|
-
await client.embed(big, "document");
|
|
59
|
-
// prompt = "search_document: " + truncated → prefix is 17 chars, body capped at 8000.
|
|
60
|
-
// Briefly raised to 28000 on 2026-05-25 then reverted same day; nomic-
|
|
61
|
-
// embed-text via Ollama 500s on inputs near the nominal 8192-token
|
|
62
|
-
// context. Real fix is chunk + max-pool (filed as #174).
|
|
63
|
-
expect(prompt.length).toBe(17 + 8_000);
|
|
64
|
-
});
|
|
65
|
-
|
|
66
|
-
it("L2-normalizes the returned vector", async () => {
|
|
67
|
-
const fetchImpl = makeFetch(() => jsonResponse({ embedding: [3, 4, 0] }));
|
|
68
|
-
const client = new OllamaClient({ fetchImpl });
|
|
69
|
-
const { vector } = await client.embed("anything", "document");
|
|
70
|
-
// raw norm = 5; normalized should be [0.6, 0.8, 0]
|
|
71
|
-
expect(vector[0]).toBeCloseTo(0.6, 6);
|
|
72
|
-
expect(vector[1]).toBeCloseTo(0.8, 6);
|
|
73
|
-
expect(vector[2]).toBe(0);
|
|
74
|
-
let norm = 0;
|
|
75
|
-
for (const v of vector) norm += v * v;
|
|
76
|
-
expect(Math.sqrt(norm)).toBeCloseTo(1, 6);
|
|
77
|
-
});
|
|
78
|
-
});
|
|
79
|
-
|
|
80
|
-
describe("l2Normalize", () => {
|
|
81
|
-
it("returns a unit vector for a non-zero input", () => {
|
|
82
|
-
const out = l2Normalize(new Float32Array([3, 4, 0]));
|
|
83
|
-
let sum = 0;
|
|
84
|
-
for (const v of out) sum += v * v;
|
|
85
|
-
expect(Math.sqrt(sum)).toBeCloseTo(1, 6);
|
|
86
|
-
});
|
|
87
|
-
|
|
88
|
-
it("returns the zero vector unchanged", () => {
|
|
89
|
-
const zero = new Float32Array([0, 0, 0]);
|
|
90
|
-
const out = l2Normalize(zero);
|
|
91
|
-
expect(Array.from(out)).toEqual([0, 0, 0]);
|
|
92
|
-
});
|
|
93
|
-
});
|
|
@@ -1,124 +0,0 @@
|
|
|
1
|
-
/**
|
|
2
|
-
* Unit tests for OllamaClient.classify against an injected fake fetch.
|
|
3
|
-
* No network. Verifies prompt construction, JSON-mode handling, schema
|
|
4
|
-
* validation, fence stripping, and error mapping.
|
|
5
|
-
*/
|
|
6
|
-
|
|
7
|
-
import { describe, expect, it } from "vitest";
|
|
8
|
-
import { OllamaClient, ClassifierSchemaError } from "../../../src/llm/ollama-client.js";
|
|
9
|
-
import { LLMUnreachableError } from "../../../src/ports/llm-client.js";
|
|
10
|
-
|
|
11
|
-
type FakeFetch = typeof fetch;
|
|
12
|
-
|
|
13
|
-
function jsonResponse(body: unknown, init: ResponseInit = {}): Response {
|
|
14
|
-
return new Response(JSON.stringify(body), {
|
|
15
|
-
status: init.status ?? 200,
|
|
16
|
-
headers: { "content-type": "application/json" },
|
|
17
|
-
});
|
|
18
|
-
}
|
|
19
|
-
|
|
20
|
-
function makeFetch(reply: (req: { url: string; body: unknown }) => Response | Promise<Response>): FakeFetch {
|
|
21
|
-
return (async (input: string | URL | Request, init?: RequestInit) => {
|
|
22
|
-
const url = typeof input === "string" ? input : input.toString();
|
|
23
|
-
const body = init?.body ? JSON.parse(init.body.toString()) : null;
|
|
24
|
-
return reply({ url, body });
|
|
25
|
-
}) as FakeFetch;
|
|
26
|
-
}
|
|
27
|
-
|
|
28
|
-
const VALID_PAYLOAD = {
|
|
29
|
-
label: "Phase C classifier port",
|
|
30
|
-
summary: "Built OllamaClient.classify with JSON-mode and schema validation against the shared prompt module.",
|
|
31
|
-
entities: ["NLM", "Ollama", "OllamaClient"],
|
|
32
|
-
decisions: ["Map schema-invalid output to a typed ClassifierSchemaError instead of returning null"],
|
|
33
|
-
open: ["Whether to retry once on schema failure or send to inbox immediately"],
|
|
34
|
-
confidence: 0.85,
|
|
35
|
-
};
|
|
36
|
-
|
|
37
|
-
describe("OllamaClient.classify", () => {
|
|
38
|
-
it("parses a valid JSON payload through the Ollama chat envelope", async () => {
|
|
39
|
-
const fetchImpl = makeFetch(({ url, body }) => {
|
|
40
|
-
expect(url).toContain("/api/chat");
|
|
41
|
-
const b = body as { model: string; messages: { role: string; content: string }[]; format: string };
|
|
42
|
-
expect(b.format).toBe("json");
|
|
43
|
-
expect(b.messages[0]?.role).toBe("system");
|
|
44
|
-
expect(b.messages[0]?.content).toContain("session classifier");
|
|
45
|
-
expect(b.messages[1]?.content).toContain("TRANSCRIPT TO CLASSIFY");
|
|
46
|
-
return jsonResponse({ message: { content: JSON.stringify(VALID_PAYLOAD) } });
|
|
47
|
-
});
|
|
48
|
-
const client = new OllamaClient({ fetchImpl });
|
|
49
|
-
const result = await client.classify("user: build the classifier\nassistant: done");
|
|
50
|
-
expect(result.label).toBe(VALID_PAYLOAD.label);
|
|
51
|
-
expect(result.entities).toEqual(VALID_PAYLOAD.entities);
|
|
52
|
-
expect(result.decisions).toHaveLength(1);
|
|
53
|
-
expect(result.confidence).toBeCloseTo(0.85);
|
|
54
|
-
});
|
|
55
|
-
|
|
56
|
-
it("threads priorContext into the user prompt when supplied", async () => {
|
|
57
|
-
let userContent = "";
|
|
58
|
-
const fetchImpl = makeFetch(({ body }) => {
|
|
59
|
-
const b = body as { messages: { role: string; content: string }[] };
|
|
60
|
-
userContent = b.messages[1]?.content ?? "";
|
|
61
|
-
return jsonResponse({ message: { content: JSON.stringify(VALID_PAYLOAD) } });
|
|
62
|
-
});
|
|
63
|
-
const client = new OllamaClient({ fetchImpl });
|
|
64
|
-
await client.classify("...transcript...", "earlier session about Hono routing");
|
|
65
|
-
expect(userContent).toContain("PRIOR CONTEXT (already filed):");
|
|
66
|
-
expect(userContent).toContain("earlier session about Hono routing");
|
|
67
|
-
});
|
|
68
|
-
|
|
69
|
-
it("strips markdown fences before JSON parse", async () => {
|
|
70
|
-
const fenced = "```json\n" + JSON.stringify(VALID_PAYLOAD) + "\n```";
|
|
71
|
-
const fetchImpl = makeFetch(() =>
|
|
72
|
-
jsonResponse({ message: { content: fenced } }),
|
|
73
|
-
);
|
|
74
|
-
const client = new OllamaClient({ fetchImpl });
|
|
75
|
-
const result = await client.classify("transcript");
|
|
76
|
-
expect(result.label).toBe(VALID_PAYLOAD.label);
|
|
77
|
-
});
|
|
78
|
-
|
|
79
|
-
it("throws ClassifierSchemaError when required keys are missing", async () => {
|
|
80
|
-
const bad = { label: "x", summary: "y" };
|
|
81
|
-
const fetchImpl = makeFetch(() =>
|
|
82
|
-
jsonResponse({ message: { content: JSON.stringify(bad) } }),
|
|
83
|
-
);
|
|
84
|
-
const client = new OllamaClient({ fetchImpl });
|
|
85
|
-
await expect(client.classify("transcript")).rejects.toBeInstanceOf(ClassifierSchemaError);
|
|
86
|
-
});
|
|
87
|
-
|
|
88
|
-
it("throws ClassifierSchemaError when the model returns non-JSON", async () => {
|
|
89
|
-
const fetchImpl = makeFetch(() =>
|
|
90
|
-
jsonResponse({ message: { content: "not even close to json" } }),
|
|
91
|
-
);
|
|
92
|
-
const client = new OllamaClient({ fetchImpl });
|
|
93
|
-
await expect(client.classify("transcript")).rejects.toBeInstanceOf(ClassifierSchemaError);
|
|
94
|
-
});
|
|
95
|
-
|
|
96
|
-
it("maps non-200 HTTP responses to LLMUnreachableError", async () => {
|
|
97
|
-
const fetchImpl = makeFetch(() =>
|
|
98
|
-
new Response("server down", { status: 503 }),
|
|
99
|
-
);
|
|
100
|
-
const client = new OllamaClient({ fetchImpl });
|
|
101
|
-
await expect(client.classify("transcript")).rejects.toBeInstanceOf(LLMUnreachableError);
|
|
102
|
-
});
|
|
103
|
-
|
|
104
|
-
it("maps network throws to LLMUnreachableError", async () => {
|
|
105
|
-
const fetchImpl = (async () => {
|
|
106
|
-
throw new TypeError("ECONNREFUSED");
|
|
107
|
-
}) as FakeFetch;
|
|
108
|
-
const client = new OllamaClient({ fetchImpl });
|
|
109
|
-
await expect(client.classify("transcript")).rejects.toBeInstanceOf(LLMUnreachableError);
|
|
110
|
-
});
|
|
111
|
-
|
|
112
|
-
it("coerces non-string entities to strings and trims whitespace", async () => {
|
|
113
|
-
const messy = {
|
|
114
|
-
...VALID_PAYLOAD,
|
|
115
|
-
entities: [" n8n ", " ", "Qdrant", 42],
|
|
116
|
-
};
|
|
117
|
-
const fetchImpl = makeFetch(() =>
|
|
118
|
-
jsonResponse({ message: { content: JSON.stringify(messy) } }),
|
|
119
|
-
);
|
|
120
|
-
const client = new OllamaClient({ fetchImpl });
|
|
121
|
-
const result = await client.classify("transcript");
|
|
122
|
-
expect(result.entities).toEqual(["n8n", "Qdrant", "42"]);
|
|
123
|
-
});
|
|
124
|
-
});
|
|
@@ -1,114 +0,0 @@
|
|
|
1
|
-
import { describe, expect, it } from "vitest";
|
|
2
|
-
import {
|
|
3
|
-
aggregate,
|
|
4
|
-
scoreOne,
|
|
5
|
-
} from "../../../scripts/longmemeval/scorer.js";
|
|
6
|
-
|
|
7
|
-
describe("scoreOne", () => {
|
|
8
|
-
it("recallAtK=1 when a gold id is in the top-k", () => {
|
|
9
|
-
const r = scoreOne({
|
|
10
|
-
returnedIds: ["a", "b", "gold-1", "d", "e"],
|
|
11
|
-
goldIds: ["gold-1", "gold-2"],
|
|
12
|
-
returnedBodies: ["", "", "", "", ""],
|
|
13
|
-
answer: "anything",
|
|
14
|
-
k: 5,
|
|
15
|
-
});
|
|
16
|
-
expect(r.recallAtK).toBe(1);
|
|
17
|
-
});
|
|
18
|
-
|
|
19
|
-
it("recallAtK=0 when no gold id appears in the top-k", () => {
|
|
20
|
-
const r = scoreOne({
|
|
21
|
-
returnedIds: ["a", "b", "c", "d", "e"],
|
|
22
|
-
goldIds: ["gold-1"],
|
|
23
|
-
returnedBodies: ["", "", "", "", ""],
|
|
24
|
-
answer: "z",
|
|
25
|
-
k: 5,
|
|
26
|
-
});
|
|
27
|
-
expect(r.recallAtK).toBe(0);
|
|
28
|
-
});
|
|
29
|
-
|
|
30
|
-
it("recallAtK respects k=3 ceiling even when gold is at position 4", () => {
|
|
31
|
-
const r = scoreOne({
|
|
32
|
-
returnedIds: ["a", "b", "c", "gold-1", "e"],
|
|
33
|
-
goldIds: ["gold-1"],
|
|
34
|
-
returnedBodies: [],
|
|
35
|
-
answer: "z",
|
|
36
|
-
k: 3,
|
|
37
|
-
});
|
|
38
|
-
expect(r.recallAtK).toBe(0);
|
|
39
|
-
});
|
|
40
|
-
|
|
41
|
-
it("sessionBodyHit=1 when answer substring appears in any returned body (case/whitespace insensitive)", () => {
|
|
42
|
-
const r = scoreOne({
|
|
43
|
-
returnedIds: ["a", "b"],
|
|
44
|
-
goldIds: ["gold"],
|
|
45
|
-
returnedBodies: [
|
|
46
|
-
"irrelevant transcript content",
|
|
47
|
-
"User: Where did you grow up?\nAssistant: I grew up in Austin, Texas.",
|
|
48
|
-
],
|
|
49
|
-
answer: "austin texas",
|
|
50
|
-
k: 5,
|
|
51
|
-
});
|
|
52
|
-
expect(r.sessionBodyHit).toBe(1);
|
|
53
|
-
});
|
|
54
|
-
|
|
55
|
-
it("sessionBodyHit=0 when answer is absent from all returned bodies", () => {
|
|
56
|
-
const r = scoreOne({
|
|
57
|
-
returnedIds: ["a"],
|
|
58
|
-
goldIds: ["gold"],
|
|
59
|
-
returnedBodies: ["nothing matches here"],
|
|
60
|
-
answer: "Houston",
|
|
61
|
-
k: 5,
|
|
62
|
-
});
|
|
63
|
-
expect(r.sessionBodyHit).toBe(0);
|
|
64
|
-
});
|
|
65
|
-
|
|
66
|
-
it("coerces a numeric answer to string and matches with word boundaries", () => {
|
|
67
|
-
const hit = scoreOne({
|
|
68
|
-
returnedIds: ["a"],
|
|
69
|
-
goldIds: ["gold"],
|
|
70
|
-
returnedBodies: ["The user mentioned 3 brothers in the conversation."],
|
|
71
|
-
answer: 3,
|
|
72
|
-
k: 5,
|
|
73
|
-
});
|
|
74
|
-
expect(hit.sessionBodyHit).toBe(1);
|
|
75
|
-
|
|
76
|
-
const miss = scoreOne({
|
|
77
|
-
returnedIds: ["a"],
|
|
78
|
-
goldIds: ["gold"],
|
|
79
|
-
returnedBodies: ["They paid $30 for the meal and tipped 20%."],
|
|
80
|
-
answer: 3,
|
|
81
|
-
k: 5,
|
|
82
|
-
});
|
|
83
|
-
expect(miss.sessionBodyHit).toBe(0);
|
|
84
|
-
});
|
|
85
|
-
|
|
86
|
-
it("sessionBodyHit=0 when answer is empty", () => {
|
|
87
|
-
const r = scoreOne({
|
|
88
|
-
returnedIds: ["a"],
|
|
89
|
-
goldIds: ["gold"],
|
|
90
|
-
returnedBodies: ["whatever"],
|
|
91
|
-
answer: "",
|
|
92
|
-
k: 5,
|
|
93
|
-
});
|
|
94
|
-
expect(r.sessionBodyHit).toBe(0);
|
|
95
|
-
});
|
|
96
|
-
});
|
|
97
|
-
|
|
98
|
-
describe("aggregate", () => {
|
|
99
|
-
it("computes mean rates rounded to 3 decimal places", () => {
|
|
100
|
-
const a = aggregate([
|
|
101
|
-
{ recallAtK: 1, sessionBodyHit: 1 },
|
|
102
|
-
{ recallAtK: 0, sessionBodyHit: 1 },
|
|
103
|
-
{ recallAtK: 1, sessionBodyHit: 0 },
|
|
104
|
-
]);
|
|
105
|
-
expect(a.n).toBe(3);
|
|
106
|
-
expect(a.recallAtK).toBeCloseTo(0.667, 3);
|
|
107
|
-
expect(a.sessionBodyHitRate).toBeCloseTo(0.667, 3);
|
|
108
|
-
});
|
|
109
|
-
|
|
110
|
-
it("returns zeros for empty input", () => {
|
|
111
|
-
const a = aggregate([]);
|
|
112
|
-
expect(a).toEqual({ n: 0, recallAtK: 0, sessionBodyHitRate: 0 });
|
|
113
|
-
});
|
|
114
|
-
});
|
package/tsconfig.json
DELETED
|
@@ -1,31 +0,0 @@
|
|
|
1
|
-
{
|
|
2
|
-
"compilerOptions": {
|
|
3
|
-
"target": "ES2022",
|
|
4
|
-
"module": "NodeNext",
|
|
5
|
-
"moduleResolution": "NodeNext",
|
|
6
|
-
"lib": ["ES2022"],
|
|
7
|
-
"outDir": "dist",
|
|
8
|
-
"rootDir": "src",
|
|
9
|
-
"strict": true,
|
|
10
|
-
"noUncheckedIndexedAccess": true,
|
|
11
|
-
"exactOptionalPropertyTypes": true,
|
|
12
|
-
"noImplicitOverride": true,
|
|
13
|
-
"noFallthroughCasesInSwitch": true,
|
|
14
|
-
"forceConsistentCasingInFileNames": true,
|
|
15
|
-
"esModuleInterop": true,
|
|
16
|
-
"skipLibCheck": true,
|
|
17
|
-
"declaration": true,
|
|
18
|
-
"sourceMap": true,
|
|
19
|
-
"resolveJsonModule": true,
|
|
20
|
-
"isolatedModules": true,
|
|
21
|
-
"verbatimModuleSyntax": true,
|
|
22
|
-
"baseUrl": "src",
|
|
23
|
-
"paths": {
|
|
24
|
-
"@core/*": ["./core/*"],
|
|
25
|
-
"@ports/*": ["./ports/*"],
|
|
26
|
-
"@shared/*": ["./shared/*"]
|
|
27
|
-
}
|
|
28
|
-
},
|
|
29
|
-
"include": ["src/**/*.ts"],
|
|
30
|
-
"exclude": ["node_modules", "dist", "src/ui"]
|
|
31
|
-
}
|
package/tsconfig.test.json
DELETED
package/vitest.config.ts
DELETED
|
@@ -1,22 +0,0 @@
|
|
|
1
|
-
import { defineConfig } from "vitest/config";
|
|
2
|
-
import { fileURLToPath } from "node:url";
|
|
3
|
-
|
|
4
|
-
export default defineConfig({
|
|
5
|
-
test: {
|
|
6
|
-
globals: false,
|
|
7
|
-
environment: "node",
|
|
8
|
-
include: ["tests/**/*.test.ts"],
|
|
9
|
-
coverage: {
|
|
10
|
-
provider: "v8",
|
|
11
|
-
include: ["src/core/**", "src/ports/**"],
|
|
12
|
-
reporter: ["text", "html"],
|
|
13
|
-
},
|
|
14
|
-
},
|
|
15
|
-
resolve: {
|
|
16
|
-
alias: {
|
|
17
|
-
"@core": fileURLToPath(new URL("./src/core", import.meta.url)),
|
|
18
|
-
"@ports": fileURLToPath(new URL("./src/ports", import.meta.url)),
|
|
19
|
-
"@shared": fileURLToPath(new URL("./src/shared", import.meta.url)),
|
|
20
|
-
},
|
|
21
|
-
},
|
|
22
|
-
});
|