nlm-memory 0.4.2 → 0.5.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +72 -34
- package/dist/cli/nlm.js +223 -33
- package/dist/cli/nlm.js.map +1 -1
- package/dist/core/adapters/cursor.d.ts +45 -0
- package/dist/core/adapters/cursor.js +397 -0
- package/dist/core/adapters/cursor.js.map +1 -0
- package/dist/core/adapters/from-source.js +10 -0
- package/dist/core/adapters/from-source.js.map +1 -1
- package/dist/core/adapters/windsurf.d.ts +44 -0
- package/dist/core/adapters/windsurf.js +299 -0
- package/dist/core/adapters/windsurf.js.map +1 -0
- package/dist/core/hook/claude-settings.d.ts +12 -5
- package/dist/core/hook/claude-settings.js +21 -6
- package/dist/core/hook/claude-settings.js.map +1 -1
- package/dist/core/sources/source-registry.d.ts +1 -1
- package/dist/core/sources/source-registry.js +18 -0
- package/dist/core/sources/source-registry.js.map +1 -1
- package/dist/core/storage/sqlite-session-store.d.ts +2 -0
- package/dist/core/storage/sqlite-session-store.js +38 -2
- package/dist/core/storage/sqlite-session-store.js.map +1 -1
- package/dist/hook/hook-auth.d.ts +13 -0
- package/dist/hook/hook-auth.js +19 -0
- package/dist/hook/hook-auth.js.map +1 -0
- package/dist/hook/prompt-recall-hook.js +7 -1
- package/dist/hook/prompt-recall-hook.js.map +1 -1
- package/dist/hook/session-start-hook.js +4 -1
- package/dist/hook/session-start-hook.js.map +1 -1
- package/dist/hook/stop-hook.js +4 -1
- package/dist/hook/stop-hook.js.map +1 -1
- package/dist/http/app.d.ts +2 -0
- package/dist/http/app.js +76 -1
- package/dist/http/app.js.map +1 -1
- package/dist/install/claude-code.js +1 -1
- package/dist/install/claude-code.js.map +1 -1
- package/dist/install/cursor.d.ts +25 -0
- package/dist/install/cursor.js +43 -0
- package/dist/install/cursor.js.map +1 -0
- package/dist/install/nlm-dir-perms.d.ts +19 -0
- package/dist/install/nlm-dir-perms.js +43 -0
- package/dist/install/nlm-dir-perms.js.map +1 -0
- package/dist/install/ollama.d.ts +18 -1
- package/dist/install/ollama.js +62 -7
- package/dist/install/ollama.js.map +1 -1
- package/dist/install/setup.d.ts +4 -0
- package/dist/install/setup.js +141 -18
- package/dist/install/setup.js.map +1 -1
- package/dist/install/windsurf.d.ts +25 -0
- package/dist/install/windsurf.js +43 -0
- package/dist/install/windsurf.js.map +1 -0
- package/dist/mcp/server.js +20 -1
- package/dist/mcp/server.js.map +1 -1
- package/dist/shared/types.d.ts +4 -0
- package/dist/ui/assets/{index-BA6IpU8g.css → index-Beo8psd-.css} +1 -1
- package/dist/ui/assets/index-CSPTTeeM.js +69 -0
- package/dist/ui/index.html +2 -2
- package/package.json +26 -1
- package/plugin/scripts/prompt-recall-hook.mjs +55 -4
- package/plugin/scripts/stop-hook.mjs +57 -6
- package/.agents/plugins/marketplace.json +0 -20
- package/.github/workflows/ci.yml +0 -30
- package/dist/ui/assets/index-B_qIVV0k.js +0 -69
- package/docs/methodology/re-derivation-rate.md +0 -112
- package/docs/methodology/useful-hit-rate.md +0 -79
- package/docs/plans/2026-05-20-fts5-lexical-recall.md +0 -1088
- package/docs/plans/2026-05-20-recall-daemon-wedge-fix.md +0 -662
- package/docs/plans/2026-05-20-recall-hook-design.md +0 -131
- package/docs/plans/2026-05-20-recall-hook-implementation.md +0 -1222
- package/docs/plans/desktop-product.md +0 -69
- package/docs/plans/factstore-design.md +0 -236
- package/logs/CHANGELOG/CHANGELOG-2026.md +0 -1389
- package/logs/CHANGELOG/CHANGELOG.md +0 -337
- package/migrations/000_initial_schema.sql +0 -174
- package/migrations/001_entity_type_rename.sql +0 -17
- package/migrations/002_adapter_state_extend.sql +0 -12
- package/migrations/003_session_embeddings.sql +0 -11
- package/migrations/004_facts.sql +0 -46
- package/migrations/005_sources.sql +0 -31
- package/migrations/006_providers.sql +0 -33
- package/migrations/007_source_tokens.sql +0 -17
- package/migrations/008_fts_rebuild.sql +0 -9
- package/migrations/009_session_embedding_chunks.sql +0 -46
- package/migrations/010_sources_opencode.sql +0 -30
- package/migrations/011_sources_hermes_agent.sql +0 -30
- package/migrations/012_sources_aider.sql +0 -30
- package/migrations/013_adapter_state_failure_count.sql +0 -12
- package/plugin-hermes-agent/README.md +0 -49
- package/plugin-hermes-agent/__init__.py +0 -75
- package/plugin-hermes-agent/plugin.yaml +0 -15
- package/scripts/backfill-citations.mjs +0 -0
- package/scripts/build-codex-plugin.mjs +0 -61
- package/scripts/deepseek-probe.mjs +0 -67
- package/scripts/extract-triples.mjs +0 -207
- package/scripts/longmemeval/embedding-cache.ts +0 -77
- package/scripts/longmemeval/fetch-dataset.sh +0 -25
- package/scripts/longmemeval/run-harness.ts +0 -315
- package/scripts/longmemeval/scorer.ts +0 -99
- package/scripts/longmemeval/tsconfig.json +0 -9
- package/scripts/longmemeval/types.ts +0 -35
- package/scripts/nlm-daily-digest.py +0 -239
- package/scripts/nlm-daily-digest.sh +0 -28
- package/src/cli/classify-parity.ts +0 -257
- package/src/cli/launchctl-helpers.ts +0 -49
- package/src/cli/nlm.ts +0 -885
- package/src/core/actions/actions-log.ts +0 -118
- package/src/core/actions/overlay.ts +0 -117
- package/src/core/adapters/aider.ts +0 -205
- package/src/core/adapters/claude-code.ts +0 -293
- package/src/core/adapters/common.ts +0 -54
- package/src/core/adapters/from-source.ts +0 -57
- package/src/core/adapters/hermes-agent.ts +0 -240
- package/src/core/adapters/hermes.ts +0 -277
- package/src/core/adapters/jsonl-generic.ts +0 -208
- package/src/core/adapters/opencode.ts +0 -281
- package/src/core/adapters/pi.ts +0 -264
- package/src/core/classifier/prompt.ts +0 -200
- package/src/core/dataset/build-dataset.ts +0 -463
- package/src/core/embedding/chunk-body.ts +0 -76
- package/src/core/embedding/embed-backfill.ts +0 -210
- package/src/core/embedding/embed-normalize.ts +0 -135
- package/src/core/facts/backfill-facts.ts +0 -254
- package/src/core/facts/extract-facts.ts +0 -50
- package/src/core/hook/citation-detect.ts +0 -124
- package/src/core/hook/cite-memo.ts +0 -68
- package/src/core/hook/claude-settings.ts +0 -166
- package/src/core/hook/gate.ts +0 -25
- package/src/core/hook/hook-log.ts +0 -41
- package/src/core/hook/memo-sweep.ts +0 -164
- package/src/core/hook/memo.ts +0 -67
- package/src/core/hook/pointer-block.ts +0 -26
- package/src/core/hook/select.ts +0 -32
- package/src/core/hook/transcript.ts +0 -121
- package/src/core/ingest/ingest-session.ts +0 -111
- package/src/core/providers/provider-models.ts +0 -100
- package/src/core/providers/provider-registry.ts +0 -196
- package/src/core/recall/citation-log.ts +0 -108
- package/src/core/recall/filter.ts +0 -27
- package/src/core/recall/index.ts +0 -6
- package/src/core/recall/match-fields.ts +0 -40
- package/src/core/recall/query-log.ts +0 -149
- package/src/core/recall/query-shape.ts +0 -66
- package/src/core/recall/recall-service.ts +0 -320
- package/src/core/recall/recent-log.ts +0 -59
- package/src/core/recall/tokenize.ts +0 -18
- package/src/core/recall/useful-scan.ts +0 -336
- package/src/core/recall-facts/fact-query-log.ts +0 -150
- package/src/core/recall-facts/fact-recall-service.ts +0 -327
- package/src/core/scheduler/scan-once.ts +0 -142
- package/src/core/scheduler/scheduler.ts +0 -225
- package/src/core/sources/source-registry.ts +0 -260
- package/src/core/storage/db-restore.ts +0 -133
- package/src/core/storage/live-status.ts +0 -45
- package/src/core/storage/migrate.ts +0 -72
- package/src/core/storage/sqlite-fact-store.ts +0 -304
- package/src/core/storage/sqlite-session-store.ts +0 -765
- package/src/hook/prompt-recall-hook.ts +0 -174
- package/src/hook/session-end-hook.ts +0 -81
- package/src/hook/session-start-hook.ts +0 -165
- package/src/hook/stop-hook.ts +0 -236
- package/src/http/app.ts +0 -1137
- package/src/install/claude-code.ts +0 -128
- package/src/install/codex.ts +0 -367
- package/src/install/hermes-agent.ts +0 -76
- package/src/install/hermes.ts +0 -78
- package/src/install/ollama.ts +0 -211
- package/src/install/setup.ts +0 -368
- package/src/llm/classifier-box.ts +0 -64
- package/src/llm/deepseek-client.ts +0 -150
- package/src/llm/env-autoload.ts +0 -55
- package/src/llm/ollama-client.ts +0 -189
- package/src/mcp/server.ts +0 -534
- package/src/ports/fact-store.ts +0 -102
- package/src/ports/llm-client.ts +0 -52
- package/src/ports/logger.ts +0 -16
- package/src/ports/session-store.ts +0 -45
- package/src/ports/transcript-adapter.ts +0 -55
- package/src/shared/types.ts +0 -145
- package/src/ui/App.tsx +0 -58
- package/src/ui/components/PromoteOpenButton.tsx +0 -65
- package/src/ui/components/SessionDrawer.tsx +0 -136
- package/src/ui/components/SideNav.tsx +0 -162
- package/src/ui/components/Skeleton.tsx +0 -107
- package/src/ui/index.html +0 -13
- package/src/ui/lib/actions.ts +0 -30
- package/src/ui/lib/api.ts +0 -92
- package/src/ui/lib/dataset.ts +0 -141
- package/src/ui/lib/registries.ts +0 -155
- package/src/ui/lib/view-settings.ts +0 -41
- package/src/ui/main.tsx +0 -15
- package/src/ui/pages/Live.tsx +0 -229
- package/src/ui/pages/Pulse.tsx +0 -415
- package/src/ui/pages/Recall.tsx +0 -190
- package/src/ui/pages/River.tsx +0 -308
- package/src/ui/pages/Search.tsx +0 -93
- package/src/ui/pages/Stub.tsx +0 -9
- package/src/ui/pages/Thread.tsx +0 -262
- package/src/ui/pages/settings/Classifier.tsx +0 -227
- package/src/ui/pages/settings/Data.tsx +0 -190
- package/src/ui/pages/settings/Index.tsx +0 -65
- package/src/ui/pages/settings/Labels.tsx +0 -224
- package/src/ui/pages/settings/Providers.tsx +0 -305
- package/src/ui/pages/settings/SettingsSubnav.tsx +0 -28
- package/src/ui/pages/settings/Sources.tsx +0 -326
- package/src/ui/pages/settings/Views.tsx +0 -96
- package/src/ui/styles.css +0 -1766
- package/src/ui/tsconfig.json +0 -21
- package/src/ui/vite.config.ts +0 -19
- package/tests/fixtures/claude_code/short_session.jsonl +0 -2
- package/tests/fixtures/claude_code/standard_iso.jsonl +0 -4
- package/tests/fixtures/claude_code/tool_heavy.jsonl +0 -8
- package/tests/fixtures/claude_code/with_subagent.jsonl +0 -7
- package/tests/fixtures/facts.ts +0 -17
- package/tests/fixtures/golden-corpus.ts +0 -85
- package/tests/fixtures/hermes/paired_request_dump.json +0 -24
- package/tests/fixtures/hermes/paired_session.json +0 -23
- package/tests/fixtures/hermes/request_dump.json +0 -28
- package/tests/fixtures/hermes/session_iso.json +0 -38
- package/tests/fixtures/hermes/session_unix.json +0 -38
- package/tests/fixtures/hermes/system_only.json +0 -18
- package/tests/fixtures/pi/error-connection-abort.jsonl +0 -8
- package/tests/fixtures/pi/short-successful.jsonl +0 -5
- package/tests/fixtures/pi/with-custom-message.jsonl +0 -6
- package/tests/fixtures/sessions.ts +0 -22
- package/tests/integration/backfill-facts.test.ts +0 -362
- package/tests/integration/citation-explicit.test.ts +0 -111
- package/tests/integration/cite-event.test.ts +0 -169
- package/tests/integration/cite-memo.test.ts +0 -87
- package/tests/integration/db-restore.test.ts +0 -153
- package/tests/integration/embed-backfill.test.ts +0 -176
- package/tests/integration/fact-supersedence.test.ts +0 -313
- package/tests/integration/fts-index.test.ts +0 -60
- package/tests/integration/getbyids-sqlite.test.ts +0 -60
- package/tests/integration/hermes-agent-hooks.test.ts +0 -248
- package/tests/integration/hook-claude-settings.test.ts +0 -205
- package/tests/integration/hook-log.test.ts +0 -54
- package/tests/integration/hook-memo.test.ts +0 -68
- package/tests/integration/hook-pre-compact.test.ts +0 -105
- package/tests/integration/hook-subagent-start.test.ts +0 -102
- package/tests/integration/http.test.ts +0 -401
- package/tests/integration/keyword-search-fts.test.ts +0 -66
- package/tests/integration/mcp-recall-logging.test.ts +0 -88
- package/tests/integration/mcp.test.ts +0 -248
- package/tests/integration/memo-sweep.test.ts +0 -91
- package/tests/integration/prompt-recall-hook.test.ts +0 -88
- package/tests/integration/provider-registry.test.ts +0 -107
- package/tests/integration/recall-golden.test.ts +0 -59
- package/tests/integration/recall-sqlite.test.ts +0 -169
- package/tests/integration/scheduler.test.ts +0 -391
- package/tests/integration/session-end-hook.test.ts +0 -48
- package/tests/integration/session-start-hook.test.ts +0 -126
- package/tests/integration/source-registry.test.ts +0 -120
- package/tests/integration/sqlite-fact-store.test.ts +0 -346
- package/tests/integration/stop-hook.test.ts +0 -560
- package/tests/integration/wal-checkpoint.test.ts +0 -49
- package/tests/unit/cli/launchctl-helpers.test.ts +0 -60
- package/tests/unit/core/adapters/aider.test.ts +0 -230
- package/tests/unit/core/adapters/claude-code.test.ts +0 -118
- package/tests/unit/core/adapters/hermes-agent.test.ts +0 -329
- package/tests/unit/core/adapters/hermes.test.ts +0 -81
- package/tests/unit/core/adapters/jsonl-generic.test.ts +0 -142
- package/tests/unit/core/adapters/opencode.test.ts +0 -354
- package/tests/unit/core/adapters/pi.test.ts +0 -110
- package/tests/unit/core/classifier/prompt.test.ts +0 -126
- package/tests/unit/core/embedding/chunk-body.test.ts +0 -100
- package/tests/unit/core/facts/extract-facts.test.ts +0 -117
- package/tests/unit/core/filter.test.ts +0 -40
- package/tests/unit/core/hook/citation-detect-cite-session.test.ts +0 -96
- package/tests/unit/core/hook/citation-detect.test.ts +0 -124
- package/tests/unit/core/hook/gate.test.ts +0 -29
- package/tests/unit/core/hook/pointer-block.test.ts +0 -22
- package/tests/unit/core/hook/select.test.ts +0 -66
- package/tests/unit/core/match-fields.test.ts +0 -39
- package/tests/unit/core/mcp-cite-session.test.ts +0 -51
- package/tests/unit/core/providers/provider-models.test.ts +0 -101
- package/tests/unit/core/query-shape.test.ts +0 -92
- package/tests/unit/core/recall-facts/fact-recall-service.test.ts +0 -258
- package/tests/unit/core/recall-service.test.ts +0 -200
- package/tests/unit/core/storage/live-status.test.ts +0 -54
- package/tests/unit/core/tokenize.test.ts +0 -32
- package/tests/unit/core/useful-scan.test.ts +0 -537
- package/tests/unit/llm/embed.test.ts +0 -93
- package/tests/unit/llm/ollama-client.test.ts +0 -124
- package/tests/unit/scripts/longmemeval-scorer.test.ts +0 -114
- package/tsconfig.json +0 -31
- package/tsconfig.test.json +0 -11
- package/vitest.config.ts +0 -22
|
@@ -1,537 +0,0 @@
|
|
|
1
|
-
import { describe, expect, it } from "vitest";
|
|
2
|
-
import { mkdirSync, writeFileSync } from "node:fs";
|
|
3
|
-
import { join } from "node:path";
|
|
4
|
-
import { tmpdir } from "node:os";
|
|
5
|
-
import {
|
|
6
|
-
isProbe,
|
|
7
|
-
extractAssistantTurnsAfter,
|
|
8
|
-
findMatchedId,
|
|
9
|
-
scanUsefulHits,
|
|
10
|
-
readUsefulHitRate,
|
|
11
|
-
} from "../../../src/core/recall/useful-scan.js";
|
|
12
|
-
|
|
13
|
-
// ── isProbe ──────────────────────────────────────────────────────────────────
|
|
14
|
-
|
|
15
|
-
describe("isProbe", () => {
|
|
16
|
-
it("returns true for probe patterns", () => {
|
|
17
|
-
expect(isProbe("concurrency probe round 2")).toBe(true);
|
|
18
|
-
expect(isProbe("test probe")).toBe(true);
|
|
19
|
-
expect(isProbe("path test for the hook")).toBe(true);
|
|
20
|
-
expect(isProbe("recall test")).toBe(true);
|
|
21
|
-
expect(isProbe("smoke test run")).toBe(true);
|
|
22
|
-
expect(isProbe("cutover validation")).toBe(true);
|
|
23
|
-
});
|
|
24
|
-
|
|
25
|
-
it("returns false for normal prompts", () => {
|
|
26
|
-
expect(isProbe("what did we decide about pgvector")).toBe(false);
|
|
27
|
-
expect(isProbe("how should we implement the recall hook")).toBe(false);
|
|
28
|
-
expect(isProbe("review the PR")).toBe(false);
|
|
29
|
-
});
|
|
30
|
-
|
|
31
|
-
it("is case-insensitive", () => {
|
|
32
|
-
expect(isProbe("SMOKE TEST")).toBe(true);
|
|
33
|
-
expect(isProbe("Concurrency Probe")).toBe(true);
|
|
34
|
-
});
|
|
35
|
-
});
|
|
36
|
-
|
|
37
|
-
// ── extractAssistantTurnsAfter ───────────────────────────────────────────────
|
|
38
|
-
|
|
39
|
-
function makeTranscript(
|
|
40
|
-
lines: Array<{ type: string; timestamp: string; content?: string | Array<Record<string, unknown>> }>,
|
|
41
|
-
): string {
|
|
42
|
-
return lines
|
|
43
|
-
.map((l) => {
|
|
44
|
-
const msg =
|
|
45
|
-
l.type === "assistant"
|
|
46
|
-
? {
|
|
47
|
-
type: "assistant",
|
|
48
|
-
timestamp: l.timestamp,
|
|
49
|
-
message: { content: l.content ?? "" },
|
|
50
|
-
}
|
|
51
|
-
: { type: l.type, timestamp: l.timestamp };
|
|
52
|
-
return JSON.stringify(msg);
|
|
53
|
-
})
|
|
54
|
-
.join("\n");
|
|
55
|
-
}
|
|
56
|
-
|
|
57
|
-
describe("extractAssistantTurnsAfter", () => {
|
|
58
|
-
it("returns empty for a missing file", () => {
|
|
59
|
-
expect(extractAssistantTurnsAfter("/tmp/nlm-nonexistent-transcript.jsonl", 0, 3)).toEqual([]);
|
|
60
|
-
});
|
|
61
|
-
|
|
62
|
-
it("returns empty when no assistant turns exist after the cutoff", () => {
|
|
63
|
-
const dir = tmpdir();
|
|
64
|
-
const path = join(dir, `transcript-past-${Date.now()}.jsonl`);
|
|
65
|
-
writeFileSync(
|
|
66
|
-
path,
|
|
67
|
-
makeTranscript([
|
|
68
|
-
{ type: "user", timestamp: "2026-01-01T00:00:00.000Z" },
|
|
69
|
-
{ type: "assistant", timestamp: "2026-01-01T00:00:01.000Z", content: "answer" },
|
|
70
|
-
]),
|
|
71
|
-
);
|
|
72
|
-
// cutoff is after the assistant turn
|
|
73
|
-
const cutoff = Date.parse("2026-01-01T00:00:02.000Z");
|
|
74
|
-
expect(extractAssistantTurnsAfter(path, cutoff, 3)).toEqual([]);
|
|
75
|
-
});
|
|
76
|
-
|
|
77
|
-
it("returns up to `limit` assistant turns at or after the cutoff", () => {
|
|
78
|
-
const dir = tmpdir();
|
|
79
|
-
const path = join(dir, `transcript-limit-${Date.now()}.jsonl`);
|
|
80
|
-
const ts = "2026-05-01T10:00:00.000Z";
|
|
81
|
-
writeFileSync(
|
|
82
|
-
path,
|
|
83
|
-
makeTranscript([
|
|
84
|
-
{ type: "user", timestamp: "2026-05-01T09:59:59.000Z" },
|
|
85
|
-
{ type: "assistant", timestamp: ts, content: "turn-1" },
|
|
86
|
-
{ type: "user", timestamp: "2026-05-01T10:00:01.000Z" },
|
|
87
|
-
{ type: "assistant", timestamp: "2026-05-01T10:00:02.000Z", content: "turn-2" },
|
|
88
|
-
{ type: "user", timestamp: "2026-05-01T10:00:03.000Z" },
|
|
89
|
-
{ type: "assistant", timestamp: "2026-05-01T10:00:04.000Z", content: "turn-3" },
|
|
90
|
-
{ type: "user", timestamp: "2026-05-01T10:00:05.000Z" },
|
|
91
|
-
{ type: "assistant", timestamp: "2026-05-01T10:00:06.000Z", content: "turn-4" },
|
|
92
|
-
]),
|
|
93
|
-
);
|
|
94
|
-
const cutoff = Date.parse(ts);
|
|
95
|
-
const turns = extractAssistantTurnsAfter(path, cutoff, 3);
|
|
96
|
-
expect(turns).toHaveLength(3);
|
|
97
|
-
expect(turns[0]).toContain("turn-1");
|
|
98
|
-
expect(turns[1]).toContain("turn-2");
|
|
99
|
-
expect(turns[2]).toContain("turn-3");
|
|
100
|
-
});
|
|
101
|
-
|
|
102
|
-
it("extracts text from content-array turns (text + tool_use)", () => {
|
|
103
|
-
const dir = tmpdir();
|
|
104
|
-
const path = join(dir, `transcript-blocks-${Date.now()}.jsonl`);
|
|
105
|
-
const ts = "2026-05-01T10:00:00.000Z";
|
|
106
|
-
const content: Array<Record<string, unknown>> = [
|
|
107
|
-
{ type: "text", text: "I looked it up." },
|
|
108
|
-
{ type: "tool_use", name: "mcp__nlm-memory__get_session", input: { id: "cc_sub_abc123" } },
|
|
109
|
-
];
|
|
110
|
-
writeFileSync(
|
|
111
|
-
path,
|
|
112
|
-
JSON.stringify({ type: "assistant", timestamp: ts, message: { content } }) + "\n",
|
|
113
|
-
);
|
|
114
|
-
const turns = extractAssistantTurnsAfter(path, Date.parse(ts), 3);
|
|
115
|
-
expect(turns).toHaveLength(1);
|
|
116
|
-
expect(turns[0]).toContain("I looked it up.");
|
|
117
|
-
expect(turns[0]).toContain("cc_sub_abc123");
|
|
118
|
-
});
|
|
119
|
-
|
|
120
|
-
it("skips malformed JSON lines without throwing", () => {
|
|
121
|
-
const dir = tmpdir();
|
|
122
|
-
const path = join(dir, `transcript-malformed-${Date.now()}.jsonl`);
|
|
123
|
-
const ts = "2026-05-01T10:00:00.000Z";
|
|
124
|
-
writeFileSync(
|
|
125
|
-
path,
|
|
126
|
-
"not json\n" +
|
|
127
|
-
JSON.stringify({ type: "assistant", timestamp: ts, message: { content: "ok" } }) +
|
|
128
|
-
"\n",
|
|
129
|
-
);
|
|
130
|
-
const turns = extractAssistantTurnsAfter(path, Date.parse(ts), 3);
|
|
131
|
-
expect(turns).toHaveLength(1);
|
|
132
|
-
expect(turns[0]).toContain("ok");
|
|
133
|
-
});
|
|
134
|
-
});
|
|
135
|
-
|
|
136
|
-
// ── findMatchedId ────────────────────────────────────────────────────────────
|
|
137
|
-
|
|
138
|
-
describe("findMatchedId", () => {
|
|
139
|
-
it("returns the first matching ID", () => {
|
|
140
|
-
expect(findMatchedId(["cc_sub_abc", "cc_sub_def"], ["context cc_sub_abc here"])).toBe(
|
|
141
|
-
"cc_sub_abc",
|
|
142
|
-
);
|
|
143
|
-
});
|
|
144
|
-
|
|
145
|
-
it("returns null when no ID appears", () => {
|
|
146
|
-
expect(findMatchedId(["cc_sub_abc"], ["completely unrelated text"])).toBeNull();
|
|
147
|
-
});
|
|
148
|
-
|
|
149
|
-
it("matches IDs inside tool_use serialized JSON", () => {
|
|
150
|
-
const turns = [JSON.stringify({ id: "cc_sub_xyz123" })];
|
|
151
|
-
expect(findMatchedId(["cc_sub_xyz123"], turns)).toBe("cc_sub_xyz123");
|
|
152
|
-
});
|
|
153
|
-
|
|
154
|
-
it("returns null for empty ids list", () => {
|
|
155
|
-
expect(findMatchedId([], ["some text"])).toBeNull();
|
|
156
|
-
});
|
|
157
|
-
|
|
158
|
-
it("returns null for empty turns list", () => {
|
|
159
|
-
expect(findMatchedId(["cc_sub_abc"], [])).toBeNull();
|
|
160
|
-
});
|
|
161
|
-
});
|
|
162
|
-
|
|
163
|
-
// ── scanUsefulHits ───────────────────────────────────────────────────────────
|
|
164
|
-
|
|
165
|
-
function setupScanDirs(): { root: string; hookLogPath: string; usefulHitLogPath: string; transcriptsDir: string } {
|
|
166
|
-
const root = join(tmpdir(), `nlm-scan-test-${Date.now()}-${Math.random().toString(36).slice(2)}`);
|
|
167
|
-
mkdirSync(root, { recursive: true });
|
|
168
|
-
const hookLogPath = join(root, "hook-log.jsonl");
|
|
169
|
-
const usefulHitLogPath = join(root, "useful-hit-log.jsonl");
|
|
170
|
-
const transcriptsDir = join(root, "projects");
|
|
171
|
-
mkdirSync(transcriptsDir, { recursive: true });
|
|
172
|
-
return { root, hookLogPath, usefulHitLogPath, transcriptsDir };
|
|
173
|
-
}
|
|
174
|
-
|
|
175
|
-
function writeTranscript(transcriptsDir: string, conversationId: string, content: string): void {
|
|
176
|
-
const projectDir = join(transcriptsDir, "test-project");
|
|
177
|
-
mkdirSync(projectDir, { recursive: true });
|
|
178
|
-
writeFileSync(join(projectDir, `${conversationId}.jsonl`), content);
|
|
179
|
-
}
|
|
180
|
-
|
|
181
|
-
describe("scanUsefulHits", () => {
|
|
182
|
-
it("returns zero totals when hook log is absent", async () => {
|
|
183
|
-
const { root, hookLogPath, usefulHitLogPath, transcriptsDir } = setupScanDirs();
|
|
184
|
-
const result = await scanUsefulHits({
|
|
185
|
-
days: 1,
|
|
186
|
-
hookLogPath,
|
|
187
|
-
usefulHitLogPath,
|
|
188
|
-
transcriptsDir,
|
|
189
|
-
dryRun: true,
|
|
190
|
-
});
|
|
191
|
-
expect(result).toEqual({ total: 0, measurable: 0, useful: 0, appended: 0 });
|
|
192
|
-
// suppress unused warning
|
|
193
|
-
void root;
|
|
194
|
-
});
|
|
195
|
-
|
|
196
|
-
it("counts a useful hit when the ID appears in the next assistant turn", async () => {
|
|
197
|
-
const { hookLogPath, usefulHitLogPath, transcriptsDir } = setupScanDirs();
|
|
198
|
-
const convId = "test-conv-useful-hit";
|
|
199
|
-
const hookTs = new Date().toISOString();
|
|
200
|
-
const afterTs = new Date(Date.parse(hookTs) + 1000).toISOString();
|
|
201
|
-
|
|
202
|
-
// Hook log entry with wouldInject
|
|
203
|
-
writeFileSync(
|
|
204
|
-
hookLogPath,
|
|
205
|
-
JSON.stringify({
|
|
206
|
-
ts: hookTs,
|
|
207
|
-
conversationId: convId,
|
|
208
|
-
promptPreview: "what did we decide about the schema",
|
|
209
|
-
gate: "evaluate",
|
|
210
|
-
hits: [{ id: "cc_sub_abc123def456", score: 1.2 }],
|
|
211
|
-
wouldInject: ["cc_sub_abc123def456"],
|
|
212
|
-
estTokens: 50,
|
|
213
|
-
mode: "shadow",
|
|
214
|
-
}) + "\n",
|
|
215
|
-
);
|
|
216
|
-
|
|
217
|
-
// Transcript with the ID appearing in the assistant turn after the hook
|
|
218
|
-
writeTranscript(
|
|
219
|
-
transcriptsDir,
|
|
220
|
-
convId,
|
|
221
|
-
JSON.stringify({ type: "user", timestamp: hookTs }) +
|
|
222
|
-
"\n" +
|
|
223
|
-
JSON.stringify({
|
|
224
|
-
type: "assistant",
|
|
225
|
-
timestamp: afterTs,
|
|
226
|
-
message: { content: "Per cc_sub_abc123def456 we chose the new schema." },
|
|
227
|
-
}) +
|
|
228
|
-
"\n",
|
|
229
|
-
);
|
|
230
|
-
|
|
231
|
-
const result = await scanUsefulHits({
|
|
232
|
-
days: 1,
|
|
233
|
-
hookLogPath,
|
|
234
|
-
usefulHitLogPath,
|
|
235
|
-
transcriptsDir,
|
|
236
|
-
});
|
|
237
|
-
|
|
238
|
-
expect(result.total).toBe(1);
|
|
239
|
-
expect(result.measurable).toBe(1);
|
|
240
|
-
expect(result.useful).toBe(1);
|
|
241
|
-
expect(result.appended).toBe(1);
|
|
242
|
-
});
|
|
243
|
-
|
|
244
|
-
it("records useful=false when the ID does not appear in subsequent turns", async () => {
|
|
245
|
-
const { hookLogPath, usefulHitLogPath, transcriptsDir } = setupScanDirs();
|
|
246
|
-
const convId = "test-conv-not-useful";
|
|
247
|
-
const hookTs = new Date().toISOString();
|
|
248
|
-
const afterTs = new Date(Date.parse(hookTs) + 1000).toISOString();
|
|
249
|
-
|
|
250
|
-
writeFileSync(
|
|
251
|
-
hookLogPath,
|
|
252
|
-
JSON.stringify({
|
|
253
|
-
ts: hookTs,
|
|
254
|
-
conversationId: convId,
|
|
255
|
-
promptPreview: "explain this code",
|
|
256
|
-
gate: "evaluate",
|
|
257
|
-
hits: [{ id: "cc_sub_zzz999", score: 0.8 }],
|
|
258
|
-
wouldInject: ["cc_sub_zzz999"],
|
|
259
|
-
estTokens: 30,
|
|
260
|
-
mode: "shadow",
|
|
261
|
-
}) + "\n",
|
|
262
|
-
);
|
|
263
|
-
|
|
264
|
-
writeTranscript(
|
|
265
|
-
transcriptsDir,
|
|
266
|
-
convId,
|
|
267
|
-
JSON.stringify({ type: "user", timestamp: hookTs }) +
|
|
268
|
-
"\n" +
|
|
269
|
-
JSON.stringify({
|
|
270
|
-
type: "assistant",
|
|
271
|
-
timestamp: afterTs,
|
|
272
|
-
message: { content: "Here is the explanation." },
|
|
273
|
-
}) +
|
|
274
|
-
"\n",
|
|
275
|
-
);
|
|
276
|
-
|
|
277
|
-
const result = await scanUsefulHits({
|
|
278
|
-
days: 1,
|
|
279
|
-
hookLogPath,
|
|
280
|
-
usefulHitLogPath,
|
|
281
|
-
transcriptsDir,
|
|
282
|
-
});
|
|
283
|
-
|
|
284
|
-
expect(result.useful).toBe(0);
|
|
285
|
-
expect(result.measurable).toBe(1);
|
|
286
|
-
|
|
287
|
-
// Verify the written entry has useful=false
|
|
288
|
-
const { readFileSync } = await import("node:fs");
|
|
289
|
-
const written = JSON.parse(readFileSync(usefulHitLogPath, "utf8").trim()) as Record<string, unknown>;
|
|
290
|
-
expect(written["useful"]).toBe(false);
|
|
291
|
-
expect(written["matchedId"]).toBeNull();
|
|
292
|
-
});
|
|
293
|
-
|
|
294
|
-
it("records useful=null when no transcript is found", async () => {
|
|
295
|
-
const { hookLogPath, usefulHitLogPath, transcriptsDir } = setupScanDirs();
|
|
296
|
-
const hookTs = new Date().toISOString();
|
|
297
|
-
|
|
298
|
-
writeFileSync(
|
|
299
|
-
hookLogPath,
|
|
300
|
-
JSON.stringify({
|
|
301
|
-
ts: hookTs,
|
|
302
|
-
conversationId: "missing-conv-id-xyz",
|
|
303
|
-
promptPreview: "what is the error",
|
|
304
|
-
gate: "evaluate",
|
|
305
|
-
hits: [{ id: "cc_sub_missing", score: 1.0 }],
|
|
306
|
-
wouldInject: ["cc_sub_missing"],
|
|
307
|
-
estTokens: 20,
|
|
308
|
-
mode: "shadow",
|
|
309
|
-
}) + "\n",
|
|
310
|
-
);
|
|
311
|
-
|
|
312
|
-
const result = await scanUsefulHits({
|
|
313
|
-
days: 1,
|
|
314
|
-
hookLogPath,
|
|
315
|
-
usefulHitLogPath,
|
|
316
|
-
transcriptsDir,
|
|
317
|
-
});
|
|
318
|
-
|
|
319
|
-
expect(result.measurable).toBe(0);
|
|
320
|
-
expect(result.useful).toBe(0);
|
|
321
|
-
|
|
322
|
-
const { readFileSync } = await import("node:fs");
|
|
323
|
-
const written = JSON.parse(readFileSync(usefulHitLogPath, "utf8").trim()) as Record<string, unknown>;
|
|
324
|
-
expect(written["useful"]).toBeNull();
|
|
325
|
-
});
|
|
326
|
-
|
|
327
|
-
it("skips probe entries", async () => {
|
|
328
|
-
const { hookLogPath, usefulHitLogPath, transcriptsDir } = setupScanDirs();
|
|
329
|
-
const hookTs = new Date().toISOString();
|
|
330
|
-
|
|
331
|
-
writeFileSync(
|
|
332
|
-
hookLogPath,
|
|
333
|
-
JSON.stringify({
|
|
334
|
-
ts: hookTs,
|
|
335
|
-
conversationId: "probe-conv",
|
|
336
|
-
promptPreview: "recall test round 3",
|
|
337
|
-
gate: "evaluate",
|
|
338
|
-
hits: [{ id: "cc_sub_probe", score: 1.0 }],
|
|
339
|
-
wouldInject: ["cc_sub_probe"],
|
|
340
|
-
estTokens: 10,
|
|
341
|
-
mode: "shadow",
|
|
342
|
-
}) + "\n",
|
|
343
|
-
);
|
|
344
|
-
|
|
345
|
-
const result = await scanUsefulHits({
|
|
346
|
-
days: 1,
|
|
347
|
-
hookLogPath,
|
|
348
|
-
usefulHitLogPath,
|
|
349
|
-
transcriptsDir,
|
|
350
|
-
});
|
|
351
|
-
|
|
352
|
-
expect(result.total).toBe(0);
|
|
353
|
-
});
|
|
354
|
-
|
|
355
|
-
it("skips entries with empty wouldInject", async () => {
|
|
356
|
-
const { hookLogPath, usefulHitLogPath, transcriptsDir } = setupScanDirs();
|
|
357
|
-
const hookTs = new Date().toISOString();
|
|
358
|
-
|
|
359
|
-
writeFileSync(
|
|
360
|
-
hookLogPath,
|
|
361
|
-
JSON.stringify({
|
|
362
|
-
ts: hookTs,
|
|
363
|
-
conversationId: "conv-no-inject",
|
|
364
|
-
promptPreview: "what is the status",
|
|
365
|
-
gate: "generative",
|
|
366
|
-
hits: [],
|
|
367
|
-
wouldInject: [],
|
|
368
|
-
estTokens: 0,
|
|
369
|
-
mode: "shadow",
|
|
370
|
-
}) + "\n",
|
|
371
|
-
);
|
|
372
|
-
|
|
373
|
-
const result = await scanUsefulHits({
|
|
374
|
-
days: 1,
|
|
375
|
-
hookLogPath,
|
|
376
|
-
usefulHitLogPath,
|
|
377
|
-
transcriptsDir,
|
|
378
|
-
});
|
|
379
|
-
|
|
380
|
-
expect(result.total).toBe(0);
|
|
381
|
-
});
|
|
382
|
-
|
|
383
|
-
it("skips stop-hook entries (kind field present)", async () => {
|
|
384
|
-
const { hookLogPath, usefulHitLogPath, transcriptsDir } = setupScanDirs();
|
|
385
|
-
const hookTs = new Date().toISOString();
|
|
386
|
-
|
|
387
|
-
writeFileSync(
|
|
388
|
-
hookLogPath,
|
|
389
|
-
JSON.stringify({
|
|
390
|
-
ts: hookTs,
|
|
391
|
-
kind: "stop",
|
|
392
|
-
conversationId: "conv-stop",
|
|
393
|
-
surfacedCount: 2,
|
|
394
|
-
citedIds: ["cc_sub_abc"],
|
|
395
|
-
citationKinds: ["tool_use"],
|
|
396
|
-
skipped: false,
|
|
397
|
-
mode: "shadow",
|
|
398
|
-
}) + "\n",
|
|
399
|
-
);
|
|
400
|
-
|
|
401
|
-
const result = await scanUsefulHits({
|
|
402
|
-
days: 1,
|
|
403
|
-
hookLogPath,
|
|
404
|
-
usefulHitLogPath,
|
|
405
|
-
transcriptsDir,
|
|
406
|
-
});
|
|
407
|
-
|
|
408
|
-
expect(result.total).toBe(0);
|
|
409
|
-
});
|
|
410
|
-
|
|
411
|
-
it("skips already-scanned entries on a second run", async () => {
|
|
412
|
-
const { hookLogPath, usefulHitLogPath, transcriptsDir } = setupScanDirs();
|
|
413
|
-
const convId = "conv-dedup";
|
|
414
|
-
const hookTs = new Date().toISOString();
|
|
415
|
-
const afterTs = new Date(Date.parse(hookTs) + 1000).toISOString();
|
|
416
|
-
|
|
417
|
-
writeFileSync(
|
|
418
|
-
hookLogPath,
|
|
419
|
-
JSON.stringify({
|
|
420
|
-
ts: hookTs,
|
|
421
|
-
conversationId: convId,
|
|
422
|
-
promptPreview: "help with recall",
|
|
423
|
-
gate: "evaluate",
|
|
424
|
-
hits: [{ id: "cc_sub_dedup123", score: 1.1 }],
|
|
425
|
-
wouldInject: ["cc_sub_dedup123"],
|
|
426
|
-
estTokens: 40,
|
|
427
|
-
mode: "shadow",
|
|
428
|
-
}) + "\n",
|
|
429
|
-
);
|
|
430
|
-
|
|
431
|
-
writeTranscript(
|
|
432
|
-
transcriptsDir,
|
|
433
|
-
convId,
|
|
434
|
-
JSON.stringify({ type: "user", timestamp: hookTs }) +
|
|
435
|
-
"\n" +
|
|
436
|
-
JSON.stringify({
|
|
437
|
-
type: "assistant",
|
|
438
|
-
timestamp: afterTs,
|
|
439
|
-
message: { content: "Used cc_sub_dedup123 for the answer." },
|
|
440
|
-
}) +
|
|
441
|
-
"\n",
|
|
442
|
-
);
|
|
443
|
-
|
|
444
|
-
const first = await scanUsefulHits({ days: 1, hookLogPath, usefulHitLogPath, transcriptsDir });
|
|
445
|
-
expect(first.appended).toBe(1);
|
|
446
|
-
|
|
447
|
-
const second = await scanUsefulHits({ days: 1, hookLogPath, usefulHitLogPath, transcriptsDir });
|
|
448
|
-
expect(second.appended).toBe(0);
|
|
449
|
-
expect(second.total).toBe(1);
|
|
450
|
-
});
|
|
451
|
-
|
|
452
|
-
it("does not write when dryRun=true", async () => {
|
|
453
|
-
const { hookLogPath, usefulHitLogPath, transcriptsDir } = setupScanDirs();
|
|
454
|
-
const hookTs = new Date().toISOString();
|
|
455
|
-
|
|
456
|
-
writeFileSync(
|
|
457
|
-
hookLogPath,
|
|
458
|
-
JSON.stringify({
|
|
459
|
-
ts: hookTs,
|
|
460
|
-
conversationId: "dry-conv",
|
|
461
|
-
promptPreview: "explain the bug",
|
|
462
|
-
gate: "evaluate",
|
|
463
|
-
hits: [{ id: "cc_sub_dry", score: 1.0 }],
|
|
464
|
-
wouldInject: ["cc_sub_dry"],
|
|
465
|
-
estTokens: 20,
|
|
466
|
-
mode: "shadow",
|
|
467
|
-
}) + "\n",
|
|
468
|
-
);
|
|
469
|
-
|
|
470
|
-
const result = await scanUsefulHits({
|
|
471
|
-
days: 1,
|
|
472
|
-
hookLogPath,
|
|
473
|
-
usefulHitLogPath,
|
|
474
|
-
transcriptsDir,
|
|
475
|
-
dryRun: true,
|
|
476
|
-
});
|
|
477
|
-
|
|
478
|
-
expect(result.appended).toBe(0);
|
|
479
|
-
expect(result.total).toBe(1);
|
|
480
|
-
const { existsSync } = await import("node:fs");
|
|
481
|
-
expect(existsSync(usefulHitLogPath)).toBe(false);
|
|
482
|
-
});
|
|
483
|
-
});
|
|
484
|
-
|
|
485
|
-
// ── readUsefulHitRate ────────────────────────────────────────────────────────
|
|
486
|
-
|
|
487
|
-
describe("readUsefulHitRate", () => {
|
|
488
|
-
it("returns null when the log file is absent", async () => {
|
|
489
|
-
const path = join(tmpdir(), `nlm-no-useful-${Date.now()}.jsonl`);
|
|
490
|
-
expect(await readUsefulHitRate(path, 1)).toBeNull();
|
|
491
|
-
});
|
|
492
|
-
|
|
493
|
-
it("returns null when all entries have useful=null (unmeasurable)", async () => {
|
|
494
|
-
const path = join(tmpdir(), `nlm-useful-null-${Date.now()}.jsonl`);
|
|
495
|
-
const ts = new Date().toISOString();
|
|
496
|
-
writeFileSync(
|
|
497
|
-
path,
|
|
498
|
-
JSON.stringify({ ts, conversationId: "x", useful: null, returnedIds: [], source: "hook", matchedId: null, scannedAt: ts }) + "\n",
|
|
499
|
-
);
|
|
500
|
-
expect(await readUsefulHitRate(path, 1)).toBeNull();
|
|
501
|
-
});
|
|
502
|
-
|
|
503
|
-
it("computes the rate correctly from measurable entries", async () => {
|
|
504
|
-
const path = join(tmpdir(), `nlm-useful-rate-${Date.now()}.jsonl`);
|
|
505
|
-
const ts = new Date().toISOString();
|
|
506
|
-
writeFileSync(
|
|
507
|
-
path,
|
|
508
|
-
[
|
|
509
|
-
{ ts, conversationId: "a", useful: true, returnedIds: ["cc_sub_1"], source: "hook", matchedId: "cc_sub_1", scannedAt: ts },
|
|
510
|
-
{ ts, conversationId: "b", useful: false, returnedIds: ["cc_sub_2"], source: "hook", matchedId: null, scannedAt: ts },
|
|
511
|
-
{ ts, conversationId: "c", useful: true, returnedIds: ["cc_sub_3"], source: "hook", matchedId: "cc_sub_3", scannedAt: ts },
|
|
512
|
-
{ ts, conversationId: "d", useful: null, returnedIds: ["cc_sub_4"], source: "hook", matchedId: null, scannedAt: ts },
|
|
513
|
-
]
|
|
514
|
-
.map((e) => JSON.stringify(e))
|
|
515
|
-
.join("\n") + "\n",
|
|
516
|
-
);
|
|
517
|
-
// 2 useful out of 3 measurable = 0.667
|
|
518
|
-
expect(await readUsefulHitRate(path, 1)).toBeCloseTo(0.667, 2);
|
|
519
|
-
});
|
|
520
|
-
|
|
521
|
-
it("excludes entries outside the window", async () => {
|
|
522
|
-
const path = join(tmpdir(), `nlm-useful-window-${Date.now()}.jsonl`);
|
|
523
|
-
const old = new Date(Date.now() - 3 * 24 * 60 * 60 * 1000).toISOString();
|
|
524
|
-
const recent = new Date().toISOString();
|
|
525
|
-
writeFileSync(
|
|
526
|
-
path,
|
|
527
|
-
[
|
|
528
|
-
{ ts: old, conversationId: "old", useful: true, returnedIds: [], source: "hook", matchedId: "x", scannedAt: old },
|
|
529
|
-
{ ts: recent, conversationId: "new", useful: false, returnedIds: [], source: "hook", matchedId: null, scannedAt: recent },
|
|
530
|
-
]
|
|
531
|
-
.map((e) => JSON.stringify(e))
|
|
532
|
-
.join("\n") + "\n",
|
|
533
|
-
);
|
|
534
|
-
// Only the recent entry is in the 1-day window: 0/1 = 0.0
|
|
535
|
-
expect(await readUsefulHitRate(path, 1)).toBe(0);
|
|
536
|
-
});
|
|
537
|
-
});
|
|
@@ -1,93 +0,0 @@
|
|
|
1
|
-
/**
|
|
2
|
-
* Unit tests for OllamaClient.embed: nomic prefix scheme, L2 normalization,
|
|
3
|
-
* 8K char truncation. These guard the nomic-embed-text v1.5 contract.
|
|
4
|
-
*/
|
|
5
|
-
|
|
6
|
-
import { describe, expect, it } from "vitest";
|
|
7
|
-
import { OllamaClient, l2Normalize } from "../../../src/llm/ollama-client.js";
|
|
8
|
-
|
|
9
|
-
type FakeFetch = typeof fetch;
|
|
10
|
-
|
|
11
|
-
function jsonResponse(body: unknown): Response {
|
|
12
|
-
return new Response(JSON.stringify(body), {
|
|
13
|
-
status: 200,
|
|
14
|
-
headers: { "content-type": "application/json" },
|
|
15
|
-
});
|
|
16
|
-
}
|
|
17
|
-
|
|
18
|
-
function makeFetch(reply: (req: { url: string; body: unknown }) => Response): FakeFetch {
|
|
19
|
-
return (async (input: string | URL | Request, init?: RequestInit) => {
|
|
20
|
-
const url = typeof input === "string" ? input : input.toString();
|
|
21
|
-
const body = init?.body ? JSON.parse(init.body.toString()) : null;
|
|
22
|
-
return reply({ url, body });
|
|
23
|
-
}) as FakeFetch;
|
|
24
|
-
}
|
|
25
|
-
|
|
26
|
-
describe("OllamaClient.embed prefix scheme", () => {
|
|
27
|
-
it("prefixes a query call with 'search_query: '", async () => {
|
|
28
|
-
let prompt = "";
|
|
29
|
-
const fetchImpl = makeFetch(({ body }) => {
|
|
30
|
-
prompt = (body as { prompt: string }).prompt;
|
|
31
|
-
return jsonResponse({ embedding: [1, 0, 0] });
|
|
32
|
-
});
|
|
33
|
-
const client = new OllamaClient({ fetchImpl });
|
|
34
|
-
await client.embed("what did we decide about pgvector", "query");
|
|
35
|
-
expect(prompt.startsWith("search_query: ")).toBe(true);
|
|
36
|
-
expect(prompt).toContain("pgvector");
|
|
37
|
-
});
|
|
38
|
-
|
|
39
|
-
it("prefixes a document call with 'search_document: '", async () => {
|
|
40
|
-
let prompt = "";
|
|
41
|
-
const fetchImpl = makeFetch(({ body }) => {
|
|
42
|
-
prompt = (body as { prompt: string }).prompt;
|
|
43
|
-
return jsonResponse({ embedding: [1, 0, 0] });
|
|
44
|
-
});
|
|
45
|
-
const client = new OllamaClient({ fetchImpl });
|
|
46
|
-
await client.embed("session body text", "document");
|
|
47
|
-
expect(prompt.startsWith("search_document: ")).toBe(true);
|
|
48
|
-
});
|
|
49
|
-
|
|
50
|
-
it("truncates text to MAX_EMBED_CHARS (8000) before prefixing", async () => {
|
|
51
|
-
let prompt = "";
|
|
52
|
-
const fetchImpl = makeFetch(({ body }) => {
|
|
53
|
-
prompt = (body as { prompt: string }).prompt;
|
|
54
|
-
return jsonResponse({ embedding: [1, 0, 0] });
|
|
55
|
-
});
|
|
56
|
-
const client = new OllamaClient({ fetchImpl });
|
|
57
|
-
const big = "x".repeat(10_000);
|
|
58
|
-
await client.embed(big, "document");
|
|
59
|
-
// prompt = "search_document: " + truncated → prefix is 17 chars, body capped at 8000.
|
|
60
|
-
// Briefly raised to 28000 on 2026-05-25 then reverted same day; nomic-
|
|
61
|
-
// embed-text via Ollama 500s on inputs near the nominal 8192-token
|
|
62
|
-
// context. Real fix is chunk + max-pool (filed as #174).
|
|
63
|
-
expect(prompt.length).toBe(17 + 8_000);
|
|
64
|
-
});
|
|
65
|
-
|
|
66
|
-
it("L2-normalizes the returned vector", async () => {
|
|
67
|
-
const fetchImpl = makeFetch(() => jsonResponse({ embedding: [3, 4, 0] }));
|
|
68
|
-
const client = new OllamaClient({ fetchImpl });
|
|
69
|
-
const { vector } = await client.embed("anything", "document");
|
|
70
|
-
// raw norm = 5; normalized should be [0.6, 0.8, 0]
|
|
71
|
-
expect(vector[0]).toBeCloseTo(0.6, 6);
|
|
72
|
-
expect(vector[1]).toBeCloseTo(0.8, 6);
|
|
73
|
-
expect(vector[2]).toBe(0);
|
|
74
|
-
let norm = 0;
|
|
75
|
-
for (const v of vector) norm += v * v;
|
|
76
|
-
expect(Math.sqrt(norm)).toBeCloseTo(1, 6);
|
|
77
|
-
});
|
|
78
|
-
});
|
|
79
|
-
|
|
80
|
-
describe("l2Normalize", () => {
|
|
81
|
-
it("returns a unit vector for a non-zero input", () => {
|
|
82
|
-
const out = l2Normalize(new Float32Array([3, 4, 0]));
|
|
83
|
-
let sum = 0;
|
|
84
|
-
for (const v of out) sum += v * v;
|
|
85
|
-
expect(Math.sqrt(sum)).toBeCloseTo(1, 6);
|
|
86
|
-
});
|
|
87
|
-
|
|
88
|
-
it("returns the zero vector unchanged", () => {
|
|
89
|
-
const zero = new Float32Array([0, 0, 0]);
|
|
90
|
-
const out = l2Normalize(zero);
|
|
91
|
-
expect(Array.from(out)).toEqual([0, 0, 0]);
|
|
92
|
-
});
|
|
93
|
-
});
|