claude-memory-layer 1.0.26 → 1.0.28
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/.env.example +7 -0
- package/AGENTS.md +11 -0
- package/README.md +184 -41
- package/benchmarks/replay/anonymized-real-sessions.json +48 -0
- package/dist/cli/index.js +10097 -6003
- package/dist/cli/index.js.map +4 -4
- package/dist/core/index.js +9745 -5587
- package/dist/core/index.js.map +4 -4
- package/dist/hooks/post-tool-use.js +6545 -5270
- package/dist/hooks/post-tool-use.js.map +4 -4
- package/dist/hooks/semantic-daemon.js +6646 -5354
- package/dist/hooks/semantic-daemon.js.map +4 -4
- package/dist/hooks/session-end.js +6618 -5347
- package/dist/hooks/session-end.js.map +4 -4
- package/dist/hooks/session-start.js +6619 -5354
- package/dist/hooks/session-start.js.map +4 -4
- package/dist/hooks/stop.js +6614 -5325
- package/dist/hooks/stop.js.map +4 -4
- package/dist/hooks/user-prompt-submit.js +6702 -5356
- package/dist/hooks/user-prompt-submit.js.map +4 -4
- package/dist/index.js +13537 -0
- package/dist/index.js.map +7 -0
- package/dist/mcp/index.js +20770 -0
- package/dist/mcp/index.js.map +7 -0
- package/dist/server/api/index.js +6632 -5319
- package/dist/server/api/index.js.map +4 -4
- package/dist/server/index.js +6667 -5340
- package/dist/server/index.js.map +4 -4
- package/dist/services/memory-service.js +6568 -5350
- package/dist/services/memory-service.js.map +4 -4
- package/dist/ui/assets/js/bootstrap.js +244 -0
- package/dist/ui/assets/js/chat.js +373 -0
- package/dist/ui/assets/js/disclosure.js +232 -0
- package/dist/ui/assets/js/modals.js +298 -0
- package/dist/ui/assets/js/overview.js +655 -0
- package/dist/ui/assets/js/state.js +72 -0
- package/dist/ui/assets/js/views.js +468 -0
- package/dist/ui/index.html +43 -1
- package/dist/ui/index.ts +3 -0
- package/dist/ui/style.css +222 -0
- package/docs/ARCHITECTURE_COMPARISON_AND_RECOMMENDATIONS.md +627 -0
- package/docs/HERMES_MEMORY_INGESTION_ANALYSIS.md +440 -0
- package/docs/MEMORY_USEFULNESS_AUDIT.md +371 -0
- package/docs/MEMORY_USEFULNESS_AUDIT_RAW.json +80 -0
- package/docs/MEMSEARCH_PROJECT_STRUCTURE_ANALYSIS.md +333 -0
- package/docs/PRODUCT_VALIDATION_MATRIX.md +82 -0
- package/docs/PROJECT_STRUCTURE_ANALYSIS.md +421 -0
- package/docs/REFACTORING_MILESTONES_AND_ISSUES.md +501 -0
- package/docs/REFACTORING_PLAN_THIN_CORE.md +414 -0
- package/docs/REFERENCE_PROJECT_ANALYSES.md +25 -0
- package/docs/SUPERLOCALMEMORY_PROJECT_STRUCTURE_ANALYSIS.md +452 -0
- package/docs/TARGET_ARCHITECTURE_AND_FOLDER_STRUCTURE.md +446 -0
- package/docs/architecture/comparison-index.md +47 -0
- package/docs/reports/codex-real-data-validation-20260505T040447Z.md +46 -0
- package/package.json +9 -5
- package/scripts/build.ts +25 -8
- package/scripts/generate-session-qrels.ts +126 -0
- package/scripts/replay-retrieval-benchmark.ts +69 -0
- package/specs/thin-core-refactor/context.md +275 -0
- package/specs/thin-core-refactor/plan.md +536 -0
- package/specs/thin-core-refactor/spec.md +465 -0
- package/src/adapters/claude/capture/index.ts +3 -0
- package/src/adapters/claude/context/index.ts +3 -0
- package/src/adapters/claude/hooks/index.ts +21 -0
- package/src/adapters/claude/hooks/post-tool-use.ts +239 -0
- package/src/adapters/claude/hooks/prompt-injection-policy.ts +104 -0
- package/src/adapters/claude/hooks/semantic-daemon-client.ts +209 -0
- package/src/adapters/claude/hooks/semantic-daemon.ts +283 -0
- package/src/adapters/claude/hooks/session-end.ts +59 -0
- package/src/adapters/claude/hooks/session-start.ts +73 -0
- package/src/adapters/claude/hooks/stop.ts +128 -0
- package/src/adapters/claude/hooks/user-prompt-submit.ts +361 -0
- package/src/adapters/claude/index.ts +4 -0
- package/src/adapters/claude/transcript/index.ts +4 -0
- package/src/adapters/claude/transcript/transcript-reader.ts +57 -0
- package/src/adapters/claude/transcript/turn-reconstructor.ts +65 -0
- package/src/apps/cli/claude-settings-hooks.ts +138 -0
- package/src/apps/cli/codex-import-runner.ts +125 -0
- package/src/apps/cli/codex-validation-output.ts +95 -0
- package/src/apps/cli/hermes-import-runner.ts +130 -0
- package/src/apps/cli/hermes-validation-output.ts +91 -0
- package/src/apps/cli/index.ts +1731 -0
- package/src/apps/cli/mcp-install.ts +106 -0
- package/src/apps/cli/retrieval-disclosure-output.ts +196 -0
- package/src/apps/dashboard/assets/js/bootstrap.js +244 -0
- package/src/apps/dashboard/assets/js/chat.js +373 -0
- package/src/apps/dashboard/assets/js/disclosure.js +232 -0
- package/src/apps/dashboard/assets/js/modals.js +298 -0
- package/src/apps/dashboard/assets/js/overview.js +655 -0
- package/src/apps/dashboard/assets/js/state.js +72 -0
- package/src/apps/dashboard/assets/js/views.js +468 -0
- package/src/{ui → apps/dashboard}/index.html +43 -1
- package/src/apps/dashboard/index.ts +3 -0
- package/src/{ui → apps/dashboard}/style.css +222 -0
- package/src/apps/index.ts +5 -0
- package/src/apps/server/api/chat.ts +244 -0
- package/src/apps/server/api/citations.ts +105 -0
- package/src/apps/server/api/events.ts +137 -0
- package/src/apps/server/api/health.ts +53 -0
- package/src/apps/server/api/index.ts +26 -0
- package/src/apps/server/api/projects.ts +74 -0
- package/src/apps/server/api/search.ts +184 -0
- package/src/apps/server/api/sessions.ts +115 -0
- package/src/apps/server/api/stats.ts +723 -0
- package/src/apps/server/api/turns.ts +143 -0
- package/src/apps/server/api/utils.ts +65 -0
- package/src/apps/server/index.ts +111 -0
- package/src/cli/index.ts +2 -1311
- package/src/cli/retrieval-disclosure-output.ts +2 -0
- package/src/compat/index.ts +5 -0
- package/src/core/derive/fact-deriver.ts +170 -0
- package/src/core/derive/index.ts +2 -0
- package/src/core/derive/summary-deriver.ts +76 -0
- package/src/core/embedder.ts +4 -152
- package/src/core/engine/embedding-maintenance-service.ts +187 -0
- package/src/core/engine/endless-memory-services.ts +4 -0
- package/src/core/engine/index.ts +19 -0
- package/src/core/engine/memory-engine-services.ts +170 -0
- package/src/core/engine/memory-ingest-service.ts +317 -0
- package/src/core/engine/memory-query-service.ts +173 -0
- package/src/core/engine/memory-runtime-service.ts +162 -0
- package/src/core/engine/memory-service-composition.ts +231 -0
- package/src/core/engine/retrieval-analytics-service.ts +181 -0
- package/src/core/engine/retrieval-disclosure-service.ts +420 -0
- package/src/core/engine/retrieval-orchestrator.ts +377 -0
- package/src/core/engine/retrieval-services.ts +176 -0
- package/src/core/engine/shared-memory-services.ts +4 -0
- package/src/core/entity-repo.ts +1 -3
- package/src/core/event-store.ts +3 -3
- package/src/core/evidence-aligner.ts +2 -2
- package/src/core/external-market-context.ts +582 -0
- package/src/core/graduation.ts +2 -3
- package/src/core/index.ts +21 -0
- package/src/core/matcher.ts +2 -4
- package/src/core/model/memory-fact.ts +30 -0
- package/src/core/model/memory-rule.ts +14 -0
- package/src/core/model/memory-summary.ts +21 -0
- package/src/core/model/raw-event.ts +28 -0
- package/src/core/model/retrieval-result.ts +35 -0
- package/src/core/privacy/filter.ts +21 -10
- package/src/core/product-validation-matrix.ts +314 -0
- package/src/core/progressive-retriever.ts +1 -2
- package/src/core/registry/project-path.ts +54 -0
- package/src/core/registry/session-registry.ts +69 -0
- package/src/core/replay-evaluator.ts +625 -0
- package/src/core/retrieval-benchmark.ts +117 -0
- package/src/core/retrieval-quality.ts +109 -0
- package/src/core/retriever.ts +53 -15
- package/src/core/session-qrels.ts +360 -0
- package/src/core/shared-event-store.ts +1 -1
- package/src/core/sqlite-event-store.ts +35 -11
- package/src/core/task/blocker-resolver.ts +2 -2
- package/src/core/task/task-resolver.ts +0 -1
- package/src/core/vector-outbox.ts +1 -10
- package/src/core/vector-worker.ts +1 -1
- package/src/extensions/endless-memory/endless-memory-services.ts +350 -0
- package/src/extensions/endless-memory/index.ts +1 -0
- package/src/extensions/index.ts +5 -0
- package/src/extensions/mcp/handlers.ts +960 -0
- package/src/extensions/mcp/index.ts +48 -0
- package/src/extensions/mcp/tools.ts +252 -0
- package/src/extensions/shared-memory/index.ts +1 -0
- package/src/extensions/shared-memory/shared-memory-services.ts +211 -0
- package/src/extensions/vector/embedder.ts +197 -0
- package/src/extensions/vector/index.ts +1 -0
- package/src/hooks/post-tool-use.ts +3 -236
- package/src/hooks/semantic-daemon-client.ts +1 -208
- package/src/hooks/semantic-daemon.ts +6 -271
- package/src/hooks/session-end.ts +4 -79
- package/src/hooks/session-start.ts +4 -73
- package/src/hooks/stop.ts +3 -173
- package/src/hooks/user-prompt-submit.ts +3 -338
- package/src/index.ts +13 -0
- package/src/mcp/handlers.ts +2 -212
- package/src/mcp/index.ts +3 -46
- package/src/mcp/tools.ts +2 -78
- package/src/server/api/chat.ts +2 -244
- package/src/server/api/citations.ts +2 -105
- package/src/server/api/events.ts +2 -137
- package/src/server/api/health.ts +2 -53
- package/src/server/api/index.ts +2 -26
- package/src/server/api/projects.ts +2 -74
- package/src/server/api/search.ts +2 -102
- package/src/server/api/sessions.ts +2 -115
- package/src/server/api/stats.ts +2 -724
- package/src/server/api/turns.ts +2 -143
- package/src/server/api/utils.ts +2 -46
- package/src/server/index.ts +2 -100
- package/src/services/bootstrap-organizer.ts +46 -26
- package/src/services/codex-session-history-importer.ts +521 -29
- package/src/services/hermes-session-history-importer.ts +733 -0
- package/src/services/memory-service-config.ts +36 -0
- package/src/services/memory-service-registry.ts +150 -0
- package/src/services/memory-service.ts +211 -1325
- package/src/services/session-history-importer.ts +58 -14
- package/tests/README.md +23 -0
- package/tests/adapters/claude/claude-semantic-daemon-adapter.test.ts +54 -0
- package/tests/adapters/claude/claude-transcript-reconstructor.test.ts +98 -0
- package/tests/adapters/claude-hook-prompt-injection-policy.test.ts +99 -0
- package/tests/apps/app-layer-boundary.test.ts +48 -0
- package/tests/apps/claude-settings-hooks.test.ts +107 -0
- package/tests/apps/cli-disclosure-output.test.ts +212 -0
- package/tests/apps/codex-import-runner.test.ts +99 -0
- package/tests/apps/codex-validation-output.test.ts +100 -0
- package/tests/apps/hermes-import-runner.test.ts +99 -0
- package/tests/apps/mcp-install-command.test.ts +59 -0
- package/tests/apps/package-build-entrypoints.test.ts +30 -0
- package/tests/apps/search-api-disclosure.test.ts +162 -0
- package/tests/apps/stats-api-lightweight.test.ts +67 -0
- package/tests/apps/ui-disclosure-output.test.ts +140 -0
- package/tests/{bootstrap-organizer.test.ts → core/bootstrap-organizer.test.ts} +1 -1
- package/tests/{canonical-key.test.ts → core/canonical-key.test.ts} +1 -1
- package/tests/core/codex-session-history-importer-validation.test.ts +185 -0
- package/tests/{consolidation-worker.test.ts → core/consolidation-worker.test.ts} +2 -2
- package/tests/core/embedding-maintenance-service.test.ts +282 -0
- package/tests/{evidence-aligner.test.ts → core/evidence-aligner.test.ts} +1 -1
- package/tests/core/external-market-context.test.ts +209 -0
- package/tests/core/fact-deriver.test.ts +79 -0
- package/tests/core/hermes-session-history-importer-validation.test.ts +609 -0
- package/tests/{ingest-interceptor.test.ts → core/ingest-interceptor.test.ts} +1 -1
- package/tests/{markdown-mirror.test.ts → core/markdown-mirror.test.ts} +2 -2
- package/tests/{matcher.test.ts → core/matcher.test.ts} +1 -1
- package/tests/{md-mirror.test.ts → core/md-mirror.test.ts} +2 -2
- package/tests/core/memory-engine-services.test.ts +240 -0
- package/tests/core/memory-ingest-service.test.ts +296 -0
- package/tests/core/memory-query-service.test.ts +129 -0
- package/tests/core/memory-runtime-service.test.ts +201 -0
- package/tests/core/memory-service-composition.test.ts +192 -0
- package/tests/core/memory-service-config.test.ts +41 -0
- package/tests/core/memory-service-facade.test.ts +30 -0
- package/tests/core/memory-service-registry.test.ts +206 -0
- package/tests/core/product-validation-matrix.test.ts +61 -0
- package/tests/core/project-registry.test.ts +78 -0
- package/tests/core/replay-evaluator.test.ts +181 -0
- package/tests/core/retrieval-analytics-service.test.ts +210 -0
- package/tests/core/retrieval-benchmark.test.ts +93 -0
- package/tests/core/retrieval-disclosure-service.test.ts +264 -0
- package/tests/core/retrieval-orchestrator.test.ts +403 -0
- package/tests/core/retrieval-quality.test.ts +31 -0
- package/tests/core/retrieval-services.test.ts +185 -0
- package/tests/{retriever-fallback-chain.test.ts → core/retriever-fallback-chain.test.ts} +3 -3
- package/tests/{retriever-strategy-scope.test.ts → core/retriever-strategy-scope.test.ts} +70 -3
- package/tests/{retriever.memu-adoption.test.ts → core/retriever.memu-adoption.test.ts} +3 -3
- package/tests/core/session-history-importer-filter.test.ts +78 -0
- package/tests/core/session-qrels.test.ts +250 -0
- package/tests/{sqlite-event-store-replication.test.ts → core/sqlite-event-store-replication.test.ts} +36 -1
- package/tests/core/summary-deriver.test.ts +66 -0
- package/tests/extensions/embedder-warning-suppression.test.ts +53 -0
- package/tests/extensions/endless-memory-extension-boundary.test.ts +17 -0
- package/tests/extensions/endless-memory-services.test.ts +325 -0
- package/tests/extensions/mcp-context-tools.test.ts +905 -0
- package/tests/extensions/mcp-extension-boundary.test.ts +21 -0
- package/tests/extensions/mcp-package-build.test.ts +22 -0
- package/tests/extensions/mcp-project-aware-tools.test.ts +102 -0
- package/tests/extensions/shared-memory-extension-boundary.test.ts +24 -0
- package/tests/extensions/shared-memory-services.test.ts +309 -0
- package/tests/extensions/vector-extension-boundary.test.ts +21 -0
- package/.claude/settings.local.json +0 -25
- package/.npm-cache/_cacache/content-v2/sha512/04/76/c098f88dfe584a2b80870bff7421b05d17d3d9ee1027f77772332a22d3f93a9a57101a2855107f6ad82077a818bba912b2bc317f2361b5ddb09ad284d9ce +0 -0
- package/.npm-cache/_cacache/content-v2/sha512/60/25/d2ecd39cfc7cab58351162814be77f935c6d6491c10c3745d456da7ddb2117ffd90c10e53fe3c0f1ed16b403307841543634504398b16ee4e6b6dd8e0c45 +0 -0
- package/.npm-cache/_cacache/index-v5/2b/9a/7f8f40206ed8a2e0a84efaa953ccaed1f5d001e14b931083f2e7a0738007 +0 -2
- package/.npm-cache/_cacache/index-v5/2e/d9/fcfa5c6a6abdc2a3644ab84a95936047298c465a2f47ee03db8f7fe1e946 +0 -3
- package/.npm-cache/_cacache/index-v5/a9/42/e519633356d12d3d2f19da66a8301016d496c8f5c3e0554124aaa62dc043 +0 -2
- package/.npm-cache/_logs/2026-02-26T12_04_52_729Z-debug-0.log +0 -256
- package/.npm-cache/_logs/2026-02-26T12_05_36_835Z-debug-0.log +0 -18
- package/.npm-cache/_logs/2026-02-26T12_05_45_982Z-debug-0.log +0 -32
- package/.npm-cache/_logs/2026-02-26T12_05_48_515Z-debug-0.log +0 -260
- package/.npm-cache/_logs/2026-02-26T12_05_53_567Z-debug-0.log +0 -69
- package/.npm-cache/_update-notifier-last-checked +0 -0
- package/bootstrap-kb/decisions/decisions.md +0 -244
- package/bootstrap-kb/glossary/glossary.md +0 -46
- package/bootstrap-kb/modules/.claude-plugin.md +0 -22
- package/bootstrap-kb/modules/agents.md.md +0 -15
- package/bootstrap-kb/modules/claude.md.md +0 -15
- package/bootstrap-kb/modules/context.md.md +0 -15
- package/bootstrap-kb/modules/docs.md +0 -18
- package/bootstrap-kb/modules/handoff.md.md +0 -15
- package/bootstrap-kb/modules/package-lock.json.md +0 -15
- package/bootstrap-kb/modules/package.json.md +0 -15
- package/bootstrap-kb/modules/plan.md.md +0 -15
- package/bootstrap-kb/modules/readme.md.md +0 -15
- package/bootstrap-kb/modules/scripts.md +0 -26
- package/bootstrap-kb/modules/spec.md.md +0 -15
- package/bootstrap-kb/modules/specs.md +0 -20
- package/bootstrap-kb/modules/src.md +0 -51
- package/bootstrap-kb/modules/tests.md +0 -42
- package/bootstrap-kb/modules/tsconfig.json.md +0 -15
- package/bootstrap-kb/modules/vitest.config.ts.md +0 -15
- package/bootstrap-kb/overview/overview.md +0 -40
- package/bootstrap-kb/sources/manifest.json +0 -950
- package/bootstrap-kb/sources/manifest.md +0 -227
- package/bootstrap-kb/timeline/timeline.md +0 -57
- package/claude-memory-layer-1.0.14.tgz +0 -0
- package/d.sh +0 -3
- package/deploy.sh +0 -3
- package/dist/ui/app.js +0 -2101
- package/memory/.claude-plugin/commands/2026-02-25.md +0 -263
- package/memory/_index.md +0 -418
- package/memory/agent_response/uncategorized/2026-02-26.md +0 -176
- package/memory/agent_response/uncategorized/2026-03-03.md +0 -14
- package/memory/agent_response/uncategorized/2026-03-04.md +0 -1421
- package/memory/agent_response/uncategorized/2026-03-05.md +0 -48
- package/memory/default/uncategorized/2026-02-25.md +0 -4839
- package/memory/session_summary/uncategorized/2026-02-26.md +0 -13
- package/memory/session_summary/uncategorized/2026-03-03.md +0 -5
- package/memory/session_summary/uncategorized/2026-03-04.md +0 -50
- package/memory/specs/20260207-dashboard-upgrade/2026-02-25.md +0 -142
- package/memory/specs/citations-system/2026-02-25.md +0 -1121
- package/memory/specs/endless-mode/2026-02-25.md +0 -1392
- package/memory/specs/entity-edge-model/2026-02-25.md +0 -1263
- package/memory/specs/evidence-aligner-v2/2026-02-25.md +0 -1028
- package/memory/specs/mcp-desktop-integration/2026-02-25.md +0 -1334
- package/memory/specs/post-tool-use-hook/2026-02-25.md +0 -1164
- package/memory/specs/private-tags/2026-02-25.md +0 -1057
- package/memory/specs/progressive-disclosure/2026-02-25.md +0 -1436
- package/memory/specs/task-entity-system/2026-02-25.md +0 -924
- package/memory/specs/vector-outbox-v2/2026-02-25.md +0 -1510
- package/memory/specs/web-viewer-ui/2026-02-25.md +0 -1709
- package/memory/tool_observation/uncategorized/2026-02-26.md +0 -209
- package/memory/tool_observation/uncategorized/2026-03-03.md +0 -21
- package/memory/tool_observation/uncategorized/2026-03-04.md +0 -1033
- package/memory/tool_observation/uncategorized/2026-03-05.md +0 -29
- package/memory/user_prompt/uncategorized/2026-02-26.md +0 -25
- package/memory/user_prompt/uncategorized/2026-03-04.md +0 -634
- package/specs/optional-duckdb/context.md +0 -77
- package/specs/optional-duckdb/plan.md +0 -142
- package/specs/optional-duckdb/spec.md +0 -35
- package/src/ui/app.js +0 -2101
|
@@ -0,0 +1,117 @@
|
|
|
1
|
+
export interface ReplayMetricInput {
|
|
2
|
+
queryId: string;
|
|
3
|
+
expectedIds: string[];
|
|
4
|
+
retrievedIds: string[];
|
|
5
|
+
/** Optional graded qrels labels. Missing expected ids default to relevance 1. */
|
|
6
|
+
expectedRelevance?: Record<string, number>;
|
|
7
|
+
}
|
|
8
|
+
|
|
9
|
+
export interface PrecisionRecallAtK {
|
|
10
|
+
precision: number;
|
|
11
|
+
recall: number;
|
|
12
|
+
hits: number;
|
|
13
|
+
ndcg: number;
|
|
14
|
+
}
|
|
15
|
+
|
|
16
|
+
export interface ReplayQueryMetrics {
|
|
17
|
+
queryId: string;
|
|
18
|
+
at: Record<number, PrecisionRecallAtK>;
|
|
19
|
+
}
|
|
20
|
+
|
|
21
|
+
export interface ReplayMetricsSummary {
|
|
22
|
+
queryCount: number;
|
|
23
|
+
precisionAtK: Record<number, number>;
|
|
24
|
+
recallAtK: Record<number, number>;
|
|
25
|
+
ndcgAtK: Record<number, number>;
|
|
26
|
+
}
|
|
27
|
+
|
|
28
|
+
export function computePrecisionRecallAtK(
|
|
29
|
+
inputs: ReplayMetricInput[],
|
|
30
|
+
ks: number[]
|
|
31
|
+
): ReplayQueryMetrics[] {
|
|
32
|
+
const normalizedKs = normalizeKs(ks);
|
|
33
|
+
return inputs.map((input) => {
|
|
34
|
+
const expected = new Set(input.expectedIds);
|
|
35
|
+
const relevance = normalizeRelevance(input.expectedIds, input.expectedRelevance);
|
|
36
|
+
const at: Record<number, PrecisionRecallAtK> = {};
|
|
37
|
+
|
|
38
|
+
for (const k of normalizedKs) {
|
|
39
|
+
const retrieved = input.retrievedIds.slice(0, k);
|
|
40
|
+
const hits = new Set(retrieved.filter((id) => expected.has(id))).size;
|
|
41
|
+
at[k] = {
|
|
42
|
+
precision: k === 0 ? 0 : hits / k,
|
|
43
|
+
recall: expected.size === 0 ? 0 : hits / expected.size,
|
|
44
|
+
hits,
|
|
45
|
+
ndcg: computeNdcgAtK(retrieved, relevance, k)
|
|
46
|
+
};
|
|
47
|
+
}
|
|
48
|
+
|
|
49
|
+
return { queryId: input.queryId, at };
|
|
50
|
+
});
|
|
51
|
+
}
|
|
52
|
+
|
|
53
|
+
export function summarizeReplayMetrics(
|
|
54
|
+
metrics: ReplayQueryMetrics[],
|
|
55
|
+
ks: number[]
|
|
56
|
+
): ReplayMetricsSummary {
|
|
57
|
+
const normalizedKs = normalizeKs(ks);
|
|
58
|
+
const precisionAtK: Record<number, number> = {};
|
|
59
|
+
const recallAtK: Record<number, number> = {};
|
|
60
|
+
const ndcgAtK: Record<number, number> = {};
|
|
61
|
+
|
|
62
|
+
for (const k of normalizedKs) {
|
|
63
|
+
precisionAtK[k] = average(metrics.map((metric) => metric.at[k]?.precision ?? 0));
|
|
64
|
+
recallAtK[k] = average(metrics.map((metric) => metric.at[k]?.recall ?? 0));
|
|
65
|
+
ndcgAtK[k] = average(metrics.map((metric) => metric.at[k]?.ndcg ?? 0));
|
|
66
|
+
}
|
|
67
|
+
|
|
68
|
+
return { queryCount: metrics.length, precisionAtK, recallAtK, ndcgAtK };
|
|
69
|
+
}
|
|
70
|
+
|
|
71
|
+
function normalizeKs(ks: number[]): number[] {
|
|
72
|
+
const seen = new Set<number>();
|
|
73
|
+
const normalized: number[] = [];
|
|
74
|
+
|
|
75
|
+
for (const rawK of ks) {
|
|
76
|
+
const k = Math.max(0, Math.floor(rawK));
|
|
77
|
+
if (seen.has(k)) continue;
|
|
78
|
+
seen.add(k);
|
|
79
|
+
normalized.push(k);
|
|
80
|
+
}
|
|
81
|
+
|
|
82
|
+
return normalized.sort((a, b) => a - b);
|
|
83
|
+
}
|
|
84
|
+
|
|
85
|
+
function normalizeRelevance(expectedIds: string[], expectedRelevance?: Record<string, number>): Record<string, number> {
|
|
86
|
+
const relevance: Record<string, number> = {};
|
|
87
|
+
for (const id of expectedIds) {
|
|
88
|
+
const raw = expectedRelevance?.[id] ?? 1;
|
|
89
|
+
relevance[id] = Number.isFinite(raw) ? Math.max(0, raw) : 0;
|
|
90
|
+
}
|
|
91
|
+
return relevance;
|
|
92
|
+
}
|
|
93
|
+
|
|
94
|
+
function computeNdcgAtK(retrieved: string[], relevance: Record<string, number>, k: number): number {
|
|
95
|
+
if (k <= 0) return 0;
|
|
96
|
+
|
|
97
|
+
const seen = new Set<string>();
|
|
98
|
+
const dcg = retrieved.reduce((sum, id, index) => {
|
|
99
|
+
if (seen.has(id)) return sum;
|
|
100
|
+
seen.add(id);
|
|
101
|
+
return sum + discountedGain(relevance[id] ?? 0, index);
|
|
102
|
+
}, 0);
|
|
103
|
+
|
|
104
|
+
const idealRelevance = Object.values(relevance).sort((a, b) => b - a).slice(0, k);
|
|
105
|
+
const idealDcg = idealRelevance.reduce((sum, rel, index) => sum + discountedGain(rel, index), 0);
|
|
106
|
+
return idealDcg === 0 ? 0 : dcg / idealDcg;
|
|
107
|
+
}
|
|
108
|
+
|
|
109
|
+
function discountedGain(relevance: number, zeroBasedRank: number): number {
|
|
110
|
+
if (relevance <= 0) return 0;
|
|
111
|
+
return (2 ** relevance - 1) / Math.log2(zeroBasedRank + 2);
|
|
112
|
+
}
|
|
113
|
+
|
|
114
|
+
function average(values: number[]): number {
|
|
115
|
+
if (values.length === 0) return 0;
|
|
116
|
+
return values.reduce((sum, value) => sum + value, 0) / values.length;
|
|
117
|
+
}
|
|
@@ -0,0 +1,109 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Retrieval quality guards.
|
|
3
|
+
*
|
|
4
|
+
* These are deliberately small deterministic heuristics used to avoid injecting
|
|
5
|
+
* obviously irrelevant memories. They are not a second source of truth; they
|
|
6
|
+
* only filter candidate retrieval results before context assembly.
|
|
7
|
+
*/
|
|
8
|
+
|
|
9
|
+
const COMMAND_ARTIFACT_PATTERNS = [
|
|
10
|
+
/<\/?(?:local-command-(?:stdout|stderr)|command-(?:name|message))\b/i,
|
|
11
|
+
/<command-name>[\s\S]*?<\/command-name>/i,
|
|
12
|
+
/<local-command-stdout>[\s\S]*?<\/local-command-stdout>/i,
|
|
13
|
+
/<local-command-stderr>[\s\S]*?<\/local-command-stderr>/i
|
|
14
|
+
];
|
|
15
|
+
|
|
16
|
+
const LOW_SIGNAL_CONTEXT_PATTERNS = [
|
|
17
|
+
/<environment_context\b[\s\S]*<\/environment_context>/i,
|
|
18
|
+
/<turn_aborted>/i,
|
|
19
|
+
/^#\s*AGENTS\.md\s+instructions\b[\s\S]*<INSTRUCTIONS>/i,
|
|
20
|
+
/^\s*(?:understood[,\s.]*)?(?:stopping|stopped|pausing|paused)\s+here\b[\s\S]{0,180}\blet\s+me\s+know\s+when\s+you(?:'d|\s+would)?\s+like\s+to\s+continue\b/i,
|
|
21
|
+
/^➜\s+\S+\s+git:\([^)]*\)\s+/i,
|
|
22
|
+
/^\$\s+\S+/i
|
|
23
|
+
];
|
|
24
|
+
|
|
25
|
+
const CONTINUATION_QUERY_PATTERNS = [
|
|
26
|
+
/^\s*(?:continue|resume|next|what(?:'s| is)? next|next\s+(?:step|task|action)|recommended\s+(?:next\s+)?(?:step|task|action)|what should (?:we|i) do next)\??\s*$/i,
|
|
27
|
+
/^\s*(?:이어서(?:\s*진행해줘)?|계속(?:\s*해줘)?|다음\s*(?:단계|작업|추천\s*작업|추천|할\s*일)?(?:은|는)?(?:\s*뭐야)?\??|추천\s*작업(?:은|는)?(?:\s*뭐야)?\??|진행해줘)\s*$/i
|
|
28
|
+
];
|
|
29
|
+
|
|
30
|
+
const GENERIC_TECHNICAL_TERMS = new Set([
|
|
31
|
+
'api',
|
|
32
|
+
'cli',
|
|
33
|
+
'ui',
|
|
34
|
+
'json',
|
|
35
|
+
'jsonl',
|
|
36
|
+
'html',
|
|
37
|
+
'http',
|
|
38
|
+
'https',
|
|
39
|
+
'url',
|
|
40
|
+
'uri',
|
|
41
|
+
'id',
|
|
42
|
+
'ids',
|
|
43
|
+
'uuid',
|
|
44
|
+
'db',
|
|
45
|
+
'sql'
|
|
46
|
+
]);
|
|
47
|
+
|
|
48
|
+
export function isCommandArtifactQuery(query: string): boolean {
|
|
49
|
+
const trimmed = query.trim();
|
|
50
|
+
if (!trimmed) return false;
|
|
51
|
+
const normalized = trimmed.toLowerCase();
|
|
52
|
+
if (normalized.includes('local-command-stdout') || normalized.includes('local-command-stderr')) return true;
|
|
53
|
+
if (normalized.includes('command-name') || normalized.includes('command-message')) return true;
|
|
54
|
+
return COMMAND_ARTIFACT_PATTERNS.some((pattern) => pattern.test(trimmed));
|
|
55
|
+
}
|
|
56
|
+
|
|
57
|
+
export function isCommandArtifactContent(content: string): boolean {
|
|
58
|
+
const trimmed = content.trim();
|
|
59
|
+
if (!trimmed) return false;
|
|
60
|
+
const normalized = trimmed.toLowerCase();
|
|
61
|
+
if (normalized.includes('local-command-stdout') || normalized.includes('local-command-stderr')) return true;
|
|
62
|
+
if (normalized.includes('command-name') || normalized.includes('command-message')) return true;
|
|
63
|
+
return COMMAND_ARTIFACT_PATTERNS.some((pattern) => pattern.test(trimmed));
|
|
64
|
+
}
|
|
65
|
+
|
|
66
|
+
export function isLowSignalContextContent(content: string): boolean {
|
|
67
|
+
const trimmed = content.trim();
|
|
68
|
+
if (!trimmed) return true;
|
|
69
|
+
if (isCommandArtifactContent(trimmed)) return true;
|
|
70
|
+
if (LOW_SIGNAL_CONTEXT_PATTERNS.some((pattern) => pattern.test(trimmed))) return true;
|
|
71
|
+
return false;
|
|
72
|
+
}
|
|
73
|
+
|
|
74
|
+
export function isGenericContinuationQuery(query: string): boolean {
|
|
75
|
+
const trimmed = query.trim();
|
|
76
|
+
if (!trimmed) return false;
|
|
77
|
+
if (!CONTINUATION_QUERY_PATTERNS.some((pattern) => pattern.test(trimmed))) return false;
|
|
78
|
+
if (extractTechnicalQueryTerms(trimmed).length > 0) return false;
|
|
79
|
+
|
|
80
|
+
const tokens = trimmed.match(/[A-Za-z0-9가-힣#._/-]+/g) ?? [];
|
|
81
|
+
if (tokens.length > 10) return false;
|
|
82
|
+
|
|
83
|
+
return !/[A-Za-z0-9_-]+\.[A-Za-z0-9]+/.test(trimmed) &&
|
|
84
|
+
!/(?:^|\s)(?:feat|fix|chore|refactor|docs)\/[A-Za-z0-9._-]+/.test(trimmed) &&
|
|
85
|
+
!/[A-Za-z]:?[\\/]|\/Users\/|\.\/|\.\.\//.test(trimmed);
|
|
86
|
+
}
|
|
87
|
+
|
|
88
|
+
export function extractTechnicalQueryTerms(query: string): string[] {
|
|
89
|
+
const matches = query.match(/[A-Za-z][A-Za-z0-9_.:-]{2,}/g) ?? [];
|
|
90
|
+
const terms = matches.filter((term) => {
|
|
91
|
+
const lower = term.toLowerCase();
|
|
92
|
+
if (GENERIC_TECHNICAL_TERMS.has(lower)) return false;
|
|
93
|
+
return /[._:-]/.test(term) || /[a-z][A-Z]/.test(term) || /[A-Z]{2,}/.test(term) || /\d/.test(term);
|
|
94
|
+
});
|
|
95
|
+
|
|
96
|
+
return Array.from(new Set(terms.map((term) => term.toLowerCase())));
|
|
97
|
+
}
|
|
98
|
+
|
|
99
|
+
export function hasTechnicalTermOverlap(query: string, content: string): boolean {
|
|
100
|
+
const terms = extractTechnicalQueryTerms(query);
|
|
101
|
+
if (terms.length === 0) return true;
|
|
102
|
+
|
|
103
|
+
const normalizedContent = content.toLowerCase();
|
|
104
|
+
return terms.some((term) => normalizedContent.includes(term));
|
|
105
|
+
}
|
|
106
|
+
|
|
107
|
+
export function shouldApplyTechnicalGuard(query: string): boolean {
|
|
108
|
+
return extractTechnicalQueryTerms(query).length > 0;
|
|
109
|
+
}
|
package/src/core/retriever.ts
CHANGED
|
@@ -10,6 +10,11 @@ import { Matcher } from './matcher.js';
|
|
|
10
10
|
import { SharedStore } from './shared-store.js';
|
|
11
11
|
import { SharedVectorStore } from './shared-vector-store.js';
|
|
12
12
|
import { GraduationPipeline } from './graduation.js';
|
|
13
|
+
import {
|
|
14
|
+
hasTechnicalTermOverlap,
|
|
15
|
+
isCommandArtifactQuery,
|
|
16
|
+
shouldApplyTechnicalGuard
|
|
17
|
+
} from './retrieval-quality.js';
|
|
13
18
|
import type { MemoryEvent, MatchResult, SharedTroubleshootingEntry } from './types.js';
|
|
14
19
|
|
|
15
20
|
export interface RetrievalScope {
|
|
@@ -23,6 +28,8 @@ export interface RetrievalScope {
|
|
|
23
28
|
|
|
24
29
|
export type RetrievalStrategy = 'auto' | 'fast' | 'deep';
|
|
25
30
|
export type ProjectScopeMode = 'strict' | 'prefer' | 'global';
|
|
31
|
+
type DecayPolicy = NonNullable<RetrievalOptions['decayPolicy']>;
|
|
32
|
+
type GraphHopOptions = NonNullable<RetrievalOptions['graphHop']>;
|
|
26
33
|
|
|
27
34
|
export interface RetrievalOptions {
|
|
28
35
|
topK: number;
|
|
@@ -166,6 +173,20 @@ export class Retriever {
|
|
|
166
173
|
const sessionFilter = opts.scope?.sessionId ?? opts.sessionId;
|
|
167
174
|
const fallbackTrace: string[] = [];
|
|
168
175
|
|
|
176
|
+
if (isCommandArtifactQuery(query)) {
|
|
177
|
+
fallbackTrace.push('guard:command-artifact-query');
|
|
178
|
+
const emptyMatch = this.matcher.matchSearchResults([], () => 0);
|
|
179
|
+
return {
|
|
180
|
+
memories: [],
|
|
181
|
+
matchResult: emptyMatch,
|
|
182
|
+
totalTokens: 0,
|
|
183
|
+
context: '',
|
|
184
|
+
fallbackTrace,
|
|
185
|
+
selectedDebug: [],
|
|
186
|
+
candidateDebug: []
|
|
187
|
+
};
|
|
188
|
+
}
|
|
189
|
+
|
|
169
190
|
const fallbackEnabled = (opts.strategy ?? 'auto') === 'auto';
|
|
170
191
|
|
|
171
192
|
// Stage 1: primary retrieval
|
|
@@ -311,28 +332,21 @@ export class Retriever {
|
|
|
311
332
|
minScore: number;
|
|
312
333
|
sessionId?: string;
|
|
313
334
|
scope?: RetrievalScope;
|
|
314
|
-
rerankWithKeyword
|
|
335
|
+
rerankWithKeyword?: boolean;
|
|
315
336
|
rerankWeights?: {
|
|
316
337
|
semantic?: number;
|
|
317
338
|
lexical?: number;
|
|
318
339
|
recency?: number;
|
|
319
340
|
};
|
|
320
|
-
decayPolicy?:
|
|
321
|
-
enabled?: boolean;
|
|
322
|
-
windowDays?: number;
|
|
323
|
-
maxPenalty?: number;
|
|
324
|
-
};
|
|
341
|
+
decayPolicy?: DecayPolicy;
|
|
325
342
|
intentRewrite?: boolean;
|
|
326
|
-
graphHop?:
|
|
327
|
-
enabled?: boolean;
|
|
328
|
-
maxHops?: number;
|
|
329
|
-
hopPenalty?: number;
|
|
330
|
-
};
|
|
343
|
+
graphHop?: GraphHopOptions;
|
|
331
344
|
projectScopeMode?: ProjectScopeMode;
|
|
332
345
|
projectHash?: string;
|
|
333
346
|
allowedProjectHashes?: string[];
|
|
334
347
|
}
|
|
335
|
-
): Promise<{ results: SearchResult[]; matchResult: MatchResult }> {
|
|
348
|
+
): Promise<{ results: SearchResult[]; candidateResults: SearchResult[]; matchResult: MatchResult }> {
|
|
349
|
+
let rerankQuery = query;
|
|
336
350
|
let initialResults = await this.searchByStrategy(query, {
|
|
337
351
|
strategy: input.strategy,
|
|
338
352
|
topK: input.topK,
|
|
@@ -343,6 +357,7 @@ export class Retriever {
|
|
|
343
357
|
if (input.intentRewrite && input.strategy === 'deep' && this.queryRewriter) {
|
|
344
358
|
const rewritten = (await this.queryRewriter(query))?.trim();
|
|
345
359
|
if (rewritten && rewritten !== query) {
|
|
360
|
+
rerankQuery = `${query} ${rewritten}`;
|
|
346
361
|
const rewrittenResults = await this.searchByStrategy(rewritten, {
|
|
347
362
|
strategy: 'deep',
|
|
348
363
|
topK: input.topK,
|
|
@@ -362,7 +377,7 @@ export class Retriever {
|
|
|
362
377
|
});
|
|
363
378
|
|
|
364
379
|
const rerankedResults = input.rerankWithKeyword
|
|
365
|
-
? this.rerankByKeywordOverlap(expandedResults,
|
|
380
|
+
? this.rerankByKeywordOverlap(expandedResults, rerankQuery, input.rerankWeights, input.decayPolicy)
|
|
366
381
|
: expandedResults;
|
|
367
382
|
|
|
368
383
|
const filtered = await this.applyScopeFilters(rerankedResults, {
|
|
@@ -371,10 +386,33 @@ export class Retriever {
|
|
|
371
386
|
projectHash: input.projectHash,
|
|
372
387
|
allowedProjectHashes: input.allowedProjectHashes
|
|
373
388
|
});
|
|
374
|
-
const
|
|
389
|
+
const qualityFiltered = this.applyQualityFilters(filtered, {
|
|
390
|
+
query,
|
|
391
|
+
minScore: input.minScore
|
|
392
|
+
});
|
|
393
|
+
const top = qualityFiltered.slice(0, input.topK);
|
|
375
394
|
const matchResult = this.matcher.matchSearchResults(top, () => 0);
|
|
376
395
|
|
|
377
|
-
return { results: top, candidateResults:
|
|
396
|
+
return { results: top, candidateResults: qualityFiltered, matchResult };
|
|
397
|
+
}
|
|
398
|
+
|
|
399
|
+
private applyQualityFilters(
|
|
400
|
+
results: Array<SearchResult & { semanticScore?: number; lexicalScore?: number; recencyScore?: number }>,
|
|
401
|
+
options: { query: string; minScore: number }
|
|
402
|
+
): Array<SearchResult & { semanticScore?: number; lexicalScore?: number; recencyScore?: number }> {
|
|
403
|
+
let filtered = [...results];
|
|
404
|
+
|
|
405
|
+
if (shouldApplyTechnicalGuard(options.query)) {
|
|
406
|
+
filtered = filtered.filter((result) => hasTechnicalTermOverlap(options.query, result.content));
|
|
407
|
+
}
|
|
408
|
+
|
|
409
|
+
if (filtered.length <= 2) return filtered;
|
|
410
|
+
|
|
411
|
+
const topScore = filtered[0].score;
|
|
412
|
+
if (topScore < 0.8) return filtered;
|
|
413
|
+
|
|
414
|
+
const cliffThreshold = Math.max(options.minScore, topScore - 0.25);
|
|
415
|
+
return filtered.filter((result) => result.score >= cliffThreshold);
|
|
378
416
|
}
|
|
379
417
|
|
|
380
418
|
private mergeResults(primary: SearchResult[], secondary: SearchResult[], limit: number): SearchResult[] {
|