claude-memory-layer 1.0.26 → 1.0.28

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (328) hide show
  1. package/.env.example +7 -0
  2. package/AGENTS.md +11 -0
  3. package/README.md +184 -41
  4. package/benchmarks/replay/anonymized-real-sessions.json +48 -0
  5. package/dist/cli/index.js +10097 -6003
  6. package/dist/cli/index.js.map +4 -4
  7. package/dist/core/index.js +9745 -5587
  8. package/dist/core/index.js.map +4 -4
  9. package/dist/hooks/post-tool-use.js +6545 -5270
  10. package/dist/hooks/post-tool-use.js.map +4 -4
  11. package/dist/hooks/semantic-daemon.js +6646 -5354
  12. package/dist/hooks/semantic-daemon.js.map +4 -4
  13. package/dist/hooks/session-end.js +6618 -5347
  14. package/dist/hooks/session-end.js.map +4 -4
  15. package/dist/hooks/session-start.js +6619 -5354
  16. package/dist/hooks/session-start.js.map +4 -4
  17. package/dist/hooks/stop.js +6614 -5325
  18. package/dist/hooks/stop.js.map +4 -4
  19. package/dist/hooks/user-prompt-submit.js +6702 -5356
  20. package/dist/hooks/user-prompt-submit.js.map +4 -4
  21. package/dist/index.js +13537 -0
  22. package/dist/index.js.map +7 -0
  23. package/dist/mcp/index.js +20770 -0
  24. package/dist/mcp/index.js.map +7 -0
  25. package/dist/server/api/index.js +6632 -5319
  26. package/dist/server/api/index.js.map +4 -4
  27. package/dist/server/index.js +6667 -5340
  28. package/dist/server/index.js.map +4 -4
  29. package/dist/services/memory-service.js +6568 -5350
  30. package/dist/services/memory-service.js.map +4 -4
  31. package/dist/ui/assets/js/bootstrap.js +244 -0
  32. package/dist/ui/assets/js/chat.js +373 -0
  33. package/dist/ui/assets/js/disclosure.js +232 -0
  34. package/dist/ui/assets/js/modals.js +298 -0
  35. package/dist/ui/assets/js/overview.js +655 -0
  36. package/dist/ui/assets/js/state.js +72 -0
  37. package/dist/ui/assets/js/views.js +468 -0
  38. package/dist/ui/index.html +43 -1
  39. package/dist/ui/index.ts +3 -0
  40. package/dist/ui/style.css +222 -0
  41. package/docs/ARCHITECTURE_COMPARISON_AND_RECOMMENDATIONS.md +627 -0
  42. package/docs/HERMES_MEMORY_INGESTION_ANALYSIS.md +440 -0
  43. package/docs/MEMORY_USEFULNESS_AUDIT.md +371 -0
  44. package/docs/MEMORY_USEFULNESS_AUDIT_RAW.json +80 -0
  45. package/docs/MEMSEARCH_PROJECT_STRUCTURE_ANALYSIS.md +333 -0
  46. package/docs/PRODUCT_VALIDATION_MATRIX.md +82 -0
  47. package/docs/PROJECT_STRUCTURE_ANALYSIS.md +421 -0
  48. package/docs/REFACTORING_MILESTONES_AND_ISSUES.md +501 -0
  49. package/docs/REFACTORING_PLAN_THIN_CORE.md +414 -0
  50. package/docs/REFERENCE_PROJECT_ANALYSES.md +25 -0
  51. package/docs/SUPERLOCALMEMORY_PROJECT_STRUCTURE_ANALYSIS.md +452 -0
  52. package/docs/TARGET_ARCHITECTURE_AND_FOLDER_STRUCTURE.md +446 -0
  53. package/docs/architecture/comparison-index.md +47 -0
  54. package/docs/reports/codex-real-data-validation-20260505T040447Z.md +46 -0
  55. package/package.json +9 -5
  56. package/scripts/build.ts +25 -8
  57. package/scripts/generate-session-qrels.ts +126 -0
  58. package/scripts/replay-retrieval-benchmark.ts +69 -0
  59. package/specs/thin-core-refactor/context.md +275 -0
  60. package/specs/thin-core-refactor/plan.md +536 -0
  61. package/specs/thin-core-refactor/spec.md +465 -0
  62. package/src/adapters/claude/capture/index.ts +3 -0
  63. package/src/adapters/claude/context/index.ts +3 -0
  64. package/src/adapters/claude/hooks/index.ts +21 -0
  65. package/src/adapters/claude/hooks/post-tool-use.ts +239 -0
  66. package/src/adapters/claude/hooks/prompt-injection-policy.ts +104 -0
  67. package/src/adapters/claude/hooks/semantic-daemon-client.ts +209 -0
  68. package/src/adapters/claude/hooks/semantic-daemon.ts +283 -0
  69. package/src/adapters/claude/hooks/session-end.ts +59 -0
  70. package/src/adapters/claude/hooks/session-start.ts +73 -0
  71. package/src/adapters/claude/hooks/stop.ts +128 -0
  72. package/src/adapters/claude/hooks/user-prompt-submit.ts +361 -0
  73. package/src/adapters/claude/index.ts +4 -0
  74. package/src/adapters/claude/transcript/index.ts +4 -0
  75. package/src/adapters/claude/transcript/transcript-reader.ts +57 -0
  76. package/src/adapters/claude/transcript/turn-reconstructor.ts +65 -0
  77. package/src/apps/cli/claude-settings-hooks.ts +138 -0
  78. package/src/apps/cli/codex-import-runner.ts +125 -0
  79. package/src/apps/cli/codex-validation-output.ts +95 -0
  80. package/src/apps/cli/hermes-import-runner.ts +130 -0
  81. package/src/apps/cli/hermes-validation-output.ts +91 -0
  82. package/src/apps/cli/index.ts +1731 -0
  83. package/src/apps/cli/mcp-install.ts +106 -0
  84. package/src/apps/cli/retrieval-disclosure-output.ts +196 -0
  85. package/src/apps/dashboard/assets/js/bootstrap.js +244 -0
  86. package/src/apps/dashboard/assets/js/chat.js +373 -0
  87. package/src/apps/dashboard/assets/js/disclosure.js +232 -0
  88. package/src/apps/dashboard/assets/js/modals.js +298 -0
  89. package/src/apps/dashboard/assets/js/overview.js +655 -0
  90. package/src/apps/dashboard/assets/js/state.js +72 -0
  91. package/src/apps/dashboard/assets/js/views.js +468 -0
  92. package/src/{ui → apps/dashboard}/index.html +43 -1
  93. package/src/apps/dashboard/index.ts +3 -0
  94. package/src/{ui → apps/dashboard}/style.css +222 -0
  95. package/src/apps/index.ts +5 -0
  96. package/src/apps/server/api/chat.ts +244 -0
  97. package/src/apps/server/api/citations.ts +105 -0
  98. package/src/apps/server/api/events.ts +137 -0
  99. package/src/apps/server/api/health.ts +53 -0
  100. package/src/apps/server/api/index.ts +26 -0
  101. package/src/apps/server/api/projects.ts +74 -0
  102. package/src/apps/server/api/search.ts +184 -0
  103. package/src/apps/server/api/sessions.ts +115 -0
  104. package/src/apps/server/api/stats.ts +723 -0
  105. package/src/apps/server/api/turns.ts +143 -0
  106. package/src/apps/server/api/utils.ts +65 -0
  107. package/src/apps/server/index.ts +111 -0
  108. package/src/cli/index.ts +2 -1311
  109. package/src/cli/retrieval-disclosure-output.ts +2 -0
  110. package/src/compat/index.ts +5 -0
  111. package/src/core/derive/fact-deriver.ts +170 -0
  112. package/src/core/derive/index.ts +2 -0
  113. package/src/core/derive/summary-deriver.ts +76 -0
  114. package/src/core/embedder.ts +4 -152
  115. package/src/core/engine/embedding-maintenance-service.ts +187 -0
  116. package/src/core/engine/endless-memory-services.ts +4 -0
  117. package/src/core/engine/index.ts +19 -0
  118. package/src/core/engine/memory-engine-services.ts +170 -0
  119. package/src/core/engine/memory-ingest-service.ts +317 -0
  120. package/src/core/engine/memory-query-service.ts +173 -0
  121. package/src/core/engine/memory-runtime-service.ts +162 -0
  122. package/src/core/engine/memory-service-composition.ts +231 -0
  123. package/src/core/engine/retrieval-analytics-service.ts +181 -0
  124. package/src/core/engine/retrieval-disclosure-service.ts +420 -0
  125. package/src/core/engine/retrieval-orchestrator.ts +377 -0
  126. package/src/core/engine/retrieval-services.ts +176 -0
  127. package/src/core/engine/shared-memory-services.ts +4 -0
  128. package/src/core/entity-repo.ts +1 -3
  129. package/src/core/event-store.ts +3 -3
  130. package/src/core/evidence-aligner.ts +2 -2
  131. package/src/core/external-market-context.ts +582 -0
  132. package/src/core/graduation.ts +2 -3
  133. package/src/core/index.ts +21 -0
  134. package/src/core/matcher.ts +2 -4
  135. package/src/core/model/memory-fact.ts +30 -0
  136. package/src/core/model/memory-rule.ts +14 -0
  137. package/src/core/model/memory-summary.ts +21 -0
  138. package/src/core/model/raw-event.ts +28 -0
  139. package/src/core/model/retrieval-result.ts +35 -0
  140. package/src/core/privacy/filter.ts +21 -10
  141. package/src/core/product-validation-matrix.ts +314 -0
  142. package/src/core/progressive-retriever.ts +1 -2
  143. package/src/core/registry/project-path.ts +54 -0
  144. package/src/core/registry/session-registry.ts +69 -0
  145. package/src/core/replay-evaluator.ts +625 -0
  146. package/src/core/retrieval-benchmark.ts +117 -0
  147. package/src/core/retrieval-quality.ts +109 -0
  148. package/src/core/retriever.ts +53 -15
  149. package/src/core/session-qrels.ts +360 -0
  150. package/src/core/shared-event-store.ts +1 -1
  151. package/src/core/sqlite-event-store.ts +35 -11
  152. package/src/core/task/blocker-resolver.ts +2 -2
  153. package/src/core/task/task-resolver.ts +0 -1
  154. package/src/core/vector-outbox.ts +1 -10
  155. package/src/core/vector-worker.ts +1 -1
  156. package/src/extensions/endless-memory/endless-memory-services.ts +350 -0
  157. package/src/extensions/endless-memory/index.ts +1 -0
  158. package/src/extensions/index.ts +5 -0
  159. package/src/extensions/mcp/handlers.ts +960 -0
  160. package/src/extensions/mcp/index.ts +48 -0
  161. package/src/extensions/mcp/tools.ts +252 -0
  162. package/src/extensions/shared-memory/index.ts +1 -0
  163. package/src/extensions/shared-memory/shared-memory-services.ts +211 -0
  164. package/src/extensions/vector/embedder.ts +197 -0
  165. package/src/extensions/vector/index.ts +1 -0
  166. package/src/hooks/post-tool-use.ts +3 -236
  167. package/src/hooks/semantic-daemon-client.ts +1 -208
  168. package/src/hooks/semantic-daemon.ts +6 -271
  169. package/src/hooks/session-end.ts +4 -79
  170. package/src/hooks/session-start.ts +4 -73
  171. package/src/hooks/stop.ts +3 -173
  172. package/src/hooks/user-prompt-submit.ts +3 -338
  173. package/src/index.ts +13 -0
  174. package/src/mcp/handlers.ts +2 -212
  175. package/src/mcp/index.ts +3 -46
  176. package/src/mcp/tools.ts +2 -78
  177. package/src/server/api/chat.ts +2 -244
  178. package/src/server/api/citations.ts +2 -105
  179. package/src/server/api/events.ts +2 -137
  180. package/src/server/api/health.ts +2 -53
  181. package/src/server/api/index.ts +2 -26
  182. package/src/server/api/projects.ts +2 -74
  183. package/src/server/api/search.ts +2 -102
  184. package/src/server/api/sessions.ts +2 -115
  185. package/src/server/api/stats.ts +2 -724
  186. package/src/server/api/turns.ts +2 -143
  187. package/src/server/api/utils.ts +2 -46
  188. package/src/server/index.ts +2 -100
  189. package/src/services/bootstrap-organizer.ts +46 -26
  190. package/src/services/codex-session-history-importer.ts +521 -29
  191. package/src/services/hermes-session-history-importer.ts +733 -0
  192. package/src/services/memory-service-config.ts +36 -0
  193. package/src/services/memory-service-registry.ts +150 -0
  194. package/src/services/memory-service.ts +211 -1325
  195. package/src/services/session-history-importer.ts +58 -14
  196. package/tests/README.md +23 -0
  197. package/tests/adapters/claude/claude-semantic-daemon-adapter.test.ts +54 -0
  198. package/tests/adapters/claude/claude-transcript-reconstructor.test.ts +98 -0
  199. package/tests/adapters/claude-hook-prompt-injection-policy.test.ts +99 -0
  200. package/tests/apps/app-layer-boundary.test.ts +48 -0
  201. package/tests/apps/claude-settings-hooks.test.ts +107 -0
  202. package/tests/apps/cli-disclosure-output.test.ts +212 -0
  203. package/tests/apps/codex-import-runner.test.ts +99 -0
  204. package/tests/apps/codex-validation-output.test.ts +100 -0
  205. package/tests/apps/hermes-import-runner.test.ts +99 -0
  206. package/tests/apps/mcp-install-command.test.ts +59 -0
  207. package/tests/apps/package-build-entrypoints.test.ts +30 -0
  208. package/tests/apps/search-api-disclosure.test.ts +162 -0
  209. package/tests/apps/stats-api-lightweight.test.ts +67 -0
  210. package/tests/apps/ui-disclosure-output.test.ts +140 -0
  211. package/tests/{bootstrap-organizer.test.ts → core/bootstrap-organizer.test.ts} +1 -1
  212. package/tests/{canonical-key.test.ts → core/canonical-key.test.ts} +1 -1
  213. package/tests/core/codex-session-history-importer-validation.test.ts +185 -0
  214. package/tests/{consolidation-worker.test.ts → core/consolidation-worker.test.ts} +2 -2
  215. package/tests/core/embedding-maintenance-service.test.ts +282 -0
  216. package/tests/{evidence-aligner.test.ts → core/evidence-aligner.test.ts} +1 -1
  217. package/tests/core/external-market-context.test.ts +209 -0
  218. package/tests/core/fact-deriver.test.ts +79 -0
  219. package/tests/core/hermes-session-history-importer-validation.test.ts +609 -0
  220. package/tests/{ingest-interceptor.test.ts → core/ingest-interceptor.test.ts} +1 -1
  221. package/tests/{markdown-mirror.test.ts → core/markdown-mirror.test.ts} +2 -2
  222. package/tests/{matcher.test.ts → core/matcher.test.ts} +1 -1
  223. package/tests/{md-mirror.test.ts → core/md-mirror.test.ts} +2 -2
  224. package/tests/core/memory-engine-services.test.ts +240 -0
  225. package/tests/core/memory-ingest-service.test.ts +296 -0
  226. package/tests/core/memory-query-service.test.ts +129 -0
  227. package/tests/core/memory-runtime-service.test.ts +201 -0
  228. package/tests/core/memory-service-composition.test.ts +192 -0
  229. package/tests/core/memory-service-config.test.ts +41 -0
  230. package/tests/core/memory-service-facade.test.ts +30 -0
  231. package/tests/core/memory-service-registry.test.ts +206 -0
  232. package/tests/core/product-validation-matrix.test.ts +61 -0
  233. package/tests/core/project-registry.test.ts +78 -0
  234. package/tests/core/replay-evaluator.test.ts +181 -0
  235. package/tests/core/retrieval-analytics-service.test.ts +210 -0
  236. package/tests/core/retrieval-benchmark.test.ts +93 -0
  237. package/tests/core/retrieval-disclosure-service.test.ts +264 -0
  238. package/tests/core/retrieval-orchestrator.test.ts +403 -0
  239. package/tests/core/retrieval-quality.test.ts +31 -0
  240. package/tests/core/retrieval-services.test.ts +185 -0
  241. package/tests/{retriever-fallback-chain.test.ts → core/retriever-fallback-chain.test.ts} +3 -3
  242. package/tests/{retriever-strategy-scope.test.ts → core/retriever-strategy-scope.test.ts} +70 -3
  243. package/tests/{retriever.memu-adoption.test.ts → core/retriever.memu-adoption.test.ts} +3 -3
  244. package/tests/core/session-history-importer-filter.test.ts +78 -0
  245. package/tests/core/session-qrels.test.ts +250 -0
  246. package/tests/{sqlite-event-store-replication.test.ts → core/sqlite-event-store-replication.test.ts} +36 -1
  247. package/tests/core/summary-deriver.test.ts +66 -0
  248. package/tests/extensions/embedder-warning-suppression.test.ts +53 -0
  249. package/tests/extensions/endless-memory-extension-boundary.test.ts +17 -0
  250. package/tests/extensions/endless-memory-services.test.ts +325 -0
  251. package/tests/extensions/mcp-context-tools.test.ts +905 -0
  252. package/tests/extensions/mcp-extension-boundary.test.ts +21 -0
  253. package/tests/extensions/mcp-package-build.test.ts +22 -0
  254. package/tests/extensions/mcp-project-aware-tools.test.ts +102 -0
  255. package/tests/extensions/shared-memory-extension-boundary.test.ts +24 -0
  256. package/tests/extensions/shared-memory-services.test.ts +309 -0
  257. package/tests/extensions/vector-extension-boundary.test.ts +21 -0
  258. package/.claude/settings.local.json +0 -25
  259. package/.npm-cache/_cacache/content-v2/sha512/04/76/c098f88dfe584a2b80870bff7421b05d17d3d9ee1027f77772332a22d3f93a9a57101a2855107f6ad82077a818bba912b2bc317f2361b5ddb09ad284d9ce +0 -0
  260. package/.npm-cache/_cacache/content-v2/sha512/60/25/d2ecd39cfc7cab58351162814be77f935c6d6491c10c3745d456da7ddb2117ffd90c10e53fe3c0f1ed16b403307841543634504398b16ee4e6b6dd8e0c45 +0 -0
  261. package/.npm-cache/_cacache/index-v5/2b/9a/7f8f40206ed8a2e0a84efaa953ccaed1f5d001e14b931083f2e7a0738007 +0 -2
  262. package/.npm-cache/_cacache/index-v5/2e/d9/fcfa5c6a6abdc2a3644ab84a95936047298c465a2f47ee03db8f7fe1e946 +0 -3
  263. package/.npm-cache/_cacache/index-v5/a9/42/e519633356d12d3d2f19da66a8301016d496c8f5c3e0554124aaa62dc043 +0 -2
  264. package/.npm-cache/_logs/2026-02-26T12_04_52_729Z-debug-0.log +0 -256
  265. package/.npm-cache/_logs/2026-02-26T12_05_36_835Z-debug-0.log +0 -18
  266. package/.npm-cache/_logs/2026-02-26T12_05_45_982Z-debug-0.log +0 -32
  267. package/.npm-cache/_logs/2026-02-26T12_05_48_515Z-debug-0.log +0 -260
  268. package/.npm-cache/_logs/2026-02-26T12_05_53_567Z-debug-0.log +0 -69
  269. package/.npm-cache/_update-notifier-last-checked +0 -0
  270. package/bootstrap-kb/decisions/decisions.md +0 -244
  271. package/bootstrap-kb/glossary/glossary.md +0 -46
  272. package/bootstrap-kb/modules/.claude-plugin.md +0 -22
  273. package/bootstrap-kb/modules/agents.md.md +0 -15
  274. package/bootstrap-kb/modules/claude.md.md +0 -15
  275. package/bootstrap-kb/modules/context.md.md +0 -15
  276. package/bootstrap-kb/modules/docs.md +0 -18
  277. package/bootstrap-kb/modules/handoff.md.md +0 -15
  278. package/bootstrap-kb/modules/package-lock.json.md +0 -15
  279. package/bootstrap-kb/modules/package.json.md +0 -15
  280. package/bootstrap-kb/modules/plan.md.md +0 -15
  281. package/bootstrap-kb/modules/readme.md.md +0 -15
  282. package/bootstrap-kb/modules/scripts.md +0 -26
  283. package/bootstrap-kb/modules/spec.md.md +0 -15
  284. package/bootstrap-kb/modules/specs.md +0 -20
  285. package/bootstrap-kb/modules/src.md +0 -51
  286. package/bootstrap-kb/modules/tests.md +0 -42
  287. package/bootstrap-kb/modules/tsconfig.json.md +0 -15
  288. package/bootstrap-kb/modules/vitest.config.ts.md +0 -15
  289. package/bootstrap-kb/overview/overview.md +0 -40
  290. package/bootstrap-kb/sources/manifest.json +0 -950
  291. package/bootstrap-kb/sources/manifest.md +0 -227
  292. package/bootstrap-kb/timeline/timeline.md +0 -57
  293. package/claude-memory-layer-1.0.14.tgz +0 -0
  294. package/d.sh +0 -3
  295. package/deploy.sh +0 -3
  296. package/dist/ui/app.js +0 -2101
  297. package/memory/.claude-plugin/commands/2026-02-25.md +0 -263
  298. package/memory/_index.md +0 -418
  299. package/memory/agent_response/uncategorized/2026-02-26.md +0 -176
  300. package/memory/agent_response/uncategorized/2026-03-03.md +0 -14
  301. package/memory/agent_response/uncategorized/2026-03-04.md +0 -1421
  302. package/memory/agent_response/uncategorized/2026-03-05.md +0 -48
  303. package/memory/default/uncategorized/2026-02-25.md +0 -4839
  304. package/memory/session_summary/uncategorized/2026-02-26.md +0 -13
  305. package/memory/session_summary/uncategorized/2026-03-03.md +0 -5
  306. package/memory/session_summary/uncategorized/2026-03-04.md +0 -50
  307. package/memory/specs/20260207-dashboard-upgrade/2026-02-25.md +0 -142
  308. package/memory/specs/citations-system/2026-02-25.md +0 -1121
  309. package/memory/specs/endless-mode/2026-02-25.md +0 -1392
  310. package/memory/specs/entity-edge-model/2026-02-25.md +0 -1263
  311. package/memory/specs/evidence-aligner-v2/2026-02-25.md +0 -1028
  312. package/memory/specs/mcp-desktop-integration/2026-02-25.md +0 -1334
  313. package/memory/specs/post-tool-use-hook/2026-02-25.md +0 -1164
  314. package/memory/specs/private-tags/2026-02-25.md +0 -1057
  315. package/memory/specs/progressive-disclosure/2026-02-25.md +0 -1436
  316. package/memory/specs/task-entity-system/2026-02-25.md +0 -924
  317. package/memory/specs/vector-outbox-v2/2026-02-25.md +0 -1510
  318. package/memory/specs/web-viewer-ui/2026-02-25.md +0 -1709
  319. package/memory/tool_observation/uncategorized/2026-02-26.md +0 -209
  320. package/memory/tool_observation/uncategorized/2026-03-03.md +0 -21
  321. package/memory/tool_observation/uncategorized/2026-03-04.md +0 -1033
  322. package/memory/tool_observation/uncategorized/2026-03-05.md +0 -29
  323. package/memory/user_prompt/uncategorized/2026-02-26.md +0 -25
  324. package/memory/user_prompt/uncategorized/2026-03-04.md +0 -634
  325. package/specs/optional-duckdb/context.md +0 -77
  326. package/specs/optional-duckdb/plan.md +0 -142
  327. package/specs/optional-duckdb/spec.md +0 -35
  328. package/src/ui/app.js +0 -2101
@@ -0,0 +1,117 @@
1
+ export interface ReplayMetricInput {
2
+ queryId: string;
3
+ expectedIds: string[];
4
+ retrievedIds: string[];
5
+ /** Optional graded qrels labels. Missing expected ids default to relevance 1. */
6
+ expectedRelevance?: Record<string, number>;
7
+ }
8
+
9
+ export interface PrecisionRecallAtK {
10
+ precision: number;
11
+ recall: number;
12
+ hits: number;
13
+ ndcg: number;
14
+ }
15
+
16
+ export interface ReplayQueryMetrics {
17
+ queryId: string;
18
+ at: Record<number, PrecisionRecallAtK>;
19
+ }
20
+
21
+ export interface ReplayMetricsSummary {
22
+ queryCount: number;
23
+ precisionAtK: Record<number, number>;
24
+ recallAtK: Record<number, number>;
25
+ ndcgAtK: Record<number, number>;
26
+ }
27
+
28
+ export function computePrecisionRecallAtK(
29
+ inputs: ReplayMetricInput[],
30
+ ks: number[]
31
+ ): ReplayQueryMetrics[] {
32
+ const normalizedKs = normalizeKs(ks);
33
+ return inputs.map((input) => {
34
+ const expected = new Set(input.expectedIds);
35
+ const relevance = normalizeRelevance(input.expectedIds, input.expectedRelevance);
36
+ const at: Record<number, PrecisionRecallAtK> = {};
37
+
38
+ for (const k of normalizedKs) {
39
+ const retrieved = input.retrievedIds.slice(0, k);
40
+ const hits = new Set(retrieved.filter((id) => expected.has(id))).size;
41
+ at[k] = {
42
+ precision: k === 0 ? 0 : hits / k,
43
+ recall: expected.size === 0 ? 0 : hits / expected.size,
44
+ hits,
45
+ ndcg: computeNdcgAtK(retrieved, relevance, k)
46
+ };
47
+ }
48
+
49
+ return { queryId: input.queryId, at };
50
+ });
51
+ }
52
+
53
+ export function summarizeReplayMetrics(
54
+ metrics: ReplayQueryMetrics[],
55
+ ks: number[]
56
+ ): ReplayMetricsSummary {
57
+ const normalizedKs = normalizeKs(ks);
58
+ const precisionAtK: Record<number, number> = {};
59
+ const recallAtK: Record<number, number> = {};
60
+ const ndcgAtK: Record<number, number> = {};
61
+
62
+ for (const k of normalizedKs) {
63
+ precisionAtK[k] = average(metrics.map((metric) => metric.at[k]?.precision ?? 0));
64
+ recallAtK[k] = average(metrics.map((metric) => metric.at[k]?.recall ?? 0));
65
+ ndcgAtK[k] = average(metrics.map((metric) => metric.at[k]?.ndcg ?? 0));
66
+ }
67
+
68
+ return { queryCount: metrics.length, precisionAtK, recallAtK, ndcgAtK };
69
+ }
70
+
71
+ function normalizeKs(ks: number[]): number[] {
72
+ const seen = new Set<number>();
73
+ const normalized: number[] = [];
74
+
75
+ for (const rawK of ks) {
76
+ const k = Math.max(0, Math.floor(rawK));
77
+ if (seen.has(k)) continue;
78
+ seen.add(k);
79
+ normalized.push(k);
80
+ }
81
+
82
+ return normalized.sort((a, b) => a - b);
83
+ }
84
+
85
+ function normalizeRelevance(expectedIds: string[], expectedRelevance?: Record<string, number>): Record<string, number> {
86
+ const relevance: Record<string, number> = {};
87
+ for (const id of expectedIds) {
88
+ const raw = expectedRelevance?.[id] ?? 1;
89
+ relevance[id] = Number.isFinite(raw) ? Math.max(0, raw) : 0;
90
+ }
91
+ return relevance;
92
+ }
93
+
94
+ function computeNdcgAtK(retrieved: string[], relevance: Record<string, number>, k: number): number {
95
+ if (k <= 0) return 0;
96
+
97
+ const seen = new Set<string>();
98
+ const dcg = retrieved.reduce((sum, id, index) => {
99
+ if (seen.has(id)) return sum;
100
+ seen.add(id);
101
+ return sum + discountedGain(relevance[id] ?? 0, index);
102
+ }, 0);
103
+
104
+ const idealRelevance = Object.values(relevance).sort((a, b) => b - a).slice(0, k);
105
+ const idealDcg = idealRelevance.reduce((sum, rel, index) => sum + discountedGain(rel, index), 0);
106
+ return idealDcg === 0 ? 0 : dcg / idealDcg;
107
+ }
108
+
109
+ function discountedGain(relevance: number, zeroBasedRank: number): number {
110
+ if (relevance <= 0) return 0;
111
+ return (2 ** relevance - 1) / Math.log2(zeroBasedRank + 2);
112
+ }
113
+
114
+ function average(values: number[]): number {
115
+ if (values.length === 0) return 0;
116
+ return values.reduce((sum, value) => sum + value, 0) / values.length;
117
+ }
@@ -0,0 +1,109 @@
1
+ /**
2
+ * Retrieval quality guards.
3
+ *
4
+ * These are deliberately small deterministic heuristics used to avoid injecting
5
+ * obviously irrelevant memories. They are not a second source of truth; they
6
+ * only filter candidate retrieval results before context assembly.
7
+ */
8
+
9
+ const COMMAND_ARTIFACT_PATTERNS = [
10
+ /<\/?(?:local-command-(?:stdout|stderr)|command-(?:name|message))\b/i,
11
+ /<command-name>[\s\S]*?<\/command-name>/i,
12
+ /<local-command-stdout>[\s\S]*?<\/local-command-stdout>/i,
13
+ /<local-command-stderr>[\s\S]*?<\/local-command-stderr>/i
14
+ ];
15
+
16
+ const LOW_SIGNAL_CONTEXT_PATTERNS = [
17
+ /<environment_context\b[\s\S]*<\/environment_context>/i,
18
+ /<turn_aborted>/i,
19
+ /^#\s*AGENTS\.md\s+instructions\b[\s\S]*<INSTRUCTIONS>/i,
20
+ /^\s*(?:understood[,\s.]*)?(?:stopping|stopped|pausing|paused)\s+here\b[\s\S]{0,180}\blet\s+me\s+know\s+when\s+you(?:'d|\s+would)?\s+like\s+to\s+continue\b/i,
21
+ /^➜\s+\S+\s+git:\([^)]*\)\s+/i,
22
+ /^\$\s+\S+/i
23
+ ];
24
+
25
+ const CONTINUATION_QUERY_PATTERNS = [
26
+ /^\s*(?:continue|resume|next|what(?:'s| is)? next|next\s+(?:step|task|action)|recommended\s+(?:next\s+)?(?:step|task|action)|what should (?:we|i) do next)\??\s*$/i,
27
+ /^\s*(?:이어서(?:\s*진행해줘)?|계속(?:\s*해줘)?|다음\s*(?:단계|작업|추천\s*작업|추천|할\s*일)?(?:은|는)?(?:\s*뭐야)?\??|추천\s*작업(?:은|는)?(?:\s*뭐야)?\??|진행해줘)\s*$/i
28
+ ];
29
+
30
+ const GENERIC_TECHNICAL_TERMS = new Set([
31
+ 'api',
32
+ 'cli',
33
+ 'ui',
34
+ 'json',
35
+ 'jsonl',
36
+ 'html',
37
+ 'http',
38
+ 'https',
39
+ 'url',
40
+ 'uri',
41
+ 'id',
42
+ 'ids',
43
+ 'uuid',
44
+ 'db',
45
+ 'sql'
46
+ ]);
47
+
48
+ export function isCommandArtifactQuery(query: string): boolean {
49
+ const trimmed = query.trim();
50
+ if (!trimmed) return false;
51
+ const normalized = trimmed.toLowerCase();
52
+ if (normalized.includes('local-command-stdout') || normalized.includes('local-command-stderr')) return true;
53
+ if (normalized.includes('command-name') || normalized.includes('command-message')) return true;
54
+ return COMMAND_ARTIFACT_PATTERNS.some((pattern) => pattern.test(trimmed));
55
+ }
56
+
57
+ export function isCommandArtifactContent(content: string): boolean {
58
+ const trimmed = content.trim();
59
+ if (!trimmed) return false;
60
+ const normalized = trimmed.toLowerCase();
61
+ if (normalized.includes('local-command-stdout') || normalized.includes('local-command-stderr')) return true;
62
+ if (normalized.includes('command-name') || normalized.includes('command-message')) return true;
63
+ return COMMAND_ARTIFACT_PATTERNS.some((pattern) => pattern.test(trimmed));
64
+ }
65
+
66
+ export function isLowSignalContextContent(content: string): boolean {
67
+ const trimmed = content.trim();
68
+ if (!trimmed) return true;
69
+ if (isCommandArtifactContent(trimmed)) return true;
70
+ if (LOW_SIGNAL_CONTEXT_PATTERNS.some((pattern) => pattern.test(trimmed))) return true;
71
+ return false;
72
+ }
73
+
74
+ export function isGenericContinuationQuery(query: string): boolean {
75
+ const trimmed = query.trim();
76
+ if (!trimmed) return false;
77
+ if (!CONTINUATION_QUERY_PATTERNS.some((pattern) => pattern.test(trimmed))) return false;
78
+ if (extractTechnicalQueryTerms(trimmed).length > 0) return false;
79
+
80
+ const tokens = trimmed.match(/[A-Za-z0-9가-힣#._/-]+/g) ?? [];
81
+ if (tokens.length > 10) return false;
82
+
83
+ return !/[A-Za-z0-9_-]+\.[A-Za-z0-9]+/.test(trimmed) &&
84
+ !/(?:^|\s)(?:feat|fix|chore|refactor|docs)\/[A-Za-z0-9._-]+/.test(trimmed) &&
85
+ !/[A-Za-z]:?[\\/]|\/Users\/|\.\/|\.\.\//.test(trimmed);
86
+ }
87
+
88
+ export function extractTechnicalQueryTerms(query: string): string[] {
89
+ const matches = query.match(/[A-Za-z][A-Za-z0-9_.:-]{2,}/g) ?? [];
90
+ const terms = matches.filter((term) => {
91
+ const lower = term.toLowerCase();
92
+ if (GENERIC_TECHNICAL_TERMS.has(lower)) return false;
93
+ return /[._:-]/.test(term) || /[a-z][A-Z]/.test(term) || /[A-Z]{2,}/.test(term) || /\d/.test(term);
94
+ });
95
+
96
+ return Array.from(new Set(terms.map((term) => term.toLowerCase())));
97
+ }
98
+
99
+ export function hasTechnicalTermOverlap(query: string, content: string): boolean {
100
+ const terms = extractTechnicalQueryTerms(query);
101
+ if (terms.length === 0) return true;
102
+
103
+ const normalizedContent = content.toLowerCase();
104
+ return terms.some((term) => normalizedContent.includes(term));
105
+ }
106
+
107
+ export function shouldApplyTechnicalGuard(query: string): boolean {
108
+ return extractTechnicalQueryTerms(query).length > 0;
109
+ }
@@ -10,6 +10,11 @@ import { Matcher } from './matcher.js';
10
10
  import { SharedStore } from './shared-store.js';
11
11
  import { SharedVectorStore } from './shared-vector-store.js';
12
12
  import { GraduationPipeline } from './graduation.js';
13
+ import {
14
+ hasTechnicalTermOverlap,
15
+ isCommandArtifactQuery,
16
+ shouldApplyTechnicalGuard
17
+ } from './retrieval-quality.js';
13
18
  import type { MemoryEvent, MatchResult, SharedTroubleshootingEntry } from './types.js';
14
19
 
15
20
  export interface RetrievalScope {
@@ -23,6 +28,8 @@ export interface RetrievalScope {
23
28
 
24
29
  export type RetrievalStrategy = 'auto' | 'fast' | 'deep';
25
30
  export type ProjectScopeMode = 'strict' | 'prefer' | 'global';
31
+ type DecayPolicy = NonNullable<RetrievalOptions['decayPolicy']>;
32
+ type GraphHopOptions = NonNullable<RetrievalOptions['graphHop']>;
26
33
 
27
34
  export interface RetrievalOptions {
28
35
  topK: number;
@@ -166,6 +173,20 @@ export class Retriever {
166
173
  const sessionFilter = opts.scope?.sessionId ?? opts.sessionId;
167
174
  const fallbackTrace: string[] = [];
168
175
 
176
+ if (isCommandArtifactQuery(query)) {
177
+ fallbackTrace.push('guard:command-artifact-query');
178
+ const emptyMatch = this.matcher.matchSearchResults([], () => 0);
179
+ return {
180
+ memories: [],
181
+ matchResult: emptyMatch,
182
+ totalTokens: 0,
183
+ context: '',
184
+ fallbackTrace,
185
+ selectedDebug: [],
186
+ candidateDebug: []
187
+ };
188
+ }
189
+
169
190
  const fallbackEnabled = (opts.strategy ?? 'auto') === 'auto';
170
191
 
171
192
  // Stage 1: primary retrieval
@@ -311,28 +332,21 @@ export class Retriever {
311
332
  minScore: number;
312
333
  sessionId?: string;
313
334
  scope?: RetrievalScope;
314
- rerankWithKeyword: boolean;
335
+ rerankWithKeyword?: boolean;
315
336
  rerankWeights?: {
316
337
  semantic?: number;
317
338
  lexical?: number;
318
339
  recency?: number;
319
340
  };
320
- decayPolicy?: {
321
- enabled?: boolean;
322
- windowDays?: number;
323
- maxPenalty?: number;
324
- };
341
+ decayPolicy?: DecayPolicy;
325
342
  intentRewrite?: boolean;
326
- graphHop?: {
327
- enabled?: boolean;
328
- maxHops?: number;
329
- hopPenalty?: number;
330
- };
343
+ graphHop?: GraphHopOptions;
331
344
  projectScopeMode?: ProjectScopeMode;
332
345
  projectHash?: string;
333
346
  allowedProjectHashes?: string[];
334
347
  }
335
- ): Promise<{ results: SearchResult[]; matchResult: MatchResult }> {
348
+ ): Promise<{ results: SearchResult[]; candidateResults: SearchResult[]; matchResult: MatchResult }> {
349
+ let rerankQuery = query;
336
350
  let initialResults = await this.searchByStrategy(query, {
337
351
  strategy: input.strategy,
338
352
  topK: input.topK,
@@ -343,6 +357,7 @@ export class Retriever {
343
357
  if (input.intentRewrite && input.strategy === 'deep' && this.queryRewriter) {
344
358
  const rewritten = (await this.queryRewriter(query))?.trim();
345
359
  if (rewritten && rewritten !== query) {
360
+ rerankQuery = `${query} ${rewritten}`;
346
361
  const rewrittenResults = await this.searchByStrategy(rewritten, {
347
362
  strategy: 'deep',
348
363
  topK: input.topK,
@@ -362,7 +377,7 @@ export class Retriever {
362
377
  });
363
378
 
364
379
  const rerankedResults = input.rerankWithKeyword
365
- ? this.rerankByKeywordOverlap(expandedResults, query, input.rerankWeights, input.decayPolicy)
380
+ ? this.rerankByKeywordOverlap(expandedResults, rerankQuery, input.rerankWeights, input.decayPolicy)
366
381
  : expandedResults;
367
382
 
368
383
  const filtered = await this.applyScopeFilters(rerankedResults, {
@@ -371,10 +386,33 @@ export class Retriever {
371
386
  projectHash: input.projectHash,
372
387
  allowedProjectHashes: input.allowedProjectHashes
373
388
  });
374
- const top = filtered.slice(0, input.topK);
389
+ const qualityFiltered = this.applyQualityFilters(filtered, {
390
+ query,
391
+ minScore: input.minScore
392
+ });
393
+ const top = qualityFiltered.slice(0, input.topK);
375
394
  const matchResult = this.matcher.matchSearchResults(top, () => 0);
376
395
 
377
- return { results: top, candidateResults: filtered, matchResult };
396
+ return { results: top, candidateResults: qualityFiltered, matchResult };
397
+ }
398
+
399
+ private applyQualityFilters(
400
+ results: Array<SearchResult & { semanticScore?: number; lexicalScore?: number; recencyScore?: number }>,
401
+ options: { query: string; minScore: number }
402
+ ): Array<SearchResult & { semanticScore?: number; lexicalScore?: number; recencyScore?: number }> {
403
+ let filtered = [...results];
404
+
405
+ if (shouldApplyTechnicalGuard(options.query)) {
406
+ filtered = filtered.filter((result) => hasTechnicalTermOverlap(options.query, result.content));
407
+ }
408
+
409
+ if (filtered.length <= 2) return filtered;
410
+
411
+ const topScore = filtered[0].score;
412
+ if (topScore < 0.8) return filtered;
413
+
414
+ const cliffThreshold = Math.max(options.minScore, topScore - 0.25);
415
+ return filtered.filter((result) => result.score >= cliffThreshold);
378
416
  }
379
417
 
380
418
  private mergeResults(primary: SearchResult[], secondary: SearchResult[], limit: number): SearchResult[] {