claude-memory-layer 1.0.27 → 1.0.29

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (331) hide show
  1. package/.env.example +7 -0
  2. package/AGENTS.md +11 -0
  3. package/README.md +374 -49
  4. package/benchmarks/replay/anonymized-real-sessions.json +48 -0
  5. package/dist/cli/index.js +10097 -6003
  6. package/dist/cli/index.js.map +4 -4
  7. package/dist/core/index.js +9745 -5587
  8. package/dist/core/index.js.map +4 -4
  9. package/dist/hooks/post-tool-use.js +6545 -5270
  10. package/dist/hooks/post-tool-use.js.map +4 -4
  11. package/dist/hooks/semantic-daemon.js +6646 -5354
  12. package/dist/hooks/semantic-daemon.js.map +4 -4
  13. package/dist/hooks/session-end.js +6618 -5347
  14. package/dist/hooks/session-end.js.map +4 -4
  15. package/dist/hooks/session-start.js +6619 -5354
  16. package/dist/hooks/session-start.js.map +4 -4
  17. package/dist/hooks/stop.js +6614 -5325
  18. package/dist/hooks/stop.js.map +4 -4
  19. package/dist/hooks/user-prompt-submit.js +6702 -5356
  20. package/dist/hooks/user-prompt-submit.js.map +4 -4
  21. package/dist/index.js +13537 -0
  22. package/dist/index.js.map +7 -0
  23. package/dist/mcp/index.js +20770 -0
  24. package/dist/mcp/index.js.map +7 -0
  25. package/dist/server/api/index.js +6632 -5319
  26. package/dist/server/api/index.js.map +4 -4
  27. package/dist/server/index.js +6667 -5340
  28. package/dist/server/index.js.map +4 -4
  29. package/dist/services/memory-service.js +6568 -5350
  30. package/dist/services/memory-service.js.map +4 -4
  31. package/dist/ui/assets/js/bootstrap.js +244 -0
  32. package/dist/ui/assets/js/chat.js +373 -0
  33. package/dist/ui/assets/js/disclosure.js +232 -0
  34. package/dist/ui/assets/js/modals.js +298 -0
  35. package/dist/ui/assets/js/overview.js +655 -0
  36. package/dist/ui/assets/js/state.js +72 -0
  37. package/dist/ui/assets/js/views.js +468 -0
  38. package/dist/ui/index.html +43 -1
  39. package/dist/ui/index.ts +3 -0
  40. package/dist/ui/style.css +222 -0
  41. package/docs/ARCHITECTURE_COMPARISON_AND_RECOMMENDATIONS.md +627 -0
  42. package/docs/HERMES_MEMORY_INGESTION_ANALYSIS.md +440 -0
  43. package/docs/MEMORY_USEFULNESS_AUDIT.md +371 -0
  44. package/docs/MEMORY_USEFULNESS_AUDIT_RAW.json +80 -0
  45. package/docs/MEMSEARCH_PROJECT_STRUCTURE_ANALYSIS.md +333 -0
  46. package/docs/PRODUCT_VALIDATION_MATRIX.md +82 -0
  47. package/docs/PROJECT_STRUCTURE_ANALYSIS.md +421 -0
  48. package/docs/REFACTORING_MILESTONES_AND_ISSUES.md +501 -0
  49. package/docs/REFACTORING_PLAN_THIN_CORE.md +414 -0
  50. package/docs/REFERENCE_PROJECT_ANALYSES.md +25 -0
  51. package/docs/SUPERLOCALMEMORY_PROJECT_STRUCTURE_ANALYSIS.md +452 -0
  52. package/docs/TARGET_ARCHITECTURE_AND_FOLDER_STRUCTURE.md +446 -0
  53. package/docs/architecture/comparison-index.md +47 -0
  54. package/docs/reports/codex-real-data-validation-20260505T040447Z.md +46 -0
  55. package/package.json +12 -5
  56. package/scripts/build.ts +25 -8
  57. package/scripts/generate-session-qrels.ts +126 -0
  58. package/scripts/postinstall-embedding-backend.cjs +142 -0
  59. package/scripts/replay-retrieval-benchmark.ts +69 -0
  60. package/specs/thin-core-refactor/context.md +275 -0
  61. package/specs/thin-core-refactor/plan.md +536 -0
  62. package/specs/thin-core-refactor/spec.md +465 -0
  63. package/src/adapters/claude/capture/index.ts +3 -0
  64. package/src/adapters/claude/context/index.ts +3 -0
  65. package/src/adapters/claude/hooks/index.ts +21 -0
  66. package/src/adapters/claude/hooks/post-tool-use.ts +239 -0
  67. package/src/adapters/claude/hooks/prompt-injection-policy.ts +104 -0
  68. package/src/adapters/claude/hooks/semantic-daemon-client.ts +209 -0
  69. package/src/adapters/claude/hooks/semantic-daemon.ts +283 -0
  70. package/src/adapters/claude/hooks/session-end.ts +59 -0
  71. package/src/adapters/claude/hooks/session-start.ts +73 -0
  72. package/src/adapters/claude/hooks/stop.ts +128 -0
  73. package/src/adapters/claude/hooks/user-prompt-submit.ts +361 -0
  74. package/src/adapters/claude/index.ts +4 -0
  75. package/src/adapters/claude/transcript/index.ts +4 -0
  76. package/src/adapters/claude/transcript/transcript-reader.ts +57 -0
  77. package/src/adapters/claude/transcript/turn-reconstructor.ts +65 -0
  78. package/src/apps/cli/claude-settings-hooks.ts +138 -0
  79. package/src/apps/cli/codex-import-runner.ts +125 -0
  80. package/src/apps/cli/codex-validation-output.ts +95 -0
  81. package/src/apps/cli/hermes-import-runner.ts +130 -0
  82. package/src/apps/cli/hermes-validation-output.ts +91 -0
  83. package/src/apps/cli/index.ts +1731 -0
  84. package/src/apps/cli/mcp-install.ts +106 -0
  85. package/src/apps/cli/retrieval-disclosure-output.ts +196 -0
  86. package/src/apps/dashboard/assets/js/bootstrap.js +244 -0
  87. package/src/apps/dashboard/assets/js/chat.js +373 -0
  88. package/src/apps/dashboard/assets/js/disclosure.js +232 -0
  89. package/src/apps/dashboard/assets/js/modals.js +298 -0
  90. package/src/apps/dashboard/assets/js/overview.js +655 -0
  91. package/src/apps/dashboard/assets/js/state.js +72 -0
  92. package/src/apps/dashboard/assets/js/views.js +468 -0
  93. package/src/{ui → apps/dashboard}/index.html +43 -1
  94. package/src/apps/dashboard/index.ts +3 -0
  95. package/src/{ui → apps/dashboard}/style.css +222 -0
  96. package/src/apps/index.ts +5 -0
  97. package/src/apps/server/api/chat.ts +244 -0
  98. package/src/apps/server/api/citations.ts +105 -0
  99. package/src/apps/server/api/events.ts +137 -0
  100. package/src/apps/server/api/health.ts +53 -0
  101. package/src/apps/server/api/index.ts +26 -0
  102. package/src/apps/server/api/projects.ts +74 -0
  103. package/src/apps/server/api/search.ts +184 -0
  104. package/src/apps/server/api/sessions.ts +115 -0
  105. package/src/apps/server/api/stats.ts +723 -0
  106. package/src/apps/server/api/turns.ts +143 -0
  107. package/src/apps/server/api/utils.ts +65 -0
  108. package/src/apps/server/index.ts +111 -0
  109. package/src/cli/index.ts +2 -1311
  110. package/src/cli/retrieval-disclosure-output.ts +2 -0
  111. package/src/compat/index.ts +5 -0
  112. package/src/core/derive/fact-deriver.ts +170 -0
  113. package/src/core/derive/index.ts +2 -0
  114. package/src/core/derive/summary-deriver.ts +76 -0
  115. package/src/core/embedder.ts +4 -152
  116. package/src/core/engine/embedding-maintenance-service.ts +187 -0
  117. package/src/core/engine/endless-memory-services.ts +4 -0
  118. package/src/core/engine/index.ts +19 -0
  119. package/src/core/engine/memory-engine-services.ts +170 -0
  120. package/src/core/engine/memory-ingest-service.ts +317 -0
  121. package/src/core/engine/memory-query-service.ts +173 -0
  122. package/src/core/engine/memory-runtime-service.ts +162 -0
  123. package/src/core/engine/memory-service-composition.ts +231 -0
  124. package/src/core/engine/retrieval-analytics-service.ts +181 -0
  125. package/src/core/engine/retrieval-disclosure-service.ts +420 -0
  126. package/src/core/engine/retrieval-orchestrator.ts +377 -0
  127. package/src/core/engine/retrieval-services.ts +176 -0
  128. package/src/core/engine/shared-memory-services.ts +4 -0
  129. package/src/core/entity-repo.ts +1 -3
  130. package/src/core/event-store.ts +3 -3
  131. package/src/core/evidence-aligner.ts +2 -2
  132. package/src/core/external-market-context.ts +582 -0
  133. package/src/core/graduation.ts +2 -3
  134. package/src/core/index.ts +21 -0
  135. package/src/core/matcher.ts +2 -4
  136. package/src/core/model/memory-fact.ts +30 -0
  137. package/src/core/model/memory-rule.ts +14 -0
  138. package/src/core/model/memory-summary.ts +21 -0
  139. package/src/core/model/raw-event.ts +28 -0
  140. package/src/core/model/retrieval-result.ts +35 -0
  141. package/src/core/privacy/filter.ts +21 -10
  142. package/src/core/product-validation-matrix.ts +314 -0
  143. package/src/core/progressive-retriever.ts +1 -2
  144. package/src/core/registry/project-path.ts +54 -0
  145. package/src/core/registry/session-registry.ts +69 -0
  146. package/src/core/replay-evaluator.ts +625 -0
  147. package/src/core/retrieval-benchmark.ts +117 -0
  148. package/src/core/retrieval-quality.ts +109 -0
  149. package/src/core/retriever.ts +53 -15
  150. package/src/core/session-qrels.ts +360 -0
  151. package/src/core/shared-event-store.ts +1 -1
  152. package/src/core/sqlite-event-store.ts +35 -11
  153. package/src/core/task/blocker-resolver.ts +2 -2
  154. package/src/core/task/task-resolver.ts +0 -1
  155. package/src/core/vector-outbox.ts +1 -10
  156. package/src/core/vector-worker.ts +1 -1
  157. package/src/extensions/endless-memory/endless-memory-services.ts +350 -0
  158. package/src/extensions/endless-memory/index.ts +1 -0
  159. package/src/extensions/index.ts +5 -0
  160. package/src/extensions/mcp/handlers.ts +960 -0
  161. package/src/extensions/mcp/index.ts +48 -0
  162. package/src/extensions/mcp/tools.ts +252 -0
  163. package/src/extensions/shared-memory/index.ts +1 -0
  164. package/src/extensions/shared-memory/shared-memory-services.ts +211 -0
  165. package/src/extensions/vector/embedder.ts +197 -0
  166. package/src/extensions/vector/index.ts +1 -0
  167. package/src/hooks/post-tool-use.ts +3 -236
  168. package/src/hooks/semantic-daemon-client.ts +1 -208
  169. package/src/hooks/semantic-daemon.ts +6 -271
  170. package/src/hooks/session-end.ts +4 -79
  171. package/src/hooks/session-start.ts +4 -73
  172. package/src/hooks/stop.ts +3 -173
  173. package/src/hooks/user-prompt-submit.ts +3 -338
  174. package/src/index.ts +13 -0
  175. package/src/mcp/handlers.ts +2 -212
  176. package/src/mcp/index.ts +3 -46
  177. package/src/mcp/tools.ts +2 -78
  178. package/src/server/api/chat.ts +2 -244
  179. package/src/server/api/citations.ts +2 -105
  180. package/src/server/api/events.ts +2 -137
  181. package/src/server/api/health.ts +2 -53
  182. package/src/server/api/index.ts +2 -26
  183. package/src/server/api/projects.ts +2 -74
  184. package/src/server/api/search.ts +2 -102
  185. package/src/server/api/sessions.ts +2 -115
  186. package/src/server/api/stats.ts +2 -724
  187. package/src/server/api/turns.ts +2 -143
  188. package/src/server/api/utils.ts +2 -46
  189. package/src/server/index.ts +2 -100
  190. package/src/services/bootstrap-organizer.ts +46 -26
  191. package/src/services/codex-session-history-importer.ts +521 -29
  192. package/src/services/hermes-session-history-importer.ts +733 -0
  193. package/src/services/memory-service-config.ts +36 -0
  194. package/src/services/memory-service-registry.ts +150 -0
  195. package/src/services/memory-service.ts +211 -1325
  196. package/src/services/session-history-importer.ts +58 -14
  197. package/tests/README.md +23 -0
  198. package/tests/adapters/claude/claude-semantic-daemon-adapter.test.ts +54 -0
  199. package/tests/adapters/claude/claude-transcript-reconstructor.test.ts +98 -0
  200. package/tests/adapters/claude-hook-prompt-injection-policy.test.ts +99 -0
  201. package/tests/apps/app-layer-boundary.test.ts +48 -0
  202. package/tests/apps/claude-settings-hooks.test.ts +107 -0
  203. package/tests/apps/cli-disclosure-output.test.ts +212 -0
  204. package/tests/apps/codex-import-runner.test.ts +99 -0
  205. package/tests/apps/codex-validation-output.test.ts +100 -0
  206. package/tests/apps/hermes-import-runner.test.ts +99 -0
  207. package/tests/apps/mcp-install-command.test.ts +59 -0
  208. package/tests/apps/package-build-entrypoints.test.ts +30 -0
  209. package/tests/apps/postinstall-embedding-backend.test.ts +167 -0
  210. package/tests/apps/search-api-disclosure.test.ts +162 -0
  211. package/tests/apps/stats-api-lightweight.test.ts +67 -0
  212. package/tests/apps/ui-disclosure-output.test.ts +140 -0
  213. package/tests/{bootstrap-organizer.test.ts → core/bootstrap-organizer.test.ts} +1 -1
  214. package/tests/{canonical-key.test.ts → core/canonical-key.test.ts} +1 -1
  215. package/tests/core/codex-session-history-importer-validation.test.ts +185 -0
  216. package/tests/{consolidation-worker.test.ts → core/consolidation-worker.test.ts} +2 -2
  217. package/tests/core/embedding-maintenance-service.test.ts +282 -0
  218. package/tests/{evidence-aligner.test.ts → core/evidence-aligner.test.ts} +1 -1
  219. package/tests/core/external-market-context.test.ts +209 -0
  220. package/tests/core/fact-deriver.test.ts +79 -0
  221. package/tests/core/hermes-session-history-importer-validation.test.ts +609 -0
  222. package/tests/{ingest-interceptor.test.ts → core/ingest-interceptor.test.ts} +1 -1
  223. package/tests/{markdown-mirror.test.ts → core/markdown-mirror.test.ts} +2 -2
  224. package/tests/{matcher.test.ts → core/matcher.test.ts} +1 -1
  225. package/tests/{md-mirror.test.ts → core/md-mirror.test.ts} +2 -2
  226. package/tests/core/memory-engine-services.test.ts +240 -0
  227. package/tests/core/memory-ingest-service.test.ts +296 -0
  228. package/tests/core/memory-query-service.test.ts +129 -0
  229. package/tests/core/memory-runtime-service.test.ts +201 -0
  230. package/tests/core/memory-service-composition.test.ts +192 -0
  231. package/tests/core/memory-service-config.test.ts +41 -0
  232. package/tests/core/memory-service-facade.test.ts +30 -0
  233. package/tests/core/memory-service-registry.test.ts +206 -0
  234. package/tests/core/product-validation-matrix.test.ts +61 -0
  235. package/tests/core/project-registry.test.ts +78 -0
  236. package/tests/core/replay-evaluator.test.ts +181 -0
  237. package/tests/core/retrieval-analytics-service.test.ts +210 -0
  238. package/tests/core/retrieval-benchmark.test.ts +93 -0
  239. package/tests/core/retrieval-disclosure-service.test.ts +264 -0
  240. package/tests/core/retrieval-orchestrator.test.ts +403 -0
  241. package/tests/core/retrieval-quality.test.ts +31 -0
  242. package/tests/core/retrieval-services.test.ts +185 -0
  243. package/tests/{retriever-fallback-chain.test.ts → core/retriever-fallback-chain.test.ts} +3 -3
  244. package/tests/{retriever-strategy-scope.test.ts → core/retriever-strategy-scope.test.ts} +70 -3
  245. package/tests/{retriever.memu-adoption.test.ts → core/retriever.memu-adoption.test.ts} +3 -3
  246. package/tests/core/session-history-importer-filter.test.ts +78 -0
  247. package/tests/core/session-qrels.test.ts +250 -0
  248. package/tests/{sqlite-event-store-replication.test.ts → core/sqlite-event-store-replication.test.ts} +36 -1
  249. package/tests/core/summary-deriver.test.ts +66 -0
  250. package/tests/extensions/embedder-warning-suppression.test.ts +53 -0
  251. package/tests/extensions/endless-memory-extension-boundary.test.ts +17 -0
  252. package/tests/extensions/endless-memory-services.test.ts +325 -0
  253. package/tests/extensions/mcp-context-tools.test.ts +905 -0
  254. package/tests/extensions/mcp-extension-boundary.test.ts +21 -0
  255. package/tests/extensions/mcp-package-build.test.ts +22 -0
  256. package/tests/extensions/mcp-project-aware-tools.test.ts +102 -0
  257. package/tests/extensions/shared-memory-extension-boundary.test.ts +24 -0
  258. package/tests/extensions/shared-memory-services.test.ts +309 -0
  259. package/tests/extensions/vector-extension-boundary.test.ts +21 -0
  260. package/.claude/settings.local.json +0 -25
  261. package/.npm-cache/_cacache/content-v2/sha512/04/76/c098f88dfe584a2b80870bff7421b05d17d3d9ee1027f77772332a22d3f93a9a57101a2855107f6ad82077a818bba912b2bc317f2361b5ddb09ad284d9ce +0 -0
  262. package/.npm-cache/_cacache/content-v2/sha512/60/25/d2ecd39cfc7cab58351162814be77f935c6d6491c10c3745d456da7ddb2117ffd90c10e53fe3c0f1ed16b403307841543634504398b16ee4e6b6dd8e0c45 +0 -0
  263. package/.npm-cache/_cacache/index-v5/2b/9a/7f8f40206ed8a2e0a84efaa953ccaed1f5d001e14b931083f2e7a0738007 +0 -2
  264. package/.npm-cache/_cacache/index-v5/2e/d9/fcfa5c6a6abdc2a3644ab84a95936047298c465a2f47ee03db8f7fe1e946 +0 -3
  265. package/.npm-cache/_cacache/index-v5/a9/42/e519633356d12d3d2f19da66a8301016d496c8f5c3e0554124aaa62dc043 +0 -2
  266. package/.npm-cache/_logs/2026-02-26T12_04_52_729Z-debug-0.log +0 -256
  267. package/.npm-cache/_logs/2026-02-26T12_05_36_835Z-debug-0.log +0 -18
  268. package/.npm-cache/_logs/2026-02-26T12_05_45_982Z-debug-0.log +0 -32
  269. package/.npm-cache/_logs/2026-02-26T12_05_48_515Z-debug-0.log +0 -260
  270. package/.npm-cache/_logs/2026-02-26T12_05_53_567Z-debug-0.log +0 -69
  271. package/.npm-cache/_update-notifier-last-checked +0 -0
  272. package/bootstrap-kb/decisions/decisions.md +0 -244
  273. package/bootstrap-kb/glossary/glossary.md +0 -46
  274. package/bootstrap-kb/modules/.claude-plugin.md +0 -22
  275. package/bootstrap-kb/modules/agents.md.md +0 -15
  276. package/bootstrap-kb/modules/claude.md.md +0 -15
  277. package/bootstrap-kb/modules/context.md.md +0 -15
  278. package/bootstrap-kb/modules/docs.md +0 -18
  279. package/bootstrap-kb/modules/handoff.md.md +0 -15
  280. package/bootstrap-kb/modules/package-lock.json.md +0 -15
  281. package/bootstrap-kb/modules/package.json.md +0 -15
  282. package/bootstrap-kb/modules/plan.md.md +0 -15
  283. package/bootstrap-kb/modules/readme.md.md +0 -15
  284. package/bootstrap-kb/modules/scripts.md +0 -26
  285. package/bootstrap-kb/modules/spec.md.md +0 -15
  286. package/bootstrap-kb/modules/specs.md +0 -20
  287. package/bootstrap-kb/modules/src.md +0 -51
  288. package/bootstrap-kb/modules/tests.md +0 -42
  289. package/bootstrap-kb/modules/tsconfig.json.md +0 -15
  290. package/bootstrap-kb/modules/vitest.config.ts.md +0 -15
  291. package/bootstrap-kb/overview/overview.md +0 -40
  292. package/bootstrap-kb/sources/manifest.json +0 -950
  293. package/bootstrap-kb/sources/manifest.md +0 -227
  294. package/bootstrap-kb/timeline/timeline.md +0 -57
  295. package/claude-memory-layer-1.0.14.tgz +0 -0
  296. package/d.sh +0 -3
  297. package/deploy.sh +0 -3
  298. package/dist/ui/app.js +0 -2101
  299. package/memory/.claude-plugin/commands/2026-02-25.md +0 -263
  300. package/memory/_index.md +0 -419
  301. package/memory/agent_response/uncategorized/2026-02-26.md +0 -176
  302. package/memory/agent_response/uncategorized/2026-03-03.md +0 -14
  303. package/memory/agent_response/uncategorized/2026-03-04.md +0 -1421
  304. package/memory/agent_response/uncategorized/2026-03-05.md +0 -157
  305. package/memory/default/uncategorized/2026-02-25.md +0 -4839
  306. package/memory/session_summary/uncategorized/2026-02-26.md +0 -13
  307. package/memory/session_summary/uncategorized/2026-03-03.md +0 -5
  308. package/memory/session_summary/uncategorized/2026-03-04.md +0 -50
  309. package/memory/specs/20260207-dashboard-upgrade/2026-02-25.md +0 -142
  310. package/memory/specs/citations-system/2026-02-25.md +0 -1121
  311. package/memory/specs/endless-mode/2026-02-25.md +0 -1392
  312. package/memory/specs/entity-edge-model/2026-02-25.md +0 -1263
  313. package/memory/specs/evidence-aligner-v2/2026-02-25.md +0 -1028
  314. package/memory/specs/mcp-desktop-integration/2026-02-25.md +0 -1334
  315. package/memory/specs/post-tool-use-hook/2026-02-25.md +0 -1164
  316. package/memory/specs/private-tags/2026-02-25.md +0 -1057
  317. package/memory/specs/progressive-disclosure/2026-02-25.md +0 -1436
  318. package/memory/specs/task-entity-system/2026-02-25.md +0 -924
  319. package/memory/specs/vector-outbox-v2/2026-02-25.md +0 -1510
  320. package/memory/specs/web-viewer-ui/2026-02-25.md +0 -1709
  321. package/memory/tool_observation/uncategorized/2026-02-26.md +0 -209
  322. package/memory/tool_observation/uncategorized/2026-03-03.md +0 -21
  323. package/memory/tool_observation/uncategorized/2026-03-04.md +0 -1033
  324. package/memory/tool_observation/uncategorized/2026-03-05.md +0 -33
  325. package/memory/user_prompt/uncategorized/2026-02-26.md +0 -25
  326. package/memory/user_prompt/uncategorized/2026-03-04.md +0 -634
  327. package/memory/user_prompt/uncategorized/2026-03-05.md +0 -6
  328. package/specs/optional-duckdb/context.md +0 -77
  329. package/specs/optional-duckdb/plan.md +0 -142
  330. package/specs/optional-duckdb/spec.md +0 -35
  331. package/src/ui/app.js +0 -2101
@@ -0,0 +1,117 @@
1
+ export interface ReplayMetricInput {
2
+ queryId: string;
3
+ expectedIds: string[];
4
+ retrievedIds: string[];
5
+ /** Optional graded qrels labels. Missing expected ids default to relevance 1. */
6
+ expectedRelevance?: Record<string, number>;
7
+ }
8
+
9
+ export interface PrecisionRecallAtK {
10
+ precision: number;
11
+ recall: number;
12
+ hits: number;
13
+ ndcg: number;
14
+ }
15
+
16
+ export interface ReplayQueryMetrics {
17
+ queryId: string;
18
+ at: Record<number, PrecisionRecallAtK>;
19
+ }
20
+
21
+ export interface ReplayMetricsSummary {
22
+ queryCount: number;
23
+ precisionAtK: Record<number, number>;
24
+ recallAtK: Record<number, number>;
25
+ ndcgAtK: Record<number, number>;
26
+ }
27
+
28
+ export function computePrecisionRecallAtK(
29
+ inputs: ReplayMetricInput[],
30
+ ks: number[]
31
+ ): ReplayQueryMetrics[] {
32
+ const normalizedKs = normalizeKs(ks);
33
+ return inputs.map((input) => {
34
+ const expected = new Set(input.expectedIds);
35
+ const relevance = normalizeRelevance(input.expectedIds, input.expectedRelevance);
36
+ const at: Record<number, PrecisionRecallAtK> = {};
37
+
38
+ for (const k of normalizedKs) {
39
+ const retrieved = input.retrievedIds.slice(0, k);
40
+ const hits = new Set(retrieved.filter((id) => expected.has(id))).size;
41
+ at[k] = {
42
+ precision: k === 0 ? 0 : hits / k,
43
+ recall: expected.size === 0 ? 0 : hits / expected.size,
44
+ hits,
45
+ ndcg: computeNdcgAtK(retrieved, relevance, k)
46
+ };
47
+ }
48
+
49
+ return { queryId: input.queryId, at };
50
+ });
51
+ }
52
+
53
+ export function summarizeReplayMetrics(
54
+ metrics: ReplayQueryMetrics[],
55
+ ks: number[]
56
+ ): ReplayMetricsSummary {
57
+ const normalizedKs = normalizeKs(ks);
58
+ const precisionAtK: Record<number, number> = {};
59
+ const recallAtK: Record<number, number> = {};
60
+ const ndcgAtK: Record<number, number> = {};
61
+
62
+ for (const k of normalizedKs) {
63
+ precisionAtK[k] = average(metrics.map((metric) => metric.at[k]?.precision ?? 0));
64
+ recallAtK[k] = average(metrics.map((metric) => metric.at[k]?.recall ?? 0));
65
+ ndcgAtK[k] = average(metrics.map((metric) => metric.at[k]?.ndcg ?? 0));
66
+ }
67
+
68
+ return { queryCount: metrics.length, precisionAtK, recallAtK, ndcgAtK };
69
+ }
70
+
71
+ function normalizeKs(ks: number[]): number[] {
72
+ const seen = new Set<number>();
73
+ const normalized: number[] = [];
74
+
75
+ for (const rawK of ks) {
76
+ const k = Math.max(0, Math.floor(rawK));
77
+ if (seen.has(k)) continue;
78
+ seen.add(k);
79
+ normalized.push(k);
80
+ }
81
+
82
+ return normalized.sort((a, b) => a - b);
83
+ }
84
+
85
+ function normalizeRelevance(expectedIds: string[], expectedRelevance?: Record<string, number>): Record<string, number> {
86
+ const relevance: Record<string, number> = {};
87
+ for (const id of expectedIds) {
88
+ const raw = expectedRelevance?.[id] ?? 1;
89
+ relevance[id] = Number.isFinite(raw) ? Math.max(0, raw) : 0;
90
+ }
91
+ return relevance;
92
+ }
93
+
94
+ function computeNdcgAtK(retrieved: string[], relevance: Record<string, number>, k: number): number {
95
+ if (k <= 0) return 0;
96
+
97
+ const seen = new Set<string>();
98
+ const dcg = retrieved.reduce((sum, id, index) => {
99
+ if (seen.has(id)) return sum;
100
+ seen.add(id);
101
+ return sum + discountedGain(relevance[id] ?? 0, index);
102
+ }, 0);
103
+
104
+ const idealRelevance = Object.values(relevance).sort((a, b) => b - a).slice(0, k);
105
+ const idealDcg = idealRelevance.reduce((sum, rel, index) => sum + discountedGain(rel, index), 0);
106
+ return idealDcg === 0 ? 0 : dcg / idealDcg;
107
+ }
108
+
109
+ function discountedGain(relevance: number, zeroBasedRank: number): number {
110
+ if (relevance <= 0) return 0;
111
+ return (2 ** relevance - 1) / Math.log2(zeroBasedRank + 2);
112
+ }
113
+
114
+ function average(values: number[]): number {
115
+ if (values.length === 0) return 0;
116
+ return values.reduce((sum, value) => sum + value, 0) / values.length;
117
+ }
@@ -0,0 +1,109 @@
1
+ /**
2
+ * Retrieval quality guards.
3
+ *
4
+ * These are deliberately small deterministic heuristics used to avoid injecting
5
+ * obviously irrelevant memories. They are not a second source of truth; they
6
+ * only filter candidate retrieval results before context assembly.
7
+ */
8
+
9
+ const COMMAND_ARTIFACT_PATTERNS = [
10
+ /<\/?(?:local-command-(?:stdout|stderr)|command-(?:name|message))\b/i,
11
+ /<command-name>[\s\S]*?<\/command-name>/i,
12
+ /<local-command-stdout>[\s\S]*?<\/local-command-stdout>/i,
13
+ /<local-command-stderr>[\s\S]*?<\/local-command-stderr>/i
14
+ ];
15
+
16
+ const LOW_SIGNAL_CONTEXT_PATTERNS = [
17
+ /<environment_context\b[\s\S]*<\/environment_context>/i,
18
+ /<turn_aborted>/i,
19
+ /^#\s*AGENTS\.md\s+instructions\b[\s\S]*<INSTRUCTIONS>/i,
20
+ /^\s*(?:understood[,\s.]*)?(?:stopping|stopped|pausing|paused)\s+here\b[\s\S]{0,180}\blet\s+me\s+know\s+when\s+you(?:'d|\s+would)?\s+like\s+to\s+continue\b/i,
21
+ /^➜\s+\S+\s+git:\([^)]*\)\s+/i,
22
+ /^\$\s+\S+/i
23
+ ];
24
+
25
+ const CONTINUATION_QUERY_PATTERNS = [
26
+ /^\s*(?:continue|resume|next|what(?:'s| is)? next|next\s+(?:step|task|action)|recommended\s+(?:next\s+)?(?:step|task|action)|what should (?:we|i) do next)\??\s*$/i,
27
+ /^\s*(?:이어서(?:\s*진행해줘)?|계속(?:\s*해줘)?|다음\s*(?:단계|작업|추천\s*작업|추천|할\s*일)?(?:은|는)?(?:\s*뭐야)?\??|추천\s*작업(?:은|는)?(?:\s*뭐야)?\??|진행해줘)\s*$/i
28
+ ];
29
+
30
+ const GENERIC_TECHNICAL_TERMS = new Set([
31
+ 'api',
32
+ 'cli',
33
+ 'ui',
34
+ 'json',
35
+ 'jsonl',
36
+ 'html',
37
+ 'http',
38
+ 'https',
39
+ 'url',
40
+ 'uri',
41
+ 'id',
42
+ 'ids',
43
+ 'uuid',
44
+ 'db',
45
+ 'sql'
46
+ ]);
47
+
48
+ export function isCommandArtifactQuery(query: string): boolean {
49
+ const trimmed = query.trim();
50
+ if (!trimmed) return false;
51
+ const normalized = trimmed.toLowerCase();
52
+ if (normalized.includes('local-command-stdout') || normalized.includes('local-command-stderr')) return true;
53
+ if (normalized.includes('command-name') || normalized.includes('command-message')) return true;
54
+ return COMMAND_ARTIFACT_PATTERNS.some((pattern) => pattern.test(trimmed));
55
+ }
56
+
57
+ export function isCommandArtifactContent(content: string): boolean {
58
+ const trimmed = content.trim();
59
+ if (!trimmed) return false;
60
+ const normalized = trimmed.toLowerCase();
61
+ if (normalized.includes('local-command-stdout') || normalized.includes('local-command-stderr')) return true;
62
+ if (normalized.includes('command-name') || normalized.includes('command-message')) return true;
63
+ return COMMAND_ARTIFACT_PATTERNS.some((pattern) => pattern.test(trimmed));
64
+ }
65
+
66
+ export function isLowSignalContextContent(content: string): boolean {
67
+ const trimmed = content.trim();
68
+ if (!trimmed) return true;
69
+ if (isCommandArtifactContent(trimmed)) return true;
70
+ if (LOW_SIGNAL_CONTEXT_PATTERNS.some((pattern) => pattern.test(trimmed))) return true;
71
+ return false;
72
+ }
73
+
74
+ export function isGenericContinuationQuery(query: string): boolean {
75
+ const trimmed = query.trim();
76
+ if (!trimmed) return false;
77
+ if (!CONTINUATION_QUERY_PATTERNS.some((pattern) => pattern.test(trimmed))) return false;
78
+ if (extractTechnicalQueryTerms(trimmed).length > 0) return false;
79
+
80
+ const tokens = trimmed.match(/[A-Za-z0-9가-힣#._/-]+/g) ?? [];
81
+ if (tokens.length > 10) return false;
82
+
83
+ return !/[A-Za-z0-9_-]+\.[A-Za-z0-9]+/.test(trimmed) &&
84
+ !/(?:^|\s)(?:feat|fix|chore|refactor|docs)\/[A-Za-z0-9._-]+/.test(trimmed) &&
85
+ !/[A-Za-z]:?[\\/]|\/Users\/|\.\/|\.\.\//.test(trimmed);
86
+ }
87
+
88
+ export function extractTechnicalQueryTerms(query: string): string[] {
89
+ const matches = query.match(/[A-Za-z][A-Za-z0-9_.:-]{2,}/g) ?? [];
90
+ const terms = matches.filter((term) => {
91
+ const lower = term.toLowerCase();
92
+ if (GENERIC_TECHNICAL_TERMS.has(lower)) return false;
93
+ return /[._:-]/.test(term) || /[a-z][A-Z]/.test(term) || /[A-Z]{2,}/.test(term) || /\d/.test(term);
94
+ });
95
+
96
+ return Array.from(new Set(terms.map((term) => term.toLowerCase())));
97
+ }
98
+
99
+ export function hasTechnicalTermOverlap(query: string, content: string): boolean {
100
+ const terms = extractTechnicalQueryTerms(query);
101
+ if (terms.length === 0) return true;
102
+
103
+ const normalizedContent = content.toLowerCase();
104
+ return terms.some((term) => normalizedContent.includes(term));
105
+ }
106
+
107
+ export function shouldApplyTechnicalGuard(query: string): boolean {
108
+ return extractTechnicalQueryTerms(query).length > 0;
109
+ }
@@ -10,6 +10,11 @@ import { Matcher } from './matcher.js';
10
10
  import { SharedStore } from './shared-store.js';
11
11
  import { SharedVectorStore } from './shared-vector-store.js';
12
12
  import { GraduationPipeline } from './graduation.js';
13
+ import {
14
+ hasTechnicalTermOverlap,
15
+ isCommandArtifactQuery,
16
+ shouldApplyTechnicalGuard
17
+ } from './retrieval-quality.js';
13
18
  import type { MemoryEvent, MatchResult, SharedTroubleshootingEntry } from './types.js';
14
19
 
15
20
  export interface RetrievalScope {
@@ -23,6 +28,8 @@ export interface RetrievalScope {
23
28
 
24
29
  export type RetrievalStrategy = 'auto' | 'fast' | 'deep';
25
30
  export type ProjectScopeMode = 'strict' | 'prefer' | 'global';
31
+ type DecayPolicy = NonNullable<RetrievalOptions['decayPolicy']>;
32
+ type GraphHopOptions = NonNullable<RetrievalOptions['graphHop']>;
26
33
 
27
34
  export interface RetrievalOptions {
28
35
  topK: number;
@@ -166,6 +173,20 @@ export class Retriever {
166
173
  const sessionFilter = opts.scope?.sessionId ?? opts.sessionId;
167
174
  const fallbackTrace: string[] = [];
168
175
 
176
+ if (isCommandArtifactQuery(query)) {
177
+ fallbackTrace.push('guard:command-artifact-query');
178
+ const emptyMatch = this.matcher.matchSearchResults([], () => 0);
179
+ return {
180
+ memories: [],
181
+ matchResult: emptyMatch,
182
+ totalTokens: 0,
183
+ context: '',
184
+ fallbackTrace,
185
+ selectedDebug: [],
186
+ candidateDebug: []
187
+ };
188
+ }
189
+
169
190
  const fallbackEnabled = (opts.strategy ?? 'auto') === 'auto';
170
191
 
171
192
  // Stage 1: primary retrieval
@@ -311,28 +332,21 @@ export class Retriever {
311
332
  minScore: number;
312
333
  sessionId?: string;
313
334
  scope?: RetrievalScope;
314
- rerankWithKeyword: boolean;
335
+ rerankWithKeyword?: boolean;
315
336
  rerankWeights?: {
316
337
  semantic?: number;
317
338
  lexical?: number;
318
339
  recency?: number;
319
340
  };
320
- decayPolicy?: {
321
- enabled?: boolean;
322
- windowDays?: number;
323
- maxPenalty?: number;
324
- };
341
+ decayPolicy?: DecayPolicy;
325
342
  intentRewrite?: boolean;
326
- graphHop?: {
327
- enabled?: boolean;
328
- maxHops?: number;
329
- hopPenalty?: number;
330
- };
343
+ graphHop?: GraphHopOptions;
331
344
  projectScopeMode?: ProjectScopeMode;
332
345
  projectHash?: string;
333
346
  allowedProjectHashes?: string[];
334
347
  }
335
- ): Promise<{ results: SearchResult[]; matchResult: MatchResult }> {
348
+ ): Promise<{ results: SearchResult[]; candidateResults: SearchResult[]; matchResult: MatchResult }> {
349
+ let rerankQuery = query;
336
350
  let initialResults = await this.searchByStrategy(query, {
337
351
  strategy: input.strategy,
338
352
  topK: input.topK,
@@ -343,6 +357,7 @@ export class Retriever {
343
357
  if (input.intentRewrite && input.strategy === 'deep' && this.queryRewriter) {
344
358
  const rewritten = (await this.queryRewriter(query))?.trim();
345
359
  if (rewritten && rewritten !== query) {
360
+ rerankQuery = `${query} ${rewritten}`;
346
361
  const rewrittenResults = await this.searchByStrategy(rewritten, {
347
362
  strategy: 'deep',
348
363
  topK: input.topK,
@@ -362,7 +377,7 @@ export class Retriever {
362
377
  });
363
378
 
364
379
  const rerankedResults = input.rerankWithKeyword
365
- ? this.rerankByKeywordOverlap(expandedResults, query, input.rerankWeights, input.decayPolicy)
380
+ ? this.rerankByKeywordOverlap(expandedResults, rerankQuery, input.rerankWeights, input.decayPolicy)
366
381
  : expandedResults;
367
382
 
368
383
  const filtered = await this.applyScopeFilters(rerankedResults, {
@@ -371,10 +386,33 @@ export class Retriever {
371
386
  projectHash: input.projectHash,
372
387
  allowedProjectHashes: input.allowedProjectHashes
373
388
  });
374
- const top = filtered.slice(0, input.topK);
389
+ const qualityFiltered = this.applyQualityFilters(filtered, {
390
+ query,
391
+ minScore: input.minScore
392
+ });
393
+ const top = qualityFiltered.slice(0, input.topK);
375
394
  const matchResult = this.matcher.matchSearchResults(top, () => 0);
376
395
 
377
- return { results: top, candidateResults: filtered, matchResult };
396
+ return { results: top, candidateResults: qualityFiltered, matchResult };
397
+ }
398
+
399
+ private applyQualityFilters(
400
+ results: Array<SearchResult & { semanticScore?: number; lexicalScore?: number; recencyScore?: number }>,
401
+ options: { query: string; minScore: number }
402
+ ): Array<SearchResult & { semanticScore?: number; lexicalScore?: number; recencyScore?: number }> {
403
+ let filtered = [...results];
404
+
405
+ if (shouldApplyTechnicalGuard(options.query)) {
406
+ filtered = filtered.filter((result) => hasTechnicalTermOverlap(options.query, result.content));
407
+ }
408
+
409
+ if (filtered.length <= 2) return filtered;
410
+
411
+ const topScore = filtered[0].score;
412
+ if (topScore < 0.8) return filtered;
413
+
414
+ const cliffThreshold = Math.max(options.minScore, topScore - 0.25);
415
+ return filtered.filter((result) => result.score >= cliffThreshold);
378
416
  }
379
417
 
380
418
  private mergeResults(primary: SearchResult[], secondary: SearchResult[], limit: number): SearchResult[] {