claude-memory-layer 1.0.31 → 1.0.32

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (313)
  1. package/README.md +9 -2
  2. package/dist/cli/index.js +1 -1
  3. package/package.json +11 -2
  4. package/scripts/postinstall-embedding-backend.cjs +16 -12
  5. package/AGENTS.md +0 -71
  6. package/CLAUDE.md +0 -30
  7. package/HANDOFF.md +0 -92
  8. package/Memo.txt +0 -558
  9. package/benchmarks/replay/anonymized-real-sessions.json +0 -48
  10. package/config/kpi-thresholds.json +0 -7
  11. package/context.md +0 -636
  12. package/docs/ARCHITECTURE_COMPARISON_AND_RECOMMENDATIONS.md +0 -627
  13. package/docs/HERMES_MEMORY_INGESTION_ANALYSIS.md +0 -440
  14. package/docs/MCP_MEMORY_SERVICE_COMPARATIVE_REVIEW.md +0 -271
  15. package/docs/MEMORY_USEFULNESS_AUDIT.md +0 -371
  16. package/docs/MEMORY_USEFULNESS_AUDIT_RAW.json +0 -80
  17. package/docs/MEMSEARCH_PROJECT_STRUCTURE_ANALYSIS.md +0 -333
  18. package/docs/MEMU_ADOPTION.md +0 -40
  19. package/docs/OPERATIONS.md +0 -18
  20. package/docs/PRODUCT_VALIDATION_MATRIX.md +0 -82
  21. package/docs/PROJECT_STRUCTURE_ANALYSIS.md +0 -421
  22. package/docs/REFACTORING_MILESTONES_AND_ISSUES.md +0 -501
  23. package/docs/REFACTORING_PLAN_THIN_CORE.md +0 -414
  24. package/docs/REFERENCE_PROJECT_ANALYSES.md +0 -25
  25. package/docs/SUPERLOCALMEMORY_PROJECT_STRUCTURE_ANALYSIS.md +0 -452
  26. package/docs/TARGET_ARCHITECTURE_AND_FOLDER_STRUCTURE.md +0 -446
  27. package/docs/architecture/comparison-index.md +0 -47
  28. package/docs/reports/codex-real-data-validation-20260505T040447Z.md +0 -46
  29. package/plan.md +0 -1642
  30. package/scripts/build.ts +0 -159
  31. package/scripts/bump-patch-version.sh +0 -18
  32. package/scripts/delete-unknown-projects.js +0 -154
  33. package/scripts/fix-sync-gap.js +0 -32
  34. package/scripts/generate-session-qrels.ts +0 -126
  35. package/scripts/heartbeat-memory-orchestrator.sh +0 -28
  36. package/scripts/replay-retrieval-benchmark.ts +0 -69
  37. package/scripts/report-sync-gap.js +0 -26
  38. package/scripts/review-queue-auto-resolve.js +0 -21
  39. package/scripts/sync-gap-auto-heal.sh +0 -17
  40. package/spec.md +0 -624
  41. package/specs/20260207-dashboard-upgrade/context.md +0 -38
  42. package/specs/20260207-dashboard-upgrade/spec.md +0 -96
  43. package/specs/citations-system/context.md +0 -243
  44. package/specs/citations-system/plan.md +0 -495
  45. package/specs/citations-system/spec.md +0 -371
  46. package/specs/endless-mode/context.md +0 -305
  47. package/specs/endless-mode/plan.md +0 -620
  48. package/specs/endless-mode/spec.md +0 -455
  49. package/specs/entity-edge-model/context.md +0 -401
  50. package/specs/entity-edge-model/plan.md +0 -459
  51. package/specs/entity-edge-model/spec.md +0 -391
  52. package/specs/evidence-aligner-v2/context.md +0 -401
  53. package/specs/evidence-aligner-v2/plan.md +0 -303
  54. package/specs/evidence-aligner-v2/spec.md +0 -312
  55. package/specs/mcp-desktop-integration/context.md +0 -278
  56. package/specs/mcp-desktop-integration/plan.md +0 -550
  57. package/specs/mcp-desktop-integration/spec.md +0 -494
  58. package/specs/memory-utilization-improvements/context.md +0 -145
  59. package/specs/memory-utilization-improvements/plan.md +0 -361
  60. package/specs/memory-utilization-improvements/spec.md +0 -361
  61. package/specs/post-tool-use-hook/context.md +0 -319
  62. package/specs/post-tool-use-hook/plan.md +0 -469
  63. package/specs/post-tool-use-hook/spec.md +0 -364
  64. package/specs/private-tags/context.md +0 -288
  65. package/specs/private-tags/plan.md +0 -412
  66. package/specs/private-tags/spec.md +0 -345
  67. package/specs/progressive-disclosure/context.md +0 -346
  68. package/specs/progressive-disclosure/plan.md +0 -663
  69. package/specs/progressive-disclosure/spec.md +0 -415
  70. package/specs/selective-tool-observation/context.md +0 -100
  71. package/specs/selective-tool-observation/plan.md +0 -158
  72. package/specs/selective-tool-observation/spec.md +0 -127
  73. package/specs/task-entity-system/context.md +0 -297
  74. package/specs/task-entity-system/plan.md +0 -301
  75. package/specs/task-entity-system/spec.md +0 -314
  76. package/specs/thin-core-refactor/context.md +0 -275
  77. package/specs/thin-core-refactor/plan.md +0 -536
  78. package/specs/thin-core-refactor/spec.md +0 -465
  79. package/specs/vector-outbox-v2/context.md +0 -470
  80. package/specs/vector-outbox-v2/plan.md +0 -562
  81. package/specs/vector-outbox-v2/spec.md +0 -466
  82. package/specs/web-viewer-ui/context.md +0 -384
  83. package/specs/web-viewer-ui/plan.md +0 -797
  84. package/specs/web-viewer-ui/spec.md +0 -516
  85. package/src/adapters/claude/capture/index.ts +0 -3
  86. package/src/adapters/claude/context/index.ts +0 -3
  87. package/src/adapters/claude/hooks/index.ts +0 -21
  88. package/src/adapters/claude/hooks/post-tool-use.ts +0 -239
  89. package/src/adapters/claude/hooks/prompt-injection-policy.ts +0 -104
  90. package/src/adapters/claude/hooks/semantic-daemon-client.ts +0 -209
  91. package/src/adapters/claude/hooks/semantic-daemon.ts +0 -283
  92. package/src/adapters/claude/hooks/session-end.ts +0 -59
  93. package/src/adapters/claude/hooks/session-start.ts +0 -73
  94. package/src/adapters/claude/hooks/stop.ts +0 -128
  95. package/src/adapters/claude/hooks/user-prompt-submit.ts +0 -361
  96. package/src/adapters/claude/index.ts +0 -4
  97. package/src/adapters/claude/transcript/index.ts +0 -4
  98. package/src/adapters/claude/transcript/transcript-reader.ts +0 -57
  99. package/src/adapters/claude/transcript/turn-reconstructor.ts +0 -65
  100. package/src/apps/cli/claude-settings-hooks.ts +0 -138
  101. package/src/apps/cli/codex-import-runner.ts +0 -125
  102. package/src/apps/cli/codex-validation-output.ts +0 -95
  103. package/src/apps/cli/hermes-import-runner.ts +0 -130
  104. package/src/apps/cli/hermes-validation-output.ts +0 -91
  105. package/src/apps/cli/index.ts +0 -1735
  106. package/src/apps/cli/mcp-install.ts +0 -106
  107. package/src/apps/cli/retrieval-disclosure-output.ts +0 -196
  108. package/src/apps/dashboard/assets/js/bootstrap.js +0 -244
  109. package/src/apps/dashboard/assets/js/chat.js +0 -373
  110. package/src/apps/dashboard/assets/js/disclosure.js +0 -232
  111. package/src/apps/dashboard/assets/js/modals.js +0 -298
  112. package/src/apps/dashboard/assets/js/overview.js +0 -655
  113. package/src/apps/dashboard/assets/js/state.js +0 -72
  114. package/src/apps/dashboard/assets/js/views.js +0 -468
  115. package/src/apps/dashboard/index.html +0 -543
  116. package/src/apps/dashboard/index.ts +0 -3
  117. package/src/apps/dashboard/style.css +0 -1750
  118. package/src/apps/index.ts +0 -5
  119. package/src/apps/server/api/chat.ts +0 -244
  120. package/src/apps/server/api/citations.ts +0 -105
  121. package/src/apps/server/api/events.ts +0 -137
  122. package/src/apps/server/api/health.ts +0 -53
  123. package/src/apps/server/api/index.ts +0 -26
  124. package/src/apps/server/api/projects.ts +0 -74
  125. package/src/apps/server/api/search.ts +0 -184
  126. package/src/apps/server/api/sessions.ts +0 -115
  127. package/src/apps/server/api/stats.ts +0 -723
  128. package/src/apps/server/api/turns.ts +0 -143
  129. package/src/apps/server/api/utils.ts +0 -65
  130. package/src/apps/server/index.ts +0 -111
  131. package/src/cli/index.ts +0 -3
  132. package/src/cli/retrieval-disclosure-output.ts +0 -2
  133. package/src/compat/index.ts +0 -5
  134. package/src/core/canonical-key.ts +0 -186
  135. package/src/core/citation-generator.ts +0 -63
  136. package/src/core/consolidated-store.ts +0 -356
  137. package/src/core/consolidation-worker.ts +0 -493
  138. package/src/core/context-formatter.ts +0 -276
  139. package/src/core/continuity-manager.ts +0 -341
  140. package/src/core/db-wrapper.ts +0 -64
  141. package/src/core/derive/fact-deriver.ts +0 -170
  142. package/src/core/derive/index.ts +0 -2
  143. package/src/core/derive/summary-deriver.ts +0 -76
  144. package/src/core/edge-repo.ts +0 -333
  145. package/src/core/embedder.ts +0 -4
  146. package/src/core/engine/embedding-maintenance-service.ts +0 -187
  147. package/src/core/engine/endless-memory-services.ts +0 -4
  148. package/src/core/engine/index.ts +0 -19
  149. package/src/core/engine/memory-engine-services.ts +0 -170
  150. package/src/core/engine/memory-ingest-service.ts +0 -317
  151. package/src/core/engine/memory-query-service.ts +0 -173
  152. package/src/core/engine/memory-runtime-service.ts +0 -162
  153. package/src/core/engine/memory-service-composition.ts +0 -231
  154. package/src/core/engine/retrieval-analytics-service.ts +0 -181
  155. package/src/core/engine/retrieval-disclosure-service.ts +0 -420
  156. package/src/core/engine/retrieval-orchestrator.ts +0 -377
  157. package/src/core/engine/retrieval-services.ts +0 -176
  158. package/src/core/engine/shared-memory-services.ts +0 -4
  159. package/src/core/entity-repo.ts +0 -349
  160. package/src/core/event-store.ts +0 -779
  161. package/src/core/evidence-aligner.ts +0 -635
  162. package/src/core/external-market-context.ts +0 -582
  163. package/src/core/graduation-worker.ts +0 -171
  164. package/src/core/graduation.ts +0 -377
  165. package/src/core/index.ts +0 -64
  166. package/src/core/ingest-interceptor.ts +0 -80
  167. package/src/core/markdown-mirror.ts +0 -70
  168. package/src/core/matcher.ts +0 -208
  169. package/src/core/md-mirror.ts +0 -92
  170. package/src/core/metadata-extractor.ts +0 -203
  171. package/src/core/model/memory-fact.ts +0 -30
  172. package/src/core/model/memory-rule.ts +0 -14
  173. package/src/core/model/memory-summary.ts +0 -21
  174. package/src/core/model/raw-event.ts +0 -28
  175. package/src/core/model/retrieval-result.ts +0 -35
  176. package/src/core/mongo-sync-config.ts +0 -165
  177. package/src/core/mongo-sync-worker.ts +0 -381
  178. package/src/core/privacy/filter.ts +0 -190
  179. package/src/core/privacy/index.ts +0 -20
  180. package/src/core/privacy/tag-parser.ts +0 -145
  181. package/src/core/product-validation-matrix.ts +0 -314
  182. package/src/core/progressive-retriever.ts +0 -414
  183. package/src/core/registry/project-path.ts +0 -54
  184. package/src/core/registry/session-registry.ts +0 -69
  185. package/src/core/replay-evaluator.ts +0 -625
  186. package/src/core/retrieval-benchmark.ts +0 -117
  187. package/src/core/retrieval-quality.ts +0 -109
  188. package/src/core/retriever.ts +0 -800
  189. package/src/core/session-qrels.ts +0 -360
  190. package/src/core/shared-event-store.ts +0 -114
  191. package/src/core/shared-promoter.ts +0 -249
  192. package/src/core/shared-store.ts +0 -289
  193. package/src/core/shared-vector-store.ts +0 -203
  194. package/src/core/sqlite-event-store.ts +0 -1846
  195. package/src/core/sqlite-wrapper.ts +0 -116
  196. package/src/core/sync-worker.ts +0 -228
  197. package/src/core/tag-taxonomy.ts +0 -51
  198. package/src/core/task/blocker-resolver.ts +0 -333
  199. package/src/core/task/index.ts +0 -9
  200. package/src/core/task/task-matcher.ts +0 -240
  201. package/src/core/task/task-projector.ts +0 -358
  202. package/src/core/task/task-resolver.ts +0 -421
  203. package/src/core/turn-state.ts +0 -207
  204. package/src/core/types.ts +0 -952
  205. package/src/core/vector-outbox.ts +0 -299
  206. package/src/core/vector-store.ts +0 -231
  207. package/src/core/vector-worker.ts +0 -521
  208. package/src/core/working-set-store.ts +0 -257
  209. package/src/extensions/endless-memory/endless-memory-services.ts +0 -350
  210. package/src/extensions/endless-memory/index.ts +0 -1
  211. package/src/extensions/index.ts +0 -5
  212. package/src/extensions/mcp/handlers.ts +0 -960
  213. package/src/extensions/mcp/index.ts +0 -48
  214. package/src/extensions/mcp/tools.ts +0 -252
  215. package/src/extensions/shared-memory/index.ts +0 -1
  216. package/src/extensions/shared-memory/shared-memory-services.ts +0 -211
  217. package/src/extensions/vector/embedder.ts +0 -234
  218. package/src/extensions/vector/index.ts +0 -1
  219. package/src/hooks/post-tool-use.ts +0 -9
  220. package/src/hooks/semantic-daemon-client.ts +0 -1
  221. package/src/hooks/semantic-daemon.ts +0 -11
  222. package/src/hooks/session-end.ts +0 -9
  223. package/src/hooks/session-start.ts +0 -9
  224. package/src/hooks/stop.ts +0 -9
  225. package/src/hooks/user-prompt-submit.ts +0 -9
  226. package/src/index.ts +0 -13
  227. package/src/mcp/handlers.ts +0 -2
  228. package/src/mcp/index.ts +0 -4
  229. package/src/mcp/tools.ts +0 -2
  230. package/src/server/api/chat.ts +0 -2
  231. package/src/server/api/citations.ts +0 -2
  232. package/src/server/api/events.ts +0 -2
  233. package/src/server/api/health.ts +0 -2
  234. package/src/server/api/index.ts +0 -2
  235. package/src/server/api/projects.ts +0 -2
  236. package/src/server/api/search.ts +0 -2
  237. package/src/server/api/sessions.ts +0 -2
  238. package/src/server/api/stats.ts +0 -2
  239. package/src/server/api/turns.ts +0 -2
  240. package/src/server/api/utils.ts +0 -2
  241. package/src/server/index.ts +0 -2
  242. package/src/services/bootstrap-organizer.ts +0 -463
  243. package/src/services/codex-session-history-importer.ts +0 -966
  244. package/src/services/hermes-session-history-importer.ts +0 -733
  245. package/src/services/memory-service-config.ts +0 -36
  246. package/src/services/memory-service-registry.ts +0 -150
  247. package/src/services/memory-service.ts +0 -688
  248. package/src/services/session-history-importer.ts +0 -629
  249. package/tests/README.md +0 -23
  250. package/tests/adapters/claude/claude-semantic-daemon-adapter.test.ts +0 -54
  251. package/tests/adapters/claude/claude-transcript-reconstructor.test.ts +0 -98
  252. package/tests/adapters/claude-hook-prompt-injection-policy.test.ts +0 -99
  253. package/tests/apps/app-layer-boundary.test.ts +0 -48
  254. package/tests/apps/claude-settings-hooks.test.ts +0 -107
  255. package/tests/apps/cli-disclosure-output.test.ts +0 -212
  256. package/tests/apps/codex-import-runner.test.ts +0 -99
  257. package/tests/apps/codex-validation-output.test.ts +0 -100
  258. package/tests/apps/hermes-import-runner.test.ts +0 -99
  259. package/tests/apps/mcp-install-command.test.ts +0 -59
  260. package/tests/apps/package-build-entrypoints.test.ts +0 -30
  261. package/tests/apps/postinstall-embedding-backend.test.ts +0 -185
  262. package/tests/apps/search-api-disclosure.test.ts +0 -162
  263. package/tests/apps/stats-api-lightweight.test.ts +0 -67
  264. package/tests/apps/ui-disclosure-output.test.ts +0 -140
  265. package/tests/core/bootstrap-organizer.test.ts +0 -111
  266. package/tests/core/canonical-key.test.ts +0 -101
  267. package/tests/core/codex-session-history-importer-validation.test.ts +0 -185
  268. package/tests/core/consolidation-worker.test.ts +0 -75
  269. package/tests/core/embedding-maintenance-service.test.ts +0 -282
  270. package/tests/core/evidence-aligner.test.ts +0 -152
  271. package/tests/core/external-market-context.test.ts +0 -209
  272. package/tests/core/fact-deriver.test.ts +0 -79
  273. package/tests/core/hermes-session-history-importer-validation.test.ts +0 -609
  274. package/tests/core/ingest-interceptor.test.ts +0 -38
  275. package/tests/core/markdown-mirror.test.ts +0 -85
  276. package/tests/core/matcher.test.ts +0 -112
  277. package/tests/core/md-mirror.test.ts +0 -50
  278. package/tests/core/memory-engine-services.test.ts +0 -240
  279. package/tests/core/memory-ingest-service.test.ts +0 -296
  280. package/tests/core/memory-query-service.test.ts +0 -129
  281. package/tests/core/memory-runtime-service.test.ts +0 -201
  282. package/tests/core/memory-service-composition.test.ts +0 -192
  283. package/tests/core/memory-service-config.test.ts +0 -41
  284. package/tests/core/memory-service-facade.test.ts +0 -30
  285. package/tests/core/memory-service-registry.test.ts +0 -206
  286. package/tests/core/product-validation-matrix.test.ts +0 -61
  287. package/tests/core/project-registry.test.ts +0 -78
  288. package/tests/core/replay-evaluator.test.ts +0 -181
  289. package/tests/core/retrieval-analytics-service.test.ts +0 -210
  290. package/tests/core/retrieval-benchmark.test.ts +0 -93
  291. package/tests/core/retrieval-disclosure-service.test.ts +0 -264
  292. package/tests/core/retrieval-orchestrator.test.ts +0 -403
  293. package/tests/core/retrieval-quality.test.ts +0 -31
  294. package/tests/core/retrieval-services.test.ts +0 -185
  295. package/tests/core/retriever-fallback-chain.test.ts +0 -223
  296. package/tests/core/retriever-strategy-scope.test.ts +0 -164
  297. package/tests/core/retriever.memu-adoption.test.ts +0 -122
  298. package/tests/core/session-history-importer-filter.test.ts +0 -78
  299. package/tests/core/session-qrels.test.ts +0 -250
  300. package/tests/core/sqlite-event-store-replication.test.ts +0 -127
  301. package/tests/core/summary-deriver.test.ts +0 -66
  302. package/tests/extensions/embedder-warning-suppression.test.ts +0 -84
  303. package/tests/extensions/endless-memory-extension-boundary.test.ts +0 -17
  304. package/tests/extensions/endless-memory-services.test.ts +0 -325
  305. package/tests/extensions/mcp-context-tools.test.ts +0 -905
  306. package/tests/extensions/mcp-extension-boundary.test.ts +0 -21
  307. package/tests/extensions/mcp-package-build.test.ts +0 -22
  308. package/tests/extensions/mcp-project-aware-tools.test.ts +0 -102
  309. package/tests/extensions/shared-memory-extension-boundary.test.ts +0 -24
  310. package/tests/extensions/shared-memory-services.test.ts +0 -309
  311. package/tests/extensions/vector-extension-boundary.test.ts +0 -21
  312. package/tsconfig.json +0 -24
  313. package/vitest.config.ts +0 -15
@@ -1,466 +0,0 @@
1
- # Vector Outbox V2 Specification
2
-
3
- > **Version**: 2.0.0
4
- > **Status**: Draft
5
- > **Created**: 2026-01-31
6
-
7
- ## 1. 개요
8
-
9
- ### 1.1 문제 정의
10
-
11
- DuckDB와 LanceDB 간 데이터 정합성 문제:
12
-
13
- 1. **원자성 부재**: DuckDB 쓰기와 LanceDB 쓰기가 별도 트랜잭션
14
- 2. **중복 벡터**: 재처리 시 같은 벡터가 중복 저장될 수 있음
15
- 3. **일관성 부재**: DuckDB에는 있지만 LanceDB에는 없는 상태 발생
16
- 4. **동시성**: 여러 프로세스가 동시에 벡터 저장 시 충돌
17
-
18
- ### 1.2 해결 방향
19
-
20
- **Transactional Outbox Pattern**:
21
- 1. DuckDB에 먼저 기록 (vector_outbox 테이블)
22
- 2. 단일 writer가 outbox를 처리하여 LanceDB에 upsert
23
- 3. 성공 시 outbox job의 status를 'done'으로 업데이트
24
-
25
- ## 2. 핵심 개념
26
-
27
- ### 2.1 Outbox 패턴 흐름
28
-
29
- ```
30
- Application DuckDB LanceDB
31
- │ │ │
32
- │ 1. Entry 저장 │ │
33
- ├────────────────────────▶│ │
34
- │ │ │
35
- │ 2. Outbox job 생성 │ │
36
- ├────────────────────────▶│ │
37
- │ │ │
38
- │ (트랜잭션 커밋) │ │
39
- │ │ │
40
- ┌─────┴─────┐
41
- │ Worker │
42
- └─────┬─────┘
43
- │ │
44
- │ 3. pending job 조회 │
45
- │◀────────────────────────│
46
- │ │
47
- │ 4. 임베딩 생성 │
48
- │ │
49
- │ 5. LanceDB upsert │
50
- │─────────────────────────▶│
51
- │ │
52
- │ 6. status='done' 업데이트 │
53
- │────────────────────────▶│
54
- ```
55
-
56
- ### 2.2 Job 상태 머신
57
-
58
- ```
59
- ┌─────────┐ Worker 픽업 ┌────────────┐
60
- │ pending │ ──────────────────▶ │ processing │
61
- └─────────┘ └──────┬─────┘
62
- │ │
63
- │ 재시도 (reconcile) │
64
- │ │
65
- │ ┌───────────────────────┼───────────────────────┐
66
- │ │ │ │
67
- │ ▼ ▼ ▼
68
- │ ┌─────────┐ ┌──────────┐ ┌─────────┐
69
- └───▶│ pending │ │ done │ │ failed │
70
- └─────────┘ └──────────┘ └─────────┘
71
-
72
- │ retry < max
73
-
74
- ┌─────────┐
75
- │ pending │
76
- └─────────┘
77
- ```
78
-
79
- ### 2.3 Item 종류
80
-
81
- ```typescript
82
- type ItemKind =
83
- | 'entry' // entries 테이블의 content 임베딩
84
- | 'task_title' // entities 테이블의 task 제목 임베딩
85
- | 'session_summary' // 세션 요약 임베딩
86
- ;
87
- ```
88
-
89
- ## 3. DB 스키마
90
-
91
- ### 3.1 vector_outbox 테이블
92
-
93
- ```sql
94
- CREATE TABLE vector_outbox (
95
- job_id VARCHAR PRIMARY KEY,
96
- item_kind VARCHAR NOT NULL, -- entry|task_title|session_summary
97
- item_id VARCHAR NOT NULL,
98
- embedding_version VARCHAR NOT NULL, -- e.g., 'v1.0.0', 'minilm-v2'
99
- status VARCHAR NOT NULL, -- pending|processing|done|failed
100
- retry_count INTEGER DEFAULT 0,
101
- error VARCHAR,
102
- created_at TIMESTAMP DEFAULT CURRENT_TIMESTAMP,
103
- updated_at TIMESTAMP DEFAULT CURRENT_TIMESTAMP,
104
-
105
- -- 중복 방지: 같은 아이템+버전은 하나만
106
- UNIQUE(item_kind, item_id, embedding_version)
107
- );
108
-
109
- CREATE INDEX idx_outbox_status ON vector_outbox(status);
110
- CREATE INDEX idx_outbox_created ON vector_outbox(created_at);
111
- ```
112
-
113
- ### 3.2 vector_store_meta 테이블 (선택)
114
-
115
- ```sql
116
- -- LanceDB 테이블 메타데이터 추적
117
- CREATE TABLE vector_store_meta (
118
- table_name VARCHAR PRIMARY KEY, -- e.g., 'entry_vectors_v1'
119
- embedding_version VARCHAR NOT NULL,
120
- item_count INTEGER DEFAULT 0,
121
- last_sync_at TIMESTAMP,
122
- created_at TIMESTAMP DEFAULT CURRENT_TIMESTAMP
123
- );
124
- ```
125
-
126
- ## 4. Outbox API
127
-
128
- ### 4.1 Enqueue
129
-
130
- ```typescript
131
- interface OutboxEnqueueInput {
132
- itemKind: ItemKind;
133
- itemId: string;
134
- embeddingVersion: string;
135
- }
136
-
137
- interface VectorOutbox {
138
- // Job 추가 (중복 시 무시)
139
- enqueue(input: OutboxEnqueueInput): Promise<EnqueueResult>;
140
-
141
- // 배치 추가
142
- enqueueBatch(inputs: OutboxEnqueueInput[]): Promise<EnqueueResult[]>;
143
- }
144
-
145
- type EnqueueResult =
146
- | { success: true; jobId: string; isNew: true }
147
- | { success: true; jobId: string; isNew: false } // 이미 존재
148
- | { success: false; error: string };
149
- ```
150
-
151
- ### 4.2 Process (Worker)
152
-
153
- ```typescript
154
- interface VectorWorker {
155
- // pending job 가져오기 (락)
156
- claimJobs(limit: number): Promise<OutboxJob[]>;
157
-
158
- // 처리 완료 표시
159
- markDone(jobId: string): Promise<void>;
160
-
161
- // 실패 표시
162
- markFailed(jobId: string, error: string): Promise<void>;
163
-
164
- // 전체 처리 루프
165
- processAll(): Promise<ProcessResult>;
166
- }
167
-
168
- interface ProcessResult {
169
- processed: number;
170
- succeeded: number;
171
- failed: number;
172
- errors: { jobId: string; error: string }[];
173
- }
174
- ```
175
-
176
- ### 4.3 Reconcile
177
-
178
- ```typescript
179
- interface VectorOutbox {
180
- // 재시도 가능한 failed job을 pending으로 변경
181
- reconcileFailed(maxRetries: number): Promise<number>;
182
-
183
- // processing 상태로 오래 멈춘 job 복구
184
- recoverStuck(stuckThresholdMs: number): Promise<number>;
185
-
186
- // 완료된 job 정리
187
- cleanupDone(olderThanDays: number): Promise<number>;
188
- }
189
- ```
190
-
191
- ## 5. 단일 Writer 패턴
192
-
193
- ### 5.1 왜 단일 Writer인가?
194
-
195
- **문제**: 여러 프로세스가 동시에 LanceDB에 쓰면
196
- - 충돌 발생 가능
197
- - 중복 벡터 생성
198
- - 트랜잭션 보장 어려움
199
-
200
- **해결**: 하나의 worker만 LanceDB에 쓰기
201
-
202
- ```typescript
203
- // 단일 writer 보장 방법들
204
-
205
- // 방법 1: 프로세스 수준 락
206
- const lockFile = '/tmp/vector-worker.lock';
207
- if (fs.existsSync(lockFile)) {
208
- console.log('Another worker is running');
209
- process.exit(0);
210
- }
211
- fs.writeFileSync(lockFile, process.pid.toString());
212
-
213
- // 방법 2: DB 수준 락
214
- await db.run(`
215
- INSERT INTO worker_locks (worker_name, locked_at)
216
- VALUES ('vector_worker', CURRENT_TIMESTAMP)
217
- ON CONFLICT (worker_name)
218
- DO UPDATE SET locked_at = CURRENT_TIMESTAMP
219
- WHERE locked_at < datetime('now', '-5 minutes')
220
- `);
221
- ```
222
-
223
- ### 5.2 Worker 구현
224
-
225
- ```typescript
226
- class VectorWorkerImpl implements VectorWorker {
227
- private embedder: Embedder;
228
- private vectorStore: VectorStore;
229
- private db: Database;
230
-
231
- async processAll(): Promise<ProcessResult> {
232
- const result: ProcessResult = { processed: 0, succeeded: 0, failed: 0, errors: [] };
233
-
234
- while (true) {
235
- const jobs = await this.claimJobs(BATCH_SIZE);
236
- if (jobs.length === 0) break;
237
-
238
- for (const job of jobs) {
239
- try {
240
- await this.processJob(job);
241
- await this.markDone(job.jobId);
242
- result.succeeded++;
243
- } catch (error) {
244
- await this.markFailed(job.jobId, error.message);
245
- result.failed++;
246
- result.errors.push({ jobId: job.jobId, error: error.message });
247
- }
248
- result.processed++;
249
- }
250
- }
251
-
252
- return result;
253
- }
254
-
255
- private async processJob(job: OutboxJob): Promise<void> {
256
- // 1. 원본 콘텐츠 조회
257
- const content = await this.getContent(job.itemKind, job.itemId);
258
-
259
- // 2. 임베딩 생성
260
- const embedding = await this.embedder.embed(content);
261
-
262
- // 3. LanceDB upsert (idempotent)
263
- await this.vectorStore.upsert({
264
- id: job.itemId,
265
- vector: embedding,
266
- metadata: {
267
- itemKind: job.itemKind,
268
- embeddingVersion: job.embeddingVersion
269
- }
270
- });
271
- }
272
- }
273
- ```
274
-
275
- ## 6. LanceDB Upsert 전략
276
-
277
- ### 6.1 Idempotent Upsert
278
-
279
- ```typescript
280
- async function upsertVector(record: VectorRecord): Promise<void> {
281
- const table = await this.getTable(record.itemKind, record.embeddingVersion);
282
-
283
- // LanceDB에서 기존 레코드 확인
284
- const existing = await table
285
- .search([0]) // dummy search for filter
286
- .filter(`id = '${record.id}'`)
287
- .limit(1)
288
- .toArray();
289
-
290
- if (existing.length > 0) {
291
- // 업데이트: 삭제 후 재삽입
292
- await table.delete(`id = '${record.id}'`);
293
- }
294
-
295
- // 삽입
296
- await table.add([{
297
- id: record.id,
298
- vector: record.vector,
299
- content: record.content,
300
- timestamp: record.timestamp,
301
- metadata: record.metadata
302
- }]);
303
- }
304
- ```
305
-
306
- ### 6.2 테이블 버전 관리
307
-
308
- ```typescript
309
- // 임베딩 모델 버전별 테이블 분리
310
- function getTableName(itemKind: ItemKind, embeddingVersion: string): string {
311
- // entry_vectors_minilm_v2
312
- // task_title_vectors_minilm_v2
313
- const versionSlug = embeddingVersion.replace(/[^a-z0-9]/gi, '_');
314
- return `${itemKind}_vectors_${versionSlug}`;
315
- }
316
- ```
317
-
318
- ## 7. Idris2 영감 적용
319
-
320
- ### 7.1 상태 전이 타입 안전성
321
-
322
- ```typescript
323
- // 타입 레벨에서 유효한 상태 전이만 허용
324
- type ValidTransition =
325
- | { from: 'pending'; to: 'processing' }
326
- | { from: 'processing'; to: 'done' }
327
- | { from: 'processing'; to: 'failed' }
328
- | { from: 'failed'; to: 'pending' }; // retry
329
-
330
- function transition(job: OutboxJob, to: OutboxStatus): OutboxJob {
331
- const valid: ValidTransition[] = [
332
- { from: 'pending', to: 'processing' },
333
- { from: 'processing', to: 'done' },
334
- { from: 'processing', to: 'failed' },
335
- { from: 'failed', to: 'pending' }
336
- ];
337
-
338
- const isValid = valid.some(t => t.from === job.status && t.to === to);
339
- if (!isValid) {
340
- throw new InvalidTransitionError(`Cannot transition from ${job.status} to ${to}`);
341
- }
342
-
343
- return { ...job, status: to, updatedAt: new Date() };
344
- }
345
- ```
346
-
347
- ### 7.2 Idempotency 불변식
348
-
349
- ```typescript
350
- // Zod로 idempotency 검증
351
- const OutboxJobSchema = z.object({
352
- itemKind: ItemKindSchema,
353
- itemId: z.string(),
354
- embeddingVersion: z.string()
355
- }).refine(
356
- async (job) => {
357
- // 같은 조합은 하나만 존재해야 함
358
- const existing = await db.query(`
359
- SELECT COUNT(*) as cnt FROM vector_outbox
360
- WHERE item_kind = ? AND item_id = ? AND embedding_version = ?
361
- `, [job.itemKind, job.itemId, job.embeddingVersion]);
362
- return existing[0].cnt <= 1;
363
- },
364
- { message: 'Duplicate outbox job' }
365
- );
366
- ```
367
-
368
- ## 8. 기존 코드와의 관계
369
-
370
- ### 8.1 현재 vector-worker.ts
371
-
372
- ```typescript
373
- // 현재 구현 (src/core/vector-worker.ts)
374
- export class VectorWorker {
375
- // OutboxItem 타입 사용
376
- // status: 'pending' | 'processing' | 'done' | 'failed'
377
- }
378
- ```
379
-
380
- ### 8.2 V2 확장 포인트
381
-
382
- | 기존 | V2 확장 |
383
- |-----|---------|
384
- | OutboxItem 타입 | itemKind, embeddingVersion 추가 |
385
- | 단순 배치 처리 | claiming with lock |
386
- | 재시도 없음 | reconcile + retry policy |
387
- | 중복 가능 | UNIQUE 제약 + upsert |
388
-
389
- ### 8.3 현재 vector-store.ts
390
-
391
- ```typescript
392
- // 현재 구현 (src/core/vector-store.ts)
393
- export class VectorStore {
394
- async add(record: VectorRecord): Promise<void>;
395
- async search(query: number[], limit: number): Promise<SearchResult[]>;
396
- }
397
- ```
398
-
399
- V2에서 `upsert` 메서드 추가 필요.
400
-
401
- ## 9. 운영 고려사항
402
-
403
- ### 9.1 모니터링
404
-
405
- ```typescript
406
- // 메트릭 수집
407
- interface OutboxMetrics {
408
- pendingCount: number;
409
- processingCount: number;
410
- failedCount: number;
411
- doneCount: number;
412
- avgProcessingTimeMs: number;
413
- lastProcessedAt: Date | null;
414
- }
415
-
416
- async function getMetrics(): Promise<OutboxMetrics> {
417
- return db.query(`
418
- SELECT
419
- SUM(CASE WHEN status = 'pending' THEN 1 ELSE 0 END) as pendingCount,
420
- SUM(CASE WHEN status = 'processing' THEN 1 ELSE 0 END) as processingCount,
421
- SUM(CASE WHEN status = 'failed' THEN 1 ELSE 0 END) as failedCount,
422
- SUM(CASE WHEN status = 'done' THEN 1 ELSE 0 END) as doneCount,
423
- MAX(updated_at) as lastProcessedAt
424
- FROM vector_outbox
425
- `);
426
- }
427
- ```
428
-
429
- ### 9.2 알림
430
-
431
- ```typescript
432
- // failed job이 임계값 초과 시 알림
433
- const FAILED_THRESHOLD = 10;
434
-
435
- async function checkAndAlert(): Promise<void> {
436
- const metrics = await getMetrics();
437
- if (metrics.failedCount >= FAILED_THRESHOLD) {
438
- console.error(`[ALERT] ${metrics.failedCount} failed vector jobs`);
439
- // 추가 알림 로직
440
- }
441
- }
442
- ```
443
-
444
- ### 9.3 정리 작업
445
-
446
- ```typescript
447
- // 정기적으로 완료된 job 정리
448
- async function cleanup(): Promise<void> {
449
- const deleted = await db.run(`
450
- DELETE FROM vector_outbox
451
- WHERE status = 'done'
452
- AND updated_at < datetime('now', '-7 days')
453
- `);
454
- console.log(`Cleaned up ${deleted.changes} done jobs`);
455
- }
456
- ```
457
-
458
- ## 10. 성공 기준
459
-
460
- - [ ] vector_outbox 테이블 생성 및 UNIQUE 제약
461
- - [ ] enqueue가 중복을 무시하고 idempotent하게 동작
462
- - [ ] 단일 worker가 pending job을 처리
463
- - [ ] LanceDB upsert로 중복 벡터 방지
464
- - [ ] failed job 재시도 (reconcile) 동작
465
- - [ ] processing 상태 stuck 복구 동작
466
- - [ ] 기존 vector-worker.ts와 호환 유지