claude-memory-layer 1.0.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/.claude-plugin/commands/memory-forget.md +42 -0
- package/.claude-plugin/commands/memory-history.md +34 -0
- package/.claude-plugin/commands/memory-import.md +56 -0
- package/.claude-plugin/commands/memory-list.md +37 -0
- package/.claude-plugin/commands/memory-search.md +36 -0
- package/.claude-plugin/commands/memory-stats.md +34 -0
- package/.claude-plugin/hooks.json +59 -0
- package/.claude-plugin/plugin.json +24 -0
- package/.history/package_20260201112328.json +45 -0
- package/.history/package_20260201113602.json +45 -0
- package/.history/package_20260201113713.json +45 -0
- package/.history/package_20260201114110.json +45 -0
- package/Memo.txt +558 -0
- package/README.md +520 -0
- package/context.md +636 -0
- package/dist/.claude-plugin/commands/memory-forget.md +42 -0
- package/dist/.claude-plugin/commands/memory-history.md +34 -0
- package/dist/.claude-plugin/commands/memory-import.md +56 -0
- package/dist/.claude-plugin/commands/memory-list.md +37 -0
- package/dist/.claude-plugin/commands/memory-search.md +36 -0
- package/dist/.claude-plugin/commands/memory-stats.md +34 -0
- package/dist/.claude-plugin/hooks.json +59 -0
- package/dist/.claude-plugin/plugin.json +24 -0
- package/dist/cli/index.js +3539 -0
- package/dist/cli/index.js.map +7 -0
- package/dist/core/index.js +4408 -0
- package/dist/core/index.js.map +7 -0
- package/dist/hooks/session-end.js +2971 -0
- package/dist/hooks/session-end.js.map +7 -0
- package/dist/hooks/session-start.js +2969 -0
- package/dist/hooks/session-start.js.map +7 -0
- package/dist/hooks/stop.js +3123 -0
- package/dist/hooks/stop.js.map +7 -0
- package/dist/hooks/user-prompt-submit.js +2960 -0
- package/dist/hooks/user-prompt-submit.js.map +7 -0
- package/dist/services/memory-service.js +2931 -0
- package/dist/services/memory-service.js.map +7 -0
- package/package.json +45 -0
- package/plan.md +1642 -0
- package/scripts/build.ts +102 -0
- package/spec.md +624 -0
- package/specs/citations-system/context.md +243 -0
- package/specs/citations-system/plan.md +495 -0
- package/specs/citations-system/spec.md +371 -0
- package/specs/endless-mode/context.md +305 -0
- package/specs/endless-mode/plan.md +620 -0
- package/specs/endless-mode/spec.md +455 -0
- package/specs/entity-edge-model/context.md +401 -0
- package/specs/entity-edge-model/plan.md +459 -0
- package/specs/entity-edge-model/spec.md +391 -0
- package/specs/evidence-aligner-v2/context.md +401 -0
- package/specs/evidence-aligner-v2/plan.md +303 -0
- package/specs/evidence-aligner-v2/spec.md +312 -0
- package/specs/mcp-desktop-integration/context.md +278 -0
- package/specs/mcp-desktop-integration/plan.md +550 -0
- package/specs/mcp-desktop-integration/spec.md +494 -0
- package/specs/post-tool-use-hook/context.md +319 -0
- package/specs/post-tool-use-hook/plan.md +469 -0
- package/specs/post-tool-use-hook/spec.md +364 -0
- package/specs/private-tags/context.md +288 -0
- package/specs/private-tags/plan.md +412 -0
- package/specs/private-tags/spec.md +345 -0
- package/specs/progressive-disclosure/context.md +346 -0
- package/specs/progressive-disclosure/plan.md +663 -0
- package/specs/progressive-disclosure/spec.md +415 -0
- package/specs/task-entity-system/context.md +297 -0
- package/specs/task-entity-system/plan.md +301 -0
- package/specs/task-entity-system/spec.md +314 -0
- package/specs/vector-outbox-v2/context.md +470 -0
- package/specs/vector-outbox-v2/plan.md +562 -0
- package/specs/vector-outbox-v2/spec.md +466 -0
- package/specs/web-viewer-ui/context.md +384 -0
- package/specs/web-viewer-ui/plan.md +797 -0
- package/specs/web-viewer-ui/spec.md +516 -0
- package/src/cli/index.ts +570 -0
- package/src/core/canonical-key.ts +186 -0
- package/src/core/citation-generator.ts +63 -0
- package/src/core/consolidated-store.ts +279 -0
- package/src/core/consolidation-worker.ts +384 -0
- package/src/core/context-formatter.ts +276 -0
- package/src/core/continuity-manager.ts +336 -0
- package/src/core/edge-repo.ts +324 -0
- package/src/core/embedder.ts +124 -0
- package/src/core/entity-repo.ts +342 -0
- package/src/core/event-store.ts +672 -0
- package/src/core/evidence-aligner.ts +635 -0
- package/src/core/graduation.ts +365 -0
- package/src/core/index.ts +32 -0
- package/src/core/matcher.ts +210 -0
- package/src/core/metadata-extractor.ts +203 -0
- package/src/core/privacy/filter.ts +179 -0
- package/src/core/privacy/index.ts +20 -0
- package/src/core/privacy/tag-parser.ts +145 -0
- package/src/core/progressive-retriever.ts +415 -0
- package/src/core/retriever.ts +235 -0
- package/src/core/task/blocker-resolver.ts +325 -0
- package/src/core/task/index.ts +9 -0
- package/src/core/task/task-matcher.ts +238 -0
- package/src/core/task/task-projector.ts +345 -0
- package/src/core/task/task-resolver.ts +414 -0
- package/src/core/types.ts +841 -0
- package/src/core/vector-outbox.ts +295 -0
- package/src/core/vector-store.ts +182 -0
- package/src/core/vector-worker.ts +488 -0
- package/src/core/working-set-store.ts +244 -0
- package/src/hooks/post-tool-use.ts +127 -0
- package/src/hooks/session-end.ts +78 -0
- package/src/hooks/session-start.ts +57 -0
- package/src/hooks/stop.ts +78 -0
- package/src/hooks/user-prompt-submit.ts +54 -0
- package/src/mcp/handlers.ts +212 -0
- package/src/mcp/index.ts +47 -0
- package/src/mcp/tools.ts +78 -0
- package/src/server/api/citations.ts +101 -0
- package/src/server/api/events.ts +101 -0
- package/src/server/api/index.ts +18 -0
- package/src/server/api/search.ts +98 -0
- package/src/server/api/sessions.ts +111 -0
- package/src/server/api/stats.ts +97 -0
- package/src/server/index.ts +91 -0
- package/src/services/memory-service.ts +626 -0
- package/src/services/session-history-importer.ts +367 -0
- package/tests/canonical-key.test.ts +101 -0
- package/tests/evidence-aligner.test.ts +152 -0
- package/tests/matcher.test.ts +112 -0
- package/tsconfig.json +24 -0
- package/vitest.config.ts +15 -0
|
@@ -0,0 +1,466 @@
|
|
|
1
|
+
# Vector Outbox V2 Specification
|
|
2
|
+
|
|
3
|
+
> **Version**: 2.0.0
|
|
4
|
+
> **Status**: Draft
|
|
5
|
+
> **Created**: 2026-01-31
|
|
6
|
+
|
|
7
|
+
## 1. 개요
|
|
8
|
+
|
|
9
|
+
### 1.1 문제 정의
|
|
10
|
+
|
|
11
|
+
DuckDB와 LanceDB 간 데이터 정합성 문제:
|
|
12
|
+
|
|
13
|
+
1. **원자성 부재**: DuckDB 쓰기와 LanceDB 쓰기가 별도 트랜잭션
|
|
14
|
+
2. **중복 벡터**: 재처리 시 같은 벡터가 중복 저장될 수 있음
|
|
15
|
+
3. **일관성 부재**: DuckDB에는 있지만 LanceDB에는 없는 상태 발생
|
|
16
|
+
4. **동시성 충돌**: 여러 프로세스가 동시에 벡터를 저장하면 충돌 발생
|
|
17
|
+
|
|
18
|
+
### 1.2 해결 방향
|
|
19
|
+
|
|
20
|
+
**Transactional Outbox Pattern**:
|
|
21
|
+
1. DuckDB에 먼저 기록 (vector_outbox 테이블)
|
|
22
|
+
2. 단일 writer가 outbox를 처리하여 LanceDB에 upsert
|
|
23
|
+
3. 성공 시 outbox 상태 업데이트
|
|
24
|
+
|
|
25
|
+
## 2. 핵심 개념
|
|
26
|
+
|
|
27
|
+
### 2.1 Outbox 패턴 흐름
|
|
28
|
+
|
|
29
|
+
```
|
|
30
|
+
Application DuckDB LanceDB
|
|
31
|
+
│ │ │
|
|
32
|
+
│ 1. Entry 저장 │ │
|
|
33
|
+
├────────────────────────▶│ │
|
|
34
|
+
│ │ │
|
|
35
|
+
│ 2. Outbox job 생성 │ │
|
|
36
|
+
├────────────────────────▶│ │
|
|
37
|
+
│ │ │
|
|
38
|
+
│ (트랜잭션 커밋) │ │
|
|
39
|
+
│ │ │
|
|
40
|
+
┌─────┴─────┐
|
|
41
|
+
│ Worker │
|
|
42
|
+
└─────┬─────┘
|
|
43
|
+
│ │
|
|
44
|
+
│ 3. pending job 조회 │
|
|
45
|
+
│◀────────────────────────│
|
|
46
|
+
│ │
|
|
47
|
+
│ 4. 임베딩 생성 │
|
|
48
|
+
│ │
|
|
49
|
+
│ 5. LanceDB upsert │
|
|
50
|
+
│─────────────────────────▶│
|
|
51
|
+
│ │
|
|
52
|
+
│ 6. status='done' 업데이트 │
|
|
53
|
+
│────────────────────────▶│
|
|
54
|
+
```
|
|
55
|
+
|
|
56
|
+
### 2.2 Job 상태 머신
|
|
57
|
+
|
|
58
|
+
```
|
|
59
|
+
┌─────────┐ Worker 픽업 ┌────────────┐
|
|
60
|
+
│ pending │ ──────────────────▶ │ processing │
|
|
61
|
+
└─────────┘ └──────┬─────┘
|
|
62
|
+
│ │
|
|
63
|
+
│ 재시도 (reconcile) │
|
|
64
|
+
│ │
|
|
65
|
+
│ ┌───────────────────────┼───────────────────────┐
|
|
66
|
+
│ │ │ │
|
|
67
|
+
│ ▼ ▼ ▼
|
|
68
|
+
│ ┌─────────┐ ┌──────────┐ ┌─────────┐
|
|
69
|
+
└───▶│ pending │ │ done │ │ failed │
|
|
70
|
+
└─────────┘ └──────────┘ └─────────┘
|
|
71
|
+
│
|
|
72
|
+
│ retry < max
|
|
73
|
+
▼
|
|
74
|
+
┌─────────┐
|
|
75
|
+
│ pending │
|
|
76
|
+
└─────────┘
|
|
77
|
+
```
|
|
78
|
+
|
|
79
|
+
### 2.3 Item 종류
|
|
80
|
+
|
|
81
|
+
```typescript
|
|
82
|
+
type ItemKind =
|
|
83
|
+
| 'entry' // entries 테이블의 content 임베딩
|
|
84
|
+
| 'task_title' // entities 테이블의 task 제목 임베딩
|
|
85
|
+
| 'session_summary' // 세션 요약 임베딩
|
|
86
|
+
;
|
|
87
|
+
```
|
|
88
|
+
|
|
89
|
+
## 3. DB 스키마
|
|
90
|
+
|
|
91
|
+
### 3.1 vector_outbox 테이블
|
|
92
|
+
|
|
93
|
+
```sql
|
|
94
|
+
CREATE TABLE vector_outbox (
|
|
95
|
+
job_id VARCHAR PRIMARY KEY,
|
|
96
|
+
item_kind VARCHAR NOT NULL, -- entry|task_title|session_summary
|
|
97
|
+
item_id VARCHAR NOT NULL,
|
|
98
|
+
embedding_version VARCHAR NOT NULL, -- e.g., 'v1.0.0', 'minilm-v2'
|
|
99
|
+
status VARCHAR NOT NULL, -- pending|processing|done|failed
|
|
100
|
+
retry_count INTEGER DEFAULT 0,
|
|
101
|
+
error VARCHAR,
|
|
102
|
+
created_at TIMESTAMP DEFAULT CURRENT_TIMESTAMP,
|
|
103
|
+
updated_at TIMESTAMP DEFAULT CURRENT_TIMESTAMP,
|
|
104
|
+
|
|
105
|
+
-- 중복 방지: 같은 아이템+버전은 하나만
|
|
106
|
+
UNIQUE(item_kind, item_id, embedding_version)
|
|
107
|
+
);
|
|
108
|
+
|
|
109
|
+
CREATE INDEX idx_outbox_status ON vector_outbox(status);
|
|
110
|
+
CREATE INDEX idx_outbox_created ON vector_outbox(created_at);
|
|
111
|
+
```
|
|
112
|
+
|
|
113
|
+
### 3.2 vector_store_meta 테이블 (선택)
|
|
114
|
+
|
|
115
|
+
```sql
|
|
116
|
+
-- LanceDB 테이블 메타데이터 추적
|
|
117
|
+
CREATE TABLE vector_store_meta (
|
|
118
|
+
table_name VARCHAR PRIMARY KEY, -- e.g., 'entry_vectors_v1'
|
|
119
|
+
embedding_version VARCHAR NOT NULL,
|
|
120
|
+
item_count INTEGER DEFAULT 0,
|
|
121
|
+
last_sync_at TIMESTAMP,
|
|
122
|
+
created_at TIMESTAMP DEFAULT CURRENT_TIMESTAMP
|
|
123
|
+
);
|
|
124
|
+
```
|
|
125
|
+
|
|
126
|
+
## 4. Outbox API
|
|
127
|
+
|
|
128
|
+
### 4.1 Enqueue
|
|
129
|
+
|
|
130
|
+
```typescript
|
|
131
|
+
interface OutboxEnqueueInput {
|
|
132
|
+
itemKind: ItemKind;
|
|
133
|
+
itemId: string;
|
|
134
|
+
embeddingVersion: string;
|
|
135
|
+
}
|
|
136
|
+
|
|
137
|
+
interface VectorOutbox {
|
|
138
|
+
// Job 추가 (중복 시 무시)
|
|
139
|
+
enqueue(input: OutboxEnqueueInput): Promise<EnqueueResult>;
|
|
140
|
+
|
|
141
|
+
// 배치 추가
|
|
142
|
+
enqueueBatch(inputs: OutboxEnqueueInput[]): Promise<EnqueueResult[]>;
|
|
143
|
+
}
|
|
144
|
+
|
|
145
|
+
type EnqueueResult =
|
|
146
|
+
| { success: true; jobId: string; isNew: true }
|
|
147
|
+
| { success: true; jobId: string; isNew: false } // 이미 존재
|
|
148
|
+
| { success: false; error: string };
|
|
149
|
+
```
|
|
150
|
+
|
|
151
|
+
### 4.2 Process (Worker)
|
|
152
|
+
|
|
153
|
+
```typescript
|
|
154
|
+
interface VectorWorker {
|
|
155
|
+
// pending job 가져오기 (락)
|
|
156
|
+
claimJobs(limit: number): Promise<OutboxJob[]>;
|
|
157
|
+
|
|
158
|
+
// 처리 완료 표시
|
|
159
|
+
markDone(jobId: string): Promise<void>;
|
|
160
|
+
|
|
161
|
+
// 실패 표시
|
|
162
|
+
markFailed(jobId: string, error: string): Promise<void>;
|
|
163
|
+
|
|
164
|
+
// 전체 처리 루프
|
|
165
|
+
processAll(): Promise<ProcessResult>;
|
|
166
|
+
}
|
|
167
|
+
|
|
168
|
+
interface ProcessResult {
|
|
169
|
+
processed: number;
|
|
170
|
+
succeeded: number;
|
|
171
|
+
failed: number;
|
|
172
|
+
errors: { jobId: string; error: string }[];
|
|
173
|
+
}
|
|
174
|
+
```
|
|
175
|
+
|
|
176
|
+
### 4.3 Reconcile
|
|
177
|
+
|
|
178
|
+
```typescript
|
|
179
|
+
interface VectorOutbox {
|
|
180
|
+
// 재시도 가능한 failed job을 pending으로 변경
|
|
181
|
+
reconcileFailed(maxRetries: number): Promise<number>;
|
|
182
|
+
|
|
183
|
+
// processing 상태로 오래 멈춘 job 복구
|
|
184
|
+
recoverStuck(stuckThresholdMs: number): Promise<number>;
|
|
185
|
+
|
|
186
|
+
// 완료된 job 정리
|
|
187
|
+
cleanupDone(olderThanDays: number): Promise<number>;
|
|
188
|
+
}
|
|
189
|
+
```
|
|
190
|
+
|
|
191
|
+
## 5. 단일 Writer 패턴
|
|
192
|
+
|
|
193
|
+
### 5.1 왜 단일 Writer인가?
|
|
194
|
+
|
|
195
|
+
**문제**: 여러 프로세스가 동시에 LanceDB에 쓰면
|
|
196
|
+
- 충돌 발생 가능
|
|
197
|
+
- 중복 벡터 생성
|
|
198
|
+
- 트랜잭션 보장 어려움
|
|
199
|
+
|
|
200
|
+
**해결**: 하나의 worker만 LanceDB에 쓰기
|
|
201
|
+
|
|
202
|
+
```typescript
|
|
203
|
+
// Ways to guarantee a single writer.

// Option 1: process-level lock file.
// The exclusive 'wx' flag makes "check that no lock exists" and "create the
// lock" one atomic step, so two workers starting at the same moment cannot
// both acquire it (a separate existsSync + writeFileSync pair can race).
const lockFile = '/tmp/vector-worker.lock';
try {
  fs.writeFileSync(lockFile, process.pid.toString(), { flag: 'wx' });
} catch (err: unknown) {
  const alreadyLocked =
    typeof err === 'object' && err !== null && 'code' in err && err.code === 'EEXIST';
  if (!alreadyLocked) throw err;
  console.log('Another worker is running');
  process.exit(0);
}
// Release the lock when this worker exits; otherwise the first run would
// block every later run forever. Registered only after the lock was acquired,
// so a worker that lost the race never deletes the winner's lock.
// NOTE(review): a hard kill (SIGKILL, power loss) still leaves a stale file;
// the PID stored in it can be used to detect that case.
process.once('exit', () => {
  try {
    fs.unlinkSync(lockFile);
  } catch {
    // Lock file already removed; nothing left to release.
  }
});

// Option 2: DB-level lock.
// The row is taken over only when the previous holder's timestamp is older
// than five minutes. DuckDB interval arithmetic is used here; SQLite's
// datetime('now', '-5 minutes') form is not valid DuckDB SQL.
// NOTE(review): this statement alone does not tell the caller whether the
// lock was actually acquired — confirm how the caller checks ownership.
await db.run(`
  INSERT INTO worker_locks (worker_name, locked_at)
  VALUES ('vector_worker', CURRENT_TIMESTAMP)
  ON CONFLICT (worker_name)
  DO UPDATE SET locked_at = CURRENT_TIMESTAMP
  WHERE locked_at < CURRENT_TIMESTAMP - INTERVAL '5 minutes'
`);
|
|
221
|
+
```
|
|
222
|
+
|
|
223
|
+
### 5.2 Worker 구현
|
|
224
|
+
|
|
225
|
+
```typescript
|
|
226
|
+
/**
 * Sketch of the single-writer worker that drains the vector outbox.
 *
 * Only `processAll` and `processJob` are spelled out here; `claimJobs`,
 * `markDone`, `markFailed` and `getContent` are called but not shown in this
 * snippet.
 */
class VectorWorkerImpl implements VectorWorker {
  private embedder: Embedder;
  private vectorStore: VectorStore;
  private db: Database;

  /**
   * Claims jobs in batches of `BATCH_SIZE` until a claim returns no jobs,
   * processing each job in turn.
   *
   * A job that throws is marked failed and recorded in `errors`; the loop then
   * continues with the next job.
   *
   * @returns Counters for processed / succeeded / failed jobs plus the
   *          per-job error messages.
   */
  async processAll(): Promise<ProcessResult> {
    const result: ProcessResult = { processed: 0, succeeded: 0, failed: 0, errors: [] };

    while (true) {
      const jobs = await this.claimJobs(BATCH_SIZE);
      if (jobs.length === 0) break;

      for (const job of jobs) {
        try {
          await this.processJob(job);
          await this.markDone(job.jobId);
          result.succeeded++;
        } catch (error: unknown) {
          // A thrown value is not guaranteed to be an Error; narrow it so the
          // stored failure reason is never `undefined`.
          const message = error instanceof Error ? error.message : String(error);
          await this.markFailed(job.jobId, message);
          result.failed++;
          result.errors.push({ jobId: job.jobId, error: message });
        }
        result.processed++;
      }
    }

    return result;
  }

  /**
   * Handles one outbox job: loads the source content, embeds it, and upserts
   * the vector under the job's item id.
   *
   * @param job The claimed outbox job.
   */
  private async processJob(job: OutboxJob): Promise<void> {
    // 1. Load the original content for this item.
    const content = await this.getContent(job.itemKind, job.itemId);

    // 2. Generate the embedding.
    const embedding = await this.embedder.embed(content);

    // 3. Upsert into LanceDB, keyed by item id so a retry overwrites rather
    //    than duplicates (intended to be idempotent).
    await this.vectorStore.upsert({
      id: job.itemId,
      vector: embedding,
      metadata: {
        itemKind: job.itemKind,
        embeddingVersion: job.embeddingVersion
      }
    });
  }
}
|
|
273
|
+
```
|
|
274
|
+
|
|
275
|
+
## 6. LanceDB Upsert 전략
|
|
276
|
+
|
|
277
|
+
### 6.1 Idempotent Upsert
|
|
278
|
+
|
|
279
|
+
```typescript
|
|
280
|
+
/**
 * Writes one vector record so that at most one row per `id` exists in the
 * table for the record's item kind and embedding version.
 *
 * Any existing row with the same id is deleted, then the record is added.
 * The delete is issued unconditionally: no prior lookup is needed, and a
 * vector search with a placeholder query vector is not a reliable existence
 * check.
 *
 * NOTE(review): relies on `this.getTable`, so this is presumably meant to be a
 * VectorStore method rather than a free function — confirm.
 * NOTE(review): delete + add is two operations, not one atomic step; if the
 * installed LanceDB client offers a merge-insert API, prefer it.
 *
 * @param record The vector record to store; `record.id` is the upsert key.
 */
async function upsertVector(record: VectorRecord): Promise<void> {
  const table = await this.getTable(record.itemKind, record.embeddingVersion);

  // Double any single quote so an id such as "it's" cannot terminate the SQL
  // string literal early and corrupt (or widen) the delete predicate.
  const escapedId = String(record.id).replace(/'/g, "''");
  await table.delete(`id = '${escapedId}'`);

  await table.add([{
    id: record.id,
    vector: record.vector,
    content: record.content,
    timestamp: record.timestamp,
    metadata: record.metadata
  }]);
}
|
|
304
|
+
```
|
|
305
|
+
|
|
306
|
+
### 6.2 테이블 버전 관리
|
|
307
|
+
|
|
308
|
+
```typescript
|
|
309
|
+
/**
 * Builds the vector table name for one item kind and embedding version, so
 * that vectors from different embedding models are kept in separate tables.
 *
 * Every character of `embeddingVersion` outside `[A-Za-z0-9]` is replaced by
 * `_`, for example:
 *   ('entry', 'minilm-v2')      -> 'entry_vectors_minilm_v2'
 *   ('task_title', 'minilm-v2') -> 'task_title_vectors_minilm_v2'
 *
 * @param itemKind         Kind of item whose vectors the table holds.
 * @param embeddingVersion Embedding model/version label, e.g. 'minilm-v2'.
 * @returns The table name `<itemKind>_vectors_<versionSlug>`.
 * @throws {Error} If `embeddingVersion` contains no letter or digit; the slug
 *         would then carry no version information at all.
 */
function getTableName(itemKind: ItemKind, embeddingVersion: string): string {
  if (!/[a-z0-9]/i.test(embeddingVersion)) {
    throw new Error(`Invalid embedding version: ${JSON.stringify(embeddingVersion)}`);
  }
  const versionSlug = embeddingVersion.replace(/[^a-z0-9]/gi, '_');
  return `${itemKind}_vectors_${versionSlug}`;
}
|
|
316
|
+
```
|
|
317
|
+
|
|
318
|
+
## 7. Idris2 영감 적용
|
|
319
|
+
|
|
320
|
+
### 7.1 상태 전이 타입 안전성
|
|
321
|
+
|
|
322
|
+
```typescript
|
|
323
|
+
/**
 * The status changes an outbox job is allowed to make.
 *
 * The union documents the allowed pairs; the actual enforcement happens at
 * runtime inside `transition`.
 */
type ValidTransition =
  | { from: 'pending'; to: 'processing' }
  | { from: 'processing'; to: 'done' }
  | { from: 'processing'; to: 'failed' }
  | { from: 'processing'; to: 'pending' } // recovery of a job stuck in processing
  | { from: 'failed'; to: 'pending' }; // retry

// Built once instead of on every call to `transition`.
const VALID_TRANSITIONS: readonly ValidTransition[] = [
  { from: 'pending', to: 'processing' },
  { from: 'processing', to: 'done' },
  { from: 'processing', to: 'failed' },
  { from: 'processing', to: 'pending' },
  { from: 'failed', to: 'pending' }
];

/**
 * Returns a copy of `job` moved to status `to`, with `updatedAt` refreshed.
 * The input job is not modified.
 *
 * @param job The job to move.
 * @param to  The target status.
 * @returns A new job object carrying the new status.
 * @throws {InvalidTransitionError} If `job.status -> to` is not one of the
 *         allowed transitions.
 */
function transition(job: OutboxJob, to: OutboxStatus): OutboxJob {
  const isValid = VALID_TRANSITIONS.some(t => t.from === job.status && t.to === to);
  if (!isValid) {
    throw new InvalidTransitionError(`Cannot transition from ${job.status} to ${to}`);
  }

  return { ...job, status: to, updatedAt: new Date() };
}
|
|
345
|
+
```
|
|
346
|
+
|
|
347
|
+
### 7.2 Idempotency 불변식
|
|
348
|
+
|
|
349
|
+
```typescript
|
|
350
|
+
// Zod로 idempotency 검증
|
|
351
|
+
const OutboxJobSchema = z.object({
|
|
352
|
+
itemKind: ItemKindSchema,
|
|
353
|
+
itemId: z.string(),
|
|
354
|
+
embeddingVersion: z.string()
|
|
355
|
+
}).refine(
|
|
356
|
+
async (job) => {
|
|
357
|
+
// 같은 조합은 하나만 존재해야 함
|
|
358
|
+
const existing = await db.query(`
|
|
359
|
+
SELECT COUNT(*) as cnt FROM vector_outbox
|
|
360
|
+
WHERE item_kind = ? AND item_id = ? AND embedding_version = ?
|
|
361
|
+
`, [job.itemKind, job.itemId, job.embeddingVersion]);
|
|
362
|
+
return existing[0].cnt <= 1;
|
|
363
|
+
},
|
|
364
|
+
{ message: 'Duplicate outbox job' }
|
|
365
|
+
);
|
|
366
|
+
```
|
|
367
|
+
|
|
368
|
+
## 8. 기존 코드와의 관계
|
|
369
|
+
|
|
370
|
+
### 8.1 현재 vector-worker.ts
|
|
371
|
+
|
|
372
|
+
```typescript
|
|
373
|
+
// 현재 구현 (src/core/vector-worker.ts)
|
|
374
|
+
export class VectorWorker {
|
|
375
|
+
// OutboxItem 타입 사용
|
|
376
|
+
// status: 'pending' | 'processing' | 'done' | 'failed'
|
|
377
|
+
}
|
|
378
|
+
```
|
|
379
|
+
|
|
380
|
+
### 8.2 V2 확장 포인트
|
|
381
|
+
|
|
382
|
+
| 기존 | V2 확장 |
|
|
383
|
+
|-----|---------|
|
|
384
|
+
| OutboxItem 타입 | itemKind, embeddingVersion 추가 |
|
|
385
|
+
| 단순 배치 처리 | claiming with lock |
|
|
386
|
+
| 재시도 없음 | reconcile + retry policy |
|
|
387
|
+
| 중복 가능 | UNIQUE 제약 + upsert |
|
|
388
|
+
|
|
389
|
+
### 8.3 현재 vector-store.ts
|
|
390
|
+
|
|
391
|
+
```typescript
|
|
392
|
+
// 현재 구현 (src/core/vector-store.ts)
|
|
393
|
+
export class VectorStore {
|
|
394
|
+
async add(record: VectorRecord): Promise<void>;
|
|
395
|
+
async search(query: number[], limit: number): Promise<SearchResult[]>;
|
|
396
|
+
}
|
|
397
|
+
```
|
|
398
|
+
|
|
399
|
+
V2에서 `upsert` 메서드 추가 필요.
|
|
400
|
+
|
|
401
|
+
## 9. 운영 고려사항
|
|
402
|
+
|
|
403
|
+
### 9.1 모니터링
|
|
404
|
+
|
|
405
|
+
```typescript
|
|
406
|
+
// 메트릭 수집
|
|
407
|
+
interface OutboxMetrics {
|
|
408
|
+
pendingCount: number;
|
|
409
|
+
processingCount: number;
|
|
410
|
+
failedCount: number;
|
|
411
|
+
doneCount: number;
|
|
412
|
+
avgProcessingTimeMs: number;
|
|
413
|
+
lastProcessedAt: Date | null;
|
|
414
|
+
}
|
|
415
|
+
|
|
416
|
+
/**
 * Collects per-status job counts and timing figures from `vector_outbox`.
 *
 * The aggregate query yields a single row. That row is unpacked into an
 * `OutboxMetrics` object instead of handing the raw row array to the caller.
 * Counts default to 0 because `SUM` over an empty table is NULL.
 *
 * NOTE(review): the table has no "processing started" column, so
 * `avgProcessingTimeMs` is approximated as the average of
 * `updated_at - created_at` over done jobs (enqueue-to-completion time).
 * Replace it once a real start timestamp is recorded.
 *
 * @returns The current outbox metrics; `lastProcessedAt` is null when the
 *          table is empty.
 */
async function getMetrics(): Promise<OutboxMetrics> {
  const rows = await db.query(`
    SELECT
      SUM(CASE WHEN status = 'pending' THEN 1 ELSE 0 END) as pendingCount,
      SUM(CASE WHEN status = 'processing' THEN 1 ELSE 0 END) as processingCount,
      SUM(CASE WHEN status = 'failed' THEN 1 ELSE 0 END) as failedCount,
      SUM(CASE WHEN status = 'done' THEN 1 ELSE 0 END) as doneCount,
      AVG(CASE WHEN status = 'done'
               THEN date_diff('millisecond', created_at, updated_at) END) as avgProcessingTimeMs,
      MAX(updated_at) as lastProcessedAt
    FROM vector_outbox
  `);

  const row = rows[0] ?? {};
  // Number(...) also normalises integer aggregates that a driver may return
  // as BigInt.
  return {
    pendingCount: Number(row.pendingCount ?? 0),
    processingCount: Number(row.processingCount ?? 0),
    failedCount: Number(row.failedCount ?? 0),
    doneCount: Number(row.doneCount ?? 0),
    avgProcessingTimeMs: Number(row.avgProcessingTimeMs ?? 0),
    lastProcessedAt: row.lastProcessedAt != null ? new Date(row.lastProcessedAt) : null
  };
}
|
|
427
|
+
```
|
|
428
|
+
|
|
429
|
+
### 9.2 알림
|
|
430
|
+
|
|
431
|
+
```typescript
|
|
432
|
+
// failed job이 임계값 초과 시 알림
|
|
433
|
+
const FAILED_THRESHOLD = 10;
|
|
434
|
+
|
|
435
|
+
async function checkAndAlert(): Promise<void> {
|
|
436
|
+
const metrics = await getMetrics();
|
|
437
|
+
if (metrics.failedCount >= FAILED_THRESHOLD) {
|
|
438
|
+
console.error(`[ALERT] ${metrics.failedCount} failed vector jobs`);
|
|
439
|
+
// 추가 알림 로직
|
|
440
|
+
}
|
|
441
|
+
}
|
|
442
|
+
```
|
|
443
|
+
|
|
444
|
+
### 9.3 정리 작업
|
|
445
|
+
|
|
446
|
+
```typescript
|
|
447
|
+
/**
 * Periodic housekeeping: deletes `done` outbox jobs whose `updated_at` is
 * older than the retention window, then logs how many were removed.
 *
 * The cutoff uses DuckDB interval arithmetic; SQLite's
 * `datetime('now', '-7 days')` form is not valid DuckDB SQL.
 *
 * NOTE(review): `deleted.changes` assumes the `db.run` result exposes an
 * affected-row count under that name — confirm against the Database wrapper.
 *
 * @param olderThanDays Retention window in whole days (default 7).
 * @throws {RangeError} If `olderThanDays` is not a non-negative integer. The
 *         value is placed directly in the SQL text, so it is validated first.
 */
async function cleanup(olderThanDays = 7): Promise<void> {
  if (!Number.isInteger(olderThanDays) || olderThanDays < 0) {
    throw new RangeError(`olderThanDays must be a non-negative integer, got ${olderThanDays}`);
  }

  const deleted = await db.run(`
    DELETE FROM vector_outbox
    WHERE status = 'done'
      AND updated_at < CURRENT_TIMESTAMP - INTERVAL '${olderThanDays} days'
  `);
  console.log(`Cleaned up ${deleted.changes} done jobs`);
}
|
|
456
|
+
```
|
|
457
|
+
|
|
458
|
+
## 10. 성공 기준
|
|
459
|
+
|
|
460
|
+
- [ ] vector_outbox 테이블 생성 및 UNIQUE 제약
|
|
461
|
+
- [ ] enqueue가 중복을 무시하고 idempotent하게 동작
|
|
462
|
+
- [ ] 단일 worker가 pending job을 처리
|
|
463
|
+
- [ ] LanceDB upsert로 중복 벡터 방지
|
|
464
|
+
- [ ] failed job 재시도 (reconcile) 동작
|
|
465
|
+
- [ ] processing 상태 stuck 복구 동작
|
|
466
|
+
- [ ] 기존 vector-worker.ts와 호환 유지
|