claude-memory-layer 1.0.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/.claude-plugin/commands/memory-forget.md +42 -0
- package/.claude-plugin/commands/memory-history.md +34 -0
- package/.claude-plugin/commands/memory-import.md +56 -0
- package/.claude-plugin/commands/memory-list.md +37 -0
- package/.claude-plugin/commands/memory-search.md +36 -0
- package/.claude-plugin/commands/memory-stats.md +34 -0
- package/.claude-plugin/hooks.json +59 -0
- package/.claude-plugin/plugin.json +24 -0
- package/.history/package_20260201112328.json +45 -0
- package/.history/package_20260201113602.json +45 -0
- package/.history/package_20260201113713.json +45 -0
- package/.history/package_20260201114110.json +45 -0
- package/Memo.txt +558 -0
- package/README.md +520 -0
- package/context.md +636 -0
- package/dist/.claude-plugin/commands/memory-forget.md +42 -0
- package/dist/.claude-plugin/commands/memory-history.md +34 -0
- package/dist/.claude-plugin/commands/memory-import.md +56 -0
- package/dist/.claude-plugin/commands/memory-list.md +37 -0
- package/dist/.claude-plugin/commands/memory-search.md +36 -0
- package/dist/.claude-plugin/commands/memory-stats.md +34 -0
- package/dist/.claude-plugin/hooks.json +59 -0
- package/dist/.claude-plugin/plugin.json +24 -0
- package/dist/cli/index.js +3539 -0
- package/dist/cli/index.js.map +7 -0
- package/dist/core/index.js +4408 -0
- package/dist/core/index.js.map +7 -0
- package/dist/hooks/session-end.js +2971 -0
- package/dist/hooks/session-end.js.map +7 -0
- package/dist/hooks/session-start.js +2969 -0
- package/dist/hooks/session-start.js.map +7 -0
- package/dist/hooks/stop.js +3123 -0
- package/dist/hooks/stop.js.map +7 -0
- package/dist/hooks/user-prompt-submit.js +2960 -0
- package/dist/hooks/user-prompt-submit.js.map +7 -0
- package/dist/services/memory-service.js +2931 -0
- package/dist/services/memory-service.js.map +7 -0
- package/package.json +45 -0
- package/plan.md +1642 -0
- package/scripts/build.ts +102 -0
- package/spec.md +624 -0
- package/specs/citations-system/context.md +243 -0
- package/specs/citations-system/plan.md +495 -0
- package/specs/citations-system/spec.md +371 -0
- package/specs/endless-mode/context.md +305 -0
- package/specs/endless-mode/plan.md +620 -0
- package/specs/endless-mode/spec.md +455 -0
- package/specs/entity-edge-model/context.md +401 -0
- package/specs/entity-edge-model/plan.md +459 -0
- package/specs/entity-edge-model/spec.md +391 -0
- package/specs/evidence-aligner-v2/context.md +401 -0
- package/specs/evidence-aligner-v2/plan.md +303 -0
- package/specs/evidence-aligner-v2/spec.md +312 -0
- package/specs/mcp-desktop-integration/context.md +278 -0
- package/specs/mcp-desktop-integration/plan.md +550 -0
- package/specs/mcp-desktop-integration/spec.md +494 -0
- package/specs/post-tool-use-hook/context.md +319 -0
- package/specs/post-tool-use-hook/plan.md +469 -0
- package/specs/post-tool-use-hook/spec.md +364 -0
- package/specs/private-tags/context.md +288 -0
- package/specs/private-tags/plan.md +412 -0
- package/specs/private-tags/spec.md +345 -0
- package/specs/progressive-disclosure/context.md +346 -0
- package/specs/progressive-disclosure/plan.md +663 -0
- package/specs/progressive-disclosure/spec.md +415 -0
- package/specs/task-entity-system/context.md +297 -0
- package/specs/task-entity-system/plan.md +301 -0
- package/specs/task-entity-system/spec.md +314 -0
- package/specs/vector-outbox-v2/context.md +470 -0
- package/specs/vector-outbox-v2/plan.md +562 -0
- package/specs/vector-outbox-v2/spec.md +466 -0
- package/specs/web-viewer-ui/context.md +384 -0
- package/specs/web-viewer-ui/plan.md +797 -0
- package/specs/web-viewer-ui/spec.md +516 -0
- package/src/cli/index.ts +570 -0
- package/src/core/canonical-key.ts +186 -0
- package/src/core/citation-generator.ts +63 -0
- package/src/core/consolidated-store.ts +279 -0
- package/src/core/consolidation-worker.ts +384 -0
- package/src/core/context-formatter.ts +276 -0
- package/src/core/continuity-manager.ts +336 -0
- package/src/core/edge-repo.ts +324 -0
- package/src/core/embedder.ts +124 -0
- package/src/core/entity-repo.ts +342 -0
- package/src/core/event-store.ts +672 -0
- package/src/core/evidence-aligner.ts +635 -0
- package/src/core/graduation.ts +365 -0
- package/src/core/index.ts +32 -0
- package/src/core/matcher.ts +210 -0
- package/src/core/metadata-extractor.ts +203 -0
- package/src/core/privacy/filter.ts +179 -0
- package/src/core/privacy/index.ts +20 -0
- package/src/core/privacy/tag-parser.ts +145 -0
- package/src/core/progressive-retriever.ts +415 -0
- package/src/core/retriever.ts +235 -0
- package/src/core/task/blocker-resolver.ts +325 -0
- package/src/core/task/index.ts +9 -0
- package/src/core/task/task-matcher.ts +238 -0
- package/src/core/task/task-projector.ts +345 -0
- package/src/core/task/task-resolver.ts +414 -0
- package/src/core/types.ts +841 -0
- package/src/core/vector-outbox.ts +295 -0
- package/src/core/vector-store.ts +182 -0
- package/src/core/vector-worker.ts +488 -0
- package/src/core/working-set-store.ts +244 -0
- package/src/hooks/post-tool-use.ts +127 -0
- package/src/hooks/session-end.ts +78 -0
- package/src/hooks/session-start.ts +57 -0
- package/src/hooks/stop.ts +78 -0
- package/src/hooks/user-prompt-submit.ts +54 -0
- package/src/mcp/handlers.ts +212 -0
- package/src/mcp/index.ts +47 -0
- package/src/mcp/tools.ts +78 -0
- package/src/server/api/citations.ts +101 -0
- package/src/server/api/events.ts +101 -0
- package/src/server/api/index.ts +18 -0
- package/src/server/api/search.ts +98 -0
- package/src/server/api/sessions.ts +111 -0
- package/src/server/api/stats.ts +97 -0
- package/src/server/index.ts +91 -0
- package/src/services/memory-service.ts +626 -0
- package/src/services/session-history-importer.ts +367 -0
- package/tests/canonical-key.test.ts +101 -0
- package/tests/evidence-aligner.test.ts +152 -0
- package/tests/matcher.test.ts +112 -0
- package/tsconfig.json +24 -0
- package/vitest.config.ts +15 -0
|
@@ -0,0 +1,470 @@
|
|
|
1
|
+
# Vector Outbox V2 Context
|
|
2
|
+
|
|
3
|
+
> **Version**: 2.0.0
|
|
4
|
+
> **Created**: 2026-01-31
|
|
5
|
+
|
|
6
|
+
## 1. 배경
|
|
7
|
+
|
|
8
|
+
### 1.1 분산 시스템의 정합성 문제
|
|
9
|
+
|
|
10
|
+
두 개의 서로 다른 저장소(DuckDB, LanceDB)에 데이터를 저장할 때:
|
|
11
|
+
|
|
12
|
+
```
|
|
13
|
+
Application
|
|
14
|
+
│
|
|
15
|
+
├──▶ DuckDB (entries 저장) ✓
|
|
16
|
+
│
|
|
17
|
+
└──▶ LanceDB (벡터 저장) ✗ (실패)
|
|
18
|
+
|
|
19
|
+
결과: DuckDB에는 있지만 LanceDB에는 없는 불일치 상태
|
|
20
|
+
```
|
|
21
|
+
|
|
22
|
+
**문제 시나리오**:
|
|
23
|
+
1. Entry가 저장되었지만 임베딩이 실패
|
|
24
|
+
2. 재시작 시 어떤 entry가 임베딩되지 않았는지 알 수 없음
|
|
25
|
+
3. 검색 결과에서 해당 entry가 누락
|
|
26
|
+
|
|
27
|
+
### 1.2 Transactional Outbox Pattern
|
|
28
|
+
|
|
29
|
+
마이크로서비스 아키텍처에서 검증된 패턴:
|
|
30
|
+
|
|
31
|
+
```
|
|
32
|
+
┌─────────────────────────────────────┐
|
|
33
|
+
│ DuckDB Transaction │
|
|
34
|
+
│ │
|
|
35
|
+
│ 1. INSERT INTO entries (...) │
|
|
36
|
+
│ 2. INSERT INTO vector_outbox (...) │
|
|
37
|
+
│ │
|
|
38
|
+
│ COMMIT │
|
|
39
|
+
└─────────────────────────────────────┘
|
|
40
|
+
│
|
|
41
|
+
│ (비동기)
|
|
42
|
+
▼
|
|
43
|
+
┌─────────────────────────────────────┐
|
|
44
|
+
│ Vector Worker │
|
|
45
|
+
│ │
|
|
46
|
+
│ 1. SELECT * FROM vector_outbox │
|
|
47
|
+
│ WHERE status = 'pending' │
|
|
48
|
+
│ 2. Generate embedding │
|
|
49
|
+
│ 3. Upsert to LanceDB │
|
|
50
|
+
│ 4. UPDATE status = 'done' │
|
|
51
|
+
└─────────────────────────────────────┘
|
|
52
|
+
```
|
|
53
|
+
|
|
54
|
+
**장점**:
|
|
55
|
+
- 원자성 보장 (DuckDB 트랜잭션 내)
|
|
56
|
+
- 실패 시 재시도 가능
|
|
57
|
+
- 상태 추적 가능
|
|
58
|
+
|
|
59
|
+
## 2. Memo.txt 참고 사항
|
|
60
|
+
|
|
61
|
+
### 2.1 핵심 원칙 (섹션 2.6)
|
|
62
|
+
|
|
63
|
+
> **6. Vector store 정합성**
|
|
64
|
+
> - DuckDB에 먼저 기록 → outbox → 단일 writer가 LanceDB에 upsert → DuckDB 상태 업데이트
|
|
65
|
+
|
|
66
|
+
### 2.2 스키마 (섹션 4.4)
|
|
67
|
+
|
|
68
|
+
```sql
|
|
69
|
+
CREATE TABLE vector_outbox (
|
|
70
|
+
job_id VARCHAR PRIMARY KEY,
|
|
71
|
+
item_kind VARCHAR NOT NULL, -- entry|task_title
|
|
72
|
+
item_id VARCHAR NOT NULL,
|
|
73
|
+
embedding_version VARCHAR NOT NULL,
|
|
74
|
+
status VARCHAR NOT NULL, -- pending|done|failed
|
|
75
|
+
error VARCHAR,
|
|
76
|
+
created_at TIMESTAMP DEFAULT CURRENT_TIMESTAMP,
|
|
77
|
+
updated_at TIMESTAMP DEFAULT CURRENT_TIMESTAMP,
|
|
78
|
+
UNIQUE(item_kind, item_id, embedding_version)
|
|
79
|
+
);
|
|
80
|
+
```
|
|
81
|
+
|
|
82
|
+
### 2.3 Worker 지시 (섹션 8)
|
|
83
|
+
|
|
84
|
+
**Outbox enqueue**:
|
|
85
|
+
- entry materialized 시: `item_kind='entry'`
|
|
86
|
+
- task_created/task_title_changed 시: `item_kind='task_title'`
|
|
87
|
+
|
|
88
|
+
**Single writer worker**:
|
|
89
|
+
- pending 배치 처리
|
|
90
|
+
- LanceDB **idempotent upsert**
|
|
91
|
+
- 같은 id는 중복 row가 쌓이지 않게
|
|
92
|
+
|
|
93
|
+
**reconcile()**:
|
|
94
|
+
- pending 재처리
|
|
95
|
+
- failed는 재시도 정책
|
|
96
|
+
|
|
97
|
+
## 3. Idris2 영감 적용
|
|
98
|
+
|
|
99
|
+
### 3.1 상태 머신 타입 안전성
|
|
100
|
+
|
|
101
|
+
**Idris2 개념**:
|
|
102
|
+
```idris
|
|
103
|
+
-- 상태 전이가 타입 수준에서 정의됨
|
|
104
|
+
data OutboxState = Pending | Processing | Done | Failed
|
|
105
|
+
|
|
106
|
+
data Transition : OutboxState -> OutboxState -> Type where
|
|
107
|
+
Claim : Transition Pending Processing
|
|
108
|
+
Complete : Transition Processing Done
|
|
109
|
+
Fail : Transition Processing Failed
|
|
110
|
+
Retry : Transition Failed Pending
|
|
111
|
+
```
|
|
112
|
+
|
|
113
|
+
**TypeScript 적용**:
|
|
114
|
+
```typescript
|
|
115
|
+
// 유효한 전이만 타입으로 정의
|
|
116
|
+
type ValidTransition =
|
|
117
|
+
| { from: 'pending'; to: 'processing' }
|
|
118
|
+
| { from: 'processing'; to: 'done' }
|
|
119
|
+
| { from: 'processing'; to: 'failed' }
|
|
120
|
+
| { from: 'failed'; to: 'pending' };
|
|
121
|
+
|
|
122
|
+
// 런타임 검증
|
|
123
|
+
function assertValidTransition(from: OutboxStatus, to: OutboxStatus): void {
|
|
124
|
+
const valid: ValidTransition[] = [...];
|
|
125
|
+
if (!valid.some(t => t.from === from && t.to === to)) {
|
|
126
|
+
throw new Error(`Invalid transition: ${from} → ${to}`);
|
|
127
|
+
}
|
|
128
|
+
}
|
|
129
|
+
```
|
|
130
|
+
|
|
131
|
+
### 3.2 Idempotency 증명
|
|
132
|
+
|
|
133
|
+
**Idris2 개념**:
|
|
134
|
+
```idris
|
|
135
|
+
-- 멱등성: 함수를 두 번 적용해도 한 번 적용한 결과와 같음
|
|
136
|
+
idempotent : (f : a -> a) -> Type
|
|
137
|
+
idempotent f = (x : a) -> f (f x) = f x
|
|
138
|
+
```
|
|
139
|
+
|
|
140
|
+
**TypeScript 적용**:
|
|
141
|
+
```typescript
|
|
142
|
+
// UNIQUE 제약으로 idempotency 보장
|
|
143
|
+
const UNIQUE_CONSTRAINT = `
|
|
144
|
+
UNIQUE(item_kind, item_id, embedding_version)
|
|
145
|
+
`;
|
|
146
|
+
|
|
147
|
+
// enqueue는 여러 번 호출해도 같은 결과
|
|
148
|
+
async function enqueue(input: EnqueueInput): Promise<EnqueueResult> {
|
|
149
|
+
await db.run(`
|
|
150
|
+
INSERT INTO vector_outbox (...)
|
|
151
|
+
ON CONFLICT (item_kind, item_id, embedding_version)
|
|
152
|
+
DO NOTHING
|
|
153
|
+
`, [...]);
|
|
154
|
+
// 결과는 항상 동일: 하나의 job만 존재
|
|
155
|
+
}
|
|
156
|
+
```
|
|
157
|
+
|
|
158
|
+
### 3.3 벡터 upsert 증명
|
|
159
|
+
|
|
160
|
+
```typescript
|
|
161
|
+
// upsert 후 조건: 정확히 하나의 레코드만 존재
|
|
162
|
+
interface UpsertInvariant {
|
|
163
|
+
// Pre: record with id=X may or may not exist
|
|
164
|
+
// Post: exactly one record with id=X exists, with latest values
|
|
165
|
+
}
|
|
166
|
+
|
|
167
|
+
async function upsert(record: VectorRecord): Promise<void> {
|
|
168
|
+
// Delete existing (if any)
|
|
169
|
+
await table.delete(`id = '${record.id}'`);
|
|
170
|
+
// Insert new
|
|
171
|
+
await table.add([record]);
|
|
172
|
+
// Invariant: exactly one record with id exists
|
|
173
|
+
}
|
|
174
|
+
```
|
|
175
|
+
|
|
176
|
+
## 4. 기존 코드와의 관계
|
|
177
|
+
|
|
178
|
+
### 4.1 현재 vector-worker.ts
|
|
179
|
+
|
|
180
|
+
```typescript
|
|
181
|
+
// 현재 구현 (src/core/vector-worker.ts)
|
|
182
|
+
export class VectorWorker {
|
|
183
|
+
private embedder: Embedder;
|
|
184
|
+
private vectorStore: VectorStore;
|
|
185
|
+
private db: Database;
|
|
186
|
+
}
|
|
187
|
+
|
|
188
|
+
export interface OutboxItem {
|
|
189
|
+
id: string;
|
|
190
|
+
eventId: string;
|
|
191
|
+
content: string;
|
|
192
|
+
status: 'pending' | 'processing' | 'done' | 'failed';
|
|
193
|
+
retryCount: number;
|
|
194
|
+
createdAt: Date;
|
|
195
|
+
errorMessage?: string;
|
|
196
|
+
}
|
|
197
|
+
```
|
|
198
|
+
|
|
199
|
+
### 4.2 V2 확장 포인트
|
|
200
|
+
|
|
201
|
+
| 기존 | V2 확장 |
|
|
202
|
+
|-----|---------|
|
|
203
|
+
| eventId 기반 | item_kind + item_id |
|
|
204
|
+
| 단순 status | embedding_version 추가 |
|
|
205
|
+
| 재시도 없음 | reconcile + retry policy |
|
|
206
|
+
| 중복 가능 | UNIQUE + upsert |
|
|
207
|
+
|
|
208
|
+
### 4.3 현재 types.ts
|
|
209
|
+
|
|
210
|
+
```typescript
|
|
211
|
+
// 현재 OutboxItem 정의
|
|
212
|
+
export interface OutboxItem {
|
|
213
|
+
id: string;
|
|
214
|
+
eventId: string;
|
|
215
|
+
content: string;
|
|
216
|
+
status: 'pending' | 'processing' | 'done' | 'failed';
|
|
217
|
+
retryCount: number;
|
|
218
|
+
createdAt: Date;
|
|
219
|
+
errorMessage?: string;
|
|
220
|
+
}
|
|
221
|
+
```
|
|
222
|
+
|
|
223
|
+
V2에서 OutboxJob으로 확장.
|
|
224
|
+
|
|
225
|
+
## 5. 설계 결정 사항
|
|
226
|
+
|
|
227
|
+
### 5.1 왜 embedding_version을 포함하는가?
|
|
228
|
+
|
|
229
|
+
**시나리오**:
|
|
230
|
+
1. 모델 v1으로 entry A 임베딩
|
|
231
|
+
2. 모델 v2로 업그레이드
|
|
232
|
+
3. entry A를 v2로 재임베딩 필요
|
|
233
|
+
|
|
234
|
+
**해결**:
|
|
235
|
+
```sql
|
|
236
|
+
-- v1과 v2 job이 별도로 존재 가능
|
|
237
|
+
UNIQUE(item_kind, item_id, embedding_version)
|
|
238
|
+
|
|
239
|
+
-- v1 job
|
|
240
|
+
(job_1, 'entry', 'e1', 'minilm-v1', 'done')
|
|
241
|
+
|
|
242
|
+
-- v2 job
|
|
243
|
+
(job_2, 'entry', 'e1', 'minilm-v2', 'pending')
|
|
244
|
+
```
|
|
245
|
+
|
|
246
|
+
### 5.2 왜 단일 writer인가?
|
|
247
|
+
|
|
248
|
+
**문제**: 여러 프로세스가 동시에 LanceDB에 쓰면
|
|
249
|
+
- 동일 id에 대해 race condition
|
|
250
|
+
- delete와 add 사이에 다른 write 끼어들 수 있음
|
|
251
|
+
- LanceDB 자체 락 메커니즘 미약
|
|
252
|
+
|
|
253
|
+
**해결**:
|
|
254
|
+
- 애플리케이션 레벨에서 단일 writer 보장
|
|
255
|
+
- 파일 락 또는 DB 락 사용
|
|
256
|
+
|
|
257
|
+
### 5.3 왜 delete + add인가?
|
|
258
|
+
|
|
259
|
+
LanceDB의 `update`만으로는 존재하지 않는 레코드를 삽입할 수 없어 true upsert가 되지 않기 때문 (사용 중인 LanceDB 버전이 `mergeInsert`를 제공한다면 그것도 대안이 될 수 있음):
|
|
260
|
+
|
|
261
|
+
```typescript
|
|
262
|
+
// 방법 1: update 시도 (LanceDB 제한적 지원)
|
|
263
|
+
await table.update({ id: 'e1' }, { vector: newVector }); // 불완전
|
|
264
|
+
|
|
265
|
+
// 방법 2: delete + add (권장)
|
|
266
|
+
await table.delete(`id = 'e1'`);
|
|
267
|
+
await table.add([{ id: 'e1', vector: newVector, ... }]); // 확실
|
|
268
|
+
```
|
|
269
|
+
|
|
270
|
+
## 6. Reconcile 전략
|
|
271
|
+
|
|
272
|
+
### 6.1 Failed Job 재시도
|
|
273
|
+
|
|
274
|
+
```typescript
|
|
275
|
+
const RETRY_POLICY = {
|
|
276
|
+
maxRetries: 3,
|
|
277
|
+
backoffMs: [1000, 5000, 30000] // 1초, 5초, 30초
|
|
278
|
+
};
|
|
279
|
+
|
|
280
|
+
async function shouldRetry(job: OutboxJob): Promise<boolean> {
|
|
281
|
+
return job.retryCount < RETRY_POLICY.maxRetries;
|
|
282
|
+
}
|
|
283
|
+
|
|
284
|
+
async function reconcileFailed(): Promise<number> {
|
|
285
|
+
return db.run(`
|
|
286
|
+
UPDATE vector_outbox
|
|
287
|
+
SET status = 'pending',
|
|
288
|
+
retry_count = retry_count + 1,
|
|
289
|
+
updated_at = CURRENT_TIMESTAMP
|
|
290
|
+
WHERE status = 'failed'
|
|
291
|
+
AND retry_count < ?
|
|
292
|
+
`, [RETRY_POLICY.maxRetries]);
|
|
293
|
+
}
|
|
294
|
+
```
|
|
295
|
+
|
|
296
|
+
### 6.2 Stuck Job 복구
|
|
297
|
+
|
|
298
|
+
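Processing 상태에서 worker가 죽으면 job이 processing에 계속 남게 되므로, 일정 시간 이상 갱신되지 않은 job을 pending으로 되돌린다 (3.1의 유효 전이 목록에는 없는 processing → pending 복구 전이이므로 전이 정의에도 추가가 필요):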
|
|
299
|
+
|
|
300
|
+
```typescript
|
|
301
|
+
const STUCK_THRESHOLD_MS = 5 * 60 * 1000; // 5분
|
|
302
|
+
|
|
303
|
+
async function recoverStuck(): Promise<number> {
|
|
304
|
+
const threshold = new Date(Date.now() - STUCK_THRESHOLD_MS);
|
|
305
|
+
return db.run(`
|
|
306
|
+
UPDATE vector_outbox
|
|
307
|
+
SET status = 'pending',
|
|
308
|
+
updated_at = CURRENT_TIMESTAMP
|
|
309
|
+
WHERE status = 'processing'
|
|
310
|
+
AND updated_at < ?
|
|
311
|
+
`, [threshold]);
|
|
312
|
+
}
|
|
313
|
+
```
|
|
314
|
+
|
|
315
|
+
### 6.3 Done Job 정리
|
|
316
|
+
|
|
317
|
+
저장 공간 관리:
|
|
318
|
+
|
|
319
|
+
```typescript
|
|
320
|
+
async function cleanupDone(olderThanDays: number = 7): Promise<number> {
|
|
321
|
+
return db.run(`
|
|
322
|
+
DELETE FROM vector_outbox
|
|
323
|
+
WHERE status = 'done'
|
|
324
|
+
AND updated_at < datetime('now', '-${olderThanDays} days')
|
|
325
|
+
`);
|
|
326
|
+
}
|
|
327
|
+
```
|
|
328
|
+
|
|
329
|
+
## 7. 모니터링 및 알림
|
|
330
|
+
|
|
331
|
+
### 7.1 메트릭
|
|
332
|
+
|
|
333
|
+
```typescript
|
|
334
|
+
interface OutboxMetrics {
|
|
335
|
+
pendingCount: number;
|
|
336
|
+
processingCount: number;
|
|
337
|
+
doneCount: number;
|
|
338
|
+
failedCount: number;
|
|
339
|
+
avgProcessingTimeMs: number;
|
|
340
|
+
oldestPendingAge: number; // 가장 오래된 pending job의 나이 (ms)
|
|
341
|
+
}
|
|
342
|
+
```
|
|
343
|
+
|
|
344
|
+
### 7.2 알림 조건
|
|
345
|
+
|
|
346
|
+
```typescript
|
|
347
|
+
const ALERT_THRESHOLDS = {
|
|
348
|
+
failedCount: 10, // failed가 10개 이상
|
|
349
|
+
pendingAge: 60 * 60 * 1000 // pending이 1시간 이상 된 경우
|
|
350
|
+
};
|
|
351
|
+
|
|
352
|
+
async function checkAlerts(): Promise<Alert[]> {
|
|
353
|
+
const metrics = await getMetrics();
|
|
354
|
+
const alerts: Alert[] = [];
|
|
355
|
+
|
|
356
|
+
if (metrics.failedCount >= ALERT_THRESHOLDS.failedCount) {
|
|
357
|
+
alerts.push({
|
|
358
|
+
level: 'warning',
|
|
359
|
+
message: `${metrics.failedCount} vector jobs failed`
|
|
360
|
+
});
|
|
361
|
+
}
|
|
362
|
+
|
|
363
|
+
if (metrics.oldestPendingAge >= ALERT_THRESHOLDS.pendingAge) {
|
|
364
|
+
alerts.push({
|
|
365
|
+
level: 'warning',
|
|
366
|
+
message: `Oldest pending job is ${metrics.oldestPendingAge / 1000}s old`
|
|
367
|
+
});
|
|
368
|
+
}
|
|
369
|
+
|
|
370
|
+
return alerts;
|
|
371
|
+
}
|
|
372
|
+
```
|
|
373
|
+
|
|
374
|
+
## 8. 에러 처리
|
|
375
|
+
|
|
376
|
+
### 8.1 임베딩 실패
|
|
377
|
+
|
|
378
|
+
```typescript
|
|
379
|
+
try {
|
|
380
|
+
const embedding = await embedder.embed(content);
|
|
381
|
+
} catch (error) {
|
|
382
|
+
if (error.message.includes('rate limit')) {
|
|
383
|
+
// 재시도 가능
|
|
384
|
+
throw new RetryableError('Rate limited', { retryAfterMs: 60000 });
|
|
385
|
+
} else if (error.message.includes('too long')) {
|
|
386
|
+
// 영구 실패
|
|
387
|
+
throw new PermanentError('Content too long for embedding');
|
|
388
|
+
}
|
|
389
|
+
throw error;
|
|
390
|
+
}
|
|
391
|
+
```
|
|
392
|
+
|
|
393
|
+
### 8.2 LanceDB 실패
|
|
394
|
+
|
|
395
|
+
```typescript
|
|
396
|
+
try {
|
|
397
|
+
await vectorStore.upsert(record);
|
|
398
|
+
} catch (error) {
|
|
399
|
+
if (error.message.includes('disk full')) {
|
|
400
|
+
throw new PermanentError('Disk full');
|
|
401
|
+
} else if (error.message.includes('connection')) {
|
|
402
|
+
throw new RetryableError('Connection failed');
|
|
403
|
+
}
|
|
404
|
+
throw error;
|
|
405
|
+
}
|
|
406
|
+
```
|
|
407
|
+
|
|
408
|
+
### 8.3 콘텐츠 없음
|
|
409
|
+
|
|
410
|
+
```typescript
|
|
411
|
+
const content = await getContent(job.itemKind, job.itemId);
|
|
412
|
+
if (!content) {
|
|
413
|
+
// Entry가 삭제되었거나 존재하지 않음
|
|
414
|
+
// Job을 done으로 마크하고 건너뜀
|
|
415
|
+
await markDone(job.jobId, { skipped: true, reason: 'content_not_found' });
|
|
416
|
+
return;
|
|
417
|
+
}
|
|
418
|
+
```
|
|
419
|
+
|
|
420
|
+
## 9. 성능 고려사항
|
|
421
|
+
|
|
422
|
+
### 9.1 배치 처리
|
|
423
|
+
|
|
424
|
+
```typescript
|
|
425
|
+
const BATCH_SIZE = 50;
|
|
426
|
+
|
|
427
|
+
// 한 번에 여러 job claim
|
|
428
|
+
const jobs = await claimJobs(BATCH_SIZE);
|
|
429
|
+
|
|
430
|
+
// 임베딩도 배치로
|
|
431
|
+
const contents = jobs.map(j => j.content);
|
|
432
|
+
const embeddings = await embedder.embedBatch(contents);
|
|
433
|
+
|
|
434
|
+
// LanceDB 배치 insert
|
|
435
|
+
await vectorStore.addBatch(jobs.map((j, i) => ({
|
|
436
|
+
id: j.itemId,
|
|
437
|
+
vector: embeddings[i],
|
|
438
|
+
...
|
|
439
|
+
})));
|
|
440
|
+
```
|
|
441
|
+
|
|
442
|
+
### 9.2 병렬 처리 (주의)
|
|
443
|
+
|
|
444
|
+
```typescript
|
|
445
|
+
// 단일 writer 내에서 병렬 처리
|
|
446
|
+
// LanceDB 쓰기는 순차적으로, 임베딩은 병렬로
|
|
447
|
+
|
|
448
|
+
const jobs = await claimJobs(BATCH_SIZE);
|
|
449
|
+
|
|
450
|
+
// 임베딩 병렬 생성
|
|
451
|
+
const embeddings = await Promise.all(
|
|
452
|
+
jobs.map(async (job) => {
|
|
453
|
+
const content = await getContent(job.itemKind, job.itemId);
|
|
454
|
+
return embedder.embed(content);
|
|
455
|
+
})
|
|
456
|
+
);
|
|
457
|
+
|
|
458
|
+
// LanceDB 순차 쓰기
|
|
459
|
+
for (let i = 0; i < jobs.length; i++) {
|
|
460
|
+
await vectorStore.upsert({ id: jobs[i].itemId, vector: embeddings[i], ... });
|
|
461
|
+
await markDone(jobs[i].jobId);
|
|
462
|
+
}
|
|
463
|
+
```
|
|
464
|
+
|
|
465
|
+
## 10. 참고 자료
|
|
466
|
+
|
|
467
|
+
- **Memo.txt**: 섹션 8 - Vector Outbox + LanceDB writer 구현 지시
|
|
468
|
+
- **현재 구현**: `src/core/vector-worker.ts`
|
|
469
|
+
- **Transactional Outbox**: 마이크로서비스 패턴
|
|
470
|
+
- **AXIOMMIND**: Principle 6 - 벡터 정합성
|