claude-brain 0.30.2 → 0.30.3

This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the package versions as they appear in their respective public registries.
Files changed (236):
  1. package/README.md +241 -191
  2. package/VERSION +1 -1
  3. package/assets/CLAUDE-unified.md +11 -11
  4. package/assets/CLAUDE.md +29 -29
  5. package/package.json +7 -3
  6. package/packs/backend/node.json +173 -173
  7. package/packs/core/javascript.json +176 -176
  8. package/packs/core/typescript.json +222 -222
  9. package/packs/frontend/react.json +254 -254
  10. package/packs/meta/testing.json +172 -172
  11. package/scripts/postinstall.mjs +531 -531
  12. package/src/automation/decision-detector.ts +452 -452
  13. package/src/automation/phase12-manager.ts +456 -456
  14. package/src/automation/proactive-recall.ts +373 -373
  15. package/src/automation/project-detector.ts +310 -310
  16. package/src/automation/repo-scanner.ts +210 -205
  17. package/src/cli/auto-setup.ts +75 -75
  18. package/src/cli/auto-start.ts +266 -266
  19. package/src/cli/bin.ts +264 -264
  20. package/src/cli/commands/autostart.ts +90 -90
  21. package/src/cli/commands/chroma.ts +578 -577
  22. package/src/cli/commands/export-training.ts +70 -70
  23. package/src/cli/commands/export.ts +130 -130
  24. package/src/cli/commands/git-hook.ts +183 -183
  25. package/src/cli/commands/hooks.ts +217 -217
  26. package/src/cli/commands/init.ts +123 -123
  27. package/src/cli/commands/install-mcp.ts +122 -111
  28. package/src/cli/commands/models.ts +979 -979
  29. package/src/cli/commands/pack.ts +200 -200
  30. package/src/cli/commands/refresh.ts +344 -339
  31. package/src/cli/commands/reindex.ts +120 -120
  32. package/src/cli/commands/serve.ts +466 -463
  33. package/src/cli/commands/start.ts +44 -44
  34. package/src/cli/commands/status.ts +220 -203
  35. package/src/cli/commands/uninstall-mcp.ts +45 -41
  36. package/src/cli/commands/update.ts +130 -124
  37. package/src/cli/migrate-chroma.ts +106 -106
  38. package/src/cli/ui/animations.ts +80 -80
  39. package/src/cli/ui/components.ts +82 -82
  40. package/src/cli/ui/index.ts +4 -4
  41. package/src/cli/ui/logo.ts +36 -36
  42. package/src/cli/ui/theme.ts +55 -55
  43. package/src/code-intelligence/indexer.ts +352 -352
  44. package/src/code-intelligence/linker.ts +178 -178
  45. package/src/code-intelligence/parser.ts +484 -484
  46. package/src/code-intelligence/query.ts +291 -291
  47. package/src/code-intelligence/schema.ts +83 -83
  48. package/src/code-intelligence/types.ts +95 -95
  49. package/src/config/defaults.ts +52 -52
  50. package/src/config/home.ts +56 -56
  51. package/src/config/index.ts +5 -5
  52. package/src/config/loader.ts +192 -192
  53. package/src/config/schema.ts +446 -415
  54. package/src/config/validator.ts +182 -182
  55. package/src/context/assembler.ts +407 -400
  56. package/src/context/index.ts +79 -79
  57. package/src/context/progress-tracker.ts +174 -174
  58. package/src/context/standards-manager.ts +287 -287
  59. package/src/context/validator.ts +58 -58
  60. package/src/diagnostics/index.ts +122 -121
  61. package/src/health/index.ts +233 -232
  62. package/src/hooks/brain-hook.ts +134 -131
  63. package/src/hooks/capture.ts +168 -168
  64. package/src/hooks/claude-code-mastery.md +112 -112
  65. package/src/hooks/context-hook.ts +260 -245
  66. package/src/hooks/deduplicator.ts +72 -72
  67. package/src/hooks/git-capture.ts +109 -109
  68. package/src/hooks/git-hook-installer.ts +211 -207
  69. package/src/hooks/index.ts +20 -20
  70. package/src/hooks/installer.ts +306 -288
  71. package/src/hooks/interceptor-hook.ts +204 -201
  72. package/src/hooks/passive-classifier.ts +397 -397
  73. package/src/hooks/queue.ts +160 -129
  74. package/src/hooks/session-tracker.ts +312 -312
  75. package/src/hooks/types.ts +52 -52
  76. package/src/index.ts +7 -7
  77. package/src/intelligence/cross-project/generalizer.ts +283 -283
  78. package/src/intelligence/cross-project/index.ts +7 -7
  79. package/src/intelligence/hf-downloader.ts +222 -222
  80. package/src/intelligence/hf-manifest.json +78 -78
  81. package/src/intelligence/index.ts +24 -24
  82. package/src/intelligence/inference-router.ts +762 -762
  83. package/src/intelligence/model-manager.ts +263 -245
  84. package/src/intelligence/optimization/index.ts +10 -10
  85. package/src/intelligence/optimization/precompute.ts +202 -202
  86. package/src/intelligence/optimization/semantic-cache.ts +213 -207
  87. package/src/intelligence/prediction/index.ts +7 -7
  88. package/src/intelligence/prediction/recommender.ts +276 -268
  89. package/src/intelligence/reasoning/chain-retrieval.ts +243 -247
  90. package/src/intelligence/reasoning/index.ts +7 -7
  91. package/src/intelligence/temporal/evolution.ts +193 -197
  92. package/src/intelligence/temporal/index.ts +16 -16
  93. package/src/intelligence/temporal/query-processor.ts +190 -190
  94. package/src/intelligence/temporal/timeline.ts +272 -259
  95. package/src/intelligence/temporal/trends.ts +263 -263
  96. package/src/intelligence/tokenizer.ts +118 -118
  97. package/src/knowledge/entity-extractor.ts +447 -443
  98. package/src/knowledge/graph/builder.ts +185 -185
  99. package/src/knowledge/graph/linker.ts +201 -201
  100. package/src/knowledge/graph/memory-graph.ts +359 -359
  101. package/src/knowledge/graph/schema.ts +99 -99
  102. package/src/knowledge/graph/search.ts +166 -166
  103. package/src/knowledge/relationship-extractor.ts +108 -108
  104. package/src/memory/chroma/client.ts +211 -192
  105. package/src/memory/chroma/collection-manager.ts +92 -92
  106. package/src/memory/chroma/config.ts +57 -57
  107. package/src/memory/chroma/embeddings.ts +177 -175
  108. package/src/memory/chroma/index.ts +82 -82
  109. package/src/memory/chroma/migration.ts +270 -270
  110. package/src/memory/chroma/schemas.ts +69 -69
  111. package/src/memory/chroma/search.ts +319 -315
  112. package/src/memory/chroma/store.ts +755 -747
  113. package/src/memory/compression.ts +121 -121
  114. package/src/memory/consolidation/archiver.ts +162 -165
  115. package/src/memory/consolidation/merger.ts +182 -186
  116. package/src/memory/consolidation/scorer.ts +136 -136
  117. package/src/memory/database.ts +9 -0
  118. package/src/memory/dual-write.ts +145 -0
  119. package/src/memory/embeddings.ts +226 -226
  120. package/src/memory/episodic/detector.ts +108 -108
  121. package/src/memory/episodic/manager.ts +347 -351
  122. package/src/memory/episodic/summarizer.ts +179 -179
  123. package/src/memory/episodic/types.ts +52 -52
  124. package/src/memory/fts5-search.ts +692 -633
  125. package/src/memory/index.ts +943 -1060
  126. package/src/memory/migrations/add-fts5.ts +118 -108
  127. package/src/memory/patterns.ts +438 -438
  128. package/src/memory/pruning.ts +60 -60
  129. package/src/memory/schema.ts +88 -88
  130. package/src/memory/store.ts +911 -787
  131. package/src/orchestrator/handlers/decision-handler.ts +204 -204
  132. package/src/packs/index.ts +9 -9
  133. package/src/packs/loader.ts +134 -134
  134. package/src/packs/manager.ts +204 -204
  135. package/src/packs/ranker.ts +78 -78
  136. package/src/packs/types.ts +81 -81
  137. package/src/phase12/index.ts +5 -5
  138. package/src/retrieval/bm25/index.ts +300 -297
  139. package/src/retrieval/bm25/tokenizer.ts +184 -184
  140. package/src/retrieval/feedback/adaptive.ts +221 -221
  141. package/src/retrieval/feedback/index.ts +16 -16
  142. package/src/retrieval/feedback/metrics.ts +221 -221
  143. package/src/retrieval/feedback/store.ts +283 -283
  144. package/src/retrieval/fusion/index.ts +194 -194
  145. package/src/retrieval/fusion/rrf.ts +165 -165
  146. package/src/retrieval/index.ts +12 -12
  147. package/src/retrieval/pipeline.ts +375 -375
  148. package/src/retrieval/query/expander.ts +203 -203
  149. package/src/retrieval/query/index.ts +27 -27
  150. package/src/retrieval/query/intent-classifier.ts +252 -252
  151. package/src/retrieval/query/temporal-parser.ts +295 -295
  152. package/src/retrieval/reranker/index.ts +189 -188
  153. package/src/retrieval/reranker/model.ts +99 -95
  154. package/src/retrieval/service.ts +125 -125
  155. package/src/retrieval/types.ts +162 -162
  156. package/src/routing/entity-extractor.ts +454 -454
  157. package/src/routing/handlers/exploration-handler.ts +369 -0
  158. package/src/routing/handlers/index.ts +19 -0
  159. package/src/routing/handlers/memory-handler.ts +273 -0
  160. package/src/routing/handlers/mutation-handler.ts +241 -0
  161. package/src/routing/handlers/recall-handler.ts +642 -0
  162. package/src/routing/handlers/shared.ts +515 -0
  163. package/src/routing/handlers/types.ts +48 -0
  164. package/src/routing/intent-classifier.ts +552 -552
  165. package/src/routing/response-filter.ts +399 -391
  166. package/src/routing/router.ts +245 -2193
  167. package/src/routing/search-engine.ts +521 -514
  168. package/src/routing/types.ts +104 -94
  169. package/src/scripts/health-check.ts +118 -118
  170. package/src/scripts/setup.ts +122 -122
  171. package/src/server/auto-updater.ts +283 -276
  172. package/src/server/handlers/call-tool.ts +159 -159
  173. package/src/server/handlers/list-tools.ts +35 -35
  174. package/src/server/handlers/tools/auto-remember.ts +165 -165
  175. package/src/server/handlers/tools/brain.ts +86 -86
  176. package/src/server/handlers/tools/create-project.ts +135 -135
  177. package/src/server/handlers/tools/get-code-standards.ts +123 -123
  178. package/src/server/handlers/tools/get-corrections.ts +152 -152
  179. package/src/server/handlers/tools/get-patterns.ts +156 -156
  180. package/src/server/handlers/tools/get-project-context.ts +75 -75
  181. package/src/server/handlers/tools/index.ts +30 -30
  182. package/src/server/handlers/tools/init-project.ts +756 -756
  183. package/src/server/handlers/tools/list-projects.ts +126 -126
  184. package/src/server/handlers/tools/recall-similar.ts +87 -87
  185. package/src/server/handlers/tools/recognize-pattern.ts +132 -132
  186. package/src/server/handlers/tools/record-correction.ts +131 -131
  187. package/src/server/handlers/tools/remember-decision.ts +168 -168
  188. package/src/server/handlers/tools/schemas.ts +179 -179
  189. package/src/server/handlers/tools/search-code.ts +122 -122
  190. package/src/server/handlers/tools/smart-context.ts +146 -146
  191. package/src/server/handlers/tools/update-progress.ts +131 -131
  192. package/src/server/http-api.ts +215 -1229
  193. package/src/server/mcp-proxy.ts +85 -84
  194. package/src/server/mcp-server.ts +285 -284
  195. package/src/server/middleware/auth.ts +39 -0
  196. package/src/server/middleware/error-handler.ts +37 -0
  197. package/src/server/middleware/rate-limit.ts +53 -0
  198. package/src/server/middleware/validate.ts +42 -0
  199. package/src/server/pid-manager.ts +137 -136
  200. package/src/server/providers/resources.ts +581 -581
  201. package/src/server/routes/code.ts +228 -0
  202. package/src/server/routes/context.ts +26 -0
  203. package/src/server/routes/health.ts +19 -0
  204. package/src/server/routes/helpers.ts +100 -0
  205. package/src/server/routes/hooks.ts +197 -0
  206. package/src/server/routes/mcp.ts +47 -0
  207. package/src/server/routes/memory.ts +397 -0
  208. package/src/server/routes/models.ts +96 -0
  209. package/src/server/routes/projects.ts +89 -0
  210. package/src/server/routes/types.ts +21 -0
  211. package/src/server/schemas/api-schemas.ts +202 -0
  212. package/src/server/services.ts +720 -720
  213. package/src/server/utils/memory-indicator.ts +84 -84
  214. package/src/server/utils/response-formatter.ts +129 -129
  215. package/src/server/web-viewer.ts +1145 -1115
  216. package/src/setup/index.ts +38 -38
  217. package/src/tools/registry.ts +115 -115
  218. package/src/tools/schemas.ts +666 -666
  219. package/src/tools/types.ts +412 -412
  220. package/src/training/data-store.ts +320 -298
  221. package/src/training/retrain-pipeline.ts +399 -394
  222. package/src/utils/error-handler.ts +136 -136
  223. package/src/utils/index.ts +58 -58
  224. package/src/utils/kill-port.ts +55 -53
  225. package/src/utils/phase12-helper.ts +56 -56
  226. package/src/utils/safe-path.ts +43 -0
  227. package/src/utils/timing.ts +47 -47
  228. package/src/utils/transaction.ts +63 -63
  229. package/src/vault/index.ts +4 -3
  230. package/src/vault/paths.ts +106 -106
  231. package/src/vault/query.ts +4 -1
  232. package/src/vault/reader.ts +44 -1
  233. package/src/vault/watcher.ts +24 -1
  234. package/src/vault/writer.ts +487 -413
  235. package/skills/persistent-memory/SKILL.md +0 -148
  236. package/skills/persistent-memory/references/tool-reference.md +0 -90
@@ -1,394 +1,399 @@
1
- /**
2
- * Retrain Pipeline — SLM Upgrade Phase 6B
3
- * Automated retraining when enough feedback accumulates.
4
- *
5
- * Flow:
6
- * 1. Check if retraining is needed (feedback count + disagreement rate)
7
- * 2. Export merged training data (existing + feedback corrections) as JSONL
8
- * 3. Shell out to Python: prepare_data → train → evaluate → export_onnx
9
- * 4. Compare new accuracy to old, promote model if improved
10
- * 5. Update retrain-state.json with timestamp + stats
11
- */
12
-
13
- import { execSync } from 'node:child_process'
14
- import { existsSync, mkdirSync, readFileSync, writeFileSync } from 'node:fs'
15
- import { join } from 'node:path'
16
- import { homedir } from 'node:os'
17
- import { getClaudeBrainHome, getHomePaths } from '@/config/home'
18
- import {
19
- exportTrainingData,
20
- exportModelFeedback,
21
- getModelFeedbackStats,
22
- type TrainingTask,
23
- } from '@/training/data-store'
24
- import type { ModelManifest, ModelTask } from '@/intelligence/model-manager'
25
-
26
- // ── Types ────────────────────────────────────────────────────────────
27
-
28
- export interface RetrainConfig {
29
- minFeedbackCount: number
30
- maxDisagreementRate: number
31
- pythonPath: string
32
- trainingDir: string
33
- force: boolean
34
- }
35
-
36
- export interface RetrainCheck {
37
- needed: boolean
38
- reason: string
39
- feedbackCount: number
40
- disagreementRate: number
41
- lastRetrainDate: string | null
42
- }
43
-
44
- export interface RetrainResult {
45
- task: string
46
- success: boolean
47
- error?: string
48
- oldAccuracy?: number
49
- newAccuracy?: number
50
- trainingDataCount: number
51
- duration: number
52
- }
53
-
54
- interface RetrainStateEntry {
55
- lastRetrain: string
56
- lastAccuracy: number
57
- feedbackAtRetrain: number
58
- }
59
-
60
- type RetrainState = Record<string, RetrainStateEntry>
61
-
62
- // ── Helpers ──────────────────────────────────────────────────────────
63
-
64
- function resolveTrainingDir(trainingDir: string): string {
65
- if (trainingDir.startsWith('~')) {
66
- return join(homedir(), trainingDir.slice(1))
67
- }
68
- return trainingDir
69
- }
70
-
71
- function getRetrainStatePath(): string {
72
- return join(getClaudeBrainHome(), 'data', 'retrain-state.json')
73
- }
74
-
75
- function loadRetrainState(): RetrainState {
76
- const statePath = getRetrainStatePath()
77
- if (!existsSync(statePath)) return {}
78
- try {
79
- return JSON.parse(readFileSync(statePath, 'utf-8'))
80
- } catch {
81
- return {}
82
- }
83
- }
84
-
85
- function saveRetrainState(state: RetrainState): void {
86
- const statePath = getRetrainStatePath()
87
- const dir = join(getClaudeBrainHome(), 'data')
88
- if (!existsSync(dir)) {
89
- mkdirSync(dir, { recursive: true })
90
- }
91
- writeFileSync(statePath, JSON.stringify(state, null, 2))
92
- }
93
-
94
- function loadManifest(): ModelManifest | null {
95
- const manifestPath = join(getHomePaths().models, 'manifest.json')
96
- if (!existsSync(manifestPath)) return null
97
- try {
98
- return JSON.parse(readFileSync(manifestPath, 'utf-8'))
99
- } catch {
100
- return null
101
- }
102
- }
103
-
104
- function saveManifest(manifest: ModelManifest): void {
105
- const modelsDir = getHomePaths().models
106
- if (!existsSync(modelsDir)) {
107
- mkdirSync(modelsDir, { recursive: true })
108
- }
109
- writeFileSync(join(modelsDir, 'manifest.json'), JSON.stringify(manifest, null, 2))
110
- }
111
-
112
- // ── Public API ───────────────────────────────────────────────────────
113
-
114
- /**
115
- * Check if retraining is needed for a task based on feedback accumulation.
116
- */
117
- export function shouldRetrain(task: ModelTask, config: RetrainConfig): RetrainCheck {
118
- const state = loadRetrainState()
119
- const taskState = state[task]
120
- const lastRetrainDate = taskState?.lastRetrain ?? null
121
- const feedbackAtLastRetrain = taskState?.feedbackAtRetrain ?? 0
122
-
123
- const feedbackStats = getModelFeedbackStats()
124
- const taskStats = feedbackStats[task]
125
-
126
- if (!taskStats) {
127
- return {
128
- needed: false,
129
- reason: 'No feedback data available',
130
- feedbackCount: 0,
131
- disagreementRate: 0,
132
- lastRetrainDate,
133
- }
134
- }
135
-
136
- const newFeedbackCount = taskStats.total - feedbackAtLastRetrain
137
- const disagreementRate = taskStats.disagreementRate
138
-
139
- // Check if enough new feedback has accumulated
140
- if (newFeedbackCount < config.minFeedbackCount) {
141
- return {
142
- needed: false,
143
- reason: `Only ${newFeedbackCount} new feedback entries (need ${config.minFeedbackCount})`,
144
- feedbackCount: taskStats.total,
145
- disagreementRate,
146
- lastRetrainDate,
147
- }
148
- }
149
-
150
- // Check if disagreement rate exceeds threshold
151
- if (disagreementRate > config.maxDisagreementRate) {
152
- return {
153
- needed: true,
154
- reason: `Disagreement rate ${(disagreementRate * 100).toFixed(1)}% exceeds threshold ${(config.maxDisagreementRate * 100).toFixed(1)}%`,
155
- feedbackCount: taskStats.total,
156
- disagreementRate,
157
- lastRetrainDate,
158
- }
159
- }
160
-
161
- // Enough feedback accumulated even if disagreement rate is below threshold
162
- return {
163
- needed: true,
164
- reason: `${newFeedbackCount} new feedback entries since last retrain`,
165
- feedbackCount: taskStats.total,
166
- disagreementRate,
167
- lastRetrainDate,
168
- }
169
- }
170
-
171
- /**
172
- * Export merged training data (training_data + feedback corrections) as JSONL.
173
- */
174
- export function exportMergedTrainingData(
175
- task: ModelTask,
176
- trainingDir: string
177
- ): { path: string; count: number } {
178
- const resolvedDir = resolveTrainingDir(trainingDir)
179
- const dataDir = join(resolvedDir, 'data', task)
180
- if (!existsSync(dataDir)) {
181
- mkdirSync(dataDir, { recursive: true })
182
- }
183
-
184
- const outputPath = join(dataDir, 'train.jsonl')
185
-
186
- // Get existing training data
187
- const trainingLines = exportTrainingData(task as TrainingTask)
188
-
189
- // Get feedback data (disagreements are useful training signal)
190
- const feedbackLines = exportModelFeedback(task)
191
-
192
- // Merge: training data first, then feedback
193
- const allLines = [...trainingLines, ...feedbackLines]
194
-
195
- writeFileSync(outputPath, allLines.join('\n') + '\n')
196
-
197
- return { path: outputPath, count: allLines.length }
198
- }
199
-
200
- /**
201
- * Run the full retrain pipeline for a single task.
202
- */
203
- export async function retrainTask(
204
- task: ModelTask,
205
- config: RetrainConfig
206
- ): Promise<RetrainResult> {
207
- const startTime = Date.now()
208
- const resolvedDir = resolveTrainingDir(config.trainingDir)
209
-
210
- // Step 1: Export merged training data
211
- console.log(` [${task}] Exporting merged training data...`)
212
- let dataCount: number
213
- try {
214
- const { count } = exportMergedTrainingData(task, config.trainingDir)
215
- dataCount = count
216
- console.log(` [${task}] Exported ${count} training examples`)
217
- } catch (err) {
218
- return {
219
- task,
220
- success: false,
221
- error: `Failed to export training data: ${err instanceof Error ? err.message : String(err)}`,
222
- trainingDataCount: 0,
223
- duration: Date.now() - startTime,
224
- }
225
- }
226
-
227
- if (dataCount === 0) {
228
- return {
229
- task,
230
- success: false,
231
- error: 'No training data available',
232
- trainingDataCount: 0,
233
- duration: Date.now() - startTime,
234
- }
235
- }
236
-
237
- // Step 2: Run Python training pipeline
238
- const pythonSteps = [
239
- { script: 'scripts/prepare_data.py', args: `--task ${task}`, label: 'Preparing data' },
240
- { script: 'scripts/train.py', args: `--task ${task}`, label: 'Training model' },
241
- { script: 'scripts/evaluate.py', args: `--task ${task} --save`, label: 'Evaluating model' },
242
- { script: 'scripts/export_onnx.py', args: `--task ${task} --output-dir models/`, label: 'Exporting ONNX' },
243
- ]
244
-
245
- for (const step of pythonSteps) {
246
- console.log(` [${task}] ${step.label}...`)
247
- const cmd = `${config.pythonPath} ${step.script} ${step.args}`
248
- try {
249
- execSync(cmd, {
250
- cwd: resolvedDir,
251
- stdio: 'pipe',
252
- timeout: 600_000, // 10 minute timeout per step
253
- })
254
- } catch (err) {
255
- const stderr = err instanceof Error && 'stderr' in err
256
- ? (err as any).stderr?.toString().slice(0, 500)
257
- : String(err)
258
- return {
259
- task,
260
- success: false,
261
- error: `Python step "${step.label}" failed: ${stderr}`,
262
- trainingDataCount: dataCount,
263
- duration: Date.now() - startTime,
264
- }
265
- }
266
- }
267
-
268
- // Step 3: Read evaluation results
269
- const benchmarkPath = join(resolvedDir, 'benchmarks', `${task}.json`)
270
- let newAccuracy: number | undefined
271
- try {
272
- if (existsSync(benchmarkPath)) {
273
- const benchData = JSON.parse(readFileSync(benchmarkPath, 'utf-8'))
274
- newAccuracy = benchData.accuracy ?? benchData.overall_accuracy
275
- }
276
- } catch {
277
- console.log(` [${task}] Warning: Could not read benchmark results`)
278
- }
279
-
280
- // Step 4: Compare with existing model accuracy
281
- const manifest = loadManifest()
282
- const oldAccuracy = manifest?.models[task]?.accuracy
283
-
284
- if (newAccuracy != null && oldAccuracy != null && newAccuracy < oldAccuracy && !config.force) {
285
- console.log(` [${task}] New accuracy ${(newAccuracy * 100).toFixed(1)}% < old ${(oldAccuracy * 100).toFixed(1)}% — skipping model replacement`)
286
- // Still record the retrain attempt
287
- const state = loadRetrainState()
288
- const feedbackStats = getModelFeedbackStats()
289
- state[task] = {
290
- lastRetrain: new Date().toISOString(),
291
- lastAccuracy: oldAccuracy,
292
- feedbackAtRetrain: feedbackStats[task]?.total ?? 0,
293
- }
294
- saveRetrainState(state)
295
-
296
- return {
297
- task,
298
- success: false,
299
- error: `New accuracy (${(newAccuracy * 100).toFixed(1)}%) lower than current (${(oldAccuracy * 100).toFixed(1)}%). Use --force to override.`,
300
- oldAccuracy,
301
- newAccuracy,
302
- trainingDataCount: dataCount,
303
- duration: Date.now() - startTime,
304
- }
305
- }
306
-
307
- // Step 5: Copy new ONNX model to ~/.claude-brain/models/
308
- const modelsDir = getHomePaths().models
309
- if (!existsSync(modelsDir)) {
310
- mkdirSync(modelsDir, { recursive: true })
311
- }
312
-
313
- const onnxSource = join(resolvedDir, 'models', `${task}.onnx`)
314
- if (existsSync(onnxSource)) {
315
- const onnxDest = join(modelsDir, `${task}.onnx`)
316
- const onnxData = readFileSync(onnxSource)
317
- writeFileSync(onnxDest, onnxData)
318
- console.log(` [${task}] Model copied to ${onnxDest}`)
319
-
320
- // Update manifest
321
- const currentManifest = loadManifest() ?? { models: {} }
322
- const existing = currentManifest.models[task]
323
- currentManifest.models[task] = {
324
- version: bumpVersion(existing?.version),
325
- file: `${task}.onnx`,
326
- accuracy: newAccuracy,
327
- labels: existing?.labels,
328
- maxSeqLen: existing?.maxSeqLen,
329
- }
330
- saveManifest(currentManifest)
331
- console.log(` [${task}] Manifest updated`)
332
- } else {
333
- console.log(` [${task}] Warning: ONNX file not found at ${onnxSource}`)
334
- }
335
-
336
- // Step 6: Update retrain state
337
- const state = loadRetrainState()
338
- const feedbackStats = getModelFeedbackStats()
339
- state[task] = {
340
- lastRetrain: new Date().toISOString(),
341
- lastAccuracy: newAccuracy ?? oldAccuracy ?? 0,
342
- feedbackAtRetrain: feedbackStats[task]?.total ?? 0,
343
- }
344
- saveRetrainState(state)
345
-
346
- console.log(` [${task}] Retrain complete in ${((Date.now() - startTime) / 1000).toFixed(1)}s`)
347
-
348
- return {
349
- task,
350
- success: true,
351
- oldAccuracy,
352
- newAccuracy,
353
- trainingDataCount: dataCount,
354
- duration: Date.now() - startTime,
355
- }
356
- }
357
-
358
- /**
359
- * Run retrain for all tasks that need it.
360
- */
361
- export async function retrainAll(
362
- config: RetrainConfig
363
- ): Promise<Map<string, RetrainResult>> {
364
- const ALL_TASKS: ModelTask[] = ['intent', 'entity', 'query', 'knowledge', 'compress', 'pattern']
365
- const results = new Map<string, RetrainResult>()
366
-
367
- for (const task of ALL_TASKS) {
368
- const check = shouldRetrain(task, config)
369
-
370
- if (!check.needed && !config.force) {
371
- console.log(` [${task}] Skipping — ${check.reason}`)
372
- continue
373
- }
374
-
375
- if (config.force && !check.needed) {
376
- console.log(` [${task}] Forcing retrain (${check.reason})`)
377
- }
378
-
379
- const result = await retrainTask(task, config)
380
- results.set(task, result)
381
- }
382
-
383
- return results
384
- }
385
-
386
- // ── Internal Helpers ─────────────────────────────────────────────────
387
-
388
- function bumpVersion(current?: string): string {
389
- if (!current) return '1.0.0'
390
- const parts = current.split('.').map(Number)
391
- // Bump patch version
392
- parts[2] = (parts[2] ?? 0) + 1
393
- return parts.join('.')
394
- }
1
+ /**
2
+ * Retrain Pipeline — SLM Upgrade Phase 6B
3
+ * Automated retraining when enough feedback accumulates.
4
+ *
5
+ * Flow:
6
+ * 1. Check if retraining is needed (feedback count + disagreement rate)
7
+ * 2. Export merged training data (existing + feedback corrections) as JSONL
8
+ * 3. Shell out to Python: prepare_data → train → evaluate → export_onnx
9
+ * 4. Compare new accuracy to old, promote model if improved
10
+ * 5. Update retrain-state.json with timestamp + stats
11
+ */
12
+
13
+ import { spawnSync } from 'node:child_process'
14
+ import { existsSync, mkdirSync, readFileSync, writeFileSync, realpathSync } from 'node:fs'
15
+ import { join } from 'node:path'
16
+ import { homedir } from 'node:os'
17
+ import { getClaudeBrainHome, getHomePaths } from '@/config/home'
18
+ import {
19
+ exportTrainingData,
20
+ exportModelFeedback,
21
+ getModelFeedbackStats,
22
+ type TrainingTask,
23
+ } from '@/training/data-store'
24
+ import type { ModelManifest, ModelTask } from '@/intelligence/model-manager'
25
+
26
+ // ── Types ────────────────────────────────────────────────────────────
27
+
28
+ export interface RetrainConfig {
29
+ minFeedbackCount: number
30
+ maxDisagreementRate: number
31
+ pythonPath: string
32
+ trainingDir: string
33
+ force: boolean
34
+ }
35
+
36
+ export interface RetrainCheck {
37
+ needed: boolean
38
+ reason: string
39
+ feedbackCount: number
40
+ disagreementRate: number
41
+ lastRetrainDate: string | null
42
+ }
43
+
44
+ export interface RetrainResult {
45
+ task: string
46
+ success: boolean
47
+ error?: string
48
+ oldAccuracy?: number
49
+ newAccuracy?: number
50
+ trainingDataCount: number
51
+ duration: number
52
+ }
53
+
54
+ interface RetrainStateEntry {
55
+ lastRetrain: string
56
+ lastAccuracy: number
57
+ feedbackAtRetrain: number
58
+ }
59
+
60
+ type RetrainState = Record<string, RetrainStateEntry>
61
+
62
+ // ── Helpers ──────────────────────────────────────────────────────────
63
+
64
+ function resolveTrainingDir(trainingDir: string): string {
65
+ if (trainingDir.startsWith('~')) {
66
+ return join(homedir(), trainingDir.slice(1))
67
+ }
68
+ return trainingDir
69
+ }
70
+
71
+ function getRetrainStatePath(): string {
72
+ return join(getClaudeBrainHome(), 'data', 'retrain-state.json')
73
+ }
74
+
75
+ function loadRetrainState(): RetrainState {
76
+ const statePath = getRetrainStatePath()
77
+ if (!existsSync(statePath)) return {}
78
+ try {
79
+ return JSON.parse(readFileSync(statePath, 'utf-8'))
80
+ } catch {
81
+ return {}
82
+ }
83
+ }
84
+
85
+ function saveRetrainState(state: RetrainState): void {
86
+ const statePath = getRetrainStatePath()
87
+ const dir = join(getClaudeBrainHome(), 'data')
88
+ if (!existsSync(dir)) {
89
+ mkdirSync(dir, { recursive: true })
90
+ }
91
+ writeFileSync(statePath, JSON.stringify(state, null, 2))
92
+ }
93
+
94
+ function loadManifest(): ModelManifest | null {
95
+ const manifestPath = join(getHomePaths().models, 'manifest.json')
96
+ if (!existsSync(manifestPath)) return null
97
+ try {
98
+ return JSON.parse(readFileSync(manifestPath, 'utf-8'))
99
+ } catch {
100
+ return null
101
+ }
102
+ }
103
+
104
+ function saveManifest(manifest: ModelManifest): void {
105
+ const modelsDir = getHomePaths().models
106
+ if (!existsSync(modelsDir)) {
107
+ mkdirSync(modelsDir, { recursive: true })
108
+ }
109
+ writeFileSync(join(modelsDir, 'manifest.json'), JSON.stringify(manifest, null, 2))
110
+ }
111
+
112
+ // ── Public API ───────────────────────────────────────────────────────
113
+
114
+ /**
115
+ * Check if retraining is needed for a task based on feedback accumulation.
116
+ */
117
+ export function shouldRetrain(task: ModelTask, config: RetrainConfig): RetrainCheck {
118
+ const state = loadRetrainState()
119
+ const taskState = state[task]
120
+ const lastRetrainDate = taskState?.lastRetrain ?? null
121
+ const feedbackAtLastRetrain = taskState?.feedbackAtRetrain ?? 0
122
+
123
+ const feedbackStats = getModelFeedbackStats()
124
+ const taskStats = feedbackStats[task]
125
+
126
+ if (!taskStats) {
127
+ return {
128
+ needed: false,
129
+ reason: 'No feedback data available',
130
+ feedbackCount: 0,
131
+ disagreementRate: 0,
132
+ lastRetrainDate,
133
+ }
134
+ }
135
+
136
+ const newFeedbackCount = taskStats.total - feedbackAtLastRetrain
137
+ const disagreementRate = taskStats.disagreementRate
138
+
139
+ // Check if enough new feedback has accumulated
140
+ if (newFeedbackCount < config.minFeedbackCount) {
141
+ return {
142
+ needed: false,
143
+ reason: `Only ${newFeedbackCount} new feedback entries (need ${config.minFeedbackCount})`,
144
+ feedbackCount: taskStats.total,
145
+ disagreementRate,
146
+ lastRetrainDate,
147
+ }
148
+ }
149
+
150
+ // Check if disagreement rate exceeds threshold
151
+ if (disagreementRate > config.maxDisagreementRate) {
152
+ return {
153
+ needed: true,
154
+ reason: `Disagreement rate ${(disagreementRate * 100).toFixed(1)}% exceeds threshold ${(config.maxDisagreementRate * 100).toFixed(1)}%`,
155
+ feedbackCount: taskStats.total,
156
+ disagreementRate,
157
+ lastRetrainDate,
158
+ }
159
+ }
160
+
161
+ // Enough feedback accumulated even if disagreement rate is below threshold
162
+ return {
163
+ needed: true,
164
+ reason: `${newFeedbackCount} new feedback entries since last retrain`,
165
+ feedbackCount: taskStats.total,
166
+ disagreementRate,
167
+ lastRetrainDate,
168
+ }
169
+ }
170
+
171
/**
 * Export merged training data (training_data + feedback corrections) as JSONL.
 *
 * Writes `data/<task>/train.jsonl` underneath the resolved training
 * directory, creating the directory when it does not exist yet. Lines from
 * `exportTrainingData` come first, followed by lines from
 * `exportModelFeedback`.
 *
 * @param task - Model task whose examples are exported.
 * @param trainingDir - Training directory, passed through `resolveTrainingDir`.
 * @returns The path of the written file and the number of lines it contains.
 */
export function exportMergedTrainingData(
  task: ModelTask,
  trainingDir: string
): { path: string; count: number } {
  const dataDir = join(resolveTrainingDir(trainingDir), 'data', task)
  // `recursive: true` is a no-op when the directory already exists, so no
  // separate existence check is needed.
  mkdirSync(dataDir, { recursive: true })

  const outputPath = join(dataDir, 'train.jsonl')

  // Merge: existing training data first, then feedback entries.
  const allLines = [
    ...exportTrainingData(task as TrainingTask),
    ...exportModelFeedback(task),
  ]

  // With no examples, write a truly empty file: a lone "\n" would be a blank
  // line, which is not a valid JSONL record.
  const contents = allLines.length > 0 ? `${allLines.join('\n')}\n` : ''
  writeFileSync(outputPath, contents)

  return { path: outputPath, count: allLines.length }
}
199
+
200
/**
 * Run the full retrain pipeline for a single task.
 *
 * Pipeline:
 *  1. Export merged training data into the training directory.
 *  2. Run the Python scripts (prepare, train, evaluate, export ONNX) with
 *     `config.pythonPath`, using the training directory as working directory.
 *  3. Read the new accuracy from `benchmarks/<task>.json`.
 *  4. Unless `config.force` is set, refuse to replace the model when the new
 *     accuracy is lower than the accuracy recorded in the manifest.
 *  5. Copy `models/<task>.onnx` into the home models directory and update
 *     the manifest.
 *  6. Record the retrain in the retrain state.
 *
 * Export failures, an empty data set, a failing Python step and an accuracy
 * regression are reported through the returned result (`success: false`
 * plus `error`) rather than by throwing.
 *
 * @param task - Model task to retrain.
 * @param config - Retrain configuration (`trainingDir`, `pythonPath`, `force`).
 * @returns Outcome of the run, including accuracies and elapsed milliseconds.
 */
export async function retrainTask(
  task: ModelTask,
  config: RetrainConfig
): Promise<RetrainResult> {
  const startTime = Date.now()
  const resolvedDir = resolveTrainingDir(config.trainingDir)

  // Shared bookkeeping for both the "regressed" and the "completed" outcome:
  // stores when the retrain ran and the feedback total at that moment.
  const recordRetrainState = (lastAccuracy: number): void => {
    const state = loadRetrainState()
    const feedbackStats = getModelFeedbackStats()
    state[task] = {
      lastRetrain: new Date().toISOString(),
      lastAccuracy,
      feedbackAtRetrain: feedbackStats[task]?.total ?? 0,
    }
    saveRetrainState(state)
  }

  // Step 1: Export merged training data
  console.log(` [${task}] Exporting merged training data...`)
  let dataCount: number
  try {
    dataCount = exportMergedTrainingData(task, config.trainingDir).count
    console.log(` [${task}] Exported ${dataCount} training examples`)
  } catch (err) {
    return {
      task,
      success: false,
      error: `Failed to export training data: ${err instanceof Error ? err.message : String(err)}`,
      trainingDataCount: 0,
      duration: Date.now() - startTime,
    }
  }

  if (dataCount === 0) {
    return {
      task,
      success: false,
      error: 'No training data available',
      trainingDataCount: 0,
      duration: Date.now() - startTime,
    }
  }

  // Step 2: Run Python training pipeline.
  // Arguments are kept as arrays so no value is ever re-split on whitespace.
  const pythonSteps = [
    { script: 'scripts/prepare_data.py', args: ['--task', task], label: 'Preparing data' },
    { script: 'scripts/train.py', args: ['--task', task], label: 'Training model' },
    { script: 'scripts/evaluate.py', args: ['--task', task, '--save'], label: 'Evaluating model' },
    { script: 'scripts/export_onnx.py', args: ['--task', task, '--output-dir', 'models/'], label: 'Exporting ONNX' },
  ]

  // Prefer the canonical path as cwd; fall back to the unresolved directory
  // when it cannot be canonicalised.
  let resolvedCwd: string
  try {
    resolvedCwd = realpathSync(resolvedDir)
  } catch {
    resolvedCwd = resolvedDir
  }

  for (const step of pythonSteps) {
    console.log(` [${task}] ${step.label}...`)
    const result = spawnSync(config.pythonPath, [step.script, ...step.args], {
      cwd: resolvedCwd,
      encoding: 'utf-8',
      stdio: 'pipe',
      timeout: 600_000, // 10 minute timeout per step
    })
    if (result.error || result.status !== 0) {
      // Keep the END of stderr: a Python traceback puts the actual exception
      // on its last lines, so truncating from the front would hide it.
      const detail = result.stderr?.trim().slice(-500) || result.error?.message || 'Unknown error'
      return {
        task,
        success: false,
        error: `Python step "${step.label}" failed: ${detail}`,
        trainingDataCount: dataCount,
        duration: Date.now() - startTime,
      }
    }
  }

  // Step 3: Read evaluation results
  const benchmarkPath = join(resolvedDir, 'benchmarks', `${task}.json`)
  let newAccuracy: number | undefined
  try {
    if (existsSync(benchmarkPath)) {
      const benchData: unknown = JSON.parse(readFileSync(benchmarkPath, 'utf-8'))
      if (typeof benchData !== 'object' || benchData === null) {
        throw new Error('benchmark file does not contain a JSON object')
      }
      const fields = benchData as { accuracy?: unknown; overall_accuracy?: unknown }
      const reported = fields.accuracy ?? fields.overall_accuracy
      // Only trust a real finite number; anything else would poison the
      // comparison below and the accuracy stored in the manifest.
      if (typeof reported === 'number' && Number.isFinite(reported)) {
        newAccuracy = reported
      } else if (reported != null) {
        throw new Error('benchmark accuracy is not a finite number')
      }
    }
  } catch {
    console.log(` [${task}] Warning: Could not read benchmark results`)
  }

  // Step 4: Compare with existing model accuracy
  const manifest = loadManifest()
  const oldAccuracy = manifest?.models[task]?.accuracy

  if (newAccuracy != null && oldAccuracy != null && newAccuracy < oldAccuracy && !config.force) {
    console.log(` [${task}] New accuracy ${(newAccuracy * 100).toFixed(1)}% < old ${(oldAccuracy * 100).toFixed(1)}% — skipping model replacement`)
    // Still record the retrain attempt (the old accuracy remains current).
    recordRetrainState(oldAccuracy)

    return {
      task,
      success: false,
      error: `New accuracy (${(newAccuracy * 100).toFixed(1)}%) lower than current (${(oldAccuracy * 100).toFixed(1)}%). Use --force to override.`,
      oldAccuracy,
      newAccuracy,
      trainingDataCount: dataCount,
      duration: Date.now() - startTime,
    }
  }

  // Step 5: Copy new ONNX model into the home models directory
  const modelsDir = getHomePaths().models
  mkdirSync(modelsDir, { recursive: true })

  const onnxSource = join(resolvedDir, 'models', `${task}.onnx`)
  if (existsSync(onnxSource)) {
    const onnxDest = join(modelsDir, `${task}.onnx`)
    writeFileSync(onnxDest, readFileSync(onnxSource))
    console.log(` [${task}] Model copied to ${onnxDest}`)

    // Update manifest, carrying over labels/maxSeqLen from the previous entry.
    const currentManifest = loadManifest() ?? { models: {} }
    const existing = currentManifest.models[task]
    currentManifest.models[task] = {
      version: bumpVersion(existing?.version),
      file: `${task}.onnx`,
      accuracy: newAccuracy,
      labels: existing?.labels,
      maxSeqLen: existing?.maxSeqLen,
    }
    saveManifest(currentManifest)
    console.log(` [${task}] Manifest updated`)
  } else {
    // NOTE(review): the run is still reported as successful below even though
    // no model was installed — confirm this best-effort behavior is intended.
    console.log(` [${task}] Warning: ONNX file not found at ${onnxSource}`)
  }

  // Step 6: Update retrain state
  recordRetrainState(newAccuracy ?? oldAccuracy ?? 0)

  console.log(` [${task}] Retrain complete in ${((Date.now() - startTime) / 1000).toFixed(1)}s`)

  return {
    task,
    success: true,
    oldAccuracy,
    newAccuracy,
    trainingDataCount: dataCount,
    duration: Date.now() - startTime,
  }
}
362
+
363
/**
 * Retrain every known task that currently needs it.
 *
 * Tasks are visited one after another in a fixed order. A task whose
 * `shouldRetrain` check says it is not needed is skipped, unless
 * `config.force` is set, in which case it is retrained anyway.
 *
 * @param config - Retrain configuration shared by all tasks.
 * @returns Results keyed by task name; skipped tasks have no entry.
 */
export async function retrainAll(
  config: RetrainConfig
): Promise<Map<string, RetrainResult>> {
  const taskOrder: ModelTask[] = ['intent', 'entity', 'query', 'knowledge', 'compress', 'pattern']
  const outcomes = new Map<string, RetrainResult>()

  for (const task of taskOrder) {
    const { needed, reason } = shouldRetrain(task, config)

    if (!needed) {
      if (!config.force) {
        console.log(` [${task}] Skipping ${reason}`)
        continue
      }
      // Not needed, but the caller asked to retrain regardless.
      console.log(` [${task}] Forcing retrain (${reason})`)
    }

    outcomes.set(task, await retrainTask(task, config))
  }

  return outcomes
}
390
+
391
+ // ── Internal Helpers ─────────────────────────────────────────────────
392
+
393
/**
 * Return the next patch version for a dotted version string.
 *
 * A missing or empty version starts at `1.0.0`. Each component is read from
 * its first run of digits (so `v2` counts as 2 and `0-beta` as 0); a
 * component without digits counts as 0. Versions with fewer than three
 * components are padded with zeros before the patch component is bumped,
 * so the result never contains empty or `NaN` components.
 *
 * @param current - Existing version such as `1.2.3`, if any.
 * @returns The version with its third component incremented by one.
 */
function bumpVersion(current?: string): string {
  if (!current) return '1.0.0'
  const parts = current
    .split('.')
    .map((part) => Number(/\d+/.exec(part)?.[0] ?? 0))
  // Pad to major.minor.patch; assigning index 2 on a shorter array would
  // leave a hole that `join` renders as an empty component ("1..1").
  while (parts.length < 3) parts.push(0)
  // Bump patch version
  parts[2] = (parts[2] ?? 0) + 1
  return parts.join('.')
}