principles-disciple 1.8.1 → 1.8.3

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (508)
  1. package/ADVANCED_CONFIG_ZH.md +97 -0
  2. package/AGENT_INSTALL.md +173 -0
  3. package/AGENT_INSTALL_EN.md +173 -0
  4. package/INSTALL.md +256 -0
  5. package/SKILL.md +63 -0
  6. package/docs/COMMAND_REFERENCE.md +76 -0
  7. package/docs/COMMAND_REFERENCE_EN.md +79 -0
  8. package/esbuild.config.js +75 -0
  9. package/openclaw.plugin.json +4 -4
  10. package/package.json +11 -13
  11. package/scripts/build-web.mjs +46 -0
  12. package/scripts/install-dependencies.cjs +47 -0
  13. package/scripts/sync-plugin.mjs +802 -0
  14. package/scripts/verify-build.mjs +109 -0
  15. package/src/agents/nocturnal-dreamer.md +152 -0
  16. package/src/agents/nocturnal-philosopher.md +138 -0
  17. package/src/agents/nocturnal-reflector.md +126 -0
  18. package/src/agents/nocturnal-scribe.md +164 -0
  19. package/src/commands/capabilities.ts +85 -0
  20. package/{dist/commands/context.js → src/commands/context.ts} +78 -38
  21. package/src/commands/evolution-status.ts +146 -0
  22. package/src/commands/export.ts +111 -0
  23. package/src/commands/focus.ts +533 -0
  24. package/src/commands/nocturnal-review.ts +311 -0
  25. package/src/commands/nocturnal-rollout.ts +763 -0
  26. package/src/commands/nocturnal-train.ts +1002 -0
  27. package/{dist/commands/pain.js → src/commands/pain.ts} +68 -49
  28. package/src/commands/principle-rollback.ts +27 -0
  29. package/{dist/commands/rollback.js → src/commands/rollback.ts} +44 -12
  30. package/src/commands/samples.ts +60 -0
  31. package/src/commands/strategy.ts +38 -0
  32. package/{dist/commands/thinking-os.js → src/commands/thinking-os.ts} +59 -36
  33. package/src/commands/workflow-debug.ts +128 -0
  34. package/{dist/config/defaults/runtime.js → src/config/defaults/runtime.ts} +12 -5
  35. package/src/config/errors.ts +163 -0
  36. package/{dist/config/index.d.ts → src/config/index.ts} +2 -1
  37. package/src/constants/diagnostician.ts +66 -0
  38. package/src/constants/tools.ts +62 -0
  39. package/src/core/adaptive-thresholds.ts +476 -0
  40. package/{dist/core/config-service.js → src/core/config-service.ts} +7 -4
  41. package/{dist/core/config.js → src/core/config.ts} +158 -46
  42. package/src/core/control-ui-db.ts +435 -0
  43. package/{dist/core/detection-funnel.js → src/core/detection-funnel.ts} +36 -21
  44. package/{dist/core/detection-service.js → src/core/detection-service.ts} +7 -4
  45. package/{dist/core/dictionary-service.js → src/core/dictionary-service.ts} +7 -4
  46. package/{dist/core/dictionary.js → src/core/dictionary.ts} +57 -34
  47. package/src/core/empathy-keyword-matcher.ts +327 -0
  48. package/src/core/empathy-types.ts +218 -0
  49. package/src/core/event-log.ts +544 -0
  50. package/src/core/evolution-engine.ts +612 -0
  51. package/src/core/evolution-logger.ts +353 -0
  52. package/src/core/evolution-migration.ts +77 -0
  53. package/src/core/evolution-reducer.ts +731 -0
  54. package/src/core/evolution-types.ts +456 -0
  55. package/src/core/external-training-contract.ts +527 -0
  56. package/src/core/focus-history.ts +1458 -0
  57. package/src/core/hygiene/tracker.ts +117 -0
  58. package/{dist/core/init.js → src/core/init.ts} +39 -26
  59. package/src/core/local-worker-routing.ts +617 -0
  60. package/{dist/core/migration.js → src/core/migration.ts} +18 -11
  61. package/src/core/model-deployment-registry.ts +722 -0
  62. package/src/core/model-training-registry.ts +813 -0
  63. package/src/core/nocturnal-arbiter.ts +706 -0
  64. package/src/core/nocturnal-candidate-scoring.ts +392 -0
  65. package/src/core/nocturnal-compliance.ts +1075 -0
  66. package/src/core/nocturnal-dataset.ts +668 -0
  67. package/src/core/nocturnal-executability.ts +428 -0
  68. package/src/core/nocturnal-export.ts +390 -0
  69. package/{dist/core/nocturnal-paths.js → src/core/nocturnal-paths.ts} +49 -23
  70. package/src/core/nocturnal-trajectory-extractor.ts +484 -0
  71. package/src/core/nocturnal-trinity.ts +1384 -0
  72. package/src/core/pain.ts +122 -0
  73. package/{dist/core/path-resolver.js → src/core/path-resolver.ts} +157 -36
  74. package/{dist/core/paths.js → src/core/paths.ts} +13 -4
  75. package/src/core/principle-training-state.ts +450 -0
  76. package/src/core/profile.ts +226 -0
  77. package/src/core/promotion-gate.ts +822 -0
  78. package/{dist/core/risk-calculator.js → src/core/risk-calculator.ts} +42 -16
  79. package/{dist/core/session-tracker.js → src/core/session-tracker.ts} +175 -62
  80. package/src/core/shadow-observation-registry.ts +534 -0
  81. package/{dist/core/system-logger.js → src/core/system-logger.ts} +9 -5
  82. package/src/core/thinking-models.ts +217 -0
  83. package/src/core/training-program.ts +630 -0
  84. package/src/core/trajectory-types.ts +243 -0
  85. package/src/core/trajectory.ts +1673 -0
  86. package/{dist/core/workspace-context.js → src/core/workspace-context.ts} +57 -32
  87. package/src/hooks/bash-risk.ts +171 -0
  88. package/src/hooks/edit-verification.ts +295 -0
  89. package/src/hooks/gate-block-helper.ts +160 -0
  90. package/src/hooks/gate.ts +210 -0
  91. package/src/hooks/gfi-gate.ts +177 -0
  92. package/src/hooks/lifecycle.ts +326 -0
  93. package/{dist/hooks/llm.js → src/hooks/llm.ts} +160 -80
  94. package/src/hooks/message-sanitize.ts +45 -0
  95. package/src/hooks/pain.ts +384 -0
  96. package/src/hooks/progressive-trust-gate.ts +174 -0
  97. package/src/hooks/prompt.ts +920 -0
  98. package/src/hooks/subagent.ts +207 -0
  99. package/src/hooks/thinking-checkpoint.ts +73 -0
  100. package/src/hooks/trajectory-collector.ts +290 -0
  101. package/src/http/principles-console-route.ts +716 -0
  102. package/src/i18n/commands.ts +117 -0
  103. package/src/index.ts +694 -0
  104. package/src/service/central-database.ts +831 -0
  105. package/src/service/control-ui-query-service.ts +888 -0
  106. package/src/service/evolution-query-service.ts +405 -0
  107. package/src/service/evolution-worker.ts +1646 -0
  108. package/src/service/health-query-service.ts +836 -0
  109. package/{dist/service/nocturnal-runtime.js → src/service/nocturnal-runtime.ts} +235 -79
  110. package/src/service/nocturnal-service.ts +1015 -0
  111. package/src/service/nocturnal-target-selector.ts +532 -0
  112. package/src/service/phase3-input-filter.ts +237 -0
  113. package/src/service/runtime-summary-service.ts +757 -0
  114. package/src/service/subagent-workflow/deep-reflect-workflow-manager.ts +513 -0
  115. package/{dist/service/subagent-workflow/empathy-observer-workflow-manager.js → src/service/subagent-workflow/empathy-observer-workflow-manager.ts} +240 -117
  116. package/src/service/subagent-workflow/index.ts +51 -0
  117. package/src/service/subagent-workflow/nocturnal-workflow-manager.ts +856 -0
  118. package/src/service/subagent-workflow/runtime-direct-driver.ts +166 -0
  119. package/{dist/service/subagent-workflow/types.d.ts → src/service/subagent-workflow/types.ts} +137 -18
  120. package/src/service/subagent-workflow/workflow-store.ts +328 -0
  121. package/src/service/trajectory-service.ts +15 -0
  122. package/{dist/tools/critique-prompt.js → src/tools/critique-prompt.ts} +25 -8
  123. package/src/tools/deep-reflect.ts +349 -0
  124. package/{dist/tools/model-index.js → src/tools/model-index.ts} +33 -17
  125. package/src/types/event-types.ts +453 -0
  126. package/src/types/hygiene-types.ts +31 -0
  127. package/src/types/principle-tree-schema.ts +244 -0
  128. package/src/types/runtime-summary.ts +49 -0
  129. package/src/types.ts +74 -0
  130. package/src/utils/file-lock.ts +391 -0
  131. package/{dist/utils/glob-match.js → src/utils/glob-match.ts} +21 -20
  132. package/{dist/utils/hashing.js → src/utils/hashing.ts} +6 -4
  133. package/src/utils/io.ts +110 -0
  134. package/{dist/utils/nlp.js → src/utils/nlp.ts} +19 -12
  135. package/{dist/utils/plugin-logger.js → src/utils/plugin-logger.ts} +33 -8
  136. package/src/utils/subagent-probe.ts +94 -0
  137. package/templates/langs/en/skills/ai-sprint-orchestration/EXAMPLES.md +63 -0
  138. package/templates/langs/en/skills/ai-sprint-orchestration/REFERENCE.md +136 -0
  139. package/templates/langs/en/skills/ai-sprint-orchestration/SKILL.md +67 -0
  140. package/templates/langs/en/skills/ai-sprint-orchestration/references/agent-registry.json +214 -0
  141. package/templates/langs/en/skills/ai-sprint-orchestration/references/specs/bugfix-complex-template.json +107 -0
  142. package/templates/langs/en/skills/ai-sprint-orchestration/references/specs/feature-complex-template.json +107 -0
  143. package/templates/langs/en/skills/ai-sprint-orchestration/references/specs/workflow-validation-minimal-verify.json +105 -0
  144. package/templates/langs/en/skills/ai-sprint-orchestration/references/specs/workflow-validation-minimal.json +108 -0
  145. package/templates/langs/en/skills/ai-sprint-orchestration/references/workflow-v1-acceptance-checklist.md +58 -0
  146. package/templates/langs/en/skills/ai-sprint-orchestration/references/workflow-v1.4-work-unit-handoff.md +190 -0
  147. package/templates/langs/en/skills/ai-sprint-orchestration/runtime/.gitignore +2 -0
  148. package/templates/langs/en/skills/ai-sprint-orchestration/scripts/lib/archive.mjs +310 -0
  149. package/templates/langs/en/skills/ai-sprint-orchestration/scripts/lib/contract-enforcement.mjs +683 -0
  150. package/templates/langs/en/skills/ai-sprint-orchestration/scripts/lib/decision.mjs +604 -0
  151. package/templates/langs/en/skills/ai-sprint-orchestration/scripts/lib/state-store.mjs +32 -0
  152. package/templates/langs/en/skills/ai-sprint-orchestration/scripts/lib/task-specs.mjs +707 -0
  153. package/templates/langs/en/skills/ai-sprint-orchestration/scripts/run.mjs +3419 -0
  154. package/templates/langs/zh/skills/ai-sprint-orchestration/EXAMPLES.md +63 -0
  155. package/templates/langs/zh/skills/ai-sprint-orchestration/REFERENCE.md +136 -0
  156. package/templates/langs/zh/skills/ai-sprint-orchestration/SKILL.md +67 -0
  157. package/templates/langs/zh/skills/ai-sprint-orchestration/references/agent-registry.json +214 -0
  158. package/templates/langs/zh/skills/ai-sprint-orchestration/references/specs/bugfix-complex-template.json +107 -0
  159. package/templates/langs/zh/skills/ai-sprint-orchestration/references/specs/feature-complex-template.json +107 -0
  160. package/templates/langs/zh/skills/ai-sprint-orchestration/references/specs/workflow-validation-minimal-verify.json +105 -0
  161. package/templates/langs/zh/skills/ai-sprint-orchestration/references/specs/workflow-validation-minimal.json +108 -0
  162. package/templates/langs/zh/skills/ai-sprint-orchestration/references/workflow-v1-acceptance-checklist.md +58 -0
  163. package/templates/langs/zh/skills/ai-sprint-orchestration/references/workflow-v1.4-work-unit-handoff.md +190 -0
  164. package/templates/langs/zh/skills/ai-sprint-orchestration/runtime/.gitignore +2 -0
  165. package/templates/langs/zh/skills/ai-sprint-orchestration/scripts/lib/archive.mjs +310 -0
  166. package/templates/langs/zh/skills/ai-sprint-orchestration/scripts/lib/contract-enforcement.mjs +683 -0
  167. package/templates/langs/zh/skills/ai-sprint-orchestration/scripts/lib/decision.mjs +604 -0
  168. package/templates/langs/zh/skills/ai-sprint-orchestration/scripts/lib/state-store.mjs +32 -0
  169. package/templates/langs/zh/skills/ai-sprint-orchestration/scripts/lib/task-specs.mjs +707 -0
  170. package/templates/langs/zh/skills/ai-sprint-orchestration/scripts/run.mjs +3419 -0
  171. package/templates/langs/zh/skills/ai-sprint-orchestration/test/archive.test.mjs +230 -0
  172. package/templates/langs/zh/skills/ai-sprint-orchestration/test/contract-enforcement.test.mjs +672 -0
  173. package/templates/langs/zh/skills/ai-sprint-orchestration/test/decision.test.mjs +1321 -0
  174. package/templates/langs/zh/skills/ai-sprint-orchestration/test/run.test.mjs +1419 -0
  175. package/templates/langs/zh/skills/pd-diagnostician/SKILL.md +70 -1
  176. package/templates/pain_settings.json +2 -1
  177. package/tests/README.md +120 -0
  178. package/tests/build-artifacts.test.ts +111 -0
  179. package/tests/commands/evolution-status.test.ts +222 -0
  180. package/tests/commands/evolver.test.ts +22 -0
  181. package/tests/commands/export.test.ts +78 -0
  182. package/tests/commands/nocturnal-review.test.ts +448 -0
  183. package/tests/commands/nocturnal-train.test.ts +97 -0
  184. package/tests/commands/pain.test.ts +108 -0
  185. package/tests/commands/samples.test.ts +65 -0
  186. package/tests/commands/strategy.test.ts +34 -0
  187. package/tests/commands/thinking-os.test.ts +88 -0
  188. package/tests/core/adaptive-thresholds.test.ts +261 -0
  189. package/tests/core/config-service.test.ts +89 -0
  190. package/tests/core/config.test.ts +90 -0
  191. package/tests/core/control-ui-db.test.ts +75 -0
  192. package/tests/core/core-template-guidance.test.ts +21 -0
  193. package/tests/core/detection-funnel.test.ts +63 -0
  194. package/tests/core/detection-service.test.ts +50 -0
  195. package/tests/core/dictionary-service.test.ts +116 -0
  196. package/tests/core/dictionary.test.ts +168 -0
  197. package/tests/core/empathy-keyword-matcher.test.ts +209 -0
  198. package/tests/core/event-log.test.ts +181 -0
  199. package/tests/core/evolution-e2e.test.ts +58 -0
  200. package/tests/core/evolution-engine-gate-integration.test.ts +543 -0
  201. package/tests/core/evolution-engine.test.ts +562 -0
  202. package/tests/core/evolution-logger.test.ts +148 -0
  203. package/tests/core/evolution-migration.test.ts +50 -0
  204. package/tests/core/evolution-paths.test.ts +21 -0
  205. package/tests/core/evolution-reducer.detector-metadata.test.ts +602 -0
  206. package/tests/core/evolution-reducer.test.ts +180 -0
  207. package/tests/core/evolution-types-loop.test.ts +48 -0
  208. package/tests/core/evolution-user-stories.e2e.test.ts +249 -0
  209. package/tests/core/external-training-contract.test.ts +463 -0
  210. package/tests/core/focus-history.test.ts +682 -0
  211. package/tests/core/init-flatten.test.ts +69 -0
  212. package/tests/core/init-refactor.test.ts +87 -0
  213. package/tests/core/init-v1.3.test.ts +46 -0
  214. package/tests/core/init.test.ts +190 -0
  215. package/tests/core/local-worker-routing.test.ts +757 -0
  216. package/tests/core/migration.test.ts +84 -0
  217. package/tests/core/model-deployment-registry.test.ts +845 -0
  218. package/tests/core/model-training-registry.test.ts +889 -0
  219. package/tests/core/nocturnal-arbiter.test.ts +494 -0
  220. package/tests/core/nocturnal-candidate-scoring.test.ts +400 -0
  221. package/tests/core/nocturnal-compliance.test.ts +646 -0
  222. package/tests/core/nocturnal-dataset.test.ts +892 -0
  223. package/tests/core/nocturnal-executability.test.ts +357 -0
  224. package/tests/core/nocturnal-export.test.ts +462 -0
  225. package/tests/core/nocturnal-reviewed-subset-comparison.test.ts +428 -0
  226. package/tests/core/nocturnal-trajectory-extractor.test.ts +634 -0
  227. package/tests/core/nocturnal-trinity.test.ts +953 -0
  228. package/tests/core/pain.test.ts +33 -0
  229. package/tests/core/path-resolver.test.ts +57 -0
  230. package/tests/core/paths-refactor.test.ts +42 -0
  231. package/tests/core/phase7-rollout-integration.test.ts +477 -0
  232. package/tests/core/principle-training-state.test.ts +712 -0
  233. package/tests/core/profile.test.ts +56 -0
  234. package/tests/core/promotion-gate.test.ts +556 -0
  235. package/tests/core/risk-calculator.test.ts +168 -0
  236. package/tests/core/session-tracker.test.ts +191 -0
  237. package/tests/core/training-program.test.ts +472 -0
  238. package/tests/core/trajectory.test.ts +265 -0
  239. package/tests/core/workspace-context-factory.test.ts +18 -0
  240. package/tests/core/workspace-context.test.ts +134 -0
  241. package/tests/fixtures/nocturnal-reviewed-subset.json +183 -0
  242. package/tests/fixtures/production-compatibility.test.ts +147 -0
  243. package/tests/fixtures/production-mock-generator.ts +282 -0
  244. package/tests/hooks/bash-risk-integration.test.ts +137 -0
  245. package/tests/hooks/bash-risk.test.ts +81 -0
  246. package/tests/hooks/edit-verification.test.ts +678 -0
  247. package/tests/hooks/gate-edit-verification-p1.test.ts +632 -0
  248. package/tests/hooks/gate-edit-verification.test.ts +435 -0
  249. package/tests/hooks/gate-pipeline-integration.test.ts +404 -0
  250. package/tests/hooks/gate.test.ts +271 -0
  251. package/tests/hooks/gfi-gate-unit.test.ts +422 -0
  252. package/tests/hooks/gfi-gate.test.ts +669 -0
  253. package/tests/hooks/lifecycle.test.ts +248 -0
  254. package/tests/hooks/llm.test.ts +308 -0
  255. package/tests/hooks/message-sanitize.test.ts +36 -0
  256. package/tests/hooks/pain.test.ts +141 -0
  257. package/tests/hooks/progressive-trust-gate.test.ts +277 -0
  258. package/tests/hooks/prompt.test.ts +1411 -0
  259. package/tests/hooks/subagent.test.ts +467 -0
  260. package/tests/hooks/thinking-gate.test.ts +313 -0
  261. package/tests/http/principles-console-route.test.ts +140 -0
  262. package/tests/hygiene-tracker.test.ts +77 -0
  263. package/tests/index.integration.test.ts +179 -0
  264. package/tests/index.shadow-routing.integration.test.ts +140 -0
  265. package/tests/index.test.ts +9 -0
  266. package/tests/integration/empathy-workflow-integration.test.ts +627 -0
  267. package/tests/service/control-ui-query-service.test.ts +121 -0
  268. package/tests/service/empathy-observer-workflow-manager.test.ts +176 -0
  269. package/tests/service/evolution-worker.test.ts +585 -0
  270. package/tests/service/nocturnal-runtime.test.ts +470 -0
  271. package/tests/service/nocturnal-service.test.ts +577 -0
  272. package/tests/service/nocturnal-target-selector.test.ts +615 -0
  273. package/tests/service/nocturnal-workflow-manager.test.ts +439 -0
  274. package/tests/service/phase3-input-filter.test.ts +289 -0
  275. package/tests/service/runtime-summary-service.test.ts +919 -0
  276. package/tests/task-compliance.test.ts +166 -0
  277. package/tests/test-utils.ts +48 -0
  278. package/tests/tools/critique-prompt.test.ts +260 -0
  279. package/tests/tools/deep-reflect.test.ts +232 -0
  280. package/tests/tools/model-index.test.ts +246 -0
  281. package/tests/ui/app.test.tsx +114 -0
  282. package/tests/utils/file-lock.test.ts +407 -0
  283. package/tests/utils/hashing.test.ts +32 -0
  284. package/tests/utils/io.test.ts +39 -0
  285. package/tests/utils/nlp.test.ts +53 -0
  286. package/tests/utils/plugin-logger.test.ts +156 -0
  287. package/tsconfig.json +16 -0
  288. package/tsconfig.tsbuildinfo +1 -0
  289. package/ui/src/App.tsx +45 -0
  290. package/ui/src/api.ts +216 -0
  291. package/ui/src/charts.tsx +586 -0
  292. package/ui/src/components/ErrorState.tsx +6 -0
  293. package/ui/src/components/Loading.tsx +13 -0
  294. package/ui/src/components/ProtectedRoute.tsx +12 -0
  295. package/ui/src/components/Shell.tsx +91 -0
  296. package/ui/src/components/WorkspaceConfig.tsx +146 -0
  297. package/ui/src/components/index.ts +5 -0
  298. package/ui/src/context/auth.tsx +80 -0
  299. package/ui/src/context/theme.tsx +66 -0
  300. package/ui/src/hooks/useAutoRefresh.ts +39 -0
  301. package/ui/src/i18n/ui.ts +363 -0
  302. package/ui/src/main.tsx +16 -0
  303. package/ui/src/pages/EvolutionPage.tsx +352 -0
  304. package/ui/src/pages/FeedbackPage.tsx +140 -0
  305. package/ui/src/pages/GateMonitorPage.tsx +136 -0
  306. package/ui/src/pages/LoginPage.tsx +88 -0
  307. package/ui/src/pages/OverviewPage.tsx +238 -0
  308. package/ui/src/pages/SamplesPage.tsx +174 -0
  309. package/ui/src/pages/ThinkingModelsPage.tsx +127 -0
  310. package/ui/src/styles.css +1661 -0
  311. package/ui/src/types.ts +368 -0
  312. package/ui/src/utils/format.ts +15 -0
  313. package/vitest.config.ts +23 -0
  314. package/dist/commands/capabilities.d.ts +0 -3
  315. package/dist/commands/capabilities.js +0 -73
  316. package/dist/commands/context.d.ts +0 -5
  317. package/dist/commands/evolution-status.d.ts +0 -4
  318. package/dist/commands/evolution-status.js +0 -117
  319. package/dist/commands/evolver.d.ts +0 -9
  320. package/dist/commands/evolver.js +0 -26
  321. package/dist/commands/export.d.ts +0 -2
  322. package/dist/commands/export.js +0 -98
  323. package/dist/commands/focus.d.ts +0 -14
  324. package/dist/commands/focus.js +0 -457
  325. package/dist/commands/nocturnal-review.d.ts +0 -24
  326. package/dist/commands/nocturnal-review.js +0 -265
  327. package/dist/commands/nocturnal-rollout.d.ts +0 -27
  328. package/dist/commands/nocturnal-rollout.js +0 -671
  329. package/dist/commands/nocturnal-train.d.ts +0 -25
  330. package/dist/commands/nocturnal-train.js +0 -919
  331. package/dist/commands/pain.d.ts +0 -5
  332. package/dist/commands/principle-rollback.d.ts +0 -4
  333. package/dist/commands/principle-rollback.js +0 -22
  334. package/dist/commands/rollback.d.ts +0 -19
  335. package/dist/commands/samples.d.ts +0 -2
  336. package/dist/commands/samples.js +0 -55
  337. package/dist/commands/strategy.d.ts +0 -3
  338. package/dist/commands/strategy.js +0 -29
  339. package/dist/commands/thinking-os.d.ts +0 -2
  340. package/dist/config/defaults/runtime.d.ts +0 -40
  341. package/dist/config/errors.d.ts +0 -84
  342. package/dist/config/errors.js +0 -94
  343. package/dist/config/index.js +0 -7
  344. package/dist/constants/diagnostician.d.ts +0 -12
  345. package/dist/constants/diagnostician.js +0 -56
  346. package/dist/constants/tools.d.ts +0 -17
  347. package/dist/constants/tools.js +0 -54
  348. package/dist/core/adaptive-thresholds.d.ts +0 -186
  349. package/dist/core/adaptive-thresholds.js +0 -300
  350. package/dist/core/config-service.d.ts +0 -15
  351. package/dist/core/config.d.ts +0 -129
  352. package/dist/core/control-ui-db.d.ts +0 -95
  353. package/dist/core/control-ui-db.js +0 -292
  354. package/dist/core/detection-funnel.d.ts +0 -33
  355. package/dist/core/detection-service.d.ts +0 -15
  356. package/dist/core/dictionary-service.d.ts +0 -15
  357. package/dist/core/dictionary.d.ts +0 -38
  358. package/dist/core/event-log.d.ts +0 -82
  359. package/dist/core/event-log.js +0 -463
  360. package/dist/core/evolution-engine.d.ts +0 -118
  361. package/dist/core/evolution-engine.js +0 -464
  362. package/dist/core/evolution-logger.d.ts +0 -137
  363. package/dist/core/evolution-logger.js +0 -256
  364. package/dist/core/evolution-migration.d.ts +0 -5
  365. package/dist/core/evolution-migration.js +0 -65
  366. package/dist/core/evolution-reducer.d.ts +0 -98
  367. package/dist/core/evolution-reducer.js +0 -465
  368. package/dist/core/evolution-types.d.ts +0 -287
  369. package/dist/core/evolution-types.js +0 -78
  370. package/dist/core/external-training-contract.d.ts +0 -276
  371. package/dist/core/external-training-contract.js +0 -269
  372. package/dist/core/focus-history.d.ts +0 -210
  373. package/dist/core/focus-history.js +0 -1185
  374. package/dist/core/hygiene/tracker.d.ts +0 -22
  375. package/dist/core/hygiene/tracker.js +0 -106
  376. package/dist/core/init.d.ts +0 -12
  377. package/dist/core/local-worker-routing.d.ts +0 -175
  378. package/dist/core/local-worker-routing.js +0 -525
  379. package/dist/core/migration.d.ts +0 -6
  380. package/dist/core/model-deployment-registry.d.ts +0 -218
  381. package/dist/core/model-deployment-registry.js +0 -503
  382. package/dist/core/model-training-registry.d.ts +0 -295
  383. package/dist/core/model-training-registry.js +0 -475
  384. package/dist/core/nocturnal-arbiter.d.ts +0 -159
  385. package/dist/core/nocturnal-arbiter.js +0 -534
  386. package/dist/core/nocturnal-candidate-scoring.d.ts +0 -137
  387. package/dist/core/nocturnal-candidate-scoring.js +0 -266
  388. package/dist/core/nocturnal-compliance.d.ts +0 -175
  389. package/dist/core/nocturnal-compliance.js +0 -824
  390. package/dist/core/nocturnal-dataset.d.ts +0 -224
  391. package/dist/core/nocturnal-dataset.js +0 -443
  392. package/dist/core/nocturnal-executability.d.ts +0 -85
  393. package/dist/core/nocturnal-executability.js +0 -331
  394. package/dist/core/nocturnal-export.d.ts +0 -124
  395. package/dist/core/nocturnal-export.js +0 -275
  396. package/dist/core/nocturnal-paths.d.ts +0 -124
  397. package/dist/core/nocturnal-trajectory-extractor.d.ts +0 -242
  398. package/dist/core/nocturnal-trajectory-extractor.js +0 -307
  399. package/dist/core/nocturnal-trinity.d.ts +0 -311
  400. package/dist/core/nocturnal-trinity.js +0 -880
  401. package/dist/core/pain.d.ts +0 -4
  402. package/dist/core/pain.js +0 -70
  403. package/dist/core/path-resolver.d.ts +0 -46
  404. package/dist/core/paths.d.ts +0 -65
  405. package/dist/core/principle-training-state.d.ts +0 -121
  406. package/dist/core/principle-training-state.js +0 -321
  407. package/dist/core/profile.d.ts +0 -62
  408. package/dist/core/profile.js +0 -210
  409. package/dist/core/promotion-gate.d.ts +0 -238
  410. package/dist/core/promotion-gate.js +0 -529
  411. package/dist/core/risk-calculator.d.ts +0 -22
  412. package/dist/core/session-tracker.d.ts +0 -101
  413. package/dist/core/shadow-observation-registry.d.ts +0 -217
  414. package/dist/core/shadow-observation-registry.js +0 -308
  415. package/dist/core/system-logger.d.ts +0 -8
  416. package/dist/core/thinking-models.d.ts +0 -38
  417. package/dist/core/thinking-models.js +0 -170
  418. package/dist/core/training-program.d.ts +0 -233
  419. package/dist/core/training-program.js +0 -433
  420. package/dist/core/trajectory.d.ts +0 -411
  421. package/dist/core/trajectory.js +0 -1307
  422. package/dist/core/workspace-context.d.ts +0 -71
  423. package/dist/hooks/bash-risk.d.ts +0 -57
  424. package/dist/hooks/bash-risk.js +0 -137
  425. package/dist/hooks/edit-verification.d.ts +0 -62
  426. package/dist/hooks/edit-verification.js +0 -256
  427. package/dist/hooks/gate-block-helper.d.ts +0 -44
  428. package/dist/hooks/gate-block-helper.js +0 -119
  429. package/dist/hooks/gate.d.ts +0 -24
  430. package/dist/hooks/gate.js +0 -173
  431. package/dist/hooks/gfi-gate.d.ts +0 -40
  432. package/dist/hooks/gfi-gate.js +0 -113
  433. package/dist/hooks/lifecycle.d.ts +0 -5
  434. package/dist/hooks/lifecycle.js +0 -284
  435. package/dist/hooks/llm.d.ts +0 -13
  436. package/dist/hooks/message-sanitize.d.ts +0 -3
  437. package/dist/hooks/message-sanitize.js +0 -37
  438. package/dist/hooks/pain.d.ts +0 -5
  439. package/dist/hooks/pain.js +0 -301
  440. package/dist/hooks/progressive-trust-gate.d.ts +0 -52
  441. package/dist/hooks/progressive-trust-gate.js +0 -134
  442. package/dist/hooks/prompt.d.ts +0 -49
  443. package/dist/hooks/prompt.js +0 -905
  444. package/dist/hooks/subagent.d.ts +0 -10
  445. package/dist/hooks/subagent.js +0 -387
  446. package/dist/hooks/thinking-checkpoint.d.ts +0 -37
  447. package/dist/hooks/thinking-checkpoint.js +0 -51
  448. package/dist/hooks/trajectory-collector.d.ts +0 -32
  449. package/dist/hooks/trajectory-collector.js +0 -256
  450. package/dist/http/principles-console-route.d.ts +0 -9
  451. package/dist/http/principles-console-route.js +0 -681
  452. package/dist/i18n/commands.d.ts +0 -26
  453. package/dist/i18n/commands.js +0 -116
  454. package/dist/index.d.ts +0 -7
  455. package/dist/index.js +0 -581
  456. package/dist/service/central-database.d.ts +0 -104
  457. package/dist/service/central-database.js +0 -649
  458. package/dist/service/control-ui-query-service.d.ts +0 -221
  459. package/dist/service/control-ui-query-service.js +0 -543
  460. package/dist/service/empathy-observer-manager.d.ts +0 -88
  461. package/dist/service/empathy-observer-manager.js +0 -414
  462. package/dist/service/evolution-query-service.d.ts +0 -155
  463. package/dist/service/evolution-query-service.js +0 -258
  464. package/dist/service/evolution-worker.d.ts +0 -101
  465. package/dist/service/evolution-worker.js +0 -975
  466. package/dist/service/health-query-service.d.ts +0 -170
  467. package/dist/service/health-query-service.js +0 -662
  468. package/dist/service/nocturnal-runtime.d.ts +0 -183
  469. package/dist/service/nocturnal-service.d.ts +0 -163
  470. package/dist/service/nocturnal-service.js +0 -787
  471. package/dist/service/nocturnal-target-selector.d.ts +0 -145
  472. package/dist/service/nocturnal-target-selector.js +0 -315
  473. package/dist/service/phase3-input-filter.d.ts +0 -73
  474. package/dist/service/phase3-input-filter.js +0 -172
  475. package/dist/service/runtime-summary-service.d.ts +0 -122
  476. package/dist/service/runtime-summary-service.js +0 -485
  477. package/dist/service/subagent-workflow/empathy-observer-workflow-manager.d.ts +0 -48
  478. package/dist/service/subagent-workflow/index.d.ts +0 -4
  479. package/dist/service/subagent-workflow/index.js +0 -3
  480. package/dist/service/subagent-workflow/runtime-direct-driver.d.ts +0 -77
  481. package/dist/service/subagent-workflow/runtime-direct-driver.js +0 -75
  482. package/dist/service/subagent-workflow/types.js +0 -11
  483. package/dist/service/subagent-workflow/workflow-store.d.ts +0 -26
  484. package/dist/service/subagent-workflow/workflow-store.js +0 -165
  485. package/dist/service/trajectory-service.d.ts +0 -2
  486. package/dist/service/trajectory-service.js +0 -15
  487. package/dist/tools/critique-prompt.d.ts +0 -14
  488. package/dist/tools/deep-reflect.d.ts +0 -39
  489. package/dist/tools/deep-reflect.js +0 -350
  490. package/dist/tools/model-index.d.ts +0 -9
  491. package/dist/types/event-types.d.ts +0 -306
  492. package/dist/types/event-types.js +0 -106
  493. package/dist/types/hygiene-types.d.ts +0 -20
  494. package/dist/types/hygiene-types.js +0 -12
  495. package/dist/types/runtime-summary.d.ts +0 -47
  496. package/dist/types/runtime-summary.js +0 -1
  497. package/dist/types.d.ts +0 -50
  498. package/dist/types.js +0 -22
  499. package/dist/utils/file-lock.d.ts +0 -71
  500. package/dist/utils/file-lock.js +0 -309
  501. package/dist/utils/glob-match.d.ts +0 -28
  502. package/dist/utils/hashing.d.ts +0 -9
  503. package/dist/utils/io.d.ts +0 -6
  504. package/dist/utils/io.js +0 -106
  505. package/dist/utils/nlp.d.ts +0 -9
  506. package/dist/utils/plugin-logger.d.ts +0 -39
  507. package/dist/utils/subagent-probe.d.ts +0 -34
  508. package/dist/utils/subagent-probe.js +0 -81
@@ -0,0 +1,813 @@
1
+ /**
2
+ * Model Training Registry — Training Run, Checkpoint, and Eval Summary Lineage
3
+ * =============================================================================
4
+ *
5
+ * PURPOSE: Establish strict auditable lineage from training run → checkpoint → eval
6
+ * so that "deployable" is a controlled state, not a free-text field.
7
+ *
8
+ * ARCHITECTURE:
9
+ * - Registry file: {stateDir}/.state/nocturnal/training-registry.json
10
+ * - Three record types in one store: TrainingRun, Checkpoint, EvalSummary
11
+ * - File locking on all write operations
12
+ * - Family alignment enforced at every transition
13
+ *
14
+ * LINEAGE CHAIN (enforced):
15
+ * TrainingRun → Checkpoint → EvalSummary
16
+ * DatasetFingerprint → TrainingRun → Checkpoint → EvalSummary
17
+ *
18
+ * DEPLOYABILITY RULE:
19
+ * A Checkpoint can only be marked deployable if:
20
+ * 1. It has an attached EvalSummary
21
+ * 2. The EvalSummary has a verdict of 'pass' or 'compare_only' (not 'fail')
22
+ * 3. The EvalSummary's targetModelFamily matches the Checkpoint's targetModelFamily
23
+ * 4. The Checkpoint's trainRun is in 'completed' status
24
+ *
25
+ * DESIGN CONSTRAINTS:
26
+ * - No real training invocation (Phase 4 only)
27
+ * - No checkpoint deploy routing (Phase 5)
28
+ * - No automatic promotion
29
+ * - Registry is append-only for runs and checkpoints
30
+ * - EvalSummary attachment is the only mutable operation on a Checkpoint
31
+ */
32
+
33
+ import * as fs from 'fs';
34
+ import * as path from 'path';
35
+ import * as crypto from 'crypto';
36
+ import { withLock } from '../utils/file-lock.js';
37
+
38
+ // ---------------------------------------------------------------------------
39
+ // Constants
40
+ // ---------------------------------------------------------------------------
41
+
42
/** Location of the registry JSON file, expressed relative to the state directory. */
const REGISTRY_FILE = '.state/nocturnal/training-registry.json';
43
+
44
+ // ---------------------------------------------------------------------------
45
+ // Types
46
+ // ---------------------------------------------------------------------------
47
+
48
/**
 * Lifecycle state of a training run.
 *
 * Runs are created as 'pending'; 'completed' and 'failed' are the two
 * end states recorded together with a completion timestamp.
 */
export type TrainingRunStatus =
  | 'pending'
  | 'running'
  | 'completed'
  | 'failed';
52
+
53
/**
 * Registry record describing a single training job.
 */
export interface TrainingRun {
  /** Identifier that is unique to this run. */
  trainRunId: string;

  /** Experiment the run is part of; a secondary lookup key next to trainRunId. */
  experimentId: string;

  /** Model family the checkpoints of this run are produced for. */
  targetModelFamily: string;

  /** Dataset fingerprint; ties the run back to the ORPO export's datasetFingerprint. */
  datasetFingerprint: string;

  /** Identifier ({exportId}) of the ORPO export that supplied the training data. */
  exportId: string;

  /** How many samples of that export were used. */
  sampleCount: number;

  /**
   * Fingerprint of the training configuration.
   * A placeholder such as 'default-v0.1.0' in Phase 4; later meant to
   * reference a real config artifact.
   */
  configFingerprint: string;

  /** Creation time, ISO-8601. */
  createdAt: string;

  /** Completion time, ISO-8601; present once the run is completed or failed. */
  completedAt?: string;

  /** Where the run currently is in its lifecycle. */
  status: TrainingRunStatus;

  /** Human-readable explanation, only meaningful when status === 'failed'. */
  failureReason?: string;

  /** IDs of every checkpoint this run produced (e.g. one per saved epoch). */
  checkpointIds: string[];
}
109
+
110
/**
 * Registry record for one artifact produced by a training run.
 */
export interface Checkpoint {
  /** Identifier that is unique to this checkpoint. */
  checkpointId: string;

  /** ID of the training run this checkpoint came from. */
  trainRunId: string;

  /** Model family; has to equal the parent TrainingRun's targetModelFamily. */
  targetModelFamily: string;

  /**
   * Where the checkpoint artifact lives.
   * A placeholder path in Phase 4; later the adapter weights, config, etc.
   */
  artifactPath: string;

  /** Creation time, ISO-8601. */
  createdAt: string;

  /**
   * Whether the checkpoint may be routed to a worker.
   * Stays false until an EvalSummary with verdict 'pass' or 'compare_only'
   * is attached; once revoked, a new passing eval is needed to set it again.
   */
  deployable: boolean;

  /** evalId of the attached EvalSummary; required whenever deployable is true. */
  lastEvalSummaryRef?: string;
}
146
+
147
/**
 * Registry record holding the outcome of benchmarking a checkpoint.
 */
export interface EvalSummary {
  /** Identifier that is unique to this eval. */
  evalId: string;

  /** ID of the checkpoint the eval was executed against. */
  checkpointId: string;

  /** ID of the benchmark run that produced this eval. */
  benchmarkId: string;

  /**
   * Model family the eval targets. Has to equal the checkpoint's
   * targetModelFamily (checked when the summary is attached), so that an
   * eval for one family can never validate a checkpoint of another.
   */
  targetModelFamily: string;

  /** How the eval was run: prompt-assisted or reduced-prompt. */
  mode: 'prompt_assisted' | 'reduced_prompt';

  /** Mean benchmark score of the baseline checkpoint. */
  baselineScore: number;

  /** Mean benchmark score of this (candidate) checkpoint. */
  candidateScore: number;

  /** candidateScore minus baselineScore. */
  delta: number;

  /** Benchmark verdict. */
  verdict: 'pass' | 'fail' | 'compare_only';

  /** Creation time, ISO-8601. */
  createdAt: string;
}
185
+
186
/**
 * Shape of the registry file: the three record collections stored together.
 */
export interface ModelTrainingRegistry {
  /** Every registered training run. */
  trainingRuns: Array<TrainingRun>;
  /** Every registered checkpoint. */
  checkpoints: Array<Checkpoint>;
  /** Every attached eval summary. */
  evalSummaries: Array<EvalSummary>;
}
194
+
195
+ // ---------------------------------------------------------------------------
196
+ // Registry Path
197
+ // ---------------------------------------------------------------------------
198
+
199
/**
 * Build the path of the registry file by joining `stateDir` with REGISTRY_FILE.
 */
function getRegistryPath(stateDir: string): string {
  const registryPath = path.join(stateDir, REGISTRY_FILE);
  return registryPath;
}
202
+
203
/**
 * Create the directory that holds the registry file (including missing
 * parents) unless something already exists at that path.
 */
function ensureRegistryDir(stateDir: string): void {
  const parentDir = path.dirname(getRegistryPath(stateDir));
  if (fs.existsSync(parentDir)) {
    return;
  }
  fs.mkdirSync(parentDir, { recursive: true });
}
213
+
214
+ // ---------------------------------------------------------------------------
215
+ // File Operations
216
+ // ---------------------------------------------------------------------------
217
+
218
/**
 * Read the registry from disk.
 *
 * Returns an empty registry when the file does not exist. When the file
 * cannot be read or parsed, or its root is not a JSON object, a warning is
 * logged and an empty registry is returned (best-effort recovery).
 *
 * A parsed object is normalized so that `trainingRuns`, `checkpoints` and
 * `evalSummaries` are always arrays: a missing or non-array collection is
 * replaced by `[]`. Without this, a file such as `{}` would parse fine and
 * later crash callers on `.push` / `.find`.
 *
 * NOTE(review): recovering with an empty state means the next write replaces
 * the unreadable file; that pre-existing policy is kept unchanged here.
 *
 * @param stateDir - Workspace state directory
 * @returns The registry with all three collections guaranteed to be arrays
 */
function readRegistry(stateDir: string): ModelTrainingRegistry {
  const registryPath = getRegistryPath(stateDir);
  if (!fs.existsSync(registryPath)) {
    return { trainingRuns: [], checkpoints: [], evalSummaries: [] };
  }
  try {
    const content = fs.readFileSync(registryPath, 'utf-8');
    const parsed: unknown = JSON.parse(content);

    // `null`, arrays and primitives are valid JSON but not a registry.
    if (typeof parsed !== 'object' || parsed === null || Array.isArray(parsed)) {
      throw new Error('registry root is not a JSON object');
    }

    const candidate = parsed as Partial<ModelTrainingRegistry>;
    return {
      // Keep any additional keys the file may carry.
      ...candidate,
      trainingRuns: Array.isArray(candidate.trainingRuns) ? candidate.trainingRuns : [],
      checkpoints: Array.isArray(candidate.checkpoints) ? candidate.checkpoints : [],
      evalSummaries: Array.isArray(candidate.evalSummaries) ? candidate.evalSummaries : [],
    };
  } catch (err) {
    console.warn(`[model-training-registry] Registry corrupted at ${registryPath}, recovering with empty state: ${String(err)}`);
    return { trainingRuns: [], checkpoints: [], evalSummaries: [] };
  }
}
234
+
235
/**
 * Persist the registry: serialize it as indented JSON into a sibling
 * `.tmp` file, then rename that file over the registry path.
 *
 * The caller is expected to already hold the registry lock.
 */
function writeRegistry(stateDir: string, registry: ModelTrainingRegistry): void {
  ensureRegistryDir(stateDir);

  const target = getRegistryPath(stateDir);
  const staging = `${target}.tmp`;
  const serialized = JSON.stringify(registry, null, 2);

  fs.writeFileSync(staging, serialized, 'utf-8');
  fs.renameSync(staging, target);
}
246
+
247
/**
 * Run `fn` against a freshly read registry while `withLock` guards the
 * registry path.
 *
 * The registry is read inside the locked section; writing it back is the
 * callback's responsibility. Whatever `fn` returns is handed back to the
 * caller.
 */
function withRegistryLock<T>(
  stateDir: string,
  fn: (registry: ModelTrainingRegistry) => T
): T {
  const lockTarget = getRegistryPath(stateDir);
  const runLocked = (): T => fn(readRegistry(stateDir));
  return withLock(lockTarget, runLocked);
}
260
+
261
+ // ---------------------------------------------------------------------------
262
+ // Training Run Operations
263
+ // ---------------------------------------------------------------------------
264
+
265
/**
 * Valid training run status transitions, keyed by the current status.
 *
 *   pending → running → completed | failed
 *
 * There are no backward transitions, and an empty list marks a status
 * that cannot be left again.
 */
const VALID_RUN_TRANSITIONS: Record<TrainingRunStatus, TrainingRunStatus[]> = {
  pending: ['running'],
  running: ['completed', 'failed'],
  completed: [], // terminal
  failed: [], // terminal
};
276
+
277
/**
 * Create a training run record in 'pending' status with a freshly
 * generated UUID and no checkpoints, append it to the registry and
 * persist the registry.
 *
 * @param stateDir - Workspace state directory
 * @param params - Descriptive fields copied onto the new run
 * @returns The newly stored TrainingRun
 */
export function registerTrainingRun(
  stateDir: string,
  params: {
    experimentId: string;
    targetModelFamily: string;
    datasetFingerprint: string;
    exportId: string;
    sampleCount: number;
    configFingerprint: string;
  }
): TrainingRun {
  return withRegistryLock(stateDir, (registry) => {
    const createdAt = new Date().toISOString();
    const trainRunId = crypto.randomUUID();
    const {
      experimentId,
      targetModelFamily,
      datasetFingerprint,
      exportId,
      sampleCount,
      configFingerprint,
    } = params;

    // Key order is kept stable because it determines the serialized JSON layout.
    const newRun: TrainingRun = {
      trainRunId,
      experimentId,
      targetModelFamily,
      datasetFingerprint,
      exportId,
      sampleCount,
      configFingerprint,
      createdAt,
      status: 'pending',
      checkpointIds: [],
    };

    registry.trainingRuns.push(newRun);
    writeRegistry(stateDir, registry);
    return newRun;
  });
}
317
+
318
/**
 * Move a training run to `newStatus` and persist the registry.
 *
 * The move must be listed in VALID_RUN_TRANSITIONS for the run's current
 * status. `completedAt` is stamped when the new status is 'completed' or
 * 'failed'; `failureReason` is stored only for 'failed'.
 *
 * @param stateDir - Workspace state directory
 * @param trainRunId - ID of the run to update
 * @param newStatus - Status to move the run to
 * @param failureReason - Optional explanation, kept only when failing the run
 * @returns The updated TrainingRun
 * @throws Error if run not found or transition is invalid
 */
export function updateTrainingRunStatus(
  stateDir: string,
  trainRunId: string,
  newStatus: TrainingRunStatus,
  failureReason?: string
): TrainingRun {
  return withRegistryLock(stateDir, (registry) => {
    const position = registry.trainingRuns.findIndex(
      (candidate) => candidate.trainRunId === trainRunId
    );
    if (position === -1) {
      throw new Error(`Training run not found: ${trainRunId}`);
    }

    const current = registry.trainingRuns[position];
    const permitted = VALID_RUN_TRANSITIONS[current.status];
    const transitionOk = permitted.includes(newStatus);
    if (!transitionOk) {
      throw new Error(
        `Invalid status transition for training run ${trainRunId}: ${current.status} → ${newStatus}. ` +
          `Allowed transitions from ${current.status}: ${permitted.join(', ') || 'none'}`
      );
    }

    const reachedEndState = newStatus === 'completed' || newStatus === 'failed';
    const updated: TrainingRun = {
      ...current,
      status: newStatus,
      completedAt: reachedEndState ? new Date().toISOString() : undefined,
      failureReason: newStatus === 'failed' ? failureReason : undefined,
    };
    registry.trainingRuns[position] = updated;

    writeRegistry(stateDir, registry);
    return updated;
  });
}
357
+
358
/**
 * Shorthand for moving a training run to 'completed' via
 * updateTrainingRunStatus.
 */
export function completeTrainingRun(stateDir: string, trainRunId: string): TrainingRun {
  const completedRun = updateTrainingRunStatus(stateDir, trainRunId, 'completed');
  return completedRun;
}
364
+
365
/**
 * Shorthand for moving a training run to 'failed' via
 * updateTrainingRunStatus, recording `reason` as the failure reason.
 */
export function failTrainingRun(
  stateDir: string,
  trainRunId: string,
  reason: string
): TrainingRun {
  const failedRun = updateTrainingRunStatus(stateDir, trainRunId, 'failed', reason);
  return failedRun;
}
375
+
376
/**
 * Shorthand for moving a training run to 'running' via
 * updateTrainingRunStatus.
 */
export function startTrainingRun(stateDir: string, trainRunId: string): TrainingRun {
  const startedRun = updateTrainingRunStatus(stateDir, trainRunId, 'running');
  return startedRun;
}
382
+
383
/**
 * Look up a training run by its ID.
 *
 * @returns The first run whose trainRunId matches, or null when none does
 */
export function getTrainingRun(
  stateDir: string,
  trainRunId: string
): TrainingRun | null {
  const { trainingRuns } = readRegistry(stateDir);
  const match = trainingRuns.find((candidate) => candidate.trainRunId === trainRunId);
  if (match === undefined || match === null) {
    return null;
  }
  return match;
}
393
+
394
/**
 * Return training runs, newest first (by createdAt).
 *
 * A filter field only takes effect when it is set to a truthy value;
 * when both are given a run has to satisfy both.
 */
export function listTrainingRuns(
  stateDir: string,
  filter?: {
    status?: TrainingRunStatus;
    targetModelFamily?: string;
  }
): TrainingRun[] {
  const wantedStatus = filter?.status;
  const wantedFamily = filter?.targetModelFamily;
  const createdMillis = (run: TrainingRun): number => new Date(run.createdAt).getTime();

  const selected = readRegistry(stateDir).trainingRuns.filter((run) => {
    if (wantedStatus && run.status !== wantedStatus) {
      return false;
    }
    if (wantedFamily && run.targetModelFamily !== wantedFamily) {
      return false;
    }
    return true;
  });

  return selected.sort((a, b) => createdMillis(b) - createdMillis(a));
}
418
+
419
+ // ---------------------------------------------------------------------------
420
+ // Checkpoint Operations
421
+ // ---------------------------------------------------------------------------
422
+
423
/**
 * Record a checkpoint for an existing training run.
 *
 * The checkpoint gets a fresh UUID, starts with `deployable: false`, and
 * its ID is appended to the parent run's `checkpointIds`. Both changes are
 * persisted in one registry write.
 *
 * @param stateDir - Workspace state directory
 * @param params - Parent run ID, model family and artifact path
 * @returns The newly stored Checkpoint
 * @throws Error if the training run is not found
 * @throws Error if the targetModelFamily does not match the run's family
 */
export function registerCheckpoint(
  stateDir: string,
  params: {
    trainRunId: string;
    targetModelFamily: string;
    artifactPath: string;
  }
): Checkpoint {
  return withRegistryLock(stateDir, (registry) => {
    const { trainRunId, targetModelFamily, artifactPath } = params;

    // The parent run has to exist.
    const runPosition = registry.trainingRuns.findIndex(
      (candidate) => candidate.trainRunId === trainRunId
    );
    if (runPosition === -1) {
      throw new Error(`Training run not found: ${trainRunId}`);
    }
    const parentRun = registry.trainingRuns[runPosition];

    // The checkpoint has to belong to the same model family as its run.
    if (parentRun.targetModelFamily !== targetModelFamily) {
      throw new Error(
        `Target model family mismatch: checkpoint family "${targetModelFamily}" ` +
          `does not match training run family "${parentRun.targetModelFamily}"`
      );
    }

    const createdAt = new Date().toISOString();
    const checkpointId = crypto.randomUUID();

    const created: Checkpoint = {
      checkpointId,
      trainRunId,
      targetModelFamily,
      artifactPath,
      createdAt,
      deployable: false, // never deployable at registration time
    };
    registry.checkpoints.push(created);

    // Link the checkpoint from its parent run.
    registry.trainingRuns[runPosition] = {
      ...parentRun,
      checkpointIds: parentRun.checkpointIds.concat(checkpointId),
    };

    writeRegistry(stateDir, registry);
    return created;
  });
}
477
+
478
/**
 * Look up a checkpoint by its ID.
 *
 * @returns The first checkpoint whose checkpointId matches, or null when none does
 */
export function getCheckpoint(
  stateDir: string,
  checkpointId: string
): Checkpoint | null {
  const { checkpoints } = readRegistry(stateDir);
  const match = checkpoints.find((candidate) => candidate.checkpointId === checkpointId);
  if (match === undefined || match === null) {
    return null;
  }
  return match;
}
488
+
489
/**
 * Return checkpoints, newest first (by createdAt).
 *
 * `trainRunId` and `targetModelFamily` only filter when set to a truthy
 * value; `deployable` filters whenever it is not undefined (so `false` is
 * a valid filter). All active filters have to match.
 */
export function listCheckpoints(
  stateDir: string,
  filter?: {
    trainRunId?: string;
    targetModelFamily?: string;
    deployable?: boolean;
  }
): Checkpoint[] {
  const wantedRun = filter?.trainRunId;
  const wantedFamily = filter?.targetModelFamily;
  const wantedDeployable = filter?.deployable;
  const createdMillis = (cp: Checkpoint): number => new Date(cp.createdAt).getTime();

  const selected = readRegistry(stateDir).checkpoints.filter((cp) => {
    if (wantedRun && cp.trainRunId !== wantedRun) {
      return false;
    }
    if (wantedFamily && cp.targetModelFamily !== wantedFamily) {
      return false;
    }
    if (wantedDeployable !== undefined && cp.deployable !== wantedDeployable) {
      return false;
    }
    return true;
  });

  return selected.sort((a, b) => createdMillis(b) - createdMillis(a));
}
517
+
518
/**
 * Return the checkpoints of `targetModelFamily` that are flagged
 * deployable, in the order produced by listCheckpoints.
 */
export function listDeployableCheckpoints(
  stateDir: string,
  targetModelFamily: string
): Checkpoint[] {
  const deployableOnly = { targetModelFamily, deployable: true };
  return listCheckpoints(stateDir, deployableOnly);
}
530
+
531
+ // ---------------------------------------------------------------------------
532
+ // Eval Summary Operations
533
+ // ---------------------------------------------------------------------------
534
+
535
/**
 * Attach an eval summary to a checkpoint.
 *
 * The summary is stamped with `createdAt`, appended to the registry, and
 * the checkpoint's `lastEvalSummaryRef` is pointed at it. All validation
 * happens before the registry is modified (fail-closed):
 *
 *  - the checkpoint must exist;
 *  - `summary.checkpointId` must be the checkpoint being attached to, so
 *    the stored lineage cannot point at a different checkpoint;
 *  - `summary.targetModelFamily` must equal the checkpoint's family;
 *  - `summary.evalId` must not already be registered. Lookups resolve
 *    `lastEvalSummaryRef` with the first matching evalId, so a duplicate
 *    would make the deploy gate read an older record (possibly with a
 *    different verdict or family).
 *
 * Attaching a summary with verdict 'fail' also clears the checkpoint's
 * `deployable` flag, so a checkpoint is never left deployable while its
 * latest attached eval is a failure. Other verdicts leave the flag as is.
 *
 * @param stateDir - Workspace state directory
 * @param checkpointId - The checkpoint to attach to
 * @param summary - The eval summary to attach (createdAt is filled in here)
 * @returns The stored EvalSummary
 *
 * @throws Error if checkpoint not found
 * @throws Error if summary.checkpointId differs from checkpointId
 * @throws Error if targetModelFamily mismatch between summary and checkpoint
 * @throws Error if an eval summary with the same evalId already exists
 */
export function attachEvalSummary(
  stateDir: string,
  checkpointId: string,
  summary: Omit<EvalSummary, 'createdAt'>
): EvalSummary {
  return withRegistryLock(stateDir, (registry) => {
    const checkpointIdx = registry.checkpoints.findIndex(
      (c) => c.checkpointId === checkpointId
    );
    if (checkpointIdx === -1) {
      throw new Error(`Checkpoint not found: ${checkpointId}`);
    }

    const checkpoint = registry.checkpoints[checkpointIdx];

    // LINEAGE INTEGRITY: the summary must describe the checkpoint it is attached to.
    if (summary.checkpointId !== checkpointId) {
      throw new Error(
        `Checkpoint mismatch: eval "${summary.evalId}" references checkpoint ` +
          `"${summary.checkpointId}" but is being attached to "${checkpointId}".`
      );
    }

    // FAMILY ALIGNMENT — enforced fail-closed:
    // an eval for one model family cannot be attached to a checkpoint of
    // another family, even if the eval verdict is 'pass'.
    if (summary.targetModelFamily !== checkpoint.targetModelFamily) {
      throw new Error(
        `Family mismatch: eval targets "${summary.targetModelFamily}" ` +
          `but checkpoint "${checkpointId}" is "${checkpoint.targetModelFamily}". ` +
          `EvalSummary.targetModelFamily must match the checkpoint's targetModelFamily.`
      );
    }

    // UNIQUENESS: evalId is the lookup key behind lastEvalSummaryRef.
    if (registry.evalSummaries.some((e) => e.evalId === summary.evalId)) {
      throw new Error(`Eval summary already exists: ${summary.evalId}`);
    }

    const evalSummary: EvalSummary = {
      ...summary,
      createdAt: new Date().toISOString(),
    };

    registry.evalSummaries.push(evalSummary);

    // Point the checkpoint at the new eval; a failing eval revokes deployability.
    registry.checkpoints[checkpointIdx] = {
      ...checkpoint,
      deployable: evalSummary.verdict === 'fail' ? false : checkpoint.deployable,
      lastEvalSummaryRef: evalSummary.evalId,
    };

    writeRegistry(stateDir, registry);
    return evalSummary;
  });
}
588
+
589
/**
 * Look up an eval summary by its ID.
 *
 * @returns The first summary whose evalId matches, or null when none does
 */
export function getEvalSummary(
  stateDir: string,
  evalId: string
): EvalSummary | null {
  const { evalSummaries } = readRegistry(stateDir);
  const match = evalSummaries.find((candidate) => candidate.evalId === evalId);
  if (match === undefined || match === null) {
    return null;
  }
  return match;
}
599
+
600
/**
 * Return eval summaries, newest first (by createdAt).
 *
 * Each filter field only takes effect when set to a truthy value; all
 * active filters have to match.
 */
export function listEvalSummaries(
  stateDir: string,
  filter?: {
    checkpointId?: string;
    benchmarkId?: string;
    verdict?: EvalSummary['verdict'];
    targetModelFamily?: string;
  }
): EvalSummary[] {
  const wantedCheckpoint = filter?.checkpointId;
  const wantedBenchmark = filter?.benchmarkId;
  const wantedVerdict = filter?.verdict;
  const wantedFamily = filter?.targetModelFamily;
  const createdMillis = (ev: EvalSummary): number => new Date(ev.createdAt).getTime();

  const selected = readRegistry(stateDir).evalSummaries.filter((ev) => {
    if (wantedCheckpoint && ev.checkpointId !== wantedCheckpoint) {
      return false;
    }
    if (wantedBenchmark && ev.benchmarkId !== wantedBenchmark) {
      return false;
    }
    if (wantedVerdict && ev.verdict !== wantedVerdict) {
      return false;
    }
    if (wantedFamily && ev.targetModelFamily !== wantedFamily) {
      return false;
    }
    return true;
  });

  return selected.sort((a, b) => createdMillis(b) - createdMillis(a));
}
632
+
633
+ // ---------------------------------------------------------------------------
634
+ // Deployability — Core Gating Logic
635
+ // ---------------------------------------------------------------------------
636
+
637
/**
 * Set or revoke the deployable flag of a checkpoint.
 *
 * DEPLOYABILITY RULE (fail-closed) — marking as deployable requires ALL of:
 *  1. The checkpoint has an attached EvalSummary (lastEvalSummaryRef is set)
 *     and that summary exists in the registry.
 *  2. The attached EvalSummary has verdict 'pass' or 'compare_only' (not 'fail').
 *  3. The EvalSummary's targetModelFamily matches the checkpoint's
 *     targetModelFamily. attachEvalSummary() already rejects mismatches,
 *     but the rule is re-checked here so that a registry edited outside
 *     this module, or an evalId that resolves to another record, cannot
 *     slip through the gate.
 *  4. The parent TrainingRun exists and is in 'completed' status.
 *
 * Revoking (deployable = false) has no preconditions and also clears
 * lastEvalSummaryRef, so a new eval has to be attached before the
 * checkpoint can be marked deployable again.
 *
 * @param stateDir - Workspace state directory
 * @param checkpointId - The checkpoint to mark
 * @param deployable - true to mark as deployable; false to revoke
 * @returns The updated Checkpoint
 *
 * @throws Error if checkpoint not found
 * @throws Error if preconditions for deployable=true are not met
 */
export function markCheckpointDeployable(
  stateDir: string,
  checkpointId: string,
  deployable: boolean
): Checkpoint {
  return withRegistryLock(stateDir, (registry) => {
    const idx = registry.checkpoints.findIndex((c) => c.checkpointId === checkpointId);
    if (idx === -1) {
      throw new Error(`Checkpoint not found: ${checkpointId}`);
    }

    const checkpoint = registry.checkpoints[idx];

    if (deployable) {
      // FAIL-CLOSED: verify every precondition before touching the record.

      // 1a. Must have an attached eval summary
      if (!checkpoint.lastEvalSummaryRef) {
        throw new Error(
          `Cannot mark checkpoint ${checkpointId} as deployable: ` +
            `no eval summary attached. Attach an EvalSummary first.`
        );
      }

      // 1b. The referenced eval summary must exist
      const evalSummary = registry.evalSummaries.find(
        (e) => e.evalId === checkpoint.lastEvalSummaryRef
      );
      if (!evalSummary) {
        throw new Error(
          `Cannot mark checkpoint ${checkpointId} as deployable: ` +
            `eval summary "${checkpoint.lastEvalSummaryRef}" not found`
        );
      }

      // 2. Verdict must be 'pass' or 'compare_only' (not 'fail')
      if (evalSummary.verdict === 'fail') {
        throw new Error(
          `Cannot mark checkpoint ${checkpointId} as deployable: ` +
            `eval verdict is '${evalSummary.verdict}' (evalId: ${evalSummary.evalId}). ` +
            `Only 'pass' or 'compare_only' verdicts allow deployment.`
        );
      }

      // 3. Eval and checkpoint must target the same model family
      if (evalSummary.targetModelFamily !== checkpoint.targetModelFamily) {
        throw new Error(
          `Cannot mark checkpoint ${checkpointId} as deployable: ` +
            `eval summary family "${evalSummary.targetModelFamily}" does not match ` +
            `checkpoint family "${checkpoint.targetModelFamily}"`
        );
      }

      // 4. Parent training run must exist and be completed
      const run = registry.trainingRuns.find((r) => r.trainRunId === checkpoint.trainRunId);
      if (!run) {
        throw new Error(
          `Cannot mark checkpoint ${checkpointId} as deployable: ` +
            `parent training run "${checkpoint.trainRunId}" not found`
        );
      }
      if (run.status !== 'completed') {
        throw new Error(
          `Cannot mark checkpoint ${checkpointId} as deployable: ` +
            `parent training run is in '${run.status}' status (must be 'completed')`
        );
      }
    }

    // Apply the update (both marking deployable and revoking deployability)
    registry.checkpoints[idx] = {
      ...checkpoint,
      deployable,
      // If revoking deployability, also clear the eval ref
      lastEvalSummaryRef: deployable ? checkpoint.lastEvalSummaryRef : undefined,
    };

    writeRegistry(stateDir, registry);
    return registry.checkpoints[idx];
  });
}
729
+
730
/**
 * Report the stored deployable flag of a checkpoint.
 *
 * @returns The checkpoint's `deployable` value, or false when the
 *          checkpoint is unknown or the flag is absent
 */
export function isCheckpointDeployable(
  stateDir: string,
  checkpointId: string
): boolean {
  const found = getCheckpoint(stateDir, checkpointId);
  if (found === null || found === undefined) {
    return false;
  }
  return found.deployable ?? false;
}
740
+
741
+ // ---------------------------------------------------------------------------
742
+ // Registry-Level Queries
743
+ // ---------------------------------------------------------------------------
744
+
745
/**
 * Resolve a checkpoint together with its parent run and attached eval.
 *
 * @returns `{ run, checkpoint, eval }`, where `eval` is null when no eval
 *          is referenced or the referenced one is missing; null overall
 *          when the checkpoint or its parent run cannot be found
 */
export function getCheckpointLineage(
  stateDir: string,
  checkpointId: string
): {
  run: TrainingRun;
  checkpoint: Checkpoint;
  eval: EvalSummary | null;
} | null {
  const { trainingRuns, checkpoints, evalSummaries } = readRegistry(stateDir);

  const checkpoint = checkpoints.find((c) => c.checkpointId === checkpointId);
  if (!checkpoint) {
    return null;
  }

  const run = trainingRuns.find((r) => r.trainRunId === checkpoint.trainRunId);
  if (!run) {
    return null;
  }

  let attachedEval: EvalSummary | null = null;
  if (checkpoint.lastEvalSummaryRef) {
    const evalRef = checkpoint.lastEvalSummaryRef;
    attachedEval = evalSummaries.find((e) => e.evalId === evalRef) ?? null;
  }

  return { run, checkpoint, eval: attachedEval };
}
770
+
771
/**
 * Return the whole registry as read from disk (intended for debugging
 * and admin use).
 */
export function getFullRegistry(stateDir: string): ModelTrainingRegistry {
  const snapshot = readRegistry(stateDir);
  return snapshot;
}
777
+
778
/**
 * Summarize the registry as counts.
 *
 * Runs are counted in total and per status, checkpoints in total and by
 * truthy `deployable`, evals in total and by verdict ('pass' and
 * 'compare_only' both count as passing; 'fail' as failing).
 */
export function getTrainingRegistryStats(
  stateDir: string
): {
  totalRuns: number;
  completedRuns: number;
  failedRuns: number;
  pendingRuns: number;
  runningRuns: number;
  totalCheckpoints: number;
  deployableCheckpoints: number;
  totalEvals: number;
  passingEvals: number;
  failingEvals: number;
} {
  const { trainingRuns, checkpoints, evalSummaries } = readRegistry(stateDir);

  // One pass per collection instead of one filter per counter.
  let completedRuns = 0;
  let failedRuns = 0;
  let pendingRuns = 0;
  let runningRuns = 0;
  for (const run of trainingRuns) {
    switch (run.status) {
      case 'completed':
        completedRuns += 1;
        break;
      case 'failed':
        failedRuns += 1;
        break;
      case 'pending':
        pendingRuns += 1;
        break;
      case 'running':
        runningRuns += 1;
        break;
      default:
        break;
    }
  }

  let deployableCheckpoints = 0;
  for (const checkpoint of checkpoints) {
    if (checkpoint.deployable) {
      deployableCheckpoints += 1;
    }
  }

  let passingEvals = 0;
  let failingEvals = 0;
  for (const evalSummary of evalSummaries) {
    if (evalSummary.verdict === 'pass' || evalSummary.verdict === 'compare_only') {
      passingEvals += 1;
    } else if (evalSummary.verdict === 'fail') {
      failingEvals += 1;
    }
  }

  return {
    totalRuns: trainingRuns.length,
    completedRuns,
    failedRuns,
    pendingRuns,
    runningRuns,
    totalCheckpoints: checkpoints.length,
    deployableCheckpoints,
    totalEvals: evalSummaries.length,
    passingEvals,
    failingEvals,
  };
}