principles-disciple 1.8.1 → 1.8.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (470) hide show
  1. package/ADVANCED_CONFIG_ZH.md +97 -0
  2. package/AGENT_INSTALL.md +173 -0
  3. package/AGENT_INSTALL_EN.md +173 -0
  4. package/INSTALL.md +256 -0
  5. package/SKILL.md +63 -0
  6. package/docs/COMMAND_REFERENCE.md +76 -0
  7. package/docs/COMMAND_REFERENCE_EN.md +79 -0
  8. package/esbuild.config.js +75 -0
  9. package/openclaw.plugin.json +4 -4
  10. package/package.json +11 -13
  11. package/scripts/build-web.mjs +46 -0
  12. package/scripts/install-dependencies.cjs +47 -0
  13. package/scripts/sync-plugin.mjs +802 -0
  14. package/scripts/verify-build.mjs +109 -0
  15. package/src/agents/nocturnal-dreamer.md +152 -0
  16. package/src/agents/nocturnal-philosopher.md +138 -0
  17. package/src/agents/nocturnal-reflector.md +126 -0
  18. package/src/agents/nocturnal-scribe.md +164 -0
  19. package/src/commands/capabilities.ts +85 -0
  20. package/{dist/commands/context.js → src/commands/context.ts} +78 -38
  21. package/src/commands/evolution-status.ts +146 -0
  22. package/src/commands/export.ts +111 -0
  23. package/src/commands/focus.ts +533 -0
  24. package/src/commands/nocturnal-review.ts +311 -0
  25. package/src/commands/nocturnal-rollout.ts +763 -0
  26. package/src/commands/nocturnal-train.ts +1002 -0
  27. package/{dist/commands/pain.js → src/commands/pain.ts} +68 -49
  28. package/src/commands/principle-rollback.ts +27 -0
  29. package/{dist/commands/rollback.js → src/commands/rollback.ts} +44 -12
  30. package/src/commands/samples.ts +60 -0
  31. package/src/commands/strategy.ts +38 -0
  32. package/{dist/commands/thinking-os.js → src/commands/thinking-os.ts} +59 -36
  33. package/src/commands/workflow-debug.ts +128 -0
  34. package/{dist/config/defaults/runtime.js → src/config/defaults/runtime.ts} +12 -5
  35. package/src/config/errors.ts +163 -0
  36. package/{dist/config/index.d.ts → src/config/index.ts} +2 -1
  37. package/src/constants/diagnostician.ts +66 -0
  38. package/src/constants/tools.ts +62 -0
  39. package/src/core/adaptive-thresholds.ts +476 -0
  40. package/{dist/core/config-service.js → src/core/config-service.ts} +7 -4
  41. package/{dist/core/config.js → src/core/config.ts} +158 -46
  42. package/src/core/control-ui-db.ts +435 -0
  43. package/{dist/core/detection-funnel.js → src/core/detection-funnel.ts} +36 -21
  44. package/{dist/core/detection-service.js → src/core/detection-service.ts} +7 -4
  45. package/{dist/core/dictionary-service.js → src/core/dictionary-service.ts} +7 -4
  46. package/{dist/core/dictionary.js → src/core/dictionary.ts} +57 -34
  47. package/src/core/empathy-keyword-matcher.ts +327 -0
  48. package/src/core/empathy-types.ts +218 -0
  49. package/src/core/event-log.ts +544 -0
  50. package/src/core/evolution-engine.ts +612 -0
  51. package/src/core/evolution-logger.ts +353 -0
  52. package/src/core/evolution-migration.ts +77 -0
  53. package/src/core/evolution-reducer.ts +731 -0
  54. package/src/core/evolution-types.ts +456 -0
  55. package/src/core/external-training-contract.ts +527 -0
  56. package/src/core/focus-history.ts +1458 -0
  57. package/src/core/hygiene/tracker.ts +117 -0
  58. package/{dist/core/init.js → src/core/init.ts} +39 -26
  59. package/src/core/local-worker-routing.ts +617 -0
  60. package/{dist/core/migration.js → src/core/migration.ts} +18 -11
  61. package/src/core/model-deployment-registry.ts +722 -0
  62. package/src/core/model-training-registry.ts +813 -0
  63. package/src/core/nocturnal-arbiter.ts +706 -0
  64. package/src/core/nocturnal-candidate-scoring.ts +392 -0
  65. package/src/core/nocturnal-compliance.ts +1075 -0
  66. package/src/core/nocturnal-dataset.ts +668 -0
  67. package/src/core/nocturnal-executability.ts +428 -0
  68. package/src/core/nocturnal-export.ts +390 -0
  69. package/{dist/core/nocturnal-paths.js → src/core/nocturnal-paths.ts} +49 -23
  70. package/src/core/nocturnal-trajectory-extractor.ts +484 -0
  71. package/src/core/nocturnal-trinity.ts +1384 -0
  72. package/src/core/pain.ts +122 -0
  73. package/{dist/core/path-resolver.js → src/core/path-resolver.ts} +157 -36
  74. package/{dist/core/paths.js → src/core/paths.ts} +13 -4
  75. package/src/core/principle-training-state.ts +450 -0
  76. package/src/core/profile.ts +226 -0
  77. package/src/core/promotion-gate.ts +822 -0
  78. package/{dist/core/risk-calculator.js → src/core/risk-calculator.ts} +42 -16
  79. package/{dist/core/session-tracker.js → src/core/session-tracker.ts} +175 -62
  80. package/src/core/shadow-observation-registry.ts +534 -0
  81. package/{dist/core/system-logger.js → src/core/system-logger.ts} +9 -5
  82. package/src/core/thinking-models.ts +217 -0
  83. package/src/core/training-program.ts +630 -0
  84. package/src/core/trajectory-types.ts +243 -0
  85. package/src/core/trajectory.ts +1673 -0
  86. package/{dist/core/workspace-context.js → src/core/workspace-context.ts} +57 -32
  87. package/src/hooks/bash-risk.ts +171 -0
  88. package/src/hooks/edit-verification.ts +295 -0
  89. package/src/hooks/gate-block-helper.ts +160 -0
  90. package/src/hooks/gate.ts +210 -0
  91. package/src/hooks/gfi-gate.ts +177 -0
  92. package/src/hooks/lifecycle.ts +326 -0
  93. package/{dist/hooks/llm.js → src/hooks/llm.ts} +160 -80
  94. package/src/hooks/message-sanitize.ts +45 -0
  95. package/src/hooks/pain.ts +384 -0
  96. package/src/hooks/progressive-trust-gate.ts +174 -0
  97. package/src/hooks/prompt.ts +920 -0
  98. package/src/hooks/subagent.ts +207 -0
  99. package/src/hooks/thinking-checkpoint.ts +73 -0
  100. package/src/hooks/trajectory-collector.ts +290 -0
  101. package/src/http/principles-console-route.ts +716 -0
  102. package/src/i18n/commands.ts +117 -0
  103. package/src/index.ts +694 -0
  104. package/src/service/central-database.ts +831 -0
  105. package/src/service/control-ui-query-service.ts +888 -0
  106. package/src/service/evolution-query-service.ts +405 -0
  107. package/src/service/evolution-worker.ts +1646 -0
  108. package/src/service/health-query-service.ts +836 -0
  109. package/{dist/service/nocturnal-runtime.js → src/service/nocturnal-runtime.ts} +235 -79
  110. package/src/service/nocturnal-service.ts +1015 -0
  111. package/src/service/nocturnal-target-selector.ts +532 -0
  112. package/src/service/phase3-input-filter.ts +237 -0
  113. package/src/service/runtime-summary-service.ts +757 -0
  114. package/src/service/subagent-workflow/deep-reflect-workflow-manager.ts +513 -0
  115. package/{dist/service/subagent-workflow/empathy-observer-workflow-manager.js → src/service/subagent-workflow/empathy-observer-workflow-manager.ts} +240 -117
  116. package/src/service/subagent-workflow/index.ts +51 -0
  117. package/src/service/subagent-workflow/nocturnal-workflow-manager.ts +856 -0
  118. package/src/service/subagent-workflow/runtime-direct-driver.ts +166 -0
  119. package/{dist/service/subagent-workflow/types.d.ts → src/service/subagent-workflow/types.ts} +137 -18
  120. package/src/service/subagent-workflow/workflow-store.ts +328 -0
  121. package/src/service/trajectory-service.ts +15 -0
  122. package/{dist/tools/critique-prompt.js → src/tools/critique-prompt.ts} +25 -8
  123. package/src/tools/deep-reflect.ts +349 -0
  124. package/{dist/tools/model-index.js → src/tools/model-index.ts} +33 -17
  125. package/src/types/event-types.ts +453 -0
  126. package/src/types/hygiene-types.ts +31 -0
  127. package/src/types/principle-tree-schema.ts +244 -0
  128. package/src/types/runtime-summary.ts +49 -0
  129. package/src/types.ts +74 -0
  130. package/src/utils/file-lock.ts +391 -0
  131. package/{dist/utils/glob-match.js → src/utils/glob-match.ts} +21 -20
  132. package/{dist/utils/hashing.js → src/utils/hashing.ts} +6 -4
  133. package/src/utils/io.ts +110 -0
  134. package/{dist/utils/nlp.js → src/utils/nlp.ts} +19 -12
  135. package/{dist/utils/plugin-logger.js → src/utils/plugin-logger.ts} +33 -8
  136. package/src/utils/subagent-probe.ts +94 -0
  137. package/templates/langs/zh/skills/pd-diagnostician/SKILL.md +70 -1
  138. package/templates/pain_settings.json +2 -1
  139. package/tests/README.md +120 -0
  140. package/tests/build-artifacts.test.ts +111 -0
  141. package/tests/commands/evolution-status.test.ts +222 -0
  142. package/tests/commands/evolver.test.ts +22 -0
  143. package/tests/commands/export.test.ts +78 -0
  144. package/tests/commands/nocturnal-review.test.ts +448 -0
  145. package/tests/commands/nocturnal-train.test.ts +97 -0
  146. package/tests/commands/pain.test.ts +108 -0
  147. package/tests/commands/samples.test.ts +65 -0
  148. package/tests/commands/strategy.test.ts +34 -0
  149. package/tests/commands/thinking-os.test.ts +88 -0
  150. package/tests/core/adaptive-thresholds.test.ts +261 -0
  151. package/tests/core/config-service.test.ts +89 -0
  152. package/tests/core/config.test.ts +90 -0
  153. package/tests/core/control-ui-db.test.ts +75 -0
  154. package/tests/core/core-template-guidance.test.ts +21 -0
  155. package/tests/core/detection-funnel.test.ts +63 -0
  156. package/tests/core/detection-service.test.ts +50 -0
  157. package/tests/core/dictionary-service.test.ts +116 -0
  158. package/tests/core/dictionary.test.ts +168 -0
  159. package/tests/core/empathy-keyword-matcher.test.ts +209 -0
  160. package/tests/core/event-log.test.ts +181 -0
  161. package/tests/core/evolution-e2e.test.ts +58 -0
  162. package/tests/core/evolution-engine-gate-integration.test.ts +543 -0
  163. package/tests/core/evolution-engine.test.ts +562 -0
  164. package/tests/core/evolution-logger.test.ts +148 -0
  165. package/tests/core/evolution-migration.test.ts +50 -0
  166. package/tests/core/evolution-paths.test.ts +21 -0
  167. package/tests/core/evolution-reducer.detector-metadata.test.ts +602 -0
  168. package/tests/core/evolution-reducer.test.ts +180 -0
  169. package/tests/core/evolution-types-loop.test.ts +48 -0
  170. package/tests/core/evolution-user-stories.e2e.test.ts +249 -0
  171. package/tests/core/external-training-contract.test.ts +463 -0
  172. package/tests/core/focus-history.test.ts +682 -0
  173. package/tests/core/init-flatten.test.ts +69 -0
  174. package/tests/core/init-refactor.test.ts +87 -0
  175. package/tests/core/init-v1.3.test.ts +46 -0
  176. package/tests/core/init.test.ts +190 -0
  177. package/tests/core/local-worker-routing.test.ts +757 -0
  178. package/tests/core/migration.test.ts +84 -0
  179. package/tests/core/model-deployment-registry.test.ts +845 -0
  180. package/tests/core/model-training-registry.test.ts +889 -0
  181. package/tests/core/nocturnal-arbiter.test.ts +494 -0
  182. package/tests/core/nocturnal-candidate-scoring.test.ts +400 -0
  183. package/tests/core/nocturnal-compliance.test.ts +646 -0
  184. package/tests/core/nocturnal-dataset.test.ts +892 -0
  185. package/tests/core/nocturnal-executability.test.ts +357 -0
  186. package/tests/core/nocturnal-export.test.ts +462 -0
  187. package/tests/core/nocturnal-reviewed-subset-comparison.test.ts +428 -0
  188. package/tests/core/nocturnal-trajectory-extractor.test.ts +634 -0
  189. package/tests/core/nocturnal-trinity.test.ts +953 -0
  190. package/tests/core/pain.test.ts +33 -0
  191. package/tests/core/path-resolver.test.ts +57 -0
  192. package/tests/core/paths-refactor.test.ts +42 -0
  193. package/tests/core/phase7-rollout-integration.test.ts +477 -0
  194. package/tests/core/principle-training-state.test.ts +712 -0
  195. package/tests/core/profile.test.ts +56 -0
  196. package/tests/core/promotion-gate.test.ts +556 -0
  197. package/tests/core/risk-calculator.test.ts +168 -0
  198. package/tests/core/session-tracker.test.ts +191 -0
  199. package/tests/core/training-program.test.ts +472 -0
  200. package/tests/core/trajectory.test.ts +265 -0
  201. package/tests/core/workspace-context-factory.test.ts +18 -0
  202. package/tests/core/workspace-context.test.ts +134 -0
  203. package/tests/fixtures/nocturnal-reviewed-subset.json +183 -0
  204. package/tests/fixtures/production-compatibility.test.ts +147 -0
  205. package/tests/fixtures/production-mock-generator.ts +282 -0
  206. package/tests/hooks/bash-risk-integration.test.ts +137 -0
  207. package/tests/hooks/bash-risk.test.ts +81 -0
  208. package/tests/hooks/edit-verification.test.ts +678 -0
  209. package/tests/hooks/gate-edit-verification-p1.test.ts +632 -0
  210. package/tests/hooks/gate-edit-verification.test.ts +435 -0
  211. package/tests/hooks/gate-pipeline-integration.test.ts +404 -0
  212. package/tests/hooks/gate.test.ts +271 -0
  213. package/tests/hooks/gfi-gate-unit.test.ts +422 -0
  214. package/tests/hooks/gfi-gate.test.ts +669 -0
  215. package/tests/hooks/lifecycle.test.ts +248 -0
  216. package/tests/hooks/llm.test.ts +308 -0
  217. package/tests/hooks/message-sanitize.test.ts +36 -0
  218. package/tests/hooks/pain.test.ts +141 -0
  219. package/tests/hooks/progressive-trust-gate.test.ts +277 -0
  220. package/tests/hooks/prompt.test.ts +1411 -0
  221. package/tests/hooks/subagent.test.ts +467 -0
  222. package/tests/hooks/thinking-gate.test.ts +313 -0
  223. package/tests/http/principles-console-route.test.ts +140 -0
  224. package/tests/hygiene-tracker.test.ts +77 -0
  225. package/tests/index.integration.test.ts +179 -0
  226. package/tests/index.shadow-routing.integration.test.ts +140 -0
  227. package/tests/index.test.ts +9 -0
  228. package/tests/integration/empathy-workflow-integration.test.ts +627 -0
  229. package/tests/service/control-ui-query-service.test.ts +121 -0
  230. package/tests/service/empathy-observer-workflow-manager.test.ts +176 -0
  231. package/tests/service/evolution-worker.test.ts +585 -0
  232. package/tests/service/nocturnal-runtime.test.ts +470 -0
  233. package/tests/service/nocturnal-service.test.ts +577 -0
  234. package/tests/service/nocturnal-target-selector.test.ts +615 -0
  235. package/tests/service/nocturnal-workflow-manager.test.ts +439 -0
  236. package/tests/service/phase3-input-filter.test.ts +289 -0
  237. package/tests/service/runtime-summary-service.test.ts +919 -0
  238. package/tests/task-compliance.test.ts +166 -0
  239. package/tests/test-utils.ts +48 -0
  240. package/tests/tools/critique-prompt.test.ts +260 -0
  241. package/tests/tools/deep-reflect.test.ts +232 -0
  242. package/tests/tools/model-index.test.ts +246 -0
  243. package/tests/ui/app.test.tsx +114 -0
  244. package/tests/utils/file-lock.test.ts +407 -0
  245. package/tests/utils/hashing.test.ts +32 -0
  246. package/tests/utils/io.test.ts +39 -0
  247. package/tests/utils/nlp.test.ts +53 -0
  248. package/tests/utils/plugin-logger.test.ts +156 -0
  249. package/tsconfig.json +16 -0
  250. package/tsconfig.tsbuildinfo +1 -0
  251. package/ui/src/App.tsx +45 -0
  252. package/ui/src/api.ts +216 -0
  253. package/ui/src/charts.tsx +586 -0
  254. package/ui/src/components/ErrorState.tsx +6 -0
  255. package/ui/src/components/Loading.tsx +13 -0
  256. package/ui/src/components/ProtectedRoute.tsx +12 -0
  257. package/ui/src/components/Shell.tsx +91 -0
  258. package/ui/src/components/WorkspaceConfig.tsx +146 -0
  259. package/ui/src/components/index.ts +5 -0
  260. package/ui/src/context/auth.tsx +80 -0
  261. package/ui/src/context/theme.tsx +66 -0
  262. package/ui/src/hooks/useAutoRefresh.ts +39 -0
  263. package/ui/src/i18n/ui.ts +363 -0
  264. package/ui/src/main.tsx +16 -0
  265. package/ui/src/pages/EvolutionPage.tsx +352 -0
  266. package/ui/src/pages/FeedbackPage.tsx +140 -0
  267. package/ui/src/pages/GateMonitorPage.tsx +136 -0
  268. package/ui/src/pages/LoginPage.tsx +88 -0
  269. package/ui/src/pages/OverviewPage.tsx +238 -0
  270. package/ui/src/pages/SamplesPage.tsx +174 -0
  271. package/ui/src/pages/ThinkingModelsPage.tsx +127 -0
  272. package/ui/src/styles.css +1661 -0
  273. package/ui/src/types.ts +368 -0
  274. package/ui/src/utils/format.ts +15 -0
  275. package/vitest.config.ts +23 -0
  276. package/dist/commands/capabilities.d.ts +0 -3
  277. package/dist/commands/capabilities.js +0 -73
  278. package/dist/commands/context.d.ts +0 -5
  279. package/dist/commands/evolution-status.d.ts +0 -4
  280. package/dist/commands/evolution-status.js +0 -117
  281. package/dist/commands/evolver.d.ts +0 -9
  282. package/dist/commands/evolver.js +0 -26
  283. package/dist/commands/export.d.ts +0 -2
  284. package/dist/commands/export.js +0 -98
  285. package/dist/commands/focus.d.ts +0 -14
  286. package/dist/commands/focus.js +0 -457
  287. package/dist/commands/nocturnal-review.d.ts +0 -24
  288. package/dist/commands/nocturnal-review.js +0 -265
  289. package/dist/commands/nocturnal-rollout.d.ts +0 -27
  290. package/dist/commands/nocturnal-rollout.js +0 -671
  291. package/dist/commands/nocturnal-train.d.ts +0 -25
  292. package/dist/commands/nocturnal-train.js +0 -919
  293. package/dist/commands/pain.d.ts +0 -5
  294. package/dist/commands/principle-rollback.d.ts +0 -4
  295. package/dist/commands/principle-rollback.js +0 -22
  296. package/dist/commands/rollback.d.ts +0 -19
  297. package/dist/commands/samples.d.ts +0 -2
  298. package/dist/commands/samples.js +0 -55
  299. package/dist/commands/strategy.d.ts +0 -3
  300. package/dist/commands/strategy.js +0 -29
  301. package/dist/commands/thinking-os.d.ts +0 -2
  302. package/dist/config/defaults/runtime.d.ts +0 -40
  303. package/dist/config/errors.d.ts +0 -84
  304. package/dist/config/errors.js +0 -94
  305. package/dist/config/index.js +0 -7
  306. package/dist/constants/diagnostician.d.ts +0 -12
  307. package/dist/constants/diagnostician.js +0 -56
  308. package/dist/constants/tools.d.ts +0 -17
  309. package/dist/constants/tools.js +0 -54
  310. package/dist/core/adaptive-thresholds.d.ts +0 -186
  311. package/dist/core/adaptive-thresholds.js +0 -300
  312. package/dist/core/config-service.d.ts +0 -15
  313. package/dist/core/config.d.ts +0 -129
  314. package/dist/core/control-ui-db.d.ts +0 -95
  315. package/dist/core/control-ui-db.js +0 -292
  316. package/dist/core/detection-funnel.d.ts +0 -33
  317. package/dist/core/detection-service.d.ts +0 -15
  318. package/dist/core/dictionary-service.d.ts +0 -15
  319. package/dist/core/dictionary.d.ts +0 -38
  320. package/dist/core/event-log.d.ts +0 -82
  321. package/dist/core/event-log.js +0 -463
  322. package/dist/core/evolution-engine.d.ts +0 -118
  323. package/dist/core/evolution-engine.js +0 -464
  324. package/dist/core/evolution-logger.d.ts +0 -137
  325. package/dist/core/evolution-logger.js +0 -256
  326. package/dist/core/evolution-migration.d.ts +0 -5
  327. package/dist/core/evolution-migration.js +0 -65
  328. package/dist/core/evolution-reducer.d.ts +0 -98
  329. package/dist/core/evolution-reducer.js +0 -465
  330. package/dist/core/evolution-types.d.ts +0 -287
  331. package/dist/core/evolution-types.js +0 -78
  332. package/dist/core/external-training-contract.d.ts +0 -276
  333. package/dist/core/external-training-contract.js +0 -269
  334. package/dist/core/focus-history.d.ts +0 -210
  335. package/dist/core/focus-history.js +0 -1185
  336. package/dist/core/hygiene/tracker.d.ts +0 -22
  337. package/dist/core/hygiene/tracker.js +0 -106
  338. package/dist/core/init.d.ts +0 -12
  339. package/dist/core/local-worker-routing.d.ts +0 -175
  340. package/dist/core/local-worker-routing.js +0 -525
  341. package/dist/core/migration.d.ts +0 -6
  342. package/dist/core/model-deployment-registry.d.ts +0 -218
  343. package/dist/core/model-deployment-registry.js +0 -503
  344. package/dist/core/model-training-registry.d.ts +0 -295
  345. package/dist/core/model-training-registry.js +0 -475
  346. package/dist/core/nocturnal-arbiter.d.ts +0 -159
  347. package/dist/core/nocturnal-arbiter.js +0 -534
  348. package/dist/core/nocturnal-candidate-scoring.d.ts +0 -137
  349. package/dist/core/nocturnal-candidate-scoring.js +0 -266
  350. package/dist/core/nocturnal-compliance.d.ts +0 -175
  351. package/dist/core/nocturnal-compliance.js +0 -824
  352. package/dist/core/nocturnal-dataset.d.ts +0 -224
  353. package/dist/core/nocturnal-dataset.js +0 -443
  354. package/dist/core/nocturnal-executability.d.ts +0 -85
  355. package/dist/core/nocturnal-executability.js +0 -331
  356. package/dist/core/nocturnal-export.d.ts +0 -124
  357. package/dist/core/nocturnal-export.js +0 -275
  358. package/dist/core/nocturnal-paths.d.ts +0 -124
  359. package/dist/core/nocturnal-trajectory-extractor.d.ts +0 -242
  360. package/dist/core/nocturnal-trajectory-extractor.js +0 -307
  361. package/dist/core/nocturnal-trinity.d.ts +0 -311
  362. package/dist/core/nocturnal-trinity.js +0 -880
  363. package/dist/core/pain.d.ts +0 -4
  364. package/dist/core/pain.js +0 -70
  365. package/dist/core/path-resolver.d.ts +0 -46
  366. package/dist/core/paths.d.ts +0 -65
  367. package/dist/core/principle-training-state.d.ts +0 -121
  368. package/dist/core/principle-training-state.js +0 -321
  369. package/dist/core/profile.d.ts +0 -62
  370. package/dist/core/profile.js +0 -210
  371. package/dist/core/promotion-gate.d.ts +0 -238
  372. package/dist/core/promotion-gate.js +0 -529
  373. package/dist/core/risk-calculator.d.ts +0 -22
  374. package/dist/core/session-tracker.d.ts +0 -101
  375. package/dist/core/shadow-observation-registry.d.ts +0 -217
  376. package/dist/core/shadow-observation-registry.js +0 -308
  377. package/dist/core/system-logger.d.ts +0 -8
  378. package/dist/core/thinking-models.d.ts +0 -38
  379. package/dist/core/thinking-models.js +0 -170
  380. package/dist/core/training-program.d.ts +0 -233
  381. package/dist/core/training-program.js +0 -433
  382. package/dist/core/trajectory.d.ts +0 -411
  383. package/dist/core/trajectory.js +0 -1307
  384. package/dist/core/workspace-context.d.ts +0 -71
  385. package/dist/hooks/bash-risk.d.ts +0 -57
  386. package/dist/hooks/bash-risk.js +0 -137
  387. package/dist/hooks/edit-verification.d.ts +0 -62
  388. package/dist/hooks/edit-verification.js +0 -256
  389. package/dist/hooks/gate-block-helper.d.ts +0 -44
  390. package/dist/hooks/gate-block-helper.js +0 -119
  391. package/dist/hooks/gate.d.ts +0 -24
  392. package/dist/hooks/gate.js +0 -173
  393. package/dist/hooks/gfi-gate.d.ts +0 -40
  394. package/dist/hooks/gfi-gate.js +0 -113
  395. package/dist/hooks/lifecycle.d.ts +0 -5
  396. package/dist/hooks/lifecycle.js +0 -284
  397. package/dist/hooks/llm.d.ts +0 -13
  398. package/dist/hooks/message-sanitize.d.ts +0 -3
  399. package/dist/hooks/message-sanitize.js +0 -37
  400. package/dist/hooks/pain.d.ts +0 -5
  401. package/dist/hooks/pain.js +0 -301
  402. package/dist/hooks/progressive-trust-gate.d.ts +0 -52
  403. package/dist/hooks/progressive-trust-gate.js +0 -134
  404. package/dist/hooks/prompt.d.ts +0 -49
  405. package/dist/hooks/prompt.js +0 -905
  406. package/dist/hooks/subagent.d.ts +0 -10
  407. package/dist/hooks/subagent.js +0 -387
  408. package/dist/hooks/thinking-checkpoint.d.ts +0 -37
  409. package/dist/hooks/thinking-checkpoint.js +0 -51
  410. package/dist/hooks/trajectory-collector.d.ts +0 -32
  411. package/dist/hooks/trajectory-collector.js +0 -256
  412. package/dist/http/principles-console-route.d.ts +0 -9
  413. package/dist/http/principles-console-route.js +0 -681
  414. package/dist/i18n/commands.d.ts +0 -26
  415. package/dist/i18n/commands.js +0 -116
  416. package/dist/index.d.ts +0 -7
  417. package/dist/index.js +0 -581
  418. package/dist/service/central-database.d.ts +0 -104
  419. package/dist/service/central-database.js +0 -649
  420. package/dist/service/control-ui-query-service.d.ts +0 -221
  421. package/dist/service/control-ui-query-service.js +0 -543
  422. package/dist/service/empathy-observer-manager.d.ts +0 -88
  423. package/dist/service/empathy-observer-manager.js +0 -414
  424. package/dist/service/evolution-query-service.d.ts +0 -155
  425. package/dist/service/evolution-query-service.js +0 -258
  426. package/dist/service/evolution-worker.d.ts +0 -101
  427. package/dist/service/evolution-worker.js +0 -975
  428. package/dist/service/health-query-service.d.ts +0 -170
  429. package/dist/service/health-query-service.js +0 -662
  430. package/dist/service/nocturnal-runtime.d.ts +0 -183
  431. package/dist/service/nocturnal-service.d.ts +0 -163
  432. package/dist/service/nocturnal-service.js +0 -787
  433. package/dist/service/nocturnal-target-selector.d.ts +0 -145
  434. package/dist/service/nocturnal-target-selector.js +0 -315
  435. package/dist/service/phase3-input-filter.d.ts +0 -73
  436. package/dist/service/phase3-input-filter.js +0 -172
  437. package/dist/service/runtime-summary-service.d.ts +0 -122
  438. package/dist/service/runtime-summary-service.js +0 -485
  439. package/dist/service/subagent-workflow/empathy-observer-workflow-manager.d.ts +0 -48
  440. package/dist/service/subagent-workflow/index.d.ts +0 -4
  441. package/dist/service/subagent-workflow/index.js +0 -3
  442. package/dist/service/subagent-workflow/runtime-direct-driver.d.ts +0 -77
  443. package/dist/service/subagent-workflow/runtime-direct-driver.js +0 -75
  444. package/dist/service/subagent-workflow/types.js +0 -11
  445. package/dist/service/subagent-workflow/workflow-store.d.ts +0 -26
  446. package/dist/service/subagent-workflow/workflow-store.js +0 -165
  447. package/dist/service/trajectory-service.d.ts +0 -2
  448. package/dist/service/trajectory-service.js +0 -15
  449. package/dist/tools/critique-prompt.d.ts +0 -14
  450. package/dist/tools/deep-reflect.d.ts +0 -39
  451. package/dist/tools/deep-reflect.js +0 -350
  452. package/dist/tools/model-index.d.ts +0 -9
  453. package/dist/types/event-types.d.ts +0 -306
  454. package/dist/types/event-types.js +0 -106
  455. package/dist/types/hygiene-types.d.ts +0 -20
  456. package/dist/types/hygiene-types.js +0 -12
  457. package/dist/types/runtime-summary.d.ts +0 -47
  458. package/dist/types/runtime-summary.js +0 -1
  459. package/dist/types.d.ts +0 -50
  460. package/dist/types.js +0 -22
  461. package/dist/utils/file-lock.d.ts +0 -71
  462. package/dist/utils/file-lock.js +0 -309
  463. package/dist/utils/glob-match.d.ts +0 -28
  464. package/dist/utils/hashing.d.ts +0 -9
  465. package/dist/utils/io.d.ts +0 -6
  466. package/dist/utils/io.js +0 -106
  467. package/dist/utils/nlp.d.ts +0 -9
  468. package/dist/utils/plugin-logger.d.ts +0 -39
  469. package/dist/utils/subagent-probe.d.ts +0 -34
  470. package/dist/utils/subagent-probe.js +0 -81
@@ -0,0 +1,630 @@
1
+ /**
2
+ * Training Program — Orchestrates External Training Execution and Lineage
3
+ * =========================================================================
4
+ *
5
+ * PURPOSE: Coordinate the training workflow from experiment spec creation
6
+ * through checkpoint registration and eval attachment.
7
+ *
8
+ * ARCHITECTURE:
9
+ * - TrainingProgram orchestrates the workflow but does NOT execute training itself
10
+ * - External trainer backends (Python scripts) do the actual training
11
+ * - Training run, checkpoint, and eval lineage is registered in model-training-registry
12
+ * - Promotion gate (promotion-gate.ts) controls deployment readiness
13
+ *
14
+ * WORKFLOW:
15
+ * 1. Create experiment spec (TrainingProgram.createExperiment)
16
+ * 2. Execute external trainer (TrainingProgram.executeTrainer)
17
+ * 3. Validate trainer result against spec (validateTrainerResult)
18
+ * 4. Register training run (model-training-registry)
19
+ * 5. Register checkpoint (model-training-registry)
20
+ * 6. Attach eval summary after benchmark (model-training-registry)
21
+ * 7. Promotion gate controls deployment readiness
22
+ *
23
+ * DESIGN CONSTRAINTS:
24
+ * - ORPO-first: only 'orpo' training mode
25
+ * - No training inside the plugin runtime
26
+ * - No direct deployment binding from trainer output
27
+ * - Trainer backends are fire-and-forget (plugin does not poll trainer)
28
+ * - All lineage must be traceable through model-training-registry
29
+ */
30
+
31
+ import * as fs from 'fs';
32
+ import * as path from 'path';
33
+ import * as crypto from 'crypto';
34
+ import { fileURLToPath } from 'url';
35
+ import {
36
+ type TrainingExperimentSpec,
37
+ type TrainingExperimentResult,
38
+ type TrainerBackendKind,
39
+ type TrainableWorkerProfile,
40
+ type HardwareTier,
41
+ type TrainingHyperparameters,
42
+ type TrainingBudget,
43
+ validateTrainerResult,
44
+ computeConfigFingerprint,
45
+ computeDatasetFingerprint,
46
+ computeCodeHash,
47
+ generateExperimentId,
48
+ validateHardwareTier,
49
+ getDefaultHardwareTier,
50
+ isValidModelFamilyForProfile,
51
+ LOCAL_EDITOR_ENABLED,
52
+ } from './external-training-contract.js';
53
+ import {
54
+ registerTrainingRun,
55
+ startTrainingRun,
56
+ completeTrainingRun,
57
+ failTrainingRun,
58
+ registerCheckpoint,
59
+ attachEvalSummary,
60
+ markCheckpointDeployable,
61
+ getCheckpointLineage,
62
+ } from './model-training-registry.js';
63
+
64
+ // ---------------------------------------------------------------------------
65
+ // Constants
66
+ // ---------------------------------------------------------------------------
67
+
68
+ /**
69
+ * Relative path of the external trainer scripts directory (presumably resolved against REPO_ROOT — confirm at the use site).
70
+ */
71
+ const TRAINER_SCRIPTS_DIR = 'scripts/nocturnal/trainer';
72
+ const MODULE_DIR = path.dirname(fileURLToPath(import.meta.url)); // directory containing this module file
73
+ const REPO_ROOT = path.resolve(MODULE_DIR, '..', '..', '..', '..'); // four directory levels above MODULE_DIR
74
+
75
+ /**
76
+ * Default hyperparameters for ORPO training; createExperiment spreads caller-supplied overrides on top of these.
77
+ * These are conservative defaults for a consumer GPU (RTX 4090 24GB).
78
+ */
79
+ export const DEFAULT_ORPO_HYPERPARAMETERS: TrainingHyperparameters = {
80
+ learningRate: 3e-4,
81
+ batchSize: 2,
82
+ gradientAccumulation: 8,
83
+ loraRank: 16,
84
+ loraAlpha: 32,
85
+ loraDropout: 0.05,
86
+ warmupRatio: 0.1,
87
+ maxSteps: 1000,
88
+ maxSeqLength: 2048,
89
+ };
90
+
91
+ /**
92
+ * Default budget for training runs: a wall-clock limit in minutes and a cap on training tokens.
93
+ */
94
+ export const DEFAULT_BUDGET: TrainingBudget = {
95
+ maxWallClockMinutes: 240, // 4 hours
96
+ maxTrainTokens: 2_000_000, // two million tokens
97
+ };
98
+
99
+ // ---------------------------------------------------------------------------
100
+ // Experiment Spec Creation
101
+ // ---------------------------------------------------------------------------
102
+
103
+ /**
104
+ * Parameters accepted by createExperiment when creating a training experiment.
105
+ */
106
+ export interface CreateExperimentParams {
107
+ /** Target worker profile; createExperiment rejects 'local-editor' while LOCAL_EDITOR_ENABLED is false */
108
+ targetWorkerProfile: TrainableWorkerProfile;
109
+
110
+ /** Target model family; must pass isValidModelFamilyForProfile for the target worker profile */
111
+ targetModelFamily: string;
112
+
113
+ /** Hardware tier; when omitted, getDefaultHardwareTier(backend) is used, and the result is checked by validateHardwareTier */
114
+ hardwareTier?: HardwareTier;
115
+
116
+ /** Trainer backend to use; also selects the default hardware tier when none is given */
117
+ backend: TrainerBackendKind;
118
+
119
+ /** Dataset export ID */
120
+ datasetExportId: string;
121
+
122
+ /** Dataset export path */
123
+ datasetExportPath: string;
124
+
125
+ /** Dataset fingerprint */
126
+ datasetFingerprint: string;
127
+
128
+ /** Benchmark export ID */
129
+ benchmarkExportId: string;
130
+
131
+ /** Output directory for checkpoints */
132
+ outputDir: string;
133
+
134
+ /** Custom hyperparameters (optional); spread over DEFAULT_ORPO_HYPERPARAMETERS, so only the supplied fields change */
135
+ hyperparameters?: Partial<TrainingHyperparameters>;
136
+
137
+ /** Custom budget (optional) */
138
+ budget?: Partial<TrainingBudget>;
139
+ }
140
+
141
+ /**
142
+ * Result of creating an experiment, as returned by createExperiment.
143
+ */
144
+ export interface CreateExperimentResult {
145
+ /** The experiment specification that was built for this run */
146
+ spec: TrainingExperimentSpec;
147
+
148
+ /** The registered training run ID */
149
+ trainRunId: string;
150
+ }
151
+
152
/**
 * Layer caller-supplied overrides on top of defaults, skipping any override
 * whose value is `undefined`.
 *
 * A plain object spread would let `{ key: undefined }` erase the default for
 * `key`; this helper keeps the default in that case.
 */
function mergeDefinedOverrides<T extends object>(defaults: T, overrides?: Partial<T>): T {
  const merged = { ...defaults };
  if (overrides) {
    for (const key of Object.keys(overrides) as (keyof T)[]) {
      const value = overrides[key];
      if (value !== undefined) {
        merged[key] = value as T[keyof T];
      }
    }
  }
  return merged;
}

/**
 * Create a new training experiment.
 *
 * Validates the request, builds the experiment spec (ORPO training mode,
 * PEFT adapter artifact), and registers a training run for it in the registry.
 *
 * Optional `hyperparameters` / `budget` overrides are merged over
 * `DEFAULT_ORPO_HYPERPARAMETERS` / `DEFAULT_BUDGET`. Override keys that are
 * explicitly `undefined` are ignored so they cannot wipe out a default
 * (an undefined `maxWallClockMinutes`, for example, would turn the trainer
 * timeout into `NaN`).
 *
 * @param stateDir - Workspace state directory
 * @param params - Experiment parameters
 * @returns Created experiment spec and registered training run ID
 *
 * @throws Error if the worker profile is 'local-editor' while LOCAL_EDITOR_ENABLED is false
 * @throws Error if the model family is not valid for the worker profile
 * @throws Error if the hardware tier is rejected by validateHardwareTier for the backend
 */
export function createExperiment(
  stateDir: string,
  params: CreateExperimentParams
): CreateExperimentResult {
  // --- Validate worker profile ---
  if (params.targetWorkerProfile === 'local-editor' && !LOCAL_EDITOR_ENABLED) {
    throw new Error(
      `Training for 'local-editor' is not yet enabled. ` +
        `Phase 7 first rollout is limited to 'local-reader'. ` +
        `To enable local-editor training, set LOCAL_EDITOR_ENABLED = true ` +
        `in external-training-contract.ts after appropriate review.`
    );
  }

  // --- Validate model family for profile ---
  if (!isValidModelFamilyForProfile(params.targetModelFamily, params.targetWorkerProfile)) {
    throw new Error(
      `Model family '${params.targetModelFamily}' is not valid for profile ` +
        `'${params.targetWorkerProfile}'. ` +
        `Ensure the model family name contains an appropriate keyword.`
    );
  }

  // --- Validate hardware tier (fall back to the backend default when unset) ---
  const tier = params.hardwareTier ?? getDefaultHardwareTier(params.backend);
  validateHardwareTier(params.backend, tier);

  // --- Merge overrides over defaults, ignoring explicit `undefined` values ---
  const hyperparameters: TrainingHyperparameters = mergeDefinedOverrides(
    DEFAULT_ORPO_HYPERPARAMETERS,
    params.hyperparameters
  );
  const budget: TrainingBudget = mergeDefinedOverrides(DEFAULT_BUDGET, params.budget);

  // --- Compute fingerprints ---
  const configFingerprint = computeConfigFingerprint(hyperparameters);
  const codeHash = computeCodeHash();

  // --- Create experiment spec ---
  const spec: TrainingExperimentSpec = {
    experimentId: generateExperimentId(),
    backend: params.backend,
    trainingMode: 'orpo',
    targetWorkerProfile: params.targetWorkerProfile,
    targetModelFamily: params.targetModelFamily,
    hardwareTier: tier,
    datasetExportId: params.datasetExportId,
    datasetExportPath: params.datasetExportPath,
    datasetFingerprint: params.datasetFingerprint,
    benchmarkExportId: params.benchmarkExportId,
    outputDir: params.outputDir,
    configFingerprint,
    codeHash,
    hyperparameters,
    budget,
    expectedArtifact: {
      checkpointName: `checkpoint-${params.targetModelFamily}-${Date.now()}`,
      adapterFormat: 'peft-adapter',
    },
  };

  // --- Register training run in registry ---
  const trainRun = registerTrainingRun(stateDir, {
    experimentId: spec.experimentId,
    targetModelFamily: spec.targetModelFamily,
    datasetFingerprint: spec.datasetFingerprint,
    exportId: spec.datasetExportId,
    sampleCount: 0, // Will be updated when result is registered
    configFingerprint: spec.configFingerprint,
  });

  return { spec, trainRunId: trainRun.trainRunId };
}
237
+
238
+ // ---------------------------------------------------------------------------
239
+ // Trainer Execution
240
+ // ---------------------------------------------------------------------------
241
+
242
/**
 * Object form of the inputs needed to run an external trainer.
 */
export interface ExecuteTrainerParams {
  /** Experiment specification to hand to the trainer. */
  spec: TrainingExperimentSpec;

  /** Directory containing the trainer scripts (optional override). */
  scriptsDir?: string;
}
252
+
253
/**
 * Execute an external trainer backend and return its parsed result.
 *
 * Flow:
 * 1. `dry-run` backend: return a synthetic `dry_run` result immediately.
 *    No spec file is written, no directory is created, no process is spawned.
 * 2. Otherwise verify the trainer script exists, write the spec as JSON next to
 *    it, and spawn Python with `--spec <file> --output-dir <spec.outputDir>`.
 * 3. Wait for the process to exit, then parse its result.
 * 4. Always remove the spec file afterwards.
 *
 * The trainer protocol:
 * - stdout: MUST contain only the machine-readable JSON result. At most 1MB is
 *   retained; anything beyond that is dropped (which makes stdout unparseable
 *   and triggers the result-file fallback).
 * - stderr: streamed straight to the parent's stderr, never buffered.
 * - result file: `result-<experimentId>.json` in `spec.outputDir`, used when
 *   stdout is empty or not valid JSON, and as a last resort on non-zero exit.
 *
 * The returned promise settles only once the trainer has exited, failed to
 * spawn, or been killed after `budget.maxWallClockMinutes` plus a 30 second
 * grace period. The parsed JSON is returned as-is; it is not validated here.
 *
 * @param spec - The experiment specification
 * @param scriptsDir - Override for the scripts directory
 * @returns The trainer's result as parsed JSON object
 *
 * @throws Error if the trainer script is not found
 * @throws Error if the trainer cannot be spawned, times out, or exits non-zero
 *   without a readable result file
 * @throws Error if neither stdout nor the result file contains valid JSON
 */
export async function executeTrainer(
  spec: TrainingExperimentSpec,
  scriptsDir?: string
): Promise<import('./external-training-contract.js').TrainingExperimentResult> {
  type TrainerResult = import('./external-training-contract.js').TrainingExperimentResult;

  // Dry-run only echoes the spec's identity back; it needs neither the spec
  // file nor the scripts directory, so return before touching the filesystem.
  if (spec.backend === 'dry-run') {
    return {
      experimentId: spec.experimentId,
      backend: 'dry-run',
      status: 'dry_run' as const,
      targetWorkerProfile: spec.targetWorkerProfile,
      targetModelFamily: spec.targetModelFamily,
      datasetFingerprint: spec.datasetFingerprint,
      configFingerprint: spec.configFingerprint,
      codeHash: spec.codeHash,
      createdAt: new Date().toISOString(),
    };
  }

  const baseDir = scriptsDir ?? path.join(REPO_ROOT, TRAINER_SCRIPTS_DIR);

  // Map backend to script name
  const scriptMap: Record<TrainerBackendKind, string> = {
    'peft-trl-orpo': 'main.py',
    'unsloth-orpo': 'main.py',
    'dry-run': 'main.py',
  };
  const scriptPath = path.join(baseDir, scriptMap[spec.backend]);

  if (!fs.existsSync(scriptPath)) {
    throw new Error(
      `Trainer script not found: ${scriptPath}. ` +
        `Ensure the external trainer backends are installed at ${baseDir}.`
    );
  }

  // Spec file handed to the trainer, and the result file it may write back.
  const specPath = path.join(baseDir, `experiment-${spec.experimentId}.json`);
  const resultFilePath = path.join(spec.outputDir, `result-${spec.experimentId}.json`);

  const timeoutMs = spec.budget.maxWallClockMinutes * 60 * 1000 + 30000;
  const pythonExecutable = process.platform === 'win32' ? 'python' : 'python3';
  const MAX_STDOUT_BUFFER = 1 * 1024 * 1024; // 1MB cap

  // JSON.parse never yields `undefined`, so `undefined` is a safe "unparseable" marker.
  const tryParse = (text: string): TrainerResult | undefined => {
    try {
      return JSON.parse(text) as TrainerResult;
    } catch {
      return undefined;
    }
  };

  // Returns `undefined` when the result file is missing or not valid JSON.
  const readResultFile = (): TrainerResult | undefined => {
    if (!fs.existsSync(resultFilePath)) {
      return undefined;
    }
    try {
      return tryParse(fs.readFileSync(resultFilePath, 'utf-8'));
    } catch {
      return undefined;
    }
  };

  try {
    // Written inside the try so a partially written spec is still cleaned up.
    fs.mkdirSync(path.dirname(specPath), { recursive: true });
    fs.writeFileSync(specPath, JSON.stringify(spec, null, 2), 'utf-8');

    const { spawn } = await import('child_process');

    return await new Promise<TrainerResult>((resolve, reject) => {
      const proc = spawn(pythonExecutable, [
        scriptPath,
        '--spec',
        specPath,
        '--output-dir',
        spec.outputDir,
      ]);

      // 'error', 'close' and the timeout can all fire for one process; only
      // the first outcome counts and later ones must not do further work.
      let settled = false;

      const timer = setTimeout(() => {
        proc.kill();
        fail(`Trainer timed out after ${timeoutMs}ms`);
      }, timeoutMs);

      function succeed(value: TrainerResult): void {
        if (settled) return;
        settled = true;
        clearTimeout(timer);
        resolve(value);
      }

      function fail(message: string): void {
        if (settled) return;
        settled = true;
        clearTimeout(timer);
        reject(new Error(message));
      }

      // Collect stdout with size cap to prevent OOM from huge log output
      const stdoutChunks: Buffer[] = [];
      let stdoutSize = 0;

      proc.stdout.on('data', (chunk: Buffer) => {
        const remaining = MAX_STDOUT_BUFFER - stdoutSize;
        if (remaining > 0) {
          // subarray is the non-deprecated equivalent of Buffer#slice
          const kept = chunk.subarray(0, remaining);
          stdoutChunks.push(kept);
          stdoutSize += kept.length;
        }
      });

      // Pipe stderr directly — training logs must NOT accumulate in memory
      proc.stderr.pipe(process.stderr);

      proc.on('close', (code) => {
        if (settled) {
          // Already timed out or failed to spawn; nothing left to decide.
          return;
        }

        if (code === 0) {
          const trimmed = Buffer.concat(stdoutChunks).toString('utf-8').trim();
          if (trimmed) {
            const fromStdout = tryParse(trimmed);
            if (fromStdout !== undefined) {
              succeed(fromStdout);
              return;
            }
          }

          // Fallback: try result file
          const fromFile = readResultFile();
          if (fromFile !== undefined) {
            succeed(fromFile);
            return;
          }

          fail(
            `Trainer stdout was not valid JSON and result file also invalid. ` +
              `result file: ${resultFilePath}`
          );
          return;
        }

        // Non-zero exit — try result file as last resort
        if (!fs.existsSync(resultFilePath)) {
          fail(`Trainer exited with code ${code} and no result file found at: ${resultFilePath}`);
          return;
        }
        const fromFile = readResultFile();
        if (fromFile !== undefined) {
          succeed(fromFile);
        } else {
          fail(`Trainer exited with code ${code} and result file was invalid: ${resultFilePath}`);
        }
      });

      proc.on('error', (err) => {
        fail(`Trainer spawn failed: ${err.message}`);
      });
    });
  } finally {
    // Clean up spec file after execution
    if (fs.existsSync(specPath)) {
      fs.unlinkSync(specPath);
    }
  }
}
426
+
427
+ // ---------------------------------------------------------------------------
428
+ // Result Processing
429
+ // ---------------------------------------------------------------------------
430
+
431
/**
 * Everything `processTrainerResult` needs to reconcile a trainer's output
 * with the training registry.
 */
export interface ProcessTrainerResultParams {
  /** Experiment specification the trainer was launched with. */
  spec: TrainingExperimentSpec;

  /** Registry ID of the training run created for this experiment. */
  trainRunId: string;

  /** Already-parsed result reported by the trainer. */
  result: TrainingExperimentResult;

  /** Workspace state directory holding the registry. */
  stateDir: string;
}
447
+
448
/**
 * Process a trainer result:
 * 1. `dry_run` results: start and complete the run, return `null` (no checkpoint).
 * 2. Otherwise start the run, then validate the result against the spec.
 * 3. Fail the run (and throw) on validation errors, a `failed` status, or a
 *    result that lacks `checkpointId` / `artifact`.
 * 4. Register the checkpoint, then mark the run completed.
 *
 * @param params - Processing parameters
 * @returns The registered checkpoint, or null for dry_run (no checkpoint produced)
 *
 * @throws Error if validation fails
 * @throws Error if the trainer reported failure; the message carries the
 *   trainer's `failureReason`, or 'Unknown failure' when none was given
 * @throws Error if the result has no checkpointId or artifact
 * @throws Error if checkpoint registration fails (the run is then left in
 *   'running' state on purpose so the failure shows up in registry audits)
 */
export function processTrainerResult(
  params: ProcessTrainerResultParams
): { checkpointId: string; checkpointRef: string } | null {
  const { spec, trainRunId, result, stateDir } = params;

  // --- Handle dry_run BEFORE validation (it has no checkpoint and should not be validated) ---
  if (result.status === 'dry_run') {
    // Dry-run: mark completed (no checkpoint expected) and return null.
    // This is a supported non-error outcome — upper layers distinguish it from
    // completed (which has a checkpoint) by checking the return value.
    startTrainingRun(stateDir, trainRunId);
    completeTrainingRun(stateDir, trainRunId);
    return null;
  }

  // --- Transition pending -> running first ---
  // Must happen before any validation or failure path so that
  // failTrainingRun has a valid transition (running → failed).
  startTrainingRun(stateDir, trainRunId);

  // --- Validate result against spec (fail-closed) ---
  const validation = validateTrainerResult(spec, result);
  if (!validation.valid) {
    const errorMessages = validation.errors
      .map((e) => `  - ${e.field}: ${e.reason} (expected: ${e.expected}, got: ${e.actual})`)
      .join('\n');

    // Fail the training run in registry (running → failed is valid)
    failTrainingRun(stateDir, trainRunId, `Validation failed:\n${errorMessages}`);

    throw new Error(
      `Trainer result validation failed (${validation.errors.length} errors):\n${errorMessages}\n` +
        `The trainer result does not match the experiment spec. ` +
        `This checkpoint will not be registered.`
    );
  }

  if (result.status === 'failed') {
    // Resolve the reason once so the registry entry and the thrown error agree
    // (previously the error read "Training failed: undefined" when no reason was given).
    const failureReason = result.failureReason ?? 'Unknown failure';
    failTrainingRun(stateDir, trainRunId, failureReason);
    throw new Error(`Training failed: ${failureReason}`);
  }

  // result.status === 'completed' (or any other non-failed/dry_run) — proceed to checkpoint
  if (!result.checkpointId || !result.artifact) {
    // Mark run failed since it didn't produce a checkpoint (run is in 'running' state)
    failTrainingRun(
      stateDir,
      trainRunId,
      'Trainer result is marked completed but missing checkpointId or artifact'
    );
    throw new Error(
      `Trainer result is marked 'completed' but missing checkpointId or artifact.`
    );
  }

  // --- Register checkpoint BEFORE marking run completed ---
  // Ordering matters: if registerCheckpoint throws, run stays in 'running' state
  // (not 'completed'), making the failure visible in registry audits.
  const checkpoint = registerCheckpoint(stateDir, {
    trainRunId,
    targetModelFamily: spec.targetModelFamily,
    artifactPath: result.artifact.artifactPath,
  });

  // Checkpoint registered successfully — now mark run completed
  completeTrainingRun(stateDir, trainRunId);

  return {
    checkpointId: checkpoint.checkpointId,
    // Prefer the trainer's own reference; fall back to the registry ID.
    checkpointRef: result.checkpointRef ?? checkpoint.checkpointId,
  };
}
531
+
532
+ // ---------------------------------------------------------------------------
533
+ // Training Program Orchestration
534
+ // ---------------------------------------------------------------------------
535
+
536
/**
 * Thin facade that binds the training workflow functions to one workspace
 * state directory.
 *
 * Usage:
 * ```typescript
 * const program = new TrainingProgram(stateDir);
 *
 * // Create experiment
 * const { spec, trainRunId } = program.createExperiment({
 *   backend: 'peft-trl-orpo',
 *   targetWorkerProfile: 'local-reader',
 *   targetModelFamily: 'qwen2.5-7b-reader',
 *   datasetExportId: 'export-123',
 *   datasetExportPath: '.state/exports/orpo/export-123.jsonl',
 *   datasetFingerprint: 'abc123',
 *   benchmarkExportId: 'benchmark-456',
 *   outputDir: '.state/nocturnal/checkpoints',
 * });
 *
 * // Execute trainer (external); the result is already a parsed object
 * const trainerResult = await executeTrainer(spec);
 *
 * // Process result (null means dry-run: no checkpoint was produced)
 * const processed = program.processResult({ spec, trainRunId, result: trainerResult });
 *
 * // Attach eval (after benchmark runs)
 * if (processed) {
 *   program.attachEvalAndMarkDeployable(processed.checkpointId, evalSummary);
 * }
 * ```
 */
export class TrainingProgram {
  constructor(private readonly stateDir: string) {}

  /**
   * Create a training experiment in this program's state directory.
   */
  createExperiment(params: CreateExperimentParams): CreateExperimentResult {
    return createExperiment(this.stateDir, params);
  }

  /**
   * Reconcile a trainer result with the registry and register its checkpoint.
   * Yields null for a dry_run result, which produces no checkpoint.
   */
  processResult(params: {
    spec: TrainingExperimentSpec;
    trainRunId: string;
    result: TrainingExperimentResult;
  }): { checkpointId: string; checkpointRef: string } | null {
    const { spec, trainRunId, result } = params;
    return processTrainerResult({ spec, trainRunId, result, stateDir: this.stateDir });
  }

  /**
   * Attach an eval summary to a checkpoint, then flag the checkpoint as
   * deployable when the verdict is 'pass' or 'compare_only'. A 'fail' verdict
   * only attaches the summary. Nothing is returned.
   *
   * @param checkpointId - The checkpoint to attach eval to
   * @param evalSummary - The eval summary (from benchmark run)
   */
  attachEvalAndMarkDeployable(
    checkpointId: string,
    evalSummary: {
      evalId: string;
      checkpointId: string;
      benchmarkId: string;
      targetModelFamily: string;
      mode: 'prompt_assisted' | 'reduced_prompt';
      baselineScore: number;
      candidateScore: number;
      delta: number;
      verdict: 'pass' | 'fail' | 'compare_only';
    }
  ): void {
    // The summary is recorded regardless of the verdict.
    attachEvalSummary(this.stateDir, checkpointId, evalSummary);

    switch (evalSummary.verdict) {
      case 'pass':
      case 'compare_only':
        markCheckpointDeployable(this.stateDir, checkpointId, true);
        break;
      default:
        // Any other verdict leaves the deployable flag untouched.
        break;
    }
  }

  /**
   * Look up the lineage of a checkpoint for audit purposes.
   */
  getCheckpointLineage(checkpointId: string) {
    return getCheckpointLineage(this.stateDir, checkpointId);
  }
}