principles-disciple 1.8.1 → 1.8.3

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (508) hide show
  1. package/ADVANCED_CONFIG_ZH.md +97 -0
  2. package/AGENT_INSTALL.md +173 -0
  3. package/AGENT_INSTALL_EN.md +173 -0
  4. package/INSTALL.md +256 -0
  5. package/SKILL.md +63 -0
  6. package/docs/COMMAND_REFERENCE.md +76 -0
  7. package/docs/COMMAND_REFERENCE_EN.md +79 -0
  8. package/esbuild.config.js +75 -0
  9. package/openclaw.plugin.json +4 -4
  10. package/package.json +11 -13
  11. package/scripts/build-web.mjs +46 -0
  12. package/scripts/install-dependencies.cjs +47 -0
  13. package/scripts/sync-plugin.mjs +802 -0
  14. package/scripts/verify-build.mjs +109 -0
  15. package/src/agents/nocturnal-dreamer.md +152 -0
  16. package/src/agents/nocturnal-philosopher.md +138 -0
  17. package/src/agents/nocturnal-reflector.md +126 -0
  18. package/src/agents/nocturnal-scribe.md +164 -0
  19. package/src/commands/capabilities.ts +85 -0
  20. package/{dist/commands/context.js → src/commands/context.ts} +78 -38
  21. package/src/commands/evolution-status.ts +146 -0
  22. package/src/commands/export.ts +111 -0
  23. package/src/commands/focus.ts +533 -0
  24. package/src/commands/nocturnal-review.ts +311 -0
  25. package/src/commands/nocturnal-rollout.ts +763 -0
  26. package/src/commands/nocturnal-train.ts +1002 -0
  27. package/{dist/commands/pain.js → src/commands/pain.ts} +68 -49
  28. package/src/commands/principle-rollback.ts +27 -0
  29. package/{dist/commands/rollback.js → src/commands/rollback.ts} +44 -12
  30. package/src/commands/samples.ts +60 -0
  31. package/src/commands/strategy.ts +38 -0
  32. package/{dist/commands/thinking-os.js → src/commands/thinking-os.ts} +59 -36
  33. package/src/commands/workflow-debug.ts +128 -0
  34. package/{dist/config/defaults/runtime.js → src/config/defaults/runtime.ts} +12 -5
  35. package/src/config/errors.ts +163 -0
  36. package/{dist/config/index.d.ts → src/config/index.ts} +2 -1
  37. package/src/constants/diagnostician.ts +66 -0
  38. package/src/constants/tools.ts +62 -0
  39. package/src/core/adaptive-thresholds.ts +476 -0
  40. package/{dist/core/config-service.js → src/core/config-service.ts} +7 -4
  41. package/{dist/core/config.js → src/core/config.ts} +158 -46
  42. package/src/core/control-ui-db.ts +435 -0
  43. package/{dist/core/detection-funnel.js → src/core/detection-funnel.ts} +36 -21
  44. package/{dist/core/detection-service.js → src/core/detection-service.ts} +7 -4
  45. package/{dist/core/dictionary-service.js → src/core/dictionary-service.ts} +7 -4
  46. package/{dist/core/dictionary.js → src/core/dictionary.ts} +57 -34
  47. package/src/core/empathy-keyword-matcher.ts +327 -0
  48. package/src/core/empathy-types.ts +218 -0
  49. package/src/core/event-log.ts +544 -0
  50. package/src/core/evolution-engine.ts +612 -0
  51. package/src/core/evolution-logger.ts +353 -0
  52. package/src/core/evolution-migration.ts +77 -0
  53. package/src/core/evolution-reducer.ts +731 -0
  54. package/src/core/evolution-types.ts +456 -0
  55. package/src/core/external-training-contract.ts +527 -0
  56. package/src/core/focus-history.ts +1458 -0
  57. package/src/core/hygiene/tracker.ts +117 -0
  58. package/{dist/core/init.js → src/core/init.ts} +39 -26
  59. package/src/core/local-worker-routing.ts +617 -0
  60. package/{dist/core/migration.js → src/core/migration.ts} +18 -11
  61. package/src/core/model-deployment-registry.ts +722 -0
  62. package/src/core/model-training-registry.ts +813 -0
  63. package/src/core/nocturnal-arbiter.ts +706 -0
  64. package/src/core/nocturnal-candidate-scoring.ts +392 -0
  65. package/src/core/nocturnal-compliance.ts +1075 -0
  66. package/src/core/nocturnal-dataset.ts +668 -0
  67. package/src/core/nocturnal-executability.ts +428 -0
  68. package/src/core/nocturnal-export.ts +390 -0
  69. package/{dist/core/nocturnal-paths.js → src/core/nocturnal-paths.ts} +49 -23
  70. package/src/core/nocturnal-trajectory-extractor.ts +484 -0
  71. package/src/core/nocturnal-trinity.ts +1384 -0
  72. package/src/core/pain.ts +122 -0
  73. package/{dist/core/path-resolver.js → src/core/path-resolver.ts} +157 -36
  74. package/{dist/core/paths.js → src/core/paths.ts} +13 -4
  75. package/src/core/principle-training-state.ts +450 -0
  76. package/src/core/profile.ts +226 -0
  77. package/src/core/promotion-gate.ts +822 -0
  78. package/{dist/core/risk-calculator.js → src/core/risk-calculator.ts} +42 -16
  79. package/{dist/core/session-tracker.js → src/core/session-tracker.ts} +175 -62
  80. package/src/core/shadow-observation-registry.ts +534 -0
  81. package/{dist/core/system-logger.js → src/core/system-logger.ts} +9 -5
  82. package/src/core/thinking-models.ts +217 -0
  83. package/src/core/training-program.ts +630 -0
  84. package/src/core/trajectory-types.ts +243 -0
  85. package/src/core/trajectory.ts +1673 -0
  86. package/{dist/core/workspace-context.js → src/core/workspace-context.ts} +57 -32
  87. package/src/hooks/bash-risk.ts +171 -0
  88. package/src/hooks/edit-verification.ts +295 -0
  89. package/src/hooks/gate-block-helper.ts +160 -0
  90. package/src/hooks/gate.ts +210 -0
  91. package/src/hooks/gfi-gate.ts +177 -0
  92. package/src/hooks/lifecycle.ts +326 -0
  93. package/{dist/hooks/llm.js → src/hooks/llm.ts} +160 -80
  94. package/src/hooks/message-sanitize.ts +45 -0
  95. package/src/hooks/pain.ts +384 -0
  96. package/src/hooks/progressive-trust-gate.ts +174 -0
  97. package/src/hooks/prompt.ts +920 -0
  98. package/src/hooks/subagent.ts +207 -0
  99. package/src/hooks/thinking-checkpoint.ts +73 -0
  100. package/src/hooks/trajectory-collector.ts +290 -0
  101. package/src/http/principles-console-route.ts +716 -0
  102. package/src/i18n/commands.ts +117 -0
  103. package/src/index.ts +694 -0
  104. package/src/service/central-database.ts +831 -0
  105. package/src/service/control-ui-query-service.ts +888 -0
  106. package/src/service/evolution-query-service.ts +405 -0
  107. package/src/service/evolution-worker.ts +1646 -0
  108. package/src/service/health-query-service.ts +836 -0
  109. package/{dist/service/nocturnal-runtime.js → src/service/nocturnal-runtime.ts} +235 -79
  110. package/src/service/nocturnal-service.ts +1015 -0
  111. package/src/service/nocturnal-target-selector.ts +532 -0
  112. package/src/service/phase3-input-filter.ts +237 -0
  113. package/src/service/runtime-summary-service.ts +757 -0
  114. package/src/service/subagent-workflow/deep-reflect-workflow-manager.ts +513 -0
  115. package/{dist/service/subagent-workflow/empathy-observer-workflow-manager.js → src/service/subagent-workflow/empathy-observer-workflow-manager.ts} +240 -117
  116. package/src/service/subagent-workflow/index.ts +51 -0
  117. package/src/service/subagent-workflow/nocturnal-workflow-manager.ts +856 -0
  118. package/src/service/subagent-workflow/runtime-direct-driver.ts +166 -0
  119. package/{dist/service/subagent-workflow/types.d.ts → src/service/subagent-workflow/types.ts} +137 -18
  120. package/src/service/subagent-workflow/workflow-store.ts +328 -0
  121. package/src/service/trajectory-service.ts +15 -0
  122. package/{dist/tools/critique-prompt.js → src/tools/critique-prompt.ts} +25 -8
  123. package/src/tools/deep-reflect.ts +349 -0
  124. package/{dist/tools/model-index.js → src/tools/model-index.ts} +33 -17
  125. package/src/types/event-types.ts +453 -0
  126. package/src/types/hygiene-types.ts +31 -0
  127. package/src/types/principle-tree-schema.ts +244 -0
  128. package/src/types/runtime-summary.ts +49 -0
  129. package/src/types.ts +74 -0
  130. package/src/utils/file-lock.ts +391 -0
  131. package/{dist/utils/glob-match.js → src/utils/glob-match.ts} +21 -20
  132. package/{dist/utils/hashing.js → src/utils/hashing.ts} +6 -4
  133. package/src/utils/io.ts +110 -0
  134. package/{dist/utils/nlp.js → src/utils/nlp.ts} +19 -12
  135. package/{dist/utils/plugin-logger.js → src/utils/plugin-logger.ts} +33 -8
  136. package/src/utils/subagent-probe.ts +94 -0
  137. package/templates/langs/en/skills/ai-sprint-orchestration/EXAMPLES.md +63 -0
  138. package/templates/langs/en/skills/ai-sprint-orchestration/REFERENCE.md +136 -0
  139. package/templates/langs/en/skills/ai-sprint-orchestration/SKILL.md +67 -0
  140. package/templates/langs/en/skills/ai-sprint-orchestration/references/agent-registry.json +214 -0
  141. package/templates/langs/en/skills/ai-sprint-orchestration/references/specs/bugfix-complex-template.json +107 -0
  142. package/templates/langs/en/skills/ai-sprint-orchestration/references/specs/feature-complex-template.json +107 -0
  143. package/templates/langs/en/skills/ai-sprint-orchestration/references/specs/workflow-validation-minimal-verify.json +105 -0
  144. package/templates/langs/en/skills/ai-sprint-orchestration/references/specs/workflow-validation-minimal.json +108 -0
  145. package/templates/langs/en/skills/ai-sprint-orchestration/references/workflow-v1-acceptance-checklist.md +58 -0
  146. package/templates/langs/en/skills/ai-sprint-orchestration/references/workflow-v1.4-work-unit-handoff.md +190 -0
  147. package/templates/langs/en/skills/ai-sprint-orchestration/runtime/.gitignore +2 -0
  148. package/templates/langs/en/skills/ai-sprint-orchestration/scripts/lib/archive.mjs +310 -0
  149. package/templates/langs/en/skills/ai-sprint-orchestration/scripts/lib/contract-enforcement.mjs +683 -0
  150. package/templates/langs/en/skills/ai-sprint-orchestration/scripts/lib/decision.mjs +604 -0
  151. package/templates/langs/en/skills/ai-sprint-orchestration/scripts/lib/state-store.mjs +32 -0
  152. package/templates/langs/en/skills/ai-sprint-orchestration/scripts/lib/task-specs.mjs +707 -0
  153. package/templates/langs/en/skills/ai-sprint-orchestration/scripts/run.mjs +3419 -0
  154. package/templates/langs/zh/skills/ai-sprint-orchestration/EXAMPLES.md +63 -0
  155. package/templates/langs/zh/skills/ai-sprint-orchestration/REFERENCE.md +136 -0
  156. package/templates/langs/zh/skills/ai-sprint-orchestration/SKILL.md +67 -0
  157. package/templates/langs/zh/skills/ai-sprint-orchestration/references/agent-registry.json +214 -0
  158. package/templates/langs/zh/skills/ai-sprint-orchestration/references/specs/bugfix-complex-template.json +107 -0
  159. package/templates/langs/zh/skills/ai-sprint-orchestration/references/specs/feature-complex-template.json +107 -0
  160. package/templates/langs/zh/skills/ai-sprint-orchestration/references/specs/workflow-validation-minimal-verify.json +105 -0
  161. package/templates/langs/zh/skills/ai-sprint-orchestration/references/specs/workflow-validation-minimal.json +108 -0
  162. package/templates/langs/zh/skills/ai-sprint-orchestration/references/workflow-v1-acceptance-checklist.md +58 -0
  163. package/templates/langs/zh/skills/ai-sprint-orchestration/references/workflow-v1.4-work-unit-handoff.md +190 -0
  164. package/templates/langs/zh/skills/ai-sprint-orchestration/runtime/.gitignore +2 -0
  165. package/templates/langs/zh/skills/ai-sprint-orchestration/scripts/lib/archive.mjs +310 -0
  166. package/templates/langs/zh/skills/ai-sprint-orchestration/scripts/lib/contract-enforcement.mjs +683 -0
  167. package/templates/langs/zh/skills/ai-sprint-orchestration/scripts/lib/decision.mjs +604 -0
  168. package/templates/langs/zh/skills/ai-sprint-orchestration/scripts/lib/state-store.mjs +32 -0
  169. package/templates/langs/zh/skills/ai-sprint-orchestration/scripts/lib/task-specs.mjs +707 -0
  170. package/templates/langs/zh/skills/ai-sprint-orchestration/scripts/run.mjs +3419 -0
  171. package/templates/langs/zh/skills/ai-sprint-orchestration/test/archive.test.mjs +230 -0
  172. package/templates/langs/zh/skills/ai-sprint-orchestration/test/contract-enforcement.test.mjs +672 -0
  173. package/templates/langs/zh/skills/ai-sprint-orchestration/test/decision.test.mjs +1321 -0
  174. package/templates/langs/zh/skills/ai-sprint-orchestration/test/run.test.mjs +1419 -0
  175. package/templates/langs/zh/skills/pd-diagnostician/SKILL.md +70 -1
  176. package/templates/pain_settings.json +2 -1
  177. package/tests/README.md +120 -0
  178. package/tests/build-artifacts.test.ts +111 -0
  179. package/tests/commands/evolution-status.test.ts +222 -0
  180. package/tests/commands/evolver.test.ts +22 -0
  181. package/tests/commands/export.test.ts +78 -0
  182. package/tests/commands/nocturnal-review.test.ts +448 -0
  183. package/tests/commands/nocturnal-train.test.ts +97 -0
  184. package/tests/commands/pain.test.ts +108 -0
  185. package/tests/commands/samples.test.ts +65 -0
  186. package/tests/commands/strategy.test.ts +34 -0
  187. package/tests/commands/thinking-os.test.ts +88 -0
  188. package/tests/core/adaptive-thresholds.test.ts +261 -0
  189. package/tests/core/config-service.test.ts +89 -0
  190. package/tests/core/config.test.ts +90 -0
  191. package/tests/core/control-ui-db.test.ts +75 -0
  192. package/tests/core/core-template-guidance.test.ts +21 -0
  193. package/tests/core/detection-funnel.test.ts +63 -0
  194. package/tests/core/detection-service.test.ts +50 -0
  195. package/tests/core/dictionary-service.test.ts +116 -0
  196. package/tests/core/dictionary.test.ts +168 -0
  197. package/tests/core/empathy-keyword-matcher.test.ts +209 -0
  198. package/tests/core/event-log.test.ts +181 -0
  199. package/tests/core/evolution-e2e.test.ts +58 -0
  200. package/tests/core/evolution-engine-gate-integration.test.ts +543 -0
  201. package/tests/core/evolution-engine.test.ts +562 -0
  202. package/tests/core/evolution-logger.test.ts +148 -0
  203. package/tests/core/evolution-migration.test.ts +50 -0
  204. package/tests/core/evolution-paths.test.ts +21 -0
  205. package/tests/core/evolution-reducer.detector-metadata.test.ts +602 -0
  206. package/tests/core/evolution-reducer.test.ts +180 -0
  207. package/tests/core/evolution-types-loop.test.ts +48 -0
  208. package/tests/core/evolution-user-stories.e2e.test.ts +249 -0
  209. package/tests/core/external-training-contract.test.ts +463 -0
  210. package/tests/core/focus-history.test.ts +682 -0
  211. package/tests/core/init-flatten.test.ts +69 -0
  212. package/tests/core/init-refactor.test.ts +87 -0
  213. package/tests/core/init-v1.3.test.ts +46 -0
  214. package/tests/core/init.test.ts +190 -0
  215. package/tests/core/local-worker-routing.test.ts +757 -0
  216. package/tests/core/migration.test.ts +84 -0
  217. package/tests/core/model-deployment-registry.test.ts +845 -0
  218. package/tests/core/model-training-registry.test.ts +889 -0
  219. package/tests/core/nocturnal-arbiter.test.ts +494 -0
  220. package/tests/core/nocturnal-candidate-scoring.test.ts +400 -0
  221. package/tests/core/nocturnal-compliance.test.ts +646 -0
  222. package/tests/core/nocturnal-dataset.test.ts +892 -0
  223. package/tests/core/nocturnal-executability.test.ts +357 -0
  224. package/tests/core/nocturnal-export.test.ts +462 -0
  225. package/tests/core/nocturnal-reviewed-subset-comparison.test.ts +428 -0
  226. package/tests/core/nocturnal-trajectory-extractor.test.ts +634 -0
  227. package/tests/core/nocturnal-trinity.test.ts +953 -0
  228. package/tests/core/pain.test.ts +33 -0
  229. package/tests/core/path-resolver.test.ts +57 -0
  230. package/tests/core/paths-refactor.test.ts +42 -0
  231. package/tests/core/phase7-rollout-integration.test.ts +477 -0
  232. package/tests/core/principle-training-state.test.ts +712 -0
  233. package/tests/core/profile.test.ts +56 -0
  234. package/tests/core/promotion-gate.test.ts +556 -0
  235. package/tests/core/risk-calculator.test.ts +168 -0
  236. package/tests/core/session-tracker.test.ts +191 -0
  237. package/tests/core/training-program.test.ts +472 -0
  238. package/tests/core/trajectory.test.ts +265 -0
  239. package/tests/core/workspace-context-factory.test.ts +18 -0
  240. package/tests/core/workspace-context.test.ts +134 -0
  241. package/tests/fixtures/nocturnal-reviewed-subset.json +183 -0
  242. package/tests/fixtures/production-compatibility.test.ts +147 -0
  243. package/tests/fixtures/production-mock-generator.ts +282 -0
  244. package/tests/hooks/bash-risk-integration.test.ts +137 -0
  245. package/tests/hooks/bash-risk.test.ts +81 -0
  246. package/tests/hooks/edit-verification.test.ts +678 -0
  247. package/tests/hooks/gate-edit-verification-p1.test.ts +632 -0
  248. package/tests/hooks/gate-edit-verification.test.ts +435 -0
  249. package/tests/hooks/gate-pipeline-integration.test.ts +404 -0
  250. package/tests/hooks/gate.test.ts +271 -0
  251. package/tests/hooks/gfi-gate-unit.test.ts +422 -0
  252. package/tests/hooks/gfi-gate.test.ts +669 -0
  253. package/tests/hooks/lifecycle.test.ts +248 -0
  254. package/tests/hooks/llm.test.ts +308 -0
  255. package/tests/hooks/message-sanitize.test.ts +36 -0
  256. package/tests/hooks/pain.test.ts +141 -0
  257. package/tests/hooks/progressive-trust-gate.test.ts +277 -0
  258. package/tests/hooks/prompt.test.ts +1411 -0
  259. package/tests/hooks/subagent.test.ts +467 -0
  260. package/tests/hooks/thinking-gate.test.ts +313 -0
  261. package/tests/http/principles-console-route.test.ts +140 -0
  262. package/tests/hygiene-tracker.test.ts +77 -0
  263. package/tests/index.integration.test.ts +179 -0
  264. package/tests/index.shadow-routing.integration.test.ts +140 -0
  265. package/tests/index.test.ts +9 -0
  266. package/tests/integration/empathy-workflow-integration.test.ts +627 -0
  267. package/tests/service/control-ui-query-service.test.ts +121 -0
  268. package/tests/service/empathy-observer-workflow-manager.test.ts +176 -0
  269. package/tests/service/evolution-worker.test.ts +585 -0
  270. package/tests/service/nocturnal-runtime.test.ts +470 -0
  271. package/tests/service/nocturnal-service.test.ts +577 -0
  272. package/tests/service/nocturnal-target-selector.test.ts +615 -0
  273. package/tests/service/nocturnal-workflow-manager.test.ts +439 -0
  274. package/tests/service/phase3-input-filter.test.ts +289 -0
  275. package/tests/service/runtime-summary-service.test.ts +919 -0
  276. package/tests/task-compliance.test.ts +166 -0
  277. package/tests/test-utils.ts +48 -0
  278. package/tests/tools/critique-prompt.test.ts +260 -0
  279. package/tests/tools/deep-reflect.test.ts +232 -0
  280. package/tests/tools/model-index.test.ts +246 -0
  281. package/tests/ui/app.test.tsx +114 -0
  282. package/tests/utils/file-lock.test.ts +407 -0
  283. package/tests/utils/hashing.test.ts +32 -0
  284. package/tests/utils/io.test.ts +39 -0
  285. package/tests/utils/nlp.test.ts +53 -0
  286. package/tests/utils/plugin-logger.test.ts +156 -0
  287. package/tsconfig.json +16 -0
  288. package/tsconfig.tsbuildinfo +1 -0
  289. package/ui/src/App.tsx +45 -0
  290. package/ui/src/api.ts +216 -0
  291. package/ui/src/charts.tsx +586 -0
  292. package/ui/src/components/ErrorState.tsx +6 -0
  293. package/ui/src/components/Loading.tsx +13 -0
  294. package/ui/src/components/ProtectedRoute.tsx +12 -0
  295. package/ui/src/components/Shell.tsx +91 -0
  296. package/ui/src/components/WorkspaceConfig.tsx +146 -0
  297. package/ui/src/components/index.ts +5 -0
  298. package/ui/src/context/auth.tsx +80 -0
  299. package/ui/src/context/theme.tsx +66 -0
  300. package/ui/src/hooks/useAutoRefresh.ts +39 -0
  301. package/ui/src/i18n/ui.ts +363 -0
  302. package/ui/src/main.tsx +16 -0
  303. package/ui/src/pages/EvolutionPage.tsx +352 -0
  304. package/ui/src/pages/FeedbackPage.tsx +140 -0
  305. package/ui/src/pages/GateMonitorPage.tsx +136 -0
  306. package/ui/src/pages/LoginPage.tsx +88 -0
  307. package/ui/src/pages/OverviewPage.tsx +238 -0
  308. package/ui/src/pages/SamplesPage.tsx +174 -0
  309. package/ui/src/pages/ThinkingModelsPage.tsx +127 -0
  310. package/ui/src/styles.css +1661 -0
  311. package/ui/src/types.ts +368 -0
  312. package/ui/src/utils/format.ts +15 -0
  313. package/vitest.config.ts +23 -0
  314. package/dist/commands/capabilities.d.ts +0 -3
  315. package/dist/commands/capabilities.js +0 -73
  316. package/dist/commands/context.d.ts +0 -5
  317. package/dist/commands/evolution-status.d.ts +0 -4
  318. package/dist/commands/evolution-status.js +0 -117
  319. package/dist/commands/evolver.d.ts +0 -9
  320. package/dist/commands/evolver.js +0 -26
  321. package/dist/commands/export.d.ts +0 -2
  322. package/dist/commands/export.js +0 -98
  323. package/dist/commands/focus.d.ts +0 -14
  324. package/dist/commands/focus.js +0 -457
  325. package/dist/commands/nocturnal-review.d.ts +0 -24
  326. package/dist/commands/nocturnal-review.js +0 -265
  327. package/dist/commands/nocturnal-rollout.d.ts +0 -27
  328. package/dist/commands/nocturnal-rollout.js +0 -671
  329. package/dist/commands/nocturnal-train.d.ts +0 -25
  330. package/dist/commands/nocturnal-train.js +0 -919
  331. package/dist/commands/pain.d.ts +0 -5
  332. package/dist/commands/principle-rollback.d.ts +0 -4
  333. package/dist/commands/principle-rollback.js +0 -22
  334. package/dist/commands/rollback.d.ts +0 -19
  335. package/dist/commands/samples.d.ts +0 -2
  336. package/dist/commands/samples.js +0 -55
  337. package/dist/commands/strategy.d.ts +0 -3
  338. package/dist/commands/strategy.js +0 -29
  339. package/dist/commands/thinking-os.d.ts +0 -2
  340. package/dist/config/defaults/runtime.d.ts +0 -40
  341. package/dist/config/errors.d.ts +0 -84
  342. package/dist/config/errors.js +0 -94
  343. package/dist/config/index.js +0 -7
  344. package/dist/constants/diagnostician.d.ts +0 -12
  345. package/dist/constants/diagnostician.js +0 -56
  346. package/dist/constants/tools.d.ts +0 -17
  347. package/dist/constants/tools.js +0 -54
  348. package/dist/core/adaptive-thresholds.d.ts +0 -186
  349. package/dist/core/adaptive-thresholds.js +0 -300
  350. package/dist/core/config-service.d.ts +0 -15
  351. package/dist/core/config.d.ts +0 -129
  352. package/dist/core/control-ui-db.d.ts +0 -95
  353. package/dist/core/control-ui-db.js +0 -292
  354. package/dist/core/detection-funnel.d.ts +0 -33
  355. package/dist/core/detection-service.d.ts +0 -15
  356. package/dist/core/dictionary-service.d.ts +0 -15
  357. package/dist/core/dictionary.d.ts +0 -38
  358. package/dist/core/event-log.d.ts +0 -82
  359. package/dist/core/event-log.js +0 -463
  360. package/dist/core/evolution-engine.d.ts +0 -118
  361. package/dist/core/evolution-engine.js +0 -464
  362. package/dist/core/evolution-logger.d.ts +0 -137
  363. package/dist/core/evolution-logger.js +0 -256
  364. package/dist/core/evolution-migration.d.ts +0 -5
  365. package/dist/core/evolution-migration.js +0 -65
  366. package/dist/core/evolution-reducer.d.ts +0 -98
  367. package/dist/core/evolution-reducer.js +0 -465
  368. package/dist/core/evolution-types.d.ts +0 -287
  369. package/dist/core/evolution-types.js +0 -78
  370. package/dist/core/external-training-contract.d.ts +0 -276
  371. package/dist/core/external-training-contract.js +0 -269
  372. package/dist/core/focus-history.d.ts +0 -210
  373. package/dist/core/focus-history.js +0 -1185
  374. package/dist/core/hygiene/tracker.d.ts +0 -22
  375. package/dist/core/hygiene/tracker.js +0 -106
  376. package/dist/core/init.d.ts +0 -12
  377. package/dist/core/local-worker-routing.d.ts +0 -175
  378. package/dist/core/local-worker-routing.js +0 -525
  379. package/dist/core/migration.d.ts +0 -6
  380. package/dist/core/model-deployment-registry.d.ts +0 -218
  381. package/dist/core/model-deployment-registry.js +0 -503
  382. package/dist/core/model-training-registry.d.ts +0 -295
  383. package/dist/core/model-training-registry.js +0 -475
  384. package/dist/core/nocturnal-arbiter.d.ts +0 -159
  385. package/dist/core/nocturnal-arbiter.js +0 -534
  386. package/dist/core/nocturnal-candidate-scoring.d.ts +0 -137
  387. package/dist/core/nocturnal-candidate-scoring.js +0 -266
  388. package/dist/core/nocturnal-compliance.d.ts +0 -175
  389. package/dist/core/nocturnal-compliance.js +0 -824
  390. package/dist/core/nocturnal-dataset.d.ts +0 -224
  391. package/dist/core/nocturnal-dataset.js +0 -443
  392. package/dist/core/nocturnal-executability.d.ts +0 -85
  393. package/dist/core/nocturnal-executability.js +0 -331
  394. package/dist/core/nocturnal-export.d.ts +0 -124
  395. package/dist/core/nocturnal-export.js +0 -275
  396. package/dist/core/nocturnal-paths.d.ts +0 -124
  397. package/dist/core/nocturnal-trajectory-extractor.d.ts +0 -242
  398. package/dist/core/nocturnal-trajectory-extractor.js +0 -307
  399. package/dist/core/nocturnal-trinity.d.ts +0 -311
  400. package/dist/core/nocturnal-trinity.js +0 -880
  401. package/dist/core/pain.d.ts +0 -4
  402. package/dist/core/pain.js +0 -70
  403. package/dist/core/path-resolver.d.ts +0 -46
  404. package/dist/core/paths.d.ts +0 -65
  405. package/dist/core/principle-training-state.d.ts +0 -121
  406. package/dist/core/principle-training-state.js +0 -321
  407. package/dist/core/profile.d.ts +0 -62
  408. package/dist/core/profile.js +0 -210
  409. package/dist/core/promotion-gate.d.ts +0 -238
  410. package/dist/core/promotion-gate.js +0 -529
  411. package/dist/core/risk-calculator.d.ts +0 -22
  412. package/dist/core/session-tracker.d.ts +0 -101
  413. package/dist/core/shadow-observation-registry.d.ts +0 -217
  414. package/dist/core/shadow-observation-registry.js +0 -308
  415. package/dist/core/system-logger.d.ts +0 -8
  416. package/dist/core/thinking-models.d.ts +0 -38
  417. package/dist/core/thinking-models.js +0 -170
  418. package/dist/core/training-program.d.ts +0 -233
  419. package/dist/core/training-program.js +0 -433
  420. package/dist/core/trajectory.d.ts +0 -411
  421. package/dist/core/trajectory.js +0 -1307
  422. package/dist/core/workspace-context.d.ts +0 -71
  423. package/dist/hooks/bash-risk.d.ts +0 -57
  424. package/dist/hooks/bash-risk.js +0 -137
  425. package/dist/hooks/edit-verification.d.ts +0 -62
  426. package/dist/hooks/edit-verification.js +0 -256
  427. package/dist/hooks/gate-block-helper.d.ts +0 -44
  428. package/dist/hooks/gate-block-helper.js +0 -119
  429. package/dist/hooks/gate.d.ts +0 -24
  430. package/dist/hooks/gate.js +0 -173
  431. package/dist/hooks/gfi-gate.d.ts +0 -40
  432. package/dist/hooks/gfi-gate.js +0 -113
  433. package/dist/hooks/lifecycle.d.ts +0 -5
  434. package/dist/hooks/lifecycle.js +0 -284
  435. package/dist/hooks/llm.d.ts +0 -13
  436. package/dist/hooks/message-sanitize.d.ts +0 -3
  437. package/dist/hooks/message-sanitize.js +0 -37
  438. package/dist/hooks/pain.d.ts +0 -5
  439. package/dist/hooks/pain.js +0 -301
  440. package/dist/hooks/progressive-trust-gate.d.ts +0 -52
  441. package/dist/hooks/progressive-trust-gate.js +0 -134
  442. package/dist/hooks/prompt.d.ts +0 -49
  443. package/dist/hooks/prompt.js +0 -905
  444. package/dist/hooks/subagent.d.ts +0 -10
  445. package/dist/hooks/subagent.js +0 -387
  446. package/dist/hooks/thinking-checkpoint.d.ts +0 -37
  447. package/dist/hooks/thinking-checkpoint.js +0 -51
  448. package/dist/hooks/trajectory-collector.d.ts +0 -32
  449. package/dist/hooks/trajectory-collector.js +0 -256
  450. package/dist/http/principles-console-route.d.ts +0 -9
  451. package/dist/http/principles-console-route.js +0 -681
  452. package/dist/i18n/commands.d.ts +0 -26
  453. package/dist/i18n/commands.js +0 -116
  454. package/dist/index.d.ts +0 -7
  455. package/dist/index.js +0 -581
  456. package/dist/service/central-database.d.ts +0 -104
  457. package/dist/service/central-database.js +0 -649
  458. package/dist/service/control-ui-query-service.d.ts +0 -221
  459. package/dist/service/control-ui-query-service.js +0 -543
  460. package/dist/service/empathy-observer-manager.d.ts +0 -88
  461. package/dist/service/empathy-observer-manager.js +0 -414
  462. package/dist/service/evolution-query-service.d.ts +0 -155
  463. package/dist/service/evolution-query-service.js +0 -258
  464. package/dist/service/evolution-worker.d.ts +0 -101
  465. package/dist/service/evolution-worker.js +0 -975
  466. package/dist/service/health-query-service.d.ts +0 -170
  467. package/dist/service/health-query-service.js +0 -662
  468. package/dist/service/nocturnal-runtime.d.ts +0 -183
  469. package/dist/service/nocturnal-service.d.ts +0 -163
  470. package/dist/service/nocturnal-service.js +0 -787
  471. package/dist/service/nocturnal-target-selector.d.ts +0 -145
  472. package/dist/service/nocturnal-target-selector.js +0 -315
  473. package/dist/service/phase3-input-filter.d.ts +0 -73
  474. package/dist/service/phase3-input-filter.js +0 -172
  475. package/dist/service/runtime-summary-service.d.ts +0 -122
  476. package/dist/service/runtime-summary-service.js +0 -485
  477. package/dist/service/subagent-workflow/empathy-observer-workflow-manager.d.ts +0 -48
  478. package/dist/service/subagent-workflow/index.d.ts +0 -4
  479. package/dist/service/subagent-workflow/index.js +0 -3
  480. package/dist/service/subagent-workflow/runtime-direct-driver.d.ts +0 -77
  481. package/dist/service/subagent-workflow/runtime-direct-driver.js +0 -75
  482. package/dist/service/subagent-workflow/types.js +0 -11
  483. package/dist/service/subagent-workflow/workflow-store.d.ts +0 -26
  484. package/dist/service/subagent-workflow/workflow-store.js +0 -165
  485. package/dist/service/trajectory-service.d.ts +0 -2
  486. package/dist/service/trajectory-service.js +0 -15
  487. package/dist/tools/critique-prompt.d.ts +0 -14
  488. package/dist/tools/deep-reflect.d.ts +0 -39
  489. package/dist/tools/deep-reflect.js +0 -350
  490. package/dist/tools/model-index.d.ts +0 -9
  491. package/dist/types/event-types.d.ts +0 -306
  492. package/dist/types/event-types.js +0 -106
  493. package/dist/types/hygiene-types.d.ts +0 -20
  494. package/dist/types/hygiene-types.js +0 -12
  495. package/dist/types/runtime-summary.d.ts +0 -47
  496. package/dist/types/runtime-summary.js +0 -1
  497. package/dist/types.d.ts +0 -50
  498. package/dist/types.js +0 -22
  499. package/dist/utils/file-lock.d.ts +0 -71
  500. package/dist/utils/file-lock.js +0 -309
  501. package/dist/utils/glob-match.d.ts +0 -28
  502. package/dist/utils/hashing.d.ts +0 -9
  503. package/dist/utils/io.d.ts +0 -6
  504. package/dist/utils/io.js +0 -106
  505. package/dist/utils/nlp.d.ts +0 -9
  506. package/dist/utils/plugin-logger.d.ts +0 -39
  507. package/dist/utils/subagent-probe.d.ts +0 -34
  508. package/dist/utils/subagent-probe.js +0 -81
@@ -0,0 +1,630 @@
1
+ /**
2
+ * Training Program — Orchestrates External Training Execution and Lineage
3
+ * =========================================================================
4
+ *
5
+ * PURPOSE: Coordinate the training workflow from experiment spec creation
6
+ * through checkpoint registration and eval attachment.
7
+ *
8
+ * ARCHITECTURE:
9
+ * - TrainingProgram orchestrates the workflow but does NOT execute training itself
10
+ * - External trainer backends (Python scripts) do the actual training
11
+ * - Training run, checkpoint, and eval lineage is registered in model-training-registry
12
+ * - Promotion gate (promotion-gate.ts) controls deployment readiness
13
+ *
14
+ * WORKFLOW:
15
+ * 1. Create experiment spec (TrainingProgram.createExperiment)
16
+ * 2. Execute external trainer (executeTrainer — a module-level function, not a TrainingProgram method)
17
+ * 3. Validate trainer result against spec (validateTrainerResult)
18
+ * 4. Register training run (model-training-registry)
19
+ * 5. Register checkpoint (model-training-registry)
20
+ * 6. Attach eval summary after benchmark (model-training-registry)
21
+ * 7. Promotion gate controls deployment readiness
22
+ *
23
+ * DESIGN CONSTRAINTS:
24
+ * - ORPO-first: only 'orpo' training mode
25
+ * - No training inside the plugin runtime
26
+ * - No direct deployment binding from trainer output
27
+ * - Trainer backends run as a single awaited child process (plugin does not poll trainer progress)
28
+ * - All lineage must be traceable through model-training-registry
29
+ */
30
+
31
+ import * as fs from 'fs';
32
+ import * as path from 'path';
33
+ import * as crypto from 'crypto';
34
+ import { fileURLToPath } from 'url';
35
+ import {
36
+ type TrainingExperimentSpec,
37
+ type TrainingExperimentResult,
38
+ type TrainerBackendKind,
39
+ type TrainableWorkerProfile,
40
+ type HardwareTier,
41
+ type TrainingHyperparameters,
42
+ type TrainingBudget,
43
+ validateTrainerResult,
44
+ computeConfigFingerprint,
45
+ computeDatasetFingerprint,
46
+ computeCodeHash,
47
+ generateExperimentId,
48
+ validateHardwareTier,
49
+ getDefaultHardwareTier,
50
+ isValidModelFamilyForProfile,
51
+ LOCAL_EDITOR_ENABLED,
52
+ } from './external-training-contract.js';
53
+ import {
54
+ registerTrainingRun,
55
+ startTrainingRun,
56
+ completeTrainingRun,
57
+ failTrainingRun,
58
+ registerCheckpoint,
59
+ attachEvalSummary,
60
+ markCheckpointDeployable,
61
+ getCheckpointLineage,
62
+ } from './model-training-registry.js';
63
+
64
+ // ---------------------------------------------------------------------------
65
+ // Constants
66
+ // ---------------------------------------------------------------------------
67
+
/**
 * Location of the external trainer scripts, relative to REPO_ROOT.
 */
const TRAINER_SCRIPTS_DIR = 'scripts/nocturnal/trainer';

// Directory that contains this module, derived from the ESM module URL.
const MODULE_DIR = path.dirname(fileURLToPath(import.meta.url));

// Four directory levels above this module; base directory for TRAINER_SCRIPTS_DIR.
const REPO_ROOT = path.resolve(MODULE_DIR, '../../../..');
74
+
/**
 * Baseline ORPO hyperparameters, used for every field an experiment does not override.
 * Deliberately conservative so a run fits on a consumer GPU (RTX 4090 24GB).
 */
export const DEFAULT_ORPO_HYPERPARAMETERS: TrainingHyperparameters = {
  learningRate: 0.0003,
  batchSize: 2,
  gradientAccumulation: 8,
  loraRank: 16,
  loraAlpha: 32,
  loraDropout: 0.05,
  warmupRatio: 0.1,
  maxSteps: 1_000,
  maxSeqLength: 2_048,
};
90
+
/**
 * Budget applied to a training run for every field the experiment does not override.
 */
export const DEFAULT_BUDGET: TrainingBudget = {
  maxWallClockMinutes: 4 * 60, // four hours
  maxTrainTokens: 2_000_000,
};
98
+
99
+ // ---------------------------------------------------------------------------
100
+ // Experiment Spec Creation
101
+ // ---------------------------------------------------------------------------
102
+
/**
 * Caller-supplied inputs for `createExperiment`.
 */
export interface CreateExperimentParams {
  /** Worker profile the trained adapter is intended for. */
  targetWorkerProfile: TrainableWorkerProfile;

  /** Model family to train; checked against the worker profile. */
  targetModelFamily: string;

  /** Hardware tier; when omitted, the backend's default tier is used. */
  hardwareTier?: HardwareTier;

  /** Trainer backend that will run the experiment. */
  backend: TrainerBackendKind;

  /** Identifier of the dataset export; recorded on the training run as its export ID. */
  datasetExportId: string;

  /** Path of the dataset export, copied into the spec. */
  datasetExportPath: string;

  /** Fingerprint of the dataset, copied into the spec and the training run. */
  datasetFingerprint: string;

  /** Identifier of the benchmark export, copied into the spec. */
  benchmarkExportId: string;

  /** Directory the trainer writes checkpoints (and its result file) to. */
  outputDir: string;

  /** Optional overrides merged over DEFAULT_ORPO_HYPERPARAMETERS. */
  hyperparameters?: Partial<TrainingHyperparameters>;

  /** Optional overrides merged over DEFAULT_BUDGET. */
  budget?: Partial<TrainingBudget>;
}
140
+
/**
 * What `createExperiment` hands back to the caller.
 */
export interface CreateExperimentResult {
  /** Fully populated experiment specification. */
  spec: TrainingExperimentSpec;

  /** ID of the training run that was registered for this experiment. */
  trainRunId: string;
}
151
+
/**
 * Return a copy of `overrides` without the keys whose value is `undefined`.
 *
 * `Partial<T>` permits `{ key: undefined }`; spreading such an object over a
 * defaults object would replace the default with `undefined`.
 */
function definedOverrides<T extends object>(
  overrides: Partial<T> | null | undefined
): Partial<T> {
  const result: Partial<T> = {};
  if (overrides == null) {
    return result;
  }
  for (const key of Object.keys(overrides) as (keyof T)[]) {
    const value = overrides[key];
    if (value !== undefined) {
      result[key] = value;
    }
  }
  return result;
}

/**
 * Create a new training experiment.
 *
 * Validates the request, builds the experiment spec (always in 'orpo' mode)
 * and registers a pending training run for it in the registry.
 *
 * Hyperparameter and budget overrides are merged over
 * DEFAULT_ORPO_HYPERPARAMETERS / DEFAULT_BUDGET; override keys that are
 * explicitly `undefined` are ignored so the default stays in effect.
 *
 * @param stateDir - Workspace state directory
 * @param params - Experiment parameters
 * @returns Created experiment spec and registered training run ID
 *
 * @throws Error if worker profile is not allowed (local-editor not yet enabled)
 * @throws Error if model family is not valid for the worker profile
 * @throws Error if hardware tier is not valid for the backend
 */
export function createExperiment(
  stateDir: string,
  params: CreateExperimentParams
): CreateExperimentResult {
  // --- Validate worker profile ---
  if (params.targetWorkerProfile === 'local-editor' && !LOCAL_EDITOR_ENABLED) {
    throw new Error(
      `Training for 'local-editor' is not yet enabled. ` +
      `Phase 7 first rollout is limited to 'local-reader'. ` +
      `To enable local-editor training, set LOCAL_EDITOR_ENABLED = true ` +
      `in external-training-contract.ts after appropriate review.`
    );
  }

  // --- Validate model family for profile ---
  if (!isValidModelFamilyForProfile(params.targetModelFamily, params.targetWorkerProfile)) {
    throw new Error(
      `Model family '${params.targetModelFamily}' is not valid for profile ` +
      `'${params.targetWorkerProfile}'. ` +
      `Ensure the model family name contains an appropriate keyword.`
    );
  }

  // --- Validate hardware tier (falls back to the backend's default tier) ---
  const tier = params.hardwareTier ?? getDefaultHardwareTier(params.backend);
  validateHardwareTier(params.backend, tier);

  // --- Merge hyperparameters and budget over the defaults ---
  const hyperparameters: TrainingHyperparameters = {
    ...DEFAULT_ORPO_HYPERPARAMETERS,
    ...definedOverrides<TrainingHyperparameters>(params.hyperparameters),
  };
  const budget: TrainingBudget = {
    ...DEFAULT_BUDGET,
    ...definedOverrides<TrainingBudget>(params.budget),
  };

  // --- Compute fingerprints ---
  const configFingerprint = computeConfigFingerprint(hyperparameters);
  const codeHash = computeCodeHash();

  // --- Create experiment spec ---
  const spec: TrainingExperimentSpec = {
    experimentId: generateExperimentId(),
    backend: params.backend,
    trainingMode: 'orpo',
    targetWorkerProfile: params.targetWorkerProfile,
    targetModelFamily: params.targetModelFamily,
    hardwareTier: tier,
    datasetExportId: params.datasetExportId,
    datasetExportPath: params.datasetExportPath,
    datasetFingerprint: params.datasetFingerprint,
    benchmarkExportId: params.benchmarkExportId,
    outputDir: params.outputDir,
    configFingerprint,
    codeHash,
    hyperparameters,
    budget,
    expectedArtifact: {
      checkpointName: `checkpoint-${params.targetModelFamily}-${Date.now()}`,
      adapterFormat: 'peft-adapter',
    },
  };

  // --- Register training run in registry ---
  const trainRun = registerTrainingRun(stateDir, {
    experimentId: spec.experimentId,
    targetModelFamily: spec.targetModelFamily,
    datasetFingerprint: spec.datasetFingerprint,
    exportId: spec.datasetExportId,
    // The sample count is not known at creation time, so 0 is recorded here.
    sampleCount: 0,
    configFingerprint: spec.configFingerprint,
  });

  return { spec, trainRunId: trainRun.trainRunId };
}
237
+
238
+ // ---------------------------------------------------------------------------
239
+ // Trainer Execution
240
+ // ---------------------------------------------------------------------------
241
+
/**
 * Object form of the inputs needed to run an external trainer.
 *
 * NOTE(review): `executeTrainer` in this module takes `spec` and `scriptsDir`
 * as positional arguments rather than this object — confirm where this type is used.
 */
export interface ExecuteTrainerParams {
  /** Experiment specification to hand to the trainer. */
  spec: TrainingExperimentSpec;

  /** Directory containing the trainer scripts; optional override. */
  scriptsDir?: string;
}
252
+
/** Outcome of trying to load the trainer's backup result file. */
type TrainerResultFileRead =
  | { state: 'missing' }
  | { state: 'invalid' }
  | { state: 'ok'; result: TrainingExperimentResult };

/**
 * Read and JSON-parse the trainer's result file.
 * Read or parse failures are reported as 'invalid' rather than thrown.
 */
function readTrainerResultFile(resultFilePath: string): TrainerResultFileRead {
  if (!fs.existsSync(resultFilePath)) {
    return { state: 'missing' };
  }
  try {
    const content = fs.readFileSync(resultFilePath, 'utf-8');
    return { state: 'ok', result: JSON.parse(content) as TrainingExperimentResult };
  } catch {
    return { state: 'invalid' };
  }
}

/**
 * Execute an external trainer backend.
 *
 * For the 'dry-run' backend no script is run and nothing is written to disk:
 * a synthetic result with status 'dry_run' is built from the spec and returned.
 *
 * For every other backend this function:
 * 1. Verifies the trainer script exists
 * 2. Writes the spec as `experiment-<experimentId>.json` into the scripts directory
 * 3. Spawns the Python trainer with `--spec` and `--output-dir`
 * 4. Waits for the process to exit (or for the timeout) and parses its result
 * 5. Removes the spec file again, whatever the outcome
 *
 * The trainer protocol:
 * - stdout: MUST contain only the machine-readable JSON result. At most 1MB is
 *   retained; output beyond that is dropped, which makes stdout unparsable and
 *   triggers the result-file fallback.
 * - stderr: forwarded to this process's stderr, never buffered in memory.
 * - result file: `result-<experimentId>.json` in `spec.outputDir`, used when
 *   stdout cannot be parsed or the trainer exits with a non-zero code.
 *
 * The parsed JSON is returned as-is; it is not validated here.
 *
 * The timeout is `spec.budget.maxWallClockMinutes` plus 30 seconds of grace.
 *
 * @param spec - The experiment specification
 * @param scriptsDir - Override for the scripts directory
 * @returns The trainer's result as parsed JSON object
 *
 * @throws Error if the trainer script is not found
 * @throws Error if the trainer cannot be spawned, times out, or exits non-zero
 *   without a readable result file
 * @throws Error if neither stdout nor the result file contains valid JSON
 */
export async function executeTrainer(
  spec: TrainingExperimentSpec,
  scriptsDir?: string
): Promise<TrainingExperimentResult> {
  // Dry-run only echoes the spec back, so return before touching the
  // filesystem (no spec file, no scripts directory creation).
  if (spec.backend === 'dry-run') {
    return {
      experimentId: spec.experimentId,
      backend: 'dry-run',
      status: 'dry_run' as const,
      targetWorkerProfile: spec.targetWorkerProfile,
      targetModelFamily: spec.targetModelFamily,
      datasetFingerprint: spec.datasetFingerprint,
      configFingerprint: spec.configFingerprint,
      codeHash: spec.codeHash,
      createdAt: new Date().toISOString(),
    };
  }

  const baseDir = scriptsDir ?? path.join(REPO_ROOT, TRAINER_SCRIPTS_DIR);

  // Map backend to script name (every backend currently shares one entry point)
  const scriptMap: Record<TrainerBackendKind, string> = {
    'peft-trl-orpo': 'main.py',
    'unsloth-orpo': 'main.py',
    'dry-run': 'main.py',
  };
  const scriptPath = path.join(baseDir, scriptMap[spec.backend]);

  if (!fs.existsSync(scriptPath)) {
    throw new Error(
      `Trainer script not found: ${scriptPath}. ` +
      `Ensure the external trainer backends are installed at ${baseDir}.`
    );
  }

  // Serialize the spec to a file the trainer reads via --spec
  const specPath = path.join(baseDir, `experiment-${spec.experimentId}.json`);
  fs.mkdirSync(path.dirname(specPath), { recursive: true });
  fs.writeFileSync(specPath, JSON.stringify(spec, null, 2), 'utf-8');

  // Result file path (written by trainer to output dir)
  const resultFilePath = path.join(spec.outputDir, `result-${spec.experimentId}.json`);

  try {
    const { spawn } = await import('child_process');
    const timeoutMs = (spec.budget.maxWallClockMinutes * 60 * 1000) + 30000;
    const pythonExecutable = process.platform === 'win32' ? 'python' : 'python3';
    const MAX_STDOUT_BUFFER = 1 * 1024 * 1024; // 1MB cap

    return await new Promise<TrainingExperimentResult>((resolve, reject) => {
      const proc = spawn(pythonExecutable, [scriptPath, '--spec', specPath, '--output-dir', spec.outputDir]);

      // Collect stdout with a size cap to prevent OOM from huge log output
      const stdoutChunks: Buffer[] = [];
      let stdoutSize = 0;
      let timedOut = false;

      proc.stdout.on('data', (chunk: Buffer) => {
        const remaining = MAX_STDOUT_BUFFER - stdoutSize;
        if (remaining > 0) {
          const kept = chunk.subarray(0, remaining);
          stdoutChunks.push(kept);
          stdoutSize += kept.length;
        }
      });

      // Pipe stderr directly — training logs must NOT accumulate in memory
      proc.stderr.pipe(process.stderr);

      const timer = setTimeout(() => {
        timedOut = true;
        proc.kill();
        reject(new Error(`Trainer timed out after ${timeoutMs}ms`));
      }, timeoutMs);

      proc.on('close', (code) => {
        clearTimeout(timer);
        if (timedOut) {
          // Already rejected by the timeout; skip the pointless result lookup.
          return;
        }

        if (code === 0) {
          const trimmed = Buffer.concat(stdoutChunks).toString('utf-8').trim();
          if (trimmed) {
            try {
              resolve(JSON.parse(trimmed) as TrainingExperimentResult);
              return;
            } catch {
              // stdout was not valid JSON — fall through to the result file
            }
          }
          const fromFile = readTrainerResultFile(resultFilePath);
          if (fromFile.state === 'ok') {
            resolve(fromFile.result);
            return;
          }
          reject(
            new Error(
              `Trainer stdout was not valid JSON and result file also invalid. ` +
              `result file: ${resultFilePath}`
            )
          );
          return;
        }

        // Non-zero exit — the result file is the only remaining source
        const fromFile = readTrainerResultFile(resultFilePath);
        switch (fromFile.state) {
          case 'ok':
            resolve(fromFile.result);
            break;
          case 'invalid':
            reject(new Error(`Trainer exited with code ${code} and result file was invalid: ${resultFilePath}`));
            break;
          case 'missing':
            reject(new Error(`Trainer exited with code ${code} and no result file found at: ${resultFilePath}`));
            break;
        }
      });

      proc.on('error', (err) => {
        clearTimeout(timer);
        reject(new Error(`Trainer spawn failed: ${err.message}`));
      });
    });
  } finally {
    // Clean up spec file after execution
    if (fs.existsSync(specPath)) {
      fs.unlinkSync(specPath);
    }
  }
}
426
+
427
+ // ---------------------------------------------------------------------------
428
+ // Result Processing
429
+ // ---------------------------------------------------------------------------
430
+
/**
 * Inputs for `processTrainerResult`.
 */
export interface ProcessTrainerResultParams {
  /** Experiment specification the trainer was run with. */
  spec: TrainingExperimentSpec;

  /** Registry ID of the training run belonging to that experiment. */
  trainRunId: string;

  /** Already-parsed result reported by the trainer. */
  result: TrainingExperimentResult;

  /** Workspace state directory passed through to the registry calls. */
  stateDir: string;
}
447
+
/**
 * Process a trainer result:
 * 1. For a dry_run result, mark the run started and completed, and return null
 * 2. Otherwise mark the run started, then validate the result against the spec
 * 3. Register the checkpoint in the training registry
 * 4. Mark the run completed and return the checkpoint for eval attachment
 *
 * Every failure path below marks the training run as failed before throwing,
 * with the same reason text in the registry and in the thrown error.
 * The exception is a throw from checkpoint registration itself, which
 * deliberately leaves the run in the 'running' state.
 *
 * @param params - Processing parameters
 * @returns The registered checkpoint, or null for dry_run (no checkpoint produced)
 *
 * @throws Error if validation fails
 * @throws Error if the trainer reported status 'failed'
 * @throws Error if the result lacks checkpointId or artifact
 * @throws Error if checkpoint registration fails
 */
export function processTrainerResult(
  params: ProcessTrainerResultParams
): { checkpointId: string; checkpointRef: string } | null {
  const { spec, trainRunId, result, stateDir } = params;

  // --- Handle dry_run BEFORE validation (it has no checkpoint and should not be validated) ---
  if (result.status === 'dry_run') {
    // Supported non-error outcome: callers tell it apart from a real
    // completion by the null return value.
    startTrainingRun(stateDir, trainRunId);
    completeTrainingRun(stateDir, trainRunId);
    return null;
  }

  // --- Transition pending -> running first ---
  // Must happen before any validation or failure path so that
  // failTrainingRun has a valid transition (running → failed).
  startTrainingRun(stateDir, trainRunId);

  // --- Validate result against spec (fail-closed) ---
  const validation = validateTrainerResult(spec, result);
  if (!validation.valid) {
    const errorMessages = validation.errors
      .map((e) => `  - ${e.field}: ${e.reason} (expected: ${e.expected}, got: ${e.actual})`)
      .join('\n');

    failTrainingRun(stateDir, trainRunId, `Validation failed:\n${errorMessages}`);

    throw new Error(
      `Trainer result validation failed (${validation.errors.length} errors):\n${errorMessages}\n` +
      `The trainer result does not match the experiment spec. ` +
      `This checkpoint will not be registered.`
    );
  }

  if (result.status === 'failed') {
    // Use one fallback for both the registry entry and the thrown error so a
    // missing reason never surfaces as the literal text "undefined".
    const failureReason = result.failureReason ?? 'Unknown failure';
    failTrainingRun(stateDir, trainRunId, failureReason);
    throw new Error(`Training failed: ${failureReason}`);
  }

  // Any remaining status is treated as 'completed' and must carry a checkpoint
  if (!result.checkpointId || !result.artifact) {
    failTrainingRun(stateDir, trainRunId, 'Trainer result is marked completed but missing checkpointId or artifact');
    throw new Error(
      `Trainer result is marked 'completed' but missing checkpointId or artifact.`
    );
  }

  // --- Register checkpoint BEFORE marking run completed ---
  // Ordering matters: if registerCheckpoint throws, run stays in 'running' state
  // (not 'completed'), making the failure visible in registry audits.
  const checkpoint = registerCheckpoint(stateDir, {
    trainRunId,
    targetModelFamily: spec.targetModelFamily,
    artifactPath: result.artifact.artifactPath,
  });

  // Checkpoint registered successfully — now mark run completed
  completeTrainingRun(stateDir, trainRunId);

  return {
    checkpointId: checkpoint.checkpointId,
    // Prefer the trainer-supplied reference; fall back to the registry ID
    checkpointRef: result.checkpointRef ?? checkpoint.checkpointId,
  };
}
531
+
532
+ // ---------------------------------------------------------------------------
533
+ // Training Program Orchestration
534
+ // ---------------------------------------------------------------------------
535
+
/**
 * The TrainingProgram class binds the module-level workflow functions to one
 * workspace state directory.
 *
 * Trainer execution itself is NOT a method of this class; use the
 * module-level `executeTrainer` function.
 *
 * Usage:
 * ```typescript
 * const program = new TrainingProgram(stateDir);
 *
 * // Create experiment
 * const { spec, trainRunId } = program.createExperiment({
 *   backend: 'peft-trl-orpo',
 *   targetWorkerProfile: 'local-reader',
 *   targetModelFamily: 'qwen2.5-7b-reader',
 *   datasetExportId: 'export-123',
 *   datasetExportPath: '.state/exports/orpo/export-123.jsonl',
 *   datasetFingerprint: 'abc123',
 *   benchmarkExportId: 'benchmark-456',
 *   outputDir: '.state/nocturnal/checkpoints',
 * });
 *
 * // Execute trainer (external); the result is already a parsed object
 * const result = await executeTrainer(spec);
 *
 * // Process result (null means dry-run: no checkpoint was produced)
 * const checkpoint = program.processResult({ spec, trainRunId, result });
 *
 * // Attach eval (after benchmark runs)
 * if (checkpoint !== null) {
 *   program.attachEvalAndMarkDeployable(checkpoint.checkpointId, evalSummary);
 * }
 * ```
 */
export class TrainingProgram {
  constructor(private readonly stateDir: string) {}

  /**
   * Create a new training experiment.
   * Delegates to the module-level `createExperiment` with this program's state directory.
   */
  createExperiment(params: CreateExperimentParams): CreateExperimentResult {
    return createExperiment(this.stateDir, params);
  }

  /**
   * Process a trainer result and register the checkpoint.
   * Returns null for dry_run (no checkpoint produced).
   */
  processResult(params: {
    spec: TrainingExperimentSpec;
    trainRunId: string;
    result: TrainingExperimentResult;
  }): { checkpointId: string; checkpointRef: string } | null {
    return processTrainerResult({
      ...params,
      stateDir: this.stateDir,
    });
  }

  /**
   * Attach an eval summary to a checkpoint, then mark the checkpoint
   * deployable when the verdict is 'pass' or 'compare_only'. A 'fail'
   * verdict attaches the summary and leaves the deployable flag untouched.
   *
   * NOTE(review): 'compare_only' is treated like 'pass' here — confirm that a
   * comparison-only eval is meant to make a checkpoint deployable.
   *
   * @param checkpointId - The checkpoint to attach eval to
   * @param evalSummary - The eval summary (from benchmark run)
   */
  attachEvalAndMarkDeployable(
    checkpointId: string,
    evalSummary: {
      evalId: string;
      checkpointId: string;
      benchmarkId: string;
      targetModelFamily: string;
      mode: 'prompt_assisted' | 'reduced_prompt';
      baselineScore: number;
      candidateScore: number;
      delta: number;
      verdict: 'pass' | 'fail' | 'compare_only';
    }
  ): void {
    // Attach eval summary
    attachEvalSummary(this.stateDir, checkpointId, evalSummary);

    // Mark deployable if verdict is pass or compare_only
    if (evalSummary.verdict === 'pass' || evalSummary.verdict === 'compare_only') {
      markCheckpointDeployable(this.stateDir, checkpointId, true);
    }
  }

  /**
   * Get checkpoint lineage for audit.
   * Delegates to the registry's `getCheckpointLineage` with this program's state directory.
   */
  getCheckpointLineage(checkpointId: string) {
    return getCheckpointLineage(this.stateDir, checkpointId);
  }
}