principles-disciple 1.72.0 → 1.74.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (319)
  1. package/INSTALL.md +1 -3
  2. package/openclaw.plugin.json +10 -5
  3. package/package.json +17 -19
  4. package/scripts/acceptance-test.mjs +16 -73
  5. package/scripts/sync-plugin.mjs +382 -77
  6. package/src/commands/archive-impl.ts +2 -1
  7. package/src/commands/capabilities.ts +2 -2
  8. package/src/commands/context.ts +2 -2
  9. package/src/commands/disable-impl.ts +2 -1
  10. package/src/commands/evolution-status.ts +16 -16
  11. package/src/commands/export.ts +12 -67
  12. package/src/commands/pain.ts +91 -1
  13. package/src/commands/principle-rollback.ts +2 -1
  14. package/src/commands/promote-impl.ts +7 -43
  15. package/src/commands/rollback-impl.ts +2 -1
  16. package/src/commands/rollback.ts +2 -1
  17. package/src/commands/samples.ts +2 -1
  18. package/src/commands/thinking-os.ts +2 -1
  19. package/src/config/errors.ts +18 -2
  20. package/src/constants/diagnostician.ts +2 -2
  21. package/src/constants/tools.ts +2 -1
  22. package/src/core/__tests__/focus-history.test.ts +210 -0
  23. package/src/core/config.ts +1 -1
  24. package/src/core/correction-cue-learner.ts +2 -136
  25. package/src/core/correction-types.ts +16 -88
  26. package/src/core/dictionary.ts +19 -20
  27. package/src/core/empathy-keyword-matcher.ts +17 -289
  28. package/src/core/empathy-types.ts +18 -229
  29. package/src/core/event-log.ts +29 -132
  30. package/src/core/evolution-reducer.ts +21 -2
  31. package/src/core/evolution-types.ts +76 -464
  32. package/src/core/file-store.ts +80 -0
  33. package/src/core/focus-history.ts +228 -955
  34. package/src/core/local-worker-routing.ts +34 -314
  35. package/src/core/merge-gate-audit.ts +0 -195
  36. package/src/core/migration.ts +0 -1
  37. package/src/core/pain-diagnostic-gate.ts +154 -0
  38. package/src/core/pain-signal.ts +21 -138
  39. package/src/core/pain.ts +15 -88
  40. package/src/core/path-resolver.ts +0 -1
  41. package/src/core/paths.ts +0 -1
  42. package/src/core/pd-task-reconciler.ts +26 -115
  43. package/src/core/pd-task-service.ts +9 -9
  44. package/src/core/pd-task-types.ts +23 -127
  45. package/src/core/principle-compiler/__tests__/compiler-replay-gate.test.ts +174 -0
  46. package/src/core/principle-compiler/code-validator.ts +15 -42
  47. package/src/core/principle-compiler/compiler.ts +100 -15
  48. package/src/core/principle-compiler/index.ts +5 -2
  49. package/src/core/principle-compiler/template-generator.ts +4 -104
  50. package/src/core/principle-injection.ts +10 -202
  51. package/src/core/principle-internalization/filesystem-lifecycle-datasource.ts +42 -0
  52. package/src/core/principle-internalization/lifecycle-read-model.ts +39 -242
  53. package/src/core/principle-internalization/principle-lifecycle-service.ts +12 -10
  54. package/src/core/principle-tree-ledger-adapter.ts +145 -0
  55. package/src/core/principle-tree-ledger.ts +8 -6
  56. package/src/core/reflection/reflection-context.ts +14 -109
  57. package/src/core/replay-engine.ts +8 -500
  58. package/src/core/rule-host-helpers.ts +5 -35
  59. package/src/core/rule-host-types.ts +10 -82
  60. package/src/core/rule-host.ts +6 -63
  61. package/src/core/runtime-v2-prompt-activation-reader.ts +231 -0
  62. package/src/core/session-tracker.ts +87 -101
  63. package/src/core/shadow-observation-registry.ts +19 -48
  64. package/src/core/trajectory.ts +3 -1
  65. package/src/core/workflow-funnel-loader.ts +62 -68
  66. package/src/core/workspace-context.ts +46 -0
  67. package/src/core/workspace-dir-service.ts +1 -1
  68. package/src/core/workspace-dir-validation.ts +18 -9
  69. package/src/hooks/AGENTS.md +1 -1
  70. package/src/hooks/gate-block-helper.ts +71 -64
  71. package/src/hooks/gate.ts +183 -31
  72. package/src/hooks/lifecycle.ts +30 -32
  73. package/src/hooks/llm.ts +60 -32
  74. package/src/hooks/pain.ts +297 -103
  75. package/src/hooks/prompt.ts +400 -440
  76. package/src/hooks/subagent.ts +2 -29
  77. package/src/i18n/commands.ts +2 -10
  78. package/src/index.ts +95 -85
  79. package/src/openclaw-sdk.ts +311 -0
  80. package/src/service/central-database.ts +8 -4
  81. package/src/service/evolution-queue-migration.ts +2 -1
  82. package/src/service/evolution-worker.ts +163 -1786
  83. package/src/service/internalization-trigger-adapter.ts +302 -0
  84. package/src/service/keyword-optimization-service.ts +4 -4
  85. package/src/service/monitoring-query-service.ts +1 -215
  86. package/src/service/queue-io.ts +60 -331
  87. package/src/service/runtime-summary-service.ts +59 -16
  88. package/src/service/subagent-workflow/index.ts +0 -41
  89. package/src/service/subagent-workflow/types.ts +9 -120
  90. package/src/service/subagent-workflow/workflow-store.ts +2 -119
  91. package/src/service/workflow-watchdog.ts +0 -43
  92. package/src/types/event-payload.ts +16 -74
  93. package/src/types/event-types.ts +38 -547
  94. package/src/types/hygiene-types.ts +7 -30
  95. package/src/types/principle-tree-schema.ts +20 -222
  96. package/src/types/queue.ts +15 -70
  97. package/src/types/runtime-summary.ts +5 -49
  98. package/src/utils/io.ts +8 -20
  99. package/src/utils/retry.ts +1 -1
  100. package/src/utils/shadow-fingerprint.ts +2 -2
  101. package/src/utils/workspace-resolver.ts +50 -0
  102. package/templates/langs/en/core/AGENTS.md +7 -7
  103. package/templates/langs/en/core/BOOT.md +1 -1
  104. package/templates/langs/en/core/HEARTBEAT.md +2 -2
  105. package/templates/langs/en/principles/THINKING_OS.md +3 -2
  106. package/templates/langs/en/skills/ai-sprint-orchestration/references/agent-registry.json +1 -72
  107. package/templates/langs/en/skills/ai-sprint-orchestration/references/specs/bugfix-complex-template.json +6 -6
  108. package/templates/langs/en/skills/ai-sprint-orchestration/references/specs/feature-complex-template.json +6 -6
  109. package/templates/langs/en/skills/ai-sprint-orchestration/references/specs/workflow-validation-minimal-verify.json +2 -12
  110. package/templates/langs/en/skills/ai-sprint-orchestration/references/specs/workflow-validation-minimal.json +2 -12
  111. package/templates/langs/en/skills/ai-sprint-orchestration/scripts/run.mjs +51 -15
  112. package/templates/langs/en/skills/evolve-task/SKILL.md +3 -3
  113. package/templates/langs/en/skills/pd-cli-operator/SKILL.md +67 -0
  114. package/templates/langs/en/skills/pd-diagnostician/SKILL.md +1 -1
  115. package/templates/langs/en/skills/pd-mentor/SKILL.md +2 -3
  116. package/templates/langs/en/skills/pd-pain-signal/SKILL.md +17 -39
  117. package/templates/langs/en/skills/pd-runtime-v2/SKILL.md +61 -0
  118. package/templates/langs/zh/core/AGENTS.md +7 -7
  119. package/templates/langs/zh/core/BOOT.md +1 -1
  120. package/templates/langs/zh/core/HEARTBEAT.md +2 -2
  121. package/templates/langs/zh/principles/THINKING_OS.md +3 -2
  122. package/templates/langs/zh/skills/ai-sprint-orchestration/references/agent-registry.json +1 -72
  123. package/templates/langs/zh/skills/ai-sprint-orchestration/references/specs/bugfix-complex-template.json +6 -6
  124. package/templates/langs/zh/skills/ai-sprint-orchestration/references/specs/feature-complex-template.json +6 -6
  125. package/templates/langs/zh/skills/ai-sprint-orchestration/references/specs/nocturnal-trinity-quality-enhancement.json +8 -8
  126. package/templates/langs/zh/skills/ai-sprint-orchestration/references/specs/workflow-validation-minimal-verify.json +2 -12
  127. package/templates/langs/zh/skills/ai-sprint-orchestration/references/specs/workflow-validation-minimal.json +2 -12
  128. package/templates/langs/zh/skills/ai-sprint-orchestration/scripts/run.mjs +51 -15
  129. package/templates/langs/zh/skills/ai-sprint-orchestration/test/run.test.mjs +21 -5
  130. package/templates/langs/zh/skills/evolve-task/SKILL.md +4 -4
  131. package/templates/langs/zh/skills/pd-cli-operator/SKILL.md +67 -0
  132. package/templates/langs/zh/skills/pd-diagnostician/SKILL.md +1 -1
  133. package/templates/langs/zh/skills/pd-mentor/SKILL.md +2 -3
  134. package/templates/langs/zh/skills/pd-pain-signal/SKILL.md +17 -38
  135. package/templates/langs/zh/skills/pd-runtime-v2/SKILL.md +61 -0
  136. package/tests/build-artifacts.test.ts +1 -3
  137. package/tests/commands/evolution-status.test.ts +0 -118
  138. package/tests/core/bootstrap-rules.test.ts +1 -1
  139. package/tests/core/config.test.ts +1 -1
  140. package/tests/core/event-log.test.ts +35 -0
  141. package/tests/core/evolution-engine.test.ts +610 -0
  142. package/tests/core/file-store.test.ts +102 -0
  143. package/tests/core/focus-history.test.ts +203 -11
  144. package/tests/core/merge-gate-audit.test.ts +2 -169
  145. package/tests/core/migration.test.ts +7 -7
  146. package/tests/core/model-deployment-registry.test.ts +7 -1
  147. package/tests/core/model-training-registry.test.ts +19 -0
  148. package/tests/core/observability.test.ts +0 -1
  149. package/tests/core/pain-diagnostic-gate.test.ts +498 -0
  150. package/tests/core/pain.test.ts +0 -1
  151. package/tests/core/path-resolver.test.ts +1 -1
  152. package/tests/core/paths-refactor.test.ts +0 -22
  153. package/tests/core/principle-internalization/deprecated-readiness.test.ts +2 -2
  154. package/tests/core/principle-internalization/lifecycle-metrics.test.ts +2 -2
  155. package/tests/core/principle-internalization/{internalization-routing-policy.test.ts → lifecycle-routing-policy.test.ts} +6 -6
  156. package/tests/core/principle-internalization/lineage-source-retired.test.ts +56 -0
  157. package/tests/core/principle-internalization/principle-lifecycle-service.test.ts +1 -23
  158. package/tests/core/principle-tree-ledger-adapter.test.ts +253 -0
  159. package/tests/core/reflection-context.test.ts +0 -14
  160. package/tests/core/replay-engine.test.ts +127 -215
  161. package/tests/core/rule-host-helpers.test.ts +2 -2
  162. package/tests/core/rule-implementation-runtime.test.ts +0 -27
  163. package/tests/core/workflow-funnel-loader.test.ts +162 -0
  164. package/tests/core/workspace-context.test.ts +2 -2
  165. package/tests/core/workspace-dir-validation.test.ts +8 -1
  166. package/tests/core-anti-growth.test.ts +191 -0
  167. package/tests/hook-workspace-nextaction-contract.test.ts +42 -0
  168. package/tests/hooks/confirm-first-removal.test.ts +188 -0
  169. package/tests/hooks/gate-auto-correct-shadow.test.ts +310 -0
  170. package/tests/hooks/gate-auto-correct.test.ts +665 -0
  171. package/tests/hooks/gate-no-path-write-tool.test.ts +172 -0
  172. package/tests/hooks/gate-rule-host-pipeline.test.ts +2 -1
  173. package/tests/hooks/pain.test.ts +269 -12
  174. package/tests/hooks/prompt-characterization.test.ts +500 -0
  175. package/tests/hooks/prompt-size-guard.test.ts +32 -17
  176. package/tests/hooks/runtime-v2-prompt-activation.test.ts +869 -0
  177. package/tests/index.test.ts +94 -1
  178. package/tests/integration/auto-entry-gate.test.ts +248 -0
  179. package/tests/integration/internalization-trigger-guard.test.ts +69 -0
  180. package/tests/integration/m8-legacy-paths.test.ts +63 -0
  181. package/tests/integration/runtime-v2-pain-guard.test.ts +125 -0
  182. package/tests/plugin-config-resolution-cutover.test.ts +359 -0
  183. package/tests/runtime-v2-discovery-guard.test.ts +154 -0
  184. package/tests/service/central-database.test.ts +457 -0
  185. package/tests/service/evolution-worker.correction-observer.test.ts +173 -0
  186. package/tests/service/evolution-worker.timeout.test.ts +11 -129
  187. package/tests/service/internalization-trigger-adapter.test.ts +251 -0
  188. package/tests/service/monitoring-query-service.test.ts +1 -47
  189. package/tests/service/queue-io.test.ts +1 -62
  190. package/tests/service/runtime-summary-service.test.ts +3 -1
  191. package/tests/service/workflow-watchdog.test.ts +0 -91
  192. package/tests/utils/file-lock.test.ts +5 -3
  193. package/tests/utils/session-key.test.ts +52 -0
  194. package/tests/utils/subagent-probe.test.ts +48 -1
  195. package/vitest.config.ts +4 -11
  196. package/.planning/codebase/ARCHITECTURE.md +0 -157
  197. package/.planning/codebase/CONCERNS.md +0 -145
  198. package/.planning/codebase/CONVENTIONS.md +0 -148
  199. package/.planning/codebase/INTEGRATIONS.md +0 -81
  200. package/.planning/codebase/STACK.md +0 -87
  201. package/.planning/codebase/STRUCTURE.md +0 -193
  202. package/.planning/codebase/TESTING.md +0 -243
  203. package/.planning/phases/01-basic-visualization/01-GAP-CLOSURE-VERIFICATION.md +0 -113
  204. package/docs/COMMAND_REFERENCE.md +0 -76
  205. package/docs/COMMAND_REFERENCE_EN.md +0 -79
  206. package/scripts/build-web.mjs +0 -46
  207. package/scripts/diagnose-nocturnal.mjs +0 -537
  208. package/scripts/seed-nocturnal-scenarios.mjs +0 -384
  209. package/src/commands/nocturnal-review.ts +0 -322
  210. package/src/commands/nocturnal-rollout.ts +0 -790
  211. package/src/commands/nocturnal-train.ts +0 -986
  212. package/src/commands/pd-reflect.ts +0 -88
  213. package/src/core/adaptive-thresholds.ts +0 -478
  214. package/src/core/diagnostician-task-store.ts +0 -192
  215. package/src/core/nocturnal-arbiter.ts +0 -715
  216. package/src/core/nocturnal-artifact-lineage.ts +0 -116
  217. package/src/core/nocturnal-artificer.ts +0 -257
  218. package/src/core/nocturnal-candidate-scoring.ts +0 -530
  219. package/src/core/nocturnal-compliance.ts +0 -1146
  220. package/src/core/nocturnal-dataset.ts +0 -763
  221. package/src/core/nocturnal-executability.ts +0 -428
  222. package/src/core/nocturnal-export.ts +0 -499
  223. package/src/core/nocturnal-paths.ts +0 -240
  224. package/src/core/nocturnal-reasoning-deriver.ts +0 -343
  225. package/src/core/nocturnal-rule-implementation-validator.ts +0 -246
  226. package/src/core/nocturnal-snapshot-contract.ts +0 -99
  227. package/src/core/nocturnal-trajectory-extractor.ts +0 -512
  228. package/src/core/nocturnal-trinity-types.ts +0 -218
  229. package/src/core/nocturnal-trinity.ts +0 -2680
  230. package/src/core/principle-internalization/deprecated-readiness.ts +0 -93
  231. package/src/core/principle-internalization/internalization-routing-policy.ts +0 -208
  232. package/src/core/principle-internalization/lifecycle-metrics.ts +0 -152
  233. package/src/http/principles-console-route.ts +0 -709
  234. package/src/service/central-health-service.ts +0 -49
  235. package/src/service/central-overview-service.ts +0 -138
  236. package/src/service/control-ui-query-service.ts +0 -900
  237. package/src/service/cooldown-strategy.ts +0 -97
  238. package/src/service/evolution-pain-context.ts +0 -79
  239. package/src/service/evolution-query-service.ts +0 -407
  240. package/src/service/health-query-service.ts +0 -1038
  241. package/src/service/nocturnal-config.ts +0 -214
  242. package/src/service/nocturnal-runtime.ts +0 -734
  243. package/src/service/nocturnal-service.ts +0 -1605
  244. package/src/service/nocturnal-target-selector.ts +0 -545
  245. package/src/service/sleep-cycle.ts +0 -157
  246. package/src/service/startup-reconciler.ts +0 -112
  247. package/src/service/subagent-workflow/correction-observer-types.ts +0 -82
  248. package/src/service/subagent-workflow/correction-observer-workflow-manager.ts +0 -250
  249. package/src/service/subagent-workflow/deep-reflect-workflow-manager.ts +0 -1
  250. package/src/service/subagent-workflow/dynamic-timeout.ts +0 -30
  251. package/src/service/subagent-workflow/empathy-observer-workflow-manager.ts +0 -268
  252. package/src/service/subagent-workflow/nocturnal-workflow-manager.ts +0 -795
  253. package/src/service/subagent-workflow/runtime-direct-driver.ts +0 -268
  254. package/src/service/subagent-workflow/workflow-manager-base.ts +0 -580
  255. package/src/tools/write-pain-flag.ts +0 -215
  256. package/templates/langs/en/skills/plan-script/SKILL.md +0 -32
  257. package/templates/langs/zh/skills/plan-script/SKILL.md +0 -32
  258. package/tests/commands/nocturnal-review.test.ts +0 -448
  259. package/tests/commands/nocturnal-train.test.ts +0 -97
  260. package/tests/commands/pd-reflect.test.ts +0 -49
  261. package/tests/core/adaptive-thresholds.test.ts +0 -261
  262. package/tests/core/nocturnal-arbiter.test.ts +0 -559
  263. package/tests/core/nocturnal-artifact-lineage.test.ts +0 -53
  264. package/tests/core/nocturnal-artificer.test.ts +0 -241
  265. package/tests/core/nocturnal-candidate-scoring.test.ts +0 -532
  266. package/tests/core/nocturnal-compliance-p-principles.test.ts +0 -133
  267. package/tests/core/nocturnal-compliance.test.ts +0 -646
  268. package/tests/core/nocturnal-dataset.test.ts +0 -892
  269. package/tests/core/nocturnal-e2e.test.ts +0 -234
  270. package/tests/core/nocturnal-executability.test.ts +0 -357
  271. package/tests/core/nocturnal-export.test.ts +0 -517
  272. package/tests/core/nocturnal-reasoning-deriver.test.ts +0 -372
  273. package/tests/core/nocturnal-reviewed-subset-comparison.test.ts +0 -428
  274. package/tests/core/nocturnal-rule-implementation-validator.test.ts +0 -127
  275. package/tests/core/nocturnal-snapshot-contract.test.ts +0 -121
  276. package/tests/core/nocturnal-trajectory-extractor.test.ts +0 -634
  277. package/tests/core/nocturnal-trinity.test.ts +0 -2053
  278. package/tests/core/pain-auto-repair.test.ts +0 -96
  279. package/tests/core/pain-integration.test.ts +0 -510
  280. package/tests/fixtures/nocturnal-reviewed-subset.json +0 -183
  281. package/tests/http/principles-console-route.test.ts +0 -162
  282. package/tests/integration/chaos-resilience.test.ts +0 -348
  283. package/tests/integration/empathy-workflow-integration.test.ts +0 -626
  284. package/tests/integration/pain-diagnostician-loop.e2e.test.ts +0 -380
  285. package/tests/service/control-ui-query-service.test.ts +0 -121
  286. package/tests/service/cooldown-strategy.test.ts +0 -164
  287. package/tests/service/data-endpoints-regression.test.ts +0 -834
  288. package/tests/service/empathy-observer-workflow-manager.test.ts +0 -175
  289. package/tests/service/evolution-worker.nocturnal.test.ts +0 -601
  290. package/tests/service/nocturnal-runtime-hardening.test.ts +0 -118
  291. package/tests/service/nocturnal-runtime.test.ts +0 -473
  292. package/tests/service/nocturnal-service-code-candidate.test.ts +0 -330
  293. package/tests/service/nocturnal-target-selector.test.ts +0 -615
  294. package/tests/service/startup-reconciler.test.ts +0 -148
  295. package/tests/tools/write-pain-flag.test.ts +0 -358
  296. package/ui/src/App.tsx +0 -45
  297. package/ui/src/api.ts +0 -220
  298. package/ui/src/charts.tsx +0 -955
  299. package/ui/src/components/ErrorState.tsx +0 -6
  300. package/ui/src/components/Loading.tsx +0 -13
  301. package/ui/src/components/ProtectedRoute.tsx +0 -12
  302. package/ui/src/components/Shell.tsx +0 -91
  303. package/ui/src/components/WorkspaceConfig.tsx +0 -178
  304. package/ui/src/components/index.ts +0 -5
  305. package/ui/src/context/auth.tsx +0 -80
  306. package/ui/src/context/theme.tsx +0 -66
  307. package/ui/src/hooks/useAutoRefresh.ts +0 -39
  308. package/ui/src/i18n/ui.ts +0 -473
  309. package/ui/src/main.tsx +0 -16
  310. package/ui/src/pages/EvolutionPage.tsx +0 -333
  311. package/ui/src/pages/FeedbackPage.tsx +0 -138
  312. package/ui/src/pages/GateMonitorPage.tsx +0 -136
  313. package/ui/src/pages/LoginPage.tsx +0 -89
  314. package/ui/src/pages/OverviewPage.tsx +0 -599
  315. package/ui/src/pages/SamplesPage.tsx +0 -174
  316. package/ui/src/pages/ThinkingModelsPage.tsx +0 -702
  317. package/ui/src/styles.css +0 -2020
  318. package/ui/src/types.ts +0 -384
  319. package/ui/src/utils/format.ts +0 -15
@@ -1,517 +0,0 @@
1
- import { describe, it, expect, beforeEach, afterEach } from 'vitest';
2
- import * as fs from 'fs';
3
- import * as path from 'path';
4
- import * as os from 'os';
5
- import {
6
- exportORPOSamples,
7
- verifyExportIntegrity,
8
- listExports,
9
- getExportManifest,
10
- } from '../../src/core/nocturnal-export.js';
11
- import type { NocturnalArtifact } from '../../src/core/nocturnal-arbiter.js';
12
- import {
13
- registerSample,
14
- listDatasetRecords,
15
- updateReviewStatus,
16
- getDatasetRecord,
17
- } from '../../src/core/nocturnal-dataset.js';
18
- import { appendArtifactLineageRecord } from '../../src/core/nocturnal-artifact-lineage.js';
19
- import type { NocturnalDatasetRecord } from '../../src/core/nocturnal-dataset.js';
20
-
21
- // ---------------------------------------------------------------------------
22
- // Test Fixtures
23
- // ---------------------------------------------------------------------------
24
-
25
- function makeArtifact(overrides: Partial<NocturnalArtifact> = {}): NocturnalArtifact {
26
- return {
27
- artifactId: 'a1b2c3d4-e5f6-7890-abcd-ef1234567890',
28
- sessionId: 'session-abc123',
29
- principleId: 'T-08',
30
- sourceSnapshotRef: 'snapshot-2026-03-27-001',
31
- badDecision: 'After bash command failed, immediately retried without diagnosing',
32
- betterDecision: 'Check the error message before retrying',
33
- rationale: 'Diagnosing failures prevents repeated failures and respects cost of each attempt',
34
- createdAt: '2026-03-27T12:00:00.000Z',
35
- ...overrides,
36
- };
37
- }
38
-
39
- function makeTmpDir(): string {
40
- return fs.mkdtempSync(path.join(os.tmpdir(), 'pd-nocturnal-export-test-'));
41
- }
42
-
43
- function rmdir(dir: string): void {
44
- try {
45
- if (fs.existsSync(dir)) {
46
- fs.rmSync(dir, { recursive: true, force: true });
47
- }
48
- } catch {
49
- // Ignore
50
- }
51
- }
52
-
53
- // ---------------------------------------------------------------------------
54
- // Helper: Setup fully export-ready sample
55
- // ---------------------------------------------------------------------------
56
-
57
- function setupExportReady(
58
- workspaceDir: string,
59
- artifactId: string,
60
- family: string = 'gpt-4'
61
- ): NocturnalDatasetRecord {
62
- const artifact = makeArtifact({ artifactId });
63
- const artifactPath = path.join(
64
- workspaceDir,
65
- '.state',
66
- 'nocturnal',
67
- 'samples',
68
- `${artifactId}.json`
69
- );
70
- fs.mkdirSync(path.dirname(artifactPath), { recursive: true });
71
- fs.writeFileSync(artifactPath, JSON.stringify({ ...artifact, status: 'approved' }), 'utf-8');
72
-
73
- const registered = registerSample(workspaceDir, artifact, artifactPath, family).record;
74
- updateReviewStatus(
75
- workspaceDir,
76
- registered.sampleFingerprint,
77
- 'approved_for_training',
78
- 'Approved for ORPO export test'
79
- );
80
- return getDatasetRecord(workspaceDir, registered.sampleFingerprint)!;
81
- }
82
-
83
- // ---------------------------------------------------------------------------
84
- // Tests: exportORPOSamples — basic
85
- // ---------------------------------------------------------------------------
86
-
87
- describe('NocturnalExport exportORPOSamples', () => {
88
- let tmpDir: string;
89
-
90
- beforeEach(() => {
91
- tmpDir = makeTmpDir();
92
- });
93
-
94
- afterEach(() => {
95
- rmdir(tmpDir);
96
- });
97
-
98
- it('exports approved samples to JSONL', () => {
99
- setupExportReady(tmpDir, 'art-export-1', 'gpt-4');
100
- setupExportReady(tmpDir, 'art-export-2', 'gpt-4');
101
-
102
- const result = exportORPOSamples(tmpDir, 'gpt-4');
103
-
104
- expect(result.success).toBe(true);
105
- expect(result.manifest).toBeDefined();
106
- expect(result.manifest!.sampleCount).toBe(2);
107
- expect(result.manifest!.targetModelFamily).toBe('gpt-4');
108
- expect(result.manifest!.exportId).toBeDefined();
109
- expect(result.manifest!.datasetFingerprint).toHaveLength(64);
110
-
111
- // Verify JSONL file exists
112
- const jsonlPath = result.manifest!.exportPath;
113
- expect(fs.existsSync(jsonlPath)).toBe(true);
114
-
115
- // Verify JSONL is parseable
116
- const content = fs.readFileSync(jsonlPath, 'utf-8');
117
- const lines = content.trim().split('\n').filter(Boolean);
118
- expect(lines).toHaveLength(2);
119
-
120
- for (const line of lines) {
121
- const sample = JSON.parse(line);
122
- expect(sample.prompt).toBeTruthy();
123
- expect(sample.chosen).toBeTruthy();
124
- expect(sample.rejected).toBeTruthy();
125
- expect(sample.rationale).toBeTruthy();
126
- expect(sample.datasetMetadata.exportId).toBe(result.manifest!.exportId);
127
- expect(sample.datasetMetadata.evidenceSummary.lineageStatus).toBe('unknown');
128
- }
129
- });
130
-
131
- it('degrades to evidence-bounded neutral text when lineage is missing', () => {
132
- setupExportReady(tmpDir, 'art-no-lineage', 'gpt-4');
133
-
134
- const result = exportORPOSamples(tmpDir, 'gpt-4');
135
-
136
- expect(result.success).toBe(true);
137
- const [sample] = fs.readFileSync(result.manifest!.exportPath, 'utf-8').trim().split('\n').map((line) => JSON.parse(line));
138
- expect(sample.prompt).toBe('Take the next action without verified source evidence.');
139
- expect(sample.rejected).toBe('Take the next action without verified source evidence.');
140
- expect(sample.rationale).toContain('Source evidence is unknown');
141
- expect(sample.datasetMetadata.evidenceSummary).toEqual({
142
- lineageStatus: 'unknown',
143
- painSignals: { status: 'unknown', count: null, ids: [] },
144
- gateBlocks: { status: 'unknown', count: null, ids: [] },
145
- });
146
- });
147
-
148
- it('exports observed lineage evidence when available', () => {
149
- const record = setupExportReady(tmpDir, 'art-with-lineage', 'gpt-4');
150
- appendArtifactLineageRecord(tmpDir, {
151
- artifactKind: 'behavioral-sample',
152
- artifactId: record.artifactId,
153
- principleId: record.principleId,
154
- ruleId: null,
155
- sessionId: record.sessionId,
156
- sourceSnapshotRef: record.sourceSnapshotRef,
157
- sourcePainIds: ['pain-1', 'pain-2'],
158
- sourceGateBlockIds: ['gate-1'],
159
- storagePath: record.artifactPath,
160
- implementationId: null,
161
- createdAt: record.createdAt,
162
- });
163
-
164
- const result = exportORPOSamples(tmpDir, 'gpt-4');
165
-
166
- expect(result.success).toBe(true);
167
- const [sample] = fs.readFileSync(result.manifest!.exportPath, 'utf-8').trim().split('\n').map((line) => JSON.parse(line));
168
- expect(sample.prompt).toContain('2 observed pain signals');
169
- expect(sample.rejected).toContain('1 observed gate blocks');
170
- expect(sample.rationale).toContain('Observed source evidence: 2 pain signals and 1 gate blocks');
171
- expect(sample.datasetMetadata.evidenceSummary.lineageStatus).toBe('observed');
172
- expect(sample.datasetMetadata.evidenceSummary.painSignals).toEqual({
173
- status: 'observed',
174
- count: 2,
175
- ids: ['pain-1', 'pain-2'],
176
- });
177
- expect(sample.datasetMetadata.evidenceSummary.gateBlocks).toEqual({
178
- status: 'observed',
179
- count: 1,
180
- ids: ['gate-1'],
181
- });
182
- });
183
-
184
- it('writes manifest alongside JSONL', () => {
185
- setupExportReady(tmpDir, 'art-manifest-1', 'gpt-4');
186
-
187
- const result = exportORPOSamples(tmpDir, 'gpt-4');
188
-
189
- expect(result.success).toBe(true);
190
- expect(fs.existsSync(result.manifest!.manifestPath)).toBe(true);
191
-
192
- const manifest = JSON.parse(fs.readFileSync(result.manifest!.manifestPath, 'utf-8'));
193
- expect(manifest.exportId).toBe(result.manifest!.exportId);
194
- expect(manifest.sampleCount).toBe(1);
195
- expect(manifest.datasetFingerprint).toBe(result.manifest!.datasetFingerprint);
196
- });
197
-
198
- it('returns empty result when no approved samples', () => {
199
- // Register but don't approve
200
- const artifact = makeArtifact({ artifactId: 'art-not-approved' });
201
- const artifactPath = path.join(
202
- tmpDir,
203
- '.state',
204
- 'nocturnal',
205
- 'samples',
206
- 'art-not-approved.json'
207
- );
208
- fs.mkdirSync(path.dirname(artifactPath), { recursive: true });
209
- fs.writeFileSync(artifactPath, JSON.stringify({ ...artifact, status: 'approved' }), 'utf-8');
210
- registerSample(tmpDir, artifact, artifactPath, 'gpt-4');
211
-
212
- const result = exportORPOSamples(tmpDir, 'gpt-4');
213
-
214
- expect(result.success).toBe(false);
215
- expect(result.emptyReason).toBe('no_approved_samples');
216
- });
217
-
218
- it('filters by targetModelFamily', () => {
219
- setupExportReady(tmpDir, 'art-gpt4', 'gpt-4');
220
- setupExportReady(tmpDir, 'art-claude', 'claude-3');
221
-
222
- const result = exportORPOSamples(tmpDir, 'gpt-4');
223
-
224
- expect(result.success).toBe(true);
225
- expect(result.manifest!.sampleCount).toBe(1);
226
- expect(result.manifest!.samples[0].artifactId).toBe('art-gpt4');
227
- });
228
-
229
- it('returns empty for family mismatch', () => {
230
- setupExportReady(tmpDir, 'art-claude', 'claude-3');
231
-
232
- const result = exportORPOSamples(tmpDir, 'gpt-4');
233
-
234
- expect(result.success).toBe(false);
235
- expect(result.emptyReason).toBe('family_mismatch');
236
- });
237
-
238
- it('exports all families when targetModelFamily is undefined', () => {
239
- setupExportReady(tmpDir, 'art-family-1', 'gpt-4');
240
- setupExportReady(tmpDir, 'art-family-2', 'claude-3');
241
-
242
- const result = exportORPOSamples(tmpDir);
243
-
244
- expect(result.success).toBe(true);
245
- expect(result.manifest!.sampleCount).toBe(2);
246
- expect(result.manifest!.targetModelFamily).toBe('all');
247
- });
248
-
249
- it('computes deterministic datasetFingerprint', () => {
250
- setupExportReady(tmpDir, 'art-det-1', 'gpt-4');
251
- setupExportReady(tmpDir, 'art-det-2', 'gpt-4');
252
-
253
- const result1 = exportORPOSamples(tmpDir, 'gpt-4');
254
- const manifest1 = result1.manifest!;
255
-
256
- // Export again — should get same datasetFingerprint
257
- const result2 = exportORPOSamples(tmpDir, 'gpt-4');
258
- const manifest2 = result2.manifest!;
259
-
260
- expect(manifest1.datasetFingerprint).toBe(manifest2.datasetFingerprint);
261
- });
262
-
263
- it('null-family samples cannot be exported — family binding is required', () => {
264
- // Register approved but with null family — should NOT be exported
265
- const artifact = makeArtifact({ artifactId: 'art-null-family' });
266
- const artifactPath = path.join(
267
- tmpDir,
268
- '.state',
269
- 'nocturnal',
270
- 'samples',
271
- 'art-null-family.json'
272
- );
273
- fs.mkdirSync(path.dirname(artifactPath), { recursive: true });
274
- fs.writeFileSync(artifactPath, JSON.stringify({ ...artifact, status: 'approved' }), 'utf-8');
275
- const record = registerSample(tmpDir, artifact, artifactPath, null).record;
276
- updateReviewStatus(tmpDir, record.sampleFingerprint, 'approved_for_training', 'no family');
277
-
278
- // Export with explicit null family — null-family records must be skipped
279
- const result = exportORPOSamples(tmpDir, null);
280
-
281
- // All eligible records had null family and were skipped (all_samples_missing_artifacts)
282
- expect(result.success).toBe(false);
283
- expect(result.emptyReason).toBe('all_samples_missing_artifacts');
284
- });
285
-
286
- it('rejected samples are not exported', () => {
287
- // Register and reject
288
- const artifact = makeArtifact({ artifactId: 'art-rejected' });
289
- const artifactPath = path.join(
290
- tmpDir,
291
- '.state',
292
- 'nocturnal',
293
- 'samples',
294
- 'art-rejected.json'
295
- );
296
- fs.mkdirSync(path.dirname(artifactPath), { recursive: true });
297
- fs.writeFileSync(artifactPath, JSON.stringify({ ...artifact, status: 'approved' }), 'utf-8');
298
- const record = registerSample(tmpDir, artifact, artifactPath, 'gpt-4').record;
299
- updateReviewStatus(tmpDir, record.sampleFingerprint, 'rejected', 'Rejected for test');
300
-
301
- const result = exportORPOSamples(tmpDir, 'gpt-4');
302
-
303
- expect(result.success).toBe(false);
304
- expect(result.emptyReason).toBe('no_approved_samples');
305
- });
306
-
307
- it('superseded samples are not exported', () => {
308
- const artifact = makeArtifact({ artifactId: 'art-superseded' });
309
- const artifactPath = path.join(
310
- tmpDir,
311
- '.state',
312
- 'nocturnal',
313
- 'samples',
314
- 'art-superseded.json'
315
- );
316
- fs.mkdirSync(path.dirname(artifactPath), { recursive: true });
317
- fs.writeFileSync(artifactPath, JSON.stringify({ ...artifact, status: 'approved' }), 'utf-8');
318
- const record = registerSample(tmpDir, artifact, artifactPath, 'gpt-4').record;
319
- updateReviewStatus(tmpDir, record.sampleFingerprint, 'approved_for_training', 'ready');
320
- updateReviewStatus(tmpDir, record.sampleFingerprint, 'superseded', 'Superseded by newer sample');
321
-
322
- const result = exportORPOSamples(tmpDir, 'gpt-4');
323
-
324
- expect(result.success).toBe(false);
325
- expect(result.emptyReason).toBe('no_approved_samples');
326
- });
327
-
328
- it('missing artifact file excludes sample', () => {
329
- // Register record but don't create artifact file
330
- const artifact = makeArtifact({ artifactId: 'art-missing-file' });
331
- const artifactPath = path.join(
332
- tmpDir,
333
- '.state',
334
- 'nocturnal',
335
- 'samples',
336
- 'art-missing-file.json'
337
- );
338
- fs.mkdirSync(path.dirname(artifactPath), { recursive: true });
339
- // Don't write the file
340
- const record = registerSample(tmpDir, artifact, artifactPath, 'gpt-4').record;
341
- updateReviewStatus(tmpDir, record.sampleFingerprint, 'approved_for_training', 'missing file');
342
-
343
- const result = exportORPOSamples(tmpDir, 'gpt-4');
344
-
345
- expect(result.success).toBe(false);
346
- expect(result.emptyReason).toBe('all_samples_missing_artifacts');
347
- });
348
- });
349
-
350
- // ---------------------------------------------------------------------------
351
- // Tests: verifyExportIntegrity
352
- // ---------------------------------------------------------------------------
353
-
354
- describe('NocturnalExport verifyExportIntegrity', () => {
355
- let tmpDir: string;
356
-
357
- beforeEach(() => {
358
- tmpDir = makeTmpDir();
359
- });
360
-
361
- afterEach(() => {
362
- rmdir(tmpDir);
363
- });
364
-
365
- it('returns valid for intact export', () => {
366
- setupExportReady(tmpDir, 'art-verify-1', 'gpt-4');
367
-
368
- const exportResult = exportORPOSamples(tmpDir, 'gpt-4');
369
- const verification = verifyExportIntegrity(tmpDir, exportResult.manifest!.exportId);
370
-
371
- expect(verification).not.toBeNull();
372
- expect(verification!.valid).toBe(true);
373
- expect(verification!.computedFingerprint).toBe(verification!.manifestFingerprint);
374
- });
375
-
376
- it('returns null for non-existent export', () => {
377
- const verification = verifyExportIntegrity(tmpDir, 'nonexistent-export-id');
378
- expect(verification).toBeNull();
379
- });
380
-
381
- it('returns invalid if manifest is corrupted', () => {
382
- setupExportReady(tmpDir, 'art-corrupt', 'gpt-4');
383
-
384
- const exportResult = exportORPOSamples(tmpDir, 'gpt-4');
385
- const manifestPath = exportResult.manifest!.manifestPath;
386
- fs.writeFileSync(manifestPath, 'not valid json', 'utf-8');
387
-
388
- const verification = verifyExportIntegrity(tmpDir, exportResult.manifest!.exportId);
389
- expect(verification).toBeNull();
390
- });
391
- });
392
-
393
- // ---------------------------------------------------------------------------
394
- // Tests: listExports + getExportManifest
395
- // ---------------------------------------------------------------------------
396
-
397
- describe('NocturnalExport listExports + getExportManifest', () => {
398
- let tmpDir: string;
399
-
400
- beforeEach(() => {
401
- tmpDir = makeTmpDir();
402
- });
403
-
404
- afterEach(() => {
405
- rmdir(tmpDir);
406
- });
407
-
408
- it('lists all exports sorted by date', () => {
409
- setupExportReady(tmpDir, 'art-list-1', 'gpt-4');
410
- const r1 = exportORPOSamples(tmpDir, 'gpt-4');
411
-
412
- setupExportReady(tmpDir, 'art-list-2', 'gpt-4');
413
- const r2 = exportORPOSamples(tmpDir, 'gpt-4');
414
-
415
- const exports = listExports(tmpDir);
416
- expect(exports).toHaveLength(2);
417
- // Newest first
418
- expect(exports[0].exportId).toBe(r2.manifest!.exportId);
419
- expect(exports[1].exportId).toBe(r1.manifest!.exportId);
420
- });
421
-
422
- it('returns empty array when no exports', () => {
423
- const exports = listExports(tmpDir);
424
- expect(exports).toHaveLength(0);
425
- });
426
-
427
- it('getExportManifest returns correct manifest', () => {
428
- setupExportReady(tmpDir, 'art-getm', 'gpt-4');
429
- const exportResult = exportORPOSamples(tmpDir, 'gpt-4');
430
-
431
- const manifest = getExportManifest(tmpDir, exportResult.manifest!.exportId);
432
- expect(manifest).not.toBeNull();
433
- expect(manifest!.exportId).toBe(exportResult.manifest!.exportId);
434
- expect(manifest!.sampleCount).toBe(1);
435
- });
436
-
437
- it('getExportManifest returns null for non-existent', () => {
438
- const manifest = getExportManifest(tmpDir, 'nonexistent');
439
- expect(manifest).toBeNull();
440
- });
441
- });
442
-
443
- // ---------------------------------------------------------------------------
444
- // Integration: JSONL parseability + ORPO structure
445
- // ---------------------------------------------------------------------------
446
-
447
- describe('NocturnalExport JSONL parseability', () => {
448
- let tmpDir: string;
449
-
450
- beforeEach(() => {
451
- tmpDir = makeTmpDir();
452
- });
453
-
454
- afterEach(() => {
455
- rmdir(tmpDir);
456
- });
457
-
458
- it('every JSONL line is parseable and has ORPO structure', () => {
459
- setupExportReady(tmpDir, 'art-parse-1', 'gpt-4');
460
- setupExportReady(tmpDir, 'art-parse-2', 'gpt-4');
461
-
462
- const result = exportORPOSamples(tmpDir, 'gpt-4');
463
- const content = fs.readFileSync(result.manifest!.exportPath, 'utf-8');
464
- const lines = content.trim().split('\n').filter(Boolean);
465
-
466
- expect(lines.length).toBe(2);
467
-
468
- for (const line of lines) {
469
- const sample = JSON.parse(line);
470
-
471
- // ORPO required fields
472
- expect(typeof sample.sampleFingerprint).toBe('string');
473
- expect(typeof sample.artifactId).toBe('string');
474
- expect(typeof sample.sessionId).toBe('string');
475
- expect(typeof sample.principleId).toBe('string');
476
- expect(typeof sample.targetModelFamily).toBe('string');
477
- expect(typeof sample.prompt).toBe('string');
478
- expect(typeof sample.chosen).toBe('string');
479
- expect(typeof sample.rejected).toBe('string');
480
- expect(typeof sample.rationale).toBe('string');
481
- expect(typeof sample.datasetMetadata).toBe('object');
482
-
483
- // Metadata fields
484
- expect(typeof sample.datasetMetadata.sampleFingerprint).toBe('string');
485
- expect(typeof sample.datasetMetadata.artifactPath).toBe('string');
486
- expect(typeof sample.datasetMetadata.createdAt).toBe('string');
487
- expect(typeof sample.datasetMetadata.exportedAt).toBe('string');
488
- expect(typeof sample.datasetMetadata.exportId).toBe('string');
489
- expect(typeof sample.datasetMetadata.datasetFingerprint).toBe('string');
490
- }
491
- });
492
-
493
- it('prompt equals rejected (ORPO teaches to avoid badDecision)', () => {
494
- setupExportReady(tmpDir, 'art-orpo-check', 'gpt-4');
495
-
496
- const result = exportORPOSamples(tmpDir, 'gpt-4');
497
- const content = fs.readFileSync(result.manifest!.exportPath, 'utf-8');
498
- const lines = content.trim().split('\n').filter(Boolean);
499
- const sample = JSON.parse(lines[0]);
500
-
501
- expect(sample.prompt).toBe(sample.rejected);
502
- expect(sample.chosen).not.toBe(sample.rejected);
503
- });
504
-
505
- it('export is reproducible with same dataset', () => {
506
- setupExportReady(tmpDir, 'art-repro-1', 'gpt-4');
507
- setupExportReady(tmpDir, 'art-repro-2', 'gpt-4');
508
-
509
- const r1 = exportORPOSamples(tmpDir, 'gpt-4');
510
- const r2 = exportORPOSamples(tmpDir, 'gpt-4');
511
- const r3 = exportORPOSamples(tmpDir, 'gpt-4');
512
-
513
- expect(r1.manifest!.datasetFingerprint).toBe(r2.manifest!.datasetFingerprint);
514
- expect(r2.manifest!.datasetFingerprint).toBe(r3.manifest!.datasetFingerprint);
515
- expect(r1.manifest!.sampleCount).toBe(r2.manifest!.sampleCount);
516
- });
517
- });