principles-disciple 1.72.0 → 1.73.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (309)
  1. package/openclaw.plugin.json +10 -5
  2. package/package.json +17 -19
  3. package/scripts/acceptance-test.mjs +16 -73
  4. package/scripts/sync-plugin.mjs +382 -77
  5. package/src/commands/archive-impl.ts +2 -1
  6. package/src/commands/capabilities.ts +2 -2
  7. package/src/commands/context.ts +2 -2
  8. package/src/commands/disable-impl.ts +2 -1
  9. package/src/commands/evolution-status.ts +16 -16
  10. package/src/commands/export.ts +12 -67
  11. package/src/commands/pain.ts +91 -1
  12. package/src/commands/principle-rollback.ts +2 -1
  13. package/src/commands/promote-impl.ts +7 -43
  14. package/src/commands/rollback-impl.ts +2 -1
  15. package/src/commands/rollback.ts +2 -1
  16. package/src/commands/samples.ts +2 -1
  17. package/src/commands/thinking-os.ts +2 -1
  18. package/src/config/errors.ts +18 -2
  19. package/src/constants/diagnostician.ts +2 -2
  20. package/src/constants/tools.ts +2 -1
  21. package/src/core/__tests__/focus-history.test.ts +210 -0
  22. package/src/core/config.ts +1 -1
  23. package/src/core/confirm-first-gate.ts +255 -0
  24. package/src/core/correction-cue-learner.ts +2 -136
  25. package/src/core/correction-types.ts +16 -88
  26. package/src/core/dictionary.ts +19 -20
  27. package/src/core/empathy-keyword-matcher.ts +17 -289
  28. package/src/core/empathy-types.ts +18 -229
  29. package/src/core/event-log.ts +38 -132
  30. package/src/core/evolution-reducer.ts +21 -2
  31. package/src/core/evolution-types.ts +76 -464
  32. package/src/core/file-store.ts +80 -0
  33. package/src/core/focus-history.ts +228 -955
  34. package/src/core/local-worker-routing.ts +34 -314
  35. package/src/core/merge-gate-audit.ts +0 -195
  36. package/src/core/pain-diagnostic-gate.ts +154 -0
  37. package/src/core/pain-signal.ts +21 -138
  38. package/src/core/pain.ts +15 -88
  39. package/src/core/pd-task-reconciler.ts +26 -115
  40. package/src/core/pd-task-service.ts +9 -9
  41. package/src/core/pd-task-types.ts +23 -127
  42. package/src/core/principle-compiler/__tests__/compiler-replay-gate.test.ts +174 -0
  43. package/src/core/principle-compiler/code-validator.ts +15 -42
  44. package/src/core/principle-compiler/compiler.ts +100 -15
  45. package/src/core/principle-compiler/index.ts +5 -2
  46. package/src/core/principle-compiler/template-generator.ts +4 -104
  47. package/src/core/principle-injection.ts +10 -202
  48. package/src/core/principle-internalization/filesystem-lifecycle-datasource.ts +42 -0
  49. package/src/core/principle-internalization/lifecycle-read-model.ts +39 -242
  50. package/src/core/principle-internalization/principle-lifecycle-service.ts +12 -10
  51. package/src/core/principle-tree-ledger-adapter.ts +145 -0
  52. package/src/core/principle-tree-ledger.ts +8 -6
  53. package/src/core/reflection/reflection-context.ts +14 -109
  54. package/src/core/replay-engine.ts +8 -500
  55. package/src/core/rule-host-helpers.ts +5 -35
  56. package/src/core/rule-host-types.ts +10 -82
  57. package/src/core/rule-host.ts +6 -63
  58. package/src/core/runtime-v2-prompt-activation-reader.ts +231 -0
  59. package/src/core/session-tracker.ts +87 -101
  60. package/src/core/shadow-observation-registry.ts +19 -48
  61. package/src/core/trajectory.ts +3 -1
  62. package/src/core/workflow-funnel-loader.ts +62 -68
  63. package/src/core/workspace-context.ts +46 -0
  64. package/src/core/workspace-dir-service.ts +1 -1
  65. package/src/core/workspace-dir-validation.ts +18 -9
  66. package/src/hooks/AGENTS.md +1 -1
  67. package/src/hooks/gate-block-helper.ts +46 -44
  68. package/src/hooks/gate.ts +207 -7
  69. package/src/hooks/lifecycle.ts +30 -32
  70. package/src/hooks/llm.ts +60 -32
  71. package/src/hooks/pain.ts +297 -103
  72. package/src/hooks/prompt.ts +459 -439
  73. package/src/hooks/subagent.ts +2 -29
  74. package/src/i18n/commands.ts +2 -10
  75. package/src/index.ts +95 -85
  76. package/src/openclaw-sdk.ts +311 -0
  77. package/src/service/central-database.ts +8 -4
  78. package/src/service/evolution-queue-migration.ts +2 -1
  79. package/src/service/evolution-worker.ts +163 -1786
  80. package/src/service/internalization-trigger-adapter.ts +302 -0
  81. package/src/service/keyword-optimization-service.ts +4 -4
  82. package/src/service/monitoring-query-service.ts +1 -215
  83. package/src/service/queue-io.ts +60 -331
  84. package/src/service/runtime-summary-service.ts +59 -16
  85. package/src/service/subagent-workflow/index.ts +0 -41
  86. package/src/service/subagent-workflow/types.ts +9 -120
  87. package/src/service/subagent-workflow/workflow-store.ts +2 -119
  88. package/src/service/workflow-watchdog.ts +0 -43
  89. package/src/types/event-payload.ts +16 -74
  90. package/src/types/event-types.ts +39 -547
  91. package/src/types/hygiene-types.ts +7 -30
  92. package/src/types/principle-tree-schema.ts +20 -222
  93. package/src/types/queue.ts +15 -70
  94. package/src/types/runtime-summary.ts +5 -49
  95. package/src/utils/io.ts +10 -0
  96. package/src/utils/retry.ts +1 -1
  97. package/src/utils/shadow-fingerprint.ts +2 -2
  98. package/src/utils/workspace-resolver.ts +50 -0
  99. package/templates/langs/en/core/AGENTS.md +2 -2
  100. package/templates/langs/en/core/BOOT.md +1 -1
  101. package/templates/langs/en/core/HEARTBEAT.md +2 -2
  102. package/templates/langs/en/skills/ai-sprint-orchestration/references/agent-registry.json +1 -72
  103. package/templates/langs/en/skills/ai-sprint-orchestration/references/specs/bugfix-complex-template.json +6 -6
  104. package/templates/langs/en/skills/ai-sprint-orchestration/references/specs/feature-complex-template.json +6 -6
  105. package/templates/langs/en/skills/ai-sprint-orchestration/references/specs/workflow-validation-minimal-verify.json +2 -12
  106. package/templates/langs/en/skills/ai-sprint-orchestration/references/specs/workflow-validation-minimal.json +2 -12
  107. package/templates/langs/en/skills/ai-sprint-orchestration/runtime/.gitignore +2 -2
  108. package/templates/langs/en/skills/ai-sprint-orchestration/scripts/run.mjs +51 -15
  109. package/templates/langs/en/skills/evolve-task/SKILL.md +1 -1
  110. package/templates/langs/en/skills/pd-cli-operator/SKILL.md +67 -0
  111. package/templates/langs/en/skills/pd-diagnostician/SKILL.md +1 -1
  112. package/templates/langs/en/skills/pd-mentor/SKILL.md +1 -1
  113. package/templates/langs/en/skills/pd-pain-signal/SKILL.md +17 -39
  114. package/templates/langs/en/skills/pd-runtime-v2/SKILL.md +61 -0
  115. package/templates/langs/zh/core/AGENTS.md +2 -2
  116. package/templates/langs/zh/core/BOOT.md +1 -1
  117. package/templates/langs/zh/core/HEARTBEAT.md +2 -2
  118. package/templates/langs/zh/skills/ai-sprint-orchestration/references/agent-registry.json +1 -72
  119. package/templates/langs/zh/skills/ai-sprint-orchestration/references/specs/bugfix-complex-template.json +6 -6
  120. package/templates/langs/zh/skills/ai-sprint-orchestration/references/specs/feature-complex-template.json +6 -6
  121. package/templates/langs/zh/skills/ai-sprint-orchestration/references/specs/nocturnal-trinity-quality-enhancement.json +8 -8
  122. package/templates/langs/zh/skills/ai-sprint-orchestration/references/specs/workflow-validation-minimal-verify.json +2 -12
  123. package/templates/langs/zh/skills/ai-sprint-orchestration/references/specs/workflow-validation-minimal.json +2 -12
  124. package/templates/langs/zh/skills/ai-sprint-orchestration/runtime/.gitignore +2 -2
  125. package/templates/langs/zh/skills/ai-sprint-orchestration/scripts/run.mjs +51 -15
  126. package/templates/langs/zh/skills/ai-sprint-orchestration/test/run.test.mjs +21 -5
  127. package/templates/langs/zh/skills/evolve-task/SKILL.md +2 -2
  128. package/templates/langs/zh/skills/pd-cli-operator/SKILL.md +67 -0
  129. package/templates/langs/zh/skills/pd-diagnostician/SKILL.md +1 -1
  130. package/templates/langs/zh/skills/pd-mentor/SKILL.md +1 -1
  131. package/templates/langs/zh/skills/pd-pain-signal/SKILL.md +17 -38
  132. package/templates/langs/zh/skills/pd-runtime-v2/SKILL.md +61 -0
  133. package/tests/build-artifacts.test.ts +1 -3
  134. package/tests/commands/evolution-status.test.ts +0 -118
  135. package/tests/core/bootstrap-rules.test.ts +1 -1
  136. package/tests/core/config.test.ts +1 -1
  137. package/tests/core/event-log.test.ts +35 -0
  138. package/tests/core/evolution-engine.test.ts +610 -0
  139. package/tests/core/file-store.test.ts +102 -0
  140. package/tests/core/focus-history.test.ts +203 -11
  141. package/tests/core/merge-gate-audit.test.ts +2 -169
  142. package/tests/core/model-deployment-registry.test.ts +7 -1
  143. package/tests/core/model-training-registry.test.ts +19 -0
  144. package/tests/core/observability.test.ts +0 -1
  145. package/tests/core/pain-diagnostic-gate.test.ts +498 -0
  146. package/tests/core/pain.test.ts +0 -1
  147. package/tests/core/principle-internalization/deprecated-readiness.test.ts +2 -2
  148. package/tests/core/principle-internalization/lifecycle-metrics.test.ts +2 -2
  149. package/tests/core/principle-internalization/{internalization-routing-policy.test.ts → lifecycle-routing-policy.test.ts} +6 -6
  150. package/tests/core/principle-internalization/lineage-source-retired.test.ts +56 -0
  151. package/tests/core/principle-internalization/principle-lifecycle-service.test.ts +1 -23
  152. package/tests/core/principle-tree-ledger-adapter.test.ts +253 -0
  153. package/tests/core/reflection-context.test.ts +0 -14
  154. package/tests/core/replay-engine.test.ts +127 -215
  155. package/tests/core/rule-host-helpers.test.ts +2 -2
  156. package/tests/core/rule-implementation-runtime.test.ts +0 -27
  157. package/tests/core/workflow-funnel-loader.test.ts +162 -0
  158. package/tests/core/workspace-dir-validation.test.ts +8 -1
  159. package/tests/core-anti-growth.test.ts +192 -0
  160. package/tests/hook-workspace-nextaction-contract.test.ts +42 -0
  161. package/tests/hooks/confirm-first-gate.test.ts +333 -0
  162. package/tests/hooks/gate-auto-correct-shadow.test.ts +310 -0
  163. package/tests/hooks/gate-auto-correct.test.ts +665 -0
  164. package/tests/hooks/gate-rule-host-pipeline.test.ts +2 -1
  165. package/tests/hooks/pain.test.ts +269 -12
  166. package/tests/hooks/prompt-characterization.test.ts +500 -0
  167. package/tests/hooks/prompt-size-guard.test.ts +32 -17
  168. package/tests/hooks/runtime-v2-prompt-activation.test.ts +869 -0
  169. package/tests/index.test.ts +94 -1
  170. package/tests/integration/auto-entry-gate.test.ts +248 -0
  171. package/tests/integration/internalization-trigger-guard.test.ts +69 -0
  172. package/tests/integration/m8-legacy-paths.test.ts +63 -0
  173. package/tests/integration/runtime-v2-pain-guard.test.ts +125 -0
  174. package/tests/plugin-config-resolution-cutover.test.ts +359 -0
  175. package/tests/runtime-v2-discovery-guard.test.ts +154 -0
  176. package/tests/service/central-database.test.ts +457 -0
  177. package/tests/service/evolution-worker.correction-observer.test.ts +173 -0
  178. package/tests/service/evolution-worker.timeout.test.ts +11 -129
  179. package/tests/service/internalization-trigger-adapter.test.ts +251 -0
  180. package/tests/service/monitoring-query-service.test.ts +1 -47
  181. package/tests/service/queue-io.test.ts +1 -62
  182. package/tests/service/runtime-summary-service.test.ts +3 -1
  183. package/tests/service/workflow-watchdog.test.ts +0 -91
  184. package/tests/utils/file-lock.test.ts +5 -3
  185. package/tests/utils/session-key.test.ts +52 -0
  186. package/tests/utils/subagent-probe.test.ts +48 -1
  187. package/vitest.config.ts +4 -11
  188. package/.planning/codebase/ARCHITECTURE.md +0 -157
  189. package/.planning/codebase/CONCERNS.md +0 -145
  190. package/.planning/codebase/CONVENTIONS.md +0 -148
  191. package/.planning/codebase/INTEGRATIONS.md +0 -81
  192. package/.planning/codebase/STACK.md +0 -87
  193. package/.planning/codebase/STRUCTURE.md +0 -193
  194. package/.planning/codebase/TESTING.md +0 -243
  195. package/.planning/phases/01-basic-visualization/01-GAP-CLOSURE-VERIFICATION.md +0 -113
  196. package/docs/COMMAND_REFERENCE.md +0 -76
  197. package/docs/COMMAND_REFERENCE_EN.md +0 -79
  198. package/scripts/build-web.mjs +0 -46
  199. package/scripts/diagnose-nocturnal.mjs +0 -537
  200. package/scripts/seed-nocturnal-scenarios.mjs +0 -384
  201. package/src/commands/nocturnal-review.ts +0 -322
  202. package/src/commands/nocturnal-rollout.ts +0 -790
  203. package/src/commands/nocturnal-train.ts +0 -986
  204. package/src/commands/pd-reflect.ts +0 -88
  205. package/src/core/adaptive-thresholds.ts +0 -478
  206. package/src/core/diagnostician-task-store.ts +0 -192
  207. package/src/core/nocturnal-arbiter.ts +0 -715
  208. package/src/core/nocturnal-artifact-lineage.ts +0 -116
  209. package/src/core/nocturnal-artificer.ts +0 -257
  210. package/src/core/nocturnal-candidate-scoring.ts +0 -530
  211. package/src/core/nocturnal-compliance.ts +0 -1146
  212. package/src/core/nocturnal-dataset.ts +0 -763
  213. package/src/core/nocturnal-executability.ts +0 -428
  214. package/src/core/nocturnal-export.ts +0 -499
  215. package/src/core/nocturnal-paths.ts +0 -240
  216. package/src/core/nocturnal-reasoning-deriver.ts +0 -343
  217. package/src/core/nocturnal-rule-implementation-validator.ts +0 -246
  218. package/src/core/nocturnal-snapshot-contract.ts +0 -99
  219. package/src/core/nocturnal-trajectory-extractor.ts +0 -512
  220. package/src/core/nocturnal-trinity-types.ts +0 -218
  221. package/src/core/nocturnal-trinity.ts +0 -2680
  222. package/src/core/principle-internalization/deprecated-readiness.ts +0 -93
  223. package/src/core/principle-internalization/internalization-routing-policy.ts +0 -208
  224. package/src/core/principle-internalization/lifecycle-metrics.ts +0 -152
  225. package/src/http/principles-console-route.ts +0 -709
  226. package/src/service/central-health-service.ts +0 -49
  227. package/src/service/central-overview-service.ts +0 -138
  228. package/src/service/control-ui-query-service.ts +0 -900
  229. package/src/service/cooldown-strategy.ts +0 -97
  230. package/src/service/evolution-pain-context.ts +0 -79
  231. package/src/service/evolution-query-service.ts +0 -407
  232. package/src/service/health-query-service.ts +0 -1038
  233. package/src/service/nocturnal-config.ts +0 -214
  234. package/src/service/nocturnal-runtime.ts +0 -734
  235. package/src/service/nocturnal-service.ts +0 -1605
  236. package/src/service/nocturnal-target-selector.ts +0 -545
  237. package/src/service/sleep-cycle.ts +0 -157
  238. package/src/service/startup-reconciler.ts +0 -112
  239. package/src/service/subagent-workflow/correction-observer-types.ts +0 -82
  240. package/src/service/subagent-workflow/correction-observer-workflow-manager.ts +0 -250
  241. package/src/service/subagent-workflow/deep-reflect-workflow-manager.ts +0 -1
  242. package/src/service/subagent-workflow/dynamic-timeout.ts +0 -30
  243. package/src/service/subagent-workflow/empathy-observer-workflow-manager.ts +0 -268
  244. package/src/service/subagent-workflow/nocturnal-workflow-manager.ts +0 -795
  245. package/src/service/subagent-workflow/runtime-direct-driver.ts +0 -268
  246. package/src/service/subagent-workflow/workflow-manager-base.ts +0 -580
  247. package/src/tools/write-pain-flag.ts +0 -215
  248. package/tests/commands/nocturnal-review.test.ts +0 -448
  249. package/tests/commands/nocturnal-train.test.ts +0 -97
  250. package/tests/commands/pd-reflect.test.ts +0 -49
  251. package/tests/core/adaptive-thresholds.test.ts +0 -261
  252. package/tests/core/nocturnal-arbiter.test.ts +0 -559
  253. package/tests/core/nocturnal-artifact-lineage.test.ts +0 -53
  254. package/tests/core/nocturnal-artificer.test.ts +0 -241
  255. package/tests/core/nocturnal-candidate-scoring.test.ts +0 -532
  256. package/tests/core/nocturnal-compliance-p-principles.test.ts +0 -133
  257. package/tests/core/nocturnal-compliance.test.ts +0 -646
  258. package/tests/core/nocturnal-dataset.test.ts +0 -892
  259. package/tests/core/nocturnal-e2e.test.ts +0 -234
  260. package/tests/core/nocturnal-executability.test.ts +0 -357
  261. package/tests/core/nocturnal-export.test.ts +0 -517
  262. package/tests/core/nocturnal-reasoning-deriver.test.ts +0 -372
  263. package/tests/core/nocturnal-reviewed-subset-comparison.test.ts +0 -428
  264. package/tests/core/nocturnal-rule-implementation-validator.test.ts +0 -127
  265. package/tests/core/nocturnal-snapshot-contract.test.ts +0 -121
  266. package/tests/core/nocturnal-trajectory-extractor.test.ts +0 -634
  267. package/tests/core/nocturnal-trinity.test.ts +0 -2053
  268. package/tests/core/pain-auto-repair.test.ts +0 -96
  269. package/tests/core/pain-integration.test.ts +0 -510
  270. package/tests/fixtures/nocturnal-reviewed-subset.json +0 -183
  271. package/tests/http/principles-console-route.test.ts +0 -162
  272. package/tests/integration/chaos-resilience.test.ts +0 -348
  273. package/tests/integration/empathy-workflow-integration.test.ts +0 -626
  274. package/tests/integration/pain-diagnostician-loop.e2e.test.ts +0 -380
  275. package/tests/service/control-ui-query-service.test.ts +0 -121
  276. package/tests/service/cooldown-strategy.test.ts +0 -164
  277. package/tests/service/data-endpoints-regression.test.ts +0 -834
  278. package/tests/service/empathy-observer-workflow-manager.test.ts +0 -175
  279. package/tests/service/evolution-worker.nocturnal.test.ts +0 -601
  280. package/tests/service/nocturnal-runtime-hardening.test.ts +0 -118
  281. package/tests/service/nocturnal-runtime.test.ts +0 -473
  282. package/tests/service/nocturnal-service-code-candidate.test.ts +0 -330
  283. package/tests/service/nocturnal-target-selector.test.ts +0 -615
  284. package/tests/service/startup-reconciler.test.ts +0 -148
  285. package/tests/tools/write-pain-flag.test.ts +0 -358
  286. package/ui/src/App.tsx +0 -45
  287. package/ui/src/api.ts +0 -220
  288. package/ui/src/charts.tsx +0 -955
  289. package/ui/src/components/ErrorState.tsx +0 -6
  290. package/ui/src/components/Loading.tsx +0 -13
  291. package/ui/src/components/ProtectedRoute.tsx +0 -12
  292. package/ui/src/components/Shell.tsx +0 -91
  293. package/ui/src/components/WorkspaceConfig.tsx +0 -178
  294. package/ui/src/components/index.ts +0 -5
  295. package/ui/src/context/auth.tsx +0 -80
  296. package/ui/src/context/theme.tsx +0 -66
  297. package/ui/src/hooks/useAutoRefresh.ts +0 -39
  298. package/ui/src/i18n/ui.ts +0 -473
  299. package/ui/src/main.tsx +0 -16
  300. package/ui/src/pages/EvolutionPage.tsx +0 -333
  301. package/ui/src/pages/FeedbackPage.tsx +0 -138
  302. package/ui/src/pages/GateMonitorPage.tsx +0 -136
  303. package/ui/src/pages/LoginPage.tsx +0 -89
  304. package/ui/src/pages/OverviewPage.tsx +0 -599
  305. package/ui/src/pages/SamplesPage.tsx +0 -174
  306. package/ui/src/pages/ThinkingModelsPage.tsx +0 -702
  307. package/ui/src/styles.css +0 -2020
  308. package/ui/src/types.ts +0 -384
  309. package/ui/src/utils/format.ts +0 -15
@@ -1,517 +0,0 @@
1
- import { describe, it, expect, beforeEach, afterEach } from 'vitest';
2
- import * as fs from 'fs';
3
- import * as path from 'path';
4
- import * as os from 'os';
5
- import {
6
- exportORPOSamples,
7
- verifyExportIntegrity,
8
- listExports,
9
- getExportManifest,
10
- } from '../../src/core/nocturnal-export.js';
11
- import type { NocturnalArtifact } from '../../src/core/nocturnal-arbiter.js';
12
- import {
13
- registerSample,
14
- listDatasetRecords,
15
- updateReviewStatus,
16
- getDatasetRecord,
17
- } from '../../src/core/nocturnal-dataset.js';
18
- import { appendArtifactLineageRecord } from '../../src/core/nocturnal-artifact-lineage.js';
19
- import type { NocturnalDatasetRecord } from '../../src/core/nocturnal-dataset.js';
20
-
21
- // ---------------------------------------------------------------------------
22
- // Test Fixtures
23
- // ---------------------------------------------------------------------------
24
-
25
- function makeArtifact(overrides: Partial<NocturnalArtifact> = {}): NocturnalArtifact {
26
- return {
27
- artifactId: 'a1b2c3d4-e5f6-7890-abcd-ef1234567890',
28
- sessionId: 'session-abc123',
29
- principleId: 'T-08',
30
- sourceSnapshotRef: 'snapshot-2026-03-27-001',
31
- badDecision: 'After bash command failed, immediately retried without diagnosing',
32
- betterDecision: 'Check the error message before retrying',
33
- rationale: 'Diagnosing failures prevents repeated failures and respects cost of each attempt',
34
- createdAt: '2026-03-27T12:00:00.000Z',
35
- ...overrides,
36
- };
37
- }
38
-
39
- function makeTmpDir(): string {
40
- return fs.mkdtempSync(path.join(os.tmpdir(), 'pd-nocturnal-export-test-'));
41
- }
42
-
43
- function rmdir(dir: string): void {
44
- try {
45
- if (fs.existsSync(dir)) {
46
- fs.rmSync(dir, { recursive: true, force: true });
47
- }
48
- } catch {
49
- // Ignore
50
- }
51
- }
52
-
53
- // ---------------------------------------------------------------------------
54
- // Helper: Setup fully export-ready sample
55
- // ---------------------------------------------------------------------------
56
-
57
- function setupExportReady(
58
- workspaceDir: string,
59
- artifactId: string,
60
- family: string = 'gpt-4'
61
- ): NocturnalDatasetRecord {
62
- const artifact = makeArtifact({ artifactId });
63
- const artifactPath = path.join(
64
- workspaceDir,
65
- '.state',
66
- 'nocturnal',
67
- 'samples',
68
- `${artifactId}.json`
69
- );
70
- fs.mkdirSync(path.dirname(artifactPath), { recursive: true });
71
- fs.writeFileSync(artifactPath, JSON.stringify({ ...artifact, status: 'approved' }), 'utf-8');
72
-
73
- const registered = registerSample(workspaceDir, artifact, artifactPath, family).record;
74
- updateReviewStatus(
75
- workspaceDir,
76
- registered.sampleFingerprint,
77
- 'approved_for_training',
78
- 'Approved for ORPO export test'
79
- );
80
- return getDatasetRecord(workspaceDir, registered.sampleFingerprint)!;
81
- }
82
-
83
- // ---------------------------------------------------------------------------
84
- // Tests: exportORPOSamples — basic
85
- // ---------------------------------------------------------------------------
86
-
87
- describe('NocturnalExport exportORPOSamples', () => {
88
- let tmpDir: string;
89
-
90
- beforeEach(() => {
91
- tmpDir = makeTmpDir();
92
- });
93
-
94
- afterEach(() => {
95
- rmdir(tmpDir);
96
- });
97
-
98
- it('exports approved samples to JSONL', () => {
99
- setupExportReady(tmpDir, 'art-export-1', 'gpt-4');
100
- setupExportReady(tmpDir, 'art-export-2', 'gpt-4');
101
-
102
- const result = exportORPOSamples(tmpDir, 'gpt-4');
103
-
104
- expect(result.success).toBe(true);
105
- expect(result.manifest).toBeDefined();
106
- expect(result.manifest!.sampleCount).toBe(2);
107
- expect(result.manifest!.targetModelFamily).toBe('gpt-4');
108
- expect(result.manifest!.exportId).toBeDefined();
109
- expect(result.manifest!.datasetFingerprint).toHaveLength(64);
110
-
111
- // Verify JSONL file exists
112
- const jsonlPath = result.manifest!.exportPath;
113
- expect(fs.existsSync(jsonlPath)).toBe(true);
114
-
115
- // Verify JSONL is parseable
116
- const content = fs.readFileSync(jsonlPath, 'utf-8');
117
- const lines = content.trim().split('\n').filter(Boolean);
118
- expect(lines).toHaveLength(2);
119
-
120
- for (const line of lines) {
121
- const sample = JSON.parse(line);
122
- expect(sample.prompt).toBeTruthy();
123
- expect(sample.chosen).toBeTruthy();
124
- expect(sample.rejected).toBeTruthy();
125
- expect(sample.rationale).toBeTruthy();
126
- expect(sample.datasetMetadata.exportId).toBe(result.manifest!.exportId);
127
- expect(sample.datasetMetadata.evidenceSummary.lineageStatus).toBe('unknown');
128
- }
129
- });
130
-
131
- it('degrades to evidence-bounded neutral text when lineage is missing', () => {
132
- setupExportReady(tmpDir, 'art-no-lineage', 'gpt-4');
133
-
134
- const result = exportORPOSamples(tmpDir, 'gpt-4');
135
-
136
- expect(result.success).toBe(true);
137
- const [sample] = fs.readFileSync(result.manifest!.exportPath, 'utf-8').trim().split('\n').map((line) => JSON.parse(line));
138
- expect(sample.prompt).toBe('Take the next action without verified source evidence.');
139
- expect(sample.rejected).toBe('Take the next action without verified source evidence.');
140
- expect(sample.rationale).toContain('Source evidence is unknown');
141
- expect(sample.datasetMetadata.evidenceSummary).toEqual({
142
- lineageStatus: 'unknown',
143
- painSignals: { status: 'unknown', count: null, ids: [] },
144
- gateBlocks: { status: 'unknown', count: null, ids: [] },
145
- });
146
- });
147
-
148
- it('exports observed lineage evidence when available', () => {
149
- const record = setupExportReady(tmpDir, 'art-with-lineage', 'gpt-4');
150
- appendArtifactLineageRecord(tmpDir, {
151
- artifactKind: 'behavioral-sample',
152
- artifactId: record.artifactId,
153
- principleId: record.principleId,
154
- ruleId: null,
155
- sessionId: record.sessionId,
156
- sourceSnapshotRef: record.sourceSnapshotRef,
157
- sourcePainIds: ['pain-1', 'pain-2'],
158
- sourceGateBlockIds: ['gate-1'],
159
- storagePath: record.artifactPath,
160
- implementationId: null,
161
- createdAt: record.createdAt,
162
- });
163
-
164
- const result = exportORPOSamples(tmpDir, 'gpt-4');
165
-
166
- expect(result.success).toBe(true);
167
- const [sample] = fs.readFileSync(result.manifest!.exportPath, 'utf-8').trim().split('\n').map((line) => JSON.parse(line));
168
- expect(sample.prompt).toContain('2 observed pain signals');
169
- expect(sample.rejected).toContain('1 observed gate blocks');
170
- expect(sample.rationale).toContain('Observed source evidence: 2 pain signals and 1 gate blocks');
171
- expect(sample.datasetMetadata.evidenceSummary.lineageStatus).toBe('observed');
172
- expect(sample.datasetMetadata.evidenceSummary.painSignals).toEqual({
173
- status: 'observed',
174
- count: 2,
175
- ids: ['pain-1', 'pain-2'],
176
- });
177
- expect(sample.datasetMetadata.evidenceSummary.gateBlocks).toEqual({
178
- status: 'observed',
179
- count: 1,
180
- ids: ['gate-1'],
181
- });
182
- });
183
-
184
- it('writes manifest alongside JSONL', () => {
185
- setupExportReady(tmpDir, 'art-manifest-1', 'gpt-4');
186
-
187
- const result = exportORPOSamples(tmpDir, 'gpt-4');
188
-
189
- expect(result.success).toBe(true);
190
- expect(fs.existsSync(result.manifest!.manifestPath)).toBe(true);
191
-
192
- const manifest = JSON.parse(fs.readFileSync(result.manifest!.manifestPath, 'utf-8'));
193
- expect(manifest.exportId).toBe(result.manifest!.exportId);
194
- expect(manifest.sampleCount).toBe(1);
195
- expect(manifest.datasetFingerprint).toBe(result.manifest!.datasetFingerprint);
196
- });
197
-
198
- it('returns empty result when no approved samples', () => {
199
- // Register but don't approve
200
- const artifact = makeArtifact({ artifactId: 'art-not-approved' });
201
- const artifactPath = path.join(
202
- tmpDir,
203
- '.state',
204
- 'nocturnal',
205
- 'samples',
206
- 'art-not-approved.json'
207
- );
208
- fs.mkdirSync(path.dirname(artifactPath), { recursive: true });
209
- fs.writeFileSync(artifactPath, JSON.stringify({ ...artifact, status: 'approved' }), 'utf-8');
210
- registerSample(tmpDir, artifact, artifactPath, 'gpt-4');
211
-
212
- const result = exportORPOSamples(tmpDir, 'gpt-4');
213
-
214
- expect(result.success).toBe(false);
215
- expect(result.emptyReason).toBe('no_approved_samples');
216
- });
217
-
218
- it('filters by targetModelFamily', () => {
219
- setupExportReady(tmpDir, 'art-gpt4', 'gpt-4');
220
- setupExportReady(tmpDir, 'art-claude', 'claude-3');
221
-
222
- const result = exportORPOSamples(tmpDir, 'gpt-4');
223
-
224
- expect(result.success).toBe(true);
225
- expect(result.manifest!.sampleCount).toBe(1);
226
- expect(result.manifest!.samples[0].artifactId).toBe('art-gpt4');
227
- });
228
-
229
- it('returns empty for family mismatch', () => {
230
- setupExportReady(tmpDir, 'art-claude', 'claude-3');
231
-
232
- const result = exportORPOSamples(tmpDir, 'gpt-4');
233
-
234
- expect(result.success).toBe(false);
235
- expect(result.emptyReason).toBe('family_mismatch');
236
- });
237
-
238
- it('exports all families when targetModelFamily is undefined', () => {
239
- setupExportReady(tmpDir, 'art-family-1', 'gpt-4');
240
- setupExportReady(tmpDir, 'art-family-2', 'claude-3');
241
-
242
- const result = exportORPOSamples(tmpDir);
243
-
244
- expect(result.success).toBe(true);
245
- expect(result.manifest!.sampleCount).toBe(2);
246
- expect(result.manifest!.targetModelFamily).toBe('all');
247
- });
248
-
249
- it('computes deterministic datasetFingerprint', () => {
250
- setupExportReady(tmpDir, 'art-det-1', 'gpt-4');
251
- setupExportReady(tmpDir, 'art-det-2', 'gpt-4');
252
-
253
- const result1 = exportORPOSamples(tmpDir, 'gpt-4');
254
- const manifest1 = result1.manifest!;
255
-
256
- // Export again — should get same datasetFingerprint
257
- const result2 = exportORPOSamples(tmpDir, 'gpt-4');
258
- const manifest2 = result2.manifest!;
259
-
260
- expect(manifest1.datasetFingerprint).toBe(manifest2.datasetFingerprint);
261
- });
262
-
263
- it('null-family samples cannot be exported — family binding is required', () => {
264
- // Register approved but with null family — should NOT be exported
265
- const artifact = makeArtifact({ artifactId: 'art-null-family' });
266
- const artifactPath = path.join(
267
- tmpDir,
268
- '.state',
269
- 'nocturnal',
270
- 'samples',
271
- 'art-null-family.json'
272
- );
273
- fs.mkdirSync(path.dirname(artifactPath), { recursive: true });
274
- fs.writeFileSync(artifactPath, JSON.stringify({ ...artifact, status: 'approved' }), 'utf-8');
275
- const record = registerSample(tmpDir, artifact, artifactPath, null).record;
276
- updateReviewStatus(tmpDir, record.sampleFingerprint, 'approved_for_training', 'no family');
277
-
278
- // Export with explicit null family — null-family records must be skipped
279
- const result = exportORPOSamples(tmpDir, null);
280
-
281
- // All eligible records had null family and were skipped (all_samples_missing_artifacts)
282
- expect(result.success).toBe(false);
283
- expect(result.emptyReason).toBe('all_samples_missing_artifacts');
284
- });
285
-
286
- it('rejected samples are not exported', () => {
287
- // Register and reject
288
- const artifact = makeArtifact({ artifactId: 'art-rejected' });
289
- const artifactPath = path.join(
290
- tmpDir,
291
- '.state',
292
- 'nocturnal',
293
- 'samples',
294
- 'art-rejected.json'
295
- );
296
- fs.mkdirSync(path.dirname(artifactPath), { recursive: true });
297
- fs.writeFileSync(artifactPath, JSON.stringify({ ...artifact, status: 'approved' }), 'utf-8');
298
- const record = registerSample(tmpDir, artifact, artifactPath, 'gpt-4').record;
299
- updateReviewStatus(tmpDir, record.sampleFingerprint, 'rejected', 'Rejected for test');
300
-
301
- const result = exportORPOSamples(tmpDir, 'gpt-4');
302
-
303
- expect(result.success).toBe(false);
304
- expect(result.emptyReason).toBe('no_approved_samples');
305
- });
306
-
307
- it('superseded samples are not exported', () => {
308
- const artifact = makeArtifact({ artifactId: 'art-superseded' });
309
- const artifactPath = path.join(
310
- tmpDir,
311
- '.state',
312
- 'nocturnal',
313
- 'samples',
314
- 'art-superseded.json'
315
- );
316
- fs.mkdirSync(path.dirname(artifactPath), { recursive: true });
317
- fs.writeFileSync(artifactPath, JSON.stringify({ ...artifact, status: 'approved' }), 'utf-8');
318
- const record = registerSample(tmpDir, artifact, artifactPath, 'gpt-4').record;
319
- updateReviewStatus(tmpDir, record.sampleFingerprint, 'approved_for_training', 'ready');
320
- updateReviewStatus(tmpDir, record.sampleFingerprint, 'superseded', 'Superseded by newer sample');
321
-
322
- const result = exportORPOSamples(tmpDir, 'gpt-4');
323
-
324
- expect(result.success).toBe(false);
325
- expect(result.emptyReason).toBe('no_approved_samples');
326
- });
327
-
328
- it('missing artifact file excludes sample', () => {
329
- // Register record but don't create artifact file
330
- const artifact = makeArtifact({ artifactId: 'art-missing-file' });
331
- const artifactPath = path.join(
332
- tmpDir,
333
- '.state',
334
- 'nocturnal',
335
- 'samples',
336
- 'art-missing-file.json'
337
- );
338
- fs.mkdirSync(path.dirname(artifactPath), { recursive: true });
339
- // Don't write the file
340
- const record = registerSample(tmpDir, artifact, artifactPath, 'gpt-4').record;
341
- updateReviewStatus(tmpDir, record.sampleFingerprint, 'approved_for_training', 'missing file');
342
-
343
- const result = exportORPOSamples(tmpDir, 'gpt-4');
344
-
345
- expect(result.success).toBe(false);
346
- expect(result.emptyReason).toBe('all_samples_missing_artifacts');
347
- });
348
- });
349
-
350
- // ---------------------------------------------------------------------------
351
- // Tests: verifyExportIntegrity
352
- // ---------------------------------------------------------------------------
353
-
354
- describe('NocturnalExport verifyExportIntegrity', () => {
355
- let tmpDir: string;
356
-
357
- beforeEach(() => {
358
- tmpDir = makeTmpDir();
359
- });
360
-
361
- afterEach(() => {
362
- rmdir(tmpDir);
363
- });
364
-
365
- it('returns valid for intact export', () => {
366
- setupExportReady(tmpDir, 'art-verify-1', 'gpt-4');
367
-
368
- const exportResult = exportORPOSamples(tmpDir, 'gpt-4');
369
- const verification = verifyExportIntegrity(tmpDir, exportResult.manifest!.exportId);
370
-
371
- expect(verification).not.toBeNull();
372
- expect(verification!.valid).toBe(true);
373
- expect(verification!.computedFingerprint).toBe(verification!.manifestFingerprint);
374
- });
375
-
376
- it('returns null for non-existent export', () => {
377
- const verification = verifyExportIntegrity(tmpDir, 'nonexistent-export-id');
378
- expect(verification).toBeNull();
379
- });
380
-
381
- it('returns invalid if manifest is corrupted', () => {
382
- setupExportReady(tmpDir, 'art-corrupt', 'gpt-4');
383
-
384
- const exportResult = exportORPOSamples(tmpDir, 'gpt-4');
385
- const manifestPath = exportResult.manifest!.manifestPath;
386
- fs.writeFileSync(manifestPath, 'not valid json', 'utf-8');
387
-
388
- const verification = verifyExportIntegrity(tmpDir, exportResult.manifest!.exportId);
389
- expect(verification).toBeNull();
390
- });
391
- });
392
-
393
- // ---------------------------------------------------------------------------
394
- // Tests: listExports + getExportManifest
395
- // ---------------------------------------------------------------------------
396
-
397
- describe('NocturnalExport listExports + getExportManifest', () => {
398
- let tmpDir: string;
399
-
400
- beforeEach(() => {
401
- tmpDir = makeTmpDir();
402
- });
403
-
404
- afterEach(() => {
405
- rmdir(tmpDir);
406
- });
407
-
408
- it('lists all exports sorted by date', () => {
409
- setupExportReady(tmpDir, 'art-list-1', 'gpt-4');
410
- const r1 = exportORPOSamples(tmpDir, 'gpt-4');
411
-
412
- setupExportReady(tmpDir, 'art-list-2', 'gpt-4');
413
- const r2 = exportORPOSamples(tmpDir, 'gpt-4');
414
-
415
- const exports = listExports(tmpDir);
416
- expect(exports).toHaveLength(2);
417
- // Newest first
418
- expect(exports[0].exportId).toBe(r2.manifest!.exportId);
419
- expect(exports[1].exportId).toBe(r1.manifest!.exportId);
420
- });
421
-
422
- it('returns empty array when no exports', () => {
423
- const exports = listExports(tmpDir);
424
- expect(exports).toHaveLength(0);
425
- });
426
-
427
- it('getExportManifest returns correct manifest', () => {
428
- setupExportReady(tmpDir, 'art-getm', 'gpt-4');
429
- const exportResult = exportORPOSamples(tmpDir, 'gpt-4');
430
-
431
- const manifest = getExportManifest(tmpDir, exportResult.manifest!.exportId);
432
- expect(manifest).not.toBeNull();
433
- expect(manifest!.exportId).toBe(exportResult.manifest!.exportId);
434
- expect(manifest!.sampleCount).toBe(1);
435
- });
436
-
437
- it('getExportManifest returns null for non-existent', () => {
438
- const manifest = getExportManifest(tmpDir, 'nonexistent');
439
- expect(manifest).toBeNull();
440
- });
441
- });
442
-
443
- // ---------------------------------------------------------------------------
444
- // Integration: JSONL parseability + ORPO structure
445
- // ---------------------------------------------------------------------------
446
-
447
- describe('NocturnalExport JSONL parseability', () => {
448
- let tmpDir: string;
449
-
450
- beforeEach(() => {
451
- tmpDir = makeTmpDir();
452
- });
453
-
454
- afterEach(() => {
455
- rmdir(tmpDir);
456
- });
457
-
458
- it('every JSONL line is parseable and has ORPO structure', () => {
459
- setupExportReady(tmpDir, 'art-parse-1', 'gpt-4');
460
- setupExportReady(tmpDir, 'art-parse-2', 'gpt-4');
461
-
462
- const result = exportORPOSamples(tmpDir, 'gpt-4');
463
- const content = fs.readFileSync(result.manifest!.exportPath, 'utf-8');
464
- const lines = content.trim().split('\n').filter(Boolean);
465
-
466
- expect(lines.length).toBe(2);
467
-
468
- for (const line of lines) {
469
- const sample = JSON.parse(line);
470
-
471
- // ORPO required fields
472
- expect(typeof sample.sampleFingerprint).toBe('string');
473
- expect(typeof sample.artifactId).toBe('string');
474
- expect(typeof sample.sessionId).toBe('string');
475
- expect(typeof sample.principleId).toBe('string');
476
- expect(typeof sample.targetModelFamily).toBe('string');
477
- expect(typeof sample.prompt).toBe('string');
478
- expect(typeof sample.chosen).toBe('string');
479
- expect(typeof sample.rejected).toBe('string');
480
- expect(typeof sample.rationale).toBe('string');
481
- expect(typeof sample.datasetMetadata).toBe('object');
482
-
483
- // Metadata fields
484
- expect(typeof sample.datasetMetadata.sampleFingerprint).toBe('string');
485
- expect(typeof sample.datasetMetadata.artifactPath).toBe('string');
486
- expect(typeof sample.datasetMetadata.createdAt).toBe('string');
487
- expect(typeof sample.datasetMetadata.exportedAt).toBe('string');
488
- expect(typeof sample.datasetMetadata.exportId).toBe('string');
489
- expect(typeof sample.datasetMetadata.datasetFingerprint).toBe('string');
490
- }
491
- });
492
-
493
- it('prompt equals rejected (ORPO teaches to avoid badDecision)', () => {
494
- setupExportReady(tmpDir, 'art-orpo-check', 'gpt-4');
495
-
496
- const result = exportORPOSamples(tmpDir, 'gpt-4');
497
- const content = fs.readFileSync(result.manifest!.exportPath, 'utf-8');
498
- const lines = content.trim().split('\n').filter(Boolean);
499
- const sample = JSON.parse(lines[0]);
500
-
501
- expect(sample.prompt).toBe(sample.rejected);
502
- expect(sample.chosen).not.toBe(sample.rejected);
503
- });
504
-
505
- it('export is reproducible with same dataset', () => {
506
- setupExportReady(tmpDir, 'art-repro-1', 'gpt-4');
507
- setupExportReady(tmpDir, 'art-repro-2', 'gpt-4');
508
-
509
- const r1 = exportORPOSamples(tmpDir, 'gpt-4');
510
- const r2 = exportORPOSamples(tmpDir, 'gpt-4');
511
- const r3 = exportORPOSamples(tmpDir, 'gpt-4');
512
-
513
- expect(r1.manifest!.datasetFingerprint).toBe(r2.manifest!.datasetFingerprint);
514
- expect(r2.manifest!.datasetFingerprint).toBe(r3.manifest!.datasetFingerprint);
515
- expect(r1.manifest!.sampleCount).toBe(r2.manifest!.sampleCount);
516
- });
517
- });