principles-disciple 1.72.0 → 1.74.0

This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the package versions as they appear in their respective public registries.
Files changed (319)
  1. package/INSTALL.md +1 -3
  2. package/openclaw.plugin.json +10 -5
  3. package/package.json +17 -19
  4. package/scripts/acceptance-test.mjs +16 -73
  5. package/scripts/sync-plugin.mjs +382 -77
  6. package/src/commands/archive-impl.ts +2 -1
  7. package/src/commands/capabilities.ts +2 -2
  8. package/src/commands/context.ts +2 -2
  9. package/src/commands/disable-impl.ts +2 -1
  10. package/src/commands/evolution-status.ts +16 -16
  11. package/src/commands/export.ts +12 -67
  12. package/src/commands/pain.ts +91 -1
  13. package/src/commands/principle-rollback.ts +2 -1
  14. package/src/commands/promote-impl.ts +7 -43
  15. package/src/commands/rollback-impl.ts +2 -1
  16. package/src/commands/rollback.ts +2 -1
  17. package/src/commands/samples.ts +2 -1
  18. package/src/commands/thinking-os.ts +2 -1
  19. package/src/config/errors.ts +18 -2
  20. package/src/constants/diagnostician.ts +2 -2
  21. package/src/constants/tools.ts +2 -1
  22. package/src/core/__tests__/focus-history.test.ts +210 -0
  23. package/src/core/config.ts +1 -1
  24. package/src/core/correction-cue-learner.ts +2 -136
  25. package/src/core/correction-types.ts +16 -88
  26. package/src/core/dictionary.ts +19 -20
  27. package/src/core/empathy-keyword-matcher.ts +17 -289
  28. package/src/core/empathy-types.ts +18 -229
  29. package/src/core/event-log.ts +29 -132
  30. package/src/core/evolution-reducer.ts +21 -2
  31. package/src/core/evolution-types.ts +76 -464
  32. package/src/core/file-store.ts +80 -0
  33. package/src/core/focus-history.ts +228 -955
  34. package/src/core/local-worker-routing.ts +34 -314
  35. package/src/core/merge-gate-audit.ts +0 -195
  36. package/src/core/migration.ts +0 -1
  37. package/src/core/pain-diagnostic-gate.ts +154 -0
  38. package/src/core/pain-signal.ts +21 -138
  39. package/src/core/pain.ts +15 -88
  40. package/src/core/path-resolver.ts +0 -1
  41. package/src/core/paths.ts +0 -1
  42. package/src/core/pd-task-reconciler.ts +26 -115
  43. package/src/core/pd-task-service.ts +9 -9
  44. package/src/core/pd-task-types.ts +23 -127
  45. package/src/core/principle-compiler/__tests__/compiler-replay-gate.test.ts +174 -0
  46. package/src/core/principle-compiler/code-validator.ts +15 -42
  47. package/src/core/principle-compiler/compiler.ts +100 -15
  48. package/src/core/principle-compiler/index.ts +5 -2
  49. package/src/core/principle-compiler/template-generator.ts +4 -104
  50. package/src/core/principle-injection.ts +10 -202
  51. package/src/core/principle-internalization/filesystem-lifecycle-datasource.ts +42 -0
  52. package/src/core/principle-internalization/lifecycle-read-model.ts +39 -242
  53. package/src/core/principle-internalization/principle-lifecycle-service.ts +12 -10
  54. package/src/core/principle-tree-ledger-adapter.ts +145 -0
  55. package/src/core/principle-tree-ledger.ts +8 -6
  56. package/src/core/reflection/reflection-context.ts +14 -109
  57. package/src/core/replay-engine.ts +8 -500
  58. package/src/core/rule-host-helpers.ts +5 -35
  59. package/src/core/rule-host-types.ts +10 -82
  60. package/src/core/rule-host.ts +6 -63
  61. package/src/core/runtime-v2-prompt-activation-reader.ts +231 -0
  62. package/src/core/session-tracker.ts +87 -101
  63. package/src/core/shadow-observation-registry.ts +19 -48
  64. package/src/core/trajectory.ts +3 -1
  65. package/src/core/workflow-funnel-loader.ts +62 -68
  66. package/src/core/workspace-context.ts +46 -0
  67. package/src/core/workspace-dir-service.ts +1 -1
  68. package/src/core/workspace-dir-validation.ts +18 -9
  69. package/src/hooks/AGENTS.md +1 -1
  70. package/src/hooks/gate-block-helper.ts +71 -64
  71. package/src/hooks/gate.ts +183 -31
  72. package/src/hooks/lifecycle.ts +30 -32
  73. package/src/hooks/llm.ts +60 -32
  74. package/src/hooks/pain.ts +297 -103
  75. package/src/hooks/prompt.ts +400 -440
  76. package/src/hooks/subagent.ts +2 -29
  77. package/src/i18n/commands.ts +2 -10
  78. package/src/index.ts +95 -85
  79. package/src/openclaw-sdk.ts +311 -0
  80. package/src/service/central-database.ts +8 -4
  81. package/src/service/evolution-queue-migration.ts +2 -1
  82. package/src/service/evolution-worker.ts +163 -1786
  83. package/src/service/internalization-trigger-adapter.ts +302 -0
  84. package/src/service/keyword-optimization-service.ts +4 -4
  85. package/src/service/monitoring-query-service.ts +1 -215
  86. package/src/service/queue-io.ts +60 -331
  87. package/src/service/runtime-summary-service.ts +59 -16
  88. package/src/service/subagent-workflow/index.ts +0 -41
  89. package/src/service/subagent-workflow/types.ts +9 -120
  90. package/src/service/subagent-workflow/workflow-store.ts +2 -119
  91. package/src/service/workflow-watchdog.ts +0 -43
  92. package/src/types/event-payload.ts +16 -74
  93. package/src/types/event-types.ts +38 -547
  94. package/src/types/hygiene-types.ts +7 -30
  95. package/src/types/principle-tree-schema.ts +20 -222
  96. package/src/types/queue.ts +15 -70
  97. package/src/types/runtime-summary.ts +5 -49
  98. package/src/utils/io.ts +8 -20
  99. package/src/utils/retry.ts +1 -1
  100. package/src/utils/shadow-fingerprint.ts +2 -2
  101. package/src/utils/workspace-resolver.ts +50 -0
  102. package/templates/langs/en/core/AGENTS.md +7 -7
  103. package/templates/langs/en/core/BOOT.md +1 -1
  104. package/templates/langs/en/core/HEARTBEAT.md +2 -2
  105. package/templates/langs/en/principles/THINKING_OS.md +3 -2
  106. package/templates/langs/en/skills/ai-sprint-orchestration/references/agent-registry.json +1 -72
  107. package/templates/langs/en/skills/ai-sprint-orchestration/references/specs/bugfix-complex-template.json +6 -6
  108. package/templates/langs/en/skills/ai-sprint-orchestration/references/specs/feature-complex-template.json +6 -6
  109. package/templates/langs/en/skills/ai-sprint-orchestration/references/specs/workflow-validation-minimal-verify.json +2 -12
  110. package/templates/langs/en/skills/ai-sprint-orchestration/references/specs/workflow-validation-minimal.json +2 -12
  111. package/templates/langs/en/skills/ai-sprint-orchestration/scripts/run.mjs +51 -15
  112. package/templates/langs/en/skills/evolve-task/SKILL.md +3 -3
  113. package/templates/langs/en/skills/pd-cli-operator/SKILL.md +67 -0
  114. package/templates/langs/en/skills/pd-diagnostician/SKILL.md +1 -1
  115. package/templates/langs/en/skills/pd-mentor/SKILL.md +2 -3
  116. package/templates/langs/en/skills/pd-pain-signal/SKILL.md +17 -39
  117. package/templates/langs/en/skills/pd-runtime-v2/SKILL.md +61 -0
  118. package/templates/langs/zh/core/AGENTS.md +7 -7
  119. package/templates/langs/zh/core/BOOT.md +1 -1
  120. package/templates/langs/zh/core/HEARTBEAT.md +2 -2
  121. package/templates/langs/zh/principles/THINKING_OS.md +3 -2
  122. package/templates/langs/zh/skills/ai-sprint-orchestration/references/agent-registry.json +1 -72
  123. package/templates/langs/zh/skills/ai-sprint-orchestration/references/specs/bugfix-complex-template.json +6 -6
  124. package/templates/langs/zh/skills/ai-sprint-orchestration/references/specs/feature-complex-template.json +6 -6
  125. package/templates/langs/zh/skills/ai-sprint-orchestration/references/specs/nocturnal-trinity-quality-enhancement.json +8 -8
  126. package/templates/langs/zh/skills/ai-sprint-orchestration/references/specs/workflow-validation-minimal-verify.json +2 -12
  127. package/templates/langs/zh/skills/ai-sprint-orchestration/references/specs/workflow-validation-minimal.json +2 -12
  128. package/templates/langs/zh/skills/ai-sprint-orchestration/scripts/run.mjs +51 -15
  129. package/templates/langs/zh/skills/ai-sprint-orchestration/test/run.test.mjs +21 -5
  130. package/templates/langs/zh/skills/evolve-task/SKILL.md +4 -4
  131. package/templates/langs/zh/skills/pd-cli-operator/SKILL.md +67 -0
  132. package/templates/langs/zh/skills/pd-diagnostician/SKILL.md +1 -1
  133. package/templates/langs/zh/skills/pd-mentor/SKILL.md +2 -3
  134. package/templates/langs/zh/skills/pd-pain-signal/SKILL.md +17 -38
  135. package/templates/langs/zh/skills/pd-runtime-v2/SKILL.md +61 -0
  136. package/tests/build-artifacts.test.ts +1 -3
  137. package/tests/commands/evolution-status.test.ts +0 -118
  138. package/tests/core/bootstrap-rules.test.ts +1 -1
  139. package/tests/core/config.test.ts +1 -1
  140. package/tests/core/event-log.test.ts +35 -0
  141. package/tests/core/evolution-engine.test.ts +610 -0
  142. package/tests/core/file-store.test.ts +102 -0
  143. package/tests/core/focus-history.test.ts +203 -11
  144. package/tests/core/merge-gate-audit.test.ts +2 -169
  145. package/tests/core/migration.test.ts +7 -7
  146. package/tests/core/model-deployment-registry.test.ts +7 -1
  147. package/tests/core/model-training-registry.test.ts +19 -0
  148. package/tests/core/observability.test.ts +0 -1
  149. package/tests/core/pain-diagnostic-gate.test.ts +498 -0
  150. package/tests/core/pain.test.ts +0 -1
  151. package/tests/core/path-resolver.test.ts +1 -1
  152. package/tests/core/paths-refactor.test.ts +0 -22
  153. package/tests/core/principle-internalization/deprecated-readiness.test.ts +2 -2
  154. package/tests/core/principle-internalization/lifecycle-metrics.test.ts +2 -2
  155. package/tests/core/principle-internalization/{internalization-routing-policy.test.ts → lifecycle-routing-policy.test.ts} +6 -6
  156. package/tests/core/principle-internalization/lineage-source-retired.test.ts +56 -0
  157. package/tests/core/principle-internalization/principle-lifecycle-service.test.ts +1 -23
  158. package/tests/core/principle-tree-ledger-adapter.test.ts +253 -0
  159. package/tests/core/reflection-context.test.ts +0 -14
  160. package/tests/core/replay-engine.test.ts +127 -215
  161. package/tests/core/rule-host-helpers.test.ts +2 -2
  162. package/tests/core/rule-implementation-runtime.test.ts +0 -27
  163. package/tests/core/workflow-funnel-loader.test.ts +162 -0
  164. package/tests/core/workspace-context.test.ts +2 -2
  165. package/tests/core/workspace-dir-validation.test.ts +8 -1
  166. package/tests/core-anti-growth.test.ts +191 -0
  167. package/tests/hook-workspace-nextaction-contract.test.ts +42 -0
  168. package/tests/hooks/confirm-first-removal.test.ts +188 -0
  169. package/tests/hooks/gate-auto-correct-shadow.test.ts +310 -0
  170. package/tests/hooks/gate-auto-correct.test.ts +665 -0
  171. package/tests/hooks/gate-no-path-write-tool.test.ts +172 -0
  172. package/tests/hooks/gate-rule-host-pipeline.test.ts +2 -1
  173. package/tests/hooks/pain.test.ts +269 -12
  174. package/tests/hooks/prompt-characterization.test.ts +500 -0
  175. package/tests/hooks/prompt-size-guard.test.ts +32 -17
  176. package/tests/hooks/runtime-v2-prompt-activation.test.ts +869 -0
  177. package/tests/index.test.ts +94 -1
  178. package/tests/integration/auto-entry-gate.test.ts +248 -0
  179. package/tests/integration/internalization-trigger-guard.test.ts +69 -0
  180. package/tests/integration/m8-legacy-paths.test.ts +63 -0
  181. package/tests/integration/runtime-v2-pain-guard.test.ts +125 -0
  182. package/tests/plugin-config-resolution-cutover.test.ts +359 -0
  183. package/tests/runtime-v2-discovery-guard.test.ts +154 -0
  184. package/tests/service/central-database.test.ts +457 -0
  185. package/tests/service/evolution-worker.correction-observer.test.ts +173 -0
  186. package/tests/service/evolution-worker.timeout.test.ts +11 -129
  187. package/tests/service/internalization-trigger-adapter.test.ts +251 -0
  188. package/tests/service/monitoring-query-service.test.ts +1 -47
  189. package/tests/service/queue-io.test.ts +1 -62
  190. package/tests/service/runtime-summary-service.test.ts +3 -1
  191. package/tests/service/workflow-watchdog.test.ts +0 -91
  192. package/tests/utils/file-lock.test.ts +5 -3
  193. package/tests/utils/session-key.test.ts +52 -0
  194. package/tests/utils/subagent-probe.test.ts +48 -1
  195. package/vitest.config.ts +4 -11
  196. package/.planning/codebase/ARCHITECTURE.md +0 -157
  197. package/.planning/codebase/CONCERNS.md +0 -145
  198. package/.planning/codebase/CONVENTIONS.md +0 -148
  199. package/.planning/codebase/INTEGRATIONS.md +0 -81
  200. package/.planning/codebase/STACK.md +0 -87
  201. package/.planning/codebase/STRUCTURE.md +0 -193
  202. package/.planning/codebase/TESTING.md +0 -243
  203. package/.planning/phases/01-basic-visualization/01-GAP-CLOSURE-VERIFICATION.md +0 -113
  204. package/docs/COMMAND_REFERENCE.md +0 -76
  205. package/docs/COMMAND_REFERENCE_EN.md +0 -79
  206. package/scripts/build-web.mjs +0 -46
  207. package/scripts/diagnose-nocturnal.mjs +0 -537
  208. package/scripts/seed-nocturnal-scenarios.mjs +0 -384
  209. package/src/commands/nocturnal-review.ts +0 -322
  210. package/src/commands/nocturnal-rollout.ts +0 -790
  211. package/src/commands/nocturnal-train.ts +0 -986
  212. package/src/commands/pd-reflect.ts +0 -88
  213. package/src/core/adaptive-thresholds.ts +0 -478
  214. package/src/core/diagnostician-task-store.ts +0 -192
  215. package/src/core/nocturnal-arbiter.ts +0 -715
  216. package/src/core/nocturnal-artifact-lineage.ts +0 -116
  217. package/src/core/nocturnal-artificer.ts +0 -257
  218. package/src/core/nocturnal-candidate-scoring.ts +0 -530
  219. package/src/core/nocturnal-compliance.ts +0 -1146
  220. package/src/core/nocturnal-dataset.ts +0 -763
  221. package/src/core/nocturnal-executability.ts +0 -428
  222. package/src/core/nocturnal-export.ts +0 -499
  223. package/src/core/nocturnal-paths.ts +0 -240
  224. package/src/core/nocturnal-reasoning-deriver.ts +0 -343
  225. package/src/core/nocturnal-rule-implementation-validator.ts +0 -246
  226. package/src/core/nocturnal-snapshot-contract.ts +0 -99
  227. package/src/core/nocturnal-trajectory-extractor.ts +0 -512
  228. package/src/core/nocturnal-trinity-types.ts +0 -218
  229. package/src/core/nocturnal-trinity.ts +0 -2680
  230. package/src/core/principle-internalization/deprecated-readiness.ts +0 -93
  231. package/src/core/principle-internalization/internalization-routing-policy.ts +0 -208
  232. package/src/core/principle-internalization/lifecycle-metrics.ts +0 -152
  233. package/src/http/principles-console-route.ts +0 -709
  234. package/src/service/central-health-service.ts +0 -49
  235. package/src/service/central-overview-service.ts +0 -138
  236. package/src/service/control-ui-query-service.ts +0 -900
  237. package/src/service/cooldown-strategy.ts +0 -97
  238. package/src/service/evolution-pain-context.ts +0 -79
  239. package/src/service/evolution-query-service.ts +0 -407
  240. package/src/service/health-query-service.ts +0 -1038
  241. package/src/service/nocturnal-config.ts +0 -214
  242. package/src/service/nocturnal-runtime.ts +0 -734
  243. package/src/service/nocturnal-service.ts +0 -1605
  244. package/src/service/nocturnal-target-selector.ts +0 -545
  245. package/src/service/sleep-cycle.ts +0 -157
  246. package/src/service/startup-reconciler.ts +0 -112
  247. package/src/service/subagent-workflow/correction-observer-types.ts +0 -82
  248. package/src/service/subagent-workflow/correction-observer-workflow-manager.ts +0 -250
  249. package/src/service/subagent-workflow/deep-reflect-workflow-manager.ts +0 -1
  250. package/src/service/subagent-workflow/dynamic-timeout.ts +0 -30
  251. package/src/service/subagent-workflow/empathy-observer-workflow-manager.ts +0 -268
  252. package/src/service/subagent-workflow/nocturnal-workflow-manager.ts +0 -795
  253. package/src/service/subagent-workflow/runtime-direct-driver.ts +0 -268
  254. package/src/service/subagent-workflow/workflow-manager-base.ts +0 -580
  255. package/src/tools/write-pain-flag.ts +0 -215
  256. package/templates/langs/en/skills/plan-script/SKILL.md +0 -32
  257. package/templates/langs/zh/skills/plan-script/SKILL.md +0 -32
  258. package/tests/commands/nocturnal-review.test.ts +0 -448
  259. package/tests/commands/nocturnal-train.test.ts +0 -97
  260. package/tests/commands/pd-reflect.test.ts +0 -49
  261. package/tests/core/adaptive-thresholds.test.ts +0 -261
  262. package/tests/core/nocturnal-arbiter.test.ts +0 -559
  263. package/tests/core/nocturnal-artifact-lineage.test.ts +0 -53
  264. package/tests/core/nocturnal-artificer.test.ts +0 -241
  265. package/tests/core/nocturnal-candidate-scoring.test.ts +0 -532
  266. package/tests/core/nocturnal-compliance-p-principles.test.ts +0 -133
  267. package/tests/core/nocturnal-compliance.test.ts +0 -646
  268. package/tests/core/nocturnal-dataset.test.ts +0 -892
  269. package/tests/core/nocturnal-e2e.test.ts +0 -234
  270. package/tests/core/nocturnal-executability.test.ts +0 -357
  271. package/tests/core/nocturnal-export.test.ts +0 -517
  272. package/tests/core/nocturnal-reasoning-deriver.test.ts +0 -372
  273. package/tests/core/nocturnal-reviewed-subset-comparison.test.ts +0 -428
  274. package/tests/core/nocturnal-rule-implementation-validator.test.ts +0 -127
  275. package/tests/core/nocturnal-snapshot-contract.test.ts +0 -121
  276. package/tests/core/nocturnal-trajectory-extractor.test.ts +0 -634
  277. package/tests/core/nocturnal-trinity.test.ts +0 -2053
  278. package/tests/core/pain-auto-repair.test.ts +0 -96
  279. package/tests/core/pain-integration.test.ts +0 -510
  280. package/tests/fixtures/nocturnal-reviewed-subset.json +0 -183
  281. package/tests/http/principles-console-route.test.ts +0 -162
  282. package/tests/integration/chaos-resilience.test.ts +0 -348
  283. package/tests/integration/empathy-workflow-integration.test.ts +0 -626
  284. package/tests/integration/pain-diagnostician-loop.e2e.test.ts +0 -380
  285. package/tests/service/control-ui-query-service.test.ts +0 -121
  286. package/tests/service/cooldown-strategy.test.ts +0 -164
  287. package/tests/service/data-endpoints-regression.test.ts +0 -834
  288. package/tests/service/empathy-observer-workflow-manager.test.ts +0 -175
  289. package/tests/service/evolution-worker.nocturnal.test.ts +0 -601
  290. package/tests/service/nocturnal-runtime-hardening.test.ts +0 -118
  291. package/tests/service/nocturnal-runtime.test.ts +0 -473
  292. package/tests/service/nocturnal-service-code-candidate.test.ts +0 -330
  293. package/tests/service/nocturnal-target-selector.test.ts +0 -615
  294. package/tests/service/startup-reconciler.test.ts +0 -148
  295. package/tests/tools/write-pain-flag.test.ts +0 -358
  296. package/ui/src/App.tsx +0 -45
  297. package/ui/src/api.ts +0 -220
  298. package/ui/src/charts.tsx +0 -955
  299. package/ui/src/components/ErrorState.tsx +0 -6
  300. package/ui/src/components/Loading.tsx +0 -13
  301. package/ui/src/components/ProtectedRoute.tsx +0 -12
  302. package/ui/src/components/Shell.tsx +0 -91
  303. package/ui/src/components/WorkspaceConfig.tsx +0 -178
  304. package/ui/src/components/index.ts +0 -5
  305. package/ui/src/context/auth.tsx +0 -80
  306. package/ui/src/context/theme.tsx +0 -66
  307. package/ui/src/hooks/useAutoRefresh.ts +0 -39
  308. package/ui/src/i18n/ui.ts +0 -473
  309. package/ui/src/main.tsx +0 -16
  310. package/ui/src/pages/EvolutionPage.tsx +0 -333
  311. package/ui/src/pages/FeedbackPage.tsx +0 -138
  312. package/ui/src/pages/GateMonitorPage.tsx +0 -136
  313. package/ui/src/pages/LoginPage.tsx +0 -89
  314. package/ui/src/pages/OverviewPage.tsx +0 -599
  315. package/ui/src/pages/SamplesPage.tsx +0 -174
  316. package/ui/src/pages/ThinkingModelsPage.tsx +0 -702
  317. package/ui/src/styles.css +0 -2020
  318. package/ui/src/types.ts +0 -384
  319. package/ui/src/utils/format.ts +0 -15
@@ -1,601 +0,0 @@
1
- import { afterEach, beforeEach, describe, expect, it, vi } from 'vitest';
2
- import * as fs from 'fs';
3
- import * as os from 'os';
4
- import * as path from 'path';
5
-
6
- vi.mock('../../src/core/dictionary-service.js', () => ({
7
- DictionaryService: {
8
- get: vi.fn(() => ({ flush: vi.fn() })),
9
- },
10
- }));
11
-
12
- vi.mock('../../src/core/session-tracker.js', () => ({
13
- initPersistence: vi.fn(),
14
- flushAllSessions: vi.fn(),
15
- listSessions: vi.fn(() => []),
16
- }));
17
-
18
- const { mockStartWorkflow, mockGetWorkflowDebugSummary } = vi.hoisted(() => ({
19
- mockStartWorkflow: vi.fn(),
20
- mockGetWorkflowDebugSummary: vi.fn(),
21
- }));
22
-
23
- vi.mock('../../src/service/subagent-workflow/nocturnal-workflow-manager.js', () => ({
24
- NocturnalWorkflowManager: class {
25
- startWorkflow = mockStartWorkflow;
26
- getWorkflowDebugSummary = mockGetWorkflowDebugSummary;
27
- },
28
- nocturnalWorkflowSpec: {
29
- workflowType: 'nocturnal',
30
- transport: 'runtime_direct',
31
- timeoutMs: 15 * 60 * 1000,
32
- ttlMs: 30 * 60 * 1000,
33
- },
34
- }));
35
-
36
- const { mockGetNocturnalSessionSnapshot, mockListRecentNocturnalCandidateSessions } = vi.hoisted(() => ({
37
- mockGetNocturnalSessionSnapshot: vi.fn(),
38
- mockListRecentNocturnalCandidateSessions: vi.fn(() => [] as Array<{ sessionId: string; startedAt: string; failureCount: number; painEventCount: number; gateBlockCount: number }>),
39
- }));
40
-
41
- // Create a shared mock extractor instance so spy calls are tracked correctly
42
- const mockExtractorInstance = {
43
- getNocturnalSessionSnapshot: mockGetNocturnalSessionSnapshot,
44
- listRecentNocturnalCandidateSessions: mockListRecentNocturnalCandidateSessions,
45
- };
46
-
47
- vi.mock('../../src/core/nocturnal-trajectory-extractor.js', async () => {
48
- const actual = await vi.importActual<typeof import('../../src/core/nocturnal-trajectory-extractor.js')>(
49
- '../../src/core/nocturnal-trajectory-extractor.js'
50
- );
51
- return {
52
- ...actual,
53
- createNocturnalTrajectoryExtractor: vi.fn(() => mockExtractorInstance),
54
- };
55
- });
56
-
57
- import { EvolutionWorkerService } from '../../src/service/evolution-worker.js';
58
- import { readRecentPainContext } from '../../src/service/evolution-pain-context.js';
59
- import { WorkspaceContext } from '../../src/core/workspace-context.js';
60
- import { handlePdReflect } from '../../src/commands/pd-reflect.js';
61
- import { safeRmDir } from '../test-utils.js';
62
- import * as diagnosticianStore from '../../src/core/diagnostician-task-store.js';
63
-
64
- // Helper to create a mock API for E2E tests
65
- function createMockApi() {
66
- return {
67
- logger: { info: vi.fn(), warn: vi.fn(), error: vi.fn(), debug: vi.fn() },
68
- runtime: {
69
- agent: { runEmbeddedPiAgent: vi.fn() },
70
- system: {
71
- requestHeartbeatNow: vi.fn(),
72
- runHeartbeatOnce: vi.fn()
73
- }
74
- },
75
- } as any;
76
- }
77
-
78
- // Helper config for fast poll cycle
79
- const fastPollConfig = { get: (k: string) => k === 'intervals.worker_poll_ms' ? 100 : undefined };
80
-
81
- function readQueue(stateDir: string) {
82
- return JSON.parse(fs.readFileSync(path.join(stateDir, 'evolution_queue.json'), 'utf8'));
83
- }
84
-
85
- describe('EvolutionWorkerService nocturnal hardening', () => {
86
- beforeEach(() => {
87
- vi.useFakeTimers();
88
- vi.clearAllMocks();
89
- EvolutionWorkerService.api = null;
90
- });
91
-
92
- afterEach(() => {
93
- vi.useRealTimers();
94
- EvolutionWorkerService.api = null;
95
- });
96
-
97
- it('extracts session_id from .pain_flag file correctly', async () => {
98
- const workspaceDir = fs.mkdtempSync(path.join(os.tmpdir(), 'pd-pain-session-'));
99
- const stateDir = path.join(workspaceDir, '.state');
100
- fs.mkdirSync(stateDir, { recursive: true });
101
-
102
- // Write a pain flag WITH session_id
103
- fs.writeFileSync(
104
- path.join(stateDir, '.pain_flag'),
105
- `source: test_pain
106
- score: 80
107
- reason: test reason
108
- time: 2026-04-10T00:00:00.000Z
109
- session_id: explicit-session-from-pain
110
- `,
111
- 'utf8'
112
- );
113
-
114
- // Create a WorkspaceContext to test the function
115
- const wctx = WorkspaceContext.fromHookContext({ workspaceDir, stateDir, logger: console } as any);
116
-
117
- try {
118
- const context = readRecentPainContext(wctx);
119
-
120
- // Verify the session_id was extracted from the pain flag file
121
- expect(context.mostRecent).toBeDefined();
122
- expect(context.mostRecent!.sessionId).toBe('explicit-session-from-pain');
123
- expect(context.mostRecent!.score).toBe(80);
124
- expect(context.recentPainCount).toBe(1);
125
- } finally {
126
- safeRmDir(workspaceDir);
127
- }
128
- });
129
-
130
- it('treats malformed pain flag data as unusable context', async () => {
131
- const workspaceDir = fs.mkdtempSync(path.join(os.tmpdir(), 'pd-pain-invalid-'));
132
- const stateDir = path.join(workspaceDir, '.state');
133
- fs.mkdirSync(stateDir, { recursive: true });
134
-
135
- fs.writeFileSync(
136
- path.join(stateDir, '.pain_flag'),
137
- `source: test_pain
138
- score: 80`,
139
- 'utf8'
140
- );
141
-
142
- const wctx = WorkspaceContext.fromHookContext({ workspaceDir, stateDir, logger: console } as any);
143
-
144
- try {
145
- const context = readRecentPainContext(wctx);
146
- expect(context.mostRecent).toBeNull();
147
- expect(context.recentPainCount).toBe(0);
148
- } finally {
149
- safeRmDir(workspaceDir);
150
- }
151
- });
152
-
153
- // === End-to-End Contract Tests ===
154
-
155
- it('e2e: pain flag → worker enqueue → session_id is correctly attached to queued task', async () => {
156
- // This test verifies the contract: when a pain flag with session_id exists,
157
- // any sleep_reflection task created by the worker MUST carry that session_id
158
- // in its recentPainContext.mostRecent.sessionId field.
159
- const workspaceDir = fs.mkdtempSync(path.join(os.tmpdir(), 'pd-e2e-pain-enqueue-'));
160
- const stateDir = path.join(workspaceDir, '.state');
161
- fs.mkdirSync(stateDir, { recursive: true });
162
-
163
- // Write a pain flag WITH session_id
164
- fs.writeFileSync(
165
- path.join(stateDir, '.pain_flag'),
166
- `source: tool_failure
167
- score: 70
168
- reason: Test pain with session
169
- time: 2026-04-10T00:00:00.000Z
170
- session_id: pain-session-abc
171
- `,
172
- 'utf8'
173
- );
174
-
175
- // Verify the worker's readRecentPainContext extracts the session_id correctly
176
- const wctx = WorkspaceContext.fromHookContext({ workspaceDir, stateDir, logger: console } as any);
177
- const painContext = readRecentPainContext(wctx);
178
-
179
- // Contract: session_id must be extracted from the pain flag
180
- expect(painContext.mostRecent).toBeDefined();
181
- expect(painContext.mostRecent!.sessionId).toBe('pain-session-abc');
182
- expect(painContext.mostRecent!.score).toBe(70);
183
- expect(painContext.mostRecent!.source).toBe('tool_failure');
184
-
185
- // Now simulate what the worker does: attach this context to a queued task
186
- const simulatedTask = {
187
- id: 'simulated-task',
188
- taskKind: 'sleep_reflection',
189
- recentPainContext: painContext,
190
- };
191
-
192
- // Verify the contract holds end-to-end
193
- expect(simulatedTask.recentPainContext.mostRecent!.sessionId).toBe('pain-session-abc');
194
- });
195
-
196
- it('e2e: /pd-reflect command writes to workspace/.state, never to HOME/.state', async () => {
197
- const workspaceDir = fs.mkdtempSync(path.join(os.tmpdir(), 'pd-e2e-command-writes-'));
198
- const stateDir = path.join(workspaceDir, '.state');
199
- fs.mkdirSync(stateDir, { recursive: true });
200
- fs.mkdirSync(path.join(stateDir, 'sessions'), { recursive: true });
201
-
202
- // Ensure HOME/.state does NOT have the queue file
203
- const homeState = path.join(os.homedir(), '.state');
204
- const homeQueue = path.join(homeState, 'evolution_queue.json');
205
- const homeExistedBefore = fs.existsSync(homeQueue);
206
-
207
- try {
208
- // Execute the command with explicit workspaceDir
209
- const result = await handlePdReflect.handler({
210
- workspaceDir,
211
- channel: 'test',
212
- isAuthorizedSender: true,
213
- commandBody: '',
214
- config: {},
215
- api: { logger: { info: vi.fn(), warn: vi.fn(), error: vi.fn() } } as any,
216
- } as any);
217
-
218
- // Command should succeed
219
- expect(result.isError).toBeFalsy();
220
- expect(result.text).toContain('enqueued');
221
-
222
- // Queue file should exist in workspace
223
- const workspaceQueue = path.join(stateDir, 'evolution_queue.json');
224
- expect(fs.existsSync(workspaceQueue)).toBe(true);
225
-
226
- // Verify the task is in the workspace queue
227
- const queue = readQueue(stateDir);
228
- const manualTasks = queue.filter((t: any) => t.id.startsWith('manual_'));
229
- expect(manualTasks.length).toBe(1);
230
- expect(manualTasks[0].taskKind).toBe('sleep_reflection');
231
-
232
- // HOME/.state/evolution_queue.json should NOT have been created/modified by this command
233
- if (!homeExistedBefore) {
234
- expect(fs.existsSync(homeQueue)).toBe(false);
235
- }
236
- } finally {
237
- safeRmDir(workspaceDir);
238
- }
239
- });
240
-
241
- // === Nocturnal E2E Pipeline Tests (from PR #243) ===
242
-
243
- it('does not start a nocturnal workflow when only an empty fallback snapshot is available', async () => {
244
- const workspaceDir = fs.mkdtempSync(path.join(os.tmpdir(), 'pd-nocturnal-empty-'));
245
- const stateDir = path.join(workspaceDir, '.state');
246
- fs.mkdirSync(path.join(stateDir, 'sessions'), { recursive: true });
247
- fs.mkdirSync(path.join(stateDir, 'logs'), { recursive: true });
248
-
249
- mockGetNocturnalSessionSnapshot.mockReturnValue(null);
250
-
251
- fs.writeFileSync(
252
- path.join(stateDir, 'evolution_queue.json'),
253
- JSON.stringify([
254
- {
255
- id: 'sleep-empty',
256
- taskKind: 'sleep_reflection',
257
- priority: 'medium',
258
- score: 50,
259
- source: 'nocturnal',
260
- reason: 'Sleep reflection',
261
- timestamp: '2026-04-10T00:00:00.000Z',
262
- enqueued_at: '2026-04-10T00:00:00.000Z',
263
- status: 'pending',
264
- retryCount: 0,
265
- maxRetries: 1,
266
- recentPainContext: {
267
- mostRecent: null,
268
- recentPainCount: 0,
269
- recentMaxPainScore: 0,
270
- },
271
- },
272
- ], null, 2),
273
- 'utf8'
274
- );
275
-
276
- const mockApi = createMockApi();
277
- EvolutionWorkerService.api = mockApi;
278
-
279
- try {
280
- EvolutionWorkerService.start({
281
- workspaceDir,
282
- stateDir,
283
- logger: mockApi.logger,
284
- config: fastPollConfig,
285
- api: mockApi,
286
- } as any);
287
-
288
- await vi.advanceTimersByTimeAsync(6000);
289
-
290
- const queue = readQueue(stateDir);
291
- expect(queue[0].status).toBe('failed');
292
- expect(queue[0].lastError).toContain('invalid_snapshot_ingress');
293
- expect(queue[0].lastError).toContain('fallback snapshot must contain at least one pain signal');
294
- expect(queue[0].resultRef).toBeFalsy();
295
- expect(mockStartWorkflow).not.toHaveBeenCalled();
296
- } finally {
297
- EvolutionWorkerService.stop!({ workspaceDir, stateDir, logger: console } as any);
298
- safeRmDir(workspaceDir);
299
- }
300
- });
301
-
302
- it('uses stub_fallback for expected gateway-only background unavailability', async () => {
303
- const workspaceDir = fs.mkdtempSync(path.join(os.tmpdir(), 'pd-nocturnal-gateway-'));
304
- const stateDir = path.join(workspaceDir, '.state');
305
- fs.mkdirSync(path.join(stateDir, 'sessions'), { recursive: true });
306
- fs.mkdirSync(path.join(stateDir, 'logs'), { recursive: true });
307
-
308
- mockGetNocturnalSessionSnapshot.mockReturnValue({
309
- sessionId: 'sleep-gateway',
310
- startedAt: '2026-04-10T00:00:00.000Z',
311
- updatedAt: '2026-04-10T00:01:00.000Z',
312
- assistantTurns: [],
313
- userTurns: [],
314
- toolCalls: [],
315
- painEvents: [],
316
- gateBlocks: [],
317
- stats: { totalAssistantTurns: 1, totalToolCalls: 1, totalPainEvents: 0, totalGateBlocks: 0, failureCount: 0 },
318
- });
319
- mockStartWorkflow.mockResolvedValue({ workflowId: 'wf-1', childSessionKey: 'child-1', state: 'active' });
320
- mockGetWorkflowDebugSummary.mockResolvedValue({
321
- state: 'terminal_error',
322
- metadata: {},
323
- recentEvents: [{ reason: 'Error: Plugin runtime subagent methods are only available during a gateway request.', payload: {} }],
324
- });
325
-
326
- fs.writeFileSync(
327
- path.join(stateDir, 'evolution_queue.json'),
328
- JSON.stringify([
329
- {
330
- id: 'sleep-gateway',
331
- taskKind: 'sleep_reflection',
332
- priority: 'medium',
333
- score: 50,
334
- source: 'nocturnal',
335
- reason: 'Sleep reflection',
336
- timestamp: '2026-04-10T00:00:00.000Z',
337
- enqueued_at: '2026-04-10T00:00:00.000Z',
338
- status: 'pending',
339
- retryCount: 0,
340
- maxRetries: 1,
341
- recentPainContext: {
342
- mostRecent: { source: 'test', score: 50, reason: 'test', timestamp: '2026-04-10T00:00:00.000Z', sessionId: 'sleep-gateway' },
343
- recentPainCount: 1,
344
- recentMaxPainScore: 50,
345
- },
346
- },
347
- ], null, 2),
348
- 'utf8'
349
- );
350
-
351
- const mockApi = createMockApi();
352
- EvolutionWorkerService.api = mockApi;
353
-
354
- try {
355
- EvolutionWorkerService.start({
356
- workspaceDir,
357
- stateDir,
358
- logger: mockApi.logger,
359
- config: fastPollConfig,
360
- api: mockApi,
361
- } as any);
362
-
363
- await vi.advanceTimersByTimeAsync(6000);
364
-
365
- const queue = readQueue(stateDir);
366
- expect(queue[0].status).toBe('completed');
367
- expect(queue[0].resolution).toBe('stub_fallback');
368
- } finally {
369
- EvolutionWorkerService.stop!({ workspaceDir, stateDir, logger: console } as any);
370
- safeRmDir(workspaceDir);
371
- }
372
- });
373
-
374
- it('uses stub_fallback for expected subagent runtime unavailability', async () => {
375
- const workspaceDir = fs.mkdtempSync(path.join(os.tmpdir(), 'pd-nocturnal-subagent-'));
376
- const stateDir = path.join(workspaceDir, '.state');
377
- fs.mkdirSync(path.join(stateDir, 'sessions'), { recursive: true });
378
- fs.mkdirSync(path.join(stateDir, 'logs'), { recursive: true });
379
-
380
- mockGetNocturnalSessionSnapshot.mockReturnValue({
381
- sessionId: 'sleep-subagent',
382
- startedAt: '2026-04-10T00:00:00.000Z',
383
- updatedAt: '2026-04-10T00:01:00.000Z',
384
- assistantTurns: [],
385
- userTurns: [],
386
- toolCalls: [],
387
- painEvents: [],
388
- gateBlocks: [],
389
- stats: { totalAssistantTurns: 1, totalToolCalls: 1, totalPainEvents: 0, totalGateBlocks: 0, failureCount: 0 },
390
- });
391
- mockStartWorkflow.mockRejectedValue(new Error('NocturnalWorkflowManager: subagent runtime unavailable'));
392
-
393
- fs.writeFileSync(
394
- path.join(stateDir, 'evolution_queue.json'),
395
- JSON.stringify([
396
- {
397
- id: 'sleep-subagent',
398
- taskKind: 'sleep_reflection',
399
- priority: 'medium',
400
- score: 50,
401
- source: 'nocturnal',
402
- reason: 'Sleep reflection',
403
- timestamp: '2026-04-10T00:00:00.000Z',
404
- enqueued_at: '2026-04-10T00:00:00.000Z',
405
- status: 'pending',
406
- retryCount: 0,
407
- maxRetries: 1,
408
- recentPainContext: {
409
- mostRecent: { source: 'test', score: 50, reason: 'test', timestamp: '2026-04-10T00:00:00.000Z', sessionId: 'sleep-subagent' },
410
- recentPainCount: 1,
411
- recentMaxPainScore: 50,
412
- },
413
- },
414
- ], null, 2),
415
- 'utf8'
416
- );
417
-
418
- const mockApi = createMockApi();
419
- EvolutionWorkerService.api = mockApi;
420
-
421
- try {
422
- EvolutionWorkerService.start({
423
- workspaceDir,
424
- stateDir,
425
- logger: mockApi.logger,
426
- config: fastPollConfig,
427
- api: mockApi,
428
- } as any);
429
-
430
- await vi.advanceTimersByTimeAsync(6000);
431
-
432
- const queue = readQueue(stateDir);
433
- expect(queue[0].status).toBe('completed');
434
- expect(queue[0].resolution).toBe('stub_fallback');
435
- } finally {
436
- EvolutionWorkerService.stop!({ workspaceDir, stateDir, logger: console } as any);
437
- safeRmDir(workspaceDir);
438
- }
439
- });
440
-
441
- it('prioritizes pain signal session ID for snapshot extraction', async () => {
442
- const workspaceDir = fs.mkdtempSync(path.join(os.tmpdir(), 'pd-nocturnal-pain-session-'));
443
- const stateDir = path.join(workspaceDir, '.state');
444
- fs.mkdirSync(path.join(stateDir, 'sessions'), { recursive: true });
445
- fs.mkdirSync(path.join(stateDir, 'logs'), { recursive: true });
446
-
447
- const painSessionId = 'pain-signal-session-123';
448
-
449
- mockGetNocturnalSessionSnapshot.mockImplementation((sessionId: string) => {
450
- if (sessionId === painSessionId) {
451
- return {
452
- sessionId: painSessionId,
453
- startedAt: '2026-04-09T23:00:00.000Z',
454
- updatedAt: '2026-04-09T23:01:00.000Z',
455
- assistantTurns: [],
456
- userTurns: [],
457
- toolCalls: [],
458
- painEvents: [{ source: 'tool_failure', score: 70, severity: null, reason: 'test', createdAt: '2026-04-09T23:00:00.000Z' }],
459
- gateBlocks: [],
460
- stats: { totalAssistantTurns: 1, totalToolCalls: 1, failureCount: 1, totalPainEvents: 1, totalGateBlocks: 0 },
461
- };
462
- }
463
- return null;
464
- });
465
- mockStartWorkflow.mockResolvedValue({ workflowId: 'wf-pain', childSessionKey: 'child-pain', state: 'active' });
466
-
467
- fs.writeFileSync(
468
- path.join(stateDir, 'evolution_queue.json'),
469
- JSON.stringify([
470
- {
471
- id: 'sleep-pain-priority',
472
- taskKind: 'sleep_reflection',
473
- priority: 'medium',
474
- score: 50,
475
- source: 'nocturnal',
476
- reason: 'Sleep reflection',
477
- timestamp: '2026-04-10T00:00:00.000Z',
478
- enqueued_at: '2026-04-10T00:00:00.000Z',
479
- status: 'pending',
480
- retryCount: 0,
481
- maxRetries: 1,
482
- recentPainContext: {
483
- mostRecent: { source: 'tool_failure', score: 70, reason: 'test', timestamp: '2026-04-10T00:00:00.000Z', sessionId: painSessionId },
484
- recentPainCount: 1,
485
- recentMaxPainScore: 70,
486
- },
487
- },
488
- ], null, 2),
489
- 'utf8'
490
- );
491
-
492
- const mockApi = createMockApi();
493
- EvolutionWorkerService.api = mockApi;
494
-
495
- try {
496
- EvolutionWorkerService.start({
497
- workspaceDir,
498
- stateDir,
499
- logger: mockApi.logger,
500
- config: fastPollConfig,
501
- api: mockApi,
502
- } as any);
503
-
504
- await vi.advanceTimersByTimeAsync(6000);
505
-
506
- expect(mockStartWorkflow).toHaveBeenCalledTimes(1);
507
- const metadata = mockStartWorkflow.mock.calls[0][1].metadata;
508
- expect(metadata.snapshot.sessionId).toBe(painSessionId);
509
- } finally {
510
- EvolutionWorkerService.stop!({ workspaceDir, stateDir, logger: console } as any);
511
- safeRmDir(workspaceDir);
512
- }
513
- });
514
-
515
- it('e2e: bounded session selection — never picks a session newer than the triggering task', async () => {
516
- const workspaceDir = fs.mkdtempSync(path.join(os.tmpdir(), 'pd-nocturnal-e2e-bounded-'));
517
- const stateDir = path.join(workspaceDir, '.state');
518
- fs.mkdirSync(path.join(stateDir, 'sessions'), { recursive: true });
519
- fs.mkdirSync(path.join(stateDir, 'logs'), { recursive: true });
520
-
521
- const taskTimestamp = '2026-04-10T00:00:00.000Z';
522
- const validSessionTimestamp = '2026-04-09T23:00:00.000Z';
523
- const invalidSessionTimestamp = '2026-04-10T01:00:00.000Z';
524
-
525
- mockGetNocturnalSessionSnapshot.mockImplementation((sessionId: string) => {
526
- if (sessionId === 'valid-session') {
527
- return {
528
- sessionId: 'valid-session',
529
- startedAt: validSessionTimestamp,
530
- updatedAt: validSessionTimestamp,
531
- assistantTurns: [],
532
- userTurns: [],
533
- toolCalls: [],
534
- painEvents: [{ source: 'tool_failure', score: 50, severity: null, reason: 'test', createdAt: validSessionTimestamp }],
535
- gateBlocks: [],
536
- stats: { totalAssistantTurns: 1, totalToolCalls: 1, failureCount: 1, totalPainEvents: 1, totalGateBlocks: 0 },
537
- };
538
- }
539
- return null;
540
- });
541
- mockListRecentNocturnalCandidateSessions.mockReturnValue([
542
- { sessionId: 'valid-session', startedAt: validSessionTimestamp, failureCount: 1, painEventCount: 1, gateBlockCount: 0 },
543
- { sessionId: 'invalid-session', startedAt: invalidSessionTimestamp, failureCount: 1, painEventCount: 0, gateBlockCount: 0 },
544
- ]);
545
- mockStartWorkflow.mockResolvedValue({ workflowId: 'wf-bounded', childSessionKey: 'child-bounded', state: 'active' });
546
-
547
- fs.writeFileSync(
548
- path.join(stateDir, 'evolution_queue.json'),
549
- JSON.stringify([
550
- {
551
- id: 'sleep-e2e-bounded',
552
- taskKind: 'sleep_reflection',
553
- priority: 'medium',
554
- score: 50,
555
- source: 'nocturnal',
556
- reason: 'Sleep reflection',
557
- timestamp: taskTimestamp,
558
- enqueued_at: taskTimestamp,
559
- status: 'pending',
560
- retryCount: 0,
561
- maxRetries: 1,
562
- recentPainContext: {
563
- mostRecent: { source: 'test', score: 50, reason: 'test', timestamp: taskTimestamp, sessionId: 'pain-session' },
564
- recentPainCount: 1,
565
- recentMaxPainScore: 50,
566
- },
567
- },
568
- ], null, 2),
569
- 'utf8'
570
- );
571
-
572
- const mockApi = createMockApi();
573
- EvolutionWorkerService.api = mockApi;
574
-
575
- try {
576
- EvolutionWorkerService.start({
577
- workspaceDir,
578
- stateDir,
579
- logger: mockApi.logger,
580
- config: fastPollConfig,
581
- api: mockApi,
582
- } as any);
583
-
584
- await vi.advanceTimersByTimeAsync(6000);
585
-
586
- expect(mockStartWorkflow).toHaveBeenCalledTimes(1);
587
- const metadata = mockStartWorkflow.mock.calls[0][1].metadata;
588
- expect(metadata.snapshot.sessionId).toBe('valid-session');
589
- expect(new Date(metadata.snapshot.startedAt).getTime()).toBeLessThanOrEqual(new Date(taskTimestamp).getTime());
590
- } finally {
591
- EvolutionWorkerService.stop!({ workspaceDir, stateDir, logger: console } as any);
592
- safeRmDir(workspaceDir);
593
- }
594
- });
595
-
596
- // === PR #307 Fixes: Pain Diagnosis Timeout & Heartbeat Retry ===
597
-
598
- // Note: Testing requestHeartbeatNow call directly is complex due to
599
- // the async nature of checkPainFlag → doEnqueuePainTask → requestHeartbeatNow.
600
- // The fix is verified via E2E monitoring (PR #307 production verification).
601
- });