principles-disciple 1.72.0 → 1.73.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (309) hide show
  1. package/openclaw.plugin.json +10 -5
  2. package/package.json +17 -19
  3. package/scripts/acceptance-test.mjs +16 -73
  4. package/scripts/sync-plugin.mjs +382 -77
  5. package/src/commands/archive-impl.ts +2 -1
  6. package/src/commands/capabilities.ts +2 -2
  7. package/src/commands/context.ts +2 -2
  8. package/src/commands/disable-impl.ts +2 -1
  9. package/src/commands/evolution-status.ts +16 -16
  10. package/src/commands/export.ts +12 -67
  11. package/src/commands/pain.ts +91 -1
  12. package/src/commands/principle-rollback.ts +2 -1
  13. package/src/commands/promote-impl.ts +7 -43
  14. package/src/commands/rollback-impl.ts +2 -1
  15. package/src/commands/rollback.ts +2 -1
  16. package/src/commands/samples.ts +2 -1
  17. package/src/commands/thinking-os.ts +2 -1
  18. package/src/config/errors.ts +18 -2
  19. package/src/constants/diagnostician.ts +2 -2
  20. package/src/constants/tools.ts +2 -1
  21. package/src/core/__tests__/focus-history.test.ts +210 -0
  22. package/src/core/config.ts +1 -1
  23. package/src/core/confirm-first-gate.ts +255 -0
  24. package/src/core/correction-cue-learner.ts +2 -136
  25. package/src/core/correction-types.ts +16 -88
  26. package/src/core/dictionary.ts +19 -20
  27. package/src/core/empathy-keyword-matcher.ts +17 -289
  28. package/src/core/empathy-types.ts +18 -229
  29. package/src/core/event-log.ts +38 -132
  30. package/src/core/evolution-reducer.ts +21 -2
  31. package/src/core/evolution-types.ts +76 -464
  32. package/src/core/file-store.ts +80 -0
  33. package/src/core/focus-history.ts +228 -955
  34. package/src/core/local-worker-routing.ts +34 -314
  35. package/src/core/merge-gate-audit.ts +0 -195
  36. package/src/core/pain-diagnostic-gate.ts +154 -0
  37. package/src/core/pain-signal.ts +21 -138
  38. package/src/core/pain.ts +15 -88
  39. package/src/core/pd-task-reconciler.ts +26 -115
  40. package/src/core/pd-task-service.ts +9 -9
  41. package/src/core/pd-task-types.ts +23 -127
  42. package/src/core/principle-compiler/__tests__/compiler-replay-gate.test.ts +174 -0
  43. package/src/core/principle-compiler/code-validator.ts +15 -42
  44. package/src/core/principle-compiler/compiler.ts +100 -15
  45. package/src/core/principle-compiler/index.ts +5 -2
  46. package/src/core/principle-compiler/template-generator.ts +4 -104
  47. package/src/core/principle-injection.ts +10 -202
  48. package/src/core/principle-internalization/filesystem-lifecycle-datasource.ts +42 -0
  49. package/src/core/principle-internalization/lifecycle-read-model.ts +39 -242
  50. package/src/core/principle-internalization/principle-lifecycle-service.ts +12 -10
  51. package/src/core/principle-tree-ledger-adapter.ts +145 -0
  52. package/src/core/principle-tree-ledger.ts +8 -6
  53. package/src/core/reflection/reflection-context.ts +14 -109
  54. package/src/core/replay-engine.ts +8 -500
  55. package/src/core/rule-host-helpers.ts +5 -35
  56. package/src/core/rule-host-types.ts +10 -82
  57. package/src/core/rule-host.ts +6 -63
  58. package/src/core/runtime-v2-prompt-activation-reader.ts +231 -0
  59. package/src/core/session-tracker.ts +87 -101
  60. package/src/core/shadow-observation-registry.ts +19 -48
  61. package/src/core/trajectory.ts +3 -1
  62. package/src/core/workflow-funnel-loader.ts +62 -68
  63. package/src/core/workspace-context.ts +46 -0
  64. package/src/core/workspace-dir-service.ts +1 -1
  65. package/src/core/workspace-dir-validation.ts +18 -9
  66. package/src/hooks/AGENTS.md +1 -1
  67. package/src/hooks/gate-block-helper.ts +46 -44
  68. package/src/hooks/gate.ts +207 -7
  69. package/src/hooks/lifecycle.ts +30 -32
  70. package/src/hooks/llm.ts +60 -32
  71. package/src/hooks/pain.ts +297 -103
  72. package/src/hooks/prompt.ts +459 -439
  73. package/src/hooks/subagent.ts +2 -29
  74. package/src/i18n/commands.ts +2 -10
  75. package/src/index.ts +95 -85
  76. package/src/openclaw-sdk.ts +311 -0
  77. package/src/service/central-database.ts +8 -4
  78. package/src/service/evolution-queue-migration.ts +2 -1
  79. package/src/service/evolution-worker.ts +163 -1786
  80. package/src/service/internalization-trigger-adapter.ts +302 -0
  81. package/src/service/keyword-optimization-service.ts +4 -4
  82. package/src/service/monitoring-query-service.ts +1 -215
  83. package/src/service/queue-io.ts +60 -331
  84. package/src/service/runtime-summary-service.ts +59 -16
  85. package/src/service/subagent-workflow/index.ts +0 -41
  86. package/src/service/subagent-workflow/types.ts +9 -120
  87. package/src/service/subagent-workflow/workflow-store.ts +2 -119
  88. package/src/service/workflow-watchdog.ts +0 -43
  89. package/src/types/event-payload.ts +16 -74
  90. package/src/types/event-types.ts +39 -547
  91. package/src/types/hygiene-types.ts +7 -30
  92. package/src/types/principle-tree-schema.ts +20 -222
  93. package/src/types/queue.ts +15 -70
  94. package/src/types/runtime-summary.ts +5 -49
  95. package/src/utils/io.ts +10 -0
  96. package/src/utils/retry.ts +1 -1
  97. package/src/utils/shadow-fingerprint.ts +2 -2
  98. package/src/utils/workspace-resolver.ts +50 -0
  99. package/templates/langs/en/core/AGENTS.md +2 -2
  100. package/templates/langs/en/core/BOOT.md +1 -1
  101. package/templates/langs/en/core/HEARTBEAT.md +2 -2
  102. package/templates/langs/en/skills/ai-sprint-orchestration/references/agent-registry.json +1 -72
  103. package/templates/langs/en/skills/ai-sprint-orchestration/references/specs/bugfix-complex-template.json +6 -6
  104. package/templates/langs/en/skills/ai-sprint-orchestration/references/specs/feature-complex-template.json +6 -6
  105. package/templates/langs/en/skills/ai-sprint-orchestration/references/specs/workflow-validation-minimal-verify.json +2 -12
  106. package/templates/langs/en/skills/ai-sprint-orchestration/references/specs/workflow-validation-minimal.json +2 -12
  107. package/templates/langs/en/skills/ai-sprint-orchestration/runtime/.gitignore +2 -2
  108. package/templates/langs/en/skills/ai-sprint-orchestration/scripts/run.mjs +51 -15
  109. package/templates/langs/en/skills/evolve-task/SKILL.md +1 -1
  110. package/templates/langs/en/skills/pd-cli-operator/SKILL.md +67 -0
  111. package/templates/langs/en/skills/pd-diagnostician/SKILL.md +1 -1
  112. package/templates/langs/en/skills/pd-mentor/SKILL.md +1 -1
  113. package/templates/langs/en/skills/pd-pain-signal/SKILL.md +17 -39
  114. package/templates/langs/en/skills/pd-runtime-v2/SKILL.md +61 -0
  115. package/templates/langs/zh/core/AGENTS.md +2 -2
  116. package/templates/langs/zh/core/BOOT.md +1 -1
  117. package/templates/langs/zh/core/HEARTBEAT.md +2 -2
  118. package/templates/langs/zh/skills/ai-sprint-orchestration/references/agent-registry.json +1 -72
  119. package/templates/langs/zh/skills/ai-sprint-orchestration/references/specs/bugfix-complex-template.json +6 -6
  120. package/templates/langs/zh/skills/ai-sprint-orchestration/references/specs/feature-complex-template.json +6 -6
  121. package/templates/langs/zh/skills/ai-sprint-orchestration/references/specs/nocturnal-trinity-quality-enhancement.json +8 -8
  122. package/templates/langs/zh/skills/ai-sprint-orchestration/references/specs/workflow-validation-minimal-verify.json +2 -12
  123. package/templates/langs/zh/skills/ai-sprint-orchestration/references/specs/workflow-validation-minimal.json +2 -12
  124. package/templates/langs/zh/skills/ai-sprint-orchestration/runtime/.gitignore +2 -2
  125. package/templates/langs/zh/skills/ai-sprint-orchestration/scripts/run.mjs +51 -15
  126. package/templates/langs/zh/skills/ai-sprint-orchestration/test/run.test.mjs +21 -5
  127. package/templates/langs/zh/skills/evolve-task/SKILL.md +2 -2
  128. package/templates/langs/zh/skills/pd-cli-operator/SKILL.md +67 -0
  129. package/templates/langs/zh/skills/pd-diagnostician/SKILL.md +1 -1
  130. package/templates/langs/zh/skills/pd-mentor/SKILL.md +1 -1
  131. package/templates/langs/zh/skills/pd-pain-signal/SKILL.md +17 -38
  132. package/templates/langs/zh/skills/pd-runtime-v2/SKILL.md +61 -0
  133. package/tests/build-artifacts.test.ts +1 -3
  134. package/tests/commands/evolution-status.test.ts +0 -118
  135. package/tests/core/bootstrap-rules.test.ts +1 -1
  136. package/tests/core/config.test.ts +1 -1
  137. package/tests/core/event-log.test.ts +35 -0
  138. package/tests/core/evolution-engine.test.ts +610 -0
  139. package/tests/core/file-store.test.ts +102 -0
  140. package/tests/core/focus-history.test.ts +203 -11
  141. package/tests/core/merge-gate-audit.test.ts +2 -169
  142. package/tests/core/model-deployment-registry.test.ts +7 -1
  143. package/tests/core/model-training-registry.test.ts +19 -0
  144. package/tests/core/observability.test.ts +0 -1
  145. package/tests/core/pain-diagnostic-gate.test.ts +498 -0
  146. package/tests/core/pain.test.ts +0 -1
  147. package/tests/core/principle-internalization/deprecated-readiness.test.ts +2 -2
  148. package/tests/core/principle-internalization/lifecycle-metrics.test.ts +2 -2
  149. package/tests/core/principle-internalization/{internalization-routing-policy.test.ts → lifecycle-routing-policy.test.ts} +6 -6
  150. package/tests/core/principle-internalization/lineage-source-retired.test.ts +56 -0
  151. package/tests/core/principle-internalization/principle-lifecycle-service.test.ts +1 -23
  152. package/tests/core/principle-tree-ledger-adapter.test.ts +253 -0
  153. package/tests/core/reflection-context.test.ts +0 -14
  154. package/tests/core/replay-engine.test.ts +127 -215
  155. package/tests/core/rule-host-helpers.test.ts +2 -2
  156. package/tests/core/rule-implementation-runtime.test.ts +0 -27
  157. package/tests/core/workflow-funnel-loader.test.ts +162 -0
  158. package/tests/core/workspace-dir-validation.test.ts +8 -1
  159. package/tests/core-anti-growth.test.ts +192 -0
  160. package/tests/hook-workspace-nextaction-contract.test.ts +42 -0
  161. package/tests/hooks/confirm-first-gate.test.ts +333 -0
  162. package/tests/hooks/gate-auto-correct-shadow.test.ts +310 -0
  163. package/tests/hooks/gate-auto-correct.test.ts +665 -0
  164. package/tests/hooks/gate-rule-host-pipeline.test.ts +2 -1
  165. package/tests/hooks/pain.test.ts +269 -12
  166. package/tests/hooks/prompt-characterization.test.ts +500 -0
  167. package/tests/hooks/prompt-size-guard.test.ts +32 -17
  168. package/tests/hooks/runtime-v2-prompt-activation.test.ts +869 -0
  169. package/tests/index.test.ts +94 -1
  170. package/tests/integration/auto-entry-gate.test.ts +248 -0
  171. package/tests/integration/internalization-trigger-guard.test.ts +69 -0
  172. package/tests/integration/m8-legacy-paths.test.ts +63 -0
  173. package/tests/integration/runtime-v2-pain-guard.test.ts +125 -0
  174. package/tests/plugin-config-resolution-cutover.test.ts +359 -0
  175. package/tests/runtime-v2-discovery-guard.test.ts +154 -0
  176. package/tests/service/central-database.test.ts +457 -0
  177. package/tests/service/evolution-worker.correction-observer.test.ts +173 -0
  178. package/tests/service/evolution-worker.timeout.test.ts +11 -129
  179. package/tests/service/internalization-trigger-adapter.test.ts +251 -0
  180. package/tests/service/monitoring-query-service.test.ts +1 -47
  181. package/tests/service/queue-io.test.ts +1 -62
  182. package/tests/service/runtime-summary-service.test.ts +3 -1
  183. package/tests/service/workflow-watchdog.test.ts +0 -91
  184. package/tests/utils/file-lock.test.ts +5 -3
  185. package/tests/utils/session-key.test.ts +52 -0
  186. package/tests/utils/subagent-probe.test.ts +48 -1
  187. package/vitest.config.ts +4 -11
  188. package/.planning/codebase/ARCHITECTURE.md +0 -157
  189. package/.planning/codebase/CONCERNS.md +0 -145
  190. package/.planning/codebase/CONVENTIONS.md +0 -148
  191. package/.planning/codebase/INTEGRATIONS.md +0 -81
  192. package/.planning/codebase/STACK.md +0 -87
  193. package/.planning/codebase/STRUCTURE.md +0 -193
  194. package/.planning/codebase/TESTING.md +0 -243
  195. package/.planning/phases/01-basic-visualization/01-GAP-CLOSURE-VERIFICATION.md +0 -113
  196. package/docs/COMMAND_REFERENCE.md +0 -76
  197. package/docs/COMMAND_REFERENCE_EN.md +0 -79
  198. package/scripts/build-web.mjs +0 -46
  199. package/scripts/diagnose-nocturnal.mjs +0 -537
  200. package/scripts/seed-nocturnal-scenarios.mjs +0 -384
  201. package/src/commands/nocturnal-review.ts +0 -322
  202. package/src/commands/nocturnal-rollout.ts +0 -790
  203. package/src/commands/nocturnal-train.ts +0 -986
  204. package/src/commands/pd-reflect.ts +0 -88
  205. package/src/core/adaptive-thresholds.ts +0 -478
  206. package/src/core/diagnostician-task-store.ts +0 -192
  207. package/src/core/nocturnal-arbiter.ts +0 -715
  208. package/src/core/nocturnal-artifact-lineage.ts +0 -116
  209. package/src/core/nocturnal-artificer.ts +0 -257
  210. package/src/core/nocturnal-candidate-scoring.ts +0 -530
  211. package/src/core/nocturnal-compliance.ts +0 -1146
  212. package/src/core/nocturnal-dataset.ts +0 -763
  213. package/src/core/nocturnal-executability.ts +0 -428
  214. package/src/core/nocturnal-export.ts +0 -499
  215. package/src/core/nocturnal-paths.ts +0 -240
  216. package/src/core/nocturnal-reasoning-deriver.ts +0 -343
  217. package/src/core/nocturnal-rule-implementation-validator.ts +0 -246
  218. package/src/core/nocturnal-snapshot-contract.ts +0 -99
  219. package/src/core/nocturnal-trajectory-extractor.ts +0 -512
  220. package/src/core/nocturnal-trinity-types.ts +0 -218
  221. package/src/core/nocturnal-trinity.ts +0 -2680
  222. package/src/core/principle-internalization/deprecated-readiness.ts +0 -93
  223. package/src/core/principle-internalization/internalization-routing-policy.ts +0 -208
  224. package/src/core/principle-internalization/lifecycle-metrics.ts +0 -152
  225. package/src/http/principles-console-route.ts +0 -709
  226. package/src/service/central-health-service.ts +0 -49
  227. package/src/service/central-overview-service.ts +0 -138
  228. package/src/service/control-ui-query-service.ts +0 -900
  229. package/src/service/cooldown-strategy.ts +0 -97
  230. package/src/service/evolution-pain-context.ts +0 -79
  231. package/src/service/evolution-query-service.ts +0 -407
  232. package/src/service/health-query-service.ts +0 -1038
  233. package/src/service/nocturnal-config.ts +0 -214
  234. package/src/service/nocturnal-runtime.ts +0 -734
  235. package/src/service/nocturnal-service.ts +0 -1605
  236. package/src/service/nocturnal-target-selector.ts +0 -545
  237. package/src/service/sleep-cycle.ts +0 -157
  238. package/src/service/startup-reconciler.ts +0 -112
  239. package/src/service/subagent-workflow/correction-observer-types.ts +0 -82
  240. package/src/service/subagent-workflow/correction-observer-workflow-manager.ts +0 -250
  241. package/src/service/subagent-workflow/deep-reflect-workflow-manager.ts +0 -1
  242. package/src/service/subagent-workflow/dynamic-timeout.ts +0 -30
  243. package/src/service/subagent-workflow/empathy-observer-workflow-manager.ts +0 -268
  244. package/src/service/subagent-workflow/nocturnal-workflow-manager.ts +0 -795
  245. package/src/service/subagent-workflow/runtime-direct-driver.ts +0 -268
  246. package/src/service/subagent-workflow/workflow-manager-base.ts +0 -580
  247. package/src/tools/write-pain-flag.ts +0 -215
  248. package/tests/commands/nocturnal-review.test.ts +0 -448
  249. package/tests/commands/nocturnal-train.test.ts +0 -97
  250. package/tests/commands/pd-reflect.test.ts +0 -49
  251. package/tests/core/adaptive-thresholds.test.ts +0 -261
  252. package/tests/core/nocturnal-arbiter.test.ts +0 -559
  253. package/tests/core/nocturnal-artifact-lineage.test.ts +0 -53
  254. package/tests/core/nocturnal-artificer.test.ts +0 -241
  255. package/tests/core/nocturnal-candidate-scoring.test.ts +0 -532
  256. package/tests/core/nocturnal-compliance-p-principles.test.ts +0 -133
  257. package/tests/core/nocturnal-compliance.test.ts +0 -646
  258. package/tests/core/nocturnal-dataset.test.ts +0 -892
  259. package/tests/core/nocturnal-e2e.test.ts +0 -234
  260. package/tests/core/nocturnal-executability.test.ts +0 -357
  261. package/tests/core/nocturnal-export.test.ts +0 -517
  262. package/tests/core/nocturnal-reasoning-deriver.test.ts +0 -372
  263. package/tests/core/nocturnal-reviewed-subset-comparison.test.ts +0 -428
  264. package/tests/core/nocturnal-rule-implementation-validator.test.ts +0 -127
  265. package/tests/core/nocturnal-snapshot-contract.test.ts +0 -121
  266. package/tests/core/nocturnal-trajectory-extractor.test.ts +0 -634
  267. package/tests/core/nocturnal-trinity.test.ts +0 -2053
  268. package/tests/core/pain-auto-repair.test.ts +0 -96
  269. package/tests/core/pain-integration.test.ts +0 -510
  270. package/tests/fixtures/nocturnal-reviewed-subset.json +0 -183
  271. package/tests/http/principles-console-route.test.ts +0 -162
  272. package/tests/integration/chaos-resilience.test.ts +0 -348
  273. package/tests/integration/empathy-workflow-integration.test.ts +0 -626
  274. package/tests/integration/pain-diagnostician-loop.e2e.test.ts +0 -380
  275. package/tests/service/control-ui-query-service.test.ts +0 -121
  276. package/tests/service/cooldown-strategy.test.ts +0 -164
  277. package/tests/service/data-endpoints-regression.test.ts +0 -834
  278. package/tests/service/empathy-observer-workflow-manager.test.ts +0 -175
  279. package/tests/service/evolution-worker.nocturnal.test.ts +0 -601
  280. package/tests/service/nocturnal-runtime-hardening.test.ts +0 -118
  281. package/tests/service/nocturnal-runtime.test.ts +0 -473
  282. package/tests/service/nocturnal-service-code-candidate.test.ts +0 -330
  283. package/tests/service/nocturnal-target-selector.test.ts +0 -615
  284. package/tests/service/startup-reconciler.test.ts +0 -148
  285. package/tests/tools/write-pain-flag.test.ts +0 -358
  286. package/ui/src/App.tsx +0 -45
  287. package/ui/src/api.ts +0 -220
  288. package/ui/src/charts.tsx +0 -955
  289. package/ui/src/components/ErrorState.tsx +0 -6
  290. package/ui/src/components/Loading.tsx +0 -13
  291. package/ui/src/components/ProtectedRoute.tsx +0 -12
  292. package/ui/src/components/Shell.tsx +0 -91
  293. package/ui/src/components/WorkspaceConfig.tsx +0 -178
  294. package/ui/src/components/index.ts +0 -5
  295. package/ui/src/context/auth.tsx +0 -80
  296. package/ui/src/context/theme.tsx +0 -66
  297. package/ui/src/hooks/useAutoRefresh.ts +0 -39
  298. package/ui/src/i18n/ui.ts +0 -473
  299. package/ui/src/main.tsx +0 -16
  300. package/ui/src/pages/EvolutionPage.tsx +0 -333
  301. package/ui/src/pages/FeedbackPage.tsx +0 -138
  302. package/ui/src/pages/GateMonitorPage.tsx +0 -136
  303. package/ui/src/pages/LoginPage.tsx +0 -89
  304. package/ui/src/pages/OverviewPage.tsx +0 -599
  305. package/ui/src/pages/SamplesPage.tsx +0 -174
  306. package/ui/src/pages/ThinkingModelsPage.tsx +0 -702
  307. package/ui/src/styles.css +0 -2020
  308. package/ui/src/types.ts +0 -384
  309. package/ui/src/utils/format.ts +0 -15
@@ -1,601 +0,0 @@
1
- import { afterEach, beforeEach, describe, expect, it, vi } from 'vitest';
2
- import * as fs from 'fs';
3
- import * as os from 'os';
4
- import * as path from 'path';
5
-
6
- vi.mock('../../src/core/dictionary-service.js', () => ({
7
- DictionaryService: {
8
- get: vi.fn(() => ({ flush: vi.fn() })),
9
- },
10
- }));
11
-
12
- vi.mock('../../src/core/session-tracker.js', () => ({
13
- initPersistence: vi.fn(),
14
- flushAllSessions: vi.fn(),
15
- listSessions: vi.fn(() => []),
16
- }));
17
-
18
- const { mockStartWorkflow, mockGetWorkflowDebugSummary } = vi.hoisted(() => ({
19
- mockStartWorkflow: vi.fn(),
20
- mockGetWorkflowDebugSummary: vi.fn(),
21
- }));
22
-
23
- vi.mock('../../src/service/subagent-workflow/nocturnal-workflow-manager.js', () => ({
24
- NocturnalWorkflowManager: class {
25
- startWorkflow = mockStartWorkflow;
26
- getWorkflowDebugSummary = mockGetWorkflowDebugSummary;
27
- },
28
- nocturnalWorkflowSpec: {
29
- workflowType: 'nocturnal',
30
- transport: 'runtime_direct',
31
- timeoutMs: 15 * 60 * 1000,
32
- ttlMs: 30 * 60 * 1000,
33
- },
34
- }));
35
-
36
- const { mockGetNocturnalSessionSnapshot, mockListRecentNocturnalCandidateSessions } = vi.hoisted(() => ({
37
- mockGetNocturnalSessionSnapshot: vi.fn(),
38
- mockListRecentNocturnalCandidateSessions: vi.fn(() => [] as Array<{ sessionId: string; startedAt: string; failureCount: number; painEventCount: number; gateBlockCount: number }>),
39
- }));
40
-
41
- // Create a shared mock extractor instance so spy calls are tracked correctly
42
- const mockExtractorInstance = {
43
- getNocturnalSessionSnapshot: mockGetNocturnalSessionSnapshot,
44
- listRecentNocturnalCandidateSessions: mockListRecentNocturnalCandidateSessions,
45
- };
46
-
47
- vi.mock('../../src/core/nocturnal-trajectory-extractor.js', async () => {
48
- const actual = await vi.importActual<typeof import('../../src/core/nocturnal-trajectory-extractor.js')>(
49
- '../../src/core/nocturnal-trajectory-extractor.js'
50
- );
51
- return {
52
- ...actual,
53
- createNocturnalTrajectoryExtractor: vi.fn(() => mockExtractorInstance),
54
- };
55
- });
56
-
57
- import { EvolutionWorkerService } from '../../src/service/evolution-worker.js';
58
- import { readRecentPainContext } from '../../src/service/evolution-pain-context.js';
59
- import { WorkspaceContext } from '../../src/core/workspace-context.js';
60
- import { handlePdReflect } from '../../src/commands/pd-reflect.js';
61
- import { safeRmDir } from '../test-utils.js';
62
- import * as diagnosticianStore from '../../src/core/diagnostician-task-store.js';
63
-
64
- // Helper to create a mock API for E2E tests
65
- function createMockApi() {
66
- return {
67
- logger: { info: vi.fn(), warn: vi.fn(), error: vi.fn(), debug: vi.fn() },
68
- runtime: {
69
- agent: { runEmbeddedPiAgent: vi.fn() },
70
- system: {
71
- requestHeartbeatNow: vi.fn(),
72
- runHeartbeatOnce: vi.fn()
73
- }
74
- },
75
- } as any;
76
- }
77
-
78
- // Helper config for fast poll cycle
79
- const fastPollConfig = { get: (k: string) => k === 'intervals.worker_poll_ms' ? 100 : undefined };
80
-
81
- function readQueue(stateDir: string) {
82
- return JSON.parse(fs.readFileSync(path.join(stateDir, 'evolution_queue.json'), 'utf8'));
83
- }
84
-
85
- describe('EvolutionWorkerService nocturnal hardening', () => {
86
- beforeEach(() => {
87
- vi.useFakeTimers();
88
- vi.clearAllMocks();
89
- EvolutionWorkerService.api = null;
90
- });
91
-
92
- afterEach(() => {
93
- vi.useRealTimers();
94
- EvolutionWorkerService.api = null;
95
- });
96
-
97
- it('extracts session_id from .pain_flag file correctly', async () => {
98
- const workspaceDir = fs.mkdtempSync(path.join(os.tmpdir(), 'pd-pain-session-'));
99
- const stateDir = path.join(workspaceDir, '.state');
100
- fs.mkdirSync(stateDir, { recursive: true });
101
-
102
- // Write a pain flag WITH session_id
103
- fs.writeFileSync(
104
- path.join(stateDir, '.pain_flag'),
105
- `source: test_pain
106
- score: 80
107
- reason: test reason
108
- time: 2026-04-10T00:00:00.000Z
109
- session_id: explicit-session-from-pain
110
- `,
111
- 'utf8'
112
- );
113
-
114
- // Create a WorkspaceContext to test the function
115
- const wctx = WorkspaceContext.fromHookContext({ workspaceDir, stateDir, logger: console } as any);
116
-
117
- try {
118
- const context = readRecentPainContext(wctx);
119
-
120
- // Verify the session_id was extracted from the pain flag file
121
- expect(context.mostRecent).toBeDefined();
122
- expect(context.mostRecent!.sessionId).toBe('explicit-session-from-pain');
123
- expect(context.mostRecent!.score).toBe(80);
124
- expect(context.recentPainCount).toBe(1);
125
- } finally {
126
- safeRmDir(workspaceDir);
127
- }
128
- });
129
-
130
- it('treats malformed pain flag data as unusable context', async () => {
131
- const workspaceDir = fs.mkdtempSync(path.join(os.tmpdir(), 'pd-pain-invalid-'));
132
- const stateDir = path.join(workspaceDir, '.state');
133
- fs.mkdirSync(stateDir, { recursive: true });
134
-
135
- fs.writeFileSync(
136
- path.join(stateDir, '.pain_flag'),
137
- `source: test_pain
138
- score: 80`,
139
- 'utf8'
140
- );
141
-
142
- const wctx = WorkspaceContext.fromHookContext({ workspaceDir, stateDir, logger: console } as any);
143
-
144
- try {
145
- const context = readRecentPainContext(wctx);
146
- expect(context.mostRecent).toBeNull();
147
- expect(context.recentPainCount).toBe(0);
148
- } finally {
149
- safeRmDir(workspaceDir);
150
- }
151
- });
152
-
153
- // === End-to-End Contract Tests ===
154
-
155
- it('e2e: pain flag → worker enqueue → session_id is correctly attached to queued task', async () => {
156
- // This test verifies the contract: when a pain flag with session_id exists,
157
- // any sleep_reflection task created by the worker MUST carry that session_id
158
- // in its recentPainContext.mostRecent.sessionId field.
159
- const workspaceDir = fs.mkdtempSync(path.join(os.tmpdir(), 'pd-e2e-pain-enqueue-'));
160
- const stateDir = path.join(workspaceDir, '.state');
161
- fs.mkdirSync(stateDir, { recursive: true });
162
-
163
- // Write a pain flag WITH session_id
164
- fs.writeFileSync(
165
- path.join(stateDir, '.pain_flag'),
166
- `source: tool_failure
167
- score: 70
168
- reason: Test pain with session
169
- time: 2026-04-10T00:00:00.000Z
170
- session_id: pain-session-abc
171
- `,
172
- 'utf8'
173
- );
174
-
175
- // Verify the worker's readRecentPainContext extracts the session_id correctly
176
- const wctx = WorkspaceContext.fromHookContext({ workspaceDir, stateDir, logger: console } as any);
177
- const painContext = readRecentPainContext(wctx);
178
-
179
- // Contract: session_id must be extracted from the pain flag
180
- expect(painContext.mostRecent).toBeDefined();
181
- expect(painContext.mostRecent!.sessionId).toBe('pain-session-abc');
182
- expect(painContext.mostRecent!.score).toBe(70);
183
- expect(painContext.mostRecent!.source).toBe('tool_failure');
184
-
185
- // Now simulate what the worker does: attach this context to a queued task
186
- const simulatedTask = {
187
- id: 'simulated-task',
188
- taskKind: 'sleep_reflection',
189
- recentPainContext: painContext,
190
- };
191
-
192
- // Verify the contract holds end-to-end
193
- expect(simulatedTask.recentPainContext.mostRecent!.sessionId).toBe('pain-session-abc');
194
- });
195
-
196
- it('e2e: /pd-reflect command writes to workspace/.state, never to HOME/.state', async () => {
197
- const workspaceDir = fs.mkdtempSync(path.join(os.tmpdir(), 'pd-e2e-command-writes-'));
198
- const stateDir = path.join(workspaceDir, '.state');
199
- fs.mkdirSync(stateDir, { recursive: true });
200
- fs.mkdirSync(path.join(stateDir, 'sessions'), { recursive: true });
201
-
202
- // Ensure HOME/.state does NOT have the queue file
203
- const homeState = path.join(os.homedir(), '.state');
204
- const homeQueue = path.join(homeState, 'evolution_queue.json');
205
- const homeExistedBefore = fs.existsSync(homeQueue);
206
-
207
- try {
208
- // Execute the command with explicit workspaceDir
209
- const result = await handlePdReflect.handler({
210
- workspaceDir,
211
- channel: 'test',
212
- isAuthorizedSender: true,
213
- commandBody: '',
214
- config: {},
215
- api: { logger: { info: vi.fn(), warn: vi.fn(), error: vi.fn() } } as any,
216
- } as any);
217
-
218
- // Command should succeed
219
- expect(result.isError).toBeFalsy();
220
- expect(result.text).toContain('enqueued');
221
-
222
- // Queue file should exist in workspace
223
- const workspaceQueue = path.join(stateDir, 'evolution_queue.json');
224
- expect(fs.existsSync(workspaceQueue)).toBe(true);
225
-
226
- // Verify the task is in the workspace queue
227
- const queue = readQueue(stateDir);
228
- const manualTasks = queue.filter((t: any) => t.id.startsWith('manual_'));
229
- expect(manualTasks.length).toBe(1);
230
- expect(manualTasks[0].taskKind).toBe('sleep_reflection');
231
-
232
- // HOME/.state/evolution_queue.json should NOT have been created/modified by this command
233
- if (!homeExistedBefore) {
234
- expect(fs.existsSync(homeQueue)).toBe(false);
235
- }
236
- } finally {
237
- safeRmDir(workspaceDir);
238
- }
239
- });
240
-
241
- // === Nocturnal E2E Pipeline Tests (from PR #243) ===
242
-
243
- it('does not start a nocturnal workflow when only an empty fallback snapshot is available', async () => {
244
- const workspaceDir = fs.mkdtempSync(path.join(os.tmpdir(), 'pd-nocturnal-empty-'));
245
- const stateDir = path.join(workspaceDir, '.state');
246
- fs.mkdirSync(path.join(stateDir, 'sessions'), { recursive: true });
247
- fs.mkdirSync(path.join(stateDir, 'logs'), { recursive: true });
248
-
249
- mockGetNocturnalSessionSnapshot.mockReturnValue(null);
250
-
251
- fs.writeFileSync(
252
- path.join(stateDir, 'evolution_queue.json'),
253
- JSON.stringify([
254
- {
255
- id: 'sleep-empty',
256
- taskKind: 'sleep_reflection',
257
- priority: 'medium',
258
- score: 50,
259
- source: 'nocturnal',
260
- reason: 'Sleep reflection',
261
- timestamp: '2026-04-10T00:00:00.000Z',
262
- enqueued_at: '2026-04-10T00:00:00.000Z',
263
- status: 'pending',
264
- retryCount: 0,
265
- maxRetries: 1,
266
- recentPainContext: {
267
- mostRecent: null,
268
- recentPainCount: 0,
269
- recentMaxPainScore: 0,
270
- },
271
- },
272
- ], null, 2),
273
- 'utf8'
274
- );
275
-
276
- const mockApi = createMockApi();
277
- EvolutionWorkerService.api = mockApi;
278
-
279
- try {
280
- EvolutionWorkerService.start({
281
- workspaceDir,
282
- stateDir,
283
- logger: mockApi.logger,
284
- config: fastPollConfig,
285
- api: mockApi,
286
- } as any);
287
-
288
- await vi.advanceTimersByTimeAsync(6000);
289
-
290
- const queue = readQueue(stateDir);
291
- expect(queue[0].status).toBe('failed');
292
- expect(queue[0].lastError).toContain('invalid_snapshot_ingress');
293
- expect(queue[0].lastError).toContain('fallback snapshot must contain at least one pain signal');
294
- expect(queue[0].resultRef).toBeFalsy();
295
- expect(mockStartWorkflow).not.toHaveBeenCalled();
296
- } finally {
297
- EvolutionWorkerService.stop!({ workspaceDir, stateDir, logger: console } as any);
298
- safeRmDir(workspaceDir);
299
- }
300
- });
301
-
302
- it('uses stub_fallback for expected gateway-only background unavailability', async () => {
303
- const workspaceDir = fs.mkdtempSync(path.join(os.tmpdir(), 'pd-nocturnal-gateway-'));
304
- const stateDir = path.join(workspaceDir, '.state');
305
- fs.mkdirSync(path.join(stateDir, 'sessions'), { recursive: true });
306
- fs.mkdirSync(path.join(stateDir, 'logs'), { recursive: true });
307
-
308
- mockGetNocturnalSessionSnapshot.mockReturnValue({
309
- sessionId: 'sleep-gateway',
310
- startedAt: '2026-04-10T00:00:00.000Z',
311
- updatedAt: '2026-04-10T00:01:00.000Z',
312
- assistantTurns: [],
313
- userTurns: [],
314
- toolCalls: [],
315
- painEvents: [],
316
- gateBlocks: [],
317
- stats: { totalAssistantTurns: 1, totalToolCalls: 1, totalPainEvents: 0, totalGateBlocks: 0, failureCount: 0 },
318
- });
319
- mockStartWorkflow.mockResolvedValue({ workflowId: 'wf-1', childSessionKey: 'child-1', state: 'active' });
320
- mockGetWorkflowDebugSummary.mockResolvedValue({
321
- state: 'terminal_error',
322
- metadata: {},
323
- recentEvents: [{ reason: 'Error: Plugin runtime subagent methods are only available during a gateway request.', payload: {} }],
324
- });
325
-
326
- fs.writeFileSync(
327
- path.join(stateDir, 'evolution_queue.json'),
328
- JSON.stringify([
329
- {
330
- id: 'sleep-gateway',
331
- taskKind: 'sleep_reflection',
332
- priority: 'medium',
333
- score: 50,
334
- source: 'nocturnal',
335
- reason: 'Sleep reflection',
336
- timestamp: '2026-04-10T00:00:00.000Z',
337
- enqueued_at: '2026-04-10T00:00:00.000Z',
338
- status: 'pending',
339
- retryCount: 0,
340
- maxRetries: 1,
341
- recentPainContext: {
342
- mostRecent: { source: 'test', score: 50, reason: 'test', timestamp: '2026-04-10T00:00:00.000Z', sessionId: 'sleep-gateway' },
343
- recentPainCount: 1,
344
- recentMaxPainScore: 50,
345
- },
346
- },
347
- ], null, 2),
348
- 'utf8'
349
- );
350
-
351
- const mockApi = createMockApi();
352
- EvolutionWorkerService.api = mockApi;
353
-
354
- try {
355
- EvolutionWorkerService.start({
356
- workspaceDir,
357
- stateDir,
358
- logger: mockApi.logger,
359
- config: fastPollConfig,
360
- api: mockApi,
361
- } as any);
362
-
363
- await vi.advanceTimersByTimeAsync(6000);
364
-
365
- const queue = readQueue(stateDir);
366
- expect(queue[0].status).toBe('completed');
367
- expect(queue[0].resolution).toBe('stub_fallback');
368
- } finally {
369
- EvolutionWorkerService.stop!({ workspaceDir, stateDir, logger: console } as any);
370
- safeRmDir(workspaceDir);
371
- }
372
- });
373
-
374
- it('uses stub_fallback for expected subagent runtime unavailability', async () => {
375
- const workspaceDir = fs.mkdtempSync(path.join(os.tmpdir(), 'pd-nocturnal-subagent-'));
376
- const stateDir = path.join(workspaceDir, '.state');
377
- fs.mkdirSync(path.join(stateDir, 'sessions'), { recursive: true });
378
- fs.mkdirSync(path.join(stateDir, 'logs'), { recursive: true });
379
-
380
- mockGetNocturnalSessionSnapshot.mockReturnValue({
381
- sessionId: 'sleep-subagent',
382
- startedAt: '2026-04-10T00:00:00.000Z',
383
- updatedAt: '2026-04-10T00:01:00.000Z',
384
- assistantTurns: [],
385
- userTurns: [],
386
- toolCalls: [],
387
- painEvents: [],
388
- gateBlocks: [],
389
- stats: { totalAssistantTurns: 1, totalToolCalls: 1, totalPainEvents: 0, totalGateBlocks: 0, failureCount: 0 },
390
- });
391
- mockStartWorkflow.mockRejectedValue(new Error('NocturnalWorkflowManager: subagent runtime unavailable'));
392
-
393
- fs.writeFileSync(
394
- path.join(stateDir, 'evolution_queue.json'),
395
- JSON.stringify([
396
- {
397
- id: 'sleep-subagent',
398
- taskKind: 'sleep_reflection',
399
- priority: 'medium',
400
- score: 50,
401
- source: 'nocturnal',
402
- reason: 'Sleep reflection',
403
- timestamp: '2026-04-10T00:00:00.000Z',
404
- enqueued_at: '2026-04-10T00:00:00.000Z',
405
- status: 'pending',
406
- retryCount: 0,
407
- maxRetries: 1,
408
- recentPainContext: {
409
- mostRecent: { source: 'test', score: 50, reason: 'test', timestamp: '2026-04-10T00:00:00.000Z', sessionId: 'sleep-subagent' },
410
- recentPainCount: 1,
411
- recentMaxPainScore: 50,
412
- },
413
- },
414
- ], null, 2),
415
- 'utf8'
416
- );
417
-
418
- const mockApi = createMockApi();
419
- EvolutionWorkerService.api = mockApi;
420
-
421
- try {
422
- EvolutionWorkerService.start({
423
- workspaceDir,
424
- stateDir,
425
- logger: mockApi.logger,
426
- config: fastPollConfig,
427
- api: mockApi,
428
- } as any);
429
-
430
- await vi.advanceTimersByTimeAsync(6000);
431
-
432
- const queue = readQueue(stateDir);
433
- expect(queue[0].status).toBe('completed');
434
- expect(queue[0].resolution).toBe('stub_fallback');
435
- } finally {
436
- EvolutionWorkerService.stop!({ workspaceDir, stateDir, logger: console } as any);
437
- safeRmDir(workspaceDir);
438
- }
439
- });
440
-
441
- it('prioritizes pain signal session ID for snapshot extraction', async () => {
442
- const workspaceDir = fs.mkdtempSync(path.join(os.tmpdir(), 'pd-nocturnal-pain-session-'));
443
- const stateDir = path.join(workspaceDir, '.state');
444
- fs.mkdirSync(path.join(stateDir, 'sessions'), { recursive: true });
445
- fs.mkdirSync(path.join(stateDir, 'logs'), { recursive: true });
446
-
447
- const painSessionId = 'pain-signal-session-123';
448
-
449
- mockGetNocturnalSessionSnapshot.mockImplementation((sessionId: string) => {
450
- if (sessionId === painSessionId) {
451
- return {
452
- sessionId: painSessionId,
453
- startedAt: '2026-04-09T23:00:00.000Z',
454
- updatedAt: '2026-04-09T23:01:00.000Z',
455
- assistantTurns: [],
456
- userTurns: [],
457
- toolCalls: [],
458
- painEvents: [{ source: 'tool_failure', score: 70, severity: null, reason: 'test', createdAt: '2026-04-09T23:00:00.000Z' }],
459
- gateBlocks: [],
460
- stats: { totalAssistantTurns: 1, totalToolCalls: 1, failureCount: 1, totalPainEvents: 1, totalGateBlocks: 0 },
461
- };
462
- }
463
- return null;
464
- });
465
- mockStartWorkflow.mockResolvedValue({ workflowId: 'wf-pain', childSessionKey: 'child-pain', state: 'active' });
466
-
467
- fs.writeFileSync(
468
- path.join(stateDir, 'evolution_queue.json'),
469
- JSON.stringify([
470
- {
471
- id: 'sleep-pain-priority',
472
- taskKind: 'sleep_reflection',
473
- priority: 'medium',
474
- score: 50,
475
- source: 'nocturnal',
476
- reason: 'Sleep reflection',
477
- timestamp: '2026-04-10T00:00:00.000Z',
478
- enqueued_at: '2026-04-10T00:00:00.000Z',
479
- status: 'pending',
480
- retryCount: 0,
481
- maxRetries: 1,
482
- recentPainContext: {
483
- mostRecent: { source: 'tool_failure', score: 70, reason: 'test', timestamp: '2026-04-10T00:00:00.000Z', sessionId: painSessionId },
484
- recentPainCount: 1,
485
- recentMaxPainScore: 70,
486
- },
487
- },
488
- ], null, 2),
489
- 'utf8'
490
- );
491
-
492
- const mockApi = createMockApi();
493
- EvolutionWorkerService.api = mockApi;
494
-
495
- try {
496
- EvolutionWorkerService.start({
497
- workspaceDir,
498
- stateDir,
499
- logger: mockApi.logger,
500
- config: fastPollConfig,
501
- api: mockApi,
502
- } as any);
503
-
504
- await vi.advanceTimersByTimeAsync(6000);
505
-
506
- expect(mockStartWorkflow).toHaveBeenCalledTimes(1);
507
- const metadata = mockStartWorkflow.mock.calls[0][1].metadata;
508
- expect(metadata.snapshot.sessionId).toBe(painSessionId);
509
- } finally {
510
- EvolutionWorkerService.stop!({ workspaceDir, stateDir, logger: console } as any);
511
- safeRmDir(workspaceDir);
512
- }
513
- });
514
-
515
- it('e2e: bounded session selection — never picks a session newer than the triggering task', async () => {
516
- const workspaceDir = fs.mkdtempSync(path.join(os.tmpdir(), 'pd-nocturnal-e2e-bounded-'));
517
- const stateDir = path.join(workspaceDir, '.state');
518
- fs.mkdirSync(path.join(stateDir, 'sessions'), { recursive: true });
519
- fs.mkdirSync(path.join(stateDir, 'logs'), { recursive: true });
520
-
521
- const taskTimestamp = '2026-04-10T00:00:00.000Z';
522
- const validSessionTimestamp = '2026-04-09T23:00:00.000Z';
523
- const invalidSessionTimestamp = '2026-04-10T01:00:00.000Z';
524
-
525
- mockGetNocturnalSessionSnapshot.mockImplementation((sessionId: string) => {
526
- if (sessionId === 'valid-session') {
527
- return {
528
- sessionId: 'valid-session',
529
- startedAt: validSessionTimestamp,
530
- updatedAt: validSessionTimestamp,
531
- assistantTurns: [],
532
- userTurns: [],
533
- toolCalls: [],
534
- painEvents: [{ source: 'tool_failure', score: 50, severity: null, reason: 'test', createdAt: validSessionTimestamp }],
535
- gateBlocks: [],
536
- stats: { totalAssistantTurns: 1, totalToolCalls: 1, failureCount: 1, totalPainEvents: 1, totalGateBlocks: 0 },
537
- };
538
- }
539
- return null;
540
- });
541
- mockListRecentNocturnalCandidateSessions.mockReturnValue([
542
- { sessionId: 'valid-session', startedAt: validSessionTimestamp, failureCount: 1, painEventCount: 1, gateBlockCount: 0 },
543
- { sessionId: 'invalid-session', startedAt: invalidSessionTimestamp, failureCount: 1, painEventCount: 0, gateBlockCount: 0 },
544
- ]);
545
- mockStartWorkflow.mockResolvedValue({ workflowId: 'wf-bounded', childSessionKey: 'child-bounded', state: 'active' });
546
-
547
- fs.writeFileSync(
548
- path.join(stateDir, 'evolution_queue.json'),
549
- JSON.stringify([
550
- {
551
- id: 'sleep-e2e-bounded',
552
- taskKind: 'sleep_reflection',
553
- priority: 'medium',
554
- score: 50,
555
- source: 'nocturnal',
556
- reason: 'Sleep reflection',
557
- timestamp: taskTimestamp,
558
- enqueued_at: taskTimestamp,
559
- status: 'pending',
560
- retryCount: 0,
561
- maxRetries: 1,
562
- recentPainContext: {
563
- mostRecent: { source: 'test', score: 50, reason: 'test', timestamp: taskTimestamp, sessionId: 'pain-session' },
564
- recentPainCount: 1,
565
- recentMaxPainScore: 50,
566
- },
567
- },
568
- ], null, 2),
569
- 'utf8'
570
- );
571
-
572
- const mockApi = createMockApi();
573
- EvolutionWorkerService.api = mockApi;
574
-
575
- try {
576
- EvolutionWorkerService.start({
577
- workspaceDir,
578
- stateDir,
579
- logger: mockApi.logger,
580
- config: fastPollConfig,
581
- api: mockApi,
582
- } as any);
583
-
584
- await vi.advanceTimersByTimeAsync(6000);
585
-
586
- expect(mockStartWorkflow).toHaveBeenCalledTimes(1);
587
- const metadata = mockStartWorkflow.mock.calls[0][1].metadata;
588
- expect(metadata.snapshot.sessionId).toBe('valid-session');
589
- expect(new Date(metadata.snapshot.startedAt).getTime()).toBeLessThanOrEqual(new Date(taskTimestamp).getTime());
590
- } finally {
591
- EvolutionWorkerService.stop!({ workspaceDir, stateDir, logger: console } as any);
592
- safeRmDir(workspaceDir);
593
- }
594
- });
595
-
596
- // === PR #307 Fixes: Pain Diagnosis Timeout & Heartbeat Retry ===
597
-
598
- // Note: Testing requestHeartbeatNow call directly is complex due to
599
- // the async nature of checkPainFlag → doEnqueuePainTask → requestHeartbeatNow.
600
- // The fix is verified via E2E monitoring (PR #307 production verification).
601
- });