principles-disciple 1.72.0 → 1.74.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (319) hide show
  1. package/INSTALL.md +1 -3
  2. package/openclaw.plugin.json +10 -5
  3. package/package.json +17 -19
  4. package/scripts/acceptance-test.mjs +16 -73
  5. package/scripts/sync-plugin.mjs +382 -77
  6. package/src/commands/archive-impl.ts +2 -1
  7. package/src/commands/capabilities.ts +2 -2
  8. package/src/commands/context.ts +2 -2
  9. package/src/commands/disable-impl.ts +2 -1
  10. package/src/commands/evolution-status.ts +16 -16
  11. package/src/commands/export.ts +12 -67
  12. package/src/commands/pain.ts +91 -1
  13. package/src/commands/principle-rollback.ts +2 -1
  14. package/src/commands/promote-impl.ts +7 -43
  15. package/src/commands/rollback-impl.ts +2 -1
  16. package/src/commands/rollback.ts +2 -1
  17. package/src/commands/samples.ts +2 -1
  18. package/src/commands/thinking-os.ts +2 -1
  19. package/src/config/errors.ts +18 -2
  20. package/src/constants/diagnostician.ts +2 -2
  21. package/src/constants/tools.ts +2 -1
  22. package/src/core/__tests__/focus-history.test.ts +210 -0
  23. package/src/core/config.ts +1 -1
  24. package/src/core/correction-cue-learner.ts +2 -136
  25. package/src/core/correction-types.ts +16 -88
  26. package/src/core/dictionary.ts +19 -20
  27. package/src/core/empathy-keyword-matcher.ts +17 -289
  28. package/src/core/empathy-types.ts +18 -229
  29. package/src/core/event-log.ts +29 -132
  30. package/src/core/evolution-reducer.ts +21 -2
  31. package/src/core/evolution-types.ts +76 -464
  32. package/src/core/file-store.ts +80 -0
  33. package/src/core/focus-history.ts +228 -955
  34. package/src/core/local-worker-routing.ts +34 -314
  35. package/src/core/merge-gate-audit.ts +0 -195
  36. package/src/core/migration.ts +0 -1
  37. package/src/core/pain-diagnostic-gate.ts +154 -0
  38. package/src/core/pain-signal.ts +21 -138
  39. package/src/core/pain.ts +15 -88
  40. package/src/core/path-resolver.ts +0 -1
  41. package/src/core/paths.ts +0 -1
  42. package/src/core/pd-task-reconciler.ts +26 -115
  43. package/src/core/pd-task-service.ts +9 -9
  44. package/src/core/pd-task-types.ts +23 -127
  45. package/src/core/principle-compiler/__tests__/compiler-replay-gate.test.ts +174 -0
  46. package/src/core/principle-compiler/code-validator.ts +15 -42
  47. package/src/core/principle-compiler/compiler.ts +100 -15
  48. package/src/core/principle-compiler/index.ts +5 -2
  49. package/src/core/principle-compiler/template-generator.ts +4 -104
  50. package/src/core/principle-injection.ts +10 -202
  51. package/src/core/principle-internalization/filesystem-lifecycle-datasource.ts +42 -0
  52. package/src/core/principle-internalization/lifecycle-read-model.ts +39 -242
  53. package/src/core/principle-internalization/principle-lifecycle-service.ts +12 -10
  54. package/src/core/principle-tree-ledger-adapter.ts +145 -0
  55. package/src/core/principle-tree-ledger.ts +8 -6
  56. package/src/core/reflection/reflection-context.ts +14 -109
  57. package/src/core/replay-engine.ts +8 -500
  58. package/src/core/rule-host-helpers.ts +5 -35
  59. package/src/core/rule-host-types.ts +10 -82
  60. package/src/core/rule-host.ts +6 -63
  61. package/src/core/runtime-v2-prompt-activation-reader.ts +231 -0
  62. package/src/core/session-tracker.ts +87 -101
  63. package/src/core/shadow-observation-registry.ts +19 -48
  64. package/src/core/trajectory.ts +3 -1
  65. package/src/core/workflow-funnel-loader.ts +62 -68
  66. package/src/core/workspace-context.ts +46 -0
  67. package/src/core/workspace-dir-service.ts +1 -1
  68. package/src/core/workspace-dir-validation.ts +18 -9
  69. package/src/hooks/AGENTS.md +1 -1
  70. package/src/hooks/gate-block-helper.ts +71 -64
  71. package/src/hooks/gate.ts +183 -31
  72. package/src/hooks/lifecycle.ts +30 -32
  73. package/src/hooks/llm.ts +60 -32
  74. package/src/hooks/pain.ts +297 -103
  75. package/src/hooks/prompt.ts +400 -440
  76. package/src/hooks/subagent.ts +2 -29
  77. package/src/i18n/commands.ts +2 -10
  78. package/src/index.ts +95 -85
  79. package/src/openclaw-sdk.ts +311 -0
  80. package/src/service/central-database.ts +8 -4
  81. package/src/service/evolution-queue-migration.ts +2 -1
  82. package/src/service/evolution-worker.ts +163 -1786
  83. package/src/service/internalization-trigger-adapter.ts +302 -0
  84. package/src/service/keyword-optimization-service.ts +4 -4
  85. package/src/service/monitoring-query-service.ts +1 -215
  86. package/src/service/queue-io.ts +60 -331
  87. package/src/service/runtime-summary-service.ts +59 -16
  88. package/src/service/subagent-workflow/index.ts +0 -41
  89. package/src/service/subagent-workflow/types.ts +9 -120
  90. package/src/service/subagent-workflow/workflow-store.ts +2 -119
  91. package/src/service/workflow-watchdog.ts +0 -43
  92. package/src/types/event-payload.ts +16 -74
  93. package/src/types/event-types.ts +38 -547
  94. package/src/types/hygiene-types.ts +7 -30
  95. package/src/types/principle-tree-schema.ts +20 -222
  96. package/src/types/queue.ts +15 -70
  97. package/src/types/runtime-summary.ts +5 -49
  98. package/src/utils/io.ts +8 -20
  99. package/src/utils/retry.ts +1 -1
  100. package/src/utils/shadow-fingerprint.ts +2 -2
  101. package/src/utils/workspace-resolver.ts +50 -0
  102. package/templates/langs/en/core/AGENTS.md +7 -7
  103. package/templates/langs/en/core/BOOT.md +1 -1
  104. package/templates/langs/en/core/HEARTBEAT.md +2 -2
  105. package/templates/langs/en/principles/THINKING_OS.md +3 -2
  106. package/templates/langs/en/skills/ai-sprint-orchestration/references/agent-registry.json +1 -72
  107. package/templates/langs/en/skills/ai-sprint-orchestration/references/specs/bugfix-complex-template.json +6 -6
  108. package/templates/langs/en/skills/ai-sprint-orchestration/references/specs/feature-complex-template.json +6 -6
  109. package/templates/langs/en/skills/ai-sprint-orchestration/references/specs/workflow-validation-minimal-verify.json +2 -12
  110. package/templates/langs/en/skills/ai-sprint-orchestration/references/specs/workflow-validation-minimal.json +2 -12
  111. package/templates/langs/en/skills/ai-sprint-orchestration/scripts/run.mjs +51 -15
  112. package/templates/langs/en/skills/evolve-task/SKILL.md +3 -3
  113. package/templates/langs/en/skills/pd-cli-operator/SKILL.md +67 -0
  114. package/templates/langs/en/skills/pd-diagnostician/SKILL.md +1 -1
  115. package/templates/langs/en/skills/pd-mentor/SKILL.md +2 -3
  116. package/templates/langs/en/skills/pd-pain-signal/SKILL.md +17 -39
  117. package/templates/langs/en/skills/pd-runtime-v2/SKILL.md +61 -0
  118. package/templates/langs/zh/core/AGENTS.md +7 -7
  119. package/templates/langs/zh/core/BOOT.md +1 -1
  120. package/templates/langs/zh/core/HEARTBEAT.md +2 -2
  121. package/templates/langs/zh/principles/THINKING_OS.md +3 -2
  122. package/templates/langs/zh/skills/ai-sprint-orchestration/references/agent-registry.json +1 -72
  123. package/templates/langs/zh/skills/ai-sprint-orchestration/references/specs/bugfix-complex-template.json +6 -6
  124. package/templates/langs/zh/skills/ai-sprint-orchestration/references/specs/feature-complex-template.json +6 -6
  125. package/templates/langs/zh/skills/ai-sprint-orchestration/references/specs/nocturnal-trinity-quality-enhancement.json +8 -8
  126. package/templates/langs/zh/skills/ai-sprint-orchestration/references/specs/workflow-validation-minimal-verify.json +2 -12
  127. package/templates/langs/zh/skills/ai-sprint-orchestration/references/specs/workflow-validation-minimal.json +2 -12
  128. package/templates/langs/zh/skills/ai-sprint-orchestration/scripts/run.mjs +51 -15
  129. package/templates/langs/zh/skills/ai-sprint-orchestration/test/run.test.mjs +21 -5
  130. package/templates/langs/zh/skills/evolve-task/SKILL.md +4 -4
  131. package/templates/langs/zh/skills/pd-cli-operator/SKILL.md +67 -0
  132. package/templates/langs/zh/skills/pd-diagnostician/SKILL.md +1 -1
  133. package/templates/langs/zh/skills/pd-mentor/SKILL.md +2 -3
  134. package/templates/langs/zh/skills/pd-pain-signal/SKILL.md +17 -38
  135. package/templates/langs/zh/skills/pd-runtime-v2/SKILL.md +61 -0
  136. package/tests/build-artifacts.test.ts +1 -3
  137. package/tests/commands/evolution-status.test.ts +0 -118
  138. package/tests/core/bootstrap-rules.test.ts +1 -1
  139. package/tests/core/config.test.ts +1 -1
  140. package/tests/core/event-log.test.ts +35 -0
  141. package/tests/core/evolution-engine.test.ts +610 -0
  142. package/tests/core/file-store.test.ts +102 -0
  143. package/tests/core/focus-history.test.ts +203 -11
  144. package/tests/core/merge-gate-audit.test.ts +2 -169
  145. package/tests/core/migration.test.ts +7 -7
  146. package/tests/core/model-deployment-registry.test.ts +7 -1
  147. package/tests/core/model-training-registry.test.ts +19 -0
  148. package/tests/core/observability.test.ts +0 -1
  149. package/tests/core/pain-diagnostic-gate.test.ts +498 -0
  150. package/tests/core/pain.test.ts +0 -1
  151. package/tests/core/path-resolver.test.ts +1 -1
  152. package/tests/core/paths-refactor.test.ts +0 -22
  153. package/tests/core/principle-internalization/deprecated-readiness.test.ts +2 -2
  154. package/tests/core/principle-internalization/lifecycle-metrics.test.ts +2 -2
  155. package/tests/core/principle-internalization/{internalization-routing-policy.test.ts → lifecycle-routing-policy.test.ts} +6 -6
  156. package/tests/core/principle-internalization/lineage-source-retired.test.ts +56 -0
  157. package/tests/core/principle-internalization/principle-lifecycle-service.test.ts +1 -23
  158. package/tests/core/principle-tree-ledger-adapter.test.ts +253 -0
  159. package/tests/core/reflection-context.test.ts +0 -14
  160. package/tests/core/replay-engine.test.ts +127 -215
  161. package/tests/core/rule-host-helpers.test.ts +2 -2
  162. package/tests/core/rule-implementation-runtime.test.ts +0 -27
  163. package/tests/core/workflow-funnel-loader.test.ts +162 -0
  164. package/tests/core/workspace-context.test.ts +2 -2
  165. package/tests/core/workspace-dir-validation.test.ts +8 -1
  166. package/tests/core-anti-growth.test.ts +191 -0
  167. package/tests/hook-workspace-nextaction-contract.test.ts +42 -0
  168. package/tests/hooks/confirm-first-removal.test.ts +188 -0
  169. package/tests/hooks/gate-auto-correct-shadow.test.ts +310 -0
  170. package/tests/hooks/gate-auto-correct.test.ts +665 -0
  171. package/tests/hooks/gate-no-path-write-tool.test.ts +172 -0
  172. package/tests/hooks/gate-rule-host-pipeline.test.ts +2 -1
  173. package/tests/hooks/pain.test.ts +269 -12
  174. package/tests/hooks/prompt-characterization.test.ts +500 -0
  175. package/tests/hooks/prompt-size-guard.test.ts +32 -17
  176. package/tests/hooks/runtime-v2-prompt-activation.test.ts +869 -0
  177. package/tests/index.test.ts +94 -1
  178. package/tests/integration/auto-entry-gate.test.ts +248 -0
  179. package/tests/integration/internalization-trigger-guard.test.ts +69 -0
  180. package/tests/integration/m8-legacy-paths.test.ts +63 -0
  181. package/tests/integration/runtime-v2-pain-guard.test.ts +125 -0
  182. package/tests/plugin-config-resolution-cutover.test.ts +359 -0
  183. package/tests/runtime-v2-discovery-guard.test.ts +154 -0
  184. package/tests/service/central-database.test.ts +457 -0
  185. package/tests/service/evolution-worker.correction-observer.test.ts +173 -0
  186. package/tests/service/evolution-worker.timeout.test.ts +11 -129
  187. package/tests/service/internalization-trigger-adapter.test.ts +251 -0
  188. package/tests/service/monitoring-query-service.test.ts +1 -47
  189. package/tests/service/queue-io.test.ts +1 -62
  190. package/tests/service/runtime-summary-service.test.ts +3 -1
  191. package/tests/service/workflow-watchdog.test.ts +0 -91
  192. package/tests/utils/file-lock.test.ts +5 -3
  193. package/tests/utils/session-key.test.ts +52 -0
  194. package/tests/utils/subagent-probe.test.ts +48 -1
  195. package/vitest.config.ts +4 -11
  196. package/.planning/codebase/ARCHITECTURE.md +0 -157
  197. package/.planning/codebase/CONCERNS.md +0 -145
  198. package/.planning/codebase/CONVENTIONS.md +0 -148
  199. package/.planning/codebase/INTEGRATIONS.md +0 -81
  200. package/.planning/codebase/STACK.md +0 -87
  201. package/.planning/codebase/STRUCTURE.md +0 -193
  202. package/.planning/codebase/TESTING.md +0 -243
  203. package/.planning/phases/01-basic-visualization/01-GAP-CLOSURE-VERIFICATION.md +0 -113
  204. package/docs/COMMAND_REFERENCE.md +0 -76
  205. package/docs/COMMAND_REFERENCE_EN.md +0 -79
  206. package/scripts/build-web.mjs +0 -46
  207. package/scripts/diagnose-nocturnal.mjs +0 -537
  208. package/scripts/seed-nocturnal-scenarios.mjs +0 -384
  209. package/src/commands/nocturnal-review.ts +0 -322
  210. package/src/commands/nocturnal-rollout.ts +0 -790
  211. package/src/commands/nocturnal-train.ts +0 -986
  212. package/src/commands/pd-reflect.ts +0 -88
  213. package/src/core/adaptive-thresholds.ts +0 -478
  214. package/src/core/diagnostician-task-store.ts +0 -192
  215. package/src/core/nocturnal-arbiter.ts +0 -715
  216. package/src/core/nocturnal-artifact-lineage.ts +0 -116
  217. package/src/core/nocturnal-artificer.ts +0 -257
  218. package/src/core/nocturnal-candidate-scoring.ts +0 -530
  219. package/src/core/nocturnal-compliance.ts +0 -1146
  220. package/src/core/nocturnal-dataset.ts +0 -763
  221. package/src/core/nocturnal-executability.ts +0 -428
  222. package/src/core/nocturnal-export.ts +0 -499
  223. package/src/core/nocturnal-paths.ts +0 -240
  224. package/src/core/nocturnal-reasoning-deriver.ts +0 -343
  225. package/src/core/nocturnal-rule-implementation-validator.ts +0 -246
  226. package/src/core/nocturnal-snapshot-contract.ts +0 -99
  227. package/src/core/nocturnal-trajectory-extractor.ts +0 -512
  228. package/src/core/nocturnal-trinity-types.ts +0 -218
  229. package/src/core/nocturnal-trinity.ts +0 -2680
  230. package/src/core/principle-internalization/deprecated-readiness.ts +0 -93
  231. package/src/core/principle-internalization/internalization-routing-policy.ts +0 -208
  232. package/src/core/principle-internalization/lifecycle-metrics.ts +0 -152
  233. package/src/http/principles-console-route.ts +0 -709
  234. package/src/service/central-health-service.ts +0 -49
  235. package/src/service/central-overview-service.ts +0 -138
  236. package/src/service/control-ui-query-service.ts +0 -900
  237. package/src/service/cooldown-strategy.ts +0 -97
  238. package/src/service/evolution-pain-context.ts +0 -79
  239. package/src/service/evolution-query-service.ts +0 -407
  240. package/src/service/health-query-service.ts +0 -1038
  241. package/src/service/nocturnal-config.ts +0 -214
  242. package/src/service/nocturnal-runtime.ts +0 -734
  243. package/src/service/nocturnal-service.ts +0 -1605
  244. package/src/service/nocturnal-target-selector.ts +0 -545
  245. package/src/service/sleep-cycle.ts +0 -157
  246. package/src/service/startup-reconciler.ts +0 -112
  247. package/src/service/subagent-workflow/correction-observer-types.ts +0 -82
  248. package/src/service/subagent-workflow/correction-observer-workflow-manager.ts +0 -250
  249. package/src/service/subagent-workflow/deep-reflect-workflow-manager.ts +0 -1
  250. package/src/service/subagent-workflow/dynamic-timeout.ts +0 -30
  251. package/src/service/subagent-workflow/empathy-observer-workflow-manager.ts +0 -268
  252. package/src/service/subagent-workflow/nocturnal-workflow-manager.ts +0 -795
  253. package/src/service/subagent-workflow/runtime-direct-driver.ts +0 -268
  254. package/src/service/subagent-workflow/workflow-manager-base.ts +0 -580
  255. package/src/tools/write-pain-flag.ts +0 -215
  256. package/templates/langs/en/skills/plan-script/SKILL.md +0 -32
  257. package/templates/langs/zh/skills/plan-script/SKILL.md +0 -32
  258. package/tests/commands/nocturnal-review.test.ts +0 -448
  259. package/tests/commands/nocturnal-train.test.ts +0 -97
  260. package/tests/commands/pd-reflect.test.ts +0 -49
  261. package/tests/core/adaptive-thresholds.test.ts +0 -261
  262. package/tests/core/nocturnal-arbiter.test.ts +0 -559
  263. package/tests/core/nocturnal-artifact-lineage.test.ts +0 -53
  264. package/tests/core/nocturnal-artificer.test.ts +0 -241
  265. package/tests/core/nocturnal-candidate-scoring.test.ts +0 -532
  266. package/tests/core/nocturnal-compliance-p-principles.test.ts +0 -133
  267. package/tests/core/nocturnal-compliance.test.ts +0 -646
  268. package/tests/core/nocturnal-dataset.test.ts +0 -892
  269. package/tests/core/nocturnal-e2e.test.ts +0 -234
  270. package/tests/core/nocturnal-executability.test.ts +0 -357
  271. package/tests/core/nocturnal-export.test.ts +0 -517
  272. package/tests/core/nocturnal-reasoning-deriver.test.ts +0 -372
  273. package/tests/core/nocturnal-reviewed-subset-comparison.test.ts +0 -428
  274. package/tests/core/nocturnal-rule-implementation-validator.test.ts +0 -127
  275. package/tests/core/nocturnal-snapshot-contract.test.ts +0 -121
  276. package/tests/core/nocturnal-trajectory-extractor.test.ts +0 -634
  277. package/tests/core/nocturnal-trinity.test.ts +0 -2053
  278. package/tests/core/pain-auto-repair.test.ts +0 -96
  279. package/tests/core/pain-integration.test.ts +0 -510
  280. package/tests/fixtures/nocturnal-reviewed-subset.json +0 -183
  281. package/tests/http/principles-console-route.test.ts +0 -162
  282. package/tests/integration/chaos-resilience.test.ts +0 -348
  283. package/tests/integration/empathy-workflow-integration.test.ts +0 -626
  284. package/tests/integration/pain-diagnostician-loop.e2e.test.ts +0 -380
  285. package/tests/service/control-ui-query-service.test.ts +0 -121
  286. package/tests/service/cooldown-strategy.test.ts +0 -164
  287. package/tests/service/data-endpoints-regression.test.ts +0 -834
  288. package/tests/service/empathy-observer-workflow-manager.test.ts +0 -175
  289. package/tests/service/evolution-worker.nocturnal.test.ts +0 -601
  290. package/tests/service/nocturnal-runtime-hardening.test.ts +0 -118
  291. package/tests/service/nocturnal-runtime.test.ts +0 -473
  292. package/tests/service/nocturnal-service-code-candidate.test.ts +0 -330
  293. package/tests/service/nocturnal-target-selector.test.ts +0 -615
  294. package/tests/service/startup-reconciler.test.ts +0 -148
  295. package/tests/tools/write-pain-flag.test.ts +0 -358
  296. package/ui/src/App.tsx +0 -45
  297. package/ui/src/api.ts +0 -220
  298. package/ui/src/charts.tsx +0 -955
  299. package/ui/src/components/ErrorState.tsx +0 -6
  300. package/ui/src/components/Loading.tsx +0 -13
  301. package/ui/src/components/ProtectedRoute.tsx +0 -12
  302. package/ui/src/components/Shell.tsx +0 -91
  303. package/ui/src/components/WorkspaceConfig.tsx +0 -178
  304. package/ui/src/components/index.ts +0 -5
  305. package/ui/src/context/auth.tsx +0 -80
  306. package/ui/src/context/theme.tsx +0 -66
  307. package/ui/src/hooks/useAutoRefresh.ts +0 -39
  308. package/ui/src/i18n/ui.ts +0 -473
  309. package/ui/src/main.tsx +0 -16
  310. package/ui/src/pages/EvolutionPage.tsx +0 -333
  311. package/ui/src/pages/FeedbackPage.tsx +0 -138
  312. package/ui/src/pages/GateMonitorPage.tsx +0 -136
  313. package/ui/src/pages/LoginPage.tsx +0 -89
  314. package/ui/src/pages/OverviewPage.tsx +0 -599
  315. package/ui/src/pages/SamplesPage.tsx +0 -174
  316. package/ui/src/pages/ThinkingModelsPage.tsx +0 -702
  317. package/ui/src/styles.css +0 -2020
  318. package/ui/src/types.ts +0 -384
  319. package/ui/src/utils/format.ts +0 -15
@@ -1,530 +0,0 @@
1
- /**
2
- * Nocturnal Candidate Scoring — Deterministic Tournament Selection
3
- * ============================================================
4
- *
5
- * PURPOSE: Score Trinity candidates and run deterministic tournament selection
6
- * to choose the best candidate for artifact generation.
7
- *
8
- * DESIGN CONSTRAINTS:
9
- * - Scoring is deterministic: same inputs → same winner
10
- * - Tie-break rules are stable and explicit
11
- * - No randomness in ranking or selection
12
- * - Winner is always the highest-scoring candidate
13
- * - Thresholds provide minimum quality gates
14
- * - Failed threshold candidates are excluded from tournament
15
- *
16
- * SCORING COMPONENTS:
17
- * - schema completeness: candidate has all required fields
18
- * - principle alignment: candidate aligns with target principle
19
- * - executability: candidate describes an actionable next step
20
- * - boundedness: candidate is specific and bounded
21
- * - confidence/consistency: candidate's internal consistency
22
- *
23
- * PHASE 6 ONLY — No real training, no automatic deployment
24
- */
25
-
26
- import type { DreamerCandidate, PhilosopherJudgment } from './nocturnal-trinity-types.js';
27
- import type { ThresholdValues } from './adaptive-thresholds.js';
28
-
29
- // ---------------------------------------------------------------------------
30
- // Types
31
- // ---------------------------------------------------------------------------
32
-
33
- /**
34
- * Individual scoring dimensions for a candidate.
35
- */
36
- export interface CandidateScores {
37
- /** Schema completeness (0-1) */
38
- schemaCompleteness: number;
39
- /** Principle alignment (0-1) */
40
- principleAlignment: number;
41
- /** Executability (0-1) */
42
- executability: number;
43
- /** Boundedness — specificity and constraint (0-1) */
44
- boundedness: number;
45
- /** Confidence/consistency (0-1) */
46
- confidence: number;
47
- /** Aggregate score (weighted average) */
48
- aggregate: number;
49
- }
50
-
51
- /**
52
- * Scored candidate with ranking.
53
- */
54
- export interface ScoredCandidate {
55
- /** Original candidate index from Dreamer */
56
- candidateIndex: number;
57
- /** The Dreamer candidate */
58
- candidate: DreamerCandidate;
59
- /** The Philosopher judgment */
60
- judgment: PhilosopherJudgment;
61
- /** Individual dimension scores */
62
- scores: CandidateScores;
63
- /** Final tournament rank (1 = winner) */
64
- rank: number;
65
- /** Whether this candidate passed all thresholds */
66
- thresholdPassed: boolean;
67
- /** Which thresholds failed (if any) */
68
- failedThresholds: string[];
69
- }
70
-
71
- /**
72
- * Result of a tournament selection.
73
- */
74
- export interface TournamentResult {
75
- /** Whether tournament produced a winner */
76
- success: boolean;
77
- /** The winning candidate (if success === true) */
78
- winner: ScoredCandidate | null;
79
- /** All ranked candidates (sorted by rank) */
80
- rankedCandidates: ScoredCandidate[];
81
- /** Trace of decisions for debugging/explainability */
82
- trace: TournamentTraceEntry[];
83
- /** Why no winner was selected (if success === false) */
84
- failureReason?: string;
85
- }
86
-
87
- /**
88
- * Single entry in the tournament trace.
89
- */
90
- export interface TournamentTraceEntry {
91
- /** Description of this step */
92
- step: string;
93
- /** Details about the decision */
94
- details: string;
95
- }
96
-
97
- /**
98
- * Scoring weights for aggregate calculation.
99
- */
100
- export interface ScoringWeights {
101
- schemaCompleteness: number;
102
- principleAlignment: number;
103
- executability: number;
104
- boundedness: number;
105
- confidence: number;
106
- }
107
-
108
- /**
109
- * Default scoring weights (must sum to 1.0).
110
- */
111
- export const DEFAULT_SCORING_WEIGHTS: ScoringWeights = {
112
- schemaCompleteness: 0.15,
113
- principleAlignment: 0.30,
114
- executability: 0.20,
115
- boundedness: 0.20,
116
- confidence: 0.15,
117
- };
118
-
119
- /**
120
- * Result of diversity validation on Dreamer candidates.
121
- * Soft enforcement: result is informational, never gates the pipeline.
122
- */
123
- export interface DiversityValidationResult {
124
- /** Whether candidates passed diversity checks */
125
- diversityCheckPassed: boolean;
126
- /** Whether at least 2 distinct risk levels were present */
127
- riskLevelDiversity: boolean;
128
- /** Whether no candidate pair exceeded keyword overlap threshold */
129
- keywordOverlapPassed: boolean;
130
- /** Highest pairwise keyword overlap score (for telemetry) */
131
- maxOverlapScore: number;
132
- /** Human-readable summary of check results */
133
- details: string;
134
- }
135
-
136
- // ---------------------------------------------------------------------------
137
- // Scoring Logic
138
- // ---------------------------------------------------------------------------
139
-
140
- /**
141
- * Score a single Dreamer candidate + Philosopher judgment pair.
142
- *
143
- * @param candidate - Dreamer candidate
144
- * @param judgment - Philosopher judgment
145
- * @param weights - Scoring weights
146
- * @returns Individual scores
147
- */
148
- export function scoreCandidate(
149
- candidate: DreamerCandidate,
150
- judgment: PhilosopherJudgment,
151
- weights: ScoringWeights = DEFAULT_SCORING_WEIGHTS
152
- ): CandidateScores {
153
- // Schema completeness: all required fields present and non-empty
154
- let schemaCompleteness = 1.0;
155
- if (!candidate.badDecision || candidate.badDecision.trim().length === 0) schemaCompleteness -= 0.2;
156
- if (!candidate.betterDecision || candidate.betterDecision.trim().length === 0) schemaCompleteness -= 0.2;
157
- if (!candidate.rationale || candidate.rationale.trim().length === 0) schemaCompleteness -= 0.2;
158
- if (typeof candidate.confidence !== 'number' || candidate.confidence < 0 || candidate.confidence > 1) schemaCompleteness -= 0.2;
159
- if (candidate.badDecision && candidate.betterDecision && candidate.badDecision.trim() === candidate.betterDecision.trim()) schemaCompleteness -= 0.2;
160
- schemaCompleteness = Math.max(0, schemaCompleteness);
161
-
162
- // Principle alignment: from Philosopher judgment
163
- const principleAlignment = judgment.principleAligned ? 1.0 : 0.3;
164
-
165
- // Executability: betterDecision contains actionable verb
166
- const actionableVerbs = ['read', 'check', 'verify', 'edit', 'write', 'search', 'grep', 'review', 'analyze', 'diagnose', 'debug', 'inspect', 'examine', 'test'];
167
- const hasActionableVerb = candidate.betterDecision
168
- ? actionableVerbs.some((v) =>
169
- candidate.betterDecision.toLowerCase().includes(v)
170
- )
171
- : false;
172
- const executability = hasActionableVerb ? 1.0 : 0.4;
173
-
174
- // Boundedness: specific and constrained
175
- let boundedness = 0.5;
176
- // Specific: mentions specific targets (files, tools, etc.)
177
- const betterDecisionStr = candidate.betterDecision ?? '';
178
- const hasSpecificTarget = /[a-zA-Z0-9_.]+\.(ts|js|json|md|yml|yaml|sh|py|go|rs)/.test(betterDecisionStr);
179
- if (hasSpecificTarget) boundedness += 0.2;
180
- // Not too generic
181
- const genericPatterns = [
182
- /\bsomething\b/i,
183
- /\bsomething else\b/i,
184
- /\bit\b/i,
185
- /\bthe thing\b/i,
186
- ];
187
- const isGeneric = genericPatterns.some((pattern) => pattern.test(betterDecisionStr));
188
- if (isGeneric) boundedness -= 0.3;
189
- // Not too long (如果 multi-step vagueness)
190
- if (betterDecisionStr.length > 200) boundedness -= 0.1;
191
- boundedness = Math.max(0, Math.min(1, boundedness));
192
-
193
- // Confidence: from Dreamer's confidence, adjusted by consistency
194
- const baseConfidence = typeof candidate.confidence === 'number' ? candidate.confidence : 0.5;
195
- // Slight consistency check: Philosopher score should correlate with confidence
196
- const consistency = 1.0 - Math.abs(baseConfidence - judgment.score);
197
- const confidence = baseConfidence * 0.7 + consistency * 0.3;
198
-
199
- // Calculate aggregate
200
- const aggregate =
201
- schemaCompleteness * weights.schemaCompleteness +
202
- principleAlignment * weights.principleAlignment +
203
- executability * weights.executability +
204
- boundedness * weights.boundedness +
205
- confidence * weights.confidence;
206
-
207
- return {
208
- schemaCompleteness: Math.round(schemaCompleteness * 100) / 100,
209
- principleAlignment: Math.round(principleAlignment * 100) / 100,
210
- executability: Math.round(executability * 100) / 100,
211
- boundedness: Math.round(boundedness * 100) / 100,
212
- confidence: Math.round(confidence * 100) / 100,
213
- aggregate: Math.round(aggregate * 100) / 100,
214
- };
215
- }
216
-
217
- /**
218
- * Check if candidate passes minimum thresholds.
219
- *
220
- * @param scores - Candidate scores
221
- * @param thresholds - Minimum threshold values
222
- * @returns Tuple of [passed, failedThresholdNames]
223
- */
224
- export function checkThresholds(
225
- scores: CandidateScores,
226
- thresholds: ThresholdValues
227
- ): [boolean, string[]] {
228
- const failedThresholds: string[] = [];
229
-
230
- if (scores.schemaCompleteness < thresholds.schemaCompletenessMin) {
231
- failedThresholds.push(`schemaCompleteness (${scores.schemaCompleteness} < ${thresholds.schemaCompletenessMin})`);
232
- }
233
- if (scores.principleAlignment < thresholds.principleAlignmentMin) {
234
- failedThresholds.push(`principleAlignment (${scores.principleAlignment} < ${thresholds.principleAlignmentMin})`);
235
- }
236
- if (scores.executability < thresholds.executabilityMin) {
237
- failedThresholds.push(`executability (${scores.executability} < ${thresholds.executabilityMin})`);
238
- }
239
- if (scores.boundedness < thresholds.boundednessMin) {
240
- failedThresholds.push(`boundedness (${scores.boundedness} < ${thresholds.boundednessMin})`);
241
- }
242
- if (scores.confidence < thresholds.confidenceMin) {
243
- failedThresholds.push(`confidence (${scores.confidence} < ${thresholds.confidenceMin})`);
244
- }
245
- if (scores.aggregate < thresholds.aggregateMin) {
246
- failedThresholds.push(`aggregate (${scores.aggregate} < ${thresholds.aggregateMin})`);
247
- }
248
-
249
- return [failedThresholds.length === 0, failedThresholds];
250
- }
251
-
252
- /**
253
- * Validate that Dreamer candidates are strategically diverse.
254
- *
255
- * DIVER-03: Checks risk level diversity (Set.size >= 2 when candidates >= 2)
256
- * and keyword overlap similarity (reject if intersection / max(|A|, |B|) > 0.8
257
- * for words > 3 chars per D-05).
258
- *
259
- * This is SOFT enforcement: returns a result, never throws.
260
- * Pipeline continues regardless of diversityCheckPassed value.
261
- *
262
- * @param candidates - Dreamer candidates to validate
263
- * @returns DiversityValidationResult with pass/fail details
264
- */
265
- export function validateCandidateDiversity(
266
- candidates: DreamerCandidate[],
267
- ): DiversityValidationResult {
268
- // Edge cases: empty, null, or single candidate always passes
269
- if (!candidates || candidates.length <= 1) {
270
- return {
271
- diversityCheckPassed: true,
272
- riskLevelDiversity: true,
273
- keywordOverlapPassed: true,
274
- maxOverlapScore: 0,
275
- details: candidates?.length === 1
276
- ? 'Single candidate — diversity check not applicable'
277
- : 'No candidates to validate',
278
- };
279
- }
280
-
281
- // Check 1: Risk level diversity (D-05)
282
- const riskLevels = new Set(
283
- candidates
284
- .map(c => c.riskLevel)
285
- .filter((r): r is "low" | "medium" | "high" => typeof r === 'string')
286
- );
287
- // If NO candidates have riskLevel, skip risk diversity check (graceful degradation)
288
- const riskLevelDiversity = riskLevels.size === 0 || riskLevels.size >= 2;
289
-
290
- // Check 2: Keyword overlap (D-05: intersection / max(|A|, |B|) for words > 3 chars)
291
- let maxOverlapScore = 0;
292
- let keywordOverlapPassed = true;
293
-
294
- for (let i = 0; i < candidates.length; i++) {
295
- for (let j = i + 1; j < candidates.length; j++) {
296
-
297
- const overlap = computeKeywordOverlap(
298
- candidates[i].betterDecision ?? '',
299
- candidates[j].betterDecision ?? '',
300
- );
301
- if (overlap > maxOverlapScore) {
302
- maxOverlapScore = overlap;
303
- }
304
- if (overlap > 0.8) {
305
- keywordOverlapPassed = false;
306
- }
307
- }
308
- }
309
-
310
- const diversityCheckPassed = riskLevelDiversity && keywordOverlapPassed;
311
-
312
- // Build details string
313
- const parts: string[] = [];
314
- if (!riskLevelDiversity) {
315
- parts.push(`Risk levels not diverse (found: ${[...riskLevels].join(', ') || 'none'})`);
316
- }
317
- if (!keywordOverlapPassed) {
318
- parts.push(`Keyword overlap too high (max: ${maxOverlapScore.toFixed(2)})`);
319
- }
320
-
321
- return {
322
- diversityCheckPassed,
323
- riskLevelDiversity,
324
- keywordOverlapPassed,
325
- maxOverlapScore: Math.round(maxOverlapScore * 100) / 100,
326
- details: diversityCheckPassed
327
- ? 'Diversity check passed'
328
- : parts.join('; '),
329
- };
330
- }
331
-
332
- /**
333
- * Compute keyword overlap between two strings.
334
- * Algorithm: intersection / max(|A|, |B|) for words > 3 chars (per D-05).
335
- * Returns value between 0 and 1.
336
- */
337
- function computeKeywordOverlap(textA: string, textB: string): number {
338
-
339
- const wordsA = extractKeywords(textA);
340
-
341
- const wordsB = extractKeywords(textB);
342
-
343
- if (wordsA.length === 0 && wordsB.length === 0) return 0;
344
- if (wordsA.length === 0 || wordsB.length === 0) return 0;
345
-
346
- const setA = new Set(wordsA);
347
- const setB = new Set(wordsB);
348
-
349
- let intersection = 0;
350
- for (const word of setA) {
351
- if (setB.has(word)) intersection++;
352
- }
353
-
354
- const denominator = Math.max(setA.size, setB.size);
355
- return denominator === 0 ? 0 : intersection / denominator;
356
- }
357
-
358
- /**
359
- * Extract keywords from text: words > 3 characters, lowercased.
360
- */
361
- function extractKeywords(text: string): string[] {
362
- if (!text) return [];
363
- return text
364
- .toLowerCase()
365
- .split(/[^a-z0-9]+/)
366
- .filter(w => w.length > 3);
367
- }
368
-
369
- /**
370
- * Score and rank all candidates deterministically.
371
- *
372
- * @param candidates - Dreamer candidates
373
- * @param judgments - Philosopher judgments (aligned by candidateIndex)
374
- * @param thresholds - Minimum thresholds
375
- * @param weights - Scoring weights
376
- * @returns All scored and ranked candidates
377
- */
378
-
379
-
380
- export function rankCandidates(
381
- candidates: DreamerCandidate[],
382
- judgments: PhilosopherJudgment[],
383
- thresholds: ThresholdValues,
384
- weights: ScoringWeights = DEFAULT_SCORING_WEIGHTS
385
- ): ScoredCandidate[] {
386
- const trace: TournamentTraceEntry[] = [];
387
-
388
- trace.push({
389
- step: 'Input Validation',
390
- details: `Received ${candidates.length} candidates and ${judgments.length} judgments`,
391
- });
392
-
393
- // Score each candidate
394
- const scored: ScoredCandidate[] = [];
395
- for (const candidate of candidates) {
396
- const judgment = judgments.find((j) => j.candidateIndex === candidate.candidateIndex);
397
- if (!judgment) {
398
- trace.push({
399
- step: `Candidate ${candidate.candidateIndex}`,
400
- details: 'Skipped - no matching judgment found',
401
- });
402
- continue;
403
- }
404
-
405
- const scores = scoreCandidate(candidate, judgment, weights);
406
- const [passed, failed] = checkThresholds(scores, thresholds);
407
-
408
- scored.push({
409
- candidateIndex: candidate.candidateIndex,
410
- candidate,
411
- judgment,
412
- scores,
413
- rank: 0, // Will be set after sorting
414
- thresholdPassed: passed,
415
- failedThresholds: failed,
416
- });
417
-
418
- trace.push({
419
- step: `Candidate ${candidate.candidateIndex} Scored`,
420
- details: `aggregate=${scores.aggregate.toFixed(2)}, thresholdPassed=${passed}`,
421
- });
422
- }
423
-
424
- // Sort by: thresholdPassed DESC, aggregate DESC, candidateIndex ASC (for stability)
425
- scored.sort((a, b) => {
426
- // Threshold-passed candidates come first
427
- if (a.thresholdPassed !== b.thresholdPassed) {
428
- return a.thresholdPassed ? -1 : 1;
429
- }
430
- // Higher aggregate score wins
431
- if (a.scores.aggregate !== b.scores.aggregate) {
432
- return b.scores.aggregate - a.scores.aggregate;
433
- }
434
- // Lower candidateIndex wins ties (stability)
435
- return a.candidateIndex - b.candidateIndex;
436
- });
437
-
438
- // Assign ranks
439
- let currentRank = 1;
440
- let currentAggregate = -1;
441
- for (const candidate of scored) {
442
- if (candidate.scores.aggregate !== currentAggregate) {
443
- currentRank = scored.indexOf(candidate) + 1;
444
- currentAggregate = candidate.scores.aggregate;
445
- }
446
- candidate.rank = currentRank;
447
- }
448
-
449
- trace.push({
450
- step: 'Ranking Complete',
451
- details: `Final order: ${scored.map((c) => `C${c.candidateIndex}(rank=${c.rank},agg=${c.scores.aggregate.toFixed(2)})`).join(', ')}`,
452
- });
453
-
454
- return scored;
455
- }
456
-
457
- /**
458
- * Run tournament selection to choose the best candidate.
459
- *
460
- * @param candidates - Dreamer candidates
461
- * @param judgments - Philosopher judgments
462
- * @param thresholds - Minimum thresholds
463
- * @param weights - Scoring weights
464
- * @returns Tournament result with winner
465
- */
466
-
467
-
468
- export function runTournament(
469
- candidates: DreamerCandidate[],
470
- judgments: PhilosopherJudgment[],
471
- thresholds: ThresholdValues,
472
- weights: ScoringWeights = DEFAULT_SCORING_WEIGHTS
473
- ): TournamentResult {
474
- const trace: TournamentTraceEntry[] = [];
475
-
476
- if (candidates.length === 0 || judgments.length === 0) {
477
- return {
478
- success: false,
479
- winner: null,
480
- rankedCandidates: [],
481
- trace: [{ step: 'Validation', details: 'No candidates or judgments provided' }],
482
- failureReason: 'No candidates or judgments provided',
483
- };
484
- }
485
-
486
- trace.push({
487
- step: 'Tournament Start',
488
- details: `${candidates.length} candidates in tournament`,
489
- });
490
-
491
- // Rank candidates
492
- const ranked = rankCandidates(candidates, judgments, thresholds, weights);
493
-
494
- trace.push({
495
- step: 'Threshold Check',
496
- details: `${ranked.filter((c) => c.thresholdPassed).length} candidates passed thresholds`,
497
- });
498
-
499
- // Filter to threshold-passed candidates for winner determination
500
- const eligible = ranked.filter((c) => c.thresholdPassed);
501
-
502
- if (eligible.length === 0) {
503
- trace.push({
504
- step: 'No Winner',
505
- details: 'All candidates failed threshold check',
506
- });
507
- return {
508
- success: false,
509
- winner: null,
510
- rankedCandidates: ranked,
511
- trace,
512
- failureReason: 'All candidates failed threshold check',
513
- };
514
- }
515
-
516
- // Winner is rank 1
517
- const [winner] = eligible;
518
-
519
- trace.push({
520
- step: 'Winner Selected',
521
- details: `Candidate ${winner.candidateIndex} wins with aggregate score ${winner.scores.aggregate.toFixed(2)}`,
522
- });
523
-
524
- return {
525
- success: true,
526
- winner,
527
- rankedCandidates: ranked,
528
- trace,
529
- };
530
- }