monomind 1.11.11 → 1.11.13

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (227) hide show
  1. package/.claude/commands/mastermind/idea.md +1 -1
  2. package/.claude/commands/mastermind/master.md +1 -1
  3. package/.claude/skills/mastermind/_protocol.md +4 -4
  4. package/.claude/skills/mastermind/architect.md +7 -4
  5. package/.claude/skills/mastermind/autodev.md +4 -2
  6. package/.claude/skills/mastermind/build.md +3 -3
  7. package/.claude/skills/mastermind/content.md +3 -3
  8. package/.claude/skills/mastermind/createorg.md +2 -2
  9. package/.claude/skills/mastermind/finance.md +3 -3
  10. package/.claude/skills/mastermind/idea.md +8 -0
  11. package/.claude/skills/mastermind/marketing.md +3 -3
  12. package/.claude/skills/mastermind/ops.md +3 -3
  13. package/.claude/skills/mastermind/release.md +3 -3
  14. package/.claude/skills/mastermind/research.md +3 -3
  15. package/.claude/skills/mastermind/review.md +3 -3
  16. package/.claude/skills/mastermind/sales.md +3 -3
  17. package/package.json +1 -1
  18. package/packages/@monomind/cli/dist/src/index.js +19 -14
  19. package/packages/@monomind/cli/dist/src/init/statusline-generator.js +3 -3
  20. package/packages/@monomind/cli/dist/src/observability/replay-reader.d.ts +1 -1
  21. package/packages/@monomind/cli/dist/src/update/checker.js +24 -7
  22. package/packages/@monomind/cli/dist/src/update/index.d.ts +10 -0
  23. package/packages/@monomind/cli/dist/src/update/index.js +29 -2
  24. package/packages/@monomind/cli/package.json +1 -1
  25. package/packages/@monomind/cli/dist/src/agents/halt-signal.d.ts +0 -25
  26. package/packages/@monomind/cli/dist/src/agents/halt-signal.js +0 -76
  27. package/packages/@monomind/cli/dist/src/agents/index.d.ts +0 -18
  28. package/packages/@monomind/cli/dist/src/agents/index.js +0 -13
  29. package/packages/@monomind/cli/dist/src/agents/managed-agent.d.ts +0 -41
  30. package/packages/@monomind/cli/dist/src/agents/managed-agent.js +0 -69
  31. package/packages/@monomind/cli/dist/src/agents/prompt-experiment.d.ts +0 -23
  32. package/packages/@monomind/cli/dist/src/agents/prompt-experiment.js +0 -49
  33. package/packages/@monomind/cli/dist/src/agents/prompt-version-manager.d.ts +0 -22
  34. package/packages/@monomind/cli/dist/src/agents/prompt-version-manager.js +0 -80
  35. package/packages/@monomind/cli/dist/src/agents/registry-query.d.ts +0 -71
  36. package/packages/@monomind/cli/dist/src/agents/registry-query.js +0 -125
  37. package/packages/@monomind/cli/dist/src/agents/score-decay.d.ts +0 -19
  38. package/packages/@monomind/cli/dist/src/agents/score-decay.js +0 -22
  39. package/packages/@monomind/cli/dist/src/agents/shared-instructions-loader.d.ts +0 -13
  40. package/packages/@monomind/cli/dist/src/agents/shared-instructions-loader.js +0 -40
  41. package/packages/@monomind/cli/dist/src/agents/specialization-scorer.d.ts +0 -54
  42. package/packages/@monomind/cli/dist/src/agents/specialization-scorer.js +0 -212
  43. package/packages/@monomind/cli/dist/src/agents/termination-watcher.d.ts +0 -30
  44. package/packages/@monomind/cli/dist/src/agents/termination-watcher.js +0 -84
  45. package/packages/@monomind/cli/dist/src/agents/trigger-index.d.ts +0 -20
  46. package/packages/@monomind/cli/dist/src/agents/trigger-index.js +0 -38
  47. package/packages/@monomind/cli/dist/src/agents/trigger-scanner.d.ts +0 -64
  48. package/packages/@monomind/cli/dist/src/agents/trigger-scanner.js +0 -308
  49. package/packages/@monomind/cli/dist/src/agents/version-diff.d.ts +0 -18
  50. package/packages/@monomind/cli/dist/src/agents/version-diff.js +0 -64
  51. package/packages/@monomind/cli/dist/src/agents/version-store.d.ts +0 -60
  52. package/packages/@monomind/cli/dist/src/agents/version-store.js +0 -235
  53. package/packages/@monomind/cli/dist/src/benchmarks/pretrain/index.d.ts +0 -45
  54. package/packages/@monomind/cli/dist/src/benchmarks/pretrain/index.js +0 -404
  55. package/packages/@monomind/cli/dist/src/commands/agent-wasm.d.ts +0 -14
  56. package/packages/@monomind/cli/dist/src/commands/agent-wasm.js +0 -333
  57. package/packages/@monomind/cli/dist/src/commands/ui.js +0 -68
  58. package/packages/@monomind/cli/dist/src/consensus/index.d.ts +0 -7
  59. package/packages/@monomind/cli/dist/src/consensus/index.js +0 -6
  60. package/packages/@monomind/cli/dist/src/context/context-provider.d.ts +0 -44
  61. package/packages/@monomind/cli/dist/src/context/context-provider.js +0 -25
  62. package/packages/@monomind/cli/dist/src/context/git-state-provider.d.ts +0 -12
  63. package/packages/@monomind/cli/dist/src/context/git-state-provider.js +0 -34
  64. package/packages/@monomind/cli/dist/src/context/index.d.ts +0 -12
  65. package/packages/@monomind/cli/dist/src/context/index.js +0 -12
  66. package/packages/@monomind/cli/dist/src/context/project-conventions-provider.d.ts +0 -15
  67. package/packages/@monomind/cli/dist/src/context/project-conventions-provider.js +0 -19
  68. package/packages/@monomind/cli/dist/src/context/prompt-assembler.d.ts +0 -26
  69. package/packages/@monomind/cli/dist/src/context/prompt-assembler.js +0 -93
  70. package/packages/@monomind/cli/dist/src/context/task-history-provider.d.ts +0 -24
  71. package/packages/@monomind/cli/dist/src/context/task-history-provider.js +0 -32
  72. package/packages/@monomind/cli/dist/src/context/user-preferences-provider.d.ts +0 -14
  73. package/packages/@monomind/cli/dist/src/context/user-preferences-provider.js +0 -27
  74. package/packages/@monomind/cli/dist/src/dlq/dlq-reader.d.ts +0 -31
  75. package/packages/@monomind/cli/dist/src/dlq/dlq-reader.js +0 -81
  76. package/packages/@monomind/cli/dist/src/dlq/dlq-writer.d.ts +0 -24
  77. package/packages/@monomind/cli/dist/src/dlq/dlq-writer.js +0 -65
  78. package/packages/@monomind/cli/dist/src/dlq/index.d.ts +0 -10
  79. package/packages/@monomind/cli/dist/src/dlq/index.js +0 -7
  80. package/packages/@monomind/cli/dist/src/eval/dataset-manager.d.ts +0 -33
  81. package/packages/@monomind/cli/dist/src/eval/dataset-manager.js +0 -107
  82. package/packages/@monomind/cli/dist/src/eval/dataset-runner.d.ts +0 -23
  83. package/packages/@monomind/cli/dist/src/eval/dataset-runner.js +0 -59
  84. package/packages/@monomind/cli/dist/src/eval/index.d.ts +0 -10
  85. package/packages/@monomind/cli/dist/src/eval/index.js +0 -7
  86. package/packages/@monomind/cli/dist/src/eval/trace-collector.d.ts +0 -40
  87. package/packages/@monomind/cli/dist/src/eval/trace-collector.js +0 -102
  88. package/packages/@monomind/cli/dist/src/infrastructure/in-memory-repositories.d.ts +0 -68
  89. package/packages/@monomind/cli/dist/src/infrastructure/in-memory-repositories.js +0 -264
  90. package/packages/@monomind/cli/dist/src/interactive/interrupt.d.ts +0 -22
  91. package/packages/@monomind/cli/dist/src/interactive/interrupt.js +0 -71
  92. package/packages/@monomind/cli/dist/src/mcp/deprecation-injector.d.ts +0 -25
  93. package/packages/@monomind/cli/dist/src/mcp/deprecation-injector.js +0 -48
  94. package/packages/@monomind/cli/dist/src/mcp/tool-registry.d.ts +0 -61
  95. package/packages/@monomind/cli/dist/src/mcp/tool-registry.js +0 -246
  96. package/packages/@monomind/cli/dist/src/mcp-tools/wasm-agent-tools.d.ts +0 -9
  97. package/packages/@monomind/cli/dist/src/mcp-tools/wasm-agent-tools.js +0 -230
  98. package/packages/@monomind/cli/dist/src/model/complexity-scorer.d.ts +0 -21
  99. package/packages/@monomind/cli/dist/src/model/complexity-scorer.js +0 -106
  100. package/packages/@monomind/cli/dist/src/model/index.d.ts +0 -4
  101. package/packages/@monomind/cli/dist/src/model/index.js +0 -4
  102. package/packages/@monomind/cli/dist/src/model/model-settings.d.ts +0 -22
  103. package/packages/@monomind/cli/dist/src/model/model-settings.js +0 -33
  104. package/packages/@monomind/cli/dist/src/model/model-tier-resolver.d.ts +0 -24
  105. package/packages/@monomind/cli/dist/src/model/model-tier-resolver.js +0 -65
  106. package/packages/@monomind/cli/dist/src/monovector/capabilities.d.ts +0 -34
  107. package/packages/@monomind/cli/dist/src/monovector/capabilities.js +0 -37
  108. package/packages/@monomind/cli/dist/src/orchestration/index.d.ts +0 -7
  109. package/packages/@monomind/cli/dist/src/orchestration/index.js +0 -6
  110. package/packages/@monomind/cli/dist/src/orchestration/mode-dispatcher.d.ts +0 -11
  111. package/packages/@monomind/cli/dist/src/orchestration/mode-dispatcher.js +0 -31
  112. package/packages/@monomind/cli/dist/src/orchestration/routing-modes.d.ts +0 -68
  113. package/packages/@monomind/cli/dist/src/orchestration/routing-modes.js +0 -180
  114. package/packages/@monomind/cli/dist/src/plugins/tests/demo-plugin-store.d.ts +0 -7
  115. package/packages/@monomind/cli/dist/src/plugins/tests/demo-plugin-store.js +0 -126
  116. package/packages/@monomind/cli/dist/src/plugins/tests/standalone-test.d.ts +0 -12
  117. package/packages/@monomind/cli/dist/src/plugins/tests/standalone-test.js +0 -188
  118. package/packages/@monomind/cli/dist/src/plugins/tests/test-plugin-store.d.ts +0 -7
  119. package/packages/@monomind/cli/dist/src/plugins/tests/test-plugin-store.js +0 -206
  120. package/packages/@monomind/cli/dist/src/runtime/headless.d.ts +0 -60
  121. package/packages/@monomind/cli/dist/src/runtime/headless.js +0 -284
  122. package/packages/@monomind/cli/dist/src/services/agentic-flow-bridge.d.ts +0 -50
  123. package/packages/@monomind/cli/dist/src/services/agentic-flow-bridge.js +0 -95
  124. package/packages/@monomind/cli/dist/src/services/container-worker-pool.d.ts +0 -197
  125. package/packages/@monomind/cli/dist/src/services/container-worker-pool.js +0 -623
  126. package/packages/@monomind/cli/dist/src/services/index.d.ts +0 -13
  127. package/packages/@monomind/cli/dist/src/services/index.js +0 -11
  128. package/packages/@monomind/cli/dist/src/services/worker-queue.d.ts +0 -201
  129. package/packages/@monomind/cli/dist/src/services/worker-queue.js +0 -594
  130. package/packages/@monomind/cli/dist/src/swarm/communication-graph.d.ts +0 -25
  131. package/packages/@monomind/cli/dist/src/swarm/communication-graph.js +0 -77
  132. package/packages/@monomind/cli/dist/src/swarm/flow-enforcer.d.ts +0 -31
  133. package/packages/@monomind/cli/dist/src/swarm/flow-enforcer.js +0 -61
  134. package/packages/@monomind/cli/dist/src/swarm/flow-visualizer.d.ts +0 -19
  135. package/packages/@monomind/cli/dist/src/swarm/flow-visualizer.js +0 -68
  136. package/packages/@monomind/cli/dist/src/transfer/deploy-seraphine.d.ts +0 -13
  137. package/packages/@monomind/cli/dist/src/transfer/deploy-seraphine.js +0 -205
  138. package/packages/@monomind/cli/dist/src/transfer/store/tests/standalone-test.d.ts +0 -12
  139. package/packages/@monomind/cli/dist/src/transfer/store/tests/standalone-test.js +0 -190
  140. package/packages/@monomind/cli/dist/src/transfer/test-seraphine.d.ts +0 -6
  141. package/packages/@monomind/cli/dist/src/transfer/test-seraphine.js +0 -105
  142. package/packages/@monomind/cli/dist/src/transfer/tests/test-store.d.ts +0 -7
  143. package/packages/@monomind/cli/dist/src/transfer/tests/test-store.js +0 -214
  144. package/packages/@monomind/cli/dist/src/workflow/condition-evaluator.d.ts +0 -10
  145. package/packages/@monomind/cli/dist/src/workflow/condition-evaluator.js +0 -82
  146. package/packages/@monomind/cli/dist/src/workflow/context-resolver.d.ts +0 -12
  147. package/packages/@monomind/cli/dist/src/workflow/context-resolver.js +0 -23
  148. package/packages/@monomind/cli/dist/src/workflow/dag-builder.d.ts +0 -17
  149. package/packages/@monomind/cli/dist/src/workflow/dag-builder.js +0 -129
  150. package/packages/@monomind/cli/dist/src/workflow/dag-executor.d.ts +0 -9
  151. package/packages/@monomind/cli/dist/src/workflow/dag-executor.js +0 -116
  152. package/packages/@monomind/cli/dist/src/workflow/dag-types.d.ts +0 -41
  153. package/packages/@monomind/cli/dist/src/workflow/dag-types.js +0 -8
  154. package/packages/@monomind/cli/dist/src/workflow/dsl-parser.d.ts +0 -12
  155. package/packages/@monomind/cli/dist/src/workflow/dsl-parser.js +0 -20
  156. package/packages/@monomind/cli/dist/src/workflow/dsl-schema.d.ts +0 -165
  157. package/packages/@monomind/cli/dist/src/workflow/dsl-schema.js +0 -82
  158. package/packages/@monomind/cli/dist/src/workflow/index.d.ts +0 -13
  159. package/packages/@monomind/cli/dist/src/workflow/index.js +0 -11
  160. package/packages/@monomind/cli/dist/src/workflow/template-engine.d.ts +0 -11
  161. package/packages/@monomind/cli/dist/src/workflow/template-engine.js +0 -40
  162. package/packages/@monomind/cli/dist/src/workflow/workflow-executor.d.ts +0 -29
  163. package/packages/@monomind/cli/dist/src/workflow/workflow-executor.js +0 -227
  164. package/packages/@monomind/guidance/dist/adversarial.d.ts +0 -284
  165. package/packages/@monomind/guidance/dist/adversarial.js +0 -572
  166. package/packages/@monomind/guidance/dist/analyzer.d.ts +0 -530
  167. package/packages/@monomind/guidance/dist/analyzer.js +0 -2518
  168. package/packages/@monomind/guidance/dist/artifacts.d.ts +0 -283
  169. package/packages/@monomind/guidance/dist/artifacts.js +0 -356
  170. package/packages/@monomind/guidance/dist/authority.d.ts +0 -290
  171. package/packages/@monomind/guidance/dist/authority.js +0 -558
  172. package/packages/@monomind/guidance/dist/capabilities.d.ts +0 -209
  173. package/packages/@monomind/guidance/dist/capabilities.js +0 -485
  174. package/packages/@monomind/guidance/dist/coherence.d.ts +0 -233
  175. package/packages/@monomind/guidance/dist/coherence.js +0 -372
  176. package/packages/@monomind/guidance/dist/compiler.d.ts +0 -87
  177. package/packages/@monomind/guidance/dist/compiler.js +0 -419
  178. package/packages/@monomind/guidance/dist/conformance-kit.d.ts +0 -225
  179. package/packages/@monomind/guidance/dist/conformance-kit.js +0 -629
  180. package/packages/@monomind/guidance/dist/continue-gate.d.ts +0 -214
  181. package/packages/@monomind/guidance/dist/continue-gate.js +0 -353
  182. package/packages/@monomind/guidance/dist/crypto-utils.d.ts +0 -17
  183. package/packages/@monomind/guidance/dist/crypto-utils.js +0 -24
  184. package/packages/@monomind/guidance/dist/evolution.d.ts +0 -282
  185. package/packages/@monomind/guidance/dist/evolution.js +0 -500
  186. package/packages/@monomind/guidance/dist/gates.d.ts +0 -79
  187. package/packages/@monomind/guidance/dist/gates.js +0 -302
  188. package/packages/@monomind/guidance/dist/gateway.d.ts +0 -206
  189. package/packages/@monomind/guidance/dist/gateway.js +0 -452
  190. package/packages/@monomind/guidance/dist/generators.d.ts +0 -153
  191. package/packages/@monomind/guidance/dist/generators.js +0 -682
  192. package/packages/@monomind/guidance/dist/headless.d.ts +0 -177
  193. package/packages/@monomind/guidance/dist/headless.js +0 -342
  194. package/packages/@monomind/guidance/dist/hooks.d.ts +0 -109
  195. package/packages/@monomind/guidance/dist/hooks.js +0 -347
  196. package/packages/@monomind/guidance/dist/index.d.ts +0 -205
  197. package/packages/@monomind/guidance/dist/index.js +0 -321
  198. package/packages/@monomind/guidance/dist/ledger.d.ts +0 -162
  199. package/packages/@monomind/guidance/dist/ledger.js +0 -375
  200. package/packages/@monomind/guidance/dist/manifest-validator.d.ts +0 -289
  201. package/packages/@monomind/guidance/dist/manifest-validator.js +0 -838
  202. package/packages/@monomind/guidance/dist/memory-gate.d.ts +0 -222
  203. package/packages/@monomind/guidance/dist/memory-gate.js +0 -382
  204. package/packages/@monomind/guidance/dist/meta-governance.d.ts +0 -265
  205. package/packages/@monomind/guidance/dist/meta-governance.js +0 -348
  206. package/packages/@monomind/guidance/dist/optimizer.d.ts +0 -104
  207. package/packages/@monomind/guidance/dist/optimizer.js +0 -329
  208. package/packages/@monomind/guidance/dist/persistence.d.ts +0 -189
  209. package/packages/@monomind/guidance/dist/persistence.js +0 -464
  210. package/packages/@monomind/guidance/dist/proof.d.ts +0 -185
  211. package/packages/@monomind/guidance/dist/proof.js +0 -238
  212. package/packages/@monomind/guidance/dist/retriever.d.ts +0 -116
  213. package/packages/@monomind/guidance/dist/retriever.js +0 -394
  214. package/packages/@monomind/guidance/dist/ruvbot-integration.d.ts +0 -370
  215. package/packages/@monomind/guidance/dist/ruvbot-integration.js +0 -738
  216. package/packages/@monomind/guidance/dist/temporal.d.ts +0 -426
  217. package/packages/@monomind/guidance/dist/temporal.js +0 -658
  218. package/packages/@monomind/guidance/dist/trust.d.ts +0 -283
  219. package/packages/@monomind/guidance/dist/trust.js +0 -473
  220. package/packages/@monomind/guidance/dist/truth-anchors.d.ts +0 -276
  221. package/packages/@monomind/guidance/dist/truth-anchors.js +0 -488
  222. package/packages/@monomind/guidance/dist/types.d.ts +0 -378
  223. package/packages/@monomind/guidance/dist/types.js +0 -10
  224. package/packages/@monomind/guidance/dist/uncertainty.d.ts +0 -372
  225. package/packages/@monomind/guidance/dist/uncertainty.js +0 -619
  226. package/packages/@monomind/guidance/dist/wasm-kernel.d.ts +0 -48
  227. package/packages/@monomind/guidance/dist/wasm-kernel.js +0 -158
@@ -1,530 +0,0 @@
1
- /**
2
- * CLAUDE.md Analyzer & Auto-Optimizer
3
- *
4
- * Quantifiable, verifiable analysis of CLAUDE.md files.
5
- * Measures structure quality, coverage, enforceability, and produces
6
- * a numeric score (0-100) that can be tracked over time.
7
- *
8
- * The auto-optimizer takes analysis results and produces a concrete
9
- * list of changes that would improve the score. Changes can be applied
10
- * programmatically and the score re-measured to verify improvement.
11
- *
12
- * @module @monomind/guidance/analyzer
13
- */
14
- import type { ProofEnvelope } from './proof.js';
15
- /** Score breakdown for a single dimension (0-100 each) */
16
- export interface DimensionScore {
17
- /** Dimension name */
18
- name: string;
19
- /** Score 0-100 */
20
- score: number;
21
- /** Maximum possible score */
22
- max: number;
23
- /** Weight in composite calculation */
24
- weight: number;
25
- /** Human-readable findings */
26
- findings: string[];
27
- }
28
- /** Complete analysis result */
29
- export interface AnalysisResult {
30
- /** Composite score 0-100 */
31
- compositeScore: number;
32
- /** Letter grade A-F */
33
- grade: string;
34
- /** Per-dimension scores */
35
- dimensions: DimensionScore[];
36
- /** Structural metrics */
37
- metrics: AnalysisMetrics;
38
- /** Actionable improvement suggestions */
39
- suggestions: Suggestion[];
40
- /** Timestamp */
41
- analyzedAt: number;
42
- }
43
- /** Raw metrics extracted from the file */
44
- export interface AnalysisMetrics {
45
- /** Total lines */
46
- totalLines: number;
47
- /** Non-blank, non-comment lines */
48
- contentLines: number;
49
- /** Number of markdown headings */
50
- headingCount: number;
51
- /** Number of H2 sections */
52
- sectionCount: number;
53
- /** Estimated constitution lines (first section block) */
54
- constitutionLines: number;
55
- /** Number of rule-like statements (imperative sentences) */
56
- ruleCount: number;
57
- /** Number of code blocks */
58
- codeBlockCount: number;
59
- /** Number of NEVER/ALWAYS/MUST statements */
60
- enforcementStatements: number;
61
- /** Number of framework/tool mentions */
62
- toolMentions: number;
63
- /** Estimated shard count after compilation */
64
- estimatedShards: number;
65
- /** Has build command */
66
- hasBuildCommand: boolean;
67
- /** Has test command */
68
- hasTestCommand: boolean;
69
- /** Has security section */
70
- hasSecuritySection: boolean;
71
- /** Has architecture section */
72
- hasArchitectureSection: boolean;
73
- /** Lines in longest section */
74
- longestSectionLines: number;
75
- /** Has @import directives */
76
- hasImports: boolean;
77
- /** Number of domain-specific rules */
78
- domainRuleCount: number;
79
- }
80
- /** A concrete improvement suggestion */
81
- export interface Suggestion {
82
- /** What to change */
83
- action: 'add' | 'remove' | 'restructure' | 'split' | 'strengthen';
84
- /** Priority */
85
- priority: 'high' | 'medium' | 'low';
86
- /** Which dimension this improves */
87
- dimension: string;
88
- /** Human-readable description */
89
- description: string;
90
- /** Estimated score improvement */
91
- estimatedImprovement: number;
92
- /** Concrete text to add/modify (if applicable) */
93
- patch?: string;
94
- }
95
- /** Before/after benchmark result */
96
- export interface BenchmarkResult {
97
- before: AnalysisResult;
98
- after: AnalysisResult;
99
- delta: number;
100
- improvements: DimensionDelta[];
101
- regressions: DimensionDelta[];
102
- }
103
- interface DimensionDelta {
104
- dimension: string;
105
- before: number;
106
- after: number;
107
- delta: number;
108
- }
109
- /** Context size preset for optimization */
110
- export type ContextSize = 'compact' | 'standard' | 'full';
111
- /** Configuration for size-aware optimization */
112
- export interface OptimizeOptions {
113
- /** Target context size */
114
- contextSize?: ContextSize;
115
- /** Optional local overlay content */
116
- localContent?: string;
117
- /** Maximum optimization iterations */
118
- maxIterations?: number;
119
- /** Target score (stop when reached) */
120
- targetScore?: number;
121
- /** HMAC key for proof chain (enables cryptographic proof of optimization) */
122
- proofKey?: string;
123
- }
124
- /** Result of headless benchmark via claude -p */
125
- export interface HeadlessBenchmarkResult {
126
- /** Before optimization metrics */
127
- before: {
128
- analysis: AnalysisResult;
129
- suitePassRate: number;
130
- violationCount: number;
131
- taskResults: HeadlessTaskResult[];
132
- };
133
- /** After optimization metrics */
134
- after: {
135
- analysis: AnalysisResult;
136
- suitePassRate: number;
137
- violationCount: number;
138
- taskResults: HeadlessTaskResult[];
139
- };
140
- /** Score delta */
141
- delta: number;
142
- /** Proof chain with cryptographic verification */
143
- proofChain: ProofEnvelope[];
144
- /** Formatted report */
145
- report: string;
146
- }
147
- /** Result of a single headless task run */
148
- export interface HeadlessTaskResult {
149
- taskId: string;
150
- prompt: string;
151
- passed: boolean;
152
- violations: string[];
153
- durationMs: number;
154
- }
155
- /**
156
- * Analyze a CLAUDE.md file and produce quantifiable scores.
157
- *
158
- * Scores 6 dimensions (0-100 each), weighted into a composite:
159
- * - Structure (20%): headings, sections, length, organization
160
- * - Coverage (20%): build/test/security/architecture/domain
161
- * - Enforceability (25%): NEVER/ALWAYS statements, concrete rules
162
- * - Compilability (15%): how well it compiles to constitution + shards
163
- * - Clarity (10%): code blocks, examples, specificity
164
- * - Completeness (10%): missing common sections
165
- */
166
- export declare function analyze(content: string, localContent?: string): AnalysisResult;
167
- /**
168
- * Run a before/after benchmark.
169
- * Returns the delta and per-dimension changes.
170
- */
171
- export declare function benchmark(before: string, after: string, localContent?: string): BenchmarkResult;
172
- /**
173
- * Auto-optimize a CLAUDE.md file by applying high-priority suggestions.
174
- * Returns the optimized content and the benchmark result.
175
- */
176
- export declare function autoOptimize(content: string, localContent?: string, maxIterations?: number): {
177
- optimized: string;
178
- benchmark: BenchmarkResult;
179
- appliedSuggestions: Suggestion[];
180
- };
181
- /**
182
- * Context-size-aware optimization that restructures content to reach 90%+.
183
- *
184
- * Unlike autoOptimize (which only appends), this function:
185
- * 1. Splits oversized sections into subsections
186
- * 2. Extracts enforcement prose into list-format rules
187
- * 3. Trims the constitution to budget
188
- * 4. Removes redundant content
189
- * 5. Adds missing coverage sections
190
- * 6. Applies iterative patch suggestions
191
- *
192
- * @param content - CLAUDE.md content
193
- * @param options - Optimization options with contextSize and targetScore
194
- * @returns Optimized content, benchmark, and proof chain
195
- */
196
- export declare function optimizeForSize(content: string, options?: OptimizeOptions): {
197
- optimized: string;
198
- benchmark: BenchmarkResult;
199
- appliedSteps: string[];
200
- proof: ProofEnvelope[];
201
- };
202
- /**
203
- * Run a headless benchmark using `claude -p` to measure actual agent
204
- * compliance before and after optimization.
205
- *
206
- * Requires `claude` CLI to be installed. Uses the proof chain to create
207
- * tamper-evident records of each test run.
208
- *
209
- * @param originalContent - Original CLAUDE.md
210
- * @param optimizedContent - Optimized CLAUDE.md
211
- * @param options - Options including proof key and executor
212
- */
213
- export declare function headlessBenchmark(originalContent: string, optimizedContent: string, options?: {
214
- proofKey?: string;
215
- executor?: IHeadlessExecutor;
216
- tasks?: HeadlessBenchmarkTask[];
217
- workDir?: string;
218
- }): Promise<HeadlessBenchmarkResult>;
219
- /** Executor interface for headless claude commands */
220
- export interface IHeadlessExecutor {
221
- execute(prompt: string, workDir: string): Promise<{
222
- stdout: string;
223
- stderr: string;
224
- exitCode: number;
225
- }>;
226
- }
227
- /**
228
- * Content-aware executor that adapts behavior based on CLAUDE.md content.
229
- *
230
- * When `validateEffect()` detects this interface, it calls `setContext()`
231
- * before each phase (before/after) so the executor can vary its responses
232
- * based on the quality of the loaded CLAUDE.md. This is the key mechanism
233
- * that makes the empirical validation meaningful — without it, the same
234
- * executor produces identical adherence for both phases.
235
- */
236
- export interface IContentAwareExecutor extends IHeadlessExecutor {
237
- /** Set the CLAUDE.md content that the executor should use as behavioral context */
238
- setContext(claudeMdContent: string): void;
239
- }
240
- /** Benchmark task definition */
241
- interface HeadlessBenchmarkTask {
242
- id: string;
243
- prompt: string;
244
- expectForbidden: string[];
245
- expectPresent: string[];
246
- }
247
- /**
248
- * Format analysis result as a human-readable report.
249
- */
250
- export declare function formatReport(result: AnalysisResult): string;
251
- /**
252
- * Format benchmark result as a comparison table.
253
- */
254
- export declare function formatBenchmark(result: BenchmarkResult): string;
255
- /**
256
- * An assertion about expected agent behavior.
257
- */
258
- export interface ValidationAssertion {
259
- /** What to check */
260
- type: 'must-contain' | 'must-not-contain' | 'must-match-pattern' | 'must-mention-tool';
261
- /** The value to check (string literal or regex pattern for must-match-pattern) */
262
- value: string;
263
- /** How bad is a failure? */
264
- severity: 'critical' | 'major' | 'minor';
265
- }
266
- /**
267
- * A compliance task that tests whether the agent adheres to a specific
268
- * dimension's expected behavior.
269
- */
270
- export interface ValidationTask {
271
- /** Unique task identifier */
272
- id: string;
273
- /** Which scoring dimension this task validates */
274
- dimension: string;
275
- /** The prompt to send to the agent */
276
- prompt: string;
277
- /** Assertions about the agent's output */
278
- assertions: ValidationAssertion[];
279
- /** Importance weight within its dimension (0-1) */
280
- weight: number;
281
- }
282
- /**
283
- * Result of running a single validation task.
284
- */
285
- export interface ValidationTaskResult {
286
- taskId: string;
287
- dimension: string;
288
- passed: boolean;
289
- assertionResults: {
290
- assertion: ValidationAssertion;
291
- passed: boolean;
292
- detail: string;
293
- }[];
294
- output: string;
295
- durationMs: number;
296
- }
297
- /**
298
- * A single validation run against one CLAUDE.md version.
299
- */
300
- export interface ValidationRun {
301
- /** Analysis of the CLAUDE.md used */
302
- analysis: AnalysisResult;
303
- /** Per-task results */
304
- taskResults: ValidationTaskResult[];
305
- /** Overall adherence rate (0-1) — weighted by severity */
306
- adherenceRate: number;
307
- /** Per-dimension adherence rates */
308
- dimensionAdherence: Record<string, number>;
309
- /** Timestamp */
310
- timestamp: number;
311
- }
312
- /**
313
- * Statistical correlation between score changes and behavioral changes.
314
- */
315
- export interface CorrelationResult {
316
- /** Per-dimension score vs adherence comparison */
317
- dimensionCorrelations: {
318
- dimension: string;
319
- scoreBefore: number;
320
- scoreAfter: number;
321
- scoreDelta: number;
322
- adherenceBefore: number;
323
- adherenceAfter: number;
324
- adherenceDelta: number;
325
- /** Did score and adherence move in the same direction? */
326
- concordant: boolean;
327
- }[];
328
- /** Pearson correlation coefficient (-1 to 1) */
329
- pearsonR: number;
330
- /** Spearman rank correlation coefficient (-1 to 1) — more robust for small samples */
331
- spearmanRho: number;
332
- /** Cohen's d effect size (null if insufficient data) */
333
- cohensD: number | null;
334
- /** Human-readable effect size label */
335
- effectSizeLabel: string;
336
- /** Number of data points */
337
- n: number;
338
- /** Is the correlation statistically significant? (|r| > threshold for n) */
339
- significant: boolean;
340
- /** Overall verdict */
341
- verdict: 'positive-effect' | 'negative-effect' | 'no-effect' | 'inconclusive';
342
- }
343
- /**
344
- * Complete validation report proving (or disproving) that score improvements
345
- * lead to behavioral improvements.
346
- */
347
- export interface ValidationReport {
348
- /** Run against original CLAUDE.md */
349
- before: ValidationRun;
350
- /** Run against optimized CLAUDE.md */
351
- after: ValidationRun;
352
- /** Statistical correlation analysis */
353
- correlation: CorrelationResult;
354
- /** Cryptographic proof chain */
355
- proofChain: ProofEnvelope[];
356
- /** Formatted human-readable report */
357
- report: string;
358
- }
359
- /**
360
- * Empirically validate that score improvements produce behavioral improvements.
361
- *
362
- * Runs a suite of compliance tasks against both the original and optimized
363
- * CLAUDE.md, then computes statistical correlations between per-dimension
364
- * score deltas and per-dimension adherence rate deltas.
365
- *
366
- * **Content-aware executors**: If the executor implements `IContentAwareExecutor`,
367
- * `setContext()` is called before each phase with the corresponding CLAUDE.md
368
- * content. This is the key mechanism that allows the executor to vary its
369
- * behavior based on the quality of the loaded guidance — without it, the same
370
- * executor produces identical adherence for both phases.
371
- *
372
- * The result includes:
373
- * - Per-dimension concordance (did score and adherence move together?)
374
- * - Pearson r and Spearman rho correlation coefficients
375
- * - Cohen's d effect size with interpretation
376
- * - A verdict: positive-effect, negative-effect, no-effect, or inconclusive
377
- * - A formatted report with full task breakdown
378
- * - Optional proof chain for tamper-evident audit trail
379
- *
380
- * @param originalContent - Original CLAUDE.md content
381
- * @param optimizedContent - Optimized CLAUDE.md content
382
- * @param options - Executor, tasks, proof key, work directory, trials
383
- * @returns ValidationReport with statistical evidence
384
- */
385
- export declare function validateEffect(originalContent: string, optimizedContent: string, options?: {
386
- executor?: IHeadlessExecutor;
387
- tasks?: ValidationTask[];
388
- proofKey?: string;
389
- workDir?: string;
390
- /** Number of trials per phase (default 1). Higher values average out noise. */
391
- trials?: number;
392
- }): Promise<ValidationReport>;
393
- /** Task class categories for the A/B benchmark */
394
- export type ABTaskClass = 'bug-fix' | 'feature' | 'refactor' | 'security' | 'deployment' | 'test' | 'performance';
395
- /** A single benchmark task representing a real Monomind scenario */
396
- export interface ABTask {
397
- /** Unique task identifier */
398
- id: string;
399
- /** Human-readable description */
400
- description: string;
401
- /** Task class for grouping results */
402
- taskClass: ABTaskClass;
403
- /** Prompt sent to the executor */
404
- prompt: string;
405
- /** Assertions to evaluate pass/fail */
406
- assertions: ValidationAssertion[];
407
- /** Violation patterns to detect via gate simulation */
408
- gatePatterns: ABGatePattern[];
409
- }
410
- /** A pattern the gate simulator checks for in executor output */
411
- export interface ABGatePattern {
412
- /** What kind of violation this detects */
413
- category: 'destructive-command' | 'hardcoded-secret' | 'force-push' | 'unsafe-type' | 'skipped-hook' | 'missing-test' | 'policy-violation';
414
- /** Regex pattern to match in output */
415
- pattern: string;
416
- /** Severity of the violation */
417
- severity: 'critical' | 'major' | 'minor';
418
- }
419
- /** Result for a single task in either config A or config B */
420
- export interface ABTaskResult {
421
- /** Task ID */
422
- taskId: string;
423
- /** Task class */
424
- taskClass: ABTaskClass;
425
- /** Did all assertions pass? */
426
- passed: boolean;
427
- /** Assertion evaluation details */
428
- assertionResults: {
429
- assertion: ValidationAssertion;
430
- passed: boolean;
431
- detail: string;
432
- }[];
433
- /** Gate violations detected */
434
- violations: {
435
- category: string;
436
- pattern: string;
437
- severity: string;
438
- }[];
439
- /** Would a human need to intervene? (any critical violation) */
440
- humanIntervention: boolean;
441
- /** Simulated tool call count (extracted from output) */
442
- toolCalls: number;
443
- /** Simulated token spend (estimated from output length) */
444
- tokenSpend: number;
445
- /** Raw executor output */
446
- output: string;
447
- /** Execution duration in ms */
448
- durationMs: number;
449
- }
450
- /** Aggregated KPIs for one config (A or B) */
451
- export interface ABMetrics {
452
- /** Fraction of tasks that passed (0-1) */
453
- successRate: number;
454
- /** Total wall clock time in ms */
455
- wallClockMs: number;
456
- /** Average tool calls per task */
457
- avgToolCalls: number;
458
- /** Average token spend per task */
459
- avgTokenSpend: number;
460
- /** Total gate violations */
461
- totalViolations: number;
462
- /** Tasks requiring human intervention */
463
- humanInterventions: number;
464
- /** Per-task-class success rates */
465
- classSuccessRates: Record<ABTaskClass, number>;
466
- /** Composite score: success_rate - 0.1*norm_cost - 0.2*violations - 0.1*interventions */
467
- compositeScore: number;
468
- }
469
- /** Complete A/B benchmark report */
470
- export interface ABReport {
471
- /** Config A results (no control plane) */
472
- configA: {
473
- label: string;
474
- taskResults: ABTaskResult[];
475
- metrics: ABMetrics;
476
- };
477
- /** Config B results (with Phase 1 control plane) */
478
- configB: {
479
- label: string;
480
- taskResults: ABTaskResult[];
481
- metrics: ABMetrics;
482
- };
483
- /** Composite score delta (B - A) */
484
- compositeDelta: number;
485
- /** Per-task-class deltas */
486
- classDeltas: Record<ABTaskClass, number>;
487
- /** Does B beat A by ≥0.2 on composite across ≥3 task classes? */
488
- categoryShift: boolean;
489
- /** Proof chain envelopes */
490
- proofChain: ProofEnvelope[];
491
- /** Formatted human-readable report */
492
- report: string;
493
- }
494
- /**
495
- * Run an A/B benchmark comparing agent performance with and without
496
- * the Guidance Control Plane.
497
- *
498
- * **Config A** (baseline): No guidance — executor runs without setContext()
499
- * **Config B** (treatment): With guidance — executor gets setContext(claudeMd) +
500
- * gate simulation on every output
501
- *
502
- * The 20 tasks span 7 task classes drawn from real Monomind repo history:
503
- * bug-fix (3), feature (5), refactor (3), security (3), deployment (2),
504
- * test (2), performance (2).
505
- *
506
- * KPIs tracked per task:
507
- * - success rate, tool calls, token spend, violations, human interventions
508
- *
509
- * Composite score: `success_rate - 0.1*norm_cost - 0.2*violations - 0.1*interventions`
510
- *
511
- * **Success criterion**: B beats A by ≥0.2 on composite across ≥3 task classes
512
- * = "category shift"
513
- *
514
- * @param claudeMdContent - The CLAUDE.md content used for Config B
515
- * @param options - Executor, tasks, proof key, work directory
516
- * @returns ABReport with full per-task and per-class breakdown
517
- */
518
- export declare function abBenchmark(claudeMdContent: string, options?: {
519
- executor?: IHeadlessExecutor;
520
- tasks?: ABTask[];
521
- proofKey?: string;
522
- workDir?: string;
523
- }): Promise<ABReport>;
524
- /**
525
- * Get the default 20 A/B benchmark tasks.
526
- * Exported for test customization and documentation.
527
- */
528
- export declare function getDefaultABTasks(): ABTask[];
529
- export {};
530
- //# sourceMappingURL=analyzer.d.ts.map