avorelo 0.1.0 → 0.3.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (260)
  1. package/LICENSE +23 -16
  2. package/README.md +90 -51
  3. package/bin/avorelo.mjs +7 -0
  4. package/dist/avorelo.mjs +19741 -0
  5. package/package.json +135 -120
  6. package/bin/avorelo +0 -9
  7. package/scripts/README.md +0 -40
  8. package/scripts/cco-dashboard.js +0 -252
  9. package/scripts/cco-status.js +0 -430
  10. package/scripts/lib/activation/account-state.js +0 -37
  11. package/scripts/lib/activation/activation-runner.js +0 -546
  12. package/scripts/lib/activation/activation-self-healing.js +0 -480
  13. package/scripts/lib/activation/activation-state.js +0 -83
  14. package/scripts/lib/activation/activation-summary.js +0 -191
  15. package/scripts/lib/activation/adapters/claude-code.js +0 -77
  16. package/scripts/lib/activation/adapters/codex-cli.js +0 -52
  17. package/scripts/lib/activation/adapters/cursor.js +0 -37
  18. package/scripts/lib/activation/adapters/github-agent.js +0 -39
  19. package/scripts/lib/activation/adapters/terminal.js +0 -42
  20. package/scripts/lib/activation/adapters/vscode.js +0 -39
  21. package/scripts/lib/activation/adapters/windsurf.js +0 -37
  22. package/scripts/lib/activation/ai-surface-detector.js +0 -151
  23. package/scripts/lib/activation/connect-account.js +0 -145
  24. package/scripts/lib/activation/detect-environment.js +0 -75
  25. package/scripts/lib/activation/detect-hosts.js +0 -62
  26. package/scripts/lib/activation/format-activation-output.js +0 -109
  27. package/scripts/lib/activation/next-action.js +0 -43
  28. package/scripts/lib/activation/repair-engine.js +0 -219
  29. package/scripts/lib/activation-distribution-readiness.js +0 -507
  30. package/scripts/lib/adapter-conformance.js +0 -176
  31. package/scripts/lib/adapter-readiness.js +0 -417
  32. package/scripts/lib/adapter-safety-boundaries.js +0 -335
  33. package/scripts/lib/adapter-technical-readiness-gate.js +0 -205
  34. package/scripts/lib/agent-access-governance.js +0 -455
  35. package/scripts/lib/agent-enforcement.js +0 -765
  36. package/scripts/lib/agent-policy-profile.js +0 -210
  37. package/scripts/lib/agent-security/action-evaluator.js +0 -507
  38. package/scripts/lib/agent-security/adapter-registry.js +0 -98
  39. package/scripts/lib/agent-security/auto-policy.js +0 -139
  40. package/scripts/lib/agent-security/bounded-scan.js +0 -93
  41. package/scripts/lib/agent-security/enforcement-adapter.js +0 -174
  42. package/scripts/lib/agent-security/enforcement-engine.js +0 -1129
  43. package/scripts/lib/agent-security/file-write-adapter.js +0 -183
  44. package/scripts/lib/agent-security/file-write-rules.js +0 -178
  45. package/scripts/lib/agent-security/index.js +0 -3342
  46. package/scripts/lib/agent-security/instruction-risk.js +0 -181
  47. package/scripts/lib/agent-security/mcp-action-adapter.js +0 -185
  48. package/scripts/lib/agent-security/mcp-action-rules.js +0 -184
  49. package/scripts/lib/agent-security/package-action-adapter.js +0 -175
  50. package/scripts/lib/agent-security/package-action-rules.js +0 -233
  51. package/scripts/lib/agent-security/performance.js +0 -148
  52. package/scripts/lib/agent-security/permission-minimizer.js +0 -403
  53. package/scripts/lib/agent-security/scan-cache.js +0 -74
  54. package/scripts/lib/agent-security/source-trust.js +0 -146
  55. package/scripts/lib/ai-install-prompt.js +0 -288
  56. package/scripts/lib/ai-workspace-hygiene.js +0 -1499
  57. package/scripts/lib/alpha-activation.js +0 -520
  58. package/scripts/lib/alpha-feedback.js +0 -263
  59. package/scripts/lib/alpha-readiness-gate.js +0 -332
  60. package/scripts/lib/anti-gaming.js +0 -169
  61. package/scripts/lib/artifact-health.js +0 -431
  62. package/scripts/lib/attribution.js +0 -180
  63. package/scripts/lib/audit.js +0 -289
  64. package/scripts/lib/avorelo-skill-registry.js +0 -810
  65. package/scripts/lib/batch-jobs.js +0 -71
  66. package/scripts/lib/brain-pack.js +0 -578
  67. package/scripts/lib/brand-boundary.js +0 -424
  68. package/scripts/lib/brand.js +0 -74
  69. package/scripts/lib/browser-capability.js +0 -1048
  70. package/scripts/lib/browser-proof-preflight.js +0 -321
  71. package/scripts/lib/cache-readiness.js +0 -187
  72. package/scripts/lib/canonical-reentry.js +0 -162
  73. package/scripts/lib/capability-packs.js +0 -314
  74. package/scripts/lib/capability-recommender.js +0 -512
  75. package/scripts/lib/capability-registry.js +0 -1059
  76. package/scripts/lib/carry-forward-surfacing.js +0 -194
  77. package/scripts/lib/ccusage-adapter.js +0 -188
  78. package/scripts/lib/company-loop.js +0 -1149
  79. package/scripts/lib/config.js +0 -637
  80. package/scripts/lib/context-acquisition-plan.js +0 -287
  81. package/scripts/lib/context-budget-guard.js +0 -170
  82. package/scripts/lib/context-budget-scanner.js +0 -257
  83. package/scripts/lib/context-optimizer.js +0 -715
  84. package/scripts/lib/context-reduction-plan.js +0 -178
  85. package/scripts/lib/context-safety.js +0 -88
  86. package/scripts/lib/context-savings-engine.js +0 -158
  87. package/scripts/lib/cost-evidence.js +0 -254
  88. package/scripts/lib/cross-host-install-plan.js +0 -308
  89. package/scripts/lib/cross-host-install-readiness.js +0 -237
  90. package/scripts/lib/cross-host-value-flow.js +0 -268
  91. package/scripts/lib/dashboard.js +0 -900
  92. package/scripts/lib/design-partner-feedback.js +0 -346
  93. package/scripts/lib/entitlements.js +0 -100
  94. package/scripts/lib/execution-packet.js +0 -559
  95. package/scripts/lib/experimentation-events.js +0 -547
  96. package/scripts/lib/external-capability-compliance.js +0 -107
  97. package/scripts/lib/external-user-simulation.js +0 -166
  98. package/scripts/lib/failure-recovery-readiness.js +0 -81
  99. package/scripts/lib/failure-recovery.js +0 -419
  100. package/scripts/lib/feedback-intelligence.js +0 -537
  101. package/scripts/lib/feedback-signals.js +0 -205
  102. package/scripts/lib/file-integrity.js +0 -68
  103. package/scripts/lib/fsx.js +0 -127
  104. package/scripts/lib/full-readiness-gate.js +0 -451
  105. package/scripts/lib/guidance-builder.js +0 -174
  106. package/scripts/lib/hook-apply.js +0 -1019
  107. package/scripts/lib/hook-baseline.js +0 -310
  108. package/scripts/lib/hook-config-preview.js +0 -275
  109. package/scripts/lib/hook-contracts.js +0 -290
  110. package/scripts/lib/hook-safety-boundary-readiness.js +0 -80
  111. package/scripts/lib/host-capability-matrix.js +0 -351
  112. package/scripts/lib/host-support-context.js +0 -254
  113. package/scripts/lib/http-hook-action.js +0 -538
  114. package/scripts/lib/install-ai-readiness.js +0 -84
  115. package/scripts/lib/install-intake-risk.js +0 -1037
  116. package/scripts/lib/install-journey-intelligence.js +0 -329
  117. package/scripts/lib/intervention-guidance.js +0 -57
  118. package/scripts/lib/known-limitations.js +0 -115
  119. package/scripts/lib/l8-path-truth.js +0 -146
  120. package/scripts/lib/launch-hardening-gate.js +0 -436
  121. package/scripts/lib/launch-readiness.js +0 -628
  122. package/scripts/lib/learning-memory.js +0 -686
  123. package/scripts/lib/lifecycle-hooks.js +0 -802
  124. package/scripts/lib/local-package-smoke.js +0 -423
  125. package/scripts/lib/local-pricing.js +0 -299
  126. package/scripts/lib/mcp-enforcement.js +0 -311
  127. package/scripts/lib/mcp-least-privilege-policy.js +0 -303
  128. package/scripts/lib/mcp-tool-inventory.js +0 -388
  129. package/scripts/lib/mcp-tool-risk.js +0 -0
  130. package/scripts/lib/memory.js +0 -335
  131. package/scripts/lib/metrics.js +0 -699
  132. package/scripts/lib/micro-proof.js +0 -133
  133. package/scripts/lib/next-run-context.js +0 -436
  134. package/scripts/lib/operating-value.js +0 -1648
  135. package/scripts/lib/optimization-v3.js +0 -122
  136. package/scripts/lib/orchestration/adapters/_shared.js +0 -49
  137. package/scripts/lib/orchestration/adapters/aider.js +0 -18
  138. package/scripts/lib/orchestration/adapters/claude-code.js +0 -35
  139. package/scripts/lib/orchestration/adapters/codex.js +0 -35
  140. package/scripts/lib/orchestration/adapters/gemini-cli.js +0 -18
  141. package/scripts/lib/orchestration/adapters/git.js +0 -25
  142. package/scripts/lib/orchestration/adapters/index.js +0 -31
  143. package/scripts/lib/orchestration/adapters/lm-studio.js +0 -18
  144. package/scripts/lib/orchestration/adapters/ollama.js +0 -18
  145. package/scripts/lib/orchestration/adapters/opencode.js +0 -18
  146. package/scripts/lib/orchestration/adapters/openrouter.js +0 -18
  147. package/scripts/lib/orchestration/adapters/test-runner.js +0 -25
  148. package/scripts/lib/orchestration/cli.js +0 -438
  149. package/scripts/lib/orchestration/execution-manager.js +0 -279
  150. package/scripts/lib/orchestration/handoff.js +0 -314
  151. package/scripts/lib/orchestration/index.js +0 -456
  152. package/scripts/lib/orchestration/inventory.js +0 -47
  153. package/scripts/lib/orchestration/model-discovery.js +0 -498
  154. package/scripts/lib/orchestration/model-profiler.js +0 -170
  155. package/scripts/lib/orchestration/model-profiles.js +0 -252
  156. package/scripts/lib/orchestration/model-refresh-policy.js +0 -72
  157. package/scripts/lib/orchestration/proof-writer.js +0 -349
  158. package/scripts/lib/orchestration/provider-discovery/aider.js +0 -49
  159. package/scripts/lib/orchestration/provider-discovery/claude-code.js +0 -56
  160. package/scripts/lib/orchestration/provider-discovery/codex.js +0 -49
  161. package/scripts/lib/orchestration/provider-discovery/common.js +0 -186
  162. package/scripts/lib/orchestration/provider-discovery/gemini.js +0 -106
  163. package/scripts/lib/orchestration/provider-discovery/lm-studio.js +0 -118
  164. package/scripts/lib/orchestration/provider-discovery/models-dev.js +0 -12
  165. package/scripts/lib/orchestration/provider-discovery/ollama.js +0 -100
  166. package/scripts/lib/orchestration/provider-discovery/opencode.js +0 -47
  167. package/scripts/lib/orchestration/provider-discovery/openrouter.js +0 -44
  168. package/scripts/lib/orchestration/risk-classifier.js +0 -130
  169. package/scripts/lib/orchestration/routing-policy.js +0 -486
  170. package/scripts/lib/orchestration/settings.js +0 -112
  171. package/scripts/lib/orchestration/state.js +0 -165
  172. package/scripts/lib/orchestration/verification-manager.js +0 -138
  173. package/scripts/lib/output-profiles.js +0 -146
  174. package/scripts/lib/package-content-audit.js +0 -368
  175. package/scripts/lib/package-runtime.js +0 -278
  176. package/scripts/lib/plan-surface.js +0 -53
  177. package/scripts/lib/plans.js +0 -2318
  178. package/scripts/lib/policy-provider.js +0 -27
  179. package/scripts/lib/prelaunch-activation-readiness.js +0 -409
  180. package/scripts/lib/prelaunch-evidence-store.js +0 -816
  181. package/scripts/lib/prelaunch-intelligence.js +0 -869
  182. package/scripts/lib/pricing-experiment.js +0 -118
  183. package/scripts/lib/pro-moment-events.js +0 -77
  184. package/scripts/lib/pro-moment-state.js +0 -227
  185. package/scripts/lib/pro-moments.js +0 -1216
  186. package/scripts/lib/product-learning-events.js +0 -629
  187. package/scripts/lib/project-profile.js +0 -555
  188. package/scripts/lib/prompt-compiler.js +0 -280
  189. package/scripts/lib/prompt-lint.js +0 -32
  190. package/scripts/lib/prompt-suggestions.js +0 -52
  191. package/scripts/lib/proof-canonical.js +0 -398
  192. package/scripts/lib/proof-drilldown.js +0 -383
  193. package/scripts/lib/proof-events.js +0 -342
  194. package/scripts/lib/proof-history.js +0 -243
  195. package/scripts/lib/proof-metrics.js +0 -296
  196. package/scripts/lib/proof-outcome-evidence.js +0 -134
  197. package/scripts/lib/proof-receipt.js +0 -335
  198. package/scripts/lib/proof-record.js +0 -461
  199. package/scripts/lib/public-activation-distribution-gate.js +0 -258
  200. package/scripts/lib/public-cli.js +0 -3891
  201. package/scripts/lib/public-distribution-truth.js +0 -211
  202. package/scripts/lib/public-install-claim-checker.js +0 -294
  203. package/scripts/lib/publish-provenance-readiness.js +0 -283
  204. package/scripts/lib/readiness-delta.js +0 -218
  205. package/scripts/lib/readiness-evidence-closure.js +0 -196
  206. package/scripts/lib/reentry-memory-capture.js +0 -241
  207. package/scripts/lib/reentry-memory-retrieval.js +0 -302
  208. package/scripts/lib/reentry-memory-status.js +0 -146
  209. package/scripts/lib/reentry-memory-store.js +0 -178
  210. package/scripts/lib/reentry-state.js +0 -66
  211. package/scripts/lib/release-candidate-bundle.js +0 -166
  212. package/scripts/lib/remediation.js +0 -81
  213. package/scripts/lib/repo-map.js +0 -391
  214. package/scripts/lib/run-improvements-lifecycle.js +0 -330
  215. package/scripts/lib/run-improvements.js +0 -789
  216. package/scripts/lib/runtime-decision-policy.js +0 -387
  217. package/scripts/lib/safe-path-engine.js +0 -705
  218. package/scripts/lib/safe-run-controller.js +0 -887
  219. package/scripts/lib/score.js +0 -262
  220. package/scripts/lib/seamless-enforcement.js +0 -329
  221. package/scripts/lib/seamless-outcome.js +0 -689
  222. package/scripts/lib/seamless-reality-gate.js +0 -5043
  223. package/scripts/lib/security-risk-classifier.js +0 -511
  224. package/scripts/lib/security-scan.js +0 -384
  225. package/scripts/lib/session-context-optimizer.js +0 -1211
  226. package/scripts/lib/session-timing.js +0 -315
  227. package/scripts/lib/skill-hygiene.js +0 -805
  228. package/scripts/lib/skill-packs.js +0 -161
  229. package/scripts/lib/skills-operating-layer.js +0 -580
  230. package/scripts/lib/smart-work-routing.js +0 -768
  231. package/scripts/lib/source-catalog.js +0 -700
  232. package/scripts/lib/status-value-summary.js +0 -32
  233. package/scripts/lib/support-bundle.js +0 -578
  234. package/scripts/lib/task-continuation.js +0 -440
  235. package/scripts/lib/test-helpers.js +0 -15
  236. package/scripts/lib/tier.js +0 -38
  237. package/scripts/lib/token-context-quality-gate.js +0 -370
  238. package/scripts/lib/token-cost-capture.js +0 -187
  239. package/scripts/lib/token-cost-intelligence.js +0 -358
  240. package/scripts/lib/token-efficiency-evidence.js +0 -213
  241. package/scripts/lib/token-evidence.js +0 -699
  242. package/scripts/lib/tokenish.js +0 -17
  243. package/scripts/lib/tool-output-sandbox.js +0 -304
  244. package/scripts/lib/trust-audit.js +0 -136
  245. package/scripts/lib/unified-events.js +0 -396
  246. package/scripts/lib/upgrade-interruption-recovery.js +0 -407
  247. package/scripts/lib/usage-ledger.js +0 -201
  248. package/scripts/lib/value-ledger.js +0 -130
  249. package/scripts/lib/value-proof-calibration.js +0 -531
  250. package/scripts/lib/visual-qa.js +0 -231
  251. package/scripts/lib/voice-alpha.js +0 -29
  252. package/scripts/lib/work-aware-orchestration.js +0 -976
  253. package/scripts/lib/work-control-receipts.js +0 -577
  254. package/scripts/lib/work-ledger.js +0 -1123
  255. package/scripts/lib/work-panel-preview.js +0 -352
  256. package/scripts/lib/workflow-discipline.js +0 -280
  257. package/scripts/lib/workflow-signals.js +0 -419
  258. package/scripts/lib/workspace-map.js +0 -281
  259. package/scripts/lib/workspace-registry.js +0 -1367
  260. package/scripts/lib/workspace-resolver.js +0 -480
@@ -1,296 +0,0 @@
1
- "use strict";
2
-
3
- /**
4
- * Proof Metrics - 12 named effectiveness metric definitions.
5
- */
6
-
7
- const { readAllMetrics } = require("./metrics");
8
- const { composeProofRecord } = require("./proof-record");
9
-
10
/**
 * Catalogue of the named proof metrics, keyed by metric id.
 *
 * Every entry carries the same six descriptive fields:
 *   id          - equal to the entry's own key
 *   name        - display name
 *   description - sentence explaining what the metric measures
 *   unit        - "seconds", "percent" or "count"
 *   dimension   - "outcome", "efficiency", "control" or "trust"
 *   derivation  - free-text note on how the value is obtained
 *
 * computeProofMetrics() spreads each entry into the matching result object and
 * emptyMetrics() reads `unit` to choose the placeholder value (0 or null).
 */
const METRIC_DEFINITIONS = {
  // ---- dimension: outcome ----
  time_to_first_useful_result: {
    id: "time_to_first_useful_result",
    name: "Time to First Useful Result",
    description: "Time from run start to the first truly usable output.",
    unit: "seconds",
    dimension: "outcome",
    derivation: "started_at to first TASK_COMPLETED or meaningful artifact event",
  },
  completion_rate: {
    id: "completion_rate",
    name: "Completion Rate",
    description: "Percentage of runs ending in completed task or safe stop with bounded next action.",
    unit: "percent",
    dimension: "outcome",
    derivation: "sessions with canonical completion truth when present, otherwise TASK_COMPLETED or STOP_SNAPSHOT / total sessions",
  },
  evidence_backed_completion_rate: {
    id: "evidence_backed_completion_rate",
    name: "Evidence-Backed Completion Rate",
    description:
      "Of completions, how many have related security/trust evidence artifacts in the same session. This is a proxy for evidence presence, not a verification of task correctness.",
    unit: "percent",
    dimension: "outcome",
    derivation: "canonical proof-aware completions with related evidence / total completions",
  },
  // ---- dimension: efficiency ----
  retries_per_task: {
    id: "retries_per_task",
    name: "Retries Per Task",
    description: "Average retries, reruns, or recovery loops per task.",
    unit: "count",
    dimension: "efficiency",
    derivation: "proof-record retries_count / sessions",
  },
  dead_end_rate: {
    id: "dead_end_rate",
    name: "Dead-End Rate",
    description: "Runs ending without usable output, recovery path, or safe stop.",
    unit: "percent",
    dimension: "efficiency",
    derivation: "sessions without completion, safe stop, or recovery / total sessions",
  },
  large_outputs_managed: {
    id: "large_outputs_managed",
    name: "Large Outputs Managed",
    description:
      "Count of large tool outputs stored out-of-band to reduce context pressure. This is a count, not a precise byte-level reduction measurement.",
    unit: "count",
    dimension: "efficiency",
    derivation: "canonical material steps or CTX_LARGE_OUTPUT counts across sessions",
  },
  unnecessary_tool_load_avoided: {
    id: "unnecessary_tool_load_avoided",
    name: "Unnecessary Tool Load Avoided",
    description: "Count of tool loads or scans intentionally skipped because unnecessary.",
    unit: "count",
    dimension: "efficiency",
    derivation: "proof-record tools_skipped",
  },
  // ---- dimension: control ----
  approval_interruptions_avoided: {
    id: "approval_interruptions_avoided",
    name: "Approval Interruptions Avoided",
    description: "Count of policy-relevant interruptions avoided because execution stayed within policy.",
    unit: "count",
    dimension: "control",
    derivation: "proof-record approval_requests_avoided",
  },
  risky_actions_blocked_or_downgraded: {
    id: "risky_actions_blocked_or_downgraded",
    name: "Risky Actions Blocked or Downgraded",
    description: "Count of risky actions blocked, downgraded, or deferred.",
    unit: "count",
    dimension: "control",
    derivation: "proof-record risky action counts, canonical proof first",
  },
  // ---- dimension: trust ----
  honest_fallback_rate: {
    id: "honest_fallback_rate",
    name: "Honest Fallback Rate",
    // NOTE(review): the description names "Wuz" while this package is published
    // as avorelo - confirm which product name is intended here.
    description: "Rate at which Wuz stopped or limited claims honestly instead of fabricating certainty.",
    unit: "percent",
    dimension: "trust",
    derivation: "safe-stop sessions / total sessions",
  },
  recovery_success_rate: {
    id: "recovery_success_rate",
    name: "Recovery Success Rate",
    description: "Of runs that encountered blocks or failures, how many reached successful completion.",
    unit: "percent",
    dimension: "trust",
    derivation: "sessions with retries that still reach completion / retry sessions",
  },
  evidence_coverage: {
    id: "evidence_coverage",
    name: "Evidence Coverage",
    description: "Percentage of material sessions with evidence or traceable support.",
    unit: "percent",
    dimension: "trust",
    derivation: "proof-record sessions with related evidence / total sessions",
  },
};
110
-
111
/**
 * Whole-number percentage of `part` over `whole`; 0 when `whole` is not positive.
 */
function toPercent(part, whole) {
  return whole > 0 ? Math.round((part / whole) * 100) : 0;
}

/**
 * Aggregates the metric events of the last `options.days` days into the proof
 * metrics described by METRIC_DEFINITIONS.
 *
 * Events come from readAllMetrics(cwd); only those whose `ts` parses to a
 * timestamp at or after the cutoff are kept. Kept events are grouped by
 * `sessionId` (events without one share the "unknown" bucket) and each group is
 * turned into a proof record via composeProofRecord(sessionId, events, []).
 * Counters are then accumulated from the record's `completion_status`,
 * `outcome`, `efficiency`, `control` and `trust` fields.
 *
 * @param {string} cwd - Passed through unchanged to readAllMetrics.
 * @param {{days?: number|string}} [options] - `days` is the look-back window.
 *   Missing, non-numeric, zero or negative values fall back to 7. `null` is
 *   accepted and treated like an empty options object.
 * @returns {object} `period_days`, `total_sessions` and one entry per metric id
 *   (definition fields plus `value` and metric-specific counters). When no
 *   session falls inside the window the emptyMetrics() placeholder is returned
 *   with `period_days` set to the requested window.
 */
function computeProofMetrics(cwd, options = {}) {
  const DEFAULT_DAYS = 7;
  // `options?.` keeps an explicit null from throwing; invalid windows would
  // otherwise produce a NaN/future cutoff that silently filters out everything.
  const requestedDays = Number(options?.days);
  const days =
    Number.isFinite(requestedDays) && requestedDays > 0 ? requestedDays : DEFAULT_DAYS;
  const cutoff = Date.now() - days * 24 * 60 * 60 * 1000;

  const recent = readAllMetrics(cwd).filter((metric) => {
    const ts = Date.parse(metric.ts || 0);
    return Number.isFinite(ts) && ts >= cutoff;
  });

  const bySession = new Map();
  for (const metric of recent) {
    const id = metric.sessionId || "unknown";
    if (!bySession.has(id)) bySession.set(id, []);
    bySession.get(id).push(metric);
  }

  const totalSessions = bySession.size;
  // Report the window that was actually queried instead of the placeholder 0.
  if (totalSessions === 0) return { ...emptyMetrics(), period_days: days };

  let completedSessions = 0;
  let safeStopSessions = 0;
  let evidenceBackedSessions = 0;
  let deadEndSessions = 0;
  let blockedSessions = 0;
  let blockedThenCompletedSessions = 0;
  let evidenceSessions = 0;
  let totalRetries = 0;
  let totalLargeOutputBytes = 0;
  let totalLargeOutputEvents = 0;
  let totalScanSkips = 0;
  let totalPermFatigueConsolidated = 0;
  let totalRiskyBlocked = 0;
  const ttfrValues = [];

  for (const [sessionId, sessionMetrics] of bySession) {
    const record = composeProofRecord(sessionId, sessionMetrics, []);
    const status = record.completion_status;
    const retries = record.efficiency?.retries_count || 0;

    if (status === "completed") completedSessions++;
    if (status === "safe_stop") safeStopSessions++;
    if (record.outcome?.evidence_backed_completion) evidenceBackedSessions++;
    // A dead end is a session that stopped without completing and without a
    // bounded next action to continue from.
    if (status === "ended_without_completion" && !record.outcome?.next_bounded_action) {
      deadEndSessions++;
    }
    // Sessions with at least one retry form the denominator of the recovery rate.
    if (retries > 0) {
      blockedSessions++;
      if (status === "completed") blockedThenCompletedSessions++;
    }
    if (record.trust?.has_related_evidence) evidenceSessions++;

    totalRetries += retries;
    totalLargeOutputBytes += record.efficiency?.large_output_bytes_managed || 0;
    totalLargeOutputEvents += record.efficiency?.large_output_events || 0;
    totalScanSkips += record.efficiency?.tools_skipped || 0;
    totalPermFatigueConsolidated += record.control?.approval_requests_avoided || 0;
    totalRiskyBlocked +=
      (record.control?.risky_actions_blocked || 0) +
      (record.control?.risky_actions_downgraded || 0);

    // Single pass for both the session start and the earliest TASK_COMPLETED.
    // A running minimum avoids Math.min(...array), which throws RangeError once
    // a session holds more events than the engine allows as call arguments, and
    // comparing timestamps (not array position) keeps the result independent of
    // the order in which events were stored.
    let startTs = Infinity;
    let firstCompletionTs = Infinity;
    for (const metric of sessionMetrics) {
      const ts = Date.parse(metric.ts || 0);
      if (!Number.isFinite(ts)) continue;
      if (ts < startTs) startTs = ts;
      if (ts < firstCompletionTs && (metric.reasonCodes || []).includes("TASK_COMPLETED")) {
        firstCompletionTs = ts;
      }
    }
    if (Number.isFinite(firstCompletionTs) && firstCompletionTs > startTs) {
      ttfrValues.push(Math.round((firstCompletionTs - startTs) / 1000));
    }
  }

  const completedOrStopped = completedSessions + safeStopSessions;
  const retriesPerTask = Math.round((totalRetries / totalSessions) * 100) / 100;
  const medianTtfr = ttfrValues.length > 0 ? median(ttfrValues) : null;

  return {
    period_days: days,
    total_sessions: totalSessions,
    time_to_first_useful_result: {
      ...METRIC_DEFINITIONS.time_to_first_useful_result,
      value: medianTtfr,
      sample_size: ttfrValues.length,
      confidence: ttfrValues.length >= 5 ? "medium" : "low",
    },
    completion_rate: {
      ...METRIC_DEFINITIONS.completion_rate,
      value: toPercent(completedOrStopped, totalSessions),
      numerator: completedOrStopped,
      denominator: totalSessions,
    },
    evidence_backed_completion_rate: {
      ...METRIC_DEFINITIONS.evidence_backed_completion_rate,
      value: toPercent(evidenceBackedSessions, completedSessions),
      numerator: evidenceBackedSessions,
      denominator: completedSessions,
    },
    retries_per_task: {
      ...METRIC_DEFINITIONS.retries_per_task,
      value: retriesPerTask,
      total_retries: totalRetries,
      sessions: totalSessions,
    },
    dead_end_rate: {
      ...METRIC_DEFINITIONS.dead_end_rate,
      value: toPercent(deadEndSessions, totalSessions),
      numerator: deadEndSessions,
      denominator: totalSessions,
    },
    large_outputs_managed: {
      ...METRIC_DEFINITIONS.large_outputs_managed,
      value: totalLargeOutputEvents,
      total_bytes: totalLargeOutputBytes,
    },
    unnecessary_tool_load_avoided: {
      ...METRIC_DEFINITIONS.unnecessary_tool_load_avoided,
      value: totalScanSkips,
    },
    approval_interruptions_avoided: {
      ...METRIC_DEFINITIONS.approval_interruptions_avoided,
      value: totalPermFatigueConsolidated,
    },
    risky_actions_blocked_or_downgraded: {
      ...METRIC_DEFINITIONS.risky_actions_blocked_or_downgraded,
      value: totalRiskyBlocked,
    },
    honest_fallback_rate: {
      ...METRIC_DEFINITIONS.honest_fallback_rate,
      value: toPercent(safeStopSessions, totalSessions),
      numerator: safeStopSessions,
      denominator: totalSessions,
    },
    recovery_success_rate: {
      ...METRIC_DEFINITIONS.recovery_success_rate,
      value: toPercent(blockedThenCompletedSessions, blockedSessions),
      numerator: blockedThenCompletedSessions,
      denominator: blockedSessions,
      confidence: blockedSessions >= 3 ? "medium" : "low",
    },
    evidence_coverage: {
      ...METRIC_DEFINITIONS.evidence_coverage,
      value: toPercent(evidenceSessions, totalSessions),
      numerator: evidenceSessions,
      denominator: totalSessions,
    },
  };
}
272
-
273
/**
 * Placeholder result used when there is nothing to aggregate.
 *
 * Starts from `{ period_days: 0, total_sessions: 0 }` and adds one entry per
 * METRIC_DEFINITIONS key: the definition's own fields plus a `value` that is 0
 * for "percent" and "count" units and null for any other unit.
 *
 * @returns {object} The placeholder metrics object.
 */
function emptyMetrics() {
  const zeroValuedUnits = ["percent", "count"];
  return Object.entries(METRIC_DEFINITIONS).reduce(
    (placeholder, [metricId, definition]) => {
      placeholder[metricId] = {
        ...definition,
        value: zeroValuedUnits.includes(definition.unit) ? 0 : null,
      };
      return placeholder;
    },
    { period_days: 0, total_sessions: 0 }
  );
}
283
-
284
/**
 * Median of a list of numbers, rounded to an integer for even-length input.
 *
 * The input is copied before sorting, so the caller's array is left untouched.
 *
 * @param {number[]} arr - Values to summarise.
 * @returns {number} 0 for an empty list, the middle element for an odd length,
 *   otherwise Math.round of the mean of the two middle elements.
 */
function median(arr) {
  const count = arr.length;
  if (!count) return 0;

  const ordered = arr.slice();
  ordered.sort((left, right) => left - right);

  const upperMiddle = Math.floor(ordered.length / 2);
  if (ordered.length % 2) {
    return ordered[upperMiddle];
  }
  const pairSum = ordered[upperMiddle - 1] + ordered[upperMiddle];
  return Math.round(pairSum / 2);
}
292
-
293
- module.exports = {
294
- METRIC_DEFINITIONS,
295
- computeProofMetrics,
296
- };
@@ -1,134 +0,0 @@
1
- "use strict";
2
-
3
- const fs = require("fs");
4
- const path = require("path");
5
- const { nowIso } = require("./fsx");
6
-
7
// Contract identifier stamped on every object returned by buildProofOutcomeEvidence().
const CONTRACT = "avorelo.proofOutcomeEvidence.v1";
// Schema version emitted next to the contract identifier.
const SCHEMA_VERSION = 1;
// Directory holding the artifacts below; always joined onto a caller-supplied cwd.
const PROOF_OUTCOME_DIR_REL = ".claude/cco/orchestration/seamless-outcome";
// Output artifact: written by writeProofOutcomeEvidence(), re-read by
// buildProofOutcomeEvidenceSurface().
const ARTIFACT_REL = `${PROOF_OUTCOME_DIR_REL}/latest-proof-outcome-evidence.json`;
// Input artifacts read by buildProofOutcomeEvidence().
const VALUE_SUMMARY_REL = `${PROOF_OUTCOME_DIR_REL}/latest-value-summary.json`;
const REALITY_GATE_REL = `${PROOF_OUTCOME_DIR_REL}/latest-reality-gate.json`;
13
-
14
/**
 * Best-effort JSON file reader.
 *
 * @param {string} absPath - File to read.
 * @returns {*} The parsed JSON value (a leading UTF-8 BOM is stripped before
 *   parsing), or null when the file does not exist, cannot be read, or does not
 *   contain valid JSON. Never throws.
 */
function safeReadJson(absPath) {
  let parsed = null;
  try {
    if (fs.existsSync(absPath)) {
      const rawText = fs.readFileSync(absPath, "utf8");
      const withoutBom = rawText.replace(/^\uFEFF/, "");
      parsed = JSON.parse(withoutBom);
    }
  } catch {
    // Deliberate: callers treat an unreadable artifact the same as a missing one.
    parsed = null;
  }
  return parsed;
}
22
-
23
/**
 * True only for JSON objects (non-null, non-array values of type "object").
 */
function isJsonRecord(value) {
  return value !== null && typeof value === "object" && !Array.isArray(value);
}

/**
 * Builds the proof-outcome evidence object from the two artifacts stored under
 * `cwd`: the value summary (VALUE_SUMMARY_REL) and the reality gate
 * (REALITY_GATE_REL).
 *
 * An artifact only counts when it parses to a JSON object. Other JSON values
 * (arrays, strings, numbers, booleans) carry none of the fields inspected here
 * and are treated exactly like a missing file, so a stray `[]` or `"x"` can no
 * longer be reported as an evidence-backed real-task proof.
 *
 * Resulting fields:
 *   - status: "pass" only when the value summary is evidence-backed, is not
 *     marked `simulated: true`, and a reality gate artifact exists; otherwise
 *     "warn".
 *   - proofQuality: "missing", "evidence_backed", "present_but_unverified" or
 *     "simulated_fixture_only".
 *   - evidenceBacked is assumed unless the summary sets `evidenceBacked: false`.
 *
 * @param {string} cwd - Directory the artifact paths are joined onto.
 * @returns {object} Evidence object carrying CONTRACT / SCHEMA_VERSION, a
 *   nowIso() timestamp, the derived flags, artifact references, and the
 *   `missingEvidence` / `safeNextActions` message lists.
 */
function buildProofOutcomeEvidence(cwd) {
  const rawValueSummary = safeReadJson(path.join(cwd, VALUE_SUMMARY_REL));
  const rawRealityGate = safeReadJson(path.join(cwd, REALITY_GATE_REL));
  const valueSummary = isJsonRecord(rawValueSummary) ? rawValueSummary : null;
  const realityGate = isJsonRecord(rawRealityGate) ? rawRealityGate : null;

  const latestProofAvailable = valueSummary !== null;
  const simulatedProofDetected = latestProofAvailable && valueSummary.simulated === true;
  const realTaskProofCount = latestProofAvailable && !simulatedProofDetected ? 1 : 0;
  // Lenient by design: only an explicit `false` marks the summary as unverified.
  const evidenceBacked = latestProofAvailable && valueSummary.evidenceBacked !== false;

  let status = "warn";
  let proofQuality = "missing";
  const missingEvidence = [];
  const safeNextActions = [];

  if (!latestProofAvailable) {
    missingEvidence.push("No proof/value summary artifact is available from a completed real task.");
    safeNextActions.push("Run a bounded real task in this repo.");
    safeNextActions.push("Run: node bin/avorelo proof");
    safeNextActions.push("Run: node bin/avorelo full-readiness --json");
  } else {
    proofQuality = evidenceBacked ? "evidence_backed" : "present_but_unverified";
    // A simulated artifact overrides whatever quality was derived above.
    if (simulatedProofDetected) {
      proofQuality = "simulated_fixture_only";
      missingEvidence.push("Latest proof artifact is marked simulated and does not count as real task evidence.");
    }
    if (!evidenceBacked) {
      missingEvidence.push("Latest proof/value summary is present but not marked evidence-backed.");
    }
    if (!realityGate) {
      missingEvidence.push("No reality gate artifact is available alongside the latest proof summary.");
      safeNextActions.push("Run: node bin/avorelo outcome --gate --json");
    }
    if (evidenceBacked && realityGate && !simulatedProofDetected) {
      status = "pass";
    }
  }

  // Always leave the caller with at least one suggested next step.
  if (safeNextActions.length === 0) {
    safeNextActions.push("Run: node bin/avorelo full-readiness --json");
  }

  return {
    contract: CONTRACT,
    schemaVersion: SCHEMA_VERSION,
    createdAt: nowIso(),
    status,
    latestProofAvailable,
    realTaskProofCount,
    simulatedProofDetected,
    proofQuality,
    evidenceRefs: {
      valueSummary: latestProofAvailable ? VALUE_SUMMARY_REL : null,
      realityGate: realityGate ? REALITY_GATE_REL : null,
    },
    missingEvidence,
    safeNextActions,
    redacted: true,
  };
}
82
-
83
/**
 * Persists an evidence object as pretty-printed JSON (2-space indent, UTF-8).
 *
 * The PROOF_OUTCOME_DIR_REL directory under `cwd` is created first, including
 * any missing parents, then the ARTIFACT_REL file is written.
 *
 * @param {string} cwd - Directory the artifact path is joined onto.
 * @param {object} evidence - Value to serialise.
 * @returns {string} Path of the written file (`cwd` joined with ARTIFACT_REL).
 */
function writeProofOutcomeEvidence(cwd, evidence) {
  const outputDir = path.join(cwd, PROOF_OUTCOME_DIR_REL);
  fs.mkdirSync(outputDir, { recursive: true });

  const artifactAbs = path.join(cwd, ARTIFACT_REL);
  const serialized = JSON.stringify(evidence, null, 2);
  fs.writeFileSync(artifactAbs, serialized, "utf8");

  return path.join(cwd, ARTIFACT_REL);
}
89
-
90
/**
 * Returns the compact summary of the proof-outcome evidence for `cwd`.
 *
 * An artifact already stored at ARTIFACT_REL is used as-is. Only when none can
 * be read is a fresh one built with buildProofOutcomeEvidence() and persisted
 * with writeProofOutcomeEvidence().
 *
 * @param {string} cwd - Directory the artifact path is joined onto.
 * @returns {{status: *, latestProofAvailable: *, realTaskProofCount: *,
 *   proofQuality: *, artifactPath: string, redacted: boolean}} The four fields
 *   copied from the evidence, plus the relative artifact path and
 *   `redacted: true`.
 */
function buildProofOutcomeEvidenceSurface(cwd) {
  let evidence = safeReadJson(path.join(cwd, ARTIFACT_REL));
  if (!evidence) {
    evidence = buildProofOutcomeEvidence(cwd);
    writeProofOutcomeEvidence(cwd, evidence);
  }

  const { status, latestProofAvailable, realTaskProofCount, proofQuality } = evidence;
  return {
    status,
    latestProofAvailable,
    realTaskProofCount,
    proofQuality,
    artifactPath: ARTIFACT_REL,
    redacted: true,
  };
}
103
-
104
/**
 * Renders an evidence object as newline-joined plain text.
 *
 * Four header lines are always produced (status, availability, real-task proof
 * count, proof quality). A "Missing evidence:" section with at most five items
 * and a "Next:" section with at most three items follow, each preceded by a
 * blank line and emitted only when its list is a non-empty array.
 *
 * @param {object} evidence - Evidence object to render.
 * @returns {string} The formatted text.
 */
function formatProofOutcomeEvidenceText(evidence) {
  const availability = evidence.latestProofAvailable === true ? "yes" : "no";
  const output = [
    `Proof outcome evidence: ${evidence.status}`,
    `Latest proof available: ${availability}`,
    `Real task proof count: ${evidence.realTaskProofCount || 0}`,
    `Proof quality: ${evidence.proofQuality || "missing"}`,
  ];

  // Appends a blank line, the heading, and up to `limit` bullet lines.
  const appendSection = (heading, items, limit) => {
    if (!Array.isArray(items) || items.length === 0) return;
    output.push("", heading);
    for (const item of items.slice(0, limit)) {
      output.push(` - ${item}`);
    }
  };

  appendSection("Missing evidence:", evidence.missingEvidence, 5);
  appendSection("Next:", evidence.safeNextActions, 3);

  return output.join("\n");
}
123
-
124
- module.exports = {
125
- CONTRACT,
126
- SCHEMA_VERSION,
127
- ARTIFACT_REL,
128
- VALUE_SUMMARY_REL,
129
- REALITY_GATE_REL,
130
- buildProofOutcomeEvidence,
131
- writeProofOutcomeEvidence,
132
- buildProofOutcomeEvidenceSurface,
133
- formatProofOutcomeEvidenceText,
134
- };