thumbgate 1.4.2 → 1.4.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (279) hide show
  1. package/.claude-plugin/README.md +45 -34
  2. package/.claude-plugin/marketplace.json +3 -3
  3. package/.claude-plugin/plugin.json +3 -3
  4. package/.well-known/llms.txt +1 -1
  5. package/.well-known/mcp/server-card.json +1 -1
  6. package/README.md +26 -2
  7. package/adapters/README.md +4 -1
  8. package/adapters/claude/.mcp.json +2 -2
  9. package/adapters/codex/config.toml +2 -2
  10. package/adapters/mcp/server-stdio.js +10 -4
  11. package/adapters/opencode/opencode.json +1 -1
  12. package/bin/cli.js +246 -90
  13. package/config/mcp-allowlists.json +11 -3
  14. package/package.json +184 -21
  15. package/scripts/audit-trail.js +25 -15
  16. package/scripts/auto-wire-hooks.js +127 -0
  17. package/scripts/cli-demo.js +102 -0
  18. package/scripts/cli-schema.js +285 -0
  19. package/scripts/cli-status.js +166 -0
  20. package/scripts/cross-encoder-reranker.js +235 -0
  21. package/scripts/explore-subcommands.js +277 -0
  22. package/scripts/explore.js +569 -0
  23. package/scripts/feedback-loop.js +20 -6
  24. package/scripts/lesson-inference.js +7 -1
  25. package/scripts/lesson-reranker.js +263 -0
  26. package/scripts/lesson-retrieval.js +34 -17
  27. package/scripts/lesson-search.js +69 -0
  28. package/scripts/perplexity-client.js +210 -0
  29. package/scripts/reflector-agent.js +2 -2
  30. package/scripts/statusline-local-stats.js +3 -1
  31. package/scripts/statusline.sh +12 -11
  32. package/src/api/server.js +178 -17
  33. package/src/index.js +3 -0
  34. package/.claude-plugin/bundle/icon.png +0 -0
  35. package/.claude-plugin/bundle/icon.svg +0 -18
  36. package/.claude-plugin/bundle/server/index.js +0 -24
  37. package/adapters/chatgpt/INSTALL.md +0 -138
  38. package/bin/memory.sh +0 -64
  39. package/bin/obsidian-sync.sh +0 -20
  40. package/plugins/amp-skill/INSTALL.md +0 -52
  41. package/plugins/amp-skill/SKILL.md +0 -64
  42. package/plugins/claude-codex-bridge/.claude-plugin/plugin.json +0 -22
  43. package/plugins/claude-codex-bridge/.mcp.json +0 -14
  44. package/plugins/claude-codex-bridge/INSTALL.md +0 -43
  45. package/plugins/claude-codex-bridge/README.md +0 -46
  46. package/plugins/claude-codex-bridge/scripts/codex-bridge.js +0 -286
  47. package/plugins/claude-codex-bridge/skills/adversarial-review/SKILL.md +0 -24
  48. package/plugins/claude-codex-bridge/skills/result/SKILL.md +0 -22
  49. package/plugins/claude-codex-bridge/skills/review/SKILL.md +0 -28
  50. package/plugins/claude-codex-bridge/skills/second-pass/SKILL.md +0 -27
  51. package/plugins/claude-codex-bridge/skills/setup/SKILL.md +0 -21
  52. package/plugins/claude-codex-bridge/skills/status/SKILL.md +0 -19
  53. package/plugins/claude-skill/INSTALL.md +0 -55
  54. package/plugins/claude-skill/SKILL.md +0 -46
  55. package/plugins/codex-profile/.codex-plugin/plugin.json +0 -43
  56. package/plugins/codex-profile/.mcp.json +0 -14
  57. package/plugins/codex-profile/AGENTS.md +0 -20
  58. package/plugins/codex-profile/INSTALL.md +0 -89
  59. package/plugins/codex-profile/README.md +0 -61
  60. package/plugins/cursor-marketplace/.cursor-plugin/plugin.json +0 -23
  61. package/plugins/cursor-marketplace/CHANGELOG.md +0 -30
  62. package/plugins/cursor-marketplace/LICENSE +0 -21
  63. package/plugins/cursor-marketplace/README.md +0 -124
  64. package/plugins/cursor-marketplace/agents/reliability-reviewer.md +0 -31
  65. package/plugins/cursor-marketplace/assets/logo-400x400.png +0 -0
  66. package/plugins/cursor-marketplace/commands/capture-feedback.md +0 -33
  67. package/plugins/cursor-marketplace/commands/check-gates.md +0 -25
  68. package/plugins/cursor-marketplace/commands/show-lessons.md +0 -27
  69. package/plugins/cursor-marketplace/hooks/hooks.json +0 -10
  70. package/plugins/cursor-marketplace/mcp.json +0 -14
  71. package/plugins/cursor-marketplace/rules/feedback-capture.mdc +0 -34
  72. package/plugins/cursor-marketplace/rules/pre-action-gates.mdc +0 -30
  73. package/plugins/cursor-marketplace/rules/session-continuity.mdc +0 -28
  74. package/plugins/cursor-marketplace/scripts/gate-check.sh +0 -21
  75. package/plugins/cursor-marketplace/skills/capture-feedback/SKILL.md +0 -48
  76. package/plugins/cursor-marketplace/skills/prevention-rules/SKILL.md +0 -31
  77. package/plugins/cursor-marketplace/skills/recall-context/SKILL.md +0 -30
  78. package/plugins/cursor-marketplace/skills/search-lessons/SKILL.md +0 -33
  79. package/plugins/gemini-extension/INSTALL.md +0 -92
  80. package/plugins/gemini-extension/gemini_prompt.txt +0 -14
  81. package/plugins/gemini-extension/tool_contract.json +0 -45
  82. package/plugins/opencode-profile/INSTALL.md +0 -57
  83. package/public/assets/instagram-card.png +0 -0
  84. package/public/assets/tiktok-agent-memory.mp4 +0 -0
  85. package/public/blog.html +0 -474
  86. package/public/compare/mem0.html +0 -189
  87. package/public/compare/speclock.html +0 -180
  88. package/public/compare.html +0 -310
  89. package/public/dashboard.html +0 -1100
  90. package/public/guide.html +0 -317
  91. package/public/guides/claude-code-prevent-repeated-mistakes.html +0 -161
  92. package/public/guides/codex-cli-guardrails.html +0 -158
  93. package/public/guides/cursor-prevent-repeated-mistakes.html +0 -161
  94. package/public/guides/pre-action-gates.html +0 -162
  95. package/public/guides/stop-repeated-ai-agent-mistakes.html +0 -159
  96. package/public/index.html +0 -1128
  97. package/public/js/buyer-intent.js +0 -252
  98. package/public/learn/agent-harness-pattern.html +0 -180
  99. package/public/learn/ai-agent-persistent-memory.html +0 -203
  100. package/public/learn/learn.css +0 -45
  101. package/public/learn/mcp-pre-action-gates-explained.html +0 -172
  102. package/public/learn/stop-ai-agent-force-push.html +0 -134
  103. package/public/learn/vibe-coding-safety-net.html +0 -142
  104. package/public/learn.html +0 -274
  105. package/public/lessons.html +0 -967
  106. package/public/llm-context.md +0 -140
  107. package/public/pro.html +0 -1087
  108. package/public/vercel.json +0 -8
  109. package/scripts/a2ui-engine.js +0 -73
  110. package/scripts/adk-consolidator.js +0 -274
  111. package/scripts/agent-security-hardening.js +0 -225
  112. package/scripts/ai-search-visibility.js +0 -142
  113. package/scripts/autonomous-sales-agent.js +0 -39
  114. package/scripts/autoresearch-runner.js +0 -216
  115. package/scripts/background-agent-governance.js +0 -229
  116. package/scripts/behavioral-extraction.js +0 -93
  117. package/scripts/budget-enforcer.js +0 -173
  118. package/scripts/budget-guard.js +0 -173
  119. package/scripts/build-claude-mcpb.js +0 -255
  120. package/scripts/build-codex-plugin.js +0 -152
  121. package/scripts/capture-railway-diagnostics.sh +0 -97
  122. package/scripts/changeset-check.js +0 -372
  123. package/scripts/check-congruence.js +0 -443
  124. package/scripts/computer-use-firewall.js +0 -280
  125. package/scripts/content-engine/linkedin-content-generator.js +0 -154
  126. package/scripts/content-engine/output/linkedin-memento-validation.md +0 -17
  127. package/scripts/content-engine/output/linkedin-posts-2026-04-09.md +0 -175
  128. package/scripts/content-engine/reddit-thread-finder.js +0 -154
  129. package/scripts/context-engine.js +0 -710
  130. package/scripts/daily-digest.js +0 -11
  131. package/scripts/data-governance.js +0 -173
  132. package/scripts/deploy-gcp.sh +0 -44
  133. package/scripts/deploy-policy.js +0 -249
  134. package/scripts/disagreement-mining.js +0 -315
  135. package/scripts/dpo-optimizer.js +0 -206
  136. package/scripts/ensure-repo-bootstrap.js +0 -130
  137. package/scripts/ephemeral-agent-store.js +0 -212
  138. package/scripts/eval-harness.js +0 -56
  139. package/scripts/export-kto-pairs.js +0 -309
  140. package/scripts/export-training.js +0 -446
  141. package/scripts/feedback-fallback.js +0 -111
  142. package/scripts/feedback-inbox-read.js +0 -162
  143. package/scripts/feedback-root-consolidator.js +0 -233
  144. package/scripts/feedback-to-memory.js +0 -185
  145. package/scripts/gate-satisfy.js +0 -42
  146. package/scripts/generate-paperbanana-diagrams.sh +0 -99
  147. package/scripts/generate-pretool-hook.sh +0 -40
  148. package/scripts/github-about.js +0 -430
  149. package/scripts/github-outreach.js +0 -65
  150. package/scripts/gtm-revenue-loop.js +0 -535
  151. package/scripts/hallucination-detector.js +0 -226
  152. package/scripts/hf-papers.js +0 -317
  153. package/scripts/hook-auto-capture.sh +0 -100
  154. package/scripts/hook-stop-pr-thread-check.sh +0 -68
  155. package/scripts/hook-stop-self-score.sh +0 -51
  156. package/scripts/hook-stop-verify-deploy.sh +0 -31
  157. package/scripts/hook-verify-before-done.sh +0 -20
  158. package/scripts/managed-dpo-export.js +0 -91
  159. package/scripts/markdown-escape.js +0 -12
  160. package/scripts/marketing-experiment.js +0 -657
  161. package/scripts/memalign-recall.js +0 -111
  162. package/scripts/memory-migration.js +0 -296
  163. package/scripts/meta-policy.js +0 -190
  164. package/scripts/metered-billing.js +0 -16
  165. package/scripts/model-tier-router.js +0 -310
  166. package/scripts/money-watcher.js +0 -218
  167. package/scripts/multi-hop-recall.js +0 -240
  168. package/scripts/per-step-scoring.js +0 -163
  169. package/scripts/perplexity-marketing.js +0 -466
  170. package/scripts/pii-scanner.js +0 -153
  171. package/scripts/plan-gate.js +0 -154
  172. package/scripts/post-everywhere.js +0 -341
  173. package/scripts/post-to-x-retry.sh +0 -22
  174. package/scripts/post-to-x.js +0 -369
  175. package/scripts/pr-manager.js +0 -421
  176. package/scripts/principle-extractor.js +0 -162
  177. package/scripts/pro-features.js +0 -41
  178. package/scripts/prompt-dlp.js +0 -222
  179. package/scripts/prove-adapters.js +0 -860
  180. package/scripts/prove-attribution.js +0 -361
  181. package/scripts/prove-automation.js +0 -651
  182. package/scripts/prove-autoresearch.js +0 -304
  183. package/scripts/prove-claim-verification.js +0 -277
  184. package/scripts/prove-cloudflare-sandbox.js +0 -161
  185. package/scripts/prove-data-pipeline.js +0 -408
  186. package/scripts/prove-data-quality.js +0 -227
  187. package/scripts/prove-evolution.js +0 -352
  188. package/scripts/prove-harnesses.js +0 -287
  189. package/scripts/prove-intelligence.js +0 -257
  190. package/scripts/prove-lancedb.js +0 -425
  191. package/scripts/prove-local-intelligence.js +0 -340
  192. package/scripts/prove-loop-closure.js +0 -263
  193. package/scripts/prove-packaged-runtime.js +0 -326
  194. package/scripts/prove-predictive-insights.js +0 -355
  195. package/scripts/prove-runtime.js +0 -363
  196. package/scripts/prove-seo-gsd.js +0 -234
  197. package/scripts/prove-settings.js +0 -279
  198. package/scripts/prove-subway-upgrades.js +0 -277
  199. package/scripts/prove-tessl.js +0 -229
  200. package/scripts/prove-training-export.js +0 -325
  201. package/scripts/prove-workflow-contract.js +0 -112
  202. package/scripts/prove-xmemory.js +0 -332
  203. package/scripts/publish-decision.js +0 -159
  204. package/scripts/ralph-loop.js +0 -376
  205. package/scripts/ralph-mode-ci.js +0 -331
  206. package/scripts/reddit-dm-outreach.js +0 -192
  207. package/scripts/reddit-monitor-cron.sh +0 -26
  208. package/scripts/reminder-engine.js +0 -132
  209. package/scripts/revenue-status.js +0 -472
  210. package/scripts/rotate-stripe-webhook-secret.js +0 -314
  211. package/scripts/schedule-manager.js +0 -249
  212. package/scripts/self-healing-check.js +0 -193
  213. package/scripts/shieldcortex-memory-firewall-runner.mjs +0 -53
  214. package/scripts/skill-exporter.js +0 -260
  215. package/scripts/skill-materializer.js +0 -134
  216. package/scripts/skill-packs.js +0 -136
  217. package/scripts/skill-proposer.js +0 -99
  218. package/scripts/skill-quality-tracker.js +0 -282
  219. package/scripts/slow-loop.js +0 -72
  220. package/scripts/social-analytics/db/analytics.sqlite +0 -0
  221. package/scripts/social-analytics/db/schema.sql +0 -32
  222. package/scripts/social-analytics/digest.js +0 -256
  223. package/scripts/social-analytics/engagement-audit.js +0 -185
  224. package/scripts/social-analytics/generate-instagram-card.js +0 -97
  225. package/scripts/social-analytics/instagram-thumbgate-post.js +0 -111
  226. package/scripts/social-analytics/install-growth-automation.js +0 -114
  227. package/scripts/social-analytics/load-env.js +0 -77
  228. package/scripts/social-analytics/mcp-server.js +0 -289
  229. package/scripts/social-analytics/normalizer.js +0 -580
  230. package/scripts/social-analytics/notify.js +0 -162
  231. package/scripts/social-analytics/poll-all.js +0 -107
  232. package/scripts/social-analytics/pollers/github.js +0 -195
  233. package/scripts/social-analytics/pollers/instagram.js +0 -253
  234. package/scripts/social-analytics/pollers/linkedin.js +0 -340
  235. package/scripts/social-analytics/pollers/plausible.js +0 -245
  236. package/scripts/social-analytics/pollers/reddit.js +0 -306
  237. package/scripts/social-analytics/pollers/threads.js +0 -233
  238. package/scripts/social-analytics/pollers/tiktok.js +0 -203
  239. package/scripts/social-analytics/pollers/x.js +0 -227
  240. package/scripts/social-analytics/pollers/youtube.js +0 -304
  241. package/scripts/social-analytics/pollers/zernio.js +0 -183
  242. package/scripts/social-analytics/publish-instagram-thumbgate.js +0 -104
  243. package/scripts/social-analytics/publish-thumbgate-launch.js +0 -322
  244. package/scripts/social-analytics/publishers/devto.js +0 -122
  245. package/scripts/social-analytics/publishers/instagram.js +0 -317
  246. package/scripts/social-analytics/publishers/linkedin.js +0 -294
  247. package/scripts/social-analytics/publishers/reddit.js +0 -385
  248. package/scripts/social-analytics/publishers/threads.js +0 -275
  249. package/scripts/social-analytics/publishers/tiktok.js +0 -217
  250. package/scripts/social-analytics/publishers/x.js +0 -259
  251. package/scripts/social-analytics/publishers/youtube.js +0 -223
  252. package/scripts/social-analytics/publishers/zernio.js +0 -539
  253. package/scripts/social-analytics/reconcile-thumbgate-campaign.js +0 -165
  254. package/scripts/social-analytics/run-digest.js +0 -34
  255. package/scripts/social-analytics/schedule-thumbgate-campaign.js +0 -275
  256. package/scripts/social-analytics/store.js +0 -455
  257. package/scripts/social-analytics/sync-launch-assets.js +0 -185
  258. package/scripts/social-analytics/utm.js +0 -143
  259. package/scripts/social-pipeline.js +0 -2626
  260. package/scripts/social-post-hourly.js +0 -228
  261. package/scripts/social-quality-gate.js +0 -134
  262. package/scripts/social-reply-monitor.js +0 -592
  263. package/scripts/status-dashboard.js +0 -155
  264. package/scripts/stripe-live-status.js +0 -115
  265. package/scripts/subagent-profiles.js +0 -79
  266. package/scripts/sync-branch-protection.js +0 -340
  267. package/scripts/sync-gh-secrets-from-env.sh +0 -70
  268. package/scripts/sync-github-about.js +0 -55
  269. package/scripts/sync-version.js +0 -479
  270. package/scripts/synthetic-dpo.js +0 -234
  271. package/scripts/tessl-export.js +0 -369
  272. package/scripts/test-coverage.js +0 -128
  273. package/scripts/thumbgate_session_start.sh +0 -32
  274. package/scripts/train_from_feedback.py +0 -929
  275. package/scripts/validate-feedback.js +0 -581
  276. package/scripts/verify-obsidian-setup.sh +0 -269
  277. package/scripts/verify-run.js +0 -269
  278. package/scripts/weekly-auto-post.js +0 -124
  279. package/scripts/x-autonomous-marketing.js +0 -139
@@ -1,227 +0,0 @@
1
- 'use strict';
2
- /**
3
- * Phase 7: Data Quality — Proof Gate
4
- *
5
- * Validates all QUAL-01 through QUAL-04 requirements offline.
6
- * Mirrors the pattern of prove-attribution.js (mkdtempSync + env override + execSync).
7
- *
8
- * Usage:
9
- * node scripts/prove-data-quality.js
10
- *
11
- * Produces:
12
- * proof/data-quality-report.json
13
- * proof/data-quality-report.md
14
- */
15
-
16
- const { execSync } = require('child_process');
17
- const fs = require('fs');
18
- const os = require('os');
19
- const path = require('path');
20
-
21
- const ROOT = path.join(__dirname, '..');
22
-
23
- function resolveProofPaths() {
24
- const proofDir = process.env.THUMBGATE_PROOF_DIR || path.join(ROOT, 'proof');
25
- return {
26
- proofDir,
27
- reportJson: path.join(proofDir, 'data-quality-report.json'),
28
- reportMd: path.join(proofDir, 'data-quality-report.md'),
29
- };
30
- }
31
-
32
- function run() {
33
- const tmpDir = fs.mkdtempSync(path.join(os.tmpdir(), 'thumbgate-qual-proof-'));
34
- const results = { passed: 0, failed: 0, requirements: {} };
35
- const { proofDir, reportJson, reportMd } = resolveProofPaths();
36
-
37
- const checks = [
38
- {
39
- id: 'QUAL-01',
40
- desc: 'validate-feedback.js exports validateEntry with 4-level pipeline',
41
- fn: () => {
42
- delete require.cache[require.resolve('./validate-feedback')];
43
- const v = require('./validate-feedback');
44
- if (typeof v.validateEntry !== 'function') throw new Error('validateEntry not exported');
45
- if (typeof v.validateSchema !== 'function') throw new Error('validateSchema not exported');
46
- if (typeof v.validateSemantics !== 'function') throw new Error('validateSemantics not exported');
47
- if (typeof v.detectAnomalies !== 'function') throw new Error('detectAnomalies not exported');
48
- if (typeof v.generateCorrections !== 'function') throw new Error('generateCorrections not exported');
49
-
50
- // Verify semantic inconsistency is caught
51
- const r = v.validateEntry({
52
- id: 'proof-x',
53
- timestamp: new Date().toISOString(),
54
- signal: 'positive',
55
- reward: -1,
56
- context: 'good work done',
57
- });
58
- if (r.valid) throw new Error('Expected invalid for positive+negative-reward');
59
- if (!r.corrections.length) throw new Error('Expected auto-correction for reward');
60
- if (r.correctedEntry.reward !== 1) throw new Error('Expected corrected reward=1');
61
-
62
- // Verify sensitive data detection
63
- const r2 = v.validateEntry({
64
- id: 'proof-y',
65
- timestamp: new Date().toISOString(),
66
- signal: 'positive',
67
- reward: 1,
68
- context: 'api_key=abc123 was in the response',
69
- });
70
- if (!r2.issues.some((i) => i.type === 'security')) {
71
- throw new Error('Expected security issue for api_key pattern');
72
- }
73
- },
74
- },
75
- {
76
- id: 'QUAL-02',
77
- desc: 'captureFeedback produces richContext with domain, filePaths, errorType, outcomeCategory',
78
- fn: () => {
79
- process.env.THUMBGATE_FEEDBACK_DIR = tmpDir;
80
- // Clear module cache so env var takes effect
81
- [
82
- './feedback-loop',
83
- './feedback-attribution',
84
- './rlaif-self-audit',
85
- ].forEach((m) => {
86
- try {
87
- delete require.cache[require.resolve(m)];
88
- } catch {
89
- // optional module
90
- }
91
- });
92
- const { captureFeedback } = require('./feedback-loop');
93
- const r = captureFeedback({
94
- signal: 'positive',
95
- context: 'unit tests added for edge cases',
96
- tags: ['testing'],
97
- filePaths: ['src/api.js'],
98
- });
99
- if (!r.feedbackEvent) throw new Error('No feedbackEvent in result');
100
- const rc = r.feedbackEvent.richContext;
101
- if (!rc) throw new Error('richContext missing from feedbackEvent');
102
- if (typeof rc.domain !== 'string') throw new Error('richContext.domain must be string');
103
- if (!Array.isArray(rc.filePaths)) throw new Error('richContext.filePaths must be array');
104
- if (!('errorType' in rc)) throw new Error('richContext.errorType field missing');
105
- if (typeof rc.outcomeCategory !== 'string') throw new Error('richContext.outcomeCategory must be string');
106
- if (rc.domain !== 'testing') throw new Error(`Expected domain=testing, got ${rc.domain}`);
107
- },
108
- },
109
- {
110
- id: 'QUAL-03',
111
- desc: 'inferOutcome returns granular categories beyond binary up/down',
112
- fn: () => {
113
- [
114
- './feedback-loop',
115
- ].forEach((m) => {
116
- try { delete require.cache[require.resolve(m)]; } catch {}
117
- });
118
- const { inferOutcome } = require('./feedback-loop');
119
- if (typeof inferOutcome !== 'function') throw new Error('inferOutcome not exported from feedback-loop');
120
-
121
- const cases = [
122
- ['positive', 'solved it first try', 'quick-success'],
123
- ['positive', 'thorough comprehensive analysis', 'deep-success'],
124
- ['positive', 'worked well overall', 'standard-success'],
125
- ['negative', 'gave wrong incorrect answer', 'factual-error'],
126
- ['negative', 'shallow surface level response', 'insufficient-depth'],
127
- ['negative', 'guessed without checking docs', 'false-assumption'],
128
- ];
129
-
130
- for (const [signal, context, expected] of cases) {
131
- const got = inferOutcome(signal, context);
132
- if (got !== expected) {
133
- throw new Error(`inferOutcome('${signal}', '${context}') = '${got}', expected '${expected}'`);
134
- }
135
- }
136
- },
137
- },
138
- {
139
- id: 'QUAL-04',
140
- desc: 'test:quality (node --test tests/validate-feedback.test.js) passes with 0 failures',
141
- fn: () => {
142
- const out = execSync('node --test tests/validate-feedback.test.js', {
143
- cwd: ROOT,
144
- env: { ...process.env, THUMBGATE_FEEDBACK_DIR: tmpDir },
145
- encoding: 'utf8',
146
- stdio: 'pipe',
147
- });
148
- // node:test exits non-zero on failure — if we get here, all tests passed
149
- const failMatch = out.match(/ℹ fail (\d+)/);
150
- if (failMatch && parseInt(failMatch[1], 10) > 0) {
151
- throw new Error(`Tests failed: ${failMatch[1]} failure(s)\n${out.slice(-500)}`);
152
- }
153
- },
154
- },
155
- ];
156
-
157
- console.log('Phase 7: Data Quality — Proof Gate\n');
158
- console.log('Checking requirements:\n');
159
-
160
- for (const check of checks) {
161
- try {
162
- check.fn();
163
- results.passed++;
164
- results.requirements[check.id] = { status: 'pass', desc: check.desc };
165
- console.log(` PASS ${check.id}: ${check.desc}`);
166
- } catch (err) {
167
- results.failed++;
168
- results.requirements[check.id] = {
169
- status: 'fail',
170
- desc: check.desc,
171
- error: err.message,
172
- };
173
- console.error(` FAIL ${check.id}: ${err.message}`);
174
- }
175
- }
176
-
177
- // Cleanup tmp dir
178
- try {
179
- fs.rmSync(tmpDir, { recursive: true, force: true });
180
- } catch {}
181
- delete process.env.THUMBGATE_FEEDBACK_DIR;
182
-
183
- // Write proof artifacts
184
- fs.mkdirSync(proofDir, { recursive: true });
185
-
186
- const report = {
187
- phase: '07-data-quality',
188
- generatedAt: new Date().toISOString(),
189
- passed: results.passed,
190
- failed: results.failed,
191
- total: checks.length,
192
- requirements: results.requirements,
193
- };
194
-
195
- fs.writeFileSync(reportJson, JSON.stringify(report, null, 2) + '\n');
196
-
197
- const md = [
198
- '# Phase 7: Data Quality — Proof Report',
199
- '',
200
- `Generated: ${report.generatedAt}`,
201
- `Result: ${results.passed}/${checks.length} passed`,
202
- '',
203
- '## Requirements',
204
- '',
205
- ...Object.entries(results.requirements).map(([id, r]) => {
206
- const checkbox = r.status === 'pass' ? '[x]' : '[ ]';
207
- const errLine = r.error ? `\n - Error: \`${r.error}\`` : '';
208
- return `- ${checkbox} **${id}**: ${r.desc}${errLine}`;
209
- }),
210
- '',
211
- '## Evidence',
212
- '',
213
- '- `scripts/validate-feedback.js` — 4-level validation pipeline (schema, semantics, anomaly, self-correction)',
214
- '- `scripts/feedback-loop.js` — `inferOutcome()` and `enrichFeedbackContext()` added; `richContext` in every feedbackEvent',
215
- '- `tests/validate-feedback.test.js` — 25 node:test cases covering all QUAL requirements',
216
- '',
217
- ].join('\n');
218
-
219
- fs.writeFileSync(reportMd, md);
220
-
221
- console.log(`\nPhase 7 proof: ${results.passed} passed, ${results.failed} failed`);
222
- console.log(`Report: ${reportJson}`);
223
-
224
- if (results.failed > 0) process.exit(1);
225
- }
226
-
227
- run();
@@ -1,352 +0,0 @@
1
- 'use strict';
2
-
3
- const fs = require('node:fs');
4
- const os = require('node:os');
5
- const path = require('node:path');
6
-
7
- const ROOT = path.join(__dirname, '..');
8
- const RUNNER_PATH = require.resolve('./async-job-runner');
9
- const FEEDBACK_PATH = require.resolve('./feedback-loop');
10
- const VERIFICATION_PATH = require.resolve('./verification-loop');
11
- const EXPERIMENT_TRACKER_PATH = require.resolve('./experiment-tracker');
12
- const EVOLUTION_STATE_PATH = require.resolve('./evolution-state');
13
- const WORKSPACE_EVOLVER_PATH = require.resolve('./workspace-evolver');
14
- const AUTORESEARCH_PATH = require.resolve('./autoresearch-runner');
15
- const VERIFY_RUN_PATH = require.resolve('./verify-run');
16
-
17
- function resolveProofPaths() {
18
- const proofDir = process.env.THUMBGATE_PROOF_DIR || path.join(ROOT, 'proof');
19
- return {
20
- proofDir,
21
- reportJson: path.join(proofDir, 'evolution-report.json'),
22
- reportMd: path.join(proofDir, 'evolution-report.md'),
23
- };
24
- }
25
-
26
- function resetModules() {
27
- [
28
- RUNNER_PATH,
29
- FEEDBACK_PATH,
30
- VERIFICATION_PATH,
31
- EXPERIMENT_TRACKER_PATH,
32
- EVOLUTION_STATE_PATH,
33
- WORKSPACE_EVOLVER_PATH,
34
- AUTORESEARCH_PATH,
35
- VERIFY_RUN_PATH,
36
- ].forEach((modulePath) => {
37
- delete require.cache[modulePath];
38
- });
39
- }
40
-
41
- function stubModule(modulePath, exports) {
42
- require.cache[modulePath] = {
43
- id: modulePath,
44
- filename: modulePath,
45
- loaded: true,
46
- exports,
47
- };
48
- }
49
-
50
- function buildStateCommand(settingKey, expectedValue) {
51
- const script = [
52
- 'const { readEvolutionState } = require("./scripts/evolution-state");',
53
- `const expected = ${JSON.stringify(expectedValue)};`,
54
- `const value = readEvolutionState().settings[${JSON.stringify(settingKey)}];`,
55
- 'const passed = value === expected;',
56
- 'console.log("ℹ tests 1");',
57
- 'console.log("ℹ pass " + (passed ? 1 : 0));',
58
- 'console.log("ℹ fail " + (passed ? 0 : 1));',
59
- 'if (!passed) process.exit(1);',
60
- ].join(' ');
61
- return `${JSON.stringify(process.execPath)} -e ${JSON.stringify(script)}`;
62
- }
63
-
64
- function makeRejectedVerification() {
65
- return {
66
- accepted: false,
67
- attempts: 2,
68
- finalVerification: {
69
- score: 0.2,
70
- violations: [
71
- {
72
- pattern: 'webhook signature mismatch',
73
- avoidRule: 'Verify webhook signatures before deploy.',
74
- },
75
- ],
76
- },
77
- partnerStrategy: {
78
- profile: 'strict_reviewer',
79
- verificationMode: 'evidence_first',
80
- },
81
- partnerReward: {
82
- reward: 0,
83
- },
84
- };
85
- }
86
-
87
- async function run() {
88
- const results = { passed: 0, failed: 0, requirements: {} };
89
- const { proofDir, reportJson, reportMd } = resolveProofPaths();
90
-
91
- const checks = [
92
- {
93
- id: 'EVOLVE-01',
94
- desc: 'evolution-state loads defaults and captures rollback snapshots',
95
- fn: () => {
96
- const feedbackDir = fs.mkdtempSync(path.join(os.tmpdir(), 'thumbgate-evolution-proof-'));
97
- try {
98
- process.env.THUMBGATE_FEEDBACK_DIR = feedbackDir;
99
- resetModules();
100
- const state = require('./evolution-state');
101
- const initial = state.readEvolutionState();
102
- if (initial.settings.half_life_days !== 7) throw new Error('Expected default half_life_days=7');
103
-
104
- const accepted = state.applyAcceptedMutation({
105
- targetKey: 'half_life_days',
106
- nextValue: 9,
107
- experimentId: 'exp_proof',
108
- summary: 'proof mutation',
109
- });
110
- if (!accepted.rollbackSnapshot.snapshotId) throw new Error('Expected rollback snapshot id');
111
- if (state.readEvolutionState().settings.half_life_days !== 9) throw new Error('Accepted mutation did not persist');
112
- } finally {
113
- delete process.env.THUMBGATE_FEEDBACK_DIR;
114
- resetModules();
115
- fs.rmSync(feedbackDir, { recursive: true, force: true });
116
- }
117
- },
118
- },
119
- {
120
- id: 'EVOLVE-02',
121
- desc: 'workspace-evolver accepts improved candidates only when primary and holdout checks pass',
122
- fn: () => {
123
- const feedbackDir = fs.mkdtempSync(path.join(os.tmpdir(), 'thumbgate-evolution-proof-'));
124
- try {
125
- process.env.THUMBGATE_FEEDBACK_DIR = feedbackDir;
126
- resetModules();
127
- const { runWorkspaceEvolution } = require('./workspace-evolver');
128
- const { readEvolutionState } = require('./evolution-state');
129
- const result = runWorkspaceEvolution({
130
- cwd: ROOT,
131
- targetName: 'half_life_days',
132
- nextValue: 8,
133
- primaryCommands: [buildStateCommand('half_life_days', 8)],
134
- holdoutCommands: [buildStateCommand('half_life_days', 8)],
135
- timeoutMs: 5000,
136
- });
137
-
138
- if (!result.kept) throw new Error('Expected improved candidate to be kept');
139
- if (!result.metrics.rollbackSnapshotId) throw new Error('Expected rollback snapshot metadata');
140
- if (readEvolutionState().settings.half_life_days !== 8) throw new Error('Accepted evolution state not applied');
141
- } finally {
142
- delete process.env.THUMBGATE_FEEDBACK_DIR;
143
- resetModules();
144
- fs.rmSync(feedbackDir, { recursive: true, force: true });
145
- }
146
- },
147
- },
148
- {
149
- id: 'EVOLVE-03',
150
- desc: 'restoreWorkspaceEvolution rolls accepted state back to the previous snapshot',
151
- fn: () => {
152
- const feedbackDir = fs.mkdtempSync(path.join(os.tmpdir(), 'thumbgate-evolution-proof-'));
153
- try {
154
- process.env.THUMBGATE_FEEDBACK_DIR = feedbackDir;
155
- resetModules();
156
- const { runWorkspaceEvolution, restoreWorkspaceEvolution } = require('./workspace-evolver');
157
- const { readEvolutionState } = require('./evolution-state');
158
- const result = runWorkspaceEvolution({
159
- cwd: ROOT,
160
- targetName: 'half_life_days',
161
- nextValue: 8,
162
- primaryCommands: [buildStateCommand('half_life_days', 8)],
163
- holdoutCommands: [buildStateCommand('half_life_days', 8)],
164
- timeoutMs: 5000,
165
- });
166
-
167
- restoreWorkspaceEvolution(result.metrics.rollbackSnapshotId);
168
- if (readEvolutionState().settings.half_life_days !== 7) throw new Error('Rollback did not restore default state');
169
- } finally {
170
- delete process.env.THUMBGATE_FEEDBACK_DIR;
171
- resetModules();
172
- fs.rmSync(feedbackDir, { recursive: true, force: true });
173
- }
174
- },
175
- },
176
- {
177
- id: 'EVOLVE-04',
178
- desc: 'autoresearch-runner delegates to workspace evolver and records research metadata plus rollback evidence',
179
- fn: async () => {
180
- const feedbackDir = fs.mkdtempSync(path.join(os.tmpdir(), 'thumbgate-evolution-proof-'));
181
- try {
182
- process.env.THUMBGATE_FEEDBACK_DIR = feedbackDir;
183
- resetModules();
184
- const runner = require('./autoresearch-runner');
185
- const result = await runner.runIteration({
186
- targetName: 'half_life_days',
187
- nextValue: 8,
188
- testCommand: buildStateCommand('half_life_days', 8),
189
- holdoutCommands: [buildStateCommand('half_life_days', 8)],
190
- timeoutMs: 5000,
191
- researchQuery: 'rank fusion',
192
- searchPapersImpl: async () => [{
193
- paperId: '2603.01896',
194
- title: 'Agentic Rank Fusion for Research Systems',
195
- summary: 'Retrieval fusion for agent workflows.',
196
- authors: ['Ada Lovelace'],
197
- tags: ['retrieval'],
198
- url: 'https://arxiv.org/abs/2603.01896',
199
- source: 'huggingface-papers',
200
- }],
201
- });
202
-
203
- if (!result.kept) throw new Error('Expected autoresearch iteration to keep the improved candidate');
204
- if (result.metrics.researchQuery !== 'rank fusion') throw new Error('Research query metadata missing');
205
- if (!result.metrics.researchPackId) throw new Error('Research pack id missing');
206
- if (!result.metrics.researchPaperIds.includes('2603.01896')) throw new Error('Research paper id missing');
207
- if (!result.metrics.rollbackSnapshotId) throw new Error('Rollback snapshot metadata missing');
208
- } finally {
209
- delete process.env.THUMBGATE_FEEDBACK_DIR;
210
- resetModules();
211
- fs.rmSync(feedbackDir, { recursive: true, force: true });
212
- }
213
- },
214
- },
215
- {
216
- id: 'EVOLVE-05',
217
- desc: 'async-job-runner follow-up experiments include a recommended evolution target and replay command',
218
- fn: () => {
219
- const feedbackDir = fs.mkdtempSync(path.join(os.tmpdir(), 'thumbgate-evolution-proof-'));
220
- try {
221
- process.env.THUMBGATE_FEEDBACK_DIR = feedbackDir;
222
- resetModules();
223
- stubModule(VERIFICATION_PATH, {
224
- runVerificationLoop: () => makeRejectedVerification(),
225
- });
226
- const runner = require('./async-job-runner');
227
- const tracker = require('./experiment-tracker');
228
- runner.executeJob({
229
- id: 'verification-failure-job',
230
- context: 'webhook signature mismatch',
231
- tags: ['billing'],
232
- skill: 'billing-guard',
233
- });
234
- const experiments = tracker.loadExperiments();
235
- const experiment = experiments[0];
236
-
237
- if (!experiment) throw new Error('Expected queued improvement experiment');
238
- if (!experiment.mutation.recommendedTarget) throw new Error('Missing recommendedTarget');
239
- if (!experiment.mutation.evolutionCommand.includes('workspace-evolver.js')) {
240
- throw new Error('Missing workspace evolver replay command');
241
- }
242
- } finally {
243
- delete process.env.THUMBGATE_FEEDBACK_DIR;
244
- resetModules();
245
- fs.rmSync(feedbackDir, { recursive: true, force: true });
246
- }
247
- },
248
- },
249
- {
250
- id: 'EVOLVE-06',
251
- desc: 'verify:full includes the evolution proof lane and records the artifact',
252
- fn: () => {
253
- resetModules();
254
- const { buildVerifyPlan, recordVerifyWorkflowRun } = require('./verify-run');
255
- const plan = buildVerifyPlan('full');
256
- const commands = plan.map((step) => [step.command, ...(step.args || [])].join(' ')).join('\n');
257
- if (!commands.includes('prove:evolution')) {
258
- throw new Error('verify:full is missing prove:evolution');
259
- }
260
-
261
- const feedbackDir = fs.mkdtempSync(path.join(os.tmpdir(), 'thumbgate-evolution-proof-feedback-'));
262
- const cwd = fs.mkdtempSync(path.join(os.tmpdir(), 'thumbgate-evolution-proof-cwd-'));
263
- try {
264
- const entry = recordVerifyWorkflowRun('full', cwd, feedbackDir);
265
- if (!entry.proofArtifacts.some((artifact) => artifact.endsWith(path.join('proof', 'evolution-report.json')))) {
266
- throw new Error('Workflow run missing evolution proof artifact');
267
- }
268
- } finally {
269
- fs.rmSync(feedbackDir, { recursive: true, force: true });
270
- fs.rmSync(cwd, { recursive: true, force: true });
271
- }
272
- },
273
- },
274
- ];
275
-
276
- console.log('Phase 17: Agent Workspace Evolution — Proof Gate\n');
277
- console.log('Checking requirements:\n');
278
-
279
- for (const check of checks) {
280
- try {
281
- await check.fn();
282
- results.passed++;
283
- results.requirements[check.id] = { status: 'pass', desc: check.desc };
284
- console.log(` PASS ${check.id}: ${check.desc}`);
285
- } catch (error) {
286
- results.failed++;
287
- results.requirements[check.id] = {
288
- status: 'fail',
289
- desc: check.desc,
290
- error: error.message,
291
- };
292
- console.error(` FAIL ${check.id}: ${error.message}`);
293
- }
294
- }
295
-
296
- fs.mkdirSync(proofDir, { recursive: true });
297
-
298
- const report = {
299
- phase: '17-agent-workspace-evolution',
300
- generatedAt: new Date().toISOString(),
301
- passed: results.passed,
302
- failed: results.failed,
303
- requirements: results.requirements,
304
- };
305
-
306
- fs.writeFileSync(reportJson, `${JSON.stringify(report, null, 2)}\n`);
307
-
308
- const lines = [
309
- '# Agent Workspace Evolution Proof Report',
310
- '',
311
- `Generated: ${report.generatedAt}`,
312
- '',
313
- `Summary: ${results.passed} passed, ${results.failed} failed`,
314
- '',
315
- '## Requirements',
316
- '',
317
- ];
318
-
319
- for (const [id, requirement] of Object.entries(results.requirements)) {
320
- lines.push(`- [${requirement.status === 'pass' ? 'x' : ' '}] **${id}** — ${requirement.desc}`);
321
- if (requirement.error) {
322
- lines.push(` - Error: ${requirement.error}`);
323
- }
324
- }
325
-
326
- lines.push('');
327
- lines.push('## Evidence');
328
- lines.push('');
329
- lines.push('- `scripts/evolution-state.js` — local accepted-state overlay + rollback snapshots');
330
- lines.push('- `scripts/workspace-evolver.js` — evolve / evaluate / accept / rollback engine');
331
- lines.push('- `scripts/autoresearch-runner.js` — shared research-backed mutation loop on top of the evolver');
332
- lines.push('- `scripts/prove-evolution.js` — this proof gate');
333
-
334
- fs.writeFileSync(reportMd, `${lines.join('\n')}\n`);
335
-
336
- console.log(`\n${results.passed} passed, ${results.failed} failed`);
337
-
338
- if (results.failed > 0) {
339
- process.exitCode = 1;
340
- }
341
- }
342
-
343
// Direct-execution guard: start the proof gate only when this file is the
// process entry script, not when it is loaded via require() by another module.
if (module === require.main) {
  run().then(undefined, (failure) => {
    // A rejection from run() is logged and the process ends with exit status 1.
    console.error(failure);
    process.exit(1);
  });
}

// Public API: expose `run` so other scripts can invoke the proof gate directly.
module.exports = { run };