npm - thumbgate - Versions diffs - 1.4.2 → 1.4.4 - Mend

thumbgate 1.4.2 → 1.4.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (279)

package/.claude-plugin/README.md +45 -34
package/.claude-plugin/marketplace.json +3 -3
package/.claude-plugin/plugin.json +3 -3
package/.well-known/llms.txt +1 -1
package/.well-known/mcp/server-card.json +1 -1
package/README.md +26 -2
package/adapters/README.md +4 -1
package/adapters/claude/.mcp.json +2 -2
package/adapters/codex/config.toml +2 -2
package/adapters/mcp/server-stdio.js +10 -4
package/adapters/opencode/opencode.json +1 -1
package/bin/cli.js +246 -90
package/config/mcp-allowlists.json +11 -3
package/package.json +184 -21
package/scripts/audit-trail.js +25 -15
package/scripts/auto-wire-hooks.js +127 -0
package/scripts/cli-demo.js +102 -0
package/scripts/cli-schema.js +285 -0
package/scripts/cli-status.js +166 -0
package/scripts/cross-encoder-reranker.js +235 -0
package/scripts/explore-subcommands.js +277 -0
package/scripts/explore.js +569 -0
package/scripts/feedback-loop.js +20 -6
package/scripts/lesson-inference.js +7 -1
package/scripts/lesson-reranker.js +263 -0
package/scripts/lesson-retrieval.js +34 -17
package/scripts/lesson-search.js +69 -0
package/scripts/perplexity-client.js +210 -0
package/scripts/reflector-agent.js +2 -2
package/scripts/statusline-local-stats.js +3 -1
package/scripts/statusline.sh +12 -11
package/src/api/server.js +178 -17
package/src/index.js +3 -0
package/.claude-plugin/bundle/icon.png +0 -0
package/.claude-plugin/bundle/icon.svg +0 -18
package/.claude-plugin/bundle/server/index.js +0 -24
package/adapters/chatgpt/INSTALL.md +0 -138
package/bin/memory.sh +0 -64
package/bin/obsidian-sync.sh +0 -20
package/plugins/amp-skill/INSTALL.md +0 -52
package/plugins/amp-skill/SKILL.md +0 -64
package/plugins/claude-codex-bridge/.claude-plugin/plugin.json +0 -22
package/plugins/claude-codex-bridge/.mcp.json +0 -14
package/plugins/claude-codex-bridge/INSTALL.md +0 -43
package/plugins/claude-codex-bridge/README.md +0 -46
package/plugins/claude-codex-bridge/scripts/codex-bridge.js +0 -286
package/plugins/claude-codex-bridge/skills/adversarial-review/SKILL.md +0 -24
package/plugins/claude-codex-bridge/skills/result/SKILL.md +0 -22
package/plugins/claude-codex-bridge/skills/review/SKILL.md +0 -28
package/plugins/claude-codex-bridge/skills/second-pass/SKILL.md +0 -27
package/plugins/claude-codex-bridge/skills/setup/SKILL.md +0 -21
package/plugins/claude-codex-bridge/skills/status/SKILL.md +0 -19
package/plugins/claude-skill/INSTALL.md +0 -55
package/plugins/claude-skill/SKILL.md +0 -46
package/plugins/codex-profile/.codex-plugin/plugin.json +0 -43
package/plugins/codex-profile/.mcp.json +0 -14
package/plugins/codex-profile/AGENTS.md +0 -20
package/plugins/codex-profile/INSTALL.md +0 -89
package/plugins/codex-profile/README.md +0 -61
package/plugins/cursor-marketplace/.cursor-plugin/plugin.json +0 -23
package/plugins/cursor-marketplace/CHANGELOG.md +0 -30
package/plugins/cursor-marketplace/LICENSE +0 -21
package/plugins/cursor-marketplace/README.md +0 -124
package/plugins/cursor-marketplace/agents/reliability-reviewer.md +0 -31
package/plugins/cursor-marketplace/assets/logo-400x400.png +0 -0
package/plugins/cursor-marketplace/commands/capture-feedback.md +0 -33
package/plugins/cursor-marketplace/commands/check-gates.md +0 -25
package/plugins/cursor-marketplace/commands/show-lessons.md +0 -27
package/plugins/cursor-marketplace/hooks/hooks.json +0 -10
package/plugins/cursor-marketplace/mcp.json +0 -14
package/plugins/cursor-marketplace/rules/feedback-capture.mdc +0 -34
package/plugins/cursor-marketplace/rules/pre-action-gates.mdc +0 -30
package/plugins/cursor-marketplace/rules/session-continuity.mdc +0 -28
package/plugins/cursor-marketplace/scripts/gate-check.sh +0 -21
package/plugins/cursor-marketplace/skills/capture-feedback/SKILL.md +0 -48
package/plugins/cursor-marketplace/skills/prevention-rules/SKILL.md +0 -31
package/plugins/cursor-marketplace/skills/recall-context/SKILL.md +0 -30
package/plugins/cursor-marketplace/skills/search-lessons/SKILL.md +0 -33
package/plugins/gemini-extension/INSTALL.md +0 -92
package/plugins/gemini-extension/gemini_prompt.txt +0 -14
package/plugins/gemini-extension/tool_contract.json +0 -45
package/plugins/opencode-profile/INSTALL.md +0 -57
package/public/assets/instagram-card.png +0 -0
package/public/assets/tiktok-agent-memory.mp4 +0 -0
package/public/blog.html +0 -474
package/public/compare/mem0.html +0 -189
package/public/compare/speclock.html +0 -180
package/public/compare.html +0 -310
package/public/dashboard.html +0 -1100
package/public/guide.html +0 -317
package/public/guides/claude-code-prevent-repeated-mistakes.html +0 -161
package/public/guides/codex-cli-guardrails.html +0 -158
package/public/guides/cursor-prevent-repeated-mistakes.html +0 -161
package/public/guides/pre-action-gates.html +0 -162
package/public/guides/stop-repeated-ai-agent-mistakes.html +0 -159
package/public/index.html +0 -1128
package/public/js/buyer-intent.js +0 -252
package/public/learn/agent-harness-pattern.html +0 -180
package/public/learn/ai-agent-persistent-memory.html +0 -203
package/public/learn/learn.css +0 -45
package/public/learn/mcp-pre-action-gates-explained.html +0 -172
package/public/learn/stop-ai-agent-force-push.html +0 -134
package/public/learn/vibe-coding-safety-net.html +0 -142
package/public/learn.html +0 -274
package/public/lessons.html +0 -967
package/public/llm-context.md +0 -140
package/public/pro.html +0 -1087
package/public/vercel.json +0 -8
package/scripts/a2ui-engine.js +0 -73
package/scripts/adk-consolidator.js +0 -274
package/scripts/agent-security-hardening.js +0 -225
package/scripts/ai-search-visibility.js +0 -142
package/scripts/autonomous-sales-agent.js +0 -39
package/scripts/autoresearch-runner.js +0 -216
package/scripts/background-agent-governance.js +0 -229
package/scripts/behavioral-extraction.js +0 -93
package/scripts/budget-enforcer.js +0 -173
package/scripts/budget-guard.js +0 -173
package/scripts/build-claude-mcpb.js +0 -255
package/scripts/build-codex-plugin.js +0 -152
package/scripts/capture-railway-diagnostics.sh +0 -97
package/scripts/changeset-check.js +0 -372
package/scripts/check-congruence.js +0 -443
package/scripts/computer-use-firewall.js +0 -280
package/scripts/content-engine/linkedin-content-generator.js +0 -154
package/scripts/content-engine/output/linkedin-memento-validation.md +0 -17
package/scripts/content-engine/output/linkedin-posts-2026-04-09.md +0 -175
package/scripts/content-engine/reddit-thread-finder.js +0 -154
package/scripts/context-engine.js +0 -710
package/scripts/daily-digest.js +0 -11
package/scripts/data-governance.js +0 -173
package/scripts/deploy-gcp.sh +0 -44
package/scripts/deploy-policy.js +0 -249
package/scripts/disagreement-mining.js +0 -315
package/scripts/dpo-optimizer.js +0 -206
package/scripts/ensure-repo-bootstrap.js +0 -130
package/scripts/ephemeral-agent-store.js +0 -212
package/scripts/eval-harness.js +0 -56
package/scripts/export-kto-pairs.js +0 -309
package/scripts/export-training.js +0 -446
package/scripts/feedback-fallback.js +0 -111
package/scripts/feedback-inbox-read.js +0 -162
package/scripts/feedback-root-consolidator.js +0 -233
package/scripts/feedback-to-memory.js +0 -185
package/scripts/gate-satisfy.js +0 -42
package/scripts/generate-paperbanana-diagrams.sh +0 -99
package/scripts/generate-pretool-hook.sh +0 -40
package/scripts/github-about.js +0 -430
package/scripts/github-outreach.js +0 -65
package/scripts/gtm-revenue-loop.js +0 -535
package/scripts/hallucination-detector.js +0 -226
package/scripts/hf-papers.js +0 -317
package/scripts/hook-auto-capture.sh +0 -100
package/scripts/hook-stop-pr-thread-check.sh +0 -68
package/scripts/hook-stop-self-score.sh +0 -51
package/scripts/hook-stop-verify-deploy.sh +0 -31
package/scripts/hook-verify-before-done.sh +0 -20
package/scripts/managed-dpo-export.js +0 -91
package/scripts/markdown-escape.js +0 -12
package/scripts/marketing-experiment.js +0 -657
package/scripts/memalign-recall.js +0 -111
package/scripts/memory-migration.js +0 -296
package/scripts/meta-policy.js +0 -190
package/scripts/metered-billing.js +0 -16
package/scripts/model-tier-router.js +0 -310
package/scripts/money-watcher.js +0 -218
package/scripts/multi-hop-recall.js +0 -240
package/scripts/per-step-scoring.js +0 -163
package/scripts/perplexity-marketing.js +0 -466
package/scripts/pii-scanner.js +0 -153
package/scripts/plan-gate.js +0 -154
package/scripts/post-everywhere.js +0 -341
package/scripts/post-to-x-retry.sh +0 -22
package/scripts/post-to-x.js +0 -369
package/scripts/pr-manager.js +0 -421
package/scripts/principle-extractor.js +0 -162
package/scripts/pro-features.js +0 -41
package/scripts/prompt-dlp.js +0 -222
package/scripts/prove-adapters.js +0 -860
package/scripts/prove-attribution.js +0 -361
package/scripts/prove-automation.js +0 -651
package/scripts/prove-autoresearch.js +0 -304
package/scripts/prove-claim-verification.js +0 -277
package/scripts/prove-cloudflare-sandbox.js +0 -161
package/scripts/prove-data-pipeline.js +0 -408
package/scripts/prove-data-quality.js +0 -227
package/scripts/prove-evolution.js +0 -352
package/scripts/prove-harnesses.js +0 -287
package/scripts/prove-intelligence.js +0 -257
package/scripts/prove-lancedb.js +0 -425
package/scripts/prove-local-intelligence.js +0 -340
package/scripts/prove-loop-closure.js +0 -263
package/scripts/prove-packaged-runtime.js +0 -326
package/scripts/prove-predictive-insights.js +0 -355
package/scripts/prove-runtime.js +0 -363
package/scripts/prove-seo-gsd.js +0 -234
package/scripts/prove-settings.js +0 -279
package/scripts/prove-subway-upgrades.js +0 -277
package/scripts/prove-tessl.js +0 -229
package/scripts/prove-training-export.js +0 -325
package/scripts/prove-workflow-contract.js +0 -112
package/scripts/prove-xmemory.js +0 -332
package/scripts/publish-decision.js +0 -159
package/scripts/ralph-loop.js +0 -376
package/scripts/ralph-mode-ci.js +0 -331
package/scripts/reddit-dm-outreach.js +0 -192
package/scripts/reddit-monitor-cron.sh +0 -26
package/scripts/reminder-engine.js +0 -132
package/scripts/revenue-status.js +0 -472
package/scripts/rotate-stripe-webhook-secret.js +0 -314
package/scripts/schedule-manager.js +0 -249
package/scripts/self-healing-check.js +0 -193
package/scripts/shieldcortex-memory-firewall-runner.mjs +0 -53
package/scripts/skill-exporter.js +0 -260
package/scripts/skill-materializer.js +0 -134
package/scripts/skill-packs.js +0 -136
package/scripts/skill-proposer.js +0 -99
package/scripts/skill-quality-tracker.js +0 -282
package/scripts/slow-loop.js +0 -72
package/scripts/social-analytics/db/analytics.sqlite +0 -0
package/scripts/social-analytics/db/schema.sql +0 -32
package/scripts/social-analytics/digest.js +0 -256
package/scripts/social-analytics/engagement-audit.js +0 -185
package/scripts/social-analytics/generate-instagram-card.js +0 -97
package/scripts/social-analytics/instagram-thumbgate-post.js +0 -111
package/scripts/social-analytics/install-growth-automation.js +0 -114
package/scripts/social-analytics/load-env.js +0 -77
package/scripts/social-analytics/mcp-server.js +0 -289
package/scripts/social-analytics/normalizer.js +0 -580
package/scripts/social-analytics/notify.js +0 -162
package/scripts/social-analytics/poll-all.js +0 -107
package/scripts/social-analytics/pollers/github.js +0 -195
package/scripts/social-analytics/pollers/instagram.js +0 -253
package/scripts/social-analytics/pollers/linkedin.js +0 -340
package/scripts/social-analytics/pollers/plausible.js +0 -245
package/scripts/social-analytics/pollers/reddit.js +0 -306
package/scripts/social-analytics/pollers/threads.js +0 -233
package/scripts/social-analytics/pollers/tiktok.js +0 -203
package/scripts/social-analytics/pollers/x.js +0 -227
package/scripts/social-analytics/pollers/youtube.js +0 -304
package/scripts/social-analytics/pollers/zernio.js +0 -183
package/scripts/social-analytics/publish-instagram-thumbgate.js +0 -104
package/scripts/social-analytics/publish-thumbgate-launch.js +0 -322
package/scripts/social-analytics/publishers/devto.js +0 -122
package/scripts/social-analytics/publishers/instagram.js +0 -317
package/scripts/social-analytics/publishers/linkedin.js +0 -294
package/scripts/social-analytics/publishers/reddit.js +0 -385
package/scripts/social-analytics/publishers/threads.js +0 -275
package/scripts/social-analytics/publishers/tiktok.js +0 -217
package/scripts/social-analytics/publishers/x.js +0 -259
package/scripts/social-analytics/publishers/youtube.js +0 -223
package/scripts/social-analytics/publishers/zernio.js +0 -539
package/scripts/social-analytics/reconcile-thumbgate-campaign.js +0 -165
package/scripts/social-analytics/run-digest.js +0 -34
package/scripts/social-analytics/schedule-thumbgate-campaign.js +0 -275
package/scripts/social-analytics/store.js +0 -455
package/scripts/social-analytics/sync-launch-assets.js +0 -185
package/scripts/social-analytics/utm.js +0 -143
package/scripts/social-pipeline.js +0 -2626
package/scripts/social-post-hourly.js +0 -228
package/scripts/social-quality-gate.js +0 -134
package/scripts/social-reply-monitor.js +0 -592
package/scripts/status-dashboard.js +0 -155
package/scripts/stripe-live-status.js +0 -115
package/scripts/subagent-profiles.js +0 -79
package/scripts/sync-branch-protection.js +0 -340
package/scripts/sync-gh-secrets-from-env.sh +0 -70
package/scripts/sync-github-about.js +0 -55
package/scripts/sync-version.js +0 -479
package/scripts/synthetic-dpo.js +0 -234
package/scripts/tessl-export.js +0 -369
package/scripts/test-coverage.js +0 -128
package/scripts/thumbgate_session_start.sh +0 -32
package/scripts/train_from_feedback.py +0 -929
package/scripts/validate-feedback.js +0 -581
package/scripts/verify-obsidian-setup.sh +0 -269
package/scripts/verify-run.js +0 -269
package/scripts/weekly-auto-post.js +0 -124
package/scripts/x-autonomous-marketing.js +0 -139

package/scripts/prove-data-quality.js DELETED

@@ -1,227 +0,0 @@
-'use strict';
-/**
- * Phase 7: Data Quality — Proof Gate
- *
- * Validates all QUAL-01 through QUAL-04 requirements offline.
- * Mirrors the pattern of prove-attribution.js (mkdtempSync + env override + execSync).
- *
- * Usage:
- *   node scripts/prove-data-quality.js
- *
- * Produces:
- *   proof/data-quality-report.json
- *   proof/data-quality-report.md
- */
-const { execSync } = require('child_process');
-const fs = require('fs');
-const os = require('os');
-const path = require('path');
-const ROOT = path.join(__dirname, '..');
-function resolveProofPaths() {
-  const proofDir = process.env.THUMBGATE_PROOF_DIR || path.join(ROOT, 'proof');
-  return {
-    proofDir,
-    reportJson: path.join(proofDir, 'data-quality-report.json'),
-    reportMd: path.join(proofDir, 'data-quality-report.md'),
-  };
-}
-function run() {
-  const tmpDir = fs.mkdtempSync(path.join(os.tmpdir(), 'thumbgate-qual-proof-'));
-  const results = { passed: 0, failed: 0, requirements: {} };
-  const { proofDir, reportJson, reportMd } = resolveProofPaths();
-  const checks = [
-    {
-      id: 'QUAL-01',
-      desc: 'validate-feedback.js exports validateEntry with 4-level pipeline',
-      fn: () => {
-        delete require.cache[require.resolve('./validate-feedback')];
-        const v = require('./validate-feedback');
-        if (typeof v.validateEntry !== 'function') throw new Error('validateEntry not exported');
-        if (typeof v.validateSchema !== 'function') throw new Error('validateSchema not exported');
-        if (typeof v.validateSemantics !== 'function') throw new Error('validateSemantics not exported');
-        if (typeof v.detectAnomalies !== 'function') throw new Error('detectAnomalies not exported');
-        if (typeof v.generateCorrections !== 'function') throw new Error('generateCorrections not exported');
-        // Verify semantic inconsistency is caught
-        const r = v.validateEntry({
-          id: 'proof-x',
-          timestamp: new Date().toISOString(),
-          signal: 'positive',
-          reward: -1,
-          context: 'good work done',
-        });
-        if (r.valid) throw new Error('Expected invalid for positive+negative-reward');
-        if (!r.corrections.length) throw new Error('Expected auto-correction for reward');
-        if (r.correctedEntry.reward !== 1) throw new Error('Expected corrected reward=1');
-        // Verify sensitive data detection
-        const r2 = v.validateEntry({
-          id: 'proof-y',
-          timestamp: new Date().toISOString(),
-          signal: 'positive',
-          reward: 1,
-          context: 'api_key=abc123 was in the response',
-        });
-        if (!r2.issues.some((i) => i.type === 'security')) {
-          throw new Error('Expected security issue for api_key pattern');
-        }
-      },
-    },
-    {
-      id: 'QUAL-02',
-      desc: 'captureFeedback produces richContext with domain, filePaths, errorType, outcomeCategory',
-      fn: () => {
-        process.env.THUMBGATE_FEEDBACK_DIR = tmpDir;
-        // Clear module cache so env var takes effect
-        [
-          './feedback-loop',
-          './feedback-attribution',
-          './rlaif-self-audit',
-        ].forEach((m) => {
-          try {
-            delete require.cache[require.resolve(m)];
-          } catch {
-            // optional module
-          }
-        });
-        const { captureFeedback } = require('./feedback-loop');
-        const r = captureFeedback({
-          signal: 'positive',
-          context: 'unit tests added for edge cases',
-          tags: ['testing'],
-          filePaths: ['src/api.js'],
-        });
-        if (!r.feedbackEvent) throw new Error('No feedbackEvent in result');
-        const rc = r.feedbackEvent.richContext;
-        if (!rc) throw new Error('richContext missing from feedbackEvent');
-        if (typeof rc.domain !== 'string') throw new Error('richContext.domain must be string');
-        if (!Array.isArray(rc.filePaths)) throw new Error('richContext.filePaths must be array');
-        if (!('errorType' in rc)) throw new Error('richContext.errorType field missing');
-        if (typeof rc.outcomeCategory !== 'string') throw new Error('richContext.outcomeCategory must be string');
-        if (rc.domain !== 'testing') throw new Error(`Expected domain=testing, got ${rc.domain}`);
-      },
-    },
-    {
-      id: 'QUAL-03',
-      desc: 'inferOutcome returns granular categories beyond binary up/down',
-      fn: () => {
-        [
-          './feedback-loop',
-        ].forEach((m) => {
-          try { delete require.cache[require.resolve(m)]; } catch {}
-        });
-        const { inferOutcome } = require('./feedback-loop');
-        if (typeof inferOutcome !== 'function') throw new Error('inferOutcome not exported from feedback-loop');
-        const cases = [
-          ['positive', 'solved it first try', 'quick-success'],
-          ['positive', 'thorough comprehensive analysis', 'deep-success'],
-          ['positive', 'worked well overall', 'standard-success'],
-          ['negative', 'gave wrong incorrect answer', 'factual-error'],
-          ['negative', 'shallow surface level response', 'insufficient-depth'],
-          ['negative', 'guessed without checking docs', 'false-assumption'],
-        ];
-        for (const [signal, context, expected] of cases) {
-          const got = inferOutcome(signal, context);
-          if (got !== expected) {
-            throw new Error(`inferOutcome('${signal}', '${context}') = '${got}', expected '${expected}'`);
-          }
-        }
-      },
-    },
-    {
-      id: 'QUAL-04',
-      desc: 'test:quality (node --test tests/validate-feedback.test.js) passes with 0 failures',
-      fn: () => {
-        const out = execSync('node --test tests/validate-feedback.test.js', {
-          cwd: ROOT,
-          env: { ...process.env, THUMBGATE_FEEDBACK_DIR: tmpDir },
-          encoding: 'utf8',
-          stdio: 'pipe',
-        });
-        // node:test exits non-zero on failure — if we get here, all tests passed
-        const failMatch = out.match(/ℹ fail (\d+)/);
-        if (failMatch && parseInt(failMatch[1], 10) > 0) {
-          throw new Error(`Tests failed: ${failMatch[1]} failure(s)\n${out.slice(-500)}`);
-        }
-      },
-    },
-  ];
-  console.log('Phase 7: Data Quality — Proof Gate\n');
-  console.log('Checking requirements:\n');
-  for (const check of checks) {
-    try {
-      check.fn();
-      results.passed++;
-      results.requirements[check.id] = { status: 'pass', desc: check.desc };
-      console.log(`  PASS  ${check.id}: ${check.desc}`);
-    } catch (err) {
-      results.failed++;
-      results.requirements[check.id] = {
-        status: 'fail',
-        desc: check.desc,
-        error: err.message,
-      };
-      console.error(`  FAIL  ${check.id}: ${err.message}`);
-    }
-  }
-  // Cleanup tmp dir
-  try {
-    fs.rmSync(tmpDir, { recursive: true, force: true });
-  } catch {}
-  delete process.env.THUMBGATE_FEEDBACK_DIR;
-  // Write proof artifacts
-  fs.mkdirSync(proofDir, { recursive: true });
-  const report = {
-    phase: '07-data-quality',
-    generatedAt: new Date().toISOString(),
-    passed: results.passed,
-    failed: results.failed,
-    total: checks.length,
-    requirements: results.requirements,
-  };
-  fs.writeFileSync(reportJson, JSON.stringify(report, null, 2) + '\n');
-  const md = [
-    '# Phase 7: Data Quality — Proof Report',
-    '',
-    `Generated: ${report.generatedAt}`,
-    `Result: ${results.passed}/${checks.length} passed`,
-    '',
-    '## Requirements',
-    '',
-    ...Object.entries(results.requirements).map(([id, r]) => {
-      const checkbox = r.status === 'pass' ? '[x]' : '[ ]';
-      const errLine = r.error ? `\n  - Error: \`${r.error}\`` : '';
-      return `- ${checkbox} **${id}**: ${r.desc}${errLine}`;
-    }),
-    '',
-    '## Evidence',
-    '',
-    '- `scripts/validate-feedback.js` — 4-level validation pipeline (schema, semantics, anomaly, self-correction)',
-    '- `scripts/feedback-loop.js` — `inferOutcome()` and `enrichFeedbackContext()` added; `richContext` in every feedbackEvent',
-    '- `tests/validate-feedback.test.js` — 25 node:test cases covering all QUAL requirements',
-    '',
-  ].join('\n');
-  fs.writeFileSync(reportMd, md);
-  console.log(`\nPhase 7 proof: ${results.passed} passed, ${results.failed} failed`);
-  console.log(`Report: ${reportJson}`);
-  if (results.failed > 0) process.exit(1);
-}
-run();

package/scripts/prove-evolution.js DELETED

@@ -1,352 +0,0 @@
-'use strict';
-const fs = require('node:fs');
-const os = require('node:os');
-const path = require('node:path');
-const ROOT = path.join(__dirname, '..');
-const RUNNER_PATH = require.resolve('./async-job-runner');
-const FEEDBACK_PATH = require.resolve('./feedback-loop');
-const VERIFICATION_PATH = require.resolve('./verification-loop');
-const EXPERIMENT_TRACKER_PATH = require.resolve('./experiment-tracker');
-const EVOLUTION_STATE_PATH = require.resolve('./evolution-state');
-const WORKSPACE_EVOLVER_PATH = require.resolve('./workspace-evolver');
-const AUTORESEARCH_PATH = require.resolve('./autoresearch-runner');
-const VERIFY_RUN_PATH = require.resolve('./verify-run');
-function resolveProofPaths() {
-  const proofDir = process.env.THUMBGATE_PROOF_DIR || path.join(ROOT, 'proof');
-  return {
-    proofDir,
-    reportJson: path.join(proofDir, 'evolution-report.json'),
-    reportMd: path.join(proofDir, 'evolution-report.md'),
-  };
-}
-function resetModules() {
-  [
-    RUNNER_PATH,
-    FEEDBACK_PATH,
-    VERIFICATION_PATH,
-    EXPERIMENT_TRACKER_PATH,
-    EVOLUTION_STATE_PATH,
-    WORKSPACE_EVOLVER_PATH,
-    AUTORESEARCH_PATH,
-    VERIFY_RUN_PATH,
-  ].forEach((modulePath) => {
-    delete require.cache[modulePath];
-  });
-}
-function stubModule(modulePath, exports) {
-  require.cache[modulePath] = {
-    id: modulePath,
-    filename: modulePath,
-    loaded: true,
-    exports,
-  };
-}
-function buildStateCommand(settingKey, expectedValue) {
-  const script = [
-    'const { readEvolutionState } = require("./scripts/evolution-state");',
-    `const expected = ${JSON.stringify(expectedValue)};`,
-    `const value = readEvolutionState().settings[${JSON.stringify(settingKey)}];`,
-    'const passed = value === expected;',
-    'console.log("ℹ tests 1");',
-    'console.log("ℹ pass " + (passed ? 1 : 0));',
-    'console.log("ℹ fail " + (passed ? 0 : 1));',
-    'if (!passed) process.exit(1);',
-  ].join(' ');
-  return `${JSON.stringify(process.execPath)} -e ${JSON.stringify(script)}`;
-}
-function makeRejectedVerification() {
-  return {
-    accepted: false,
-    attempts: 2,
-    finalVerification: {
-      score: 0.2,
-      violations: [
-        {
-          pattern: 'webhook signature mismatch',
-          avoidRule: 'Verify webhook signatures before deploy.',
-        },
-      ],
-    },
-    partnerStrategy: {
-      profile: 'strict_reviewer',
-      verificationMode: 'evidence_first',
-    },
-    partnerReward: {
-      reward: 0,
-    },
-  };
-}
-async function run() {
-  const results = { passed: 0, failed: 0, requirements: {} };
-  const { proofDir, reportJson, reportMd } = resolveProofPaths();
-  const checks = [
-    {
-      id: 'EVOLVE-01',
-      desc: 'evolution-state loads defaults and captures rollback snapshots',
-      fn: () => {
-        const feedbackDir = fs.mkdtempSync(path.join(os.tmpdir(), 'thumbgate-evolution-proof-'));
-        try {
-          process.env.THUMBGATE_FEEDBACK_DIR = feedbackDir;
-          resetModules();
-          const state = require('./evolution-state');
-          const initial = state.readEvolutionState();
-          if (initial.settings.half_life_days !== 7) throw new Error('Expected default half_life_days=7');
-          const accepted = state.applyAcceptedMutation({
-            targetKey: 'half_life_days',
-            nextValue: 9,
-            experimentId: 'exp_proof',
-            summary: 'proof mutation',
-          });
-          if (!accepted.rollbackSnapshot.snapshotId) throw new Error('Expected rollback snapshot id');
-          if (state.readEvolutionState().settings.half_life_days !== 9) throw new Error('Accepted mutation did not persist');
-        } finally {
-          delete process.env.THUMBGATE_FEEDBACK_DIR;
-          resetModules();
-          fs.rmSync(feedbackDir, { recursive: true, force: true });
-        }
-      },
-    },
-    {
-      id: 'EVOLVE-02',
-      desc: 'workspace-evolver accepts improved candidates only when primary and holdout checks pass',
-      fn: () => {
-        const feedbackDir = fs.mkdtempSync(path.join(os.tmpdir(), 'thumbgate-evolution-proof-'));
-        try {
-          process.env.THUMBGATE_FEEDBACK_DIR = feedbackDir;
-          resetModules();
-          const { runWorkspaceEvolution } = require('./workspace-evolver');
-          const { readEvolutionState } = require('./evolution-state');
-          const result = runWorkspaceEvolution({
-            cwd: ROOT,
-            targetName: 'half_life_days',
-            nextValue: 8,
-            primaryCommands: [buildStateCommand('half_life_days', 8)],
-            holdoutCommands: [buildStateCommand('half_life_days', 8)],
-            timeoutMs: 5000,
-          });
-          if (!result.kept) throw new Error('Expected improved candidate to be kept');
-          if (!result.metrics.rollbackSnapshotId) throw new Error('Expected rollback snapshot metadata');
-          if (readEvolutionState().settings.half_life_days !== 8) throw new Error('Accepted evolution state not applied');
-        } finally {
-          delete process.env.THUMBGATE_FEEDBACK_DIR;
-          resetModules();
-          fs.rmSync(feedbackDir, { recursive: true, force: true });
-        }
-      },
-    },
-    {
-      id: 'EVOLVE-03',
-      desc: 'restoreWorkspaceEvolution rolls accepted state back to the previous snapshot',
-      fn: () => {
-        const feedbackDir = fs.mkdtempSync(path.join(os.tmpdir(), 'thumbgate-evolution-proof-'));
-        try {
-          process.env.THUMBGATE_FEEDBACK_DIR = feedbackDir;
-          resetModules();
-          const { runWorkspaceEvolution, restoreWorkspaceEvolution } = require('./workspace-evolver');
-          const { readEvolutionState } = require('./evolution-state');
-          const result = runWorkspaceEvolution({
-            cwd: ROOT,
-            targetName: 'half_life_days',
-            nextValue: 8,
-            primaryCommands: [buildStateCommand('half_life_days', 8)],
-            holdoutCommands: [buildStateCommand('half_life_days', 8)],
-            timeoutMs: 5000,
-          });
-          restoreWorkspaceEvolution(result.metrics.rollbackSnapshotId);
-          if (readEvolutionState().settings.half_life_days !== 7) throw new Error('Rollback did not restore default state');
-        } finally {
-          delete process.env.THUMBGATE_FEEDBACK_DIR;
-          resetModules();
-          fs.rmSync(feedbackDir, { recursive: true, force: true });
-        }
-      },
-    },
-    {
-      id: 'EVOLVE-04',
-      desc: 'autoresearch-runner delegates to workspace evolver and records research metadata plus rollback evidence',
-      fn: async () => {
-        const feedbackDir = fs.mkdtempSync(path.join(os.tmpdir(), 'thumbgate-evolution-proof-'));
-        try {
-          process.env.THUMBGATE_FEEDBACK_DIR = feedbackDir;
-          resetModules();
-          const runner = require('./autoresearch-runner');
-          const result = await runner.runIteration({
-            targetName: 'half_life_days',
-            nextValue: 8,
-            testCommand: buildStateCommand('half_life_days', 8),
-            holdoutCommands: [buildStateCommand('half_life_days', 8)],
-            timeoutMs: 5000,
-            researchQuery: 'rank fusion',
-            searchPapersImpl: async () => [{
-              paperId: '2603.01896',
-              title: 'Agentic Rank Fusion for Research Systems',
-              summary: 'Retrieval fusion for agent workflows.',
-              authors: ['Ada Lovelace'],
-              tags: ['retrieval'],
-              url: 'https://arxiv.org/abs/2603.01896',
-              source: 'huggingface-papers',
-            }],
-          });
-          if (!result.kept) throw new Error('Expected autoresearch iteration to keep the improved candidate');
-          if (result.metrics.researchQuery !== 'rank fusion') throw new Error('Research query metadata missing');
-          if (!result.metrics.researchPackId) throw new Error('Research pack id missing');
-          if (!result.metrics.researchPaperIds.includes('2603.01896')) throw new Error('Research paper id missing');
-          if (!result.metrics.rollbackSnapshotId) throw new Error('Rollback snapshot metadata missing');
-        } finally {
-          delete process.env.THUMBGATE_FEEDBACK_DIR;
-          resetModules();
-          fs.rmSync(feedbackDir, { recursive: true, force: true });
-        }
-      },
-    },
-    // EVOLVE-05: executes one job through async-job-runner while the module at
-    // VERIFICATION_PATH is stubbed so runVerificationLoop returns
-    // makeRejectedVerification(), then asserts that the first experiment returned
-    // by experiment-tracker carries a recommended target and a replay command.
-    {
-      id: 'EVOLVE-05',
-      desc: 'async-job-runner follow-up experiments include a recommended evolution target and replay command',
-      fn: () => {
-        // Scratch feedback directory; removed again in the finally block.
-        const feedbackDir = fs.mkdtempSync(path.join(os.tmpdir(), 'thumbgate-evolution-proof-'));
-        try {
-          // The env var is set and modules are reset BEFORE the require() calls below.
-          // NOTE(review): presumably resetModules() clears cached modules so they pick up
-          // THUMBGATE_FEEDBACK_DIR on re-require — confirm against its definition.
-          process.env.THUMBGATE_FEEDBACK_DIR = feedbackDir;
-          resetModules();
-          // NOTE(review): stubModule is defined outside this chunk; it appears to replace
-          // the verification module's exports with the object given here — confirm.
-          stubModule(VERIFICATION_PATH, {
-            runVerificationLoop: () => makeRejectedVerification(),
-          });
-          const runner = require('./async-job-runner');
-          const tracker = require('./experiment-tracker');
-          runner.executeJob({
-            id: 'verification-failure-job',
-            context: 'webhook signature mismatch',
-            tags: ['billing'],
-            skill: 'billing-guard',
-          });
-          // Only the first loaded experiment is inspected.
-          const experiments = tracker.loadExperiments();
-          const experiment = experiments[0];
-          if (!experiment) throw new Error('Expected queued improvement experiment');
-          if (!experiment.mutation.recommendedTarget) throw new Error('Missing recommendedTarget');
-          // The replay command must mention the workspace evolver script by file name.
-          if (!experiment.mutation.evolutionCommand.includes('workspace-evolver.js')) {
-            throw new Error('Missing workspace evolver replay command');
-          }
-        } finally {
-          // Always undo the env override, reset modules, and delete the scratch directory,
-          // whether the check passed or threw.
-          delete process.env.THUMBGATE_FEEDBACK_DIR;
-          resetModules();
-          fs.rmSync(feedbackDir, { recursive: true, force: true });
-        }
-      },
-    },
-    // EVOLVE-06: asserts that the 'full' verify plan contains a step mentioning
-    // 'prove:evolution', and that recording a 'full' workflow run lists a proof
-    // artifact whose path ends with proof/evolution-report.json.
-    {
-      id: 'EVOLVE-06',
-      desc: 'verify:full includes the evolution proof lane and records the artifact',
-      fn: () => {
-        resetModules();
-        const { buildVerifyPlan, recordVerifyWorkflowRun } = require('./verify-run');
-        const plan = buildVerifyPlan('full');
-        // Flatten each step to "command arg1 arg2 ..." (one step per line) so a plain
-        // substring search can find the lane; steps without args are tolerated.
-        const commands = plan.map((step) => [step.command, ...(step.args || [])].join(' ')).join('\n');
-        if (!commands.includes('prove:evolution')) {
-          throw new Error('verify:full is missing prove:evolution');
-        }
-        // Two scratch directories: one passed as the feedback dir, one as the working dir.
-        const feedbackDir = fs.mkdtempSync(path.join(os.tmpdir(), 'thumbgate-evolution-proof-feedback-'));
-        const cwd = fs.mkdtempSync(path.join(os.tmpdir(), 'thumbgate-evolution-proof-cwd-'));
-        try {
-          const entry = recordVerifyWorkflowRun('full', cwd, feedbackDir);
-          // path.join builds the suffix with the platform's path separator.
-          if (!entry.proofArtifacts.some((artifact) => artifact.endsWith(path.join('proof', 'evolution-report.json')))) {
-            throw new Error('Workflow run missing evolution proof artifact');
-          }
-        } finally {
-          // Remove both scratch directories whether the check passed or threw.
-          fs.rmSync(feedbackDir, { recursive: true, force: true });
-          fs.rmSync(cwd, { recursive: true, force: true });
-        }
-      },
-    },
-  ];
-  console.log('Phase 17: Agent Workspace Evolution — Proof Gate\n');
-  console.log('Checking requirements:\n');
-  for (const check of checks) {
-    try {
-      await check.fn();
-      results.passed++;
-      results.requirements[check.id] = { status: 'pass', desc: check.desc };
-      console.log(`  PASS  ${check.id}: ${check.desc}`);
-    } catch (error) {
-      results.failed++;
-      results.requirements[check.id] = {
-        status: 'fail',
-        desc: check.desc,
-        error: error.message,
-      };
-      console.error(`  FAIL  ${check.id}: ${error.message}`);
-    }
-  }
-  fs.mkdirSync(proofDir, { recursive: true });
-  const report = {
-    phase: '17-agent-workspace-evolution',
-    generatedAt: new Date().toISOString(),
-    passed: results.passed,
-    failed: results.failed,
-    requirements: results.requirements,
-  };
-  fs.writeFileSync(reportJson, `${JSON.stringify(report, null, 2)}\n`);
-  const lines = [
-    '# Agent Workspace Evolution Proof Report',
-    '',
-    `Generated: ${report.generatedAt}`,
-    '',
-    `Summary: ${results.passed} passed, ${results.failed} failed`,
-    '',
-    '## Requirements',
-    '',
-  ];
-  for (const [id, requirement] of Object.entries(results.requirements)) {
-    lines.push(`- [${requirement.status === 'pass' ? 'x' : ' '}] **${id}** — ${requirement.desc}`);
-    if (requirement.error) {
-      lines.push(`  - Error: ${requirement.error}`);
-    }
-  }
-  lines.push('');
-  lines.push('## Evidence');
-  lines.push('');
-  lines.push('- `scripts/evolution-state.js` — local accepted-state overlay + rollback snapshots');
-  lines.push('- `scripts/workspace-evolver.js` — evolve / evaluate / accept / rollback engine');
-  lines.push('- `scripts/autoresearch-runner.js` — shared research-backed mutation loop on top of the evolver');
-  lines.push('- `scripts/prove-evolution.js` — this proof gate');
-  fs.writeFileSync(reportMd, `${lines.join('\n')}\n`);
-  console.log(`\n${results.passed} passed, ${results.failed} failed`);
-  if (results.failed > 0) {
-    process.exitCode = 1;
-  }
-}
-// When this file is executed directly (not loaded via require), run the proof
-// gate; if run() rejects, log the error and terminate with exit code 1.
-if (require.main === module) {
-  run().catch((error) => {
-    console.error(error);
-    process.exit(1);
-  });
-}
-// Expose run() so other modules can invoke the proof gate programmatically.
-module.exports = {
-  run,
-};