thumbgate 1.4.2 → 1.4.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (279)
  1. package/.claude-plugin/README.md +45 -34
  2. package/.claude-plugin/marketplace.json +3 -3
  3. package/.claude-plugin/plugin.json +3 -3
  4. package/.well-known/llms.txt +1 -1
  5. package/.well-known/mcp/server-card.json +1 -1
  6. package/README.md +26 -2
  7. package/adapters/README.md +4 -1
  8. package/adapters/claude/.mcp.json +2 -2
  9. package/adapters/codex/config.toml +2 -2
  10. package/adapters/mcp/server-stdio.js +10 -4
  11. package/adapters/opencode/opencode.json +1 -1
  12. package/bin/cli.js +246 -90
  13. package/config/mcp-allowlists.json +11 -3
  14. package/package.json +184 -21
  15. package/scripts/audit-trail.js +25 -15
  16. package/scripts/auto-wire-hooks.js +127 -0
  17. package/scripts/cli-demo.js +102 -0
  18. package/scripts/cli-schema.js +285 -0
  19. package/scripts/cli-status.js +166 -0
  20. package/scripts/cross-encoder-reranker.js +235 -0
  21. package/scripts/explore-subcommands.js +277 -0
  22. package/scripts/explore.js +569 -0
  23. package/scripts/feedback-loop.js +20 -6
  24. package/scripts/lesson-inference.js +7 -1
  25. package/scripts/lesson-reranker.js +263 -0
  26. package/scripts/lesson-retrieval.js +34 -17
  27. package/scripts/lesson-search.js +69 -0
  28. package/scripts/perplexity-client.js +210 -0
  29. package/scripts/reflector-agent.js +2 -2
  30. package/scripts/statusline-local-stats.js +3 -1
  31. package/scripts/statusline.sh +12 -11
  32. package/src/api/server.js +178 -17
  33. package/src/index.js +3 -0
  34. package/.claude-plugin/bundle/icon.png +0 -0
  35. package/.claude-plugin/bundle/icon.svg +0 -18
  36. package/.claude-plugin/bundle/server/index.js +0 -24
  37. package/adapters/chatgpt/INSTALL.md +0 -138
  38. package/bin/memory.sh +0 -64
  39. package/bin/obsidian-sync.sh +0 -20
  40. package/plugins/amp-skill/INSTALL.md +0 -52
  41. package/plugins/amp-skill/SKILL.md +0 -64
  42. package/plugins/claude-codex-bridge/.claude-plugin/plugin.json +0 -22
  43. package/plugins/claude-codex-bridge/.mcp.json +0 -14
  44. package/plugins/claude-codex-bridge/INSTALL.md +0 -43
  45. package/plugins/claude-codex-bridge/README.md +0 -46
  46. package/plugins/claude-codex-bridge/scripts/codex-bridge.js +0 -286
  47. package/plugins/claude-codex-bridge/skills/adversarial-review/SKILL.md +0 -24
  48. package/plugins/claude-codex-bridge/skills/result/SKILL.md +0 -22
  49. package/plugins/claude-codex-bridge/skills/review/SKILL.md +0 -28
  50. package/plugins/claude-codex-bridge/skills/second-pass/SKILL.md +0 -27
  51. package/plugins/claude-codex-bridge/skills/setup/SKILL.md +0 -21
  52. package/plugins/claude-codex-bridge/skills/status/SKILL.md +0 -19
  53. package/plugins/claude-skill/INSTALL.md +0 -55
  54. package/plugins/claude-skill/SKILL.md +0 -46
  55. package/plugins/codex-profile/.codex-plugin/plugin.json +0 -43
  56. package/plugins/codex-profile/.mcp.json +0 -14
  57. package/plugins/codex-profile/AGENTS.md +0 -20
  58. package/plugins/codex-profile/INSTALL.md +0 -89
  59. package/plugins/codex-profile/README.md +0 -61
  60. package/plugins/cursor-marketplace/.cursor-plugin/plugin.json +0 -23
  61. package/plugins/cursor-marketplace/CHANGELOG.md +0 -30
  62. package/plugins/cursor-marketplace/LICENSE +0 -21
  63. package/plugins/cursor-marketplace/README.md +0 -124
  64. package/plugins/cursor-marketplace/agents/reliability-reviewer.md +0 -31
  65. package/plugins/cursor-marketplace/assets/logo-400x400.png +0 -0
  66. package/plugins/cursor-marketplace/commands/capture-feedback.md +0 -33
  67. package/plugins/cursor-marketplace/commands/check-gates.md +0 -25
  68. package/plugins/cursor-marketplace/commands/show-lessons.md +0 -27
  69. package/plugins/cursor-marketplace/hooks/hooks.json +0 -10
  70. package/plugins/cursor-marketplace/mcp.json +0 -14
  71. package/plugins/cursor-marketplace/rules/feedback-capture.mdc +0 -34
  72. package/plugins/cursor-marketplace/rules/pre-action-gates.mdc +0 -30
  73. package/plugins/cursor-marketplace/rules/session-continuity.mdc +0 -28
  74. package/plugins/cursor-marketplace/scripts/gate-check.sh +0 -21
  75. package/plugins/cursor-marketplace/skills/capture-feedback/SKILL.md +0 -48
  76. package/plugins/cursor-marketplace/skills/prevention-rules/SKILL.md +0 -31
  77. package/plugins/cursor-marketplace/skills/recall-context/SKILL.md +0 -30
  78. package/plugins/cursor-marketplace/skills/search-lessons/SKILL.md +0 -33
  79. package/plugins/gemini-extension/INSTALL.md +0 -92
  80. package/plugins/gemini-extension/gemini_prompt.txt +0 -14
  81. package/plugins/gemini-extension/tool_contract.json +0 -45
  82. package/plugins/opencode-profile/INSTALL.md +0 -57
  83. package/public/assets/instagram-card.png +0 -0
  84. package/public/assets/tiktok-agent-memory.mp4 +0 -0
  85. package/public/blog.html +0 -474
  86. package/public/compare/mem0.html +0 -189
  87. package/public/compare/speclock.html +0 -180
  88. package/public/compare.html +0 -310
  89. package/public/dashboard.html +0 -1100
  90. package/public/guide.html +0 -317
  91. package/public/guides/claude-code-prevent-repeated-mistakes.html +0 -161
  92. package/public/guides/codex-cli-guardrails.html +0 -158
  93. package/public/guides/cursor-prevent-repeated-mistakes.html +0 -161
  94. package/public/guides/pre-action-gates.html +0 -162
  95. package/public/guides/stop-repeated-ai-agent-mistakes.html +0 -159
  96. package/public/index.html +0 -1128
  97. package/public/js/buyer-intent.js +0 -252
  98. package/public/learn/agent-harness-pattern.html +0 -180
  99. package/public/learn/ai-agent-persistent-memory.html +0 -203
  100. package/public/learn/learn.css +0 -45
  101. package/public/learn/mcp-pre-action-gates-explained.html +0 -172
  102. package/public/learn/stop-ai-agent-force-push.html +0 -134
  103. package/public/learn/vibe-coding-safety-net.html +0 -142
  104. package/public/learn.html +0 -274
  105. package/public/lessons.html +0 -967
  106. package/public/llm-context.md +0 -140
  107. package/public/pro.html +0 -1087
  108. package/public/vercel.json +0 -8
  109. package/scripts/a2ui-engine.js +0 -73
  110. package/scripts/adk-consolidator.js +0 -274
  111. package/scripts/agent-security-hardening.js +0 -225
  112. package/scripts/ai-search-visibility.js +0 -142
  113. package/scripts/autonomous-sales-agent.js +0 -39
  114. package/scripts/autoresearch-runner.js +0 -216
  115. package/scripts/background-agent-governance.js +0 -229
  116. package/scripts/behavioral-extraction.js +0 -93
  117. package/scripts/budget-enforcer.js +0 -173
  118. package/scripts/budget-guard.js +0 -173
  119. package/scripts/build-claude-mcpb.js +0 -255
  120. package/scripts/build-codex-plugin.js +0 -152
  121. package/scripts/capture-railway-diagnostics.sh +0 -97
  122. package/scripts/changeset-check.js +0 -372
  123. package/scripts/check-congruence.js +0 -443
  124. package/scripts/computer-use-firewall.js +0 -280
  125. package/scripts/content-engine/linkedin-content-generator.js +0 -154
  126. package/scripts/content-engine/output/linkedin-memento-validation.md +0 -17
  127. package/scripts/content-engine/output/linkedin-posts-2026-04-09.md +0 -175
  128. package/scripts/content-engine/reddit-thread-finder.js +0 -154
  129. package/scripts/context-engine.js +0 -710
  130. package/scripts/daily-digest.js +0 -11
  131. package/scripts/data-governance.js +0 -173
  132. package/scripts/deploy-gcp.sh +0 -44
  133. package/scripts/deploy-policy.js +0 -249
  134. package/scripts/disagreement-mining.js +0 -315
  135. package/scripts/dpo-optimizer.js +0 -206
  136. package/scripts/ensure-repo-bootstrap.js +0 -130
  137. package/scripts/ephemeral-agent-store.js +0 -212
  138. package/scripts/eval-harness.js +0 -56
  139. package/scripts/export-kto-pairs.js +0 -309
  140. package/scripts/export-training.js +0 -446
  141. package/scripts/feedback-fallback.js +0 -111
  142. package/scripts/feedback-inbox-read.js +0 -162
  143. package/scripts/feedback-root-consolidator.js +0 -233
  144. package/scripts/feedback-to-memory.js +0 -185
  145. package/scripts/gate-satisfy.js +0 -42
  146. package/scripts/generate-paperbanana-diagrams.sh +0 -99
  147. package/scripts/generate-pretool-hook.sh +0 -40
  148. package/scripts/github-about.js +0 -430
  149. package/scripts/github-outreach.js +0 -65
  150. package/scripts/gtm-revenue-loop.js +0 -535
  151. package/scripts/hallucination-detector.js +0 -226
  152. package/scripts/hf-papers.js +0 -317
  153. package/scripts/hook-auto-capture.sh +0 -100
  154. package/scripts/hook-stop-pr-thread-check.sh +0 -68
  155. package/scripts/hook-stop-self-score.sh +0 -51
  156. package/scripts/hook-stop-verify-deploy.sh +0 -31
  157. package/scripts/hook-verify-before-done.sh +0 -20
  158. package/scripts/managed-dpo-export.js +0 -91
  159. package/scripts/markdown-escape.js +0 -12
  160. package/scripts/marketing-experiment.js +0 -657
  161. package/scripts/memalign-recall.js +0 -111
  162. package/scripts/memory-migration.js +0 -296
  163. package/scripts/meta-policy.js +0 -190
  164. package/scripts/metered-billing.js +0 -16
  165. package/scripts/model-tier-router.js +0 -310
  166. package/scripts/money-watcher.js +0 -218
  167. package/scripts/multi-hop-recall.js +0 -240
  168. package/scripts/per-step-scoring.js +0 -163
  169. package/scripts/perplexity-marketing.js +0 -466
  170. package/scripts/pii-scanner.js +0 -153
  171. package/scripts/plan-gate.js +0 -154
  172. package/scripts/post-everywhere.js +0 -341
  173. package/scripts/post-to-x-retry.sh +0 -22
  174. package/scripts/post-to-x.js +0 -369
  175. package/scripts/pr-manager.js +0 -421
  176. package/scripts/principle-extractor.js +0 -162
  177. package/scripts/pro-features.js +0 -41
  178. package/scripts/prompt-dlp.js +0 -222
  179. package/scripts/prove-adapters.js +0 -860
  180. package/scripts/prove-attribution.js +0 -361
  181. package/scripts/prove-automation.js +0 -651
  182. package/scripts/prove-autoresearch.js +0 -304
  183. package/scripts/prove-claim-verification.js +0 -277
  184. package/scripts/prove-cloudflare-sandbox.js +0 -161
  185. package/scripts/prove-data-pipeline.js +0 -408
  186. package/scripts/prove-data-quality.js +0 -227
  187. package/scripts/prove-evolution.js +0 -352
  188. package/scripts/prove-harnesses.js +0 -287
  189. package/scripts/prove-intelligence.js +0 -257
  190. package/scripts/prove-lancedb.js +0 -425
  191. package/scripts/prove-local-intelligence.js +0 -340
  192. package/scripts/prove-loop-closure.js +0 -263
  193. package/scripts/prove-packaged-runtime.js +0 -326
  194. package/scripts/prove-predictive-insights.js +0 -355
  195. package/scripts/prove-runtime.js +0 -363
  196. package/scripts/prove-seo-gsd.js +0 -234
  197. package/scripts/prove-settings.js +0 -279
  198. package/scripts/prove-subway-upgrades.js +0 -277
  199. package/scripts/prove-tessl.js +0 -229
  200. package/scripts/prove-training-export.js +0 -325
  201. package/scripts/prove-workflow-contract.js +0 -112
  202. package/scripts/prove-xmemory.js +0 -332
  203. package/scripts/publish-decision.js +0 -159
  204. package/scripts/ralph-loop.js +0 -376
  205. package/scripts/ralph-mode-ci.js +0 -331
  206. package/scripts/reddit-dm-outreach.js +0 -192
  207. package/scripts/reddit-monitor-cron.sh +0 -26
  208. package/scripts/reminder-engine.js +0 -132
  209. package/scripts/revenue-status.js +0 -472
  210. package/scripts/rotate-stripe-webhook-secret.js +0 -314
  211. package/scripts/schedule-manager.js +0 -249
  212. package/scripts/self-healing-check.js +0 -193
  213. package/scripts/shieldcortex-memory-firewall-runner.mjs +0 -53
  214. package/scripts/skill-exporter.js +0 -260
  215. package/scripts/skill-materializer.js +0 -134
  216. package/scripts/skill-packs.js +0 -136
  217. package/scripts/skill-proposer.js +0 -99
  218. package/scripts/skill-quality-tracker.js +0 -282
  219. package/scripts/slow-loop.js +0 -72
  220. package/scripts/social-analytics/db/analytics.sqlite +0 -0
  221. package/scripts/social-analytics/db/schema.sql +0 -32
  222. package/scripts/social-analytics/digest.js +0 -256
  223. package/scripts/social-analytics/engagement-audit.js +0 -185
  224. package/scripts/social-analytics/generate-instagram-card.js +0 -97
  225. package/scripts/social-analytics/instagram-thumbgate-post.js +0 -111
  226. package/scripts/social-analytics/install-growth-automation.js +0 -114
  227. package/scripts/social-analytics/load-env.js +0 -77
  228. package/scripts/social-analytics/mcp-server.js +0 -289
  229. package/scripts/social-analytics/normalizer.js +0 -580
  230. package/scripts/social-analytics/notify.js +0 -162
  231. package/scripts/social-analytics/poll-all.js +0 -107
  232. package/scripts/social-analytics/pollers/github.js +0 -195
  233. package/scripts/social-analytics/pollers/instagram.js +0 -253
  234. package/scripts/social-analytics/pollers/linkedin.js +0 -340
  235. package/scripts/social-analytics/pollers/plausible.js +0 -245
  236. package/scripts/social-analytics/pollers/reddit.js +0 -306
  237. package/scripts/social-analytics/pollers/threads.js +0 -233
  238. package/scripts/social-analytics/pollers/tiktok.js +0 -203
  239. package/scripts/social-analytics/pollers/x.js +0 -227
  240. package/scripts/social-analytics/pollers/youtube.js +0 -304
  241. package/scripts/social-analytics/pollers/zernio.js +0 -183
  242. package/scripts/social-analytics/publish-instagram-thumbgate.js +0 -104
  243. package/scripts/social-analytics/publish-thumbgate-launch.js +0 -322
  244. package/scripts/social-analytics/publishers/devto.js +0 -122
  245. package/scripts/social-analytics/publishers/instagram.js +0 -317
  246. package/scripts/social-analytics/publishers/linkedin.js +0 -294
  247. package/scripts/social-analytics/publishers/reddit.js +0 -385
  248. package/scripts/social-analytics/publishers/threads.js +0 -275
  249. package/scripts/social-analytics/publishers/tiktok.js +0 -217
  250. package/scripts/social-analytics/publishers/x.js +0 -259
  251. package/scripts/social-analytics/publishers/youtube.js +0 -223
  252. package/scripts/social-analytics/publishers/zernio.js +0 -539
  253. package/scripts/social-analytics/reconcile-thumbgate-campaign.js +0 -165
  254. package/scripts/social-analytics/run-digest.js +0 -34
  255. package/scripts/social-analytics/schedule-thumbgate-campaign.js +0 -275
  256. package/scripts/social-analytics/store.js +0 -455
  257. package/scripts/social-analytics/sync-launch-assets.js +0 -185
  258. package/scripts/social-analytics/utm.js +0 -143
  259. package/scripts/social-pipeline.js +0 -2626
  260. package/scripts/social-post-hourly.js +0 -228
  261. package/scripts/social-quality-gate.js +0 -134
  262. package/scripts/social-reply-monitor.js +0 -592
  263. package/scripts/status-dashboard.js +0 -155
  264. package/scripts/stripe-live-status.js +0 -115
  265. package/scripts/subagent-profiles.js +0 -79
  266. package/scripts/sync-branch-protection.js +0 -340
  267. package/scripts/sync-gh-secrets-from-env.sh +0 -70
  268. package/scripts/sync-github-about.js +0 -55
  269. package/scripts/sync-version.js +0 -479
  270. package/scripts/synthetic-dpo.js +0 -234
  271. package/scripts/tessl-export.js +0 -369
  272. package/scripts/test-coverage.js +0 -128
  273. package/scripts/thumbgate_session_start.sh +0 -32
  274. package/scripts/train_from_feedback.py +0 -929
  275. package/scripts/validate-feedback.js +0 -581
  276. package/scripts/verify-obsidian-setup.sh +0 -269
  277. package/scripts/verify-run.js +0 -269
  278. package/scripts/weekly-auto-post.js +0 -124
  279. package/scripts/x-autonomous-marketing.js +0 -139
@@ -1,361 +0,0 @@
1
- #!/usr/bin/env node
2
- 'use strict';
3
-
4
- /**
5
- * prove-attribution.js — Phase 6 gate proof script.
6
- *
7
- * Generates proof/attribution-report.md and proof/attribution-report.json
8
- * documenting per-requirement evidence for ATTR-01, ATTR-02, ATTR-03.
9
- *
10
- * Mirrors the prove-rlaif.js structure exactly (mkdtempSync / env override /
11
- * execSync node --test / write JSON + markdown report).
12
- *
13
- * Exit 0 if no 'fail' statuses; exit 1 if any 'fail'.
14
- */
15
-
16
- const fs = require('fs');
17
- const path = require('path');
18
- const os = require('os');
19
- const { execSync } = require('child_process');
20
- const { escapeMarkdownTableCell } = require('./markdown-escape');
21
- const { ensureDir } = require('./fs-utils');
22
-
23
- const ROOT = path.join(__dirname, '..');
24
-
25
- // Phase 5 node-runner test baseline (before Phase 6 attribution tests)
26
- const PHASE5_BASELINE = 142;
27
-
28
-
29
- async function runProof(options = {}) {
30
- const proofDir = options.proofDir || process.env.THUMBGATE_PROOF_DIR || path.join(ROOT, 'proof');
31
- const report = {
32
- phase: '06-feedback-attribution',
33
- generated: new Date().toISOString(),
34
- requirements: {},
35
- summary: { passed: 0, failed: 0 },
36
- };
37
-
38
- function addResult(reqId, reqStatus, evidence) {
39
- report.requirements[reqId] = { status: reqStatus, evidence };
40
- if (reqStatus === 'pass') report.summary.passed += 1;
41
- else report.summary.failed += 1;
42
- }
43
-
44
- // ─────────────────────────────────────────────────────────────────────────
45
- // ATTR-01: recordAction + attributeFeedback correctness
46
- // - require feedback-attribution.js with tmpDir env overrides
47
- // - call recordAction('Bash', '{"command":"git push --force"}')
48
- // - assert result.ok === true, result.action.intent === 'git-risk'
49
- // - call attributeFeedback('negative', 'bad git push force broke main')
50
- // - assert fs.existsSync(THUMBGATE_FEEDBACK_ATTRIBUTIONS path)
51
- // - parse JSONL, assert attribution_id and signal === 'negative'
52
- // ─────────────────────────────────────────────────────────────────────────
53
- const tmpDir01 = fs.mkdtempSync(path.join(os.tmpdir(), 'prove-attr01-'));
54
- let attr01Status = 'fail';
55
- let attr01Evidence = '';
56
- try {
57
- process.env.THUMBGATE_ACTION_LOG = path.join(tmpDir01, 'action-log.jsonl');
58
- process.env.THUMBGATE_FEEDBACK_ATTRIBUTIONS = path.join(tmpDir01, 'feedback-attributions.jsonl');
59
- process.env.THUMBGATE_ATTRIBUTED_FEEDBACK = path.join(tmpDir01, 'attributed-feedback.jsonl');
60
-
61
- // Invalidate module cache so env vars take effect
62
- for (const key of Object.keys(require.cache)) {
63
- if (key.includes('feedback-attribution')) {
64
- delete require.cache[key];
65
- }
66
- }
67
- const { recordAction, attributeFeedback } = require('./feedback-attribution');
68
-
69
- // Test recordAction
70
- const recResult = recordAction('Bash', '{"command":"git push --force"}');
71
- const recOk = recResult.ok === true && recResult.action.intent === 'git-risk';
72
- const actionLogExists = fs.existsSync(path.join(tmpDir01, 'action-log.jsonl'));
73
-
74
- // Test attributeFeedback — negative signal should write attributions
75
- const attrResult = attributeFeedback('negative', 'bad git push force broke main');
76
- const attrOk = attrResult.ok === true;
77
- const attributionsPath = path.join(tmpDir01, 'feedback-attributions.jsonl');
78
- const attributionsExist = fs.existsSync(attributionsPath);
79
-
80
- let attributionValid = false;
81
- if (attributionsExist) {
82
- const lines = fs.readFileSync(attributionsPath, 'utf8').trim().split('\n').filter(Boolean);
83
- if (lines.length > 0) {
84
- try {
85
- const parsed = JSON.parse(lines[lines.length - 1]);
86
- attributionValid = typeof parsed.attribution_id === 'string' &&
87
- parsed.attribution_id.startsWith('att_') &&
88
- parsed.signal === 'negative';
89
- } catch (_) {
90
- attributionValid = false;
91
- }
92
- }
93
- }
94
-
95
- if (recOk && actionLogExists && attrOk && attributionsExist && attributionValid) {
96
- attr01Status = 'pass';
97
- attr01Evidence =
98
- `recordAction('Bash', git push --force) returned ok=true, intent=git-risk. ` +
99
- `action-log.jsonl written to ${tmpDir01}. ` +
100
- `action_id=${recResult.action.action_id}, risk_score=${recResult.action.risk_score}. ` +
101
- `attributeFeedback('negative', ...) returned ok=true, attributedCount=${attrResult.attributedCount}. ` +
102
- `feedback-attributions.jsonl written. attribution_id=${attrResult.attributionId || 'written'}, signal=negative. ` +
103
- `Module: scripts/feedback-attribution.js. Pure offline JSONL-based attribution.`;
104
- } else {
105
- const issues = [];
106
- if (!recOk) issues.push(`recordAction returned ok=${recResult.ok}, intent=${recResult.action ? recResult.action.intent : 'none'} (expected git-risk)`);
107
- if (!actionLogExists) issues.push(`action-log.jsonl not written to ${tmpDir01}`);
108
- if (!attrOk) issues.push(`attributeFeedback returned ok=${attrResult.ok}`);
109
- if (!attributionsExist) issues.push(`feedback-attributions.jsonl not written`);
110
- if (!attributionValid) issues.push(`attribution entry missing attribution_id or signal`);
111
- attr01Status = 'fail';
112
- attr01Evidence = `ATTR-01 smoke test failed: ${issues.join('; ')}`;
113
- }
114
- } catch (err) {
115
- attr01Status = 'fail';
116
- attr01Evidence = `ATTR-01 threw: ${err.message}`;
117
- } finally {
118
- try { fs.rmSync(tmpDir01, { recursive: true, force: true }); } catch (_) {}
119
- delete process.env.THUMBGATE_ACTION_LOG;
120
- delete process.env.THUMBGATE_FEEDBACK_ATTRIBUTIONS;
121
- delete process.env.THUMBGATE_ATTRIBUTED_FEEDBACK;
122
- }
123
- addResult('ATTR-01', attr01Status, attr01Evidence);
124
-
125
- // ─────────────────────────────────────────────────────────────────────────
126
- // ATTR-02: evaluatePretool allow/block/warn paths
127
- // - require hybrid-feedback-context.js with tmpDir env overrides
128
- // - seed attributed-feedback.jsonl with 3 negative entries for Bash + git push force
129
- // - call buildHybridState() — should detect recurringNegativePatterns with count >= 3
130
- // - call evaluatePretoolFromState(state, 'Bash', 'git push force main') → assert mode === 'block'
131
- // - call evaluatePretoolFromState(state, 'Read', 'some-unrelated-file.md') → assert mode === 'allow'
132
- // ─────────────────────────────────────────────────────────────────────────
133
- const tmpDir02 = fs.mkdtempSync(path.join(os.tmpdir(), 'prove-attr02-'));
134
- let attr02Status = 'fail';
135
- let attr02Evidence = '';
136
- try {
137
- process.env.THUMBGATE_FEEDBACK_LOG = path.join(tmpDir02, 'feedback-log.jsonl');
138
- process.env.THUMBGATE_ATTRIBUTED_FEEDBACK = path.join(tmpDir02, 'attributed-feedback.jsonl');
139
- process.env.THUMBGATE_GUARDS_PATH = path.join(tmpDir02, 'pretool-guards.json');
140
-
141
- // Seed attributed-feedback.jsonl with 3 identical negative entries
142
- const attrFeedbackPath = path.join(tmpDir02, 'attributed-feedback.jsonl');
143
- const ts = new Date().toISOString();
144
- const seedEntries = [
145
- {
146
- timestamp: ts,
147
- signal: 'negative',
148
- feedback: 'negative',
149
- tool_name: 'Bash',
150
- context: 'git push force main branch override',
151
- source: 'attributed',
152
- },
153
- {
154
- timestamp: ts,
155
- signal: 'negative',
156
- feedback: 'negative',
157
- tool_name: 'Bash',
158
- context: 'git push force main branch override',
159
- source: 'attributed',
160
- },
161
- {
162
- timestamp: ts,
163
- signal: 'negative',
164
- feedback: 'negative',
165
- tool_name: 'Bash',
166
- context: 'git push force main branch override',
167
- source: 'attributed',
168
- },
169
- ];
170
- fs.mkdirSync(path.dirname(attrFeedbackPath), { recursive: true });
171
- fs.writeFileSync(
172
- attrFeedbackPath,
173
- seedEntries.map((e) => JSON.stringify(e)).join('\n') + '\n',
174
- );
175
-
176
- // Invalidate module cache
177
- for (const key of Object.keys(require.cache)) {
178
- if (key.includes('hybrid-feedback-context')) {
179
- delete require.cache[key];
180
- }
181
- }
182
- const { buildHybridState, evaluatePretoolFromState } = require('./hybrid-feedback-context');
183
-
184
- const state = buildHybridState({
185
- feedbackLogPath: path.join(tmpDir02, 'feedback-log.jsonl'),
186
- attributedFeedbackPath: attrFeedbackPath,
187
- });
188
-
189
- const hasRecurring = state.recurringNegativePatterns.length > 0;
190
- const topCount = hasRecurring ? state.recurringNegativePatterns[0].count : 0;
191
- const countOk = topCount >= 3;
192
-
193
- // block path: git push force matches pattern
194
- const blockResult = evaluatePretoolFromState(state, 'Bash', 'git push force main');
195
- const blockOk = blockResult.mode === 'block';
196
-
197
- // allow path: completely different tool+input
198
- const allowResult = evaluatePretoolFromState(state, 'Read', 'some-unrelated-file.md');
199
- const allowOk = allowResult.mode === 'allow';
200
-
201
- if (hasRecurring && countOk && blockOk && allowOk) {
202
- attr02Status = 'pass';
203
- attr02Evidence =
204
- `buildHybridState() detected ${state.recurringNegativePatterns.length} recurring pattern(s). ` +
205
- `Top pattern count=${topCount} (>= 3 → critical). ` +
206
- `evaluatePretoolFromState('Bash', 'git push force main') → mode=${blockResult.mode}. ` +
207
- `evaluatePretoolFromState('Read', 'some-unrelated-file.md') → mode=${allowResult.mode}. ` +
208
- `block + allow paths verified. No false positive for unrelated Read tool. ` +
209
- `Module: scripts/hybrid-feedback-context.js. hasTwoKeywordHits enforces no-false-positive invariant.`;
210
- } else {
211
- const issues = [];
212
- if (!hasRecurring) issues.push(`no recurring negative patterns detected (expected >= 1 from 3 identical entries)`);
213
- if (!countOk) issues.push(`top pattern count=${topCount} (expected >= 3)`);
214
- if (!blockOk) issues.push(`block path returned mode=${blockResult.mode} (expected block)`);
215
- if (!allowOk) issues.push(`allow path returned mode=${allowResult.mode} (expected allow)`);
216
- attr02Status = 'fail';
217
- attr02Evidence = `ATTR-02 smoke test failed: ${issues.join('; ')}`;
218
- }
219
- } catch (err) {
220
- attr02Status = 'fail';
221
- attr02Evidence = `ATTR-02 threw: ${err.message}`;
222
- } finally {
223
- try { fs.rmSync(tmpDir02, { recursive: true, force: true }); } catch (_) {}
224
- delete process.env.THUMBGATE_FEEDBACK_LOG;
225
- delete process.env.THUMBGATE_ATTRIBUTED_FEEDBACK;
226
- delete process.env.THUMBGATE_GUARDS_PATH;
227
- }
228
- addResult('ATTR-02', attr02Status, attr02Evidence);
229
-
230
- // ─────────────────────────────────────────────────────────────────────────
231
- // ATTR-03: node --test on both attribution test files exits 0
232
- // execSync('node --test tests/feedback-attribution.test.js tests/hybrid-feedback-context.test.js')
233
- // Parse stdout to count passing tests vs baseline
234
- // status: 'pass' if exit code 0 and pass count >= 1
235
- // ─────────────────────────────────────────────────────────────────────────
236
- let attr03Status = 'fail';
237
- let attr03Evidence = '';
238
- let attrPassCount = 0;
239
- let attrFailCount = 0;
240
- try {
241
- const testOutput = execSync(
242
- 'node --test tests/feedback-attribution.test.js tests/hybrid-feedback-context.test.js 2>&1',
243
- { cwd: ROOT, timeout: 60000, encoding: 'utf-8' },
244
- );
245
-
246
- const passMatch = testOutput.match(/pass\s+(\d+)/);
247
- const failMatch = testOutput.match(/fail\s+(\d+)/);
248
- attrPassCount = passMatch ? parseInt(passMatch[1], 10) : 0;
249
- attrFailCount = failMatch ? parseInt(failMatch[1], 10) : 0;
250
-
251
- const meetsRequirement = attrPassCount >= 1 && attrFailCount === 0;
252
-
253
- if (meetsRequirement) {
254
- attr03Status = 'pass';
255
- attr03Evidence =
256
- `node --test (2 attribution test files): pass=${attrPassCount}, fail=${attrFailCount}. ` +
257
- `Phase 5 baseline (test:api + test:proof + test:rlaif): ${PHASE5_BASELINE} tests. ` +
258
- `Phase 6 adds ${attrPassCount} new attribution tests. ` +
259
- `Total with attribution: ${PHASE5_BASELINE + attrPassCount} tests (node-runner only). ` +
260
- `Files: tests/feedback-attribution.test.js (recordAction, attributeFeedback), ` +
261
- `tests/hybrid-feedback-context.test.js (evaluatePretool, buildHybridState, compileGuardArtifact). ` +
262
- `All tests use fs.mkdtempSync() tmpdir isolation — zero production feedback dirs touched.`;
263
- } else {
264
- attr03Status = 'fail';
265
- attr03Evidence =
266
- `node --test attribution files: pass=${attrPassCount}, fail=${attrFailCount}. ` +
267
- `Expected >= 1 passing and 0 failures. ` +
268
- `${attrFailCount > 0 ? `${attrFailCount} test(s) failing.` : `Only ${attrPassCount} tests passing (need >= 1).`}`;
269
- }
270
- } catch (err) {
271
- const output = err.stdout || err.stderr || err.message || '';
272
- const outStr = String(output);
273
- const passMatch = outStr.match(/pass\s+(\d+)/);
274
- const failMatch = outStr.match(/fail\s+(\d+)/);
275
- attrPassCount = passMatch ? parseInt(passMatch[1], 10) : 0;
276
- attrFailCount = failMatch ? parseInt(failMatch[1], 10) : 1;
277
- attr03Status = 'fail';
278
- attr03Evidence = `node --test attribution files exited non-zero (${attrFailCount} failures). Output: ${outStr.slice(0, 500)}`;
279
- }
280
- addResult('ATTR-03', attr03Status, attr03Evidence);
281
-
282
- // ─────────────────────────────────────────────────────────────────────────
283
- // Write proof artifacts
284
- // ─────────────────────────────────────────────────────────────────────────
285
- ensureDir(proofDir);
286
-
287
- const jsonPath = path.join(proofDir, 'attribution-report.json');
288
- fs.writeFileSync(jsonPath, `${JSON.stringify(report, null, 2)}\n`);
289
-
290
- const mdLines = [
291
- '# Feedback Attribution — Proof Report',
292
- '',
293
- `Generated: ${report.generated}`,
294
- `Phase: ${report.phase}`,
295
- '',
296
- `**Passed: ${report.summary.passed} | Failed: ${report.summary.failed}**`,
297
- '',
298
- '## Requirements',
299
- '',
300
- '| Requirement | Status | Evidence |',
301
- '|-------------|--------|----------|',
302
- ...Object.entries(report.requirements).map(
303
- ([reqId, { status: s, evidence }]) =>
304
- `| ${reqId} | ${s.toUpperCase()} | ${escapeMarkdownTableCell(evidence)} |`
305
- ),
306
- '',
307
- '## Requirement Details',
308
- '',
309
- ];
310
-
311
- for (const [reqId, { status: s, evidence }] of Object.entries(report.requirements)) {
312
- mdLines.push(`### ${reqId} — ${s.toUpperCase()}`);
313
- mdLines.push('');
314
- mdLines.push(evidence);
315
- mdLines.push('');
316
- }
317
-
318
- mdLines.push('## Test Count Delta');
319
- mdLines.push('');
320
- mdLines.push('| Baseline (Phase 5 final) | Phase 6 Attribution Addition | Total (node-runner) |');
321
- mdLines.push('|--------------------------|------------------------------|---------------------|');
322
- mdLines.push(`| ${PHASE5_BASELINE} tests | +${attrPassCount} attribution tests (2 test files) | ${PHASE5_BASELINE + attrPassCount} |`);
323
- mdLines.push('');
324
- mdLines.push('Phase 6 (plan-03) added attribution test coverage:');
325
- mdLines.push('- `tests/feedback-attribution.test.js` — recordAction(), attributeFeedback() (5 tests)');
326
- mdLines.push('- `tests/hybrid-feedback-context.test.js` — evaluatePretool, buildHybridState, compileGuardArtifact (16 tests)');
327
- mdLines.push('');
328
- mdLines.push('All tests use `fs.mkdtempSync()` tmpdir isolation. Zero production feedback dirs touched.');
329
- mdLines.push('');
330
- mdLines.push('## Summary');
331
- mdLines.push('');
332
- mdLines.push(`${report.summary.passed}/3 requirements passed.`);
333
- mdLines.push('');
334
-
335
- const mdPath = path.join(proofDir, 'attribution-report.md');
336
- fs.writeFileSync(mdPath, `${mdLines.join('\n')}\n`);
337
-
338
- console.log(`Proof written to ${mdPath}`);
339
- console.log(` and ${jsonPath}`);
340
- console.log('');
341
- console.log(JSON.stringify(report.summary, null, 2));
342
-
343
- const hasFail = report.summary.failed > 0;
344
- if (hasFail) {
345
- process.exitCode = 1;
346
- console.error(`\nFAIL — one or more requirements did not pass. See ${mdPath} for details.`);
347
- } else {
348
- console.log('\nPASS — all requirements satisfied.');
349
- }
350
-
351
- return report;
352
- }
353
-
354
- module.exports = { runProof };
355
-
356
- if (require.main === module) {
357
- runProof().catch((err) => {
358
- console.error('Fatal error in prove-attribution.js:', err);
359
- process.exitCode = 1;
360
- });
361
- }