thumbgate 1.4.2 → 1.4.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (279) hide show
  1. package/.claude-plugin/README.md +45 -34
  2. package/.claude-plugin/marketplace.json +3 -3
  3. package/.claude-plugin/plugin.json +3 -3
  4. package/.well-known/llms.txt +1 -1
  5. package/.well-known/mcp/server-card.json +1 -1
  6. package/README.md +26 -2
  7. package/adapters/README.md +4 -1
  8. package/adapters/claude/.mcp.json +2 -2
  9. package/adapters/codex/config.toml +2 -2
  10. package/adapters/mcp/server-stdio.js +10 -4
  11. package/adapters/opencode/opencode.json +1 -1
  12. package/bin/cli.js +246 -90
  13. package/config/mcp-allowlists.json +11 -3
  14. package/package.json +184 -21
  15. package/scripts/audit-trail.js +25 -15
  16. package/scripts/auto-wire-hooks.js +127 -0
  17. package/scripts/cli-demo.js +102 -0
  18. package/scripts/cli-schema.js +285 -0
  19. package/scripts/cli-status.js +166 -0
  20. package/scripts/cross-encoder-reranker.js +235 -0
  21. package/scripts/explore-subcommands.js +277 -0
  22. package/scripts/explore.js +569 -0
  23. package/scripts/feedback-loop.js +20 -6
  24. package/scripts/lesson-inference.js +7 -1
  25. package/scripts/lesson-reranker.js +263 -0
  26. package/scripts/lesson-retrieval.js +34 -17
  27. package/scripts/lesson-search.js +69 -0
  28. package/scripts/perplexity-client.js +210 -0
  29. package/scripts/reflector-agent.js +2 -2
  30. package/scripts/statusline-local-stats.js +3 -1
  31. package/scripts/statusline.sh +12 -11
  32. package/src/api/server.js +178 -17
  33. package/src/index.js +3 -0
  34. package/.claude-plugin/bundle/icon.png +0 -0
  35. package/.claude-plugin/bundle/icon.svg +0 -18
  36. package/.claude-plugin/bundle/server/index.js +0 -24
  37. package/adapters/chatgpt/INSTALL.md +0 -138
  38. package/bin/memory.sh +0 -64
  39. package/bin/obsidian-sync.sh +0 -20
  40. package/plugins/amp-skill/INSTALL.md +0 -52
  41. package/plugins/amp-skill/SKILL.md +0 -64
  42. package/plugins/claude-codex-bridge/.claude-plugin/plugin.json +0 -22
  43. package/plugins/claude-codex-bridge/.mcp.json +0 -14
  44. package/plugins/claude-codex-bridge/INSTALL.md +0 -43
  45. package/plugins/claude-codex-bridge/README.md +0 -46
  46. package/plugins/claude-codex-bridge/scripts/codex-bridge.js +0 -286
  47. package/plugins/claude-codex-bridge/skills/adversarial-review/SKILL.md +0 -24
  48. package/plugins/claude-codex-bridge/skills/result/SKILL.md +0 -22
  49. package/plugins/claude-codex-bridge/skills/review/SKILL.md +0 -28
  50. package/plugins/claude-codex-bridge/skills/second-pass/SKILL.md +0 -27
  51. package/plugins/claude-codex-bridge/skills/setup/SKILL.md +0 -21
  52. package/plugins/claude-codex-bridge/skills/status/SKILL.md +0 -19
  53. package/plugins/claude-skill/INSTALL.md +0 -55
  54. package/plugins/claude-skill/SKILL.md +0 -46
  55. package/plugins/codex-profile/.codex-plugin/plugin.json +0 -43
  56. package/plugins/codex-profile/.mcp.json +0 -14
  57. package/plugins/codex-profile/AGENTS.md +0 -20
  58. package/plugins/codex-profile/INSTALL.md +0 -89
  59. package/plugins/codex-profile/README.md +0 -61
  60. package/plugins/cursor-marketplace/.cursor-plugin/plugin.json +0 -23
  61. package/plugins/cursor-marketplace/CHANGELOG.md +0 -30
  62. package/plugins/cursor-marketplace/LICENSE +0 -21
  63. package/plugins/cursor-marketplace/README.md +0 -124
  64. package/plugins/cursor-marketplace/agents/reliability-reviewer.md +0 -31
  65. package/plugins/cursor-marketplace/assets/logo-400x400.png +0 -0
  66. package/plugins/cursor-marketplace/commands/capture-feedback.md +0 -33
  67. package/plugins/cursor-marketplace/commands/check-gates.md +0 -25
  68. package/plugins/cursor-marketplace/commands/show-lessons.md +0 -27
  69. package/plugins/cursor-marketplace/hooks/hooks.json +0 -10
  70. package/plugins/cursor-marketplace/mcp.json +0 -14
  71. package/plugins/cursor-marketplace/rules/feedback-capture.mdc +0 -34
  72. package/plugins/cursor-marketplace/rules/pre-action-gates.mdc +0 -30
  73. package/plugins/cursor-marketplace/rules/session-continuity.mdc +0 -28
  74. package/plugins/cursor-marketplace/scripts/gate-check.sh +0 -21
  75. package/plugins/cursor-marketplace/skills/capture-feedback/SKILL.md +0 -48
  76. package/plugins/cursor-marketplace/skills/prevention-rules/SKILL.md +0 -31
  77. package/plugins/cursor-marketplace/skills/recall-context/SKILL.md +0 -30
  78. package/plugins/cursor-marketplace/skills/search-lessons/SKILL.md +0 -33
  79. package/plugins/gemini-extension/INSTALL.md +0 -92
  80. package/plugins/gemini-extension/gemini_prompt.txt +0 -14
  81. package/plugins/gemini-extension/tool_contract.json +0 -45
  82. package/plugins/opencode-profile/INSTALL.md +0 -57
  83. package/public/assets/instagram-card.png +0 -0
  84. package/public/assets/tiktok-agent-memory.mp4 +0 -0
  85. package/public/blog.html +0 -474
  86. package/public/compare/mem0.html +0 -189
  87. package/public/compare/speclock.html +0 -180
  88. package/public/compare.html +0 -310
  89. package/public/dashboard.html +0 -1100
  90. package/public/guide.html +0 -317
  91. package/public/guides/claude-code-prevent-repeated-mistakes.html +0 -161
  92. package/public/guides/codex-cli-guardrails.html +0 -158
  93. package/public/guides/cursor-prevent-repeated-mistakes.html +0 -161
  94. package/public/guides/pre-action-gates.html +0 -162
  95. package/public/guides/stop-repeated-ai-agent-mistakes.html +0 -159
  96. package/public/index.html +0 -1128
  97. package/public/js/buyer-intent.js +0 -252
  98. package/public/learn/agent-harness-pattern.html +0 -180
  99. package/public/learn/ai-agent-persistent-memory.html +0 -203
  100. package/public/learn/learn.css +0 -45
  101. package/public/learn/mcp-pre-action-gates-explained.html +0 -172
  102. package/public/learn/stop-ai-agent-force-push.html +0 -134
  103. package/public/learn/vibe-coding-safety-net.html +0 -142
  104. package/public/learn.html +0 -274
  105. package/public/lessons.html +0 -967
  106. package/public/llm-context.md +0 -140
  107. package/public/pro.html +0 -1087
  108. package/public/vercel.json +0 -8
  109. package/scripts/a2ui-engine.js +0 -73
  110. package/scripts/adk-consolidator.js +0 -274
  111. package/scripts/agent-security-hardening.js +0 -225
  112. package/scripts/ai-search-visibility.js +0 -142
  113. package/scripts/autonomous-sales-agent.js +0 -39
  114. package/scripts/autoresearch-runner.js +0 -216
  115. package/scripts/background-agent-governance.js +0 -229
  116. package/scripts/behavioral-extraction.js +0 -93
  117. package/scripts/budget-enforcer.js +0 -173
  118. package/scripts/budget-guard.js +0 -173
  119. package/scripts/build-claude-mcpb.js +0 -255
  120. package/scripts/build-codex-plugin.js +0 -152
  121. package/scripts/capture-railway-diagnostics.sh +0 -97
  122. package/scripts/changeset-check.js +0 -372
  123. package/scripts/check-congruence.js +0 -443
  124. package/scripts/computer-use-firewall.js +0 -280
  125. package/scripts/content-engine/linkedin-content-generator.js +0 -154
  126. package/scripts/content-engine/output/linkedin-memento-validation.md +0 -17
  127. package/scripts/content-engine/output/linkedin-posts-2026-04-09.md +0 -175
  128. package/scripts/content-engine/reddit-thread-finder.js +0 -154
  129. package/scripts/context-engine.js +0 -710
  130. package/scripts/daily-digest.js +0 -11
  131. package/scripts/data-governance.js +0 -173
  132. package/scripts/deploy-gcp.sh +0 -44
  133. package/scripts/deploy-policy.js +0 -249
  134. package/scripts/disagreement-mining.js +0 -315
  135. package/scripts/dpo-optimizer.js +0 -206
  136. package/scripts/ensure-repo-bootstrap.js +0 -130
  137. package/scripts/ephemeral-agent-store.js +0 -212
  138. package/scripts/eval-harness.js +0 -56
  139. package/scripts/export-kto-pairs.js +0 -309
  140. package/scripts/export-training.js +0 -446
  141. package/scripts/feedback-fallback.js +0 -111
  142. package/scripts/feedback-inbox-read.js +0 -162
  143. package/scripts/feedback-root-consolidator.js +0 -233
  144. package/scripts/feedback-to-memory.js +0 -185
  145. package/scripts/gate-satisfy.js +0 -42
  146. package/scripts/generate-paperbanana-diagrams.sh +0 -99
  147. package/scripts/generate-pretool-hook.sh +0 -40
  148. package/scripts/github-about.js +0 -430
  149. package/scripts/github-outreach.js +0 -65
  150. package/scripts/gtm-revenue-loop.js +0 -535
  151. package/scripts/hallucination-detector.js +0 -226
  152. package/scripts/hf-papers.js +0 -317
  153. package/scripts/hook-auto-capture.sh +0 -100
  154. package/scripts/hook-stop-pr-thread-check.sh +0 -68
  155. package/scripts/hook-stop-self-score.sh +0 -51
  156. package/scripts/hook-stop-verify-deploy.sh +0 -31
  157. package/scripts/hook-verify-before-done.sh +0 -20
  158. package/scripts/managed-dpo-export.js +0 -91
  159. package/scripts/markdown-escape.js +0 -12
  160. package/scripts/marketing-experiment.js +0 -657
  161. package/scripts/memalign-recall.js +0 -111
  162. package/scripts/memory-migration.js +0 -296
  163. package/scripts/meta-policy.js +0 -190
  164. package/scripts/metered-billing.js +0 -16
  165. package/scripts/model-tier-router.js +0 -310
  166. package/scripts/money-watcher.js +0 -218
  167. package/scripts/multi-hop-recall.js +0 -240
  168. package/scripts/per-step-scoring.js +0 -163
  169. package/scripts/perplexity-marketing.js +0 -466
  170. package/scripts/pii-scanner.js +0 -153
  171. package/scripts/plan-gate.js +0 -154
  172. package/scripts/post-everywhere.js +0 -341
  173. package/scripts/post-to-x-retry.sh +0 -22
  174. package/scripts/post-to-x.js +0 -369
  175. package/scripts/pr-manager.js +0 -421
  176. package/scripts/principle-extractor.js +0 -162
  177. package/scripts/pro-features.js +0 -41
  178. package/scripts/prompt-dlp.js +0 -222
  179. package/scripts/prove-adapters.js +0 -860
  180. package/scripts/prove-attribution.js +0 -361
  181. package/scripts/prove-automation.js +0 -651
  182. package/scripts/prove-autoresearch.js +0 -304
  183. package/scripts/prove-claim-verification.js +0 -277
  184. package/scripts/prove-cloudflare-sandbox.js +0 -161
  185. package/scripts/prove-data-pipeline.js +0 -408
  186. package/scripts/prove-data-quality.js +0 -227
  187. package/scripts/prove-evolution.js +0 -352
  188. package/scripts/prove-harnesses.js +0 -287
  189. package/scripts/prove-intelligence.js +0 -257
  190. package/scripts/prove-lancedb.js +0 -425
  191. package/scripts/prove-local-intelligence.js +0 -340
  192. package/scripts/prove-loop-closure.js +0 -263
  193. package/scripts/prove-packaged-runtime.js +0 -326
  194. package/scripts/prove-predictive-insights.js +0 -355
  195. package/scripts/prove-runtime.js +0 -363
  196. package/scripts/prove-seo-gsd.js +0 -234
  197. package/scripts/prove-settings.js +0 -279
  198. package/scripts/prove-subway-upgrades.js +0 -277
  199. package/scripts/prove-tessl.js +0 -229
  200. package/scripts/prove-training-export.js +0 -325
  201. package/scripts/prove-workflow-contract.js +0 -112
  202. package/scripts/prove-xmemory.js +0 -332
  203. package/scripts/publish-decision.js +0 -159
  204. package/scripts/ralph-loop.js +0 -376
  205. package/scripts/ralph-mode-ci.js +0 -331
  206. package/scripts/reddit-dm-outreach.js +0 -192
  207. package/scripts/reddit-monitor-cron.sh +0 -26
  208. package/scripts/reminder-engine.js +0 -132
  209. package/scripts/revenue-status.js +0 -472
  210. package/scripts/rotate-stripe-webhook-secret.js +0 -314
  211. package/scripts/schedule-manager.js +0 -249
  212. package/scripts/self-healing-check.js +0 -193
  213. package/scripts/shieldcortex-memory-firewall-runner.mjs +0 -53
  214. package/scripts/skill-exporter.js +0 -260
  215. package/scripts/skill-materializer.js +0 -134
  216. package/scripts/skill-packs.js +0 -136
  217. package/scripts/skill-proposer.js +0 -99
  218. package/scripts/skill-quality-tracker.js +0 -282
  219. package/scripts/slow-loop.js +0 -72
  220. package/scripts/social-analytics/db/analytics.sqlite +0 -0
  221. package/scripts/social-analytics/db/schema.sql +0 -32
  222. package/scripts/social-analytics/digest.js +0 -256
  223. package/scripts/social-analytics/engagement-audit.js +0 -185
  224. package/scripts/social-analytics/generate-instagram-card.js +0 -97
  225. package/scripts/social-analytics/instagram-thumbgate-post.js +0 -111
  226. package/scripts/social-analytics/install-growth-automation.js +0 -114
  227. package/scripts/social-analytics/load-env.js +0 -77
  228. package/scripts/social-analytics/mcp-server.js +0 -289
  229. package/scripts/social-analytics/normalizer.js +0 -580
  230. package/scripts/social-analytics/notify.js +0 -162
  231. package/scripts/social-analytics/poll-all.js +0 -107
  232. package/scripts/social-analytics/pollers/github.js +0 -195
  233. package/scripts/social-analytics/pollers/instagram.js +0 -253
  234. package/scripts/social-analytics/pollers/linkedin.js +0 -340
  235. package/scripts/social-analytics/pollers/plausible.js +0 -245
  236. package/scripts/social-analytics/pollers/reddit.js +0 -306
  237. package/scripts/social-analytics/pollers/threads.js +0 -233
  238. package/scripts/social-analytics/pollers/tiktok.js +0 -203
  239. package/scripts/social-analytics/pollers/x.js +0 -227
  240. package/scripts/social-analytics/pollers/youtube.js +0 -304
  241. package/scripts/social-analytics/pollers/zernio.js +0 -183
  242. package/scripts/social-analytics/publish-instagram-thumbgate.js +0 -104
  243. package/scripts/social-analytics/publish-thumbgate-launch.js +0 -322
  244. package/scripts/social-analytics/publishers/devto.js +0 -122
  245. package/scripts/social-analytics/publishers/instagram.js +0 -317
  246. package/scripts/social-analytics/publishers/linkedin.js +0 -294
  247. package/scripts/social-analytics/publishers/reddit.js +0 -385
  248. package/scripts/social-analytics/publishers/threads.js +0 -275
  249. package/scripts/social-analytics/publishers/tiktok.js +0 -217
  250. package/scripts/social-analytics/publishers/x.js +0 -259
  251. package/scripts/social-analytics/publishers/youtube.js +0 -223
  252. package/scripts/social-analytics/publishers/zernio.js +0 -539
  253. package/scripts/social-analytics/reconcile-thumbgate-campaign.js +0 -165
  254. package/scripts/social-analytics/run-digest.js +0 -34
  255. package/scripts/social-analytics/schedule-thumbgate-campaign.js +0 -275
  256. package/scripts/social-analytics/store.js +0 -455
  257. package/scripts/social-analytics/sync-launch-assets.js +0 -185
  258. package/scripts/social-analytics/utm.js +0 -143
  259. package/scripts/social-pipeline.js +0 -2626
  260. package/scripts/social-post-hourly.js +0 -228
  261. package/scripts/social-quality-gate.js +0 -134
  262. package/scripts/social-reply-monitor.js +0 -592
  263. package/scripts/status-dashboard.js +0 -155
  264. package/scripts/stripe-live-status.js +0 -115
  265. package/scripts/subagent-profiles.js +0 -79
  266. package/scripts/sync-branch-protection.js +0 -340
  267. package/scripts/sync-gh-secrets-from-env.sh +0 -70
  268. package/scripts/sync-github-about.js +0 -55
  269. package/scripts/sync-version.js +0 -479
  270. package/scripts/synthetic-dpo.js +0 -234
  271. package/scripts/tessl-export.js +0 -369
  272. package/scripts/test-coverage.js +0 -128
  273. package/scripts/thumbgate_session_start.sh +0 -32
  274. package/scripts/train_from_feedback.py +0 -929
  275. package/scripts/validate-feedback.js +0 -581
  276. package/scripts/verify-obsidian-setup.sh +0 -269
  277. package/scripts/verify-run.js +0 -269
  278. package/scripts/weekly-auto-post.js +0 -124
  279. package/scripts/x-autonomous-marketing.js +0 -139
@@ -1,315 +0,0 @@
1
- #!/usr/bin/env node
2
- /**
3
- * Disagreement Mining
4
- *
5
- * Inspired by Dropbox's "human-calibrated LLM labeling" approach.
6
- * The strongest learning signal comes from cases where the Thompson
7
- * Sampling model DISAGREES with actual user feedback signals. These
8
- * disagreements are prioritized for review and DPO pair generation.
9
- *
10
- * Zero external npm dependencies.
11
- */
12
-
13
- 'use strict';
14
-
15
- const path = require('path');
16
- const { loadModel, getReliability } = require('./thompson-sampling');
17
- const { readJSONL, getFeedbackPaths, inferDomain } = require('./feedback-loop');
18
- const { extractDomainKeys } = require('./export-dpo-pairs');
19
-
20
- // ---------------------------------------------------------------------------
21
- // Domain → Thompson category mapping
22
- // ---------------------------------------------------------------------------
23
-
24
// Lookup table from inferDomain() labels to Thompson Sampling category keys.
// Built once and frozen so callers cannot mutate the shared table.
const DOMAIN_TO_THOMPSON_CATEGORY = Object.freeze({
  'testing': 'testing',
  'security': 'security',
  'debugging': 'debugging',
  'architecture': 'architecture',
  'git-workflow': 'git',
  'ui-components': 'code_edit',
  'api-integration': 'code_edit',
  'documentation': 'uncategorized',
  'data-modeling': 'architecture',
  'performance': 'debugging',
  'general': 'uncategorized',
});

/**
 * Map an inferDomain() result to the closest Thompson Sampling category.
 * Thompson uses: code_edit, git, testing, pr_review, search, architecture,
 * security, debugging, uncategorized.
 *
 * Any domain that is not an explicit key of the table (including missing
 * values and names inherited from Object.prototype such as "constructor")
 * maps to 'uncategorized'.
 *
 * @param {string} domain - Domain from inferDomain()
 * @returns {string} Thompson category key
 */
function domainToCategory(domain) {
  // Own-property check: a plain `table[domain] || fallback` would return
  // inherited members (e.g. Object.prototype.toString) for matching names.
  if (Object.prototype.hasOwnProperty.call(DOMAIN_TO_THOMPSON_CATEGORY, domain)) {
    return DOMAIN_TO_THOMPSON_CATEGORY[domain];
  }
  return 'uncategorized';
}
48
-
49
- // ---------------------------------------------------------------------------
50
- // Core: Mine Disagreements
51
- // ---------------------------------------------------------------------------
52
-
53
/**
 * Find feedback events whose user signal contradicts the Thompson model.
 *
 * An event is reported as a disagreement when either:
 *   - its category reliability is above highThreshold but the signal is not
 *     'positive' (type "model_overconfident"), or
 *   - its category reliability is below lowThreshold and the signal is
 *     'positive' (type "model_underconfident").
 *
 * Events without a signal are skipped but still count toward totalEvents.
 * Categories missing from the reliability table are treated as 0.5.
 * The model is loaded from feedback_model.json and events from
 * feedback-log.jsonl, both inside the feedback directory unless overridden.
 *
 * @param {Object} [opts]
 * @param {string} [opts.feedbackDir] - Override feedback dir
 * @param {string} [opts.modelPath] - Override model path
 * @param {number} [opts.highThreshold=0.6] - Reliability above which positive is expected
 * @param {number} [opts.lowThreshold=0.4] - Reliability below which negative is expected
 * @returns {{ disagreements: Array, stats: Object }} Disagreements sorted by
 *   strength (strongest first) plus summary counts
 */
function mineDisagreements(opts) {
  const settings = opts || {};
  const upperBound = settings.highThreshold != null ? settings.highThreshold : 0.6;
  const lowerBound = settings.lowThreshold != null ? settings.lowThreshold : 0.4;

  const defaults = getFeedbackPaths();
  const baseDir = settings.feedbackDir || defaults.FEEDBACK_DIR;
  const modelFile = settings.modelPath || path.join(baseDir, 'feedback_model.json');

  const reliabilityByCategory = getReliability(loadModel(modelFile));
  const events = readJSONL(path.join(baseDir, 'feedback-log.jsonl'));

  // Strengths and rates are reported with three decimal places.
  const roundTo3 = (value) => Math.round(value * 1000) / 1000;

  const found = [];
  for (const [index, entry] of events.entries()) {
    if (!entry.signal) continue;

    const approved = entry.signal === 'positive';
    const domain = inferDomain(entry.tags, entry.context);
    const category = domainToCategory(domain);
    const known = reliabilityByCategory[category];
    const score = known ? known.reliability : 0.5;

    let kind;
    let gap;
    if (!approved && score > upperBound) {
      // The model rates this category as reliable, yet the user objected.
      kind = 'model_overconfident';
      gap = score - upperBound;
    } else if (approved && score < lowerBound) {
      // The model rates this category as unreliable, yet the user approved.
      kind = 'model_underconfident';
      gap = lowerBound - score;
    } else {
      continue;
    }

    found.push({
      feedbackIndex: index,
      feedbackId: entry.id || `event-${index}`,
      signal: entry.signal,
      domain,
      category,
      categoryReliability: score,
      disagreementType: kind,
      disagreementStrength: roundTo3(gap),
      context: entry.context || '',
      tags: entry.tags || [],
      timestamp: entry.timestamp || null,
    });
  }

  // Strongest learning signal first.
  found.sort((left, right) => right.disagreementStrength - left.disagreementStrength);

  const countOfType = (type) => found.filter((item) => item.disagreementType === type).length;
  const total = events.length;

  return {
    disagreements: found,
    stats: {
      totalEvents: total,
      disagreementCount: found.length,
      disagreementRate: total > 0 ? roundTo3(found.length / total) : 0,
      overconfident: countOfType('model_overconfident'),
      underconfident: countOfType('model_underconfident'),
    },
  };
}
142
-
143
- // ---------------------------------------------------------------------------
144
- // Amplify: Generate DPO pairs from disagreements
145
- // ---------------------------------------------------------------------------
146
-
147
/**
 * Turn mined disagreements into amplified DPO preference pairs.
 *
 * Each disagreement yields one pair in which:
 *   - chosen   = the direction implied by the user's signal
 *   - rejected = the direction implied by the model's reliability estimate
 *
 * Any disagreement whose type is not 'model_overconfident' is worded as an
 * under-confident case.
 *
 * @param {Array} disagreements - From mineDisagreements()
 * @returns {Array} DPO preference pairs with amplification metadata; an empty
 *   array when the input is not an array
 */
function amplifyFromDisagreements(disagreements) {
  if (!Array.isArray(disagreements)) return [];

  // Build a single { prompt, chosen, rejected, metadata } record.
  const toPreferencePair = (item) => {
    const keys = extractDomainKeys({ tags: item.tags, title: item.context });
    const label = keys.length > 0 ? keys.join(', ') : item.domain;

    const prompt = [
      `Domain: ${label}.`,
      `The agent performed a ${item.domain} task.`,
      item.context ? `Context: ${item.context}` : 'How should the agent handle this scenario?',
    ].join(' ');

    const confidence = item.categoryReliability.toFixed(2);
    const overconfident = item.disagreementType === 'model_overconfident';

    // Over-confident: the user's rejection wins. Otherwise the user's approval wins.
    const chosen = overconfident
      ? [
        `The agent should NOT rely on its current ${item.domain} approach.`,
        `User feedback indicates failure despite model confidence of ${confidence}.`,
        'Corrective action needed.',
      ].join(' ')
      : [
        `The agent's ${item.domain} approach succeeded.`,
        `User approved despite model skepticism (confidence: ${confidence}).`,
        'This approach should be trusted more.',
      ].join(' ');

    const rejected = overconfident
      ? `The agent's ${item.domain} approach is reliable (model confidence: ${confidence}). Continue current behavior.`
      : `The agent's ${item.domain} approach is unreliable (model confidence: ${confidence}). Avoid this approach.`;

    return {
      prompt,
      chosen,
      rejected,
      metadata: {
        disagreementStrength: item.disagreementStrength,
        disagreementType: item.disagreementType,
        domain: item.domain,
        category: item.category,
        originalFeedbackId: item.feedbackId,
        amplified: true,
      },
    };
  };

  return disagreements.map((item) => toPreferencePair(item));
}
204
-
205
- // ---------------------------------------------------------------------------
206
- // Calibrate: Cross-reference prevention rules with Thompson model
207
- // ---------------------------------------------------------------------------
208
-
209
/**
 * Split error memories into calibrated and dropped prevention rules.
 *
 * Every entry of memory-log.jsonl whose category is 'error' becomes a rule.
 * A rule is "calibrated" when the Thompson reliability of its category is
 * below 0.5 (the model and the user both point at a failure pattern) and
 * "dropped" otherwise. Categories missing from the reliability table are
 * treated as 0.5 and are therefore dropped.
 *
 * @param {string} [feedbackDir] - Override feedback dir
 * @returns {{ calibratedRules: Array, droppedRules: Array, concordanceRate: number }}
 *   concordanceRate is calibrated / total rounded to three decimals, or 1
 *   when there are no error memories
 */
function calibratePreventionRules(feedbackDir) {
  const defaults = getFeedbackPaths();
  const baseDir = feedbackDir || defaults.FEEDBACK_DIR;

  const reliabilityByCategory = getReliability(
    loadModel(path.join(baseDir, 'feedback_model.json'))
  );
  const memories = readJSONL(path.join(baseDir, 'memory-log.jsonl'));

  const calibratedRules = [];
  const droppedRules = [];

  memories
    .filter((entry) => entry.category === 'error')
    .forEach((entry) => {
      const domain = inferDomain(entry.tags, entry.content || entry.title || '');
      const category = domainToCategory(domain);
      const known = reliabilityByCategory[category];
      const categoryReliability = known ? known.reliability : 0.5;

      // Concordance: the error memory and a low model reliability agree.
      const bucket = categoryReliability < 0.5 ? calibratedRules : droppedRules;
      bucket.push({
        domain,
        category,
        title: entry.title || '',
        categoryReliability,
        memoryId: entry.id || null,
      });
    });

  const ruleCount = calibratedRules.length + droppedRules.length;
  let concordanceRate = 1;
  if (ruleCount > 0) {
    concordanceRate = Math.round((calibratedRules.length / ruleCount) * 1000) / 1000;
  }

  return { calibratedRules, droppedRules, concordanceRate };
}
267
-
268
- // ---------------------------------------------------------------------------
269
- // CLI
270
- // ---------------------------------------------------------------------------
271
-
272
/**
 * Parse `--key` and `--key=value` command-line tokens into an object.
 *
 * Tokens that do not start with `--` are ignored. A token without `=` maps
 * its key to `true`; otherwise everything after the first `=` (including any
 * further `=` characters) becomes the string value.
 *
 * @param {string[]} argv - Raw argument tokens
 * @returns {Object} Map of flag name to `true` or its string value
 */
function parseArgs(argv) {
  const parsed = {};
  for (const token of argv) {
    if (!token.startsWith('--')) continue;

    const body = token.slice(2);
    const separatorAt = body.indexOf('=');
    if (separatorAt === -1) {
      parsed[body] = true;
    } else {
      parsed[body.slice(0, separatorAt)] = body.slice(separatorAt + 1);
    }
  }
  return parsed;
}
281
-
282
- if (require.main === module) {
283
- const args = parseArgs(process.argv.slice(2));
284
-
285
- if (args.calibrate) {
286
- const result = calibratePreventionRules(args['feedback-dir']);
287
- console.log(JSON.stringify(result, null, 2));
288
- } else {
289
- // --mine or --amplify (amplify implies mine)
290
- const result = mineDisagreements({
291
- feedbackDir: args['feedback-dir'],
292
- modelPath: args['model-path'],
293
- highThreshold: args['high-threshold'] ? Number(args['high-threshold']) : undefined,
294
- lowThreshold: args['low-threshold'] ? Number(args['low-threshold']) : undefined,
295
- });
296
-
297
- if (args.amplify) {
298
- const pairs = amplifyFromDisagreements(result.disagreements);
299
- console.log(JSON.stringify({ pairs, stats: result.stats }, null, 2));
300
- } else {
301
- console.log(JSON.stringify(result, null, 2));
302
- }
303
- }
304
- }
305
-
306
- // ---------------------------------------------------------------------------
307
- // Exports
308
- // ---------------------------------------------------------------------------
309
-
310
- module.exports = {
311
- mineDisagreements,
312
- amplifyFromDisagreements,
313
- calibratePreventionRules,
314
- domainToCategory,
315
- };
@@ -1,206 +0,0 @@
1
- 'use strict';
2
- /**
3
- * DPO Batch Optimizer (DPO-02)
4
- *
5
- * Builds (chosen, rejected) preference pairs from feedback-log.jsonl memories,
6
- * computes DPO log-ratio adjustments using Thompson Sampling posteriors,
7
- * and writes dpo-model.json to THUMBGATE_FEEDBACK_DIR.
8
- *
9
- * Does NOT call any external API. Pure offline batch optimization.
10
- *
11
- * Exports: run, buildPreferencePairs, applyDpoAdjustments, dpoLogRatio
12
- */
13
-
14
- const fs = require('fs');
15
- const path = require('path');
16
- const { getEffectiveSetting } = require('./evolution-state');
17
- const { resolveFeedbackDir } = require('./feedback-paths');
18
-
19
- const DPO_BETA = 0.1;
20
-
21
- // ---------------------------------------------------------------------------
22
- // dpoLogRatio — DPO preference adjustment formula
23
- // ---------------------------------------------------------------------------
24
-
25
- /**
26
- * Compute DPO adjustment in range [-1, +1] from chosen and rejected weights.
27
- *
28
- * @param {number} chosenWeight - Time-decay weight for chosen (positive) outcome
29
- * @param {number} rejectedWeight - Time-decay weight for rejected (negative) outcome
30
- * @param {number} [beta=0.1] - Temperature parameter (lower = more aggressive)
31
- * @returns {number} Adjustment in [-1, +1]
32
- */
33
- function dpoLogRatio(chosenWeight, rejectedWeight, beta) {
34
- const b = (beta !== undefined && beta !== null) ? beta : getEffectiveSetting('dpo_beta', DPO_BETA);
35
- const cw = Math.max(chosenWeight, 0.01);
36
- const rw = Math.max(rejectedWeight, 0.01);
37
- const logRatio = Math.log(cw) - Math.log(rw);
38
- const sigmoid = 1.0 / (1.0 + Math.exp(-b * logRatio));
39
- return (sigmoid - 0.5) * 2;
40
- }
41
-
42
- // ---------------------------------------------------------------------------
43
- // buildPreferencePairs — groups DPO pairs by category from feedbackDir
44
- // ---------------------------------------------------------------------------
45
-
46
- /**
47
- * Build preference pairs grouped by category.
48
- *
49
- * Uses buildDpoPairs() from export-dpo-pairs.js (do NOT reimplement).
50
- * Reads memory-log.jsonl from feedbackDir to get error + learning memories.
51
- *
52
- * @param {string} feedbackDir - Directory containing memory-log.jsonl
53
- * @returns {Object} Map of category → [{ chosen, rejected }]
54
- */
55
- function buildPreferencePairs(feedbackDir) {
56
- const { buildDpoPairs, readJSONL } = require('./export-dpo-pairs');
57
- const memoryLogPath = path.join(feedbackDir, 'memory-log.jsonl');
58
- const memories = readJSONL(memoryLogPath);
59
-
60
- const errors = memories.filter((m) => m.category === 'error');
61
- const learnings = memories.filter((m) => m.category === 'learning');
62
-
63
- const result = buildDpoPairs(errors, learnings);
64
-
65
- // Group pairs by category (inferred from matchedKeys or tags)
66
- const grouped = {};
67
- for (const pair of result.pairs) {
68
- const keys = (pair.metadata && pair.metadata.matchedKeys) || [];
69
- const category = keys.length > 0 ? keys[0] : 'uncategorized';
70
- if (!grouped[category]) grouped[category] = [];
71
- grouped[category].push({
72
- chosen: pair.metadata
73
- ? { id: pair.metadata.learningId, content: pair.chosen, timestamp: null }
74
- : { content: pair.chosen },
75
- rejected: pair.metadata
76
- ? { id: pair.metadata.errorId, content: pair.rejected, timestamp: null }
77
- : { content: pair.rejected },
78
- metadata: pair.metadata,
79
- });
80
- }
81
-
82
- return grouped;
83
- }
84
-
85
- // ---------------------------------------------------------------------------
86
- // applyDpoAdjustments — mutates Thompson model with DPO posterior adjustments
87
- // ---------------------------------------------------------------------------
88
-
89
- /**
90
- * Apply DPO adjustments to Thompson Sampling posteriors and save the model.
91
- *
92
- * CRITICAL: calls ts.saveModel(model, modelPath) after all mutations.
93
- *
94
- * @param {string} modelPath - Path to feedback_model.json
95
- * @param {Object} pairs - Map of category → [{ chosen, rejected }] from buildPreferencePairs
96
- * @returns {Object} adjustments - Map of category → { pairs, avg_adjustment }
97
- */
98
- function applyDpoAdjustments(modelPath, pairs) {
99
- const ts = require('./thompson-sampling');
100
- const model = ts.loadModel(modelPath);
101
- const adjustments = {};
102
-
103
- for (const [cat, catPairs] of Object.entries(pairs)) {
104
- if (!catPairs || catPairs.length === 0) continue;
105
-
106
- // Ensure category exists in model
107
- if (!model.categories[cat]) {
108
- model.categories[cat] = { alpha: 1.0, beta: 1.0, samples: 0, last_updated: null };
109
- }
110
-
111
- let total = 0;
112
- for (const pair of catPairs) {
113
- const chosenTs = (pair.chosen && pair.chosen.timestamp) || null;
114
- const rejectedTs = (pair.rejected && pair.rejected.timestamp) || null;
115
- const cw = ts.timeDecayWeight(chosenTs);
116
- const rw = ts.timeDecayWeight(rejectedTs);
117
- total += dpoLogRatio(cw, rw);
118
- }
119
-
120
- const avg = total / catPairs.length;
121
-
122
- if (avg > 0) {
123
- model.categories[cat].alpha += avg * catPairs.length * 0.5;
124
- } else {
125
- model.categories[cat].beta += Math.abs(avg) * catPairs.length * 0.5;
126
- }
127
-
128
- adjustments[cat] = {
129
- pairs: catPairs.length,
130
- avg_adjustment: Math.round(avg * 10000) / 10000,
131
- };
132
- }
133
-
134
- // CRITICAL: save after all mutations (Pitfall 2 from RESEARCH.md)
135
- ts.saveModel(model, modelPath);
136
-
137
- return adjustments;
138
- }
139
-
140
- // ---------------------------------------------------------------------------
141
- // run — top-level batch DPO optimization entry point
142
- // ---------------------------------------------------------------------------
143
-
144
- /**
145
- * Run the full DPO optimization batch:
146
- * 1. Build preference pairs from memory-log.jsonl
147
- * 2. Apply DPO adjustments to Thompson model
148
- * 3. Write dpo-model.json to feedbackDir
149
- *
150
- * @param {Object} [opts]
151
- * @param {string} [opts.feedbackDir] - Override THUMBGATE_FEEDBACK_DIR
152
- * @param {string} [opts.modelPath] - Override Thompson model path
153
- * @returns {{ adjustments: Object, pairs_processed: number }}
154
- */
155
- function run(opts) {
156
- const options = opts || {};
157
- const feedbackDir = options.feedbackDir || resolveFeedbackDir();
158
- const modelPath = options.modelPath || path.join(feedbackDir, 'feedback_model.json');
159
-
160
- const pairs = buildPreferencePairs(feedbackDir);
161
-
162
- const pairsProcessed = Object.values(pairs).reduce((sum, arr) => sum + arr.length, 0);
163
-
164
- let adjustments = {};
165
- if (pairsProcessed > 0) {
166
- adjustments = applyDpoAdjustments(modelPath, pairs);
167
- }
168
-
169
- const dpoModel = {
170
- generated: new Date().toISOString(),
171
- pairs_processed: pairsProcessed,
172
- adjustments,
173
- };
174
-
175
- const dpoModelPath = path.join(feedbackDir, 'dpo-model.json');
176
- if (!fs.existsSync(feedbackDir)) {
177
- fs.mkdirSync(feedbackDir, { recursive: true });
178
- }
179
- fs.writeFileSync(dpoModelPath, `${JSON.stringify(dpoModel, null, 2)}\n`);
180
-
181
- console.log(`DPO optimization complete: ${pairsProcessed} pairs processed`);
182
- if (Object.keys(adjustments).length > 0) {
183
- console.log('Adjustments:', JSON.stringify(adjustments, null, 2));
184
- } else {
185
- console.log('No adjustment pairs found (empty or no overlapping memories)');
186
- }
187
-
188
- return { adjustments, pairs_processed: pairsProcessed };
189
- }
190
-
191
- // ---------------------------------------------------------------------------
192
- // CLI entry point
193
- // ---------------------------------------------------------------------------
194
-
195
- if (require.main === module && process.argv.includes('--run')) {
196
- run().catch((e) => {
197
- console.error(e);
198
- process.exit(1);
199
- });
200
- }
201
-
202
- // ---------------------------------------------------------------------------
203
- // Exports
204
- // ---------------------------------------------------------------------------
205
-
206
- module.exports = { run, buildPreferencePairs, applyDpoAdjustments, dpoLogRatio };
@@ -1,130 +0,0 @@
1
- #!/usr/bin/env node
2
- 'use strict';
3
-
4
- const fs = require('fs');
5
- const path = require('path');
6
-
7
- const REPO_ROOT = path.resolve(process.argv[2] || process.cwd());
8
- const THUMBGATE_ENTRY = {
9
- command: 'npx',
10
- args: ['-y', 'thumbgate@latest', 'serve'],
11
- };
12
- const MCP_SERVER_KEY = 'thumbgate';
13
- const LEGACY_SERVER_NAMES = ['rlhf', 'mcp-memory-gateway', 'rlhf_feedback_loop'];
14
- const INFO_EXCLUDE_ENTRIES = ['.thumbgate/', '.mcp.json'];
15
-
16
- function readJson(filePath) {
17
- try {
18
- return JSON.parse(fs.readFileSync(filePath, 'utf8'));
19
- } catch {
20
- return null;
21
- }
22
- }
23
-
24
- function writeJsonIfChanged(filePath, value) {
25
- const next = JSON.stringify(value, null, 2) + '\n';
26
- let current = null;
27
- try {
28
- current = fs.readFileSync(filePath, 'utf8');
29
- } catch {
30
- current = null;
31
- }
32
- if (current === next) {
33
- return false;
34
- }
35
- fs.mkdirSync(path.dirname(filePath), { recursive: true });
36
- fs.writeFileSync(filePath, next);
37
- return true;
38
- }
39
-
40
- function mergeThumbgateEntry(entry = {}) {
41
- return {
42
- ...entry,
43
- command: THUMBGATE_ENTRY.command,
44
- args: THUMBGATE_ENTRY.args.slice(),
45
- };
46
- }
47
-
48
- function ensureMcpJson(repoRoot) {
49
- const filePath = path.join(repoRoot, '.mcp.json');
50
- const existing = readJson(filePath);
51
- const config = existing && typeof existing === 'object' ? existing : {};
52
- config.mcpServers = config.mcpServers && typeof config.mcpServers === 'object' ? config.mcpServers : {};
53
- config.mcpServers[MCP_SERVER_KEY] = mergeThumbgateEntry(config.mcpServers[MCP_SERVER_KEY]);
54
- for (const legacyName of LEGACY_SERVER_NAMES) {
55
- delete config.mcpServers[legacyName];
56
- }
57
- return writeJsonIfChanged(filePath, config);
58
- }
59
-
60
- function ensureClaudeSettings(repoRoot) {
61
- const filePath = path.join(repoRoot, '.claude', 'settings.json');
62
- const existing = readJson(filePath);
63
- if (!existing || typeof existing !== 'object') {
64
- return false;
65
- }
66
- const hasRelevantServer =
67
- Boolean(existing.mcpServers && existing.mcpServers[MCP_SERVER_KEY]) ||
68
- LEGACY_SERVER_NAMES.some((name) => Boolean(existing.mcpServers && existing.mcpServers[name]));
69
- if (!hasRelevantServer) {
70
- return false;
71
- }
72
- existing.mcpServers = existing.mcpServers && typeof existing.mcpServers === 'object' ? existing.mcpServers : {};
73
- existing.mcpServers[MCP_SERVER_KEY] = mergeThumbgateEntry(existing.mcpServers[MCP_SERVER_KEY]);
74
- for (const legacyName of LEGACY_SERVER_NAMES) {
75
- delete existing.mcpServers[legacyName];
76
- }
77
- return writeJsonIfChanged(filePath, existing);
78
- }
79
-
80
- function ensureInfoExclude(repoRoot) {
81
- const excludePath = path.join(repoRoot, '.git', 'info', 'exclude');
82
- let current = '';
83
- try {
84
- current = fs.readFileSync(excludePath, 'utf8');
85
- } catch {
86
- current = '';
87
- }
88
- const lines = new Set(
89
- current
90
- .split(/\r?\n/)
91
- .map((line) => line.trim())
92
- .filter(Boolean)
93
- );
94
- let changed = false;
95
- for (const entry of INFO_EXCLUDE_ENTRIES) {
96
- if (!lines.has(entry)) {
97
- lines.add(entry);
98
- changed = true;
99
- }
100
- }
101
- if (!changed) {
102
- return false;
103
- }
104
- const next = `${Array.from(lines).sort().join('\n')}\n`;
105
- fs.mkdirSync(path.dirname(excludePath), { recursive: true });
106
- fs.writeFileSync(excludePath, next);
107
- return true;
108
- }
109
-
110
- function ensureThumbgateDir(repoRoot) {
111
- const thumbgateDir = path.join(repoRoot, '.thumbgate');
112
- if (fs.existsSync(thumbgateDir)) {
113
- return false;
114
- }
115
- fs.mkdirSync(thumbgateDir, { recursive: true });
116
- return true;
117
- }
118
-
119
- function main() {
120
- const results = {
121
- repoRoot: REPO_ROOT,
122
- createdThumbgateDir: ensureThumbgateDir(REPO_ROOT),
123
- updatedMcpJson: ensureMcpJson(REPO_ROOT),
124
- updatedClaudeSettings: ensureClaudeSettings(REPO_ROOT),
125
- updatedInfoExclude: ensureInfoExclude(REPO_ROOT),
126
- };
127
- process.stdout.write(`${JSON.stringify(results)}\n`);
128
- }
129
-
130
- main();