thumbgate 1.15.0 → 1.16.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/.claude-plugin/marketplace.json +6 -6
- package/.claude-plugin/plugin.json +3 -3
- package/.well-known/llms.txt +5 -5
- package/.well-known/mcp/server-card.json +1 -1
- package/README.md +59 -35
- package/adapters/chatgpt/openapi.yaml +118 -2
- package/adapters/claude/.mcp.json +2 -2
- package/adapters/mcp/server-stdio.js +210 -84
- package/adapters/opencode/opencode.json +1 -1
- package/bench/prompt-eval-suite.json +5 -1
- package/bin/cli.js +157 -8
- package/config/evals/agent-safety-eval.json +338 -22
- package/config/gates/routine.json +43 -0
- package/config/github-about.json +3 -3
- package/config/model-candidates.json +131 -0
- package/openapi/openapi.yaml +118 -2
- package/package.json +57 -49
- package/public/blog.html +7 -7
- package/public/codex-plugin.html +6 -6
- package/public/compare.html +29 -23
- package/public/dashboard.html +82 -10
- package/public/guide.html +28 -28
- package/public/index.html +216 -98
- package/public/learn.html +50 -22
- package/public/lessons.html +1 -1
- package/public/numbers.html +17 -17
- package/public/pro.html +82 -18
- package/scripts/agent-audit-trace.js +55 -0
- package/scripts/agent-memory-lifecycle.js +96 -0
- package/scripts/agent-readiness-plan.js +118 -0
- package/scripts/agentic-data-pipeline.js +21 -1
- package/scripts/agents-sdk-sandbox-plan.js +57 -0
- package/scripts/ai-org-governance.js +98 -0
- package/scripts/ai-search-distribution.js +43 -0
- package/scripts/artifact-agent-plan.js +81 -0
- package/scripts/billing.js +27 -8
- package/scripts/cli-schema.js +18 -2
- package/scripts/code-mode-mcp-plan.js +71 -0
- package/scripts/context-engine.js +1 -2
- package/scripts/context-manager.js +4 -1
- package/scripts/dashboard-render-spec.js +1 -1
- package/scripts/dashboard.js +275 -9
- package/scripts/decision-journal.js +13 -3
- package/scripts/document-workflow-governance.js +62 -0
- package/scripts/enterprise-agent-rollout.js +34 -0
- package/scripts/experience-replay-governance.js +69 -0
- package/scripts/export-hf-dataset.js +1 -1
- package/scripts/feedback-loop.js +92 -4
- package/scripts/feedback-to-rules.js +17 -23
- package/scripts/gates-engine.js +4 -6
- package/scripts/growth-campaigns.js +49 -0
- package/scripts/harness-selector.js +16 -4
- package/scripts/hybrid-supervisor-agent.js +64 -0
- package/scripts/inference-cache-policy.js +72 -0
- package/scripts/inference-economics.js +53 -0
- package/scripts/internal-agent-bootstrap.js +12 -2
- package/scripts/knowledge-layer-plan.js +108 -0
- package/scripts/lesson-inference.js +183 -44
- package/scripts/lesson-search.js +4 -1
- package/scripts/llm-client.js +157 -26
- package/scripts/mailer/resend-mailer.js +112 -1
- package/scripts/mcp-transport-strategy.js +66 -0
- package/scripts/memory-store-governance.js +60 -0
- package/scripts/meta-agent-loop.js +7 -13
- package/scripts/model-access-eligibility.js +38 -0
- package/scripts/model-migration-readiness.js +55 -0
- package/scripts/operational-integrity.js +96 -3
- package/scripts/otel-declarative-config.js +56 -0
- package/scripts/perplexity-client.js +1 -1
- package/scripts/post-training-governance.js +34 -0
- package/scripts/private-core-boundary.js +72 -0
- package/scripts/production-agent-readiness.js +40 -0
- package/scripts/prompt-eval.js +564 -32
- package/scripts/prompt-programs.js +93 -0
- package/scripts/provider-action-normalizer.js +585 -0
- package/scripts/scaling-law-claims.js +60 -0
- package/scripts/security-scanner.js +1 -1
- package/scripts/self-distill-agent.js +7 -32
- package/scripts/seo-gsd.js +232 -55
- package/scripts/skill-rag-router.js +53 -0
- package/scripts/spec-gate.js +1 -1
- package/scripts/student-consistent-training.js +73 -0
- package/scripts/synthetic-data-provenance.js +98 -0
- package/scripts/task-context-result.js +81 -0
- package/scripts/telemetry-analytics.js +149 -0
- package/scripts/thompson-sampling.js +2 -2
- package/scripts/token-savings.js +7 -6
- package/scripts/token-tco.js +46 -0
- package/scripts/tool-registry.js +63 -3
- package/scripts/verification-loop.js +10 -1
- package/scripts/verifier-scoring.js +71 -0
- package/scripts/workflow-sentinel.js +284 -28
- package/scripts/workspace-agent-routines.js +118 -0
- package/src/api/server.js +381 -120
- package/scripts/analytics-report.js +0 -328
- package/scripts/autonomous-workflow.js +0 -377
- package/scripts/billing-setup.js +0 -109
- package/scripts/creator-campaigns.js +0 -239
- package/scripts/cross-encoder-reranker.js +0 -235
- package/scripts/daemon-manager.js +0 -108
- package/scripts/decision-trace.js +0 -354
- package/scripts/delegation-runtime.js +0 -896
- package/scripts/dispatch-brief.js +0 -159
- package/scripts/distribution-surfaces.js +0 -110
- package/scripts/feedback-history-distiller.js +0 -382
- package/scripts/funnel-analytics.js +0 -35
- package/scripts/history-distiller.js +0 -200
- package/scripts/hosted-job-launcher.js +0 -256
- package/scripts/intent-router.js +0 -392
- package/scripts/lesson-reranker.js +0 -263
- package/scripts/lesson-retrieval.js +0 -148
- package/scripts/managed-lesson-agent.js +0 -183
- package/scripts/operational-dashboard.js +0 -103
- package/scripts/operational-summary.js +0 -129
- package/scripts/operator-artifacts.js +0 -608
- package/scripts/optimize-context.js +0 -17
- package/scripts/org-dashboard.js +0 -206
- package/scripts/partner-orchestration.js +0 -146
- package/scripts/predictive-insights.js +0 -356
- package/scripts/pulse.js +0 -80
- package/scripts/reflector-agent.js +0 -221
- package/scripts/sales-pipeline.js +0 -681
- package/scripts/session-episode-store.js +0 -329
- package/scripts/session-health-sensor.js +0 -242
- package/scripts/session-report.js +0 -120
- package/scripts/swarm-coordinator.js +0 -81
- package/scripts/tool-kpi-tracker.js +0 -12
- package/scripts/webhook-delivery.js +0 -62
- package/scripts/workflow-sprint-intake.js +0 -475
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
{
|
|
2
2
|
"name": "thumbgate-marketplace",
|
|
3
|
-
"version": "1.15.0",
|
|
3
|
+
"version": "1.16.1",
|
|
4
4
|
"owner": {
|
|
5
5
|
"name": "Igor Ganapolsky",
|
|
6
6
|
"email": "ig5973700@gmail.com"
|
|
@@ -8,12 +8,12 @@
|
|
|
8
8
|
"plugins": [
|
|
9
9
|
{
|
|
10
10
|
"name": "thumbgate",
|
|
11
|
-
"description": "Type 👍 or 👎 on any agent action. ThumbGate captures it, distills a lesson, and blocks the pattern from repeating. One thumbs-down = the agent physically cannot make that mistake again. 33 pre-action
|
|
11
|
+
"description": "Type 👍 or 👎 on any agent action. ThumbGate captures it, distills a lesson, and blocks the pattern from repeating. One thumbs-down = the agent physically cannot make that mistake again. 33 pre-action checks, budget enforcement, self-protection, and NIST/SOC2 compliance tags.",
|
|
12
12
|
"source": {
|
|
13
13
|
"source": "npm",
|
|
14
14
|
"package": "thumbgate"
|
|
15
15
|
},
|
|
16
|
-
"version": "1.15.0",
|
|
16
|
+
"version": "1.16.1",
|
|
17
17
|
"author": {
|
|
18
18
|
"name": "Igor Ganapolsky"
|
|
19
19
|
},
|
|
@@ -22,7 +22,7 @@
|
|
|
22
22
|
"license": "MIT",
|
|
23
23
|
"category": "developer-tools",
|
|
24
24
|
"tags": [
|
|
25
|
-
"pre-action-
|
|
25
|
+
"pre-action-checks",
|
|
26
26
|
"ai-agent-safety",
|
|
27
27
|
"mcp",
|
|
28
28
|
"memory",
|
|
@@ -31,7 +31,7 @@
|
|
|
31
31
|
"keywords": [
|
|
32
32
|
"claude-desktop",
|
|
33
33
|
"desktop-extension",
|
|
34
|
-
"pre-action-
|
|
34
|
+
"pre-action-checks",
|
|
35
35
|
"ai-agent-safety",
|
|
36
36
|
"mcp",
|
|
37
37
|
"memory",
|
|
@@ -44,7 +44,7 @@
|
|
|
44
44
|
"keywords": [
|
|
45
45
|
"claude-desktop",
|
|
46
46
|
"desktop-extension",
|
|
47
|
-
"pre-action-
|
|
47
|
+
"pre-action-checks",
|
|
48
48
|
"ai-agent-safety",
|
|
49
49
|
"mcp",
|
|
50
50
|
"memory",
|
|
@@ -1,7 +1,7 @@
|
|
|
1
1
|
{
|
|
2
2
|
"name": "thumbgate",
|
|
3
|
-
"description": "Type 👍 or 👎 on any agent action. ThumbGate captures it, distills a lesson, and blocks the pattern from repeating. One thumbs-down = the agent physically cannot make that mistake again. 33 pre-action
|
|
4
|
-
"version": "1.15.0",
|
|
3
|
+
"description": "Type 👍 or 👎 on any agent action. ThumbGate captures it, distills a lesson, and blocks the pattern from repeating. One thumbs-down = the agent physically cannot make that mistake again. 33 pre-action checks, budget enforcement, self-protection, and NIST/SOC2 compliance tags.",
|
|
4
|
+
"version": "1.16.1",
|
|
5
5
|
"author": {
|
|
6
6
|
"name": "Igor Ganapolsky"
|
|
7
7
|
},
|
|
@@ -12,7 +12,7 @@
|
|
|
12
12
|
"claude-desktop",
|
|
13
13
|
"desktop-extension",
|
|
14
14
|
"mcp",
|
|
15
|
-
"pre-action-
|
|
15
|
+
"pre-action-checks",
|
|
16
16
|
"ai-agent-safety",
|
|
17
17
|
"memory",
|
|
18
18
|
"guardrails",
|
package/.well-known/llms.txt
CHANGED
|
@@ -6,7 +6,7 @@
|
|
|
6
6
|
> ThumbGate prevents expensive AI mistakes before they happen. It checks
|
|
7
7
|
> risky commands, file edits, deploys, payments, API calls, and other agent
|
|
8
8
|
> actions before execution. 👎 Thumbs down becomes a history-aware lesson and
|
|
9
|
-
> a Pre-Action
|
|
9
|
+
> a Pre-Action Check; 👍 thumbs up reinforces safe patterns.
|
|
10
10
|
|
|
11
11
|
## What ThumbGate solves
|
|
12
12
|
|
|
@@ -20,7 +20,7 @@
|
|
|
20
20
|
|
|
21
21
|
1. Agent makes a mistake → developer gives thumbs-down
|
|
22
22
|
2. ThumbGate captures context and infers a structured lesson
|
|
23
|
-
3. Recurring failures get promoted to
|
|
23
|
+
3. Recurring failures get promoted to prevention rules
|
|
24
24
|
4. PreToolUse hooks block the pattern before it executes again
|
|
25
25
|
5. Thompson Sampling adapts gate confidence over time
|
|
26
26
|
|
|
@@ -40,9 +40,9 @@ npx thumbgate init --agent claude-code
|
|
|
40
40
|
## Pricing
|
|
41
41
|
|
|
42
42
|
- Free GPT: advice, checkpointing, and setup help in ChatGPT
|
|
43
|
-
- Free local CLI: 3 feedback captures/day, 5 lesson searches/day, recall, and local Pre-Action
|
|
44
|
-
- Pro: $19/mo or $149/yr — personal enforcement proof, local dashboard,
|
|
45
|
-
- Team: $
|
|
43
|
+
- Free local CLI: 3 feedback captures/day, 5 lesson searches/day, recall, and local Pre-Action Checks after install
|
|
44
|
+
- Pro: $19/mo or $149/yr — personal enforcement proof, local dashboard, check debugger, DPO export, and review-ready exports
|
|
45
|
+
- Team: $49/seat/mo, 3-seat minimum after intake — shared lessons, org visibility, approval boundaries, and rollout proof
|
|
46
46
|
|
|
47
47
|
## Links
|
|
48
48
|
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
{
|
|
2
2
|
"name": "thumbgate",
|
|
3
|
-
"version": "1.15.0",
|
|
3
|
+
"version": "1.16.1",
|
|
4
4
|
"description": "ThumbGate — 👍👎 feedback that teaches your AI agent. Thumbs down a mistake, it never happens again.",
|
|
5
5
|
"homepage": "https://thumbgate-production.up.railway.app",
|
|
6
6
|
"transport": "stdio",
|
package/README.md
CHANGED
|
@@ -1,12 +1,18 @@
|
|
|
1
1
|
# ThumbGate
|
|
2
2
|
|
|
3
|
+
<p align="center">
|
|
4
|
+
<a href="https://thumbgate.ai">
|
|
5
|
+
<img src="public/assets/brand/thumbgate-icon-512.png" alt="ThumbGate" width="128" height="128" />
|
|
6
|
+
</a>
|
|
7
|
+
</p>
|
|
8
|
+
|
|
3
9
|
**Your AI coding bill has a leak.**
|
|
4
10
|
|
|
5
11
|
**Stop paying $ for the same AI mistake.**
|
|
6
12
|
|
|
7
|
-
Every retry loop, every hallucinated import, every *"let me try a different approach"* — those are billable tokens on every LLM vendor's bill. Thumbs-down once; ThumbGate blocks that exact mistake on every future call. Across Claude Code, Cursor, Codex, Gemini, Amp, OpenCode — any MCP-compatible agent, forever.
|
|
13
|
+
Every retry loop, every hallucinated import, every *"let me try a different approach"* — those are billable tokens on every LLM vendor's bill. Thumbs-down once; ThumbGate blocks that exact mistake on every future call. Across Claude Code, Cursor, Codex, Gemini, Amp, Cline, OpenCode — any MCP-compatible agent, forever.
|
|
8
14
|
|
|
9
|
-
Under the hood: your thumbs-down becomes
|
|
15
|
+
Under the hood: your thumbs-down becomes one of your **Pre-Action Checks** that physically blocks the pattern **permanently** on every future call — across every session, every model, every agent. It is **self-improving agent governance**: every correction promotes a fresh prevention rule, and your library of prevention rules grows stronger with every lesson. Works with Claude Code, Cursor, Codex, Gemini CLI, Amp, Cline, OpenCode, and any MCP-compatible agent. The monthly Anthropic / OpenAI bill stops paying for the same lesson over and over — local-first enforcement, zero tokens spent on repeats.
|
|
10
16
|
|
|
11
17
|
> **Prevent expensive AI mistakes. Make AI stop repeating mistakes. Turn a smart assistant into a reliable operator.**
|
|
12
18
|
|
|
@@ -34,7 +40,7 @@ If someone is not already bought into ThumbGate, do not lead with architecture.
|
|
|
34
40
|
|
|
35
41
|
1. **Show the pain:** open the **[ThumbGate GPT](https://thumbgate-production.up.railway.app/go/gpt?utm_source=github&utm_medium=readme&utm_campaign=first_dollar_activation&cta_id=readme_first_dollar_open_gpt&cta_placement=readme_first_dollar)** and paste the bad answer, risky command, deploy, PR action, or agent plan before it runs again.
|
|
36
42
|
2. **Capture the lesson:** type `thumbs down:` or `thumbs up:` with one concrete sentence. Native ChatGPT rating buttons are not the ThumbGate capture path; typed feedback is.
|
|
37
|
-
3. **Enforce the repeat:** run `npx thumbgate init` where the agent executes so the lesson can become a Pre-Action
|
|
43
|
+
3. **Enforce the repeat:** run `npx thumbgate init` where the agent executes so the lesson can become a Pre-Action Check instead of another reminder.
|
|
38
44
|
4. **Upgrade only after proof:** Solo Pro is for the dashboard, DPO export, proof-ready evidence, and higher capture limits after one real blocked repeat. Team starts with the Workflow Hardening Sprint around one repeated failure, one owner, and one proof review.
|
|
39
45
|
|
|
40
46
|
The buying question is simple: **what repeated AI mistake would be worth blocking before the next tool call?**
|
|
@@ -64,11 +70,11 @@ That's ~$0.21 in tokens just to fix the same mistake three times — multiplied
|
|
|
64
70
|
|
|
65
71
|
```
|
|
66
72
|
Session 1: Agent force-pushes to main. You 👎 it. +4,200 tokens
|
|
67
|
-
Session 2: ⛔
|
|
73
|
+
Session 2: ⛔ Check blocks the force-push. Zero round-trip. +0 tokens
|
|
68
74
|
Session 3+: Never happens again. +0 tokens
|
|
69
75
|
```
|
|
70
76
|
|
|
71
|
-
One thumbs-down. The PreToolUse hook intercepts the call **before** it reaches the model — no input tokens, no output tokens, no retry loop. The dashboard tracks **tokens saved this week** as a live counter so you can see exactly what your prevention rules are worth. Mark a review checkpoint once, and the dashboard narrows the next pass to only the feedback, lessons, and
|
|
77
|
+
One thumbs-down. The PreToolUse hook intercepts the call **before** it reaches the model — no input tokens, no output tokens, no retry loop. The dashboard tracks **tokens saved this week** as a live counter so you can see exactly what your prevention rules are worth. Mark a review checkpoint once, and the dashboard narrows the next pass to only the feedback, lessons, and check blocks that landed since your last review.
|
|
72
78
|
|
|
73
79
|
ThumbGate doesn't make your agent smarter. It makes your agent *cheaper to be wrong with.*
|
|
74
80
|
|
|
@@ -81,10 +87,10 @@ npx thumbgate init # auto-detects your agent, wires everything
|
|
|
81
87
|
npx thumbgate capture "Never run DROP on production tables"
|
|
82
88
|
```
|
|
83
89
|
|
|
84
|
-
That single command creates a
|
|
90
|
+
That single command creates a prevention rule. Next time any AI agent tries to run `DROP` on production:
|
|
85
91
|
|
|
86
92
|
```
|
|
87
|
-
⛔
|
|
93
|
+
⛔ Check blocked: "Never run DROP on production tables"
|
|
88
94
|
Pattern: DROP.*production
|
|
89
95
|
Verdict: BLOCK
|
|
90
96
|
```
|
|
@@ -100,16 +106,33 @@ ThumbGate operates as a 4-layer enforcement stack between your AI agent and your
|
|
|
100
106
|
### Layer 1: Feedback Capture
|
|
101
107
|
Your thumbs-up/down reactions are captured via MCP protocol, CLI, or the ChatGPT GPT surface. Each reaction is stored as a structured lesson with context, timestamp, and severity.
|
|
102
108
|
|
|
103
|
-
### Layer 2:
|
|
104
|
-
The
|
|
109
|
+
### Layer 2: Check Engine
|
|
110
|
+
The check engine converts lessons into enforceable rules using pattern matching, semantic similarity (via LanceDB vectors), and Thompson Sampling for adaptive rule selection. Rules stay in local ThumbGate runtime state.
|
|
105
111
|
|
|
106
112
|
### Layer 3: Pre-Action Interception
|
|
107
|
-
Before any agent action executes, ThumbGate's `PreToolUse` hook intercepts the command and evaluates it against all active
|
|
113
|
+
Before any agent action executes, ThumbGate's `PreToolUse` hook intercepts the command and evaluates it against all active checks. This happens at the MCP protocol level — the agent physically cannot bypass it.
|
|
108
114
|
|
|
109
115
|
### Layer 4: Multi-Agent Distribution
|
|
110
|
-
|
|
116
|
+
Checks are distributed across all connected agents via MCP stdio protocol. One correction in Claude Code protects Cursor, Codex, Gemini CLI, Cline, and any MCP-compatible agent.
|
|
117
|
+
|
|
118
|
+
Prompt engineering still matters, but it is only the starting point. ThumbGate adds prompt evaluation on top: proof lanes, benchmarks, and self-heal checks tell you whether your prompt and workflow actually held up under execution instead of leaving you to guess from vibes. Run `npx thumbgate eval --from-feedback --write-report=.thumbgate/prompt-eval-proof.md` to turn real thumbs-up/down feedback into reusable eval cases and a buyer-ready proof report.
|
|
119
|
+
|
|
120
|
+
### Managed model benchmark lane
|
|
121
|
+
|
|
122
|
+
When a new managed model drops, do not swap ThumbGate over on vendor claims alone. Rank it against the actual ThumbGate workload first:
|
|
123
|
+
|
|
124
|
+
```bash
|
|
125
|
+
npx thumbgate model-candidates --workload=pretool-gating --json
|
|
126
|
+
npx thumbgate model-candidates --workload=long-trace-review --provider=openai-compatible --gateway=tinker --json
|
|
127
|
+
```
|
|
128
|
+
|
|
129
|
+
The catalog currently includes the April 23, 2026 Tinker additions:
|
|
130
|
+
|
|
131
|
+
- `tinker/qwen3.6-35b-a3b` for pre-action gating, agentic coding, and tool-use
|
|
132
|
+
- `tinker/qwen3.6-27b` for the cheap fast-path
|
|
133
|
+
- `tinker/kimi-k2.6-128k` for long-trace review and multi-agent sessions
|
|
111
134
|
|
|
112
|
-
|
|
135
|
+
Each recommendation ships with the benchmark commands to run next: feedback-derived prompt eval, `gate-eval`, and `thumbgate bench`. That keeps model selection evidence-backed instead of hype-driven.
|
|
113
136
|
|
|
114
137
|

|
|
115
138
|
|
|
@@ -126,10 +149,11 @@ Prompt engineering still matters, but it is only the starting point. ThumbGate a
|
|
|
126
149
|
| **Codex** | `npx thumbgate init --agent codex` |
|
|
127
150
|
| **Gemini CLI** | `npx thumbgate init --agent gemini` |
|
|
128
151
|
| **Amp** | `npx thumbgate init --agent amp` |
|
|
152
|
+
| **Cline** (Roo Code successor) | `npx thumbgate init --agent cline` |
|
|
129
153
|
| **Claude Desktop** | [Download extension bundle](https://github.com/IgorGanapolsky/ThumbGate/releases/latest/download/thumbgate-claude-desktop.mcpb) |
|
|
130
154
|
| **Any MCP agent** | `npx thumbgate serve` |
|
|
131
155
|
|
|
132
|
-
Works with **Claude Code, Cursor, Codex, Gemini CLI, Amp, OpenCode**, and any MCP-compatible agent.
|
|
156
|
+
Works with **Claude Code, Cursor, Codex, Gemini CLI, Amp, Cline, OpenCode**, and any MCP-compatible agent. Migrating from Roo Code (sunsetting 2026-05-15)? See [`adapters/cline/INSTALL.md`](./adapters/cline/INSTALL.md).
|
|
133
157
|
|
|
134
158
|
### Status bar proof
|
|
135
159
|
|
|
@@ -155,7 +179,7 @@ Open the Codex plugin install page or download the standalone bundle from GitHub
|
|
|
155
179
|
STEP 1 STEP 2 STEP 3
|
|
156
180
|
──────── ──────── ────────
|
|
157
181
|
|
|
158
|
-
You react ThumbGate learns The
|
|
182
|
+
You react ThumbGate learns The check holds
|
|
159
183
|
|
|
160
184
|
👎 on a bad ──► Feedback becomes ──► Next time the
|
|
161
185
|
agent action a saved lesson agent tries the
|
|
@@ -173,13 +197,13 @@ ThumbGate sells three concrete outcomes:
|
|
|
173
197
|
- **Prevent expensive AI mistakes** — catch bad commands, destructive database actions, unsafe publishes, and risky API calls before they run.
|
|
174
198
|
- **Make AI stop repeating mistakes** — fix it once, turn the lesson into a rule, and block the repeat before the next tool call lands.
|
|
175
199
|
- **Turn AI into a reliable operator** — move from a smart assistant that apologizes after damage to a production-ready operator with checkpoints, proof, and enforcement.
|
|
176
|
-
- **Measure prompts instead of rewriting them blindly** — use proof lanes, ThumbGate Bench, and `self-heal:check` to evaluate whether prompts and workflows actually improved behavior.
|
|
200
|
+
- **Measure prompts instead of rewriting them blindly** — use `thumbgate eval --from-feedback`, proof lanes, ThumbGate Bench, and `self-heal:check` to evaluate whether prompts and workflows actually improved behavior.
|
|
177
201
|
|
|
178
202
|
---
|
|
179
203
|
|
|
180
204
|
## Use Cases
|
|
181
205
|
|
|
182
|
-
- **Stop force-push to main** —
|
|
206
|
+
- **Stop force-push to main** — Check blocks `git push --force` on protected branches before it runs
|
|
183
207
|
- **Prevent repeated migration failures** — Each mistake becomes a searchable lesson that fires before the next attempt
|
|
184
208
|
- **Block unauthorized file edits** — Control which files agents can touch with path-based rules
|
|
185
209
|
- **Memory across sessions** — The agent remembers your feedback from yesterday
|
|
@@ -188,7 +212,7 @@ ThumbGate sells three concrete outcomes:
|
|
|
188
212
|
|
|
189
213
|
---
|
|
190
214
|
|
|
191
|
-
## Built-in
|
|
215
|
+
## Built-in Checks
|
|
192
216
|
|
|
193
217
|
```
|
|
194
218
|
⛔ force-push → blocks git push --force
|
|
@@ -197,7 +221,7 @@ ThumbGate sells three concrete outcomes:
|
|
|
197
221
|
⛔ package-lock-reset → blocks destructive lock edits
|
|
198
222
|
⛔ env-file-edit → blocks .env secret exposure
|
|
199
223
|
|
|
200
|
-
+ custom
|
|
224
|
+
+ custom prevention rules for project-specific failures
|
|
201
225
|
```
|
|
202
226
|
|
|
203
227
|
---
|
|
@@ -207,9 +231,9 @@ ThumbGate sells three concrete outcomes:
|
|
|
207
231
|
```bash
|
|
208
232
|
npx thumbgate init # detect agent, wire hooks
|
|
209
233
|
npx thumbgate doctor # health check
|
|
210
|
-
npx thumbgate capture # create a
|
|
234
|
+
npx thumbgate capture # create a check from text
|
|
211
235
|
npx thumbgate lessons # see what's been learned
|
|
212
|
-
npx thumbgate explore # terminal explorer for lessons,
|
|
236
|
+
npx thumbgate explore # terminal explorer for lessons, checks, stats
|
|
213
237
|
npx thumbgate native-messaging-audit # inspect local browser bridges and extension hosts
|
|
214
238
|
npx thumbgate dashboard # open local dashboard
|
|
215
239
|
npx thumbgate serve # start MCP server on stdio
|
|
@@ -222,7 +246,7 @@ npx thumbgate bench # run reliability benchmark
|
|
|
222
246
|
|
|
223
247
|
| | Free | Pro ($19/mo) | Team ($49/seat/mo) |
|
|
224
248
|
|---|---|---|---|
|
|
225
|
-
| Local CLI + enforced
|
|
249
|
+
| Local CLI + enforced checks | ✅ | ✅ | ✅ |
|
|
226
250
|
| Feedback captures (lifetime) | 3 | Unlimited | Unlimited |
|
|
227
251
|
| Auto-promoted prevention rules | 1 | Unlimited | Unlimited |
|
|
228
252
|
| MCP agent integrations | All | All | All |
|
|
@@ -233,17 +257,17 @@ npx thumbgate bench # run reliability benchmark
|
|
|
233
257
|
| Org-wide dashboard | — | — | ✅ |
|
|
234
258
|
| Approval + audit proof | — | — | ✅ |
|
|
235
259
|
|
|
236
|
-
The free tier gives you 3 lifetime feedback captures and 1 auto-promoted prevention rule — enough to prove the enforcement loop works. MCP integrations for all agents (Claude Code, Cursor, Codex, Gemini, Amp, OpenCode) ship free.
|
|
260
|
+
The free tier gives you 3 lifetime feedback captures and 1 auto-promoted prevention rule — enough to prove the enforcement loop works. MCP integrations for all agents (Claude Code, Cursor, Codex, Gemini, Amp, Cline, OpenCode) ship free.
|
|
237
261
|
|
|
238
262
|
Pro ($19/mo or $149/yr) lifts those caps and adds history-aware lesson recall, lesson search, DPO export, and a personal dashboard. Team ($49/seat/mo) adds a shared hosted lesson DB, org dashboard, and shared enforcement across the org. Pro and Team include `open_feedback_session`, `append_feedback_context`, and `finalize_feedback_session` for structured multi-turn feedback capture.
|
|
239
263
|
|
|
240
|
-
**Best first paid motion for teams:** the **Workflow Hardening Sprint** — qualify one repeated failure before committing to a full rollout. **[Start intake →](https://
|
|
264
|
+
**Best first paid motion for teams:** the **Workflow Hardening Sprint** — qualify one repeated failure before committing to a full rollout. **[Start intake →](https://usethumbgate.com/?utm_source=github&utm_medium=readme&utm_campaign=team_rollout#workflow-sprint-intake)**
|
|
241
265
|
|
|
242
266
|
**Best first technical motion:** install the CLI first and let `init` wire hooks for the agent you already use.
|
|
243
267
|
|
|
244
|
-
**Paid path for individual operators:** [ThumbGate Pro](https://
|
|
268
|
+
**Paid path for individual operators:** [ThumbGate Pro](https://usethumbgate.com/pro?utm_source=github&utm_medium=readme&utm_campaign=pro_page) is the self-serve side lane for a personal dashboard and export-ready evidence.
|
|
245
269
|
|
|
246
|
-
**[Start free](https://
|
|
270
|
+
**[Start free](https://usethumbgate.com/?utm_source=github&utm_medium=readme)** · **[See Pro](https://usethumbgate.com/pro?utm_source=github&utm_medium=readme)** · **[Team Sprint intake](https://usethumbgate.com/?utm_source=github&utm_medium=readme#workflow-sprint-intake)**
|
|
247
271
|
|
|
248
272
|
---
|
|
249
273
|
|
|
@@ -295,7 +319,7 @@ The export bundle includes full lesson metadata: signal, title, context, tags, f
|
|
|
295
319
|
|
|
296
320
|
## DPO Export for Fine-Tuning (Pro + Team)
|
|
297
321
|
|
|
298
|
-
Every thumbs-up and thumbs-down becomes a training signal. ThumbGate Pro exports your captured feedback as DPO (Direct Preference Optimization) pairs — ready to feed into a LoRA fine-tune so your model stops repeating known mistakes at the weight level, not just the
|
|
322
|
+
Every thumbs-up and thumbs-down becomes a training signal. ThumbGate Pro exports your captured feedback as DPO (Direct Preference Optimization) pairs — ready to feed into a LoRA fine-tune so your model stops repeating known mistakes at the weight level, not just the check level.
|
|
299
323
|
|
|
300
324
|
**Export DPO pairs:**
|
|
301
325
|
|
|
@@ -313,9 +337,9 @@ curl -X POST http://localhost:3456/v1/dpo/export \
|
|
|
313
337
|
**Use cases:**
|
|
314
338
|
- Fine-tune Llama 3 / Mistral / local models with a LoRA adapter trained on your real mistakes
|
|
315
339
|
- Feed into RLAIF or KTO pipelines (KTO export also available via `/v1/kto/export`)
|
|
316
|
-
- Build a model that natively avoids your team's known failure patterns — no
|
|
340
|
+
- Build a model that natively avoids your team's known failure patterns — no check at inference time needed
|
|
317
341
|
|
|
318
|
-
**Why this matters:**
|
|
342
|
+
**Why this matters:** Checks block mistakes. Fine-tuning prevents them from being attempted. Combine both for belt-and-suspenders governance.
|
|
319
343
|
|
|
320
344
|
---
|
|
321
345
|
|
|
@@ -326,7 +350,7 @@ curl -X POST http://localhost:3456/v1/dpo/export \
|
|
|
326
350
|
| **Storage** | SQLite + FTS5, LanceDB vectors, JSONL logs |
|
|
327
351
|
| **Capture** | 3 feedback captures lifetime (free), unlimited (Pro) |
|
|
328
352
|
| **Intelligence** | MemAlign dual recall, Thompson Sampling |
|
|
329
|
-
| **Enforcement** | PreToolUse hook engine,
|
|
353
|
+
| **Enforcement** | PreToolUse hook engine, Checks config |
|
|
330
354
|
| **Interfaces** | MCP stdio, HTTP API, CLI (Node.js >=18) |
|
|
331
355
|
| **Billing** | Stripe |
|
|
332
356
|
| **Execution** | Railway, Cloudflare Workers, Docker Sandboxes |
|
|
@@ -336,9 +360,9 @@ Every Changeset is tied to the exact `main` merge commit and generates Verificat
|
|
|
336
360
|
|
|
337
361
|
---
|
|
338
362
|
|
|
339
|
-
**Popular buyer questions:** **[Stop repeated AI agent mistakes](https://
|
|
363
|
+
**Popular buyer questions:** **[AI search topical presence](https://usethumbgate.com/guides/ai-search-topical-presence?utm_source=github&utm_medium=readme&utm_campaign=buyer_questions)** · **[Relational knowledge and AI recommendations](https://usethumbgate.com/guides/relational-knowledge-ai-recommendations?utm_source=github&utm_medium=readme&utm_campaign=buyer_questions)** · **[Stop repeated AI agent mistakes](https://usethumbgate.com/guides/stop-repeated-ai-agent-mistakes?utm_source=github&utm_medium=readme&utm_campaign=buyer_questions)** · **[Browser automation safety](https://usethumbgate.com/guides/browser-automation-safety?utm_source=github&utm_medium=readme&utm_campaign=buyer_questions)** · **[Native messaging host security](https://usethumbgate.com/guides/native-messaging-host-security?utm_source=github&utm_medium=readme&utm_campaign=buyer_questions)** · **[Autoresearch agent safety](https://usethumbgate.com/guides/autoresearch-agent-safety?utm_source=github&utm_medium=readme&utm_campaign=buyer_questions)** · **[Cursor guardrails](https://usethumbgate.com/guides/cursor-agent-guardrails?utm_source=github&utm_medium=readme&utm_campaign=buyer_questions)** · **[Codex CLI guardrails](https://usethumbgate.com/guides/codex-cli-guardrails?utm_source=github&utm_medium=readme&utm_campaign=buyer_questions)** · **[Gemini CLI memory + enforcement](https://usethumbgate.com/guides/gemini-cli-feedback-memory?utm_source=github&utm_medium=readme&utm_campaign=buyer_questions)**
|
|
340
364
|
|
|
341
|
-
**[Workflow Hardening Sprint](https://
|
|
365
|
+
**[Workflow Hardening Sprint](https://usethumbgate.com/?utm_source=github&utm_medium=readme&utm_campaign=top_cta#workflow-sprint-intake)** · **[Live Dashboard](https://usethumbgate.com/dashboard?utm_source=github&utm_medium=readme&utm_campaign=top_cta)**
|
|
342
366
|
|
|
343
367
|
---
|
|
344
368
|
|
|
@@ -348,7 +372,7 @@ Every Changeset is tied to the exact `main` merge commit and generates Verificat
|
|
|
348
372
|
- **[Claude Desktop Extension](https://github.com/IgorGanapolsky/ThumbGate/releases/latest/download/thumbgate-claude-desktop.mcpb)** — One-click install for Claude Desktop
|
|
349
373
|
- **[Codex Plugin](https://thumbgate-production.up.railway.app/codex-plugin)** — Auto-updating standalone bundle and install page for Codex CLI
|
|
350
374
|
- **[Perplexity Command Center](docs/PERPLEXITY_MAX_COMMAND_CENTER.md)** — AI-search visibility + lead discovery
|
|
351
|
-
- **[ThumbGate Bench](docs/THUMBGATE_BENCH.md)** — Reliability benchmark for
|
|
375
|
+
- **[ThumbGate Bench](docs/THUMBGATE_BENCH.md)** — Reliability benchmark for check evaluation
|
|
352
376
|
- **[Manus AI Skill](skills/thumbgate/SKILL.md)** — ThumbGate integration for Manus AI agents
|
|
353
377
|
|
|
354
378
|
---
|
|
@@ -376,10 +400,10 @@ Free and self-hosted users can invoke `search_lessons` directly through MCP, and
|
|
|
376
400
|
No. ThumbGate does not update model weights. It captures feedback, stores lessons, injects context at runtime, and blocks bad actions before they execute.
|
|
377
401
|
|
|
378
402
|
**How is this different from CLAUDE.md or .cursorrules?**
|
|
379
|
-
Those are suggestions the agent can ignore. ThumbGate
|
|
403
|
+
Those are suggestions the agent can ignore. ThumbGate checks are enforced — they physically block the action before it runs. They also auto-generate from feedback instead of requiring manual writing.
|
|
380
404
|
|
|
381
405
|
**Does it work with my agent?**
|
|
382
|
-
If it supports MCP or pre-action hooks, yes. Claude Code, Claude Desktop, Cursor, Codex, Gemini CLI, Amp, OpenCode all work out of the box.
|
|
406
|
+
If it supports MCP or pre-action hooks, yes. Claude Code, Claude Desktop, Cursor, Codex, Gemini CLI, Amp, Cline, and OpenCode all work out of the box.
|
|
383
407
|
|
|
384
408
|
**Is it free?**
|
|
385
409
|
The free tier gives you 3 lifetime feedback captures and 1 auto-promoted prevention rule — enough to prove the enforcement loop works. MCP integrations ship free for every agent.
|
|
@@ -399,7 +423,7 @@ Pro ($19/mo or $149/yr) lifts those caps and adds history-aware lesson recall, l
|
|
|
399
423
|
- [Agent Workflow Contract](WORKFLOW.md) — the agent-run contract for all ThumbGate operations
|
|
400
424
|
- [Ready for Agent Intake](https://github.com/IgorGanapolsky/ThumbGate/issues/new?template=ready-for-agent.yml) — ready-for-agent intake template
|
|
401
425
|
- [SEO Guide: Claude Code Guardrails](docs/learn/claude-code-guardrails.md)
|
|
402
|
-
- [
|
|
426
|
+
- [ThumbGate-Core](https://github.com/IgorGanapolsky/ThumbGate-Core) — private core for hosted overlays, ranking, policy synthesis, billing intelligence, and org/team workflows
|
|
403
427
|
|
|
404
428
|
---
|
|
405
429
|
|
|
@@ -751,6 +751,34 @@ paths:
|
|
|
751
751
|
$ref: '#/components/schemas/FunnelAnalyticsResponse'
|
|
752
752
|
'401':
|
|
753
753
|
description: Unauthorized
|
|
754
|
+
/v1/analytics/losses:
|
|
755
|
+
get:
|
|
756
|
+
operationId: getLossAnalytics
|
|
757
|
+
parameters:
|
|
758
|
+
- in: query
|
|
759
|
+
name: window
|
|
760
|
+
schema:
|
|
761
|
+
type: string
|
|
762
|
+
enum: [today, 7d, 30d, lifetime]
|
|
763
|
+
- in: query
|
|
764
|
+
name: timezone
|
|
765
|
+
schema:
|
|
766
|
+
type: string
|
|
767
|
+
- in: query
|
|
768
|
+
name: now
|
|
769
|
+
schema:
|
|
770
|
+
type: string
|
|
771
|
+
format: date-time
|
|
772
|
+
responses:
|
|
773
|
+
'200':
|
|
774
|
+
description: Ranked buyer-loss and revenue-opportunity analysis for the active analytics window
|
|
775
|
+
content:
|
|
776
|
+
application/json:
|
|
777
|
+
schema:
|
|
778
|
+
type: object
|
|
779
|
+
additionalProperties: true
|
|
780
|
+
'401':
|
|
781
|
+
description: Unauthorized
|
|
754
782
|
/v1/dashboard:
|
|
755
783
|
get:
|
|
756
784
|
operationId: getDashboard
|
|
@@ -848,10 +876,79 @@ paths:
|
|
|
848
876
|
application/json:
|
|
849
877
|
schema:
|
|
850
878
|
type: object
|
|
851
|
-
required: [toolName]
|
|
852
879
|
properties:
|
|
853
880
|
toolName:
|
|
854
881
|
type: string
|
|
882
|
+
description: Tool name is optional when provider-native tool call payload is supplied.
|
|
883
|
+
provider:
|
|
884
|
+
type: string
|
|
885
|
+
model:
|
|
886
|
+
type: string
|
|
887
|
+
providerToolCall:
|
|
888
|
+
type: object
|
|
889
|
+
additionalProperties: true
|
|
890
|
+
toolCall:
|
|
891
|
+
type: object
|
|
892
|
+
additionalProperties: true
|
|
893
|
+
toolUse:
|
|
894
|
+
type: object
|
|
895
|
+
additionalProperties: true
|
|
896
|
+
content:
|
|
897
|
+
type: array
|
|
898
|
+
items:
|
|
899
|
+
type: object
|
|
900
|
+
additionalProperties: true
|
|
901
|
+
input:
|
|
902
|
+
type: object
|
|
903
|
+
additionalProperties: true
|
|
904
|
+
arguments:
|
|
905
|
+
type: object
|
|
906
|
+
additionalProperties: true
|
|
907
|
+
method:
|
|
908
|
+
type: string
|
|
909
|
+
params:
|
|
910
|
+
type: object
|
|
911
|
+
additionalProperties: true
|
|
912
|
+
mcp:
|
|
913
|
+
type: object
|
|
914
|
+
additionalProperties: true
|
|
915
|
+
mcpToolCall:
|
|
916
|
+
type: object
|
|
917
|
+
additionalProperties: true
|
|
918
|
+
usage:
|
|
919
|
+
type: object
|
|
920
|
+
additionalProperties: true
|
|
921
|
+
tokenEstimate:
|
|
922
|
+
type: number
|
|
923
|
+
costUsd:
|
|
924
|
+
type: number
|
|
925
|
+
budget:
|
|
926
|
+
type: object
|
|
927
|
+
additionalProperties: true
|
|
928
|
+
workflowPattern:
|
|
929
|
+
type: string
|
|
930
|
+
enum: [single_action, chaining, routing, parallelization, evaluator-optimizer, agent]
|
|
931
|
+
workflow:
|
|
932
|
+
type: object
|
|
933
|
+
additionalProperties: true
|
|
934
|
+
goal:
|
|
935
|
+
type: string
|
|
936
|
+
tools:
|
|
937
|
+
type: array
|
|
938
|
+
items:
|
|
939
|
+
type: string
|
|
940
|
+
branches:
|
|
941
|
+
type: array
|
|
942
|
+
items:
|
|
943
|
+
type: string
|
|
944
|
+
steps:
|
|
945
|
+
type: array
|
|
946
|
+
items:
|
|
947
|
+
type: string
|
|
948
|
+
routes:
|
|
949
|
+
type: array
|
|
950
|
+
items:
|
|
951
|
+
type: string
|
|
855
952
|
command:
|
|
856
953
|
type: string
|
|
857
954
|
filePath:
|
|
@@ -868,6 +965,25 @@ paths:
|
|
|
868
965
|
type: boolean
|
|
869
966
|
requireVersionNotBehindBase:
|
|
870
967
|
type: boolean
|
|
968
|
+
workflowDispatch:
|
|
969
|
+
type: object
|
|
970
|
+
description: Evidence required before running `gh workflow run` or another environment-specific workflow dispatch.
|
|
971
|
+
properties:
|
|
972
|
+
environment:
|
|
973
|
+
type: string
|
|
974
|
+
description: Requested environment such as dev, staging, beta, or release.
|
|
975
|
+
workflow:
|
|
976
|
+
type: string
|
|
977
|
+
description: Expected workflow file or workflow name.
|
|
978
|
+
ref:
|
|
979
|
+
type: string
|
|
980
|
+
description: Expected branch or ref passed to the workflow dispatch command.
|
|
981
|
+
sha:
|
|
982
|
+
type: string
|
|
983
|
+
description: Expected HEAD SHA to verify before and after dispatch.
|
|
984
|
+
job:
|
|
985
|
+
type: string
|
|
986
|
+
description: Expected job name to verify before reporting the workflow URL.
|
|
871
987
|
responses:
|
|
872
988
|
'200':
|
|
873
989
|
description: Persisted workflow-sentinel recommendation with decision-control metadata and actionId
|
|
@@ -1121,7 +1237,7 @@ paths:
|
|
|
1121
1237
|
description: Comma-separated tags that must all be present on a lesson.
|
|
1122
1238
|
responses:
|
|
1123
1239
|
'200':
|
|
1124
|
-
description: Searchable promoted lessons with linked corrective actions, prevention rules, and auto-
|
|
1240
|
+
description: Searchable promoted lessons with linked corrective actions, prevention rules, and auto-promoted checks
|
|
1125
1241
|
'401':
|
|
1126
1242
|
description: Unauthorized
|
|
1127
1243
|
/v1/search:
|
|
@@ -2,13 +2,13 @@
|
|
|
2
2
|
"mcpServers": {
|
|
3
3
|
"thumbgate": {
|
|
4
4
|
"command": "npx",
|
|
5
|
-
"args": ["--yes", "--package", "thumbgate@1.
|
|
5
|
+
"args": ["--yes", "--package", "thumbgate@1.16.1", "thumbgate", "serve"]
|
|
6
6
|
}
|
|
7
7
|
},
|
|
8
8
|
"hooks": {
|
|
9
9
|
"preToolUse": {
|
|
10
10
|
"command": "npx",
|
|
11
|
-
"args": ["--yes", "--package", "thumbgate@1.
|
|
11
|
+
"args": ["--yes", "--package", "thumbgate@1.16.1", "thumbgate", "gate-check"]
|
|
12
12
|
}
|
|
13
13
|
}
|
|
14
14
|
}
|