thumbgate 1.27.4 → 1.27.7
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/.claude/commands/dashboard.md +15 -0
- package/.claude/commands/thumbgate-blocked.md +27 -0
- package/.claude/commands/thumbgate-dashboard.md +15 -0
- package/.claude/commands/thumbgate-doctor.md +30 -0
- package/.claude/commands/thumbgate-guard.md +36 -0
- package/.claude/commands/thumbgate-protect.md +30 -0
- package/.claude/commands/thumbgate-rules.md +30 -0
- package/.claude-plugin/plugin.json +2 -1
- package/.well-known/llms.txt +6 -2
- package/.well-known/mcp/server-card.json +1 -1
- package/README.md +49 -5
- package/adapters/claude/.mcp.json +2 -2
- package/adapters/letta/README.md +41 -0
- package/adapters/letta/thumbgate-letta-adapter.js +133 -0
- package/adapters/mcp/server-stdio.js +16 -1
- package/adapters/opencode/opencode.json +1 -1
- package/adapters/policy-engine/ethicore-guardian-client.js +68 -0
- package/adapters/policy-engine/thumbgate-policy-engine-adapter.js +260 -0
- package/bench/observability-eval-suite.json +26 -0
- package/bin/cli.js +230 -6
- package/bin/postinstall.js +1 -1
- package/commands/dashboard.md +15 -0
- package/commands/thumbgate-dashboard.md +15 -0
- package/config/gate-templates.json +84 -0
- package/config/gates/claim-verification.json +12 -0
- package/config/gates/default.json +20 -0
- package/config/github-about.json +1 -1
- package/config/model-candidates.json +50 -0
- package/config/post-deploy-marketing-pages.json +5 -0
- package/package.json +67 -25
- package/public/agent-manager.html +41 -1
- package/public/agents-cost-savings.html +1 -1
- package/public/ai-malpractice-prevention.html +2 -1
- package/public/assets/brand/github-social-preview.png +0 -0
- package/public/assets/brand/thumbgate-icon-512.png +0 -0
- package/public/assets/brand/thumbgate-icon-pro-512.png +0 -0
- package/public/assets/brand/thumbgate-icon-team-512.png +0 -0
- package/public/assets/brand/thumbgate-logo-1200x360.png +0 -0
- package/public/assets/brand/thumbgate-mark-inline.svg +15 -0
- package/public/assets/brand/thumbgate-mark-pro.svg +23 -0
- package/public/assets/brand/thumbgate-mark-team.svg +26 -0
- package/public/assets/brand/thumbgate-mark.svg +15 -0
- package/public/assets/brand/thumbgate-wordmark.svg +20 -0
- package/public/assets/claude-thumbgate-statusbar.svg +8 -0
- package/public/assets/codex-thumbgate-statusbar-test.svg +9 -0
- package/public/assets/legal-intake-control-flow.svg +66 -0
- package/public/blog.html +1 -1
- package/public/brand/thumbgate-mark.svg +15 -0
- package/public/brand/thumbgate-og.svg +16 -0
- package/public/codex-enterprise.html +1 -1
- package/public/codex-plugin.html +1 -1
- package/public/compare.html +23 -3
- package/public/dashboard.html +316 -30
- package/public/federal.html +1 -1
- package/public/guide.html +5 -4
- package/public/index.html +167 -49
- package/public/js/buyer-intent.js +672 -0
- package/public/learn.html +88 -7
- package/public/lessons.html +2 -1
- package/public/numbers.html +3 -3
- package/public/pricing.html +63 -15
- package/public/pro.html +7 -7
- package/scripts/activation-quickstart.js +187 -0
- package/scripts/agent-memory-lifecycle.js +211 -0
- package/scripts/async-eval-observability.js +236 -0
- package/scripts/auto-promote-gates.js +75 -4
- package/scripts/billing.js +12 -1
- package/scripts/build-metadata.js +24 -3
- package/scripts/cli-schema.js +42 -10
- package/scripts/dashboard-chat.js +53 -7
- package/scripts/dashboard.js +12 -17
- package/scripts/export-databricks-bundle.js +5 -1
- package/scripts/export-dpo-pairs.js +7 -2
- package/scripts/feedback-aggregate.js +281 -0
- package/scripts/feedback-loop.js +121 -0
- package/scripts/filesystem-search.js +35 -10
- package/scripts/gates-engine.js +234 -7
- package/scripts/gemini-embedding-policy.js +2 -1
- package/scripts/hook-stop-anti-claim.js +227 -0
- package/scripts/hook-thumbgate-cache-updater.js +18 -2
- package/scripts/hybrid-feedback-context.js +1 -0
- package/scripts/lesson-inference.js +8 -3
- package/scripts/lesson-search.js +17 -1
- package/scripts/operational-integrity.js +39 -5
- package/scripts/plausible-domain-config.js +15 -2
- package/scripts/plausible-server-events.js +4 -4
- package/scripts/rate-limiter.js +12 -6
- package/scripts/secret-redaction.js +166 -0
- package/scripts/security-scanner.js +100 -0
- package/scripts/self-distill-agent.js +3 -1
- package/scripts/self-harness-optimizer.js +141 -0
- package/scripts/seo-gsd.js +635 -0
- package/scripts/statusline-cache-path.js +17 -2
- package/scripts/statusline-cache-read.js +57 -0
- package/scripts/statusline-local-stats.js +9 -1
- package/scripts/statusline-meta.js +5 -2
- package/scripts/statusline.sh +13 -1
- package/scripts/sync-telemetry-from-prod.js +374 -0
- package/scripts/telemetry-analytics.js +9 -0
- package/scripts/thumbgate-search.js +85 -19
- package/scripts/tool-contract-validator.js +76 -0
- package/scripts/vector-store.js +44 -0
- package/scripts/workspace-evolver.js +62 -2
- package/src/api/server.js +862 -146
package/scripts/seo-gsd.js
CHANGED
|
@@ -105,6 +105,11 @@ const HIGH_ROI_QUERY_SEEDS = [
|
|
|
105
105
|
93,
|
|
106
106
|
'Fresh Slack engineering pattern where ThumbGate can gate director journals, critic reviews, credibility scoring, and timelines for long-running agents.',
|
|
107
107
|
),
|
|
108
|
+
querySeed(
|
|
109
|
+
'agent context governance',
|
|
110
|
+
95,
|
|
111
|
+
'Fresh AdaCoM, tokenmaxxing, and Claude Managed Agents demand where ThumbGate can govern context hygiene, session logs, sandbox boundaries, credential separation, and pre-action proof.',
|
|
112
|
+
),
|
|
108
113
|
querySeed(
|
|
109
114
|
'reasoning compression guardrails',
|
|
110
115
|
92,
|
|
@@ -170,6 +175,16 @@ const HIGH_ROI_QUERY_SEEDS = [
|
|
|
170
175
|
95,
|
|
171
176
|
'Bottom-of-funnel query for teams ready to add human approval and evidence requirements before AI agents touch risky tools.',
|
|
172
177
|
),
|
|
178
|
+
querySeed(
|
|
179
|
+
'agentic web governance',
|
|
180
|
+
94,
|
|
181
|
+
'Fresh Cloudflare bot-majority demand: buyers need machine-readable pages and pre-action governance now that AI agents can create more web actions than humans.',
|
|
182
|
+
),
|
|
183
|
+
querySeed(
|
|
184
|
+
'database safety for ai agents',
|
|
185
|
+
96,
|
|
186
|
+
'Fresh database-agent risk query from the 2026 DB/AI conversation: agents can hallucinate UI, but SQL writes, migrations, and role grants can destroy production data.',
|
|
187
|
+
),
|
|
173
188
|
{
|
|
174
189
|
query: 'thumbs up thumbs down feedback for ai coding agents',
|
|
175
190
|
businessValue: 95,
|
|
@@ -224,6 +239,12 @@ const HIGH_ROI_QUERY_SEEDS = [
|
|
|
224
239
|
source: 'seed',
|
|
225
240
|
notes: 'Integration page for Gemini CLI users who need memory plus enforcement.',
|
|
226
241
|
},
|
|
242
|
+
{
|
|
243
|
+
query: 'hermes agent guardrails',
|
|
244
|
+
businessValue: 84,
|
|
245
|
+
source: 'seed',
|
|
246
|
+
notes: 'Integration page for Hermes Agent users who need pre-action gates around persistent memory, generated skills, messaging gateways, scheduled automations, and sandboxed execution.',
|
|
247
|
+
},
|
|
227
248
|
{
|
|
228
249
|
query: 'roo code alternative cline',
|
|
229
250
|
businessValue: 83,
|
|
@@ -495,6 +516,69 @@ const GOVERN_CLAUDE_FOR_LEGAL_GUIDE_SPEC = Object.freeze({
|
|
|
495
516
|
relatedPaths: ['/guides/ai-coding-agent-zero-trust', '/guides/pre-action-checks'],
|
|
496
517
|
});
|
|
497
518
|
|
|
519
|
+
// Content spec for the "Claude Code PreToolUse hook" guide page.
//
// Positioning rationale: the page goes after the IDE-security vocabulary that
// Cycode's Feb 2026 blog popularized as enterprise hook names (PreToolUse /
// beforeMCPExecution / beforeReadFile). It is meant to occupy the indie/MIT
// slot beneath funded vendors when LLM answer engines
// (Perplexity/ChatGPT/Gemini/Claude/Grok) cite sources for "how do I stop
// Claude Code from running dangerous commands" buyer-intent queries. See the
// verified-absence finding in the 2026-06-05 deep-research report.
//
// Shape:
//   slug         - guide slug string
//   meta         - query / title / heroTitle / heroSummary strings
//   takeaways    - array of summary strings
//   sections     - array of [kind, heading, entries] tuples, where kind is
//                  'paragraphs' or 'bullets'
//   faq          - array of [question, answerText] pairs
//   relatedPaths - array of site paths
//
// Only the outer object is frozen (Object.freeze is shallow); the nested
// objects and arrays are left as ordinary mutable values.
const PRETOOLUSE_HOOK_GUIDE_SPEC = (() => {
  // Tuple constructors so every section entry below reads as "kind(heading, entries)".
  const paragraphs = (heading, entries) => ['paragraphs', heading, entries];
  const bullets = (heading, entries) => ['bullets', heading, entries];

  const slug = 'claude-code-pretooluse-hook';

  const meta = {
    query: 'claude code pretooluse hook block mcp tool calls',
    title: 'Claude Code PreToolUse Hook | Block MCP Tool Calls Before They Run',
    heroTitle: 'Claude Code PreToolUse Hook: Block MCP Tool Calls Before They Run',
    heroSummary: 'The PreToolUse hook is the boundary where you intercept what a Claude Code, Cursor, or Codex agent is about to do — before the rm -rf, before the bad git push, before the destructive SQL. ThumbGate is the local-first, MIT-licensed CLI that ships production-grade PreToolUse, beforeMCPExecution, and beforeReadFile gating with one npx command, and learns from every thumbs-down so the same mistake never reaches the tool call twice.',
  };

  const takeaways = [
    'PreToolUse is the only hook point where you can stop a destructive agent action — by the time PostToolUse fires, the damage is done.',
    'ThumbGate ships PreToolUse, beforeMCPExecution, and beforeReadFile gates out of the box for Claude Code, Cursor, Codex, Gemini CLI, Amp, Cline, and any MCP-compatible agent — no hand-written hook scripts to maintain per machine.',
    'A thumbs-down on a blocked action becomes an auto-promoted prevention rule that holds across every session, model, and agent — the part DIY hook repos cannot do.',
  ];

  const sections = [
    paragraphs('What the PreToolUse hook actually is', [
      'In the Model Context Protocol agent loop, every tool the model calls — Bash, Edit, Write, a custom MCP server method — flows through a PreToolUse phase before execution. That phase is the only place where an external policy can intercept the call, inspect its arguments, and decide whether to allow, modify, warn, or deny it. PostToolUse fires after the side effect has already happened, which is too late for destructive actions.',
      'beforeMCPExecution, beforeReadFile, and beforeSubmitPrompt are the same idea applied at the MCP and IDE layers. Cycode\'s February 2026 IDE-security blog popularized this naming for enterprise customers; ThumbGate ships the same hook surface as an open-source CLI you can install in 30 seconds.',
    ]),
    bullets('What ThumbGate blocks at PreToolUse out of the box', [
      'Catastrophic shell: rm -rf at home/root, sudo wrapping a dangerous command, find -delete on sensitive paths.',
      'Secret exfiltration: writes that contain API keys, tokens, or .env contents heading to the wrong directory.',
      'Workflow-scope violations: edits outside the declared task scope, off-branch git push, accidental main commits.',
      'Repeated mistakes from this team: anything you\'ve already given a thumbs-down in a past session — auto-promoted to a hard prevention rule.',
      'MCP tool calls flagged by your project\'s gate config — pattern, severity, or learned-from-feedback rules.',
    ]),
    paragraphs('Why DIY PreToolUse scripts stop working past week two', [
      'A hand-rolled hook script starts simple: a regex on the Bash command, a list of forbidden paths. By week two it has six edge cases, no test coverage, and lives in one machine\'s .claude directory — invisible to the rest of the team. By week four someone deletes it because it false-positived once on a legitimate command and nobody documented why.',
      'ThumbGate ships the rules as a versioned config, the feedback loop as a CLI, the learning as cross-session prevention rules, and the proof as an audit trail your dashboard renders. The work you would do by hand on hooks, done once and shared.',
    ]),
  ];

  // Each entry is a [question, answerText] pair.
  const faq = [
    [
      'Is the PreToolUse hook the same as beforeMCPExecution?',
      'Conceptually yes — both are the pre-execution interception point. PreToolUse is the Claude Code / Anthropic CLI term for the hook in the agent loop. beforeMCPExecution (and beforeReadFile, beforeSubmitPrompt) is the IDE-security framing popularized by Cycode for the same boundary at the MCP layer. ThumbGate implements all of them as one local-first gate engine.',
    ],
    [
      'Do I need this if Claude Code already has native hooks?',
      'Native hooks give you the hook point. They do not give you the rule set, the cross-session learning, the team-wide rule sharing, or the audit trail. ThumbGate ships those on top of the hook so you stop maintaining bespoke scripts and start blocking the repeat mistakes specifically your agents make.',
    ],
    [
      'Does this run locally or call a cloud service?',
      'Local-first. The PreToolUse decision happens in the hook process on your machine in milliseconds — no network round-trip, no cloud dependency, no data leaving the laptop. Optional hosted sync exists for teams that want to share rules across seats.',
    ],
  ];

  const relatedPaths = [
    '/guides/mcp-tool-governance',
    '/guides/ai-agent-pre-action-approval-gates',
    '/guides/ai-coding-agent-zero-trust',
  ];

  // Property order is kept as slug, meta, takeaways, sections, faq, relatedPaths.
  return Object.freeze({ slug, meta, takeaways, sections, faq, relatedPaths });
})();
|
|
571
|
+
|
|
572
|
+
/**
 * Builds the page entry for the Claude Code PreToolUse hook guide from
 * PRETOOLUSE_HOOK_GUIDE_SPEC.
 *
 * The spec's meta fields are spread into the options object as-is, each
 * [kind, heading, entries] section tuple is passed through
 * buildSectionFromSpec, and each [question, text] FAQ pair is passed through
 * answer. Takeaways and related paths are forwarded by reference.
 *
 * @returns {*} Whatever preActionGuide returns for this slug and options.
 */
function buildPretooluseHookGuide() {
  const { slug, meta, takeaways, sections, faq, relatedPaths } = PRETOOLUSE_HOOK_GUIDE_SPEC;

  // Sections are expanded before FAQ entries, matching the property order of
  // the options object handed to preActionGuide.
  const builtSections = sections.map(([kind, heading, entries]) => buildSectionFromSpec(kind, heading, entries));
  const builtFaq = faq.map(([question, text]) => answer(question, text));

  return preActionGuide(slug, {
    ...meta,
    takeaways,
    sections: builtSections,
    faq: builtFaq,
    relatedPaths,
  });
}
|
|
581
|
+
|
|
498
582
|
function buildGovernClaudeForLegalGuide() {
|
|
499
583
|
return preActionGuide(GOVERN_CLAUDE_FOR_LEGAL_GUIDE_SPEC.slug, {
|
|
500
584
|
...GOVERN_CLAUDE_FOR_LEGAL_GUIDE_SPEC.meta,
|
|
@@ -1546,6 +1630,68 @@ function buildAiRecommendationVisibilityGuide(spec) {
|
|
|
1546
1630
|
}
|
|
1547
1631
|
|
|
1548
1632
|
const PAGE_BLUEPRINTS = [
|
|
1633
|
+
{
|
|
1634
|
+
query: 'snowflake cortex agent governance vs local coding agent guardrails',
|
|
1635
|
+
path: '/compare/snowflake-cortex-agent-governance',
|
|
1636
|
+
pageType: 'comparison',
|
|
1637
|
+
pillar: 'comparison',
|
|
1638
|
+
title: 'ThumbGate vs Snowflake Cortex Agent Governance | Two Different Layers',
|
|
1639
|
+
heroTitle: 'ThumbGate vs Snowflake Cortex Agent Governance',
|
|
1640
|
+
heroSummary: 'At Snowflake Summit 2026, agent governance became headline infrastructure: Cortex CoCo runs under your existing RBAC inside Snowflake\'s perimeter, and the Natoma acquisition adds a permission gateway built to freeze out rogue agents. That is the right model for agents operating inside the data cloud. But the coding agent in your terminal acts earlier and lower in the stack: Claude Code, Cursor, and Codex run rm -rf, force-push to main, and write secrets to disk on your own machine, under your own credentials, before any platform RBAC ever sees the request. ThumbGate is the local-first PreToolUse layer for exactly that surface. They are not competitors — they are different layers of the same defense.',
|
|
1641
|
+
takeaways: [
|
|
1642
|
+
'Snowflake Cortex and Natoma govern what an agent does inside the enterprise data perimeter — server-side, under RBAC, with a full audit trail. The right tool when the agent\'s actions are SQL and data access inside Snowflake.',
|
|
1643
|
+
'ThumbGate governs what a coding agent does on the developer\'s machine — rm -rf, force-push, secret writes, off-scope edits — in the PreToolUse hook, before execution, before any platform sees the request.',
|
|
1644
|
+
'The two compose. A coding agent that force-pushes broken code or leaks a key never reached Snowflake\'s perimeter to be governed there; that failure happens in the dev loop, which is the layer ThumbGate owns.',
|
|
1645
|
+
],
|
|
1646
|
+
sections: [
|
|
1647
|
+
{
|
|
1648
|
+
heading: 'The boundary in one sentence',
|
|
1649
|
+
paragraphs: [
|
|
1650
|
+
'Snowflake Cortex governs what an agent is allowed to do once it is operating inside Snowflake — querying tables, accessing data, taking actions under your RBAC, with prompt-injection guardrails and an audit trail. Natoma extends that to a permission gateway across enterprise apps.',
|
|
1651
|
+
'ThumbGate governs what a coding agent does on the developer\'s machine, in the PreToolUse hook, before the tool call executes — the rm -rf, the git push --force, the secret written to disk. That happens in the terminal, under the developer\'s own credentials, before any platform boundary exists to enforce it.',
|
|
1652
|
+
],
|
|
1653
|
+
},
|
|
1654
|
+
{
|
|
1655
|
+
heading: 'Choose Snowflake Cortex / Natoma governance when',
|
|
1656
|
+
bullets: [
|
|
1657
|
+
'Your agents operate inside the Snowflake data cloud and the risk you manage is data access and SQL under enterprise RBAC.',
|
|
1658
|
+
'You need centralized, server-side policy and audit across enterprise applications and identities.',
|
|
1659
|
+
'Your buyer is a data or platform team standardizing agent access at the organization level.',
|
|
1660
|
+
],
|
|
1661
|
+
},
|
|
1662
|
+
{
|
|
1663
|
+
heading: 'Choose ThumbGate when',
|
|
1664
|
+
bullets: [
|
|
1665
|
+
'Your risk is a coding agent on a developer\'s machine — Claude Code, Cursor, Codex, Gemini, Amp, Cline, OpenCode — running destructive shell, git, or filesystem actions.',
|
|
1666
|
+
'You want enforcement in the PreToolUse hook, before execution, with zero server and zero rollout — npx thumbgate init in 30 seconds.',
|
|
1667
|
+
'You want a learning loop: a thumbs-down on a blocked action becomes an auto-promoted prevention rule that holds across every session and every agent.',
|
|
1668
|
+
'You want least-privilege task scope and a local audit trail of every blocked action — not only inside one platform\'s perimeter.',
|
|
1669
|
+
],
|
|
1670
|
+
},
|
|
1671
|
+
{
|
|
1672
|
+
heading: 'Why the two layers do not overlap',
|
|
1673
|
+
paragraphs: [
|
|
1674
|
+
'Snowflake validated the thesis the whole category now agrees on: agents need a control layer that decides what they can do before they do it, not an audit log after the damage. At Summit 2026 they made it headline infrastructure and acquired Natoma to enforce it across the enterprise.',
|
|
1675
|
+
'But platform governance can only act on requests that reach the platform. A coding agent that force-pushes broken code, deletes a directory, or commits a secret has already done the damage on the developer\'s machine — that action never traveled to Snowflake to be governed. ThumbGate is the enforcement point for that earlier, lower layer. If you run AI coding agents and AI inside your data cloud, you want both: ThumbGate at the dev loop, platform governance at the data layer.',
|
|
1676
|
+
],
|
|
1677
|
+
},
|
|
1678
|
+
],
|
|
1679
|
+
faq: [
|
|
1680
|
+
{
|
|
1681
|
+
question: 'Is ThumbGate an alternative to Snowflake Cortex agent governance?',
|
|
1682
|
+
answer: 'Not exactly — they govern different layers. Snowflake Cortex and Natoma govern agents operating inside the enterprise data cloud under RBAC. ThumbGate governs coding agents on the developer\'s machine in the PreToolUse hook, before any action reaches a platform. If your risk is a coding agent running rm -rf or force-pushing to main, ThumbGate is the right layer; if your risk is data access inside Snowflake, Cortex is. Most teams running both AI coding agents and AI in their data cloud want both.',
|
|
1683
|
+
},
|
|
1684
|
+
{
|
|
1685
|
+
question: 'Does ThumbGate require a server or enterprise rollout like Natoma?',
|
|
1686
|
+
answer: 'No. ThumbGate is local-first: npx thumbgate init wires the PreToolUse hook on your machine in about 30 seconds, with no server, no gateway, and no platform rollout. Natoma is a server-side permission gateway for enterprise applications; ThumbGate runs entirely in the developer\'s local agent loop. That is the deliberate difference in surface.',
|
|
1687
|
+
},
|
|
1688
|
+
{
|
|
1689
|
+
question: 'Snowflake says agentic security needs a fundamentally different approach. Does ThumbGate agree?',
|
|
1690
|
+
answer: 'Yes — and ThumbGate has been built on that premise from day one. The shared thesis is that you enforce before the action, not after: a deterministic pre-action gate, not a model reviewing its own output. Snowflake applies that inside the data perimeter; ThumbGate applies it at the coding-agent layer on the developer\'s machine. The agreement on the model is exactly why the two compose rather than compete.',
|
|
1691
|
+
},
|
|
1692
|
+
],
|
|
1693
|
+
relatedPaths: ['/compare/claude-code-hooks-mastery', '/guides/ai-agent-pre-action-approval-gates', '/guides/background-agent-governance'],
|
|
1694
|
+
},
|
|
1549
1695
|
{
|
|
1550
1696
|
query: 'thumbgate vs speclock',
|
|
1551
1697
|
path: '/compare/speclock',
|
|
@@ -1649,6 +1795,7 @@ const PAGE_BLUEPRINTS = [
|
|
|
1649
1795
|
buildSemanticPseoGuide(),
|
|
1650
1796
|
buildZeroTrustGuide(),
|
|
1651
1797
|
buildGovernClaudeForLegalGuide(),
|
|
1798
|
+
buildPretooluseHookGuide(),
|
|
1652
1799
|
buildProxyPointerRagGuide(),
|
|
1653
1800
|
buildRagPrecisionTuningGuide(),
|
|
1654
1801
|
buildAiEngineeringStackGuide(),
|
|
@@ -1709,6 +1856,136 @@ const PAGE_BLUEPRINTS = [
|
|
|
1709
1856
|
],
|
|
1710
1857
|
relatedPaths: ['/guides/code-knowledge-graph-guardrails', '/guides/agent-harness-optimization', '/guides/pre-action-checks'],
|
|
1711
1858
|
},
|
|
1859
|
+
{
|
|
1860
|
+
query: 'thumbgate vs cycode ai coding agent guardrails',
|
|
1861
|
+
path: '/compare/cycode',
|
|
1862
|
+
pageType: 'comparison',
|
|
1863
|
+
pillar: 'comparison',
|
|
1864
|
+
title: 'ThumbGate vs Cycode | Local-First MIT Alternative for AI Agent Guardrails',
|
|
1865
|
+
heroTitle: 'ThumbGate vs Cycode',
|
|
1866
|
+
heroSummary: 'Cycode ships IDE-native security guardrails for enterprise AppSec teams — agent-time scanning, beforeMCPExecution / beforeReadFile / beforeSubmitPrompt hooks, and integration with their broader code-security platform. ThumbGate is the local-first, MIT-licensed CLI that ships the same PreToolUse / MCP-tool-call gating surface as an open-source npm install — and adds a learning loop where every thumbs-down becomes an auto-promoted prevention rule the team shares.',
|
|
1867
|
+
takeaways: [
|
|
1868
|
+
'Cycode is enterprise IDE security: agent-time scanning + hook interception + platform integration with their broader AppSec suite.',
|
|
1869
|
+
'ThumbGate ships the same PreToolUse / beforeMCPExecution surface as an MIT-licensed CLI you install in 30 seconds — no platform contract, no procurement cycle.',
|
|
1870
|
+
'The decision is mostly company-shape: enterprise security teams take Cycode; solo devs, OSS maintainers, and small teams take ThumbGate. The learning-loop (thumbs-down → prevention rule across sessions) is something Cycode does not advertise.',
|
|
1871
|
+
],
|
|
1872
|
+
sections: [
|
|
1873
|
+
{
|
|
1874
|
+
heading: 'The product difference in one sentence',
|
|
1875
|
+
paragraphs: [
|
|
1876
|
+
'Cycode is "IDE security for the enterprise" — its February 2026 announcement positions the agent-time hooks (beforeSubmitPrompt, beforeReadFile, beforeMCPExecution) as one module of a broader AppSec platform that also covers secrets, SAST, SCA, and supply chain.',
|
|
1877
|
+
'ThumbGate is a single-purpose, open-source, local-first CLI for the same hook surface. The lexicon is the same; the buyer is different. ThumbGate optimizes for a developer who can `npx thumbgate init` and have working PreToolUse gating before lunch.',
|
|
1878
|
+
],
|
|
1879
|
+
},
|
|
1880
|
+
{
|
|
1881
|
+
heading: 'Choose Cycode when',
|
|
1882
|
+
bullets: [
|
|
1883
|
+
'You have an enterprise AppSec team that needs a unified vendor across secrets, SAST, SCA, supply-chain, and the new agent-time hook layer.',
|
|
1884
|
+
'You need centralized policy management, RBAC, SIEM integration, and a procurement-ready contract with SOC2 / ISO-grade artifacts.',
|
|
1885
|
+
'Your security org wants one dashboard for IDE-time and CI/CD-time security posture across the whole repo footprint.',
|
|
1886
|
+
],
|
|
1887
|
+
},
|
|
1888
|
+
{
|
|
1889
|
+
heading: 'Choose ThumbGate when',
|
|
1890
|
+
bullets: [
|
|
1891
|
+
'You want PreToolUse / beforeMCPExecution gating working in 30 seconds via `npx thumbgate init` — no contract, no platform install, no procurement.',
|
|
1892
|
+
'You want a learning loop: a thumbs-down on a blocked action becomes an auto-promoted prevention rule that holds across every session, model, and agent.',
|
|
1893
|
+
'You are a solo developer, OSS maintainer, or small team that wants MIT-licensed code you can read, fork, and verify — not a closed-source SaaS.',
|
|
1894
|
+
'You want the gating engine to run entirely on the developer machine with zero network egress for the hook decision itself.',
|
|
1895
|
+
],
|
|
1896
|
+
},
|
|
1897
|
+
{
|
|
1898
|
+
heading: 'What the two products share',
|
|
1899
|
+
paragraphs: [
|
|
1900
|
+
'Both put the enforcement boundary at the same place — the agent\'s tool call, before execution — and both name the hooks the same way (PreToolUse / beforeMCPExecution / beforeReadFile). The category lexicon is the same because the underlying agent loop is the same.',
|
|
1901
|
+
'The disagreement is on packaging. Cycode wraps it in an enterprise platform contract; ThumbGate ships it as an MIT-licensed CLI. If you are an enterprise security team buying a platform, you are not the ThumbGate buyer. If you are a developer who wants to type `npx thumbgate init` and have agent gating running before the next standup, Cycode is over-scoped for you.',
|
|
1902
|
+
],
|
|
1903
|
+
},
|
|
1904
|
+
],
|
|
1905
|
+
faq: [
|
|
1906
|
+
{
|
|
1907
|
+
question: 'Is ThumbGate a direct replacement for Cycode\'s agent-time hooks?',
|
|
1908
|
+
answer: 'For the hook surface itself — PreToolUse, beforeMCPExecution, beforeReadFile — yes. For the broader Cycode AppSec platform (secrets scanning, SAST, SCA, supply chain), no. ThumbGate is single-purpose: agent-time tool-call gating with a learning loop. If you only need that, ThumbGate replaces the Cycode agent-time module at zero license cost.',
|
|
1909
|
+
},
|
|
1910
|
+
{
|
|
1911
|
+
question: 'Why would I pick MIT-licensed local-first over a funded enterprise vendor?',
|
|
1912
|
+
answer: 'Three reasons. (1) Cost: no per-seat license. (2) Speed of adoption: `npx thumbgate init` is faster than enterprise procurement. (3) Auditability: you can read the gate-engine code, modify it, and run it offline. The trade-off is you do not get a platform contract, RBAC, or a single vendor for all your AppSec needs. That is a fine trade-off for a solo dev or small team; it is the wrong trade-off for a regulated enterprise.',
|
|
1913
|
+
},
|
|
1914
|
+
{
|
|
1915
|
+
question: 'Does Cycode have the cross-session learning loop?',
|
|
1916
|
+
answer: 'Not advertised on their public materials as of the February 2026 announcement. Cycode\'s hooks are policy-driven; ThumbGate adds a feedback-to-rules pipeline where a thumbs-down on a blocked action becomes an auto-promoted prevention rule that holds across every session and every agent on the same install.',
|
|
1917
|
+
},
|
|
1918
|
+
{
|
|
1919
|
+
question: 'Can I use both?',
|
|
1920
|
+
answer: 'Technically yes — Cycode at the enterprise platform layer, ThumbGate as the developer-local fast loop — but most teams will pick one. They occupy the same hook surface, so running both means resolving who wins on conflicts. The simpler pattern is to pick by buyer profile: enterprise security team buys Cycode, individual developer / small team installs ThumbGate.',
|
|
1921
|
+
},
|
|
1922
|
+
],
|
|
1923
|
+
relatedPaths: ['/guides/claude-code-pretooluse-hook', '/guides/mcp-tool-governance', '/guides/ai-coding-agent-zero-trust'],
|
|
1924
|
+
},
|
|
1925
|
+
{
|
|
1926
|
+
query: 'thumbgate vs disler claude code hooks mastery',
|
|
1927
|
+
path: '/compare/claude-code-hooks-mastery',
|
|
1928
|
+
pageType: 'comparison',
|
|
1929
|
+
pillar: 'comparison',
|
|
1930
|
+
title: 'ThumbGate vs disler/claude-code-hooks-mastery | When to Pick the OSS Tool',
|
|
1931
|
+
heroTitle: 'ThumbGate vs disler/claude-code-hooks-mastery',
|
|
1932
|
+
heroSummary: 'disler/claude-code-hooks-mastery is the most-starred community repo for Claude Code hooks — a comprehensive, free, MIT-licensed example library you can copy-paste into your own .claude/ config. ThumbGate is a published npm CLI that does the same gating work plus a learning loop where every thumbs-down becomes an auto-promoted prevention rule that holds across sessions, models, and agents. The disler repo is where you START; ThumbGate is what you USE when you stop wanting to maintain hook scripts by hand.',
|
|
1933
|
+
takeaways: [
|
|
1934
|
+
'disler/claude-code-hooks-mastery is a free reference repo of hook examples — you copy them into .claude/, edit, and maintain per-machine, per-project.',
|
|
1935
|
+
'ThumbGate ships the same gating engine as one `npx thumbgate init` install — versioned config, cross-session prevention rules, dashboard, audit trail.',
|
|
1936
|
+
'The right path: start with the disler repo to learn what is possible; move to ThumbGate when you find yourself maintaining hook scripts in three projects.',
|
|
1937
|
+
],
|
|
1938
|
+
sections: [
|
|
1939
|
+
{
|
|
1940
|
+
heading: 'The product difference in one sentence',
|
|
1941
|
+
paragraphs: [
|
|
1942
|
+
'disler/claude-code-hooks-mastery is a GitHub repository of high-quality example hooks you read, learn from, and copy into your own setup. ThumbGate is a published CLI that ships the gating engine as a runnable tool with cross-session learning, a dashboard, and an audit trail.',
|
|
1943
|
+
'Both are MIT-licensed. Both run locally. The disagreement is whether you want to read example scripts and own the maintenance, or install a tool that does the work and stays in sync.',
|
|
1944
|
+
],
|
|
1945
|
+
},
|
|
1946
|
+
{
|
|
1947
|
+
heading: 'Choose disler/claude-code-hooks-mastery when',
|
|
1948
|
+
bullets: [
|
|
1949
|
+
'You want to learn how Claude Code hooks actually work by reading well-written examples.',
|
|
1950
|
+
'You are happy maintaining your own .claude/ config per project and per machine.',
|
|
1951
|
+
'You only need static pattern-matching — no need for cross-session learning, dashboard, or audit history.',
|
|
1952
|
+
'You explicitly do not want any installed dependency beyond what you author yourself.',
|
|
1953
|
+
],
|
|
1954
|
+
},
|
|
1955
|
+
{
|
|
1956
|
+
heading: 'Choose ThumbGate when',
|
|
1957
|
+
bullets: [
|
|
1958
|
+
'You want PreToolUse gating working in 30 seconds via `npx thumbgate init` — no copy-paste, no per-machine setup.',
|
|
1959
|
+
'You want the learning loop: a thumbs-down on a blocked action becomes an auto-promoted prevention rule that holds across every session and every agent on the install.',
|
|
1960
|
+
'You want a dashboard showing what was blocked, why, and which feedback became which rule — auditable evidence, not just hook scripts on disk.',
|
|
1961
|
+
'You want one gate engine that works across Claude Code, Cursor, Codex, Gemini CLI, Amp, Cline, and OpenCode — not a separate copy-paste exercise per agent.',
|
|
1962
|
+
'You operate on more than one project and do not want to maintain N copies of the same hook scripts.',
|
|
1963
|
+
],
|
|
1964
|
+
},
|
|
1965
|
+
{
|
|
1966
|
+
heading: 'What the disler repo does brilliantly',
|
|
1967
|
+
paragraphs: [
|
|
1968
|
+
'It is the best public reference for what a Claude Code PreToolUse hook can do — clear examples, real patterns, MIT-licensed code you can read end-to-end in an afternoon. If you are evaluating the category, that repo is required reading. It also has 3,000+ stars at the time of writing for a reason: the examples are good.',
|
|
1969
|
+
'ThumbGate is not trying to replace that learning resource. The disler repo is where you understand the surface; ThumbGate is what you use when you decide to ship gating in production and want the cross-session learning, the dashboard, and the team-shared rule library that copy-paste cannot give you.',
|
|
1970
|
+
],
|
|
1971
|
+
},
|
|
1972
|
+
],
|
|
1973
|
+
faq: [
|
|
1974
|
+
{
|
|
1975
|
+
question: 'Why pay $19/mo for ThumbGate Pro when disler hooks are free?',
|
|
1976
|
+
answer: 'Free disler hooks are static patterns you maintain per machine — re-copying them when they change, debugging false positives alone, and re-applying them in every new project. ThumbGate Pro adds the learning loop (thumbs-down → cross-session prevention rule), the dashboard, hosted sync across machines, and adapter maintenance across the weekly breaking-change cycle of Claude Code, Cursor, and Cline. Free disler is the right answer if you only ever work in one project on one machine and never want to learn from past mistakes. Pro is the right answer when those assumptions stop holding.',
|
|
1977
|
+
},
|
|
1978
|
+
{
|
|
1979
|
+
question: 'Is ThumbGate just a packaged version of disler/claude-code-hooks-mastery?',
|
|
1980
|
+
answer: 'No. ThumbGate ships its own gate engine, feedback-to-rules pipeline, dashboard, and audit trail. The disler repo is a reference of well-written hook scripts you copy into your config; ThumbGate is a runnable CLI that ships the gate engine and adds a learning layer on top. Both are MIT-licensed and both rely on the same Claude Code PreToolUse hook surface — that is where the similarity ends.',
|
|
1981
|
+
},
|
|
1982
|
+
{
|
|
1983
|
+
question: 'Should I start with disler or ThumbGate?',
|
|
1984
|
+
answer: 'If you want to understand the category, read the disler repo first — it is the best public reference for what hooks can do. If you want gating working now without authoring scripts, run `npx thumbgate init`. Most users end up doing both: read disler to learn, install ThumbGate when they decide they would rather use a tool than maintain scripts.',
|
|
1985
|
+
},
|
|
1986
|
+
],
|
|
1987
|
+
relatedPaths: ['/guides/claude-code-pretooluse-hook', '/compare/cycode', '/guides/pre-action-checks'],
|
|
1988
|
+
},
|
|
1712
1989
|
buildClaudeCodeSkillsGuide(),
|
|
1713
1990
|
buildLongRunningAgentContextGuide(),
|
|
1714
1991
|
buildReasoningCompressionGuide(),
|
|
@@ -1825,6 +2102,68 @@ const PAGE_BLUEPRINTS = [
|
|
|
1825
2102
|
],
|
|
1826
2103
|
relatedPaths: ['/guides/pre-action-checks', '/guides/agent-harness-optimization', '/guides/ai-search-topical-presence'],
|
|
1827
2104
|
},
|
|
2105
|
+
{
|
|
2106
|
+
query: 'database safety for ai agents',
|
|
2107
|
+
path: '/guides/database-agent-safety',
|
|
2108
|
+
pageType: 'guide',
|
|
2109
|
+
pillar: 'pre-action-checks',
|
|
2110
|
+
title: 'Database Safety for AI Agents | ThumbGate Guide',
|
|
2111
|
+
heroTitle: 'Database Safety for AI Agents',
|
|
2112
|
+
heroSummary: 'AI agents can write code quickly, but database actions need stricter gates: a hallucinated SQL write, migration, role grant, or production config change can destroy data before review.',
|
|
2113
|
+
takeaways: [
|
|
2114
|
+
'Databases are the highest-blast-radius tool surface for autonomous coding agents.',
|
|
2115
|
+
'The winning pattern is not an AI DBA autopilot alone; it is a pre-action approval boundary before SQL, migrations, and privilege changes run.',
|
|
2116
|
+
'ThumbGate turns repeated database mistakes into rules that block or pause the next risky query before execution.',
|
|
2117
|
+
],
|
|
2118
|
+
sections: [
|
|
2119
|
+
{
|
|
2120
|
+
heading: 'Why database work is the final boss for agents',
|
|
2121
|
+
paragraphs: [
|
|
2122
|
+
'A bad UI component is visible and usually reversible. A bad production query can delete rows, lock writes, leak data, or change privileges before anyone reviews the pull request.',
|
|
2123
|
+
'That is why database-agent safety belongs at the tool-call boundary. The agent should be stopped before it runs DROP, TRUNCATE, unbounded UPDATE/DELETE, production migrations, or role grants.',
|
|
2124
|
+
],
|
|
2125
|
+
},
|
|
2126
|
+
{
|
|
2127
|
+
heading: 'The high-ROI gate pack',
|
|
2128
|
+
bullets: [
|
|
2129
|
+
'Block DROP, TRUNCATE, DROP DATABASE, and DROP SCHEMA unless human approval and rollback evidence are attached.',
|
|
2130
|
+
'Block UPDATE and DELETE without a restrictive WHERE clause, including WHERE 1=1 and WHERE TRUE.',
|
|
2131
|
+
'Require backup, snapshot, or reversible migration proof before production schema changes.',
|
|
2132
|
+
'Require dry-run or EXPLAIN evidence before production writes and migrations.',
|
|
2133
|
+
'Warn on CREATE INDEX without CONCURRENTLY and CROSS JOINs that can create performance incidents.',
|
|
2134
|
+
'Block role creation, role alteration, and broad grants from autonomous agents.',
|
|
2135
|
+
],
|
|
2136
|
+
},
|
|
2137
|
+
{
|
|
2138
|
+
heading: 'Where ThumbGate fits',
|
|
2139
|
+
paragraphs: [
|
|
2140
|
+
'ThumbGate is not trying to replace Postgres, MySQL, Prisma, Rails migrations, or a DBA. It is the pre-action control plane that checks the agent before those tools execute.',
|
|
2141
|
+
'The feedback loop matters: when a human gives a thumbs-down on an unsafe migration or query, ThumbGate can promote the failure pattern into a prevention rule so the next agent run cannot repeat it silently.',
|
|
2142
|
+
],
|
|
2143
|
+
},
|
|
2144
|
+
{
|
|
2145
|
+
heading: 'First workflow to gate',
|
|
2146
|
+
paragraphs: [
|
|
2147
|
+
'Start with one production migration path. Require the agent to show target environment, dry-run output, backup or snapshot evidence, rollback plan, and human approval before it can run the command. That single workflow makes the value visible to engineering leaders immediately.',
|
|
2148
|
+
],
|
|
2149
|
+
},
|
|
2150
|
+
],
|
|
2151
|
+
faq: [
|
|
2152
|
+
{
|
|
2153
|
+
question: 'Should AI agents be allowed to run production database migrations?',
|
|
2154
|
+
answer: 'Only behind an approval gate. Production migrations should require target verification, dry-run output, backup or snapshot evidence, rollback plan, and human approval before the command executes.',
|
|
2155
|
+
},
|
|
2156
|
+
{
|
|
2157
|
+
question: 'What database actions should be blocked by default?',
|
|
2158
|
+
answer: 'DROP, TRUNCATE, DROP DATABASE, DROP SCHEMA, role or grant changes, unbounded UPDATE or DELETE, and production migrations without rollback and dry-run evidence should be blocked or paused before execution.',
|
|
2159
|
+
},
|
|
2160
|
+
{
|
|
2161
|
+
question: 'Is this an AI DBA replacement?',
|
|
2162
|
+
answer: 'No. ThumbGate is the governance layer before an agent touches database tooling. It blocks known-bad actions and requires proof for risky actions; DBAs and platform teams still own database design and operations.',
|
|
2163
|
+
},
|
|
2164
|
+
],
|
|
2165
|
+
relatedPaths: ['/guides/pre-action-checks', '/guides/ai-agent-pre-action-approval-gates', '/guides/best-tools-stop-ai-agents-breaking-production'],
|
|
2166
|
+
},
|
|
1828
2167
|
buildHarnessOptimizationGuide(),
|
|
1829
2168
|
buildCodeKnowledgeGraphGuardrailsGuide(),
|
|
1830
2169
|
buildDeveloperMachineSupplyChainGuardrailsGuide(),
|
|
@@ -2074,6 +2413,234 @@ const PAGE_BLUEPRINTS = [
|
|
|
2074
2413
|
],
|
|
2075
2414
|
relatedPaths: ['/compare/mem0', '/guides/stop-repeated-ai-agent-mistakes'],
|
|
2076
2415
|
},
|
|
2416
|
+
{
|
|
2417
|
+
query: 'hermes agent guardrails',
|
|
2418
|
+
path: '/guides/hermes-agent-guardrails',
|
|
2419
|
+
pageType: 'integration',
|
|
2420
|
+
pillar: 'agent-workflows',
|
|
2421
|
+
title: 'Hermes Agent Guardrails | Firewall for Self-Improving Agents',
|
|
2422
|
+
heroTitle: 'Hermes Agent can grow with you. ThumbGate keeps the growing agent safe.',
|
|
2423
|
+
heroSummary: 'Hermes Agent points at the next wave: persistent memory, generated skills, messaging gateways, scheduled automations, and sandboxed execution. ThumbGate is the enforcement layer those workflows need before a remembered mistake becomes another real tool call.',
|
|
2424
|
+
takeaways: [
|
|
2425
|
+
'Hermes validates the market shift toward long-running, self-improving agents.',
|
|
2426
|
+
'Memory and generated skills increase leverage, but they also increase the blast radius of repeated mistakes.',
|
|
2427
|
+
'ThumbGate should be positioned as the local-first pre-action firewall for Hermes-style agents, not as a general agent clone.',
|
|
2428
|
+
],
|
|
2429
|
+
sections: [
|
|
2430
|
+
{
|
|
2431
|
+
heading: 'Why Hermes-style agents need a separate execution gate',
|
|
2432
|
+
paragraphs: [
|
|
2433
|
+
'A persistent agent can remember projects, generate its own skills, run scheduled automations, and accept instructions from messaging gateways. That is powerful, but it also means one bad habit can persist longer and reach more surfaces.',
|
|
2434
|
+
'The safety problem is not only whether the agent remembers. It is whether remembered lessons can stop the next risky shell command, git action, database write, deploy, browser click, or payment workflow before execution.',
|
|
2435
|
+
],
|
|
2436
|
+
},
|
|
2437
|
+
{
|
|
2438
|
+
heading: 'What ThumbGate adds to Hermes-style workflows',
|
|
2439
|
+
bullets: [
|
|
2440
|
+
'Pre-action checks before risky tool calls execute.',
|
|
2441
|
+
'Thumbs-down feedback that becomes explicit prevention rules.',
|
|
2442
|
+
'Evidence requirements for deploys, migrations, API calls, and production-facing changes.',
|
|
2443
|
+
'Audit trails that show which lesson, rule, and workflow context allowed or blocked the action.',
|
|
2444
|
+
'A local-first path for teams that want agent memory without handing every correction to a hosted black box.',
|
|
2445
|
+
],
|
|
2446
|
+
},
|
|
2447
|
+
{
|
|
2448
|
+
heading: 'The buyer message',
|
|
2449
|
+
paragraphs: [
|
|
2450
|
+
'Hermes can be the agent that grows with you. ThumbGate is the firewall that makes sure growth does not mean repeating expensive mistakes faster across more surfaces.',
|
|
2451
|
+
'For teams evaluating persistent agents, the practical first step is not another prompt. It is one enforced rule from one real failure, proven locally, then expanded into Pro or a workflow hardening sprint when the risk is recurring.',
|
|
2452
|
+
],
|
|
2453
|
+
},
|
|
2454
|
+
],
|
|
2455
|
+
faq: [
|
|
2456
|
+
{
|
|
2457
|
+
question: 'Does ThumbGate replace Hermes Agent?',
|
|
2458
|
+
answer: 'No. Hermes is a general self-improving agent surface. ThumbGate is the enforcement layer that can sit around Hermes-style workflows so risky actions are checked before execution.',
|
|
2459
|
+
},
|
|
2460
|
+
{
|
|
2461
|
+
question: 'What Hermes features create the biggest need for guardrails?',
|
|
2462
|
+
answer: 'Persistent memory, generated skills, messaging gateways, scheduled automations, browser and tool control, and sandbox backends all increase the value of pre-action gates because the agent can act longer, faster, and from more entry points.',
|
|
2463
|
+
},
|
|
2464
|
+
{
|
|
2465
|
+
question: 'What should teams implement first?',
|
|
2466
|
+
answer: 'Start with one repeated failure pattern: force-push, destructive SQL, unsafe deploy, risky browser action, or off-scope file edit. Capture it once, convert it into a prevention rule, and require evidence before the next similar action runs.',
|
|
2467
|
+
},
|
|
2468
|
+
],
|
|
2469
|
+
relatedPaths: ['/guides/long-running-agent-context-management', '/guides/background-agent-governance', '/guides/browser-automation-safety'],
|
|
2470
|
+
},
|
|
2471
|
+
{
|
|
2472
|
+
query: 'safe self evolution',
|
|
2473
|
+
path: '/guides/safe-self-evolution',
|
|
2474
|
+
pageType: 'guide',
|
|
2475
|
+
pillar: 'agent-workflows',
|
|
2476
|
+
title: 'Safe Self-Evolution | Autonomous Prompt Optimization without Regression',
|
|
2477
|
+
heroTitle: 'Self-Evolution is Polarizing. Make It Safe with Execution Gates.',
|
|
2478
|
+
heroSummary: 'Hermes-style autonomous agents learn by observing their own execution failures and automatically rewriting their skills or instructions. But critics warn that blind self-evolution can overwrite stable patterns and introduce silent regressions. ThumbGate introduces the Safe Self-Evolution loop: weakness mining from explicit thumbs-down feedback, automated prompt optimization, local verification suites, and atomic git rollbacks.',
|
|
2479
|
+
takeaways: [
|
|
2480
|
+
'Self-improving agents need execution guardrails so a synthesized skill cannot bypass safety constraints.',
|
|
2481
|
+
'Blind self-evolution is unstable; ThumbGate ensures prompt changes are verified against a local holdout suite before committing.',
|
|
2482
|
+
'Rollback capability is mandatory: if validation fails, the evolution engine immediately reverts prompts to the last known-good state.',
|
|
2483
|
+
'Explicit feedback is the anchor: optimize based on real thumbs-down signals, not hallucinatory failure guesses.'
|
|
2484
|
+
],
|
|
2485
|
+
sections: [
|
|
2486
|
+
{
|
|
2487
|
+
heading: 'The self-evolution dilemma',
|
|
2488
|
+
paragraphs: [
|
|
2489
|
+
'Nous Research’s Hermes Agent points at a future where developers do not write static instructions like CLAUDE.md. Instead, the agent learns from its execution failures and modifies its own SKILL.md files in real-time. This dynamic adaptation yields massive speedups and handles custom codebase quirks autonomously.',
|
|
2490
|
+
'However, the critics are correct: when an agent has the power to edit its own rules without a verification gate, it will eventually overwrite a perfectly stable skill. This introduces regressions, makes debugging impossible, and can lead to security loops where the agent modifies its own guardrails to make a failing task pass.'
|
|
2491
|
+
]
|
|
2492
|
+
},
|
|
2493
|
+
{
|
|
2494
|
+
heading: 'Safe self-evolution with ThumbGate',
|
|
2495
|
+
paragraphs: [
|
|
2496
|
+
'ThumbGate implements a Safe Self-Evolution loop (based on the Self-Harness paradigm) that gives you the speed of self-improving agents without the instability:',
|
|
2497
|
+
'1. Explicit Weakness Mining: ThumbGate captures structured thumbs-up/down signals on agent actions and compiles them into a JSON log, avoiding random self-diagnosis.',
|
|
2498
|
+
'2. Harness Proposal: The self-harness-optimizer automatically formats these rules and injects them directly into the agent’s prompt instructions (AGENTS.md, GEMINI.md).',
|
|
2499
|
+
'3. Verification Gate: Before the updated prompts are committed, the optimizer runs a local quick verification suite and holdout tests.',
|
|
2500
|
+
'4. Atomic Rollback: If any test fails, the optimizer instantly reverts the workspace prompts and restores the previous snapshot. If they pass, it commits the update to Git.'
|
|
2501
|
+
]
|
|
2502
|
+
},
|
|
2503
|
+
{
|
|
2504
|
+
heading: 'Competing with blind self-improvement',
|
|
2505
|
+
paragraphs: [
|
|
2506
|
+
'To compete with agents like Hermes, you do not need to give up control of your codebase. You need a pre-action firewall and a prompt optimizer that treats rule generation as code changes—complete with tests, verification, and rollbacks.',
|
|
2507
|
+
'This keeps your agent fast, keeps your instructions dynamic, and ensures your production-facing surfaces remain secure.'
|
|
2508
|
+
]
|
|
2509
|
+
}
|
|
2510
|
+
],
|
|
2511
|
+
faq: [
|
|
2512
|
+
{
|
|
2513
|
+
question: 'Does ThumbGate prevent the agent from changing its own rules?',
|
|
2514
|
+
answer: 'Yes. ThumbGate scans newly generated skills and prompt updates against established rules to prevent the agent from bypassing safety gates or deleting security constraints.'
|
|
2515
|
+
},
|
|
2516
|
+
{
|
|
2517
|
+
question: 'How does the rollback mechanism work?',
|
|
2518
|
+
answer: 'When the self-harness optimizer proposes new prompt sections, it saves a snapshot of the current prompt files. It then runs the verification commands. If the status is non-zero, it restores the backup files.'
|
|
2519
|
+
},
|
|
2520
|
+
{
|
|
2521
|
+
question: 'Is this compatible with Hermes Agent?',
|
|
2522
|
+
answer: 'Yes. You can use ThumbGate as the pre-action gate around a Hermes Agent deployment to secure the skills it generates and the messaging channels it posts to.'
|
|
2523
|
+
}
|
|
2524
|
+
],
|
|
2525
|
+
relatedPaths: ['/guides/hermes-agent-guardrails', '/guides/agent-context-governance', '/guides/stop-repeated-ai-agent-mistakes'],
|
|
2526
|
+
},
|
|
2527
|
+
{
|
|
2528
|
+
query: 'agent context governance',
|
|
2529
|
+
path: '/guides/agent-context-governance',
|
|
2530
|
+
pageType: 'guide',
|
|
2531
|
+
pillar: 'pre-action-checks',
|
|
2532
|
+
title: 'Agent Context Governance | Stop Tokenmaxxing Drift Before Agents Act',
|
|
2533
|
+
heroTitle: 'More Context Is Not Governance. Clean Context Plus Action Gates Is.',
|
|
2534
|
+
heroSummary: 'AdaCoM-style context managers, the tokenmaxxing backlash, Claude Managed Agents, anti-rubber-stamp response prompts, model-provenance scares, ChatGPT Lockdown Mode, MCP routing attacks, resilient graph architectures, rising AI-authored code volume, AI email assistants, platform-agent orchestration, on-device QAT models, and backprop-style failure attribution all point to the same buyer need: long-running agents need structured intent, cleaner context, durable session logs, approved models, isolated execution, credential boundaries, tool lockdown, direct pushback, distributed gates, provenance, and pre-action checks before they touch real systems.',
|
|
2535
|
+
takeaways: [
|
|
2536
|
+
'Long-context agents get better when a separate manager rewrites, preserves, prunes, or merges working context before the next step.',
|
|
2537
|
+
'Tokenmaxxing creates uncontrolled spend and weak governance when teams cannot prove which agent work returned value.',
|
|
2538
|
+
'Managed-agent architectures decouple the brain, hands, sessions, credentials, and sandboxes; ThumbGate adds the local-first action gate around those boundaries.',
|
|
2539
|
+
'Response customization should become a gate too: no padded agreement, no vague completion claims, and no confident answer without evidence or blind-spot checks.',
|
|
2540
|
+
'Lockdown modes validate the egress-control story: sensitive workflows need tool-surface limits, not just better prompts.',
|
|
2541
|
+
'Model leaks and proxy resale scares make approved-provider checks a governance requirement, especially when frontier model cost is high.',
|
|
2542
|
+
'MCP security research makes local config integrity a first-class control: endpoint rewrites and token-routing changes must be monitored before agents act.',
|
|
2543
|
+
'Random-graph infrastructure suggests a governance architecture: use many small local gates that degrade proportionally instead of one central approval bottleneck.',
|
|
2544
|
+
'As AI-authored code volume rises, teams need provenance and evidence gates so generated diffs are attributable, tested, and owned before merge.',
|
|
2545
|
+
'AI customer-response assistants need draft governance: retrieved sources, prompt variables, category routing, and feedback should improve drafts without letting the agent send unsupported claims.',
|
|
2546
|
+
'Enterprise agent platforms need one shared execution contract: structured specs, approved tools, scoped permissions, retries, evals, and traceability instead of 100 fragile team-specific agents.',
|
|
2547
|
+
'On-device QAT models can reduce cost and preserve privacy for first-pass risk classification, but they should escalate rather than approve high-risk actions.',
|
|
2548
|
+
'Backpropagation suggests a useful product metaphor: trace the agent run graph, score local risk at each edge, and cache the blame path so the same failure is blocked faster next time.',
|
|
2549
|
+
],
|
|
2550
|
+
sections: [
|
|
2551
|
+
{
|
|
2552
|
+
heading: 'Why this matters now',
|
|
2553
|
+
paragraphs: [
|
|
2554
|
+
'The market is moving away from prompt-only agents. New research shows that a separate context manager can improve long-horizon work without retraining the main agent. At the same time, developer teams are realizing that simply buying more tokens does not create accountable engineering process.',
|
|
2555
|
+
'Claude Managed Agents adds the production vocabulary buyers now expect: agents, environments, sessions, sandbox isolation, credential separation, event logs, observability, permission policies, outcomes, and webhooks. ThumbGate should attach to that vocabulary as the pre-action governance layer.',
|
|
2556
|
+
],
|
|
2557
|
+
},
|
|
2558
|
+
{
|
|
2559
|
+
heading: 'What ThumbGate should enforce',
|
|
2560
|
+
bullets: [
|
|
2561
|
+
'Context hygiene gate: block high-risk actions when the agent is acting from raw chat history, stale memory, or unresolved contradictions.',
|
|
2562
|
+
'Session evidence gate: require an append-only event log, resumable session ID, and proof links before long-running work can deploy, charge, message, or mutate production data.',
|
|
2563
|
+
'Sandbox boundary gate: require isolated execution and explicit network or filesystem scope before generated code runs.',
|
|
2564
|
+
'Credential boundary gate: block actions where tool credentials live beside generated code or where the action lacks user/on-behalf-of attribution.',
|
|
2565
|
+
'Token ROI gate: flag tokenmaxxing workflows that spend heavily without a defined outcome, eval, or proof of returned value.',
|
|
2566
|
+
'Response quality gate: require the agent to lead with the useful answer, call out weak assumptions, and avoid completion claims unless the evidence is attached.',
|
|
2567
|
+
'Model provenance gate: require approved provider domains, known model IDs, expected price ceilings, and no shadow API proxy before routing frontier work.',
|
|
2568
|
+
'Tool lockdown gate: disable or require explicit approval for browsing, downloads, agent mode, generated-code networking, and other outbound paths when sensitive data is in context.',
|
|
2569
|
+
'MCP config integrity gate: alert on ~/.claude.json routing changes, unfamiliar MCP endpoints, localhost proxy additions, OAuth refresh anomalies, and dependency postinstall hooks.',
|
|
2570
|
+
'Distributed gate mesh: keep enforcement close to each repo, tool, and workflow so one failed gate reduces coverage locally instead of collapsing the entire governance path.',
|
|
2571
|
+
'AI-authored code gate: require generated-diff provenance, human owner, tests, risk label, and rollback evidence once agent-authored changes cross a team-defined threshold.',
|
|
2572
|
+
'Customer-response draft gate: require retrieved source links, customer objective, response category, human approval, and no unsupported pricing/security claims before an email leaves draft mode.',
|
|
2573
|
+
'Structured intent gate: require scope, out-of-scope systems, ordered steps, allowed tools, acceptance criteria, and rollback expectations before async agent execution starts.',
|
|
2574
|
+
'Tool contract gate: require versioned schemas, explicit read/write permissions, stable error codes, observability hooks, and audit logging for every MCP tool call.',
|
|
2575
|
+
'Evaluation gate: require golden tasks, regression checks, build/test evidence, and traceable PR or artifact output before a repeated workflow is promoted to platform automation.',
|
|
2576
|
+
'Local classifier gate: run low-cost on-device models for first-pass risk labels, sensitive-data detection, and route selection, then escalate uncertain or high-blast-radius actions to stronger checks.',
|
|
2577
|
+
'Failure attribution graph: record intent, retrieved context, tool choice, local risk score, evidence, and outcome for each step so future gates reuse the causal path instead of starting from scratch.',
|
|
2578
|
+
],
|
|
2579
|
+
},
|
|
2580
|
+
{
|
|
2581
|
+
heading: 'The buyer message',
|
|
2582
|
+
paragraphs: [
|
|
2583
|
+
'The pitch is not "use fewer tokens" or "summarize harder." The pitch is: keep the agent productive by feeding it the right context, then stop it before risky actions unless the session, sandbox, credentials, and evidence are clean.',
|
|
2584
|
+
'This turns ThumbGate into the practitioner-led governance layer teams can adopt before top-down AI policy arrives. Start with one workflow, prove the gates locally, then expand to Pro or a hardening sprint once the same failure pattern recurs.',
|
|
2585
|
+
],
|
|
2586
|
+
},
|
|
2587
|
+
],
|
|
2588
|
+
faq: [
|
|
2589
|
+
{
|
|
2590
|
+
question: 'Is agent context governance just summarization?',
|
|
2591
|
+
answer: 'No. Summarization compresses. Context governance decides what to preserve, prune, merge, verify, or block based on the agent, task, risk, and evidence required before the next action.',
|
|
2592
|
+
},
|
|
2593
|
+
{
|
|
2594
|
+
question: 'Does this compete with Claude Managed Agents?',
|
|
2595
|
+
answer: 'No. Managed Agents provide production infrastructure. ThumbGate can sit beside managed or self-hosted agents as the local-first gate that turns session history, permissions, prior feedback, and evidence requirements into action-level enforcement.',
|
|
2596
|
+
},
|
|
2597
|
+
{
|
|
2598
|
+
question: 'What should teams implement first?',
|
|
2599
|
+
answer: 'Start with one high-cost workflow: deployments, billing, browser automation, database changes, or customer messaging. Require clean context, isolated execution, credential separation, and evidence before that workflow can run.',
|
|
2600
|
+
},
|
|
2601
|
+
{
|
|
2602
|
+
question: 'How does this apply to Claude custom instructions?',
|
|
2603
|
+
answer: 'Treat directness instructions as a policy, not a vibe. ThumbGate can turn them into checks that flag rubber-stamp agreement, missing pushback, and success claims that are not grounded in command output or artifacts.',
|
|
2604
|
+
},
|
|
2605
|
+
{
|
|
2606
|
+
question: 'How does ChatGPT Lockdown Mode help ThumbGate positioning?',
|
|
2607
|
+
answer: 'It validates the category. Lockdown Mode limits high-risk tools to reduce exfiltration paths; ThumbGate brings the same idea to coding and automation agents with local pre-action checks, scoped approvals, and audit evidence.',
|
|
2608
|
+
},
|
|
2609
|
+
{
|
|
2610
|
+
question: 'How should teams handle leaked or proxy-sold model claims?',
|
|
2611
|
+
answer: 'Do not route production work to unapproved proxy endpoints. Require provider provenance, expected model IDs, price ceilings, and security review before an agent can use a new frontier model route.',
|
|
2612
|
+
},
|
|
2613
|
+
{
|
|
2614
|
+
question: 'What is the first MCP security control to add?',
|
|
2615
|
+
answer: 'Watch the local MCP routing configuration for endpoint changes, new proxy addresses, and unexpected OAuth refresh behavior. Then rotate connected tokens only after the malicious hook or config rewrite has been removed.',
|
|
2616
|
+
},
|
|
2617
|
+
{
|
|
2618
|
+
question: 'Why mention random graph architecture in agent governance?',
|
|
2619
|
+
answer: 'Because centralized approval paths become bottlenecks. ThumbGate should use a mesh of local gates across repos, tools, agents, and workflows so control is resilient, inspectable, and does not require one fragile platform migration.',
|
|
2620
|
+
},
|
|
2621
|
+
{
|
|
2622
|
+
question: 'What changes when most new code is AI-authored?',
|
|
2623
|
+
answer: 'Review moves from typing every line to governing provenance, tests, ownership, and rollback. ThumbGate can require evidence before AI-authored diffs merge or touch production workflows.',
|
|
2624
|
+
},
|
|
2625
|
+
{
|
|
2626
|
+
question: 'How does this apply to AI email assistants?',
|
|
2627
|
+
answer: 'Treat every generated reply as a draft until it has source-backed context, a known category, customer-specific constraints, and human approval. Feedback from edited drafts should become retrieval and wording rules, not permission to send automatically.',
|
|
2628
|
+
},
|
|
2629
|
+
{
|
|
2630
|
+
question: 'What does platform ownership change?',
|
|
2631
|
+
answer: 'It prevents every team from building a slightly different unsafe agent loop. A shared platform defines intent shape, approved tools, retries, sandboxing, evals, logging, and gates while teams keep control over domain judgment.',
|
|
2632
|
+
},
|
|
2633
|
+
{
|
|
2634
|
+
question: 'Where do on-device QAT models fit?',
|
|
2635
|
+
answer: 'Use them for cheap private triage: classify risk, detect sensitive context, choose a route, or decide whether to escalate. Do not let a small local classifier silently approve destructive or external actions.',
|
|
2636
|
+
},
|
|
2637
|
+
{
|
|
2638
|
+
question: 'How does backpropagation help agent governance?',
|
|
2639
|
+
answer: 'Use the chain-rule idea as an audit pattern. Break the run into steps, score each local decision, multiply risk through the path, and cache the attribution so the next similar workflow is blocked or escalated earlier.',
|
|
2640
|
+
},
|
|
2641
|
+
],
|
|
2642
|
+
relatedPaths: ['/guides/long-running-agent-context-management', '/guides/background-agent-governance', '/guides/hermes-agent-guardrails'],
|
|
2643
|
+
},
|
|
2077
2644
|
{
|
|
2078
2645
|
query: 'roo code alternative cline',
|
|
2079
2646
|
path: '/guides/roo-code-alternative-cline',
|
|
@@ -2231,6 +2798,74 @@ const PAGE_BLUEPRINTS = [
|
|
|
2231
2798
|
],
|
|
2232
2799
|
relatedPaths: ['/guides/pre-action-checks', '/guides/mcp-tool-governance', '/guides/ai-agent-governance-sprint'],
|
|
2233
2800
|
},
|
|
2801
|
+
{
|
|
2802
|
+
query: 'agentic web governance',
|
|
2803
|
+
path: '/guides/agentic-web-governance',
|
|
2804
|
+
pageType: 'guide',
|
|
2805
|
+
pillar: 'pre-action-checks',
|
|
2806
|
+
title: 'Agentic Web Governance | Pre-Action Checks When Bots Outnumber Humans',
|
|
2807
|
+
heroTitle: 'Bots already outnumber humans on the web. AI agents need pre-action governance.',
|
|
2808
|
+
heroSummary: 'Cloudflare says automated requests now make up the majority of HTML traffic. ThumbGate turns that agentic-web shift into a buyer-ready governance story: machine-readable proof for AI search and pre-action checks before agents touch real systems.',
|
|
2809
|
+
takeaways: [
|
|
2810
|
+
'The promotion hook is immediate: the web is becoming agent-first, so AI-agent actions need governance before execution.',
|
|
2811
|
+
'AI search and AI browsers reward machine-readable, authoritative, proof-backed pages instead of vague product copy.',
|
|
2812
|
+
'ThumbGate should own the bridge between agentic traffic, MCP tool calls, and pre-action checks for code, deploys, data, money, and customer systems.',
|
|
2813
|
+
],
|
|
2814
|
+
sections: [
|
|
2815
|
+
{
|
|
2816
|
+
heading: 'Why the bot-majority milestone matters',
|
|
2817
|
+
paragraphs: [
|
|
2818
|
+
'Search Engine Land reported on June 5, 2026 that Cloudflare data showed automated traffic at about 57.3% of worldwide HTTP requests to HTML content, versus 42.7% for humans. That is not the same as human attention, but it is a real signal that AI agents and bots are becoming the default way the web is requested, summarized, and acted on.',
|
|
2819
|
+
'For ThumbGate promotion, the lesson is not "get more bot traffic." The lesson is that every company will need controls for agent actions that happen before a human click, before a dashboard session, and before a normal attribution path records intent.',
|
|
2820
|
+
],
|
|
2821
|
+
},
|
|
2822
|
+
{
|
|
2823
|
+
heading: 'The buyer problem this creates',
|
|
2824
|
+
bullets: [
|
|
2825
|
+
'AI crawlers and agents can visit far more pages than a human researcher, increasing load without creating normal referral or checkout signals.',
|
|
2826
|
+
'Agentic search can summarize the answer before the buyer ever lands on the site, so content must be structured enough for LLMs to cite accurately.',
|
|
2827
|
+
'Internal AI agents can also multiply actions: file edits, shell commands, API calls, database reads, deploy attempts, and customer-system writes.',
|
|
2828
|
+
'More agent actions without a pre-action boundary means more repeated mistakes, more hidden cost, and weaker auditability.',
|
|
2829
|
+
],
|
|
2830
|
+
},
|
|
2831
|
+
{
|
|
2832
|
+
heading: 'Where ThumbGate fits the agentic web',
|
|
2833
|
+
paragraphs: [
|
|
2834
|
+
'ThumbGate is the pre-action governance layer for the same agentic shift. The public website gives AI systems machine-readable context, proof links, FAQ schema, and canonical pages. The product then gives engineering teams runtime gates before agents act.',
|
|
2835
|
+
'That lets the promotion story stay concrete: bots and AI agents already outnumber humans in web requests; ThumbGate makes sure your own AI agents do not behave like unmanaged bots inside your repo, browser, database, CI, payment flow, or customer systems.',
|
|
2836
|
+
],
|
|
2837
|
+
bullets: [
|
|
2838
|
+
'Use /llm-context.md and /.well-known/llms.txt to make ThumbGate easy for ChatGPT, Claude, Perplexity, Gemini, Grok, and Google AI features to summarize.',
|
|
2839
|
+
'Use pre-action checks to govern MCP tool calls, browser automation, database writes, publish commands, and payment/customer-system actions.',
|
|
2840
|
+
'Use feedback capture so a thumbs-down on one bad agent pattern becomes a repeat-blocking rule across the next session and team workflow.',
|
|
2841
|
+
],
|
|
2842
|
+
},
|
|
2843
|
+
{
|
|
2844
|
+
heading: 'High-ROI promotion moves',
|
|
2845
|
+
bullets: [
|
|
2846
|
+
'Publish this page as the canonical "agentic web governance" explainer and link it from the homepage, learn hub, llms.txt, and sitemap.',
|
|
2847
|
+
'Pitch the line: "Bots already outnumber humans on the web. ThumbGate keeps AI agents from acting like unmanaged bots in your codebase."',
|
|
2848
|
+
'Target buyer prompts such as "how do I govern AI agents before they call tools?", "AI crawler visibility for developer tools", and "pre-action checks for MCP tools."',
|
|
2849
|
+
'Measure success in Search Console AI reports, first-party landing events, and checkout/intake paths instead of raw traffic alone.',
|
|
2850
|
+
],
|
|
2851
|
+
},
|
|
2852
|
+
],
|
|
2853
|
+
faq: [
|
|
2854
|
+
{
|
|
2855
|
+
question: 'What is agentic web governance?',
|
|
2856
|
+
answer: 'Agentic web governance is the content, policy, approval, and runtime-control layer needed when AI agents browse, summarize, and act on behalf of users or teams. For ThumbGate, it means machine-readable public proof plus pre-action checks before internal agents touch real systems.',
|
|
2857
|
+
},
|
|
2858
|
+
{
|
|
2859
|
+
question: 'Does bot traffic mean ThumbGate should block AI crawlers?',
|
|
2860
|
+
answer: 'No. For promotion, ThumbGate should allow legitimate AI discovery while publishing clear llms.txt, schema, canonical pages, and proof links. The product should block risky internal agent actions, not useful AI-search discovery.',
|
|
2861
|
+
},
|
|
2862
|
+
{
|
|
2863
|
+
question: 'How does this create revenue?',
|
|
2864
|
+
answer: 'It gives ThumbGate a timely category narrative for buyers: as agent actions multiply, teams need pre-action controls before code, data, deploys, payments, or customers are touched. The page routes that demand into Pro checkout and the Team workflow hardening sprint.',
|
|
2865
|
+
},
|
|
2866
|
+
],
|
|
2867
|
+
relatedPaths: ['/guides/ai-search-topical-presence', '/guides/mcp-tool-governance', '/guides/ai-agent-pre-action-approval-gates'],
|
|
2868
|
+
},
|
|
2234
2869
|
guideBlueprint({
|
|
2235
2870
|
query: 'autoresearch agent safety',
|
|
2236
2871
|
path: '/guides/autoresearch-agent-safety',
|