npm - thumbgate - Versions diffs - 1.5.0 → 1.5.2 - Mend

thumbgate 1.5.0 → 1.5.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (37) hide show

package/.claude-plugin/marketplace.json +2 -2
package/.claude-plugin/plugin.json +1 -1
package/.well-known/mcp/server-card.json +1 -1
package/CHANGELOG.md +504 -0
package/README.md +251 -223
package/adapters/README.md +1 -1
package/adapters/claude/.mcp.json +2 -2
package/adapters/codex/config.toml +4 -2
package/adapters/mcp/server-stdio.js +34 -3
package/adapters/opencode/opencode.json +1 -1
package/bench/prompt-eval-suite.json +106 -0
package/bin/cli.js +21 -8
package/bin/postinstall.js +25 -17
package/config/evals/agent-safety-eval.json +131 -0
package/config/github-about.json +5 -2
package/config/specs/agent-safety.json +79 -0
package/package.json +69 -29
package/public/compare.html +3 -3
package/public/dashboard.html +1399 -0
package/public/guide.html +2 -2
package/public/index.html +230 -98
package/scripts/auto-wire-hooks.js +77 -27
package/scripts/bot-detection.js +165 -0
package/scripts/cli-feedback.js +6 -2
package/scripts/commercial-offer.js +4 -4
package/scripts/dashboard.js +152 -2
package/scripts/decision-trace.js +354 -0
package/scripts/feedback-loop.js +4 -8
package/scripts/prompt-eval.js +363 -0
package/scripts/rate-limiter.js +77 -24
package/scripts/sales-pipeline.js +681 -0
package/scripts/session-episode-store.js +329 -0
package/scripts/session-health-sensor.js +242 -0
package/scripts/spec-gate.js +362 -0
package/scripts/statusline.sh +6 -9
package/skills/thumbgate/SKILL.md +1 -1
package/src/api/server.js +368 -12

package/scripts/decision-trace.js ADDED Viewed

@@ -0,0 +1,354 @@
+#!/usr/bin/env node
+'use strict';
+/**
+ * Decision Trace — full observability for gate evaluations.
+ *
+ * Inspired by Ethan Mollick's observation that operators need to *see* what
+ * the agent was thinking when it made a decision. ThumbGate already captures
+ * what was blocked; Decision Trace adds:
+ *
+ *   1. Full audit of every evaluation (passes, blocks, AND near-misses)
+ *   2. Near-miss detection: constraints that almost matched
+ *   3. Session trace summaries: single-glance safety posture view
+ *
+ * Near-miss heuristic: extract literal tokens from a regex deny pattern and
+ * count how many appear in the input. If at least 50% (but not all) of the
+ * tokens appear and the constraint itself passed, flag as near-miss.
+ */
+const crypto = require('node:crypto');
+const path = require('node:path');
+const { readJsonl, appendJsonl } = require('./fs-utils');
+const { resolveFeedbackDir } = require('./feedback-paths');
+const {
+  evaluateConstraints,
+  evaluateInvariants,
+  loadSpecDir,
+} = require('./spec-gate');
+const TRACE_FILE = 'decision-trace.jsonl';
+const NEAR_MISS_THRESHOLD = 0.5;
+// ---------------------------------------------------------------------------
+// Near-Miss Detection
+// ---------------------------------------------------------------------------
/**
 * Extract the human-readable literal tokens from a regex deny pattern.
 *
 * Group prefixes (`(?:`, `(?=`, `(?!`, `(?<=`, `(?<!`, `(?<name>`) are removed
 * first so their punctuation is not glued onto the literal that follows;
 * without this step `(?:rm|del)` yields the token `:rm`, which can never
 * appear in real input. Escaped character classes and the remaining regex
 * metacharacters are then blanked out and the text is split on whitespace.
 *
 * @param {string|RegExp} pattern - Regex source text, or a RegExp whose
 *   `source` is used.
 * @returns {string[]} Lower-cased tokens of at least two characters, in
 *   pattern order. Empty when `pattern` is neither a string nor a RegExp.
 */
function extractLiteralTokens(pattern) {
  const source = pattern instanceof RegExp ? pattern.source : pattern;
  if (typeof source !== 'string') return [];

  const cleaned = source
    // Unescaped group prefixes: non-capturing, lookahead, lookbehind, named.
    .replace(/(?<!\\)\(\?(?:[:=!]|<[=!]|<[A-Za-z_$][\w$]*>)/g, ' ')
    .replace(/\\[sdwbSDWB]/g, ' ')       // char classes
    .replace(/[.*+?^${}()|[\]\\]/g, ' ') // metacharacters
    .trim();

  return cleaned
    .split(/\s+/)
    .filter((token) => token.length >= 2) // ignore single chars
    .map((token) => token.toLowerCase());
}
/**
 * Compute the near-miss score for a constraint against input text.
 *
 * The score is the fraction of literal tokens extracted from
 * `constraint.deny` that occur, case-insensitively and as substrings, in
 * `inputText`. A result is a near-miss when that fraction is at least
 * NEAR_MISS_THRESHOLD but below 1.
 *
 * @param {{deny?: (string|RegExp)}} constraint - Constraint whose `deny`
 *   pattern is tokenized. A missing or non-string, non-RegExp `deny` yields
 *   the "no near-miss" result instead of throwing.
 * @param {*} inputText - Text to scan. Coerced with String(); null and
 *   undefined are treated as empty text.
 * @returns {{isNearMiss: boolean, score: number, matchedTokens: number, totalTokens: number}}
 *   `score` is rounded to two decimals.
 */
function computeNearMiss(constraint, inputText) {
  const deny = constraint == null ? undefined : constraint.deny;
  const denySource = deny instanceof RegExp ? deny.source : deny;
  const tokens = typeof denySource === 'string' ? extractLiteralTokens(denySource) : [];
  if (tokens.length === 0) {
    return { isNearMiss: false, score: 0, matchedTokens: 0, totalTokens: 0 };
  }

  // String(undefined) is "undefined", which would spuriously contain tokens
  // such as "fine" or "define"; treat absent input as empty text instead.
  const haystack = inputText == null ? '' : String(inputText).toLowerCase();
  const matched = tokens.filter((token) => haystack.includes(token)).length;
  const score = matched / tokens.length;

  return {
    isNearMiss: score >= NEAR_MISS_THRESHOLD && score < 1.0,
    score: Math.round(score * 100) / 100,
    matchedTokens: matched,
    totalTokens: tokens.length,
  };
}
+// ---------------------------------------------------------------------------
+// Trace Evaluation
+// ---------------------------------------------------------------------------
/**
 * Join the truthy parts of an evaluation context into one space-separated
 * string, in the order command, content, tool. This is the text scanned for
 * near-miss tokens.
 *
 * @param {{tool?: *, command?: *, content?: *}} [context]
 * @returns {string} The joined text; empty when no part is truthy.
 */
function buildCombinedInput({ tool, command, content } = {}) {
  const parts = [];
  for (const part of [command, content, tool]) {
    if (part) {
      parts.push(part);
    }
  }
  return parts.join(' ');
}
/**
 * Evaluate every spec against a context and return a full trace that
 * separates blocked checks, near-misses, and clean passes.
 *
 * @param {Iterable<object>} specs - Specs handed to evaluateConstraints and
 *   evaluateInvariants.
 * @param {object} [context] - Evaluation context; `tool`, `command` and
 *   `content` feed near-miss detection, and `tool`, `command` and `action`
 *   are echoed (truncated to 200 characters) in the returned trace.
 * @returns {object} Trace with `traceId`, `timestamp`, `allowed`, the full
 *   `results` list, its `blocked` / `nearMisses` / `passed` partitions, their
 *   `counts`, and the echoed `context`.
 */
function traceEvaluation(specs, context = {}) {
  const startedAt = Date.now();
  const randomSuffix = crypto.randomBytes(4).toString('hex');
  const traceId = `trace_${startedAt}_${randomSuffix}`;
  const timestamp = new Date().toISOString();
  const combinedInput = buildCombinedInput(context);

  // A constraint result gets near-miss scoring only when it passed and its
  // originating constraint can be located on the spec.
  const annotateConstraint = (spec, cr) => {
    const constraint = spec.constraints.find((c) => c.id === cr.constraintId);
    const nearMiss = cr.passed && constraint
      ? computeNearMiss(constraint, combinedInput)
      : { isNearMiss: false, score: 0, matchedTokens: 0, totalTokens: 0 };
    return {
      ...cr,
      nearMiss: nearMiss.isNearMiss,
      nearMissScore: nearMiss.score,
      nearMissDetail: nearMiss.isNearMiss ? nearMiss : null,
    };
  };

  // Invariants have no near-miss concept; they carry neutral fields.
  const annotateInvariant = (ir) => ({
    ...ir,
    nearMiss: false,
    nearMissScore: 0,
    nearMissDetail: null,
  });

  const results = [];
  for (const spec of specs) {
    const constraintResults = evaluateConstraints(spec, context);
    const invariantResults = evaluateInvariants(spec, context);
    for (const cr of constraintResults) {
      results.push(annotateConstraint(spec, cr));
    }
    for (const ir of invariantResults) {
      results.push(annotateInvariant(ir));
    }
  }

  // Partition in a single pass, preserving result order in each bucket.
  const blocked = [];
  const nearMisses = [];
  const passed = [];
  for (const result of results) {
    if (!result.passed) blocked.push(result);
    if (result.nearMiss) nearMisses.push(result);
    if (result.passed && !result.nearMiss) passed.push(result);
  }

  return {
    traceId,
    timestamp,
    allowed: blocked.length === 0,
    results,
    blocked,
    nearMisses,
    passed,
    counts: {
      total: results.length,
      blocked: blocked.length,
      nearMiss: nearMisses.length,
      passed: passed.length,
    },
    context: {
      tool: context.tool || null,
      command: truncate(context.command, 200),
      action: truncate(context.action, 200),
    },
  };
}
+// ---------------------------------------------------------------------------
+// Trace Persistence
+// ---------------------------------------------------------------------------
/**
 * Resolve the path of the decision-trace JSONL file.
 *
 * @param {{feedbackDir?: string}} [options] - `feedbackDir` overrides the
 *   directory returned by resolveFeedbackDir() when truthy.
 * @returns {string} `<dir>/<TRACE_FILE>`.
 */
function getTracePath({ feedbackDir } = {}) {
  const baseDir = feedbackDir ? feedbackDir : resolveFeedbackDir();
  return path.join(baseDir, TRACE_FILE);
}
/**
 * Append a condensed form of a trace to the trace file.
 *
 * Only blocked results and near-misses are stored, each reduced through
 * summarizeResult; the full `results` and `passed` lists are not written.
 *
 * @param {object} trace - A trace as returned by traceEvaluation.
 * @param {{feedbackDir?: string}} [options] - Forwarded to getTracePath.
 * @returns {object} The entry that was appended.
 */
function recordTrace(trace, options = {}) {
  const { traceId, timestamp, allowed, counts, blocked, nearMisses, context } = trace;
  const entry = {
    traceId,
    timestamp,
    allowed,
    counts,
    blocked: blocked.map(summarizeResult),
    nearMisses: nearMisses.map(summarizeResult),
    context,
  };
  const tracePath = getTracePath(options);
  appendJsonl(tracePath, entry);
  return entry;
}
/**
 * Read the recorded trace entries from the trace file.
 *
 * @param {{feedbackDir?: string}} [options] - Forwarded to getTracePath.
 * @returns {*} Whatever readJsonl returns for the trace file.
 */
function loadTraces(options = {}) {
  const tracePath = getTracePath(options);
  return readJsonl(tracePath);
}
/**
 * Reduce an evaluation result to the fields kept in persisted traces.
 *
 * @param {object} r - A constraint or invariant result.
 * @returns {{specName: *, id: *, type: *, reason: *, severity: *, nearMissScore: *}}
 *   `id` is `constraintId` when truthy, otherwise `invariantId`;
 *   `nearMissScore` falls back to 0 when falsy.
 */
function summarizeResult(r) {
  const {
    specName,
    constraintId,
    invariantId,
    type,
    reason,
    severity,
    nearMissScore,
  } = r;
  return {
    specName,
    id: constraintId || invariantId,
    type,
    reason,
    severity,
    nearMissScore: nearMissScore || 0,
  };
}
+// ---------------------------------------------------------------------------
+// Session Trace Summary
+// ---------------------------------------------------------------------------
/**
 * Aggregate recorded traces into a single-glance safety posture summary.
 *
 * @param {Array<object>} traces - Trace entries; each may carry `counts`,
 *   `blocked` and `nearMisses`.
 * @returns {object} Totals, integer percentage block and near-miss rates
 *   (relative to total checks), the safety posture label, and top-10 lists of
 *   blocked specs, blocked constraints and near-miss constraints.
 */
function summarizeSessionTraces(traces) {
  const totalEvaluations = traces.length;
  const totals = { checks: 0, blocked: 0, nearMisses: 0, passed: 0 };
  const blocksBySpec = new Map();
  const blocksByConstraint = new Map();
  const nearMissByConstraint = new Map();

  const increment = (tally, key) => {
    tally.set(key, (tally.get(key) || 0) + 1);
  };

  for (const trace of traces) {
    const { total, blocked, nearMiss, passed } = trace.counts || {};
    totals.checks += total || 0;
    totals.blocked += blocked || 0;
    totals.nearMisses += nearMiss || 0;
    totals.passed += passed || 0;

    for (const block of trace.blocked || []) {
      increment(blocksBySpec, block.specName || 'unknown');
      increment(blocksByConstraint, block.id || 'unknown');
    }

    for (const nm of trace.nearMisses || []) {
      const key = nm.id || 'unknown';
      const prior = nearMissByConstraint.get(key);
      nearMissByConstraint.set(key, {
        count: (prior ? prior.count : 0) + 1,
        maxScore: Math.max(prior ? prior.maxScore : 0, nm.nearMissScore || 0),
      });
    }
  }

  // Rates are whole-number percentages of all checks; 0 when nothing ran.
  const percentOfChecks = (part) => (
    totals.checks > 0 ? Math.round((part / totals.checks) * 100) : 0
  );

  const topNearMisses = Array.from(nearMissByConstraint.entries())
    .sort(([, a], [, b]) => b.count - a.count)
    .slice(0, 10)
    .map(([id, data]) => ({ id, count: data.count, maxScore: data.maxScore }));

  return {
    totalEvaluations,
    totalChecks: totals.checks,
    totalBlocked: totals.blocked,
    totalNearMisses: totals.nearMisses,
    totalPassed: totals.passed,
    blockRate: percentOfChecks(totals.blocked),
    nearMissRate: percentOfChecks(totals.nearMisses),
    safetyPosture: computeSafetyPosture(totals.blocked, totals.nearMisses, totals.checks),
    topBlockedSpecs: mapToSorted(blocksBySpec, 'name', 'count'),
    topBlockedConstraints: mapToSorted(blocksByConstraint, 'id', 'count'),
    topNearMisses,
  };
}
/**
 * Render a session trace summary as human-readable, newline-separated text.
 *
 * @param {object} summary - A summary as returned by summarizeSessionTraces.
 * @returns {string} Three header lines, followed by optional "Top Blocked"
 *   and "Top Near-Misses" sections when the respective lists are non-empty.
 */
function formatTraceSummary(summary) {
  const output = [
    `Safety Posture: ${summary.safetyPosture.toUpperCase()}`,
    `Evaluations: ${summary.totalEvaluations} | Checks: ${summary.totalChecks}`,
    `Blocked: ${summary.totalBlocked} (${summary.blockRate}%) | Near-Misses: ${summary.totalNearMisses} (${summary.nearMissRate}%) | Passed: ${summary.totalPassed}`,
  ];

  // Each section is preceded by a blank line and skipped entirely when empty.
  const appendSection = (title, items, render) => {
    if (items.length <= 0) return;
    output.push('', title);
    for (const item of items) {
      output.push(render(item));
    }
  };

  appendSection(
    'Top Blocked:',
    summary.topBlockedConstraints,
    (c) => `  - ${c.id}: ${c.count}x`,
  );
  appendSection(
    'Top Near-Misses:',
    summary.topNearMisses,
    (nm) => `  - ${nm.id}: ${nm.count}x (max score: ${nm.maxScore})`,
  );

  return output.join('\n');
}
+// ---------------------------------------------------------------------------
+// Helpers
+// ---------------------------------------------------------------------------
/**
 * Classify a session from its aggregate counts.
 *
 * @param {number} blocked - Number of blocked checks.
 * @param {number} nearMisses - Number of near-miss checks.
 * @param {number} total - Number of checks evaluated.
 * @returns {string} 'unknown' when `total` is exactly 0, otherwise 'critical'
 *   if anything was blocked, 'cautious' if there were near-misses, else
 *   'clean'.
 */
function computeSafetyPosture(blocked, nearMisses, total) {
  if (total === 0) {
    return 'unknown';
  }
  if (blocked > 0) {
    return 'critical';
  }
  return nearMisses > 0 ? 'cautious' : 'clean';
}
/**
 * Convert a key → number map into its ten largest entries, highest value
 * first.
 *
 * @param {Map<*, number>} map - Tally to rank.
 * @param {string} keyName - Property name used for each entry's key.
 * @param {string} valueName - Property name used for each entry's value.
 * @returns {Array<object>} At most ten `{ [keyName], [valueName] }` objects.
 */
function mapToSorted(map, keyName, valueName) {
  const ranked = [...map.entries()];
  ranked.sort((left, right) => right[1] - left[1]);
  return ranked
    .slice(0, 10)
    .map(([key, value]) => ({ [keyName]: key, [valueName]: value }));
}
/**
 * Stringify, trim and cap a value for inclusion in a trace.
 *
 * @param {*} value - Value to record.
 * @param {number} maxLength - Maximum number of characters kept.
 * @returns {string|null} The first `maxLength` characters of the trimmed
 *   text, or null when the value is null/undefined or trims to nothing.
 */
function truncate(value, maxLength) {
  if (value === undefined || value === null) {
    return null;
  }
  const trimmed = String(value).trim();
  if (!trimmed) {
    return null;
  }
  return trimmed.slice(0, maxLength);
}
+// ---------------------------------------------------------------------------
+// CLI
+// ---------------------------------------------------------------------------
/**
 * Report whether this file is the script Node was asked to run.
 *
 * @param {string[]} [argv=process.argv] - Argument vector; element 1 is the
 *   invoked script path.
 * @returns {boolean} True when `argv[1]` resolves to this file's path; false
 *   when `argv[1]` is missing or empty.
 */
function isCliInvocation(argv = process.argv) {
  const invokedPath = argv[1];
  if (!invokedPath) {
    return false;
  }
  return path.resolve(invokedPath) === __filename;
}
// Command-line entry point. Sub-commands:
//   summary (default) - print the human-readable summary of recorded traces
//   json              - print the same summary as pretty-printed JSON
//   eval <command>    - evaluate the loaded specs against a test command
// Any other sub-command prints usage to stderr and exits with status 1.
if (isCliInvocation()) {
  const cliCommand = process.argv[2] || 'summary';
  switch (cliCommand) {
    case 'summary':
    case 'json': {
      const sessionSummary = summarizeSessionTraces(loadTraces());
      const rendered = cliCommand === 'summary'
        ? formatTraceSummary(sessionSummary)
        : JSON.stringify(sessionSummary, null, 2);
      console.log(rendered);
      break;
    }
    case 'eval': {
      // Evaluate current specs against a test command
      const testCommand = process.argv[3] || '';
      const evalContext = { command: testCommand, action: testCommand };
      const { allowed, counts, blocked, nearMisses } = traceEvaluation(loadSpecDir(), evalContext);
      const report = {
        allowed,
        counts,
        blocked: blocked.map(summarizeResult),
        nearMisses: nearMisses.map(summarizeResult),
      };
      console.log(JSON.stringify(report, null, 2));
      break;
    }
    default:
      console.error(`Unknown command: ${cliCommand}. Use: summary, json, eval`);
      process.exit(1);
  }
}
+module.exports = {
+  NEAR_MISS_THRESHOLD,
+  computeNearMiss,
+  extractLiteralTokens,
+  formatTraceSummary,
+  loadTraces,
+  recordTrace,
+  summarizeSessionTraces,
+  traceEvaluation,
+};

package/scripts/feedback-loop.js CHANGED Viewed

@@ -1393,8 +1393,6 @@ function analyzeFeedback(logPath) {
   let totalNegative = 0;
   for (const entry of entries) {
-    if (isAuditTrailEntry(entry)) continue;
     if (entry.signal === 'positive') totalPositive++;
     if (entry.signal === 'negative') totalNegative++;
@@ -1428,8 +1426,7 @@ function analyzeFeedback(logPath) {
   const total = totalPositive + totalNegative;
   const approvalRate = total > 0 ? Math.round((totalPositive / total) * 1000) / 1000 : 0;
-  const realEntries = entries.filter((entry) => !isAuditTrailEntry(entry));
-  const recent = realEntries.slice(-20);
+  const recent = entries.slice(-20);
   const recentPos = recent.filter((e) => e.signal === 'positive').length;
   const recentRate = recent.length > 0 ? Math.round((recentPos / recent.length) * 1000) / 1000 : 0;
@@ -1438,7 +1435,7 @@ function analyzeFeedback(logPath) {
   const SEVEN_DAYS_MS = 7 * 24 * 60 * 60 * 1000;
   const THIRTY_DAYS_MS = 30 * 24 * 60 * 60 * 1000;
   const windowStats = { '7d': { total: 0, positive: 0 }, '30d': { total: 0, positive: 0 } };
-  for (const entry of realEntries) {
+  for (const entry of entries) {
     const ts = entry.timestamp ? new Date(entry.timestamp).getTime() : 0;
     const age = now - ts;
     if (age <= SEVEN_DAYS_MS) {
@@ -1701,12 +1698,11 @@ function writePreventionRules(filePath, minOccurrences = 2) {
 function feedbackSummary(recentN = 20, options = {}) {
   const { FEEDBACK_LOG_PATH } = getFeedbackPaths(options);
   const entries = readJSONL(FEEDBACK_LOG_PATH);
-  const realEntries = entries.filter((entry) => !isAuditTrailEntry(entry));
-  if (realEntries.length === 0) {
+  if (entries.length === 0) {
     return '## Feedback Summary\nNo feedback recorded yet.';
   }
-  const recent = realEntries.slice(-recentN);
+  const recent = entries.slice(-recentN);
   const positive = recent.filter((e) => e.signal === 'positive').length;
   const negative = recent.filter((e) => e.signal === 'negative').length;
   const pct = Math.round((positive / recent.length) * 100);