npm - thumbgate - Versions diffs - 0.9.14 → 1.1.0 - Mend

thumbgate 0.9.14 → 1.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (64) hide show

package/.claude-plugin/marketplace.json +1 -1
package/.claude-plugin/plugin.json +1 -1
package/.well-known/mcp/server-card.json +1 -1
package/README.md +1 -0
package/adapters/README.md +1 -1
package/adapters/chatgpt/openapi.yaml +105 -0
package/adapters/claude/.mcp.json +2 -2
package/adapters/codex/config.toml +2 -2
package/adapters/forge/forge.yaml +28 -0
package/adapters/mcp/server-stdio.js +41 -1
package/adapters/opencode/opencode.json +1 -1
package/bin/cli.js +18 -3
package/config/mcp-allowlists.json +11 -0
package/openapi/openapi.yaml +105 -0
package/package.json +7 -5
package/plugins/amp-skill/INSTALL.md +3 -4
package/plugins/amp-skill/SKILL.md +0 -1
package/plugins/claude-codex-bridge/.claude-plugin/plugin.json +1 -1
package/plugins/claude-codex-bridge/.mcp.json +1 -1
package/plugins/claude-skill/INSTALL.md +1 -2
package/plugins/codex-profile/.codex-plugin/plugin.json +1 -1
package/plugins/codex-profile/.mcp.json +1 -1
package/plugins/codex-profile/INSTALL.md +1 -1
package/plugins/codex-profile/README.md +1 -1
package/plugins/cursor-marketplace/.cursor-plugin/plugin.json +1 -1
package/plugins/opencode-profile/INSTALL.md +1 -1
package/public/blog.html +1 -0
package/public/dashboard.html +1 -1
package/public/guide.html +1 -1
package/public/index.html +8 -4
package/public/learn/agent-harness-pattern.html +1 -1
package/public/learn/ai-agent-persistent-memory.html +1 -1
package/public/learn/mcp-pre-action-gates-explained.html +1 -1
package/public/learn/stop-ai-agent-force-push.html +1 -1
package/public/learn/vibe-coding-safety-net.html +1 -1
package/public/learn.html +1 -1
package/public/lessons.html +1 -1
package/public/pro.html +1 -1
package/scripts/__pycache__/train_from_feedback.cpython-312.pyc +0 -0
package/scripts/agent-security-hardening.js +4 -4
package/scripts/async-job-runner.js +84 -24
package/scripts/auto-wire-hooks.js +59 -1
package/scripts/context-manager.js +330 -0
package/scripts/dashboard.js +1 -1
package/scripts/distribution-surfaces.js +12 -0
package/scripts/ensure-repo-bootstrap.js +15 -14
package/scripts/export-hf-dataset.js +293 -0
package/scripts/gates-engine.js +96 -10
package/scripts/hook-auto-capture.sh +1 -1
package/scripts/hosted-job-launcher.js +260 -0
package/scripts/managed-dpo-export.js +91 -0
package/scripts/obsidian-export.js +0 -1
package/scripts/operational-integrity.js +50 -7
package/scripts/prove-lancedb.js +62 -4
package/scripts/publish-decision.js +16 -0
package/scripts/self-healing-check.js +6 -1
package/scripts/social-analytics/load-env.js +33 -2
package/scripts/social-analytics/store.js +200 -2
package/scripts/sync-version.js +18 -11
package/scripts/tool-registry.js +48 -0
package/scripts/train_from_feedback.py +0 -4
package/scripts/workflow-sentinel.js +793 -0
package/src/api/server.js +205 -27
/package/scripts/{rlhf_session_start.sh → thumbgate_session_start.sh} +0 -0

package/scripts/export-hf-dataset.js ADDED Viewed

@@ -0,0 +1,293 @@
+#!/usr/bin/env node
+'use strict';
+/**
+ * HuggingFace Dataset Exporter
+ *
+ * Exports ThumbGate agent traces as a HuggingFace-compatible dataset in two formats:
+ *
+ * 1. Agent Traces (traces split) — raw feedback entries with tool calls, signals,
+ *    context, and outcomes. Matches the "share your agent traces" initiative.
+ *
+ * 2. DPO Preferences (preferences split) — chosen/rejected preference pairs
+ *    derived from error→learning memory promotion. Ready for DPO/RLHF training.
+ *
+ * Output: Parquet-compatible JSONL files + dataset_info.json (HF Dataset Card metadata).
+ *
+ * HuggingFace Datasets format:
+ *   dataset_dir/
+ *     dataset_info.json        — metadata, features schema, splits
+ *     traces.jsonl             — agent trace rows
+ *     preferences.jsonl        — DPO preference pair rows
+ */
+const fs = require('fs');
+const path = require('path');
+const { resolveFeedbackDir } = require('./feedback-paths');
+const { exportDpoFromMemories } = require('./export-dpo-pairs');
+const { getProvenance } = require('./contextfs');
+// ---------------------------------------------------------------------------
+// Helpers
+// ---------------------------------------------------------------------------
+function readJSONL(filePath) {
+  if (!fs.existsSync(filePath)) return [];
+  const raw = fs.readFileSync(filePath, 'utf-8').trim();
+  if (!raw) return [];
+  return raw
+    .split('\n')
+    .map((line) => {
+      try { return JSON.parse(line); } catch { return null; }
+    })
+    .filter(Boolean);
+}
+function ensureDir(dirPath) {
+  if (!fs.existsSync(dirPath)) {
+    fs.mkdirSync(dirPath, { recursive: true });
+  }
+}
+function writeJSONL(filePath, rows) {
+  const content = rows.map((row) => JSON.stringify(row)).join('\n');
+  fs.writeFileSync(filePath, content ? `${content}\n` : '');
+}
+// ---------------------------------------------------------------------------
+// PII / path redaction
+// ---------------------------------------------------------------------------
+function redactPaths(text) {
+  if (!text || typeof text !== 'string') return text || '';
+  return text
+    .replace(/\/Users\/[^\s/]+/g, '/Users/redacted')
+    .replace(/\/home\/[^\s/]+/g, '/home/redacted')
+    .replace(/C:\\Users\\[^\s\\]+/g, 'C:\\Users\\redacted');
+}
+function redactEntry(obj) {
+  if (!obj || typeof obj !== 'object') return obj;
+  const out = {};
+  for (const [key, value] of Object.entries(obj)) {
+    if (typeof value === 'string') {
+      out[key] = redactPaths(value);
+    } else if (Array.isArray(value)) {
+      out[key] = value.map((v) => (typeof v === 'string' ? redactPaths(v) : v));
+    } else {
+      out[key] = value;
+    }
+  }
+  return out;
+}
+// ---------------------------------------------------------------------------
+// Trace row builder — converts feedback-log entries to HF trace rows
+// ---------------------------------------------------------------------------
+function buildTraceRow(entry, index) {
+  return {
+    trace_id: entry.id || `trace_${index}`,
+    timestamp: entry.timestamp || null,
+    signal: entry.signal || entry.feedback || 'unknown',
+    tool_name: entry.toolName || entry.actionType || 'unknown',
+    context: redactPaths(entry.context || ''),
+    what_worked: redactPaths(entry.whatWorked || ''),
+    what_went_wrong: redactPaths(entry.whatWentWrong || ''),
+    what_to_change: redactPaths(entry.whatToChange || ''),
+    tags: Array.isArray(entry.tags) ? entry.tags : [],
+    failure_type: entry.failureType || null,
+    source: 'thumbgate',
+  };
+}
+// ---------------------------------------------------------------------------
+// Preference row builder — converts DPO pairs to HF preference rows
+// ---------------------------------------------------------------------------
+function buildPreferenceRow(pair, index) {
+  return {
+    pair_id: `pref_${index}`,
+    prompt: redactPaths(pair.prompt || ''),
+    chosen: redactPaths(pair.chosen || ''),
+    rejected: redactPaths(pair.rejected || ''),
+    match_score: pair.metadata ? pair.metadata.matchScore : null,
+    matched_keys: pair.metadata ? pair.metadata.matchedKeys || [] : [],
+    rubric_delta: pair.metadata && pair.metadata.rubric
+      ? pair.metadata.rubric.weightedDelta
+      : null,
+    source: 'thumbgate',
+  };
+}
+// ---------------------------------------------------------------------------
+// Dataset info (HuggingFace Dataset Card metadata)
+// ---------------------------------------------------------------------------
+function buildDatasetInfo({ traceCount, preferenceCount, exportedAt }) {
+  return {
+    dataset_info: {
+      description: 'Agent traces and DPO preference pairs from ThumbGate — pre-action gates for AI coding agents. Contains real-world tool call feedback, failure patterns, and learned corrections.',
+      citation: '',
+      homepage: 'https://github.com/IgorGanapolsky/ThumbGate',
+      license: 'MIT',
+      features: {
+        traces: {
+          trace_id: { dtype: 'string' },
+          timestamp: { dtype: 'string' },
+          signal: { dtype: 'string' },
+          tool_name: { dtype: 'string' },
+          context: { dtype: 'string' },
+          what_worked: { dtype: 'string' },
+          what_went_wrong: { dtype: 'string' },
+          what_to_change: { dtype: 'string' },
+          tags: { dtype: 'list', inner: { dtype: 'string' } },
+          failure_type: { dtype: 'string' },
+          source: { dtype: 'string' },
+        },
+        preferences: {
+          pair_id: { dtype: 'string' },
+          prompt: { dtype: 'string' },
+          chosen: { dtype: 'string' },
+          rejected: { dtype: 'string' },
+          match_score: { dtype: 'float32' },
+          matched_keys: { dtype: 'list', inner: { dtype: 'string' } },
+          rubric_delta: { dtype: 'float32' },
+          source: { dtype: 'string' },
+        },
+      },
+      splits: {
+        traces: { num_examples: traceCount },
+        preferences: { num_examples: preferenceCount },
+      },
+    },
+    exported_at: exportedAt,
+    exporter: 'thumbgate/export-hf-dataset',
+    version: '1.0.0',
+  };
+}
+// ---------------------------------------------------------------------------
+// Main export function
+// ---------------------------------------------------------------------------
+/**
+ * Export ThumbGate data as a HuggingFace-compatible dataset.
+ *
+ * @param {Object} options
+ * @param {string} [options.outputDir] - Directory to write dataset files
+ * @param {string} [options.feedbackDir] - Override feedback data directory
+ * @param {boolean} [options.includeProvenance] - Include provenance events in traces
+ * @returns {Object} Export summary
+ */
+function exportHfDataset(options = {}) {
+  const feedbackDir = options.feedbackDir || resolveFeedbackDir();
+  const outputDir = options.outputDir || path.join(feedbackDir, 'hf-dataset');
+  const includeProvenance = options.includeProvenance !== false;
+  ensureDir(outputDir);
+  // --- Traces split ---
+  const feedbackLogPath = path.join(feedbackDir, 'feedback-log.jsonl');
+  const feedbackEntries = readJSONL(feedbackLogPath);
+  const traceRows = feedbackEntries.map((entry, i) => buildTraceRow(redactEntry(entry), i));
+  // Optionally append provenance events as traces
+  if (includeProvenance) {
+    try {
+      const provenanceEvents = getProvenance(200);
+      for (const evt of provenanceEvents) {
+        traceRows.push({
+          trace_id: evt.id || `prov_${traceRows.length}`,
+          timestamp: evt.timestamp || null,
+          signal: 'provenance',
+          tool_name: evt.type || 'context_assembly',
+          context: redactPaths(JSON.stringify(evt).slice(0, 500)),
+          what_worked: '',
+          what_went_wrong: '',
+          what_to_change: '',
+          tags: ['provenance'],
+          failure_type: null,
+          source: 'thumbgate',
+        });
+      }
+    } catch {
+      // Provenance read failure should not break export
+    }
+  }
+  writeJSONL(path.join(outputDir, 'traces.jsonl'), traceRows);
+  // --- Preferences split ---
+  const memoryLogPath = path.join(feedbackDir, 'memory-log.jsonl');
+  const memories = readJSONL(memoryLogPath);
+  let preferenceRows = [];
+  if (memories.length > 0) {
+    try {
+      const dpoResult = exportDpoFromMemories(memories);
+      preferenceRows = dpoResult.pairs.map((pair, i) => buildPreferenceRow(pair, i));
+    } catch {
+      // DPO export failure should not break the traces export
+    }
+  }
+  writeJSONL(path.join(outputDir, 'preferences.jsonl'), preferenceRows);
+  // --- Dataset info ---
+  const exportedAt = new Date().toISOString();
+  const info = buildDatasetInfo({
+    traceCount: traceRows.length,
+    preferenceCount: preferenceRows.length,
+    exportedAt,
+  });
+  fs.writeFileSync(
+    path.join(outputDir, 'dataset_info.json'),
+    JSON.stringify(info, null, 2) + '\n',
+  );
+  return {
+    outputDir,
+    traceCount: traceRows.length,
+    preferenceCount: preferenceRows.length,
+    files: ['traces.jsonl', 'preferences.jsonl', 'dataset_info.json'],
+    exportedAt,
+  };
+}
+// ---------------------------------------------------------------------------
+// CLI
+// ---------------------------------------------------------------------------
+function main() {
+  const args = {};
+  process.argv.slice(2).forEach((arg) => {
+    if (!arg.startsWith('--')) return;
+    const [key, ...rest] = arg.slice(2).split('=');
+    args[key] = rest.length ? rest.join('=') : true;
+  });
+  const result = exportHfDataset({
+    outputDir: args.output || undefined,
+    includeProvenance: args.provenance !== 'false',
+  });
+  console.log(`Exported HuggingFace dataset to ${result.outputDir}`);
+  console.log(`  Traces: ${result.traceCount}`);
+  console.log(`  Preferences: ${result.preferenceCount}`);
+  console.log(`  Files: ${result.files.join(', ')}`);
+}
+// Run the CLI only when this file is executed directly, not when it is required.
+if (require.main === module) {
+  main();
+}
+// Public API: the export entry point plus the row builders and helpers.
+module.exports = {
+  exportHfDataset,
+  buildTraceRow,
+  buildPreferenceRow,
+  buildDatasetInfo,
+  redactPaths,
+  redactEntry,
+  readJSONL,
+};

package/scripts/gates-engine.js CHANGED Viewed

@@ -11,6 +11,9 @@ const {
   DEFAULT_BASE_BRANCH,
   evaluateOperationalIntegrity,
 } = require('./operational-integrity');
+const {
+  evaluateWorkflowSentinel,
+} = require('./workflow-sentinel');
 /**
  * Computes the SHA-256 hash of an executable binary to prevent path-based bypasses.
@@ -764,6 +767,16 @@ function buildReasoning(gate, toolName, toolInput, extras = {}) {
     steps.push(`Memory guard matched (${extras.memoryGuard.source}): ${extras.memoryGuard.reason}`);
   }
+  if (extras.workflowSentinel) {
+    steps.push(`Workflow sentinel risk: ${extras.workflowSentinel.band} (${extras.workflowSentinel.riskScore})`);
+    if (extras.workflowSentinel.blastRadius && extras.workflowSentinel.blastRadius.summary) {
+      steps.push(`Workflow sentinel blast radius: ${extras.workflowSentinel.blastRadius.summary}`);
+    }
+    for (const remediation of (extras.workflowSentinel.remediations || []).slice(0, 3)) {
+      steps.push(`Workflow sentinel remediation: ${remediation.title} — ${remediation.action}`);
+    }
+  }
   // 5. Unless condition status
   if (gate.unless) {
     steps.push(`Bypassable via satisfy_gate("${gate.unless}") — not currently satisfied`);
@@ -973,6 +986,39 @@ function evaluateMemoryGuard(toolName, toolInput = {}) {
   };
 }
+function buildSentinelGateResult(report) {
+  return {
+    decision: report.decision,
+    gate: 'workflow-sentinel',
+    message: `${report.summary} ${report.blastRadius.summary}`,
+    severity: report.decision === 'deny' ? 'critical' : 'high',
+    reasoning: Array.isArray(report.reasoning) ? report.reasoning.slice() : [],
+    sentinel: report,
+  };
+}
+function enrichResultWithSentinel(result, report) {
+  if (!result || !report || report.decision === 'allow') {
+    return result;
+  }
+  const next = {
+    ...result,
+    reasoning: Array.isArray(result.reasoning) ? result.reasoning.slice() : [],
+    sentinel: report,
+  };
+  if (report.blastRadius && report.blastRadius.summary) {
+    next.message = `${result.message} Workflow sentinel: ${report.blastRadius.summary}`;
+  }
+  next.reasoning = next.reasoning.concat(
+    Array.isArray(report.reasoning) ? report.reasoning : []
+  );
+  return next;
+}
 async function checkMetricCondition(metricCondition) {
   if (!metricCondition) return true;
   const { getBusinessMetrics } = require('./semantic-layer');
@@ -1058,20 +1104,40 @@ async function evaluateGatesAsync(toolName, toolInput, configPath) {
     }
   }
+  const sentinelReport = evaluateWorkflowSentinel(toolName, toolInput, {
+    governanceState: loadGovernanceState(),
+  });
   const memoryGuard = evaluateMemoryGuard(toolName, toolInput);
   if (memoryGuard) {
-    recordStat(memoryGuard.gate, 'block');
+    const enrichedMemoryGuard = enrichResultWithSentinel(memoryGuard, sentinelReport);
+    recordStat(enrichedMemoryGuard.gate, 'block');
     const auditRecord = recordAuditEvent({
       toolName,
       toolInput,
       decision: 'deny',
-      gateId: memoryGuard.gate,
-      message: memoryGuard.message,
-      severity: memoryGuard.severity,
+      gateId: enrichedMemoryGuard.gate,
+      message: enrichedMemoryGuard.message,
+      severity: enrichedMemoryGuard.severity,
       source: 'gates-engine',
     });
     auditToFeedback(auditRecord);
-    return memoryGuard;
+    return enrichedMemoryGuard;
+  }
+  if (sentinelReport && sentinelReport.decision !== 'allow') {
+    const sentinelResult = buildSentinelGateResult(sentinelReport);
+    recordStat(sentinelResult.gate, sentinelResult.decision === 'deny' ? 'block' : 'warn');
+    const auditRecord = recordAuditEvent({
+      toolName,
+      toolInput,
+      decision: sentinelResult.decision,
+      gateId: sentinelResult.gate,
+      message: sentinelResult.message,
+      severity: sentinelResult.severity,
+      source: 'workflow-sentinel',
+    });
+    auditToFeedback(auditRecord);
+    return sentinelResult;
   }
   // Audit trail: record allow (no gate matched)
@@ -1124,20 +1190,40 @@ function evaluateGates(toolName, toolInput, configPath) {
     }
   }
+  const sentinelReport = evaluateWorkflowSentinel(toolName, toolInput, {
+    governanceState: loadGovernanceState(),
+  });
   const memoryGuard = evaluateMemoryGuard(toolName, toolInput);
   if (memoryGuard) {
-    recordStat(memoryGuard.gate, 'block');
+    const enrichedMemoryGuard = enrichResultWithSentinel(memoryGuard, sentinelReport);
+    recordStat(enrichedMemoryGuard.gate, 'block');
     const auditRecord = recordAuditEvent({
       toolName,
       toolInput,
       decision: 'deny',
-      gateId: memoryGuard.gate,
-      message: memoryGuard.message,
-      severity: memoryGuard.severity,
+      gateId: enrichedMemoryGuard.gate,
+      message: enrichedMemoryGuard.message,
+      severity: enrichedMemoryGuard.severity,
       source: 'gates-engine',
     });
     auditToFeedback(auditRecord);
-    return memoryGuard;
+    return enrichedMemoryGuard;
+  }
+  if (sentinelReport && sentinelReport.decision !== 'allow') {
+    const sentinelResult = buildSentinelGateResult(sentinelReport);
+    recordStat(sentinelResult.gate, sentinelResult.decision === 'deny' ? 'block' : 'warn');
+    const auditRecord = recordAuditEvent({
+      toolName,
+      toolInput,
+      decision: sentinelResult.decision,
+      gateId: sentinelResult.gate,
+      message: sentinelResult.message,
+      severity: sentinelResult.severity,
+      source: 'workflow-sentinel',
+    });
+    auditToFeedback(auditRecord);
+    return sentinelResult;
   }
   // Audit trail: record allow

package/scripts/hook-auto-capture.sh CHANGED Viewed

@@ -10,7 +10,7 @@ PROMPT_GUARD="$SCRIPT_DIR/prompt-guard.js"
 ACTIVE_CWD="${CLAUDE_PROJECT_DIR:-${PWD:-$(pwd)}}"
 FEEDBACK_DIR="$(node -e "const path = require('path'); const { resolveFeedbackDir } = require(path.join(process.argv[1], 'feedback-paths.js')); process.stdout.write(resolveFeedbackDir({ cwd: process.argv[2] || process.cwd(), feedbackDir: process.env.THUMBGATE_FEEDBACK_DIR || undefined }));" "$SCRIPT_DIR" "$ACTIVE_CWD" 2>/dev/null)"
 if [ -z "$FEEDBACK_DIR" ]; then
-  FEEDBACK_DIR="${THUMBGATE_FEEDBACK_DIR:-$ACTIVE_CWD/.rlhf}"
+  FEEDBACK_DIR="${THUMBGATE_FEEDBACK_DIR:-$ACTIVE_CWD/.thumbgate}"
 fi
 FEEDBACK_LOG="$FEEDBACK_DIR/feedback-log.jsonl"
 MEMORY_LOG="$FEEDBACK_DIR/memory-log.jsonl"