npm - thumbgate - Versions diffs - 1.5.8 → 1.7.0 - Mend

thumbgate 1.5.8 → 1.7.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (36) hide show

package/.claude-plugin/marketplace.json +2 -2
package/.claude-plugin/plugin.json +1 -1
package/.well-known/mcp/server-card.json +1 -1
package/CHANGELOG.md +198 -0
package/README.md +7 -6
package/adapters/README.md +1 -1
package/adapters/chatgpt/openapi.yaml +25 -0
package/adapters/claude/.mcp.json +2 -2
package/adapters/codex/config.toml +4 -4
package/adapters/mcp/server-stdio.js +41 -2
package/adapters/opencode/opencode.json +1 -1
package/bin/cli.js +100 -10
package/openapi/openapi.yaml +25 -0
package/package.json +13 -3
package/public/codex-plugin.html +277 -0
package/public/dashboard.html +141 -13
package/public/index.html +92 -34
package/public/learn.html +13 -2
package/public/lessons.html +5 -2
package/public/pro.html +8 -1
package/scripts/auto-wire-hooks.js +10 -5
package/scripts/billing.js +503 -8
package/scripts/contextfs.js +1 -1
package/scripts/dashboard.js +236 -0
package/scripts/feedback-loop.js +22 -0
package/scripts/gates-engine.js +461 -7
package/scripts/hook-runtime.js +42 -0
package/scripts/llm-client.js +25 -10
package/scripts/mailer/index.js +13 -0
package/scripts/mailer/resend-mailer.js +350 -0
package/scripts/mcp-config.js +13 -0
package/scripts/published-cli.js +8 -0
package/scripts/seo-gsd.js +118 -4
package/scripts/statusline.sh +8 -0
package/scripts/vector-store.js +21 -7
package/src/api/server.js +112 -7

package/scripts/gates-engine.js CHANGED Viewed

@@ -83,6 +83,11 @@ const DEFAULT_PROTECTED_FILE_GLOBS = [
 ];
 const EDIT_LIKE_TOOLS = new Set(['Edit', 'Write', 'MultiEdit']);
 const HIGH_RISK_BASH_PATTERN = /\b(?:git\s+(?:add|commit|push)|gh\s+pr\s+(?:create|merge)|npm\s+publish|yarn\s+publish|pnpm\s+publish|rm\s+-rf)\b/i;
// Scores / failure ratios at or above this value are treated as blocking by the boosted-risk guard.
const BOOSTED_RISK_BLOCK_SCORE = 0.8;
// Minimum example count before example/failure counts are taken into account.
const BOOSTED_RISK_MIN_EXAMPLES = 3;
// Action id tracked when a git commit is observed in a PR-branch context.
const PR_THREAD_RESOLUTION_ACTION = 'pr_thread_resolution_verified_after_commit';
// Pattern source handed to registerClaimGate; matches "thread/review/comment ... resolved/verified/..."
// in either order. NOTE(review): presumably compiled to a RegExp by registerClaimGate — confirm.
const PR_THREAD_RESOLUTION_CLAIM_PATTERN = '(?:thread|review|comment).*?(?:resolved|verified|checked|addressed|fixed)|(?:resolved|verified|checked|addressed|fixed).*?(?:thread|review|comment)';
// Action ids that count as evidence that review threads were checked.
const PR_THREAD_RESOLUTION_REQUIRED_ACTIONS = [
  'pr_threads_checked',
  'thread_resolution_verified',
];
 // ---------------------------------------------------------------------------
 // Config loading
@@ -609,6 +614,218 @@ function isHighRiskAction(toolName, toolInput = {}, affectedFiles = []) {
   return false;
 }
/**
 * Canonicalize free-form text for token comparison.
 *
 * Falsy input becomes the empty string; otherwise the value is stringified,
 * lower-cased, every run of characters outside [a-z0-9] is collapsed to a
 * single space, and surrounding whitespace is removed.
 *
 * @param {*} value - Text (or any value) to normalize.
 * @returns {string} Space-separated lowercase alphanumeric words.
 */
function normalizeRiskToken(value) {
  const text = value ? String(value) : '';
  const lowered = text.toLowerCase();
  const spaced = lowered.replace(/[^a-z0-9]+/g, ' ');
  return spaced.trim();
}
/**
 * Naive English singularization used only for risk-token matching.
 *
 * Tokens longer than three characters have a trailing "ies" turned into "y",
 * or otherwise a trailing "s" removed. Everything else is returned trimmed.
 *
 * @param {*} token - Token to singularize; falsy values yield ''.
 * @returns {string} The singularized token.
 */
function singularizeRiskToken(token) {
  const value = String(token || '').trim();
  if (value.length <= 3) return value;
  if (value.endsWith('ies')) return `${value.slice(0, -3)}y`;
  if (value.endsWith('s')) return value.slice(0, -1);
  return value;
}

/**
 * Expand a token into the set of spellings that should be treated as
 * equivalent when matching a risk tag against an action: the token itself,
 * its singular form, and the configured synonyms (plus their singular forms).
 *
 * The synonym table is a Map rather than a plain object so that tokens which
 * collide with inherited Object.prototype keys (e.g. "constructor") simply
 * have no synonyms instead of resolving to a non-iterable function and
 * throwing inside the loop.
 *
 * @param {string} token - A single normalized token.
 * @returns {string[]} Unique, non-empty variants in insertion order.
 */
function riskTokenVariants(token) {
  const synonyms = new Map([
    ['comment', ['comment', 'comments', 'review', 'reviews', 'reply', 'replies', 'thread', 'threads']],
    ['thread', ['thread', 'threads', 'review', 'reviews', 'comment', 'comments']],
    ['bot', ['bot', 'bots', 'automation', 'automated', 'assistant', 'claude', 'codex']],
    ['pr', ['pr', 'pull', 'pullrequest', 'pullrequests']],
    ['file', ['file', 'files', 'path', 'paths']],
    ['test', ['test', 'tests', 'ci', 'coverage', 'verify', 'verification']],
  ]);
  const singular = singularizeRiskToken(token);
  const variants = new Set([token, singular]);
  for (const candidate of [token, singular]) {
    for (const item of synonyms.get(candidate) ?? []) {
      variants.add(item);
      variants.add(singularizeRiskToken(item));
    }
  }
  return [...variants].filter(Boolean);
}
/**
 * Coerce one raw risk-tag entry into a uniform record.
 *
 * A non-empty string becomes `{ tag }`. An object is accepted when one of
 * tag/key/name/domain/label/id is truthy; its numeric fields are read from
 * the first non-nullish alias and passed through Number(), so missing values
 * come out as NaN. Anything else yields null.
 *
 * @param {*} entry - Raw entry (string or object).
 * @returns {{tag: string, count?: number, failures?: number, riskRate?: number}|null}
 */
function normalizeRiskTagEntry(entry) {
  if (typeof entry === 'string') {
    return entry ? { tag: entry } : null;
  }
  if (!entry || typeof entry !== 'object') return null;

  let label;
  for (const field of ['tag', 'key', 'name', 'domain', 'label', 'id']) {
    const candidate = entry[field];
    if (candidate) {
      label = candidate;
      break;
    }
  }
  if (!label) return null;

  // Mirrors an `a ?? b ?? c` chain: first non-nullish alias, else the last alias's value.
  const pick = (aliases) => {
    let value;
    for (const alias of aliases) {
      value = entry[alias];
      if (value != null) break;
    }
    return value;
  };

  return {
    tag: String(label),
    count: Number(pick(['count', 'examples', 'exampleCount', 'total', 'samples'])),
    failures: Number(pick(['failures', 'failureCount'])),
    riskRate: Number(pick(['riskRate', 'rate', 'failureRate', 'score', 'riskScore'])),
  };
}
/**
 * Gather every risk-tag entry attached to a tool input.
 *
 * Tags are read, in order, from `highRiskTags` and `riskTags` on the input
 * and from `highRiskTags`, `tags` and `highRiskDomains` on `input.boostedRisk`.
 * Only array-valued sources contribute; each element is normalized with
 * normalizeRiskTagEntry and unusable entries are dropped.
 *
 * A null or non-object `toolInput` is treated as an empty input instead of
 * throwing (the default parameter only covers `undefined`).
 *
 * @param {Object} [toolInput={}] - Tool input as received by the gate engine.
 * @returns {Array<Object>} Normalized tag records (possibly empty).
 */
function collectBoostedRiskTags(toolInput = {}) {
  const input = toolInput && typeof toolInput === 'object' ? toolInput : {};
  const boostedRisk = input.boostedRisk && typeof input.boostedRisk === 'object'
    ? input.boostedRisk
    : {};
  const sources = [
    input.highRiskTags,
    input.riskTags,
    boostedRisk.highRiskTags,
    boostedRisk.tags,
    boostedRisk.highRiskDomains,
  ];
  // flatMap avoids spreading a potentially large array into push() arguments.
  return sources
    .filter((source) => Array.isArray(source))
    .flatMap((source) => source
      .map((entry) => normalizeRiskTagEntry(entry))
      .filter(Boolean));
}
/**
 * Decide whether the boosted-risk metadata on a tool input is high enough to block.
 *
 * Returns true when any of the following holds:
 *  - the declared level/mode contains the word high, critical, block or deny;
 *  - the overall score is finite and >= BOOSTED_RISK_BLOCK_SCORE;
 *  - there are at least BOOSTED_RISK_MIN_EXAMPLES examples and the
 *    failure share is >= BOOSTED_RISK_BLOCK_SCORE;
 *  - any collected tag meets the score threshold, or has enough examples with
 *    no usable rate, or has enough examples with a blocking failure share.
 *
 * @param {Object} [toolInput={}] - Tool input carrying optional `boostedRisk` data.
 * @returns {boolean}
 */
function isBoostedRiskHigh(toolInput = {}) {
  const rawRisk = toolInput.boostedRisk;
  const risk = rawRisk && typeof rawRisk === 'object' ? rawRisk : {};

  const declaredLevel = String(risk.riskLevel || risk.level || risk.mode || '').toLowerCase();
  if (/\b(?:high|critical|block|deny)\b/.test(declaredLevel)) {
    return true;
  }

  const scoreBlocks = (score) => Number.isFinite(score) && score >= BOOSTED_RISK_BLOCK_SCORE;
  const enoughExamples = (count) => Number.isFinite(count) && count >= BOOSTED_RISK_MIN_EXAMPLES;
  const failureShareBlocks = (failures, count) => (
    enoughExamples(count) &&
    Number.isFinite(failures) &&
    failures / Math.max(count, 1) >= BOOSTED_RISK_BLOCK_SCORE
  );

  const overallScore = Number(
    risk.riskScore ?? risk.score ?? risk.riskRate ?? risk.failureRate ?? risk.baseRate,
  );
  if (scoreBlocks(overallScore)) return true;

  const overallExamples = Number(risk.exampleCount ?? risk.count ?? risk.samples ?? risk.total);
  const overallFailures = Number(risk.failureCount ?? risk.failures);
  if (failureShareBlocks(overallFailures, overallExamples)) return true;

  for (const entry of collectBoostedRiskTags(toolInput)) {
    if (scoreBlocks(entry.riskRate)) return true;
    // Enough recorded examples with no usable rate is itself treated as high risk.
    if (enoughExamples(entry.count) && !Number.isFinite(entry.riskRate)) return true;
    if (failureShareBlocks(entry.failures, entry.count)) return true;
  }
  return false;
}
/**
 * Check whether any word of a risk tag (or one of its variants) appears as a
 * whole word in the action context.
 *
 * Both inputs are normalized with normalizeRiskToken first; if either
 * normalizes to the empty string there is no match.
 *
 * @param {*} tag - Risk tag label.
 * @param {*} actionContext - Text describing the action being evaluated.
 * @returns {boolean}
 */
function riskTagMatchesAction(tag, actionContext) {
  const tagText = normalizeRiskToken(tag);
  const actionText = normalizeRiskToken(actionContext);
  if (!tagText || !actionText) return false;

  const toWords = (text) => text.split(/\s+/).filter(Boolean);
  const actionWords = new Set(toWords(actionText));
  for (const word of toWords(tagText)) {
    for (const variant of riskTokenVariants(word)) {
      if (actionWords.has(variant)) return true;
    }
  }
  return false;
}
/**
 * Default-deny guard driven by boosted-risk tags.
 *
 * Produces a deny result when the input carries risk tags, the boosted risk
 * is high (isBoostedRiskHigh), and at least one tag matches the action
 * context built by extractActionContext. Otherwise returns null.
 *
 * @param {string} toolName - Name of the tool about to run.
 * @param {Object} [toolInput={}] - Tool input, including optional risk metadata.
 * @returns {{decision: string, gate: string, message: string, severity: string, reasoning: string[]}|null}
 */
function evaluateBoostedRiskTagGuard(toolName, toolInput = {}) {
  const riskTags = collectBoostedRiskTags(toolInput);
  if (riskTags.length === 0) return null;
  if (!isBoostedRiskHigh(toolInput)) return null;

  const context = extractActionContext(toolName, toolInput);
  const hit = riskTags.find((candidate) => riskTagMatchesAction(candidate.tag, context));
  if (!hit) return null;

  // Prefer the most specific description of the action for the reasoning line.
  const matched = toolInput.command || toolInput.file_path || toolInput.path || context;
  const reasoning = [
    `High-risk tag "${hit.tag}" matched "${String(matched).slice(0, 120)}"`,
    `Risk threshold: score >= ${BOOSTED_RISK_BLOCK_SCORE} or at least ${BOOSTED_RISK_MIN_EXAMPLES} examples`,
    'Hook enforcement blocks this pre-tool call instead of relying on advisory recall',
  ];
  return {
    decision: 'deny',
    gate: 'boosted-risk-tag-default-deny',
    message: `Boosted-risk history matched this action (${hit.tag}). This pattern is denied by default until explicit evidence lowers the risk.`,
    severity: 'critical',
    reasoning,
  };
}
/**
 * Tell whether a tool call is a Bash invocation containing `git commit`.
 *
 * Tolerates a null/undefined `toolInput` (returns false) so the gate path
 * does not throw when a Bash call arrives without an input object.
 *
 * @param {string} toolName - Name of the tool being invoked.
 * @param {Object} [toolInput={}] - Tool input; `command` is inspected.
 * @returns {boolean}
 */
function isGitCommitCommand(toolName, toolInput = {}) {
  if (toolName !== 'Bash') return false;
  const command = String(toolInput?.command || '');
  return /\bgit\s+commit\b/i.test(command);
}
/**
 * Whether a branch name is exactly one of the protected names
 * (main, master, develop, dev, trunk, release), ignoring case and
 * surrounding whitespace.
 *
 * @param {*} branchName - Branch name to test; falsy values are not protected.
 * @returns {boolean}
 */
function isProtectedBranchName(branchName) {
  const candidate = String(branchName || '').trim();
  const protectedNames = /^(?:main|master|develop|dev|trunk|release)$/i;
  return protectedNames.test(candidate);
}
/**
 * Determine the current branch name for a tool call.
 *
 * An explicit name on the input (branchName, currentBranch, branch or
 * headRefName, first truthy wins) is returned trimmed. Otherwise, when a
 * repo root is given, the first line of `git rev-parse --abbrev-ref HEAD`
 * (via safeExecFileLines) is used. Falls back to the empty string.
 *
 * @param {Object} [toolInput={}] - Tool input that may carry a branch name.
 * @param {string|null} [repoRoot=null] - Repository root used for the git lookup.
 * @returns {string}
 */
function detectBranchName(toolInput = {}, repoRoot = null) {
  const explicit = toolInput.branchName
    || toolInput.currentBranch
    || toolInput.branch
    || toolInput.headRefName;
  if (explicit) {
    return String(explicit).trim();
  }
  if (!repoRoot) {
    return '';
  }
  const lines = safeExecFileLines('git', ['rev-parse', '--abbrev-ref', 'HEAD'], repoRoot);
  return lines[0] || '';
}
/**
 * Whether a tool call appears to happen in a pull-request context.
 *
 * True when the input carries any PR reference (prNumber, prUrl,
 * pullRequestNumber, pullRequestUrl), or when a branch name can be detected
 * and it is not one of the protected branch names.
 *
 * @param {Object} [toolInput={}] - Tool input.
 * @param {string|null} [repoRoot=null] - Repository root for branch detection.
 * @returns {boolean}
 */
function hasPrBranchContext(toolInput = {}, repoRoot = null) {
  const prReference = toolInput.prNumber
    || toolInput.prUrl
    || toolInput.pullRequestNumber
    || toolInput.pullRequestUrl;
  if (prReference) return true;

  const current = detectBranchName(toolInput, repoRoot);
  if (!current) return false;
  return !isProtectedBranchName(current);
}
/**
 * On a `git commit` made in a PR-branch context, register the review-thread
 * claim gate and track the pending thread-resolution action.
 *
 * Returns null without side effects when the call is not a git commit or no
 * PR-branch context is detected. The tracked action records the branch name,
 * repo root, and a SHA-256 hash of the command text.
 *
 * @param {string} toolName - Name of the tool being invoked.
 * @param {Object} [toolInput={}] - Tool input.
 * @returns {*} Whatever registerClaimGate returns, or null.
 */
function registerPrThreadResolutionClaimGate(toolName, toolInput = {}) {
  const isCommit = isGitCommitCommand(toolName, toolInput);
  if (!isCommit) return null;

  const repoRoot = resolveRepoRoot(toolInput);
  const onPrBranch = hasPrBranchContext(toolInput, repoRoot);
  if (!onPrBranch) return null;

  const branchName = detectBranchName(toolInput, repoRoot);
  const gate = registerClaimGate(
    PR_THREAD_RESOLUTION_CLAIM_PATTERN,
    PR_THREAD_RESOLUTION_REQUIRED_ACTIONS,
    'A PR-branch commit requires verified review-thread resolution before more tool calls or readiness claims.',
  );

  const commandText = String(toolInput.command || '');
  const commandHash = crypto.createHash('sha256').update(commandText).digest('hex');
  trackAction(PR_THREAD_RESOLUTION_ACTION, {
    branchName: branchName || null,
    repoRoot: repoRoot || null,
    commandHash,
  });
  return gate;
}
/**
 * True as soon as any one of PR_THREAD_RESOLUTION_REQUIRED_ACTIONS has been
 * recorded as an action or is reported satisfied as a condition.
 *
 * @returns {boolean}
 */
function isThreadResolutionSatisfied() {
  for (const actionId of PR_THREAD_RESOLUTION_REQUIRED_ACTIONS) {
    if (hasAction(actionId)) return true;
    if (isConditionSatisfied(actionId)) return true;
  }
  return false;
}
/**
 * Whether a tool call is allowed through while thread-resolution evidence is
 * still pending.
 *
 * Allowed: git commits, the listed recall/verification tools, and Bash
 * commands that match the evidence pattern (gate-satisfy / satisfy_gate /
 * track_action, `gh pr view|checks|status`, `gh api` calls mentioning review
 * threads/reviews/comments, `git status|diff|show`).
 *
 * @param {string} toolName - Name of the tool being invoked.
 * @param {Object} [toolInput={}] - Tool input; `command` is inspected for Bash.
 * @returns {boolean}
 */
function isThreadResolutionEvidenceAction(toolName, toolInput = {}) {
  if (isGitCommitCommand(toolName, toolInput)) return true;

  const evidenceTools = new Set(['recall', 'search_lessons', 'verify_claim', 'satisfy_gate', 'track_action']);
  if (evidenceTools.has(toolName)) return true;
  if (toolName !== 'Bash') return false;

  const evidenceCommand = /\b(?:gate-satisfy|satisfy_gate|track_action|gh\s+pr\s+(?:view|checks|status)|gh\s+api\b.*(?:reviewThreads|reviews|comments|threads)|git\s+(?:status|diff|show))\b/i;
  return evidenceCommand.test(String(toolInput.command || ''));
}
/**
 * Deny the current tool call while a PR-branch commit is still awaiting
 * thread-resolution evidence.
 *
 * Returns null when no PR_THREAD_RESOLUTION_ACTION has been tracked, when
 * resolution is already satisfied, or when the call itself is an
 * evidence-gathering action.
 *
 * @param {string} toolName - Name of the tool being invoked.
 * @param {Object} [toolInput={}] - Tool input.
 * @returns {{decision: string, gate: string, message: string, severity: string, reasoning: string[]}|null}
 */
function evaluatePendingPrThreadResolutionGate(toolName, toolInput = {}) {
  const pending = hasAction(PR_THREAD_RESOLUTION_ACTION);
  if (
    !pending ||
    isThreadResolutionSatisfied() ||
    isThreadResolutionEvidenceAction(toolName, toolInput)
  ) {
    return null;
  }

  const reasoning = [
    `Tracked action ${PR_THREAD_RESOLUTION_ACTION} is pending`,
    'Satisfy pr_threads_checked or thread_resolution_verified with evidence before continuing',
  ];
  return {
    decision: 'deny',
    gate: 'pr-thread-resolution-verified-required',
    message: 'A git commit was made on a PR branch. Verify review threads are resolved before the next tool call.',
    severity: 'critical',
    reasoning,
  };
}
 function isScopeEnforcedAction(toolName, toolInput = {}, affectedFiles = []) {
   if (EDIT_LIKE_TOOLS.has(toolName) && affectedFiles.length > 0) return true;
   if (toolName !== 'Bash') return false;
@@ -1116,6 +1333,38 @@ async function evaluateGatesAsync(toolName, toolInput, configPath) {
   }
   const constraints = loadConstraints();
+  registerPrThreadResolutionClaimGate(toolName, toolInput);
+  const pendingThreadResolutionGate = evaluatePendingPrThreadResolutionGate(toolName, toolInput);
+  if (pendingThreadResolutionGate) {
+    recordStat(pendingThreadResolutionGate.gate, 'block');
+    const auditRecord = recordAuditEvent({
+      toolName,
+      toolInput,
+      decision: 'deny',
+      gateId: pendingThreadResolutionGate.gate,
+      message: pendingThreadResolutionGate.message,
+      severity: pendingThreadResolutionGate.severity,
+      source: 'gates-engine',
+    });
+    auditToFeedback(auditRecord);
+    return pendingThreadResolutionGate;
+  }
+  const boostedRiskGuard = evaluateBoostedRiskTagGuard(toolName, toolInput);
+  if (boostedRiskGuard) {
+    recordStat(boostedRiskGuard.gate, 'block');
+    const auditRecord = recordAuditEvent({
+      toolName,
+      toolInput,
+      decision: 'deny',
+      gateId: boostedRiskGuard.gate,
+      message: boostedRiskGuard.message,
+      severity: boostedRiskGuard.severity,
+      source: 'gates-engine',
+    });
+    auditToFeedback(auditRecord);
+    return boostedRiskGuard;
+  }
   // Fast-path: feedback/recall tools skip metric gates entirely (avoids Stripe API calls)
   const METRIC_SKIP_TOOLS = ['capture_feedback', 'feedback_stats', 'recall', 'feedback_summary', 'prevention_rules'];
@@ -1254,6 +1503,38 @@ function evaluateGates(toolName, toolInput, configPath) {
   }
   const constraints = loadConstraints();
+  registerPrThreadResolutionClaimGate(toolName, toolInput);
+  const pendingThreadResolutionGate = evaluatePendingPrThreadResolutionGate(toolName, toolInput);
+  if (pendingThreadResolutionGate) {
+    recordStat(pendingThreadResolutionGate.gate, 'block');
+    const auditRecord = recordAuditEvent({
+      toolName,
+      toolInput,
+      decision: 'deny',
+      gateId: pendingThreadResolutionGate.gate,
+      message: pendingThreadResolutionGate.message,
+      severity: pendingThreadResolutionGate.severity,
+      source: 'gates-engine',
+    });
+    auditToFeedback(auditRecord);
+    return pendingThreadResolutionGate;
+  }
+  const boostedRiskGuard = evaluateBoostedRiskTagGuard(toolName, toolInput);
+  if (boostedRiskGuard) {
+    recordStat(boostedRiskGuard.gate, 'block');
+    const auditRecord = recordAuditEvent({
+      toolName,
+      toolInput,
+      decision: 'deny',
+      gateId: boostedRiskGuard.gate,
+      message: boostedRiskGuard.message,
+      severity: boostedRiskGuard.severity,
+      source: 'gates-engine',
+    });
+    auditToFeedback(auditRecord);
+    return boostedRiskGuard;
+  }
   for (const gate of config.gates) {
     const matchDetails = matchGate(gate, toolName, toolInput);
@@ -1456,14 +1737,20 @@ function evaluateSecretGuard(input = {}) {
 // PreToolUse hook interface (stdin/stdout JSON)
 // ---------------------------------------------------------------------------
/**
 * Build the hook output fragment that carries a reminder string under all
 * three keys: additionalContext, systemReminder and thumbgateSystemReminder.
 *
 * @param {*} context - Reminder text to surface.
 * @returns {{additionalContext: *, systemReminder: *, thumbgateSystemReminder: *}}
 */
function buildReminderOutput(context) {
  const reminderKeys = ['additionalContext', 'systemReminder', 'thumbgateSystemReminder'];
  return Object.fromEntries(reminderKeys.map((key) => [key, context]));
}
 function formatOutput(result, behavioralContext) {
   if (!result) {
     // No gate matched — inject behavioral context if available
     if (behavioralContext) {
       return JSON.stringify({
-        hookSpecificOutput: {
-          additionalContext: behavioralContext,
-        },
+        hookSpecificOutput: buildReminderOutput(behavioralContext),
       });
     }
     return JSON.stringify({});
@@ -1474,19 +1761,27 @@ function formatOutput(result, behavioralContext) {
     : '';
   if (result.decision === 'deny') {
+    const reminder = behavioralContext ? buildReminderOutput(behavioralContext) : {};
+    const reminderSuffix = behavioralContext ? `\n\nSystem reminder:\n${behavioralContext}` : '';
     return JSON.stringify({
       hookSpecificOutput: {
+        ...reminder,
         permissionDecision: 'deny',
-        permissionDecisionReason: `[GATE:${result.gate}] ${result.message}${reasoningSuffix}`,
+        permissionDecisionReason: `[GATE:${result.gate}] ${result.message}${reasoningSuffix}${reminderSuffix}`,
       },
     });
   }
   if (result.decision === 'warn') {
     const extra = behavioralContext ? `\n${behavioralContext}` : '';
+    const context = `[GATE:${result.gate}] WARNING: ${result.message}${reasoningSuffix}${extra}`;
     return JSON.stringify({
       hookSpecificOutput: {
-        additionalContext: `[GATE:${result.gate}] WARNING: ${result.message}${reasoningSuffix}${extra}`,
+        additionalContext: context,
+        ...(behavioralContext ? {
+          systemReminder: behavioralContext,
+          thumbgateSystemReminder: behavioralContext,
+        } : {}),
       },
     });
   }
@@ -1518,6 +1813,146 @@ function buildBehavioralContext() {
   }
 }
/**
 * Build a "recent mistakes" reminder from memory-log.jsonl.
 *
 * Reads the log from the feedback directory, walks it from the newest line
 * backwards, and keeps up to `limit` entries whose category is 'error' or
 * 'learning' and whose timestamp falls inside the age window. Each entry is
 * rendered as a bullet with its title and, when present, the
 * "How to avoid:" advice from its content.
 *
 * This is best-effort: any failure to locate or read the log (including a
 * missing ./feedback-paths module) yields null rather than an exception.
 * The header reports the actual window in use, so a custom `maxAgeMs` is no
 * longer mislabelled as "last 24h".
 *
 * @param {Object} [options]
 * @param {number} [options.maxAgeMs=86400000] - Maximum entry age in ms (24h by default).
 * @param {number} [options.limit=3] - Maximum number of entries to include.
 * @returns {string|null} Reminder text, or null when nothing qualifies.
 */
function buildRecentCorrectiveActionsContext(options = {}) {
  // The default parameter only covers `undefined`; tolerate an explicit null too.
  const settings = options ?? {};
  const maxAgeMs = typeof settings.maxAgeMs === 'number' ? settings.maxAgeMs : 24 * 60 * 60 * 1000;
  const limit = typeof settings.limit === 'number' ? settings.limit : 3;

  let raw;
  try {
    const { resolveFeedbackDir } = require('./feedback-paths');
    const memoryLogPath = path.join(resolveFeedbackDir({}), 'memory-log.jsonl');
    if (!fs.existsSync(memoryLogPath)) return null;
    raw = fs.readFileSync(memoryLogPath, 'utf8');
  } catch {
    return null;
  }

  const lines = raw.split('\n').filter(Boolean);
  if (lines.length === 0) return null;

  const cutoff = Date.now() - maxAgeMs;
  const recent = [];
  // Walk from the tail backwards so we get the newest entries first.
  for (let i = lines.length - 1; i >= 0 && recent.length < limit; i--) {
    let entry;
    try {
      entry = JSON.parse(lines[i]);
    } catch {
      continue; // skip malformed line
    }
    if (!entry || (entry.category !== 'error' && entry.category !== 'learning')) continue;
    const ts = entry.timestamp ? Date.parse(entry.timestamp) : NaN;
    if (!Number.isFinite(ts) || ts < cutoff) continue;
    recent.push(entry);
  }
  if (recent.length === 0) return null;

  const formatted = recent.map((m) => {
    const title = String(m.title || '').replace(/^MISTAKE:\s*/, '').slice(0, 140);
    const advice = extractAvoidanceAdvice(String(m.content || ''));
    return advice ? `  • ${title}\n    → ${advice}` : `  • ${title}`;
  });

  // Human-readable window: whole hours when >= 1h, otherwise minutes.
  const HOUR_MS = 60 * 60 * 1000;
  let windowLabel = 'recent';
  if (Number.isFinite(maxAgeMs)) {
    windowLabel = maxAgeMs >= HOUR_MS
      ? `last ${Math.round(maxAgeMs / HOUR_MS)}h`
      : `last ${Math.max(1, Math.round(maxAgeMs / 60000))}m`;
  }
  return `[ThumbGate] Recent mistakes (${windowLabel}) — do NOT repeat:\n${formatted.join('\n')}`;
}
/**
 * Build per-action lesson context for a tool call.
 *
 * Asks ./lesson-retrieval for up to three lessons relevant to the action
 * context (see extractActionContext), keeps those whose signal is
 * 'negative', and renders them as bullets (title plus optional
 * "How to avoid:" advice) for injection into hook output.
 *
 * Returns null when there is no tool name, the retrieval module cannot be
 * loaded, no action context can be built, no negative lesson is returned, or
 * retrieval/formatting throws.
 *
 * @param {string} toolName - Name of the tool about to run.
 * @param {Object} toolInput - Tool input used to build the search context.
 * @returns {string|null}
 */
function buildRelevantLessonContext(toolName, toolInput) {
  if (!toolName) return null;

  let retrieveRelevantLessons;
  try {
    ({ retrieveRelevantLessons } = require('./lesson-retrieval'));
  } catch {
    return null;
  }

  const searchContext = extractActionContext(toolName, toolInput);
  if (!searchContext) return null;

  const isNegative = (lesson) => lesson.signal === 'negative';
  const toBullet = (lesson) => {
    const heading = (lesson.title || '').replace(/^MISTAKE:\s*/, '').slice(0, 140);
    const advice = extractAvoidanceAdvice(lesson.content);
    if (!advice) return `  • ${heading}`;
    return `  • ${heading}\n    → ${advice}`;
  };

  try {
    const found = retrieveRelevantLessons(toolName, searchContext, { maxResults: 3 });
    // Retrieval is expected to have applied its own relevance cut-off already,
    // so every negative lesson it returns is surfaced.
    const mistakes = found.filter(isNegative);
    if (mistakes.length === 0) return null;
    const bullets = mistakes.map(toBullet);
    return `[ThumbGate] Past mistakes relevant to this action — read before proceeding:\n${bullets.join('\n')}`;
  } catch {
    return null;
  }
}
/**
 * Flatten a tool call into one searchable string.
 *
 * Starts with the tool name and appends, in order and when truthy, the
 * input's command (max 400 chars), file_path (untruncated), description
 * (max 200), prompt (max 400) and pattern (max 200), separated by spaces.
 * With no tool input the tool name is returned unchanged.
 *
 * @param {string} toolName - Name of the tool.
 * @param {Object} [toolInput] - Tool input.
 * @returns {string} Combined context (or `toolName` itself when there is no input).
 */
function extractActionContext(toolName, toolInput) {
  if (!toolInput) return toolName;

  // [field, maximum length]; Infinity means "keep the whole value".
  const fieldLimits = [
    ['command', 400],
    ['file_path', Infinity],
    ['description', 200],
    ['prompt', 400],
    ['pattern', 200],
  ];
  const pieces = [toolName];
  for (const [field, maxLength] of fieldLimits) {
    const raw = toolInput[field];
    if (raw) pieces.push(String(raw).slice(0, maxLength));
  }
  return pieces.filter(Boolean).join(' ');
}
/**
 * Pull the "How to avoid:" advice out of a lesson's content.
 *
 * The match is case-insensitive and captures the rest of the line after the
 * marker, trimmed and capped at 220 characters. Non-string content is
 * coerced to a string first so that a malformed lesson cannot throw.
 *
 * @param {*} content - Lesson content.
 * @returns {string|null} The advice text, or null when absent.
 */
function extractAvoidanceAdvice(content) {
  if (!content) return null;
  const text = typeof content === 'string' ? content : String(content);
  const match = /How to avoid:\s*([^\n]+)/i.exec(text);
  return match ? match[1].trim().slice(0, 220) : null;
}
/**
 * Join the non-empty string arguments with a blank line between them.
 *
 * @param {...*} ctxs - Candidate context strings; non-strings and '' are ignored.
 * @returns {string|null} The combined text, or null when nothing usable was passed.
 */
function mergeContextStrings(...ctxs) {
  const kept = [];
  for (const ctx of ctxs) {
    if (typeof ctx === 'string' && ctx !== '') kept.push(ctx);
  }
  return kept.length > 0 ? kept.join('\n\n') : null;
}
 async function runAsync(input) {
   const secretGuard = evaluateSecretGuard(input);
   if (secretGuard) {
@@ -1545,7 +1980,10 @@ async function runAsync(input) {
   }
   const behavioralContext = buildBehavioralContext();
-  return formatOutput(result, behavioralContext);
+  const lessonContext = buildRelevantLessonContext(toolName, toolInput);
+  const recentContext = buildRecentCorrectiveActionsContext();
+  const combinedContext = mergeContextStrings(lessonContext, recentContext, behavioralContext);
+  return formatOutput(result, combinedContext);
 }
 function run(input) {
@@ -1575,7 +2013,10 @@ function run(input) {
   }
   const behavioralContext = buildBehavioralContext();
-  return formatOutput(result, behavioralContext);
+  const lessonContext = buildRelevantLessonContext(toolName, toolInput);
+  const recentContext = buildRecentCorrectiveActionsContext();
+  const combinedContext = mergeContextStrings(lessonContext, recentContext, behavioralContext);
+  return formatOutput(result, combinedContext);
 }
 // ---------------------------------------------------------------------------
@@ -1796,7 +2237,20 @@ module.exports = {
   PROTECTED_APPROVAL_TTL_MS,
   DEFAULT_PROTECTED_FILE_GLOBS,
   buildBehavioralContext,
+  buildRecentCorrectiveActionsContext,
+  buildRelevantLessonContext,
+  extractActionContext,
+  extractAvoidanceAdvice,
+  mergeContextStrings,
+  buildReminderOutput,
   isHighRiskAction,
+  collectBoostedRiskTags,
+  isBoostedRiskHigh,
+  riskTagMatchesAction,
+  evaluateBoostedRiskTagGuard,
+  registerPrThreadResolutionClaimGate,
+  evaluatePendingPrThreadResolutionGate,
+  PR_THREAD_RESOLUTION_ACTION,
 };
 // ---------------------------------------------------------------------------

package/scripts/hook-runtime.js CHANGED Viewed

@@ -44,10 +44,25 @@ function resolveCliBaseCommand() {
   return publishedCliShellCommand(version);
 }
/**
 * Resolve the base shell command used for Codex hooks.
 *
 * Uses the local `bin/cli.js` via `node` only when hook commands for the
 * current package version are not published AND the package root is a source
 * checkout; in every other case the published CLI command for 'latest' is
 * used with `preferInstalled: false`.
 *
 * @returns {string} Shell command prefix.
 */
function resolveCodexCliBaseCommand() {
  const version = packageVersion();
  const useLocalCheckout = !publishedHookCommandsAvailable(version) && isSourceCheckout(PKG_ROOT);
  if (useLocalCheckout) {
    const cliPath = path.join(PKG_ROOT, 'bin', 'cli.js');
    return `node ${shellQuote(cliPath)}`;
  }
  return publishedCliShellCommand('latest', [], { preferInstalled: false });
}
 function buildPortableHookCommand(subcommand) {
   return `${resolveCliBaseCommand()} ${subcommand}`;
 }
/**
 * Compose a Codex hook command from the Codex CLI base command and a subcommand.
 *
 * @param {string} subcommand - CLI subcommand to append.
 * @returns {string} `<codex base command> <subcommand>`.
 */
function buildCodexPortableHookCommand(subcommand) {
  const baseCommand = resolveCodexCliBaseCommand();
  return `${baseCommand} ${subcommand}`;
}
 function preToolHookCommand() {
   return buildPortableHookCommand('gate-check');
 }
@@ -68,12 +83,39 @@ function statuslineCommand() {
   return buildPortableHookCommand('statusline-render');
 }
/**
 * Codex shell command for the pre-tool hook (the `gate-check` subcommand).
 *
 * @returns {string}
 */
function codexPreToolHookCommand() {
  const subcommand = 'gate-check';
  return buildCodexPortableHookCommand(subcommand);
}
/**
 * Codex shell command for the user-prompt hook (the `hook-auto-capture` subcommand).
 *
 * @returns {string}
 */
function codexUserPromptHookCommand() {
  const subcommand = 'hook-auto-capture';
  return buildCodexPortableHookCommand(subcommand);
}
/**
 * Codex shell command for the session-start hook (the `session-start` subcommand).
 *
 * @returns {string}
 */
function codexSessionStartHookCommand() {
  const subcommand = 'session-start';
  return buildCodexPortableHookCommand(subcommand);
}
/**
 * Codex shell command for the cache-update hook (the `cache-update` subcommand).
 *
 * @returns {string}
 */
function codexCacheUpdateHookCommand() {
  const subcommand = 'cache-update';
  return buildCodexPortableHookCommand(subcommand);
}
/**
 * Codex shell command that renders the status line (the `statusline-render` subcommand).
 *
 * @returns {string}
 */
function codexStatuslineCommand() {
  const subcommand = 'statusline-render';
  return buildCodexPortableHookCommand(subcommand);
}
 module.exports = {
   buildPortableHookCommand,
+  buildCodexPortableHookCommand,
   cacheUpdateHookCommand,
+  codexCacheUpdateHookCommand,
+  codexPreToolHookCommand,
+  codexSessionStartHookCommand,
+  codexStatuslineCommand,
+  codexUserPromptHookCommand,
   packageVersion,
   publishedHookCommandsAvailable,
   preToolHookCommand,
+  resolveCodexCliBaseCommand,
   resolveCliBaseCommand,
   sessionStartHookCommand,
   statuslineCommand,

package/scripts/llm-client.js CHANGED Viewed

@@ -1,6 +1,8 @@
 #!/usr/bin/env node
 'use strict';
+const { runStep } = require('./durability/step');
 const MODELS = {
   FAST: 'claude-haiku-4-5-20251001',
   SMART: 'claude-sonnet-4-6',
@@ -33,25 +35,38 @@ function stripCodeFences(text) {
   return fenced ? fenced[1].trim() : text.trim();
 }
+// Anthropic SDK throws errors with a `.status` field for HTTP failures.
+// Our defaultClassify already reads `.status`, so 429/5xx retry and 4xx
+// (bad request / unauthorized / not-found) bail immediately — which is
+// what we want: there is no point retrying a malformed prompt or a
+// revoked API key.
 async function callClaude({ systemPrompt, userPrompt, model, maxTokens } = {}) {
   const client = getClient();
   if (!client) return null;
   try {
-    const response = await client.messages.create({
-      model: model || DEFAULT_MODEL,
-      max_tokens: maxTokens || DEFAULT_MAX_TOKENS,
-      system: systemPrompt || undefined,
-      messages: [{ role: 'user', content: userPrompt }],
-    });
+    const text = await runStep('llm.callClaude', {
+      retries: 2,
+      logger: (msg) => console.warn(msg),
+    }, async () => {
+      const response = await client.messages.create({
+        model: model || DEFAULT_MODEL,
+        max_tokens: maxTokens || DEFAULT_MAX_TOKENS,
+        system: systemPrompt || undefined,
+        messages: [{ role: 'user', content: userPrompt }],
+      });
-    const text = response.content
-      .filter((b) => b.type === 'text')
-      .map((b) => b.text)
-      .join('');
+      return response.content
+        .filter((b) => b.type === 'text')
+        .map((b) => b.text)
+        .join('');
+    });
     return stripCodeFences(text);
   } catch {
+    // Preserve the original callClaude contract — callers expect `null` on
+    // failure, not an exception. runStep already logged retry attempts,
+    // so the permanent failure is visible in logs.
     return null;
   }
 }

package/scripts/mailer/index.js ADDED Viewed

@@ -0,0 +1,13 @@
+'use strict';
+/**
+ * scripts/mailer/index.js — public entry point for the mailer module.
+ */
+const { sendEmail, sendTrialWelcomeEmail, renderTrialWelcomeBodies } = require('./resend-mailer');
+module.exports = {
+  sendEmail,
+  sendTrialWelcomeEmail,
+  renderTrialWelcomeBodies,
+};