npm - @vibecheckai/cli - Versions diffs - 3.2.6 → 3.3.0 - Mend

@vibecheckai/cli 3.2.6 → 3.3.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (84) hide show

package/bin/registry.js +192 -5
package/bin/runners/lib/agent-firewall/change-packet/builder.js +280 -6
package/bin/runners/lib/agent-firewall/critic/index.js +151 -0
package/bin/runners/lib/agent-firewall/critic/judge.js +432 -0
package/bin/runners/lib/agent-firewall/critic/prompts.js +305 -0
package/bin/runners/lib/agent-firewall/lawbook/distributor.js +465 -0
package/bin/runners/lib/agent-firewall/lawbook/evaluator.js +604 -0
package/bin/runners/lib/agent-firewall/lawbook/index.js +304 -0
package/bin/runners/lib/agent-firewall/lawbook/registry.js +514 -0
package/bin/runners/lib/agent-firewall/lawbook/schema.js +420 -0
package/bin/runners/lib/agent-firewall/logger.js +141 -0
package/bin/runners/lib/agent-firewall/policy/loader.js +312 -4
package/bin/runners/lib/agent-firewall/policy/rules/ghost-env.js +113 -1
package/bin/runners/lib/agent-firewall/policy/rules/ghost-route.js +133 -6
package/bin/runners/lib/agent-firewall/proposal/extractor.js +394 -0
package/bin/runners/lib/agent-firewall/proposal/index.js +212 -0
package/bin/runners/lib/agent-firewall/proposal/schema.js +251 -0
package/bin/runners/lib/agent-firewall/proposal/validator.js +386 -0
package/bin/runners/lib/agent-firewall/reality/index.js +332 -0
package/bin/runners/lib/agent-firewall/reality/state.js +625 -0
package/bin/runners/lib/agent-firewall/reality/watcher.js +322 -0
package/bin/runners/lib/agent-firewall/risk/index.js +173 -0
package/bin/runners/lib/agent-firewall/risk/scorer.js +328 -0
package/bin/runners/lib/agent-firewall/risk/thresholds.js +321 -0
package/bin/runners/lib/agent-firewall/risk/vectors.js +421 -0
package/bin/runners/lib/agent-firewall/simulator/diff-simulator.js +472 -0
package/bin/runners/lib/agent-firewall/simulator/import-resolver.js +346 -0
package/bin/runners/lib/agent-firewall/simulator/index.js +181 -0
package/bin/runners/lib/agent-firewall/simulator/route-validator.js +380 -0
package/bin/runners/lib/agent-firewall/time-machine/incident-correlator.js +661 -0
package/bin/runners/lib/agent-firewall/time-machine/index.js +267 -0
package/bin/runners/lib/agent-firewall/time-machine/replay-engine.js +436 -0
package/bin/runners/lib/agent-firewall/time-machine/state-reconstructor.js +490 -0
package/bin/runners/lib/agent-firewall/time-machine/timeline-builder.js +530 -0
package/bin/runners/lib/analyzers.js +81 -18
package/bin/runners/lib/authority-badge.js +425 -0
package/bin/runners/lib/cli-output.js +7 -1
package/bin/runners/lib/error-handler.js +16 -9
package/bin/runners/lib/exit-codes.js +275 -0
package/bin/runners/lib/global-flags.js +37 -0
package/bin/runners/lib/help-formatter.js +413 -0
package/bin/runners/lib/logger.js +38 -0
package/bin/runners/lib/unified-cli-output.js +604 -0
package/bin/runners/lib/upsell.js +148 -0
package/bin/runners/runApprove.js +1200 -0
package/bin/runners/runAuth.js +324 -95
package/bin/runners/runCheckpoint.js +39 -21
package/bin/runners/runClassify.js +859 -0
package/bin/runners/runContext.js +136 -24
package/bin/runners/runDoctor.js +108 -68
package/bin/runners/runFix.js +6 -5
package/bin/runners/runGuard.js +212 -118
package/bin/runners/runInit.js +3 -2
package/bin/runners/runMcp.js +130 -52
package/bin/runners/runPolish.js +43 -20
package/bin/runners/runProve.js +1 -2
package/bin/runners/runReport.js +3 -2
package/bin/runners/runScan.js +63 -44
package/bin/runners/runShip.js +3 -4
package/bin/runners/runValidate.js +19 -2
package/bin/runners/runWatch.js +104 -53
package/bin/vibecheck.js +106 -19
package/mcp-server/HARDENING_SUMMARY.md +299 -0
package/mcp-server/agent-firewall-interceptor.js +367 -31
package/mcp-server/authority-tools.js +569 -0
package/mcp-server/conductor/conflict-resolver.js +588 -0
package/mcp-server/conductor/execution-planner.js +544 -0
package/mcp-server/conductor/index.js +377 -0
package/mcp-server/conductor/lock-manager.js +615 -0
package/mcp-server/conductor/request-queue.js +550 -0
package/mcp-server/conductor/session-manager.js +500 -0
package/mcp-server/conductor/tools.js +510 -0
package/mcp-server/index.js +1149 -243
package/mcp-server/lib/{api-client.js → api-client.cjs} +40 -4
package/mcp-server/lib/logger.cjs +30 -0
package/mcp-server/logger.js +173 -0
package/mcp-server/package.json +2 -2
package/mcp-server/premium-tools.js +2 -2
package/mcp-server/tier-auth.js +245 -35
package/mcp-server/truth-firewall-tools.js +145 -15
package/mcp-server/vibecheck-tools.js +2 -2
package/package.json +2 -3
package/mcp-server/index.old.js +0 -4137
package/mcp-server/package-lock.json +0 -165

package/bin/runners/lib/agent-firewall/critic/judge.js ADDED Viewed

@@ -0,0 +1,432 @@
+/**
+ * Critic LLM Judge
+ *
+ * The "savage" judge that evaluates proposal quality.
+ * Detects hand-waving, vague intent, and unverified assumptions.
+ *
+ * Philosophy: "If this change cannot be proven safe by the repository, block it."
+ */
+"use strict";
+const {
+  CRITIC_SYSTEM_PROMPT,
+  buildEvaluationPrompt,
+  buildVaguenessPrompt,
+  buildVerificationPrompt,
+  parseCriticResponse,
+} = require("./prompts");
+/**
+ * @typedef {Object} CriticVerdict
+ * @property {string} verdict - ALLOW, BLOCK, or REQUIRE_CONFIRMATION
+ * @property {number} confidence - Confidence in verdict (0-1)
+ * @property {Array} reasoning - Reasons for the verdict
+ * @property {Array} violations - Specific violations found
+ * @property {Array} recommendations - Suggestions for improvement
+ */
/**
 * Default LLM client configuration.
 *
 * Every key can be overridden through the options passed to the
 * CriticJudge constructor.
 */
const DEFAULT_CONFIG = {
  model: "gpt-4-turbo-preview",
  temperature: 0.1, // Low temperature for consistent judgments
  maxTokens: 1000,
  timeout: 30000, // Milliseconds; enforced by CriticJudge#callLLM
};

/** Verdict strings accepted from the LLM; anything else is coerced to BLOCK. */
const VALID_VERDICTS = ["ALLOW", "BLOCK", "REQUIRE_CONFIRMATION"];

/** Single-word intents that say nothing about what is actually changing. */
const VAGUE_INTENTS = ["fix", "update", "change", "modify", "improve", "refactor", "adjust"];

/**
 * Filler words that make a summary vague. Each one is matched as a whole
 * word so that "fetch" does not count as "etc" and "awesome" does not count
 * as "some". The patterns carry no `g` flag, so `test()` is stateless.
 */
const VAGUE_WORD_PATTERNS = ["some", "various", "etc", "stuff", "things", "somehow"].map(
  (word) => ({ word, pattern: new RegExp(`\\b${word}\\b`, "i") })
);

/** Path fragments that mark an operation as touching a sensitive domain. */
const SENSITIVE_DOMAINS = ["auth", "payments", "database"];

/**
 * Membership test that tolerates the shapes a reality-state collection may
 * take: anything exposing `has()` (Set/Map), an array, or a plain object
 * keyed by name. Any other value is treated as "not present".
 * @param {*} collection - Collection to search
 * @param {*} key - Key to look for
 * @returns {boolean} Whether the key is present
 */
function collectionHas(collection, key) {
  if (collection === null || collection === undefined) {
    return false;
  }
  if (typeof collection.has === "function") {
    return Boolean(collection.has(key));
  }
  if (Array.isArray(collection)) {
    return collection.includes(key);
  }
  if (typeof collection === "object" && typeof key === "string") {
    return Object.prototype.hasOwnProperty.call(collection, key);
  }
  return false;
}

/**
 * Critic Judge class.
 *
 * Asks an injected LLM client for a verdict on a proposal and falls back to
 * deterministic, rule-based checks when no client is configured or the LLM
 * call fails.
 */
class CriticJudge {
  /**
   * @param {Object} [options] - Overrides for DEFAULT_CONFIG plus:
   * @param {Function} [options.llmClient] - Function that performs the LLM call
   * @param {boolean} [options.enabled=true] - Set to false to force rule-based mode
   * @param {string} [options.fallbackMode="conservative"] - "conservative" re-runs
   *   the rule-based checks when the LLM fails; any other value allows the change
   *   with low confidence
   */
  constructor(options = {}) {
    this.config = { ...DEFAULT_CONFIG, ...options };
    this.llmClient = options.llmClient || null;
    this.enabled = options.enabled !== false;
    this.fallbackMode = options.fallbackMode || "conservative";
  }

  /**
   * Set the LLM client
   * @param {Function} client - LLM client function
   */
  setClient(client) {
    this.llmClient = client;
  }

  /**
   * Check if critic is available. Requires the critic to be enabled and the
   * client to be callable, so `setClient(undefined)` does not count.
   * @returns {boolean} Is available
   */
  isAvailable() {
    return this.enabled && typeof this.llmClient === "function";
  }

  /**
   * Evaluate a proposal
   * @param {Object} params - Evaluation parameters (proposal, validationResults,
   *   riskScore, simulationResult, realityState)
   * @returns {Promise<CriticVerdict>} Critic verdict
   */
  async evaluate(params = {}) {
    const {
      proposal,
      validationResults = {},
      riskScore = {},
      simulationResult = {},
      realityState = {},
    } = params;

    // Without a usable LLM client, only the deterministic rules can run.
    if (!this.isAvailable()) {
      return this.ruleBasedEvaluation(params);
    }

    try {
      const prompt = buildEvaluationPrompt({
        proposal,
        validationResults,
        riskScore,
        simulationResult,
        realityState,
      });
      const response = await this.callLLM(prompt);
      return this.validateVerdict(parseCriticResponse(response));
    } catch (error) {
      console.warn(`Critic LLM evaluation failed: ${error?.message ?? error}`);
      if (this.fallbackMode === "conservative") {
        return this.ruleBasedEvaluation(params);
      }
      return {
        verdict: "ALLOW",
        confidence: 0.3,
        reasoning: ["Critic unavailable, using permissive fallback"],
        violations: [],
        recommendations: ["Consider manual review"],
      };
    }
  }

  /**
   * Check for vagueness in proposal
   * @param {Object} proposal - Proposal to check
   * @returns {Promise<Object>} Vagueness analysis
   */
  async checkVagueness(proposal) {
    if (!this.isAvailable()) {
      return this.ruleBasedVaguenessCheck(proposal);
    }
    try {
      const response = await this.callLLM(buildVaguenessPrompt(proposal));
      return parseCriticResponse(response);
    } catch (error) {
      // Report the failure the same way evaluate() does instead of hiding it.
      console.warn(`Critic LLM vagueness check failed: ${error?.message ?? error}`);
      return this.ruleBasedVaguenessCheck(proposal);
    }
  }

  /**
   * Verify assumptions against reality
   * @param {Array} assumptions - Assumptions to verify
   * @param {Object} realityState - Repository state
   * @returns {Promise<Object>} Verification results
   */
  async verifyAssumptions(assumptions, realityState) {
    if (!this.isAvailable()) {
      return this.ruleBasedAssumptionVerification(assumptions, realityState);
    }
    try {
      const response = await this.callLLM(buildVerificationPrompt(assumptions, realityState));
      return parseCriticResponse(response);
    } catch (error) {
      console.warn(`Critic LLM assumption verification failed: ${error?.message ?? error}`);
      return this.ruleBasedAssumptionVerification(assumptions, realityState);
    }
  }

  /**
   * Call the LLM. The configured timeout is forwarded to the client and also
   * enforced here, so a client that never settles cannot stall the caller.
   * A timeout that is not a positive finite number disables the deadline.
   * @param {string} prompt - User prompt
   * @returns {Promise<string>} LLM response
   * @throws {Error} When no client is configured or the call times out
   */
  async callLLM(prompt) {
    if (typeof this.llmClient !== "function") {
      throw new Error("LLM client not configured");
    }

    const { model, temperature, maxTokens, timeout } = this.config;
    const request = Promise.resolve(
      this.llmClient({
        systemPrompt: CRITIC_SYSTEM_PROMPT,
        userPrompt: prompt,
        model,
        temperature,
        maxTokens,
        timeout,
      })
    );

    if (!(Number.isFinite(timeout) && timeout > 0)) {
      return request;
    }

    let timer;
    const deadline = new Promise((_, reject) => {
      timer = setTimeout(
        () => reject(new Error(`LLM call timed out after ${timeout}ms`)),
        timeout
      );
    });
    try {
      return await Promise.race([request, deadline]);
    } finally {
      // Always release the timer so it cannot keep the process alive.
      clearTimeout(timer);
    }
  }

  /**
   * Validate and normalize verdict. Anything that is not a well-formed
   * verdict object degrades to BLOCK rather than throwing.
   * @param {Object} verdict - Raw verdict
   * @returns {CriticVerdict} Validated verdict
   */
  validateVerdict(verdict) {
    const raw = verdict !== null && typeof verdict === "object" ? verdict : {};
    const hasNumericConfidence =
      typeof raw.confidence === "number" && !Number.isNaN(raw.confidence);

    return {
      verdict: VALID_VERDICTS.includes(raw.verdict) ? raw.verdict : "BLOCK",
      confidence: hasNumericConfidence ? Math.max(0, Math.min(1, raw.confidence)) : 0.5,
      reasoning: Array.isArray(raw.reasoning) ? raw.reasoning : [],
      violations: Array.isArray(raw.violations) ? raw.violations : [],
      recommendations: Array.isArray(raw.recommendations) ? raw.recommendations : [],
    };
  }

  /**
   * Rule-based evaluation fallback
   * @param {Object} params - Evaluation parameters
   * @returns {CriticVerdict} Verdict
   */
  ruleBasedEvaluation(params) {
    const { proposal, validationResults, riskScore, simulationResult } = params ?? {};

    // Nothing to judge: block instead of throwing from the fallback path.
    if (proposal === null || typeof proposal !== "object") {
      return {
        verdict: "BLOCK",
        confidence: 0.9,
        reasoning: ["No proposal was provided to evaluate"],
        violations: ["Missing proposal"],
        recommendations: ["Address violations before proceeding", "Add missing assumptions"],
      };
    }

    const violations = [];
    const reasoning = [];
    let verdict = "ALLOW";
    let confidence = 0.7;

    // Check simulation result
    if (simulationResult && !simulationResult.passed) {
      violations.push("Simulation failed");
      reasoning.push("Change would break imports or routes");
      verdict = "BLOCK";
      confidence = 0.9;
    }

    // Check risk score
    if (riskScore?.total >= 80) {
      violations.push(`High risk score: ${riskScore.total}`);
      reasoning.push("Risk score exceeds safe threshold");
      if (verdict !== "BLOCK") {
        verdict = "REQUIRE_CONFIRMATION";
      }
      confidence = Math.max(confidence, 0.8);
    }

    // Check unverified assumptions
    const invalid = validationResults?.invalid;
    if (invalid?.length > 0) {
      for (const entry of invalid) {
        const label = entry?.assumption?.key || entry?.assumption?.type || "unknown";
        violations.push(`Unverified assumption: ${label}`);
      }
      reasoning.push(`${invalid.length} assumptions could not be verified`);
      verdict = "BLOCK";
      // Never lower the confidence established by an earlier, stronger signal.
      confidence = Math.max(confidence, 0.85);
    }

    // Check vagueness
    const vaguenessCheck = this.ruleBasedVaguenessCheck(proposal);
    if (vaguenessCheck.specificityScore < 4) {
      violations.push("Proposal is too vague");
      reasoning.push(`Specificity score: ${vaguenessCheck.specificityScore}/10`);
      if (verdict === "ALLOW") {
        verdict = "REQUIRE_CONFIRMATION";
      }
    }

    // Check for sensitive domains without explicit acknowledgment
    const operations = Array.isArray(proposal.operations) ? proposal.operations : [];
    const touchesSensitive = operations.some((op) => {
      const path = String(op?.path ?? "").toLowerCase();
      return SENSITIVE_DOMAINS.some((domain) => path.includes(domain));
    });
    if (touchesSensitive && !proposal.riskAcknowledgment) {
      violations.push("Touches sensitive domains without risk acknowledgment");
      reasoning.push("Changes to auth/payments/database require explicit acknowledgment");
      if (verdict === "ALLOW") {
        verdict = "REQUIRE_CONFIRMATION";
      }
    }

    // No violations = allow
    if (violations.length === 0) {
      reasoning.push("No violations detected");
    }

    return {
      verdict,
      confidence,
      reasoning,
      violations,
      recommendations: violations.length > 0
        ? ["Address violations before proceeding", "Add missing assumptions"]
        : [],
    };
  }

  /**
   * Rule-based vagueness check. Starts at a specificity of 10 and subtracts
   * for a one-word generic intent, a missing or short summary, missing
   * assumptions, many operations with little explanation, and filler words.
   * The score never drops below 1. A nullish proposal is scored like an
   * empty one.
   * @param {Object} proposal - Proposal to check
   * @returns {Object} Vagueness analysis
   */
  ruleBasedVaguenessCheck(proposal) {
    const source = proposal ?? {};
    const intent = typeof source.intent === "string" ? source.intent : "";
    const summary = typeof source.summary === "string" ? source.summary : "";
    const vagueTerms = [];
    let specificityScore = 10;

    // Check intent
    const intentWords = intent.toLowerCase().split("_");
    if (intentWords.length === 1 && VAGUE_INTENTS.includes(intentWords[0])) {
      vagueTerms.push(source.intent);
      specificityScore -= 3;
    }

    // Check summary
    if (!summary) {
      specificityScore -= 2;
    } else if (summary.length < 20) {
      specificityScore -= 1;
    }

    // Check assumptions
    if (!Array.isArray(source.assumptions) || source.assumptions.length === 0) {
      specificityScore -= 2;
    }

    // Check operation count vs explanation
    const opCount = Array.isArray(source.operations) ? source.operations.length : 0;
    if (opCount > 3 && summary.length < 50) {
      specificityScore -= 2;
    }

    // Check for vague words in summary (whole words only)
    for (const { word, pattern } of VAGUE_WORD_PATTERNS) {
      if (pattern.test(summary)) {
        vagueTerms.push(word);
        specificityScore -= 1;
      }
    }

    specificityScore = Math.max(1, specificityScore);

    return {
      specificityScore,
      vagueTerms,
      suggestions: vagueTerms.length > 0
        ? [`Replace vague terms: ${vagueTerms.join(", ")}`, "Add specific details"]
        : [],
    };
  }

  /**
   * Rule-based assumption verification. Supports the assumption types
   * "env", "route", "service" and "file"; any other type is reported as
   * unverified. A non-array `assumptions` value is treated as empty.
   * @param {Array} assumptions - Assumptions to verify
   * @param {Object} realityState - Repository state
   * @returns {Object} Verification results
   */
  ruleBasedAssumptionVerification(assumptions, realityState) {
    const pending = Array.isArray(assumptions) ? assumptions : [];
    const results = [];
    let verifiedCount = 0;

    for (const entry of pending) {
      const assumption = entry ?? {};
      let verified = false;
      let evidence = null;
      let reason = "";

      switch (assumption.type) {
        case "env": {
          if (collectionHas(realityState?.envVars, assumption.key)) {
            verified = true;
            evidence = `Found in env vars: ${assumption.key}`;
          } else {
            reason = `Env var '${assumption.key}' not found in declared variables`;
          }
          break;
        }
        case "route": {
          const routes = Array.isArray(realityState?.routes) ? realityState.routes : [];
          // An assumption without a method matches the path under any method.
          const routeExists = routes.some((route) =>
            route !== null &&
            route !== undefined &&
            route.path === assumption.path &&
            (route.method === assumption.method || !assumption.method)
          );
          if (routeExists) {
            verified = true;
            evidence = `Route ${assumption.method || "GET"} ${assumption.path} is registered`;
          } else {
            reason = `Route ${assumption.path} not found in registered routes`;
          }
          break;
        }
        case "service": {
          const services = Array.isArray(realityState?.services) ? realityState.services : [];
          const serviceExists = services.some((service) =>
            service !== null &&
            service !== undefined &&
            (service.name === assumption.key || service.name === assumption.name)
          );
          if (serviceExists) {
            verified = true;
            evidence = `Service ${assumption.key || assumption.name} is registered`;
          } else {
            reason = `Service ${assumption.key || assumption.name} not found`;
          }
          break;
        }
        case "file": {
          // Normalize Windows separators before the lookup.
          const normalizedPath = typeof assumption.path === "string"
            ? assumption.path.replace(/\\/g, "/")
            : assumption.path;
          if (collectionHas(realityState?.files, normalizedPath)) {
            verified = true;
            evidence = `File ${assumption.path} exists`;
          } else {
            reason = `File ${assumption.path} not found`;
          }
          break;
        }
        default:
          reason = `Unknown assumption type: ${assumption.type}`;
      }

      if (verified) {
        verifiedCount++;
      }
      results.push({
        assumption: assumption.key || assumption.path || assumption.type,
        verified,
        evidence,
        reason,
      });
    }

    return {
      results,
      // With nothing to verify, nothing is unverified.
      overallVerificationRate: pending.length > 0 ? verifiedCount / pending.length : 1,
    };
  }
}
/**
 * Factory wrapper around the CriticJudge constructor.
 * @param {Object} options - Configuration options forwarded unchanged
 * @returns {CriticJudge} Newly constructed judge
 */
function createJudge(options = {}) {
  const judge = new CriticJudge(options);
  return judge;
}
/**
 * Shared judge created with no options at module load time.
 * It is a single instance, so anything set on it (for example through
 * setClient) is visible to every importer of this module.
 */
const defaultJudge = createJudge();

// Public surface of the module.
module.exports = { CriticJudge, createJudge, defaultJudge };