npm - @martinloop/mcp - Versions diffs - 0.3.0 → 0.3.2 - Mend

@martinloop/mcp 0.3.0 → 0.3.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (48)

package/README.md +5 -4
package/dist/package-version.d.ts +1 -1
package/dist/package-version.js +1 -1
package/dist/server-validation.js +2 -2
package/dist/server.js +72 -10
package/dist/tools/doctor.d.ts +27 -0
package/dist/tools/doctor.js +39 -11
package/dist/tools/get-run.d.ts +2 -1
package/dist/tools/get-run.js +1 -0
package/dist/tools/get-verification-results.d.ts +2 -1
package/dist/tools/get-verification-results.js +1 -0
package/dist/tools/plan.js +4 -2
package/dist/tools/preflight.d.ts +27 -0
package/dist/tools/preflight.js +44 -20
package/dist/tools/run-dossier.d.ts +2 -1
package/dist/tools/run-dossier.js +1 -0
package/dist/tools/run-loop.d.ts +5 -1
package/dist/tools/run-loop.js +20 -8
package/dist/tools/run-store.js +67 -15
package/dist/tools/tool-support.d.ts +2 -0
package/dist/tools/tool-support.js +49 -13
package/dist/tools/workflow-governance.d.ts +19 -3
package/dist/tools/workflow-governance.js +107 -55
package/dist/vendor/adapters/claude-cli.d.ts +20 -3
package/dist/vendor/adapters/claude-cli.js +193 -33
package/dist/vendor/adapters/cli-bridge.d.ts +45 -0
package/dist/vendor/adapters/cli-bridge.js +107 -39
package/dist/vendor/adapters/codex-launcher.d.ts +32 -0
package/dist/vendor/adapters/codex-launcher.js +409 -118
package/dist/vendor/adapters/openai-compatible.js +8 -2
package/dist/vendor/adapters/runtime-support.js +1 -0
package/dist/vendor/adapters/stub-direct-provider.js +3 -0
package/dist/vendor/adapters/verifier-only.d.ts +2 -0
package/dist/vendor/adapters/verifier-only.js +9 -3
package/dist/vendor/contracts/index.d.ts +2 -1
package/dist/vendor/contracts/index.js +14 -0
package/dist/vendor/core/context-integrity.js +28 -3
package/dist/vendor/core/grounding.d.ts +1 -0
package/dist/vendor/core/grounding.js +6 -2
package/dist/vendor/core/index.d.ts +1 -0
package/dist/vendor/core/index.js +25 -6
package/dist/vendor/core/leash.js +90 -8
package/dist/vendor/core/persistence/integrity.d.ts +1 -1
package/dist/vendor/core/persistence/integrity.js +15 -6
package/dist/workflow-state.d.ts +9 -0
package/dist/workflow-state.js +44 -3
package/package.json +2 -2
package/server.json +2 -2

package/dist/tools/run-loop.js CHANGED Viewed

@@ -1,9 +1,17 @@
 import { createClaudeCliAdapter, createCodexCliAdapter, createGeminiCliAdapter, probeCodexLaunch, resolveCliCommandAvailability, createVerifierOnlyAdapter } from "../vendor/adapters/index.js";
 import { createFileRunStore, evaluateCostGovernor, resolveRunsRoot, runMartin } from "../vendor/core/index.js";
-import { DEFAULT_BUDGET } from "../vendor/contracts/index.js";
 import { normalizeSafePathPatterns, resolveSafeRepoRoot } from "../server-validation.js";
 import { MartinToolError } from "./tool-errors.js";
 import { buildArtifactSummary, buildVerificationSummary, buildLoopPreview, buildRunRecordPaths, getEngineAvailability, resolveExecutionMode } from "./tool-support.js";
+import { normalizeLoopBudget } from "./workflow-governance.js";
+let proofModeVerifierSpawnImpl;
+let runStoreOverrideForTests;
+export function __setProofModeVerifierSpawnImplForTests(spawnImpl) {
+    proofModeVerifierSpawnImpl = spawnImpl;
+}
+export function __setRunStoreOverrideForTests(store) {
+    runStoreOverrideForTests = store;
+}
 export async function runLoopTool(input) {
     const workingDirectory = resolveSafeRepoRoot(input.workingDirectory);
     const engine = input.engine ?? "claude";
@@ -19,6 +27,7 @@ export async function runLoopTool(input) {
         repoRoot: workingDirectory,
         runsRoot
     };
+    let codexCommandOverride;
     if (executionMode.liveMode) {
         if (engine === "codex") {
             const engineAvailability = resolveCliCommandAvailability("codex");
@@ -40,6 +49,7 @@ export async function runLoopTool(input) {
                     retryable: false
                 });
             }
+            codexCommandOverride = codexProbe.command;
         }
         else {
             const engineAvailability = getEngineAvailability(engine);
@@ -55,10 +65,15 @@ export async function runLoopTool(input) {
     const adapter = !executionMode.liveMode
         ? createVerifierOnlyAdapter({
             workingDirectory,
-            label: "Proof mode adapter (MARTIN_LIVE=false)"
+            label: "Proof mode adapter (MARTIN_LIVE=false)",
+            ...(proofModeVerifierSpawnImpl ? { spawnImpl: proofModeVerifierSpawnImpl } : {})
         })
         : engine === "codex"
-            ? createCodexCliAdapter({ workingDirectory, ...(model ? { model } : {}) })
+            ? createCodexCliAdapter({
+                workingDirectory,
+                ...(model ? { model } : {}),
+                ...(codexCommandOverride ? { command: codexCommandOverride } : {})
+            })
             : engine === "gemini"
                 ? createGeminiCliAdapter({ workingDirectory, ...(model ? { model } : {}) })
                 : createClaudeCliAdapter({ workingDirectory, ...(model ? { model } : {}) });
@@ -72,14 +87,11 @@ export async function runLoopTool(input) {
     if (input.maxTokens !== undefined) {
         partialBudget.maxTokens = input.maxTokens;
     }
-    const budget = {
-        ...DEFAULT_BUDGET,
-        ...partialBudget
-    };
+    const budget = normalizeLoopBudget(partialBudget);
     const result = await runMartin({
         workspaceId: input.workspaceId ?? "ws_mcp",
         projectId: input.projectId ?? "proj_mcp",
-        store: createFileRunStore({ runsRoot }),
+        store: runStoreOverrideForTests ?? createFileRunStore({ runsRoot }),
         receiptScope,
         task: {
             title: input.objective.slice(0, 100),

package/dist/tools/run-store.js CHANGED Viewed

@@ -1,8 +1,60 @@
 import { readFile, readdir, stat } from "node:fs/promises";
 import path from "node:path";
-import { readLatestLoopRecordFromFile, readLoopRecordsFromFile, resolveRunsRoot } from "../vendor/core/index.js";
+import { readLatestLoopRecordFromFile, readLoopRecordsFromFile, resolveRunsRoot, verifyReceiptIntegrityFromFiles } from "../vendor/core/index.js";
 import { resolveSafeLoopRecordPath, resolveSafeRunsJsonPath, resolveSafeRunsPath, resolveSafeRunsRootPath } from "../server-validation.js";
 import { attemptNotFoundError, invalidSelectorError, noLoopRecordsError, storeUnreadableError } from "./tool-errors.js";
+async function attachReceiptIntegrity(detail) {
+    const ledgerPath = detail.canonicalRunDirectory
+        ? await resolveReceiptEvidencePath(detail.canonicalRunDirectory)
+        : detail.ledgerPath;
+    const integrity = detail.canonicalLoopRecordPath && detail.canonicalRunDirectory && ledgerPath
+        ? await verifyReceiptIntegrityFromFiles({
+            runId: detail.loop.loopId,
+            runsRoot: detail.runsRoot,
+            loopRecordPath: detail.canonicalLoopRecordPath,
+            ledgerPath
+        }).catch(() => ({
+            state: "unsigned",
+            reason: "Receipt integrity verification could not be completed."
+        }))
+        : ({
+            state: "unsigned",
+            reason: "Receipt integrity is only available for canonical run directories."
+        });
+    const receiptScope = resolveReceiptScope(detail.loop, detail.runsRoot);
+    return {
+        ...detail,
+        ...(ledgerPath ? { ledgerPath } : {}),
+        loop: {
+            ...detail.loop,
+            receiptIntegrity: integrity,
+            ...(receiptScope ? { receiptScope } : {})
+        }
+    };
+}
+function resolveReceiptScope(loop, runsRoot) {
+    if (loop.receiptScope) {
+        return loop.receiptScope;
+    }
+    if (!loop.task?.repoRoot && !runsRoot) {
+        return undefined;
+    }
+    return {
+        ...(loop.task?.repoRoot ? { repoRoot: loop.task.repoRoot } : {}),
+        ...(loop.task?.repoRoot ? { workingDirectory: loop.task.repoRoot } : {}),
+        ...(runsRoot ? { runsRoot } : {})
+    };
+}
+async function resolveReceiptEvidencePath(runDirectory) {
+    for (const candidate of ["ledger.jsonl", "events.jsonl"]) {
+        const candidatePath = path.join(runDirectory, candidate);
+        const candidateStats = await safeStat(candidatePath);
+        if (candidateStats?.isFile()) {
+            return candidatePath;
+        }
+    }
+    return undefined;
+}
 export async function loadLoopRecordsForInspect(input) {
     const runsRoot = resolveSafeRunsRootPath(input.runsDir, resolveRunsRoot(process.env));
     if (!input.file) {
@@ -118,14 +170,14 @@ export async function loadDetailedLoopRecord(input) {
                 const canonicalStats = await safeStat(canonicalLoopRecordPath);
                 if (canonicalStats?.isFile()) {
                     const loop = await readCanonicalLoopRecord(canonicalLoopRecordPath);
-                    return buildDetailedLoopSource({
+                    return await attachReceiptIntegrity(buildDetailedLoopSource({
                         source: canonicalLoopRecordPath,
                         sourceKind: "file",
                         runsRoot,
                         loop,
                         canonicalLoopRecordPath,
                         canonicalRunDirectory: path.dirname(canonicalLoopRecordPath)
-                    });
+                    }));
                 }
             }
             const inspected = await readAllLoopRecordsSafely(targetPath);
@@ -139,10 +191,10 @@ export async function loadDetailedLoopRecord(input) {
                 runsRoot,
                 loop
             });
-            return {
+            return await attachReceiptIntegrity({
                 ...detail,
                 warnings: [...detail.warnings, ...inspected.warnings]
-            };
+            });
         }
         const latest = await readLatestLoopRecordFromFile(targetPath);
         if (!latest) {
@@ -150,35 +202,35 @@ export async function loadDetailedLoopRecord(input) {
         }
         if (path.basename(targetPath) === "loop-record.json") {
             const loop = await readCanonicalLoopRecord(targetPath);
-            return buildDetailedLoopSource({
+            return await attachReceiptIntegrity(buildDetailedLoopSource({
                 source: targetPath,
                 sourceKind: "file",
                 runsRoot,
                 loop,
                 canonicalLoopRecordPath: targetPath,
                 canonicalRunDirectory: path.dirname(targetPath)
-            });
+            }));
         }
-        return await buildDetailedLoopSourceFromDiscoveredLoop({
+        return await attachReceiptIntegrity(await buildDetailedLoopSourceFromDiscoveredLoop({
             source: targetPath,
             sourceKind: "file",
             runsRoot,
             loop: latest
-        });
+        }));
     }
     if (input.loopId) {
         const canonicalLoopRecordPath = resolvePotentialLoopRecordPath(input.loopId, runsRoot);
         const canonicalStats = await safeStat(canonicalLoopRecordPath);
         if (canonicalStats?.isFile()) {
             const loop = await readCanonicalLoopRecord(canonicalLoopRecordPath);
-            return buildDetailedLoopSource({
+            return await attachReceiptIntegrity(buildDetailedLoopSource({
                 source: canonicalLoopRecordPath,
                 sourceKind: "loop_id",
                 runsRoot,
                 loop,
                 canonicalLoopRecordPath,
                 canonicalRunDirectory: path.dirname(canonicalLoopRecordPath)
-            });
+            }));
         }
         const inspected = await readAllLoopRecordsSafely(runsRoot);
         const loop = inspected.loops.find((candidate) => candidate.loopId === input.loopId);
@@ -191,10 +243,10 @@ export async function loadDetailedLoopRecord(input) {
             runsRoot,
             loop
         });
-        return {
+        return await attachReceiptIntegrity({
             ...detail,
             warnings: [...detail.warnings, ...inspected.warnings]
-        };
+        });
     }
     const inspected = await readAllLoopRecordsSafely(runsRoot);
     const loop = inspected.loops[0];
@@ -207,10 +259,10 @@ export async function loadDetailedLoopRecord(input) {
         runsRoot,
         loop
     });
-    return {
+    return await attachReceiptIntegrity({
         ...detail,
         warnings: [...detail.warnings, ...inspected.warnings]
-    };
+    });
 }
 export async function loadAttemptFromLoop(input) {
     const detail = await loadDetailedLoopRecord(input);

package/dist/tools/tool-support.d.ts CHANGED Viewed

@@ -89,6 +89,7 @@ export interface CliAvailability {
     locator: string;
     detail: string;
     resolvedPath?: string;
+    candidatePaths?: string[];
 }
 export interface ExecutionMode {
     liveMode: boolean;
@@ -110,6 +111,7 @@ export interface CanonicalRunPaths {
 export declare function resolveExecutionMode(): ExecutionMode;
 export declare function detectCliAvailability(command: string): CliAvailability;
 export declare function getEngineAvailability(engine: MartinEngine): CliAvailability;
+export declare function createSkippedCliAvailability(command: string, detail?: string): CliAvailability;
 export declare function formatUsd(value: number): string;
 export declare function buildLoopPreview(loop: InspectableLoopRecord): LoopPreview;
 export declare function buildAttemptSummary(attempt: InspectableLoopAttempt, artifacts?: AttemptArtifactFiles): AttemptSummary;

package/dist/tools/tool-support.js CHANGED Viewed

@@ -1,4 +1,4 @@
-import { spawnSync } from "node:child_process";
+import { accessSync, constants } from "node:fs";
 import { readdir, stat } from "node:fs/promises";
 import { join } from "node:path";
 import { evaluateCostGovernor, resolveRunsRoot } from "../vendor/core/index.js";
@@ -23,18 +23,9 @@ export function detectCliAvailability(command) {
     if (cached && cached.expiresAt > Date.now()) {
         return cached.value;
     }
-    const locator = process.platform === "win32" ? "where.exe" : "which";
-    const result = spawnSync(locator, [command], {
-        encoding: "utf8",
-        stdio: ["ignore", "pipe", "pipe"]
-    });
-    const resolvedPath = result.status === 0
-        ? (result.stdout ?? "")
-            .split(/\r?\n/u)
-            .map((line) => line.trim())
-            .find(Boolean)
-        : undefined;
-    const value = result.status === 0
+    const locator = process.platform === "win32" ? "path-scan(win32)" : "path-scan(posix)";
+    const resolvedPath = findCommandOnPath(command);
+    const value = resolvedPath
         ? {
             command,
             available: true,
@@ -54,9 +45,54 @@ export function detectCliAvailability(command) {
     });
     return value;
 }
+function findCommandOnPath(command) {
+    const pathKey = Object.keys(process.env).find((key) => key.toLowerCase() === "path");
+    const rawPath = pathKey ? process.env[pathKey] : undefined;
+    if (!rawPath) {
+        return undefined;
+    }
+    const pathEntries = rawPath
+        .split(process.platform === "win32" ? ";" : ":")
+        .map((entry) => entry.trim())
+        .filter(Boolean);
+    const hasExtension = /\.[A-Za-z0-9]+$/u.test(command);
+    const candidateNames = process.platform === "win32" && !hasExtension
+        ? (process.env.PATHEXT ?? ".COM;.EXE;.BAT;.CMD")
+            .split(";")
+            .map((extension) => extension.trim())
+            .filter(Boolean)
+            .map((extension) => `${command}${extension.toLowerCase()}`)
+        : [command];
+    for (const directory of pathEntries) {
+        for (const candidateName of candidateNames) {
+            const candidatePath = join(directory, candidateName);
+            if (isExecutablePath(candidatePath)) {
+                return candidatePath;
+            }
+        }
+    }
+    return undefined;
+}
+function isExecutablePath(candidatePath) {
+    try {
+        accessSync(candidatePath, process.platform === "win32" ? constants.F_OK : constants.X_OK);
+        return true;
+    }
+    catch {
+        return false;
+    }
+}
 export function getEngineAvailability(engine) {
     return detectCliAvailability(engine);
 }
+export function createSkippedCliAvailability(command, detail = "Proof mode skipped live CLI availability detection.") {
+    return {
+        command,
+        available: false,
+        locator: "skipped",
+        detail
+    };
+}
 export function formatUsd(value) {
     return `$${value.toFixed(2)}`;
 }

package/dist/tools/workflow-governance.d.ts CHANGED Viewed

@@ -1,3 +1,4 @@
+import { type LoopBudget } from "../vendor/contracts/index.js";
 import { type RunStoreInspection } from "./tool-support.js";
 export type MartinPolicyPack = "solo-founder" | "startup-team" | "enterprise-strict" | "oss-maintainer" | "security-sensitive";
 export interface RepoGitState {
@@ -23,6 +24,7 @@ export interface RepoSignals {
     packageScripts: Record<string, string>;
     git: RepoGitState;
     sensitivePaths: string[];
+    hostAvailabilityChecked: boolean;
     availableHosts: Record<"claude" | "codex" | "cursor" | "gemini", {
         available: boolean;
         detail: string;
@@ -110,11 +112,25 @@ interface ContractOverrides {
     maxFilesChanged?: number;
     maxCommands?: number;
 }
-export declare function inspectRepoSignals(workingDirectory: string): RepoSignals;
+interface LoopBudgetOverrides {
+    maxUsd?: number;
+    softLimitUsd?: number;
+    maxIterations?: number;
+    maxTokens?: number;
+}
+export declare function inspectRepoSignals(workingDirectory: string, options?: {
+    includeHostAvailability?: boolean;
+}): RepoSignals;
 export declare function buildReadinessReport(signals: RepoSignals, runStore: RunStoreInspection): MartinReadinessReport;
 export declare function buildPolicyPackDefinition(policyPack: MartinPolicyPack | undefined, signals: RepoSignals): MartinPolicyPackDefinition;
-export declare function buildPlanProposal(workingDirectory: string, overrides: ContractOverrides): MartinPlanProposal;
-export declare function buildRunContract(workingDirectory: string, overrides: ContractOverrides): MartinRunContract;
+export declare function buildPlanProposal(workingDirectory: string, overrides: ContractOverrides, options?: {
+    signals?: RepoSignals;
+}): MartinPlanProposal;
+export declare function buildRunContract(workingDirectory: string, overrides: ContractOverrides, options?: {
+    signals?: RepoSignals;
+    plan?: MartinPlanProposal;
+}): MartinRunContract;
+export declare function normalizeLoopBudget(overrides?: LoopBudgetOverrides): LoopBudget;
 export declare function assessRunRisk(input: {
     objective: string;
     context?: string;

package/dist/tools/workflow-governance.js CHANGED Viewed

@@ -2,13 +2,17 @@ import { existsSync, readFileSync } from "node:fs";
 import path from "node:path";
 import { spawnSync } from "node:child_process";
 import { DEFAULT_BUDGET } from "../vendor/contracts/index.js";
-import { detectCliAvailability } from "./tool-support.js";
+import { createSkippedCliAvailability, detectCliAvailability } from "./tool-support.js";
 const HOST_COMMANDS = {
     claude: "claude",
     codex: "codex",
     cursor: "cursor",
     gemini: "gemini"
 };
+const REPO_SIGNALS_CACHE_TTL_MS = 5_000;
+const repoSignalsCache = new Map();
+const GIT_STATE_CACHE_TTL_MS = 60_000;
+const repoGitStateCache = new Map();
 const POLICY_PACKS = {
     "solo-founder": {
         name: "solo-founder",
@@ -110,13 +114,19 @@ const POLICY_PACKS = {
         requireApprovalAtOrAbove: "medium"
     }
 };
-export function inspectRepoSignals(workingDirectory) {
+export function inspectRepoSignals(workingDirectory, options = {}) {
+    const includeHostAvailability = options.includeHostAvailability ?? true;
+    const cacheKey = `${workingDirectory}::hosts=${includeHostAvailability ? "live" : "skipped"}`;
+    const cached = repoSignalsCache.get(cacheKey);
+    if (cached && cached.expiresAt > Date.now()) {
+        return cached.value;
+    }
     const packageScripts = readPackageScripts(workingDirectory);
     const packageManager = detectPackageManager(workingDirectory);
     const frameworks = detectFrameworks(workingDirectory, packageScripts);
     const languages = detectLanguages(workingDirectory, frameworks);
     const verifiers = detectVerifierCommands(packageScripts, packageManager);
-    return {
+    const signals = {
         workingDirectory,
         packageManager,
         languages,
@@ -125,13 +135,27 @@ export function inspectRepoSignals(workingDirectory) {
         packageScripts,
         git: detectGitState(workingDirectory),
         sensitivePaths: detectSensitivePaths(workingDirectory),
+        hostAvailabilityChecked: includeHostAvailability,
         availableHosts: {
-            claude: detectCliAvailability(HOST_COMMANDS.claude),
-            codex: detectCliAvailability(HOST_COMMANDS.codex),
-            cursor: detectCliAvailability(HOST_COMMANDS.cursor),
-            gemini: detectCliAvailability(HOST_COMMANDS.gemini)
+            claude: includeHostAvailability
+                ? detectCliAvailability(HOST_COMMANDS.claude)
+                : createSkippedCliAvailability(HOST_COMMANDS.claude),
+            codex: includeHostAvailability
+                ? detectCliAvailability(HOST_COMMANDS.codex)
+                : createSkippedCliAvailability(HOST_COMMANDS.codex),
+            cursor: includeHostAvailability
+                ? detectCliAvailability(HOST_COMMANDS.cursor)
+                : createSkippedCliAvailability(HOST_COMMANDS.cursor),
+            gemini: includeHostAvailability
+                ? detectCliAvailability(HOST_COMMANDS.gemini)
+                : createSkippedCliAvailability(HOST_COMMANDS.gemini)
         }
     };
+    repoSignalsCache.set(cacheKey, {
+        expiresAt: Date.now() + REPO_SIGNALS_CACHE_TTL_MS,
+        value: signals
+    });
+    return signals;
 }
 export function buildReadinessReport(signals, runStore) {
     const missingSafeguards = [];
@@ -155,7 +179,9 @@ export function buildReadinessReport(signals, runStore) {
     if (signals.frameworks.length === 0) {
         score -= 8;
     }
-    if (!signals.availableHosts.claude.available && !signals.availableHosts.codex.available) {
+    if (signals.hostAvailabilityChecked &&
+        !signals.availableHosts.claude.available &&
+        !signals.availableHosts.codex.available) {
         score -= 18;
     }
     score = Math.max(0, Math.min(100, score));
@@ -189,8 +215,8 @@ export function buildPolicyPackDefinition(policyPack, signals) {
             : fallbackVerifierPlan(signals.packageManager)
     };
 }
-export function buildPlanProposal(workingDirectory, overrides) {
-    const signals = inspectRepoSignals(workingDirectory);
+export function buildPlanProposal(workingDirectory, overrides, options = {}) {
+    const signals = options.signals ?? inspectRepoSignals(workingDirectory);
     const policy = buildPolicyPackDefinition(overrides.policyPack, signals);
     const scope = inferScopeFromObjective(overrides.objective, policy, overrides);
     const estimatedBudget = buildBudget(overrides, signals);
@@ -223,8 +249,8 @@ export function buildPlanProposal(workingDirectory, overrides) {
         ]
     };
 }
-export function buildRunContract(workingDirectory, overrides) {
-    const plan = buildPlanProposal(workingDirectory, overrides);
+export function buildRunContract(workingDirectory, overrides, options = {}) {
+    const plan = options.plan ?? buildPlanProposal(workingDirectory, overrides, options);
     return {
         objective: overrides.objective,
         ...(overrides.context ? { context: overrides.context } : {}),
@@ -238,6 +264,16 @@ export function buildRunContract(workingDirectory, overrides) {
             shouldRequireApproval(plan.policyPack.requireApprovalAtOrAbove, plan.risk.level)
     };
 }
+export function normalizeLoopBudget(overrides = {}) {
+    const maxUsd = overrides.maxUsd ?? DEFAULT_BUDGET.maxUsd;
+    const softLimitUsd = Math.min(overrides.softLimitUsd ?? DEFAULT_BUDGET.softLimitUsd, maxUsd);
+    return {
+        maxUsd,
+        softLimitUsd,
+        maxIterations: overrides.maxIterations ?? DEFAULT_BUDGET.maxIterations,
+        maxTokens: overrides.maxTokens ?? DEFAULT_BUDGET.maxTokens
+    };
+}
 export function assessRunRisk(input) {
     const reasons = [];
     let score = 12;
@@ -406,17 +442,10 @@ function detectVerifierCommands(scripts, packageManager) {
     return { test, lint, build, defaultPlan };
 }
 function detectGitState(workingDirectory) {
-    const availability = spawnSync("git", ["--version"], {
-        cwd: workingDirectory,
-        encoding: "utf8",
-        stdio: ["ignore", "pipe", "pipe"]
-    });
-    if (availability.status !== 0) {
-        return {
-            available: false,
-            isRepo: false,
-            clean: false
-        };
+    const cacheKey = workingDirectory;
+    const cached = repoGitStateCache.get(cacheKey);
+    if (cached && cached.expiresAt > Date.now()) {
+        return cached.value;
     }
     const isRepo = spawnSync("git", ["rev-parse", "--is-inside-work-tree"], {
         cwd: workingDirectory,
@@ -424,18 +453,29 @@ function detectGitState(workingDirectory) {
         stdio: ["ignore", "pipe", "pipe"]
     });
     if (isRepo.status !== 0 || !/true/u.test(isRepo.stdout ?? "")) {
-        return {
-            available: true,
-            isRepo: false,
-            clean: false
-        };
+        const availability = spawnSync("git", ["--version"], {
+            cwd: workingDirectory,
+            encoding: "utf8",
+            stdio: ["ignore", "pipe", "pipe"]
+        });
+        const value = availability.status !== 0
+            ? {
+                available: false,
+                isRepo: false,
+                clean: false
+            }
+            : {
+                available: true,
+                isRepo: false,
+                clean: false
+            };
+        repoGitStateCache.set(cacheKey, {
+            expiresAt: Date.now() + GIT_STATE_CACHE_TTL_MS,
+            value
+        });
+        return value;
     }
-    const branch = spawnSync("git", ["branch", "--show-current"], {
-        cwd: workingDirectory,
-        encoding: "utf8",
-        stdio: ["ignore", "pipe", "pipe"]
-    }).stdout.trim();
-    const status = spawnSync("git", ["status", "--porcelain", "--branch"], {
+    const status = spawnSync("git", ["status", "--porcelain=v2", "--branch", "--untracked-files=normal", "--ignored=no", "--", "."], {
         cwd: workingDirectory,
         encoding: "utf8",
         stdio: ["ignore", "pipe", "pipe"]
@@ -444,20 +484,42 @@ function detectGitState(workingDirectory) {
         .split(/\r?\n/u)
         .map((line) => line.trim())
         .filter(Boolean);
-    const dirty = statusLines.some((line) => !line.startsWith("##"));
-    const header = statusLines.find((line) => line.startsWith("##"));
-    const upstream = header?.match(/\.\.\.([^\s[]+)/u)?.[1];
-    const ahead = parseCount(header, /ahead (\d+)/u);
-    const behind = parseCount(header, /behind (\d+)/u);
-    return {
+    const dirty = statusLines.some((line) => !line.startsWith("#"));
+    const branch = statusLines
+        .find((line) => line.startsWith("# branch.head "))
+        ?.replace("# branch.head ", "")
+        .trim();
+    const upstream = statusLines
+        .find((line) => line.startsWith("# branch.upstream "))
+        ?.replace("# branch.upstream ", "")
+        .trim();
+    const aheadBehind = statusLines
+        .find((line) => line.startsWith("# branch.ab "))
+        ?.replace("# branch.ab ", "")
+        .trim()
+        .split(/\s+/u);
+    const aheadToken = aheadBehind?.find((token) => token.startsWith("+"));
+    const behindToken = aheadBehind?.find((token) => token.startsWith("-"));
+    const ahead = aheadToken && aheadToken.length > 1
+        ? Number.parseInt(aheadToken.slice(1), 10)
+        : undefined;
+    const behind = behindToken && behindToken.length > 1
+        ? Number.parseInt(behindToken.slice(1), 10)
+        : undefined;
+    const value = {
         available: true,
         isRepo: true,
         clean: !dirty,
-        ...(branch ? { branch } : {}),
+        ...(branch && branch !== "(detached)" ? { branch } : {}),
         ...(upstream ? { upstream } : {}),
-        ...(ahead !== undefined ? { ahead } : {}),
-        ...(behind !== undefined ? { behind } : {})
+        ...(Number.isFinite(ahead) ? { ahead } : {}),
+        ...(Number.isFinite(behind) ? { behind } : {})
     };
+    repoGitStateCache.set(cacheKey, {
+        expiresAt: Date.now() + GIT_STATE_CACHE_TTL_MS,
+        value
+    });
+    return value;
 }
 function detectSensitivePaths(workingDirectory) {
     const candidates = [
@@ -520,11 +582,9 @@ function inferScopeFromObjective(objective, policy, overrides) {
 }
 function buildBudget(overrides, signals) {
     const defaultCommands = signals.verifiers.defaultPlan.length > 0 ? 12 : 8;
+    const normalizedBudget = normalizeLoopBudget(overrides);
     return {
-        maxUsd: overrides.maxUsd ?? DEFAULT_BUDGET.maxUsd,
-        softLimitUsd: Math.min(overrides.maxUsd ?? DEFAULT_BUDGET.maxUsd, DEFAULT_BUDGET.softLimitUsd),
-        maxIterations: overrides.maxIterations ?? DEFAULT_BUDGET.maxIterations,
-        maxTokens: overrides.maxTokens ?? DEFAULT_BUDGET.maxTokens,
+        ...normalizedBudget,
         maxMinutes: overrides.maxMinutes ?? 20,
         maxFilesChanged: overrides.maxFilesChanged ?? 8,
         maxCommands: overrides.maxCommands ?? defaultCommands
@@ -571,11 +631,3 @@ function shouldRequireApproval(threshold, level) {
     const ordering = ["low", "medium", "high"];
     return ordering.indexOf(level) >= ordering.indexOf(threshold);
 }
-function parseCount(value, pattern) {
-    const match = value?.match(pattern)?.[1];
-    if (!match) {
-        return undefined;
-    }
-    const parsed = Number.parseInt(match, 10);
-    return Number.isFinite(parsed) ? parsed : undefined;
-}

package/dist/vendor/adapters/claude-cli.d.ts CHANGED Viewed

@@ -45,6 +45,15 @@ export interface AgentCliAdapterOptions {
      * Defaults to true for Claude.
      */
     supportsJsonOutput?: boolean;
+    /**
+     * Set when `argsBuilder` requests `--output-format stream-json` (newline-
+     * delimited JSON events) rather than single-blob `json`. Enables (a)
+     * incremental result parsing that scans for the final `result` event, and
+     * (b) a live cumulative-cost circuit breaker that terminates the subprocess
+     * the moment projected spend crosses the remaining per-attempt budget,
+     * rather than only learning about an overspend after the process exits.
+     */
+    streamingUsageCap?: boolean;
     /** Test-only override for subprocess spawning. */
     spawnImpl?: SpawnLike;
 }
@@ -60,6 +69,8 @@ export interface ClaudeCliAdapterOptions {
     spawnImpl?: SpawnLike;
 }
 export interface CodexCliAdapterOptions {
+    /** Override the executable or absolute command path used to launch Codex. */
+    command?: string;
     workingDirectory?: string;
     timeoutMs?: number;
     verifyTimeoutMs?: number;
@@ -97,10 +108,16 @@ export interface GeminiCliAdapterOptions {
 }
 export declare function createAgentCliAdapter(options: AgentCliAdapterOptions): MartinAdapter;
 /**
- * Spawns `claude --output-format json --print "<prompt>" --dangerously-skip-permissions [extraArgs]`.
+ * Spawns `claude --output-format stream-json --verbose --print "<prompt>" [extraArgs]`.
  *
- * The --output-format json flag causes Claude CLI to return structured JSON
- * including real token usage counts, enabling accurate cost tracking.
+ * `stream-json` emits one JSON event per line — including per-turn usage on
+ * each `assistant` message and a final `result` event carrying the same
+ * `result`/`usage`/`total_cost_usd` fields as single-blob `json` output — so
+ * MartinLoop can both (a) recover real token usage/cost as before, and
+ * (b) watch cumulative spend live and self-terminate the subprocess the
+ * moment it crosses the remaining per-attempt budget (see
+ * `streamingUsageCap` / `createStreamingUsageInspector`), instead of only
+ * discovering an overspend after the whole process has already exited.
  *
  * Requires the Claude Code CLI to be installed and authenticated:
  *   https://docs.anthropic.com/claude-code