npm - claude-overnight - Versions diffs - 1.50.5 → 1.51.1 - Mend

claude-overnight 1.50.5 → 1.51.1

This diff shows the changes between two publicly available versions of the package, as released to one of the supported registries. It is provided for informational purposes only and reflects the package contents exactly as they appear in the public registry.

Files changed (12)

package/dist/core/_version.d.ts +1 -1
package/dist/core/_version.js +1 -1
package/dist/planner/query.js +20 -10
package/dist/planner/steering.js +5 -1
package/dist/providers/index.js +0 -3
package/dist/run/run.js +11 -3
package/dist/run/summary.d.ts +2 -0
package/dist/run/summary.js +52 -28
package/dist/run/wave-loop.js +2 -1
package/dist/skills/librarian.js +28 -29
package/package.json +1 -1
package/plugins/claude-overnight/.claude-plugin/plugin.json +1 -1

package/dist/core/_version.d.ts CHANGED Viewed

	@@ -1 +1 @@
1	- export declare const VERSION = "1.50.5";
1	+ export declare const VERSION = "1.51.1";

package/dist/core/_version.js CHANGED Viewed

@@ -1,2 +1,2 @@
 // Auto-generated by build — do not edit manually.
-export const VERSION = "1.50.5";
+export const VERSION = "1.51.1";

package/dist/planner/query.js CHANGED Viewed

@@ -21,10 +21,16 @@ let _envResolver;
 export function setPlannerEnvResolver(fn) {
     _envResolver = fn;
 }
-// ── Cursor proxy: direct HTTP bypass ──
-// SDK spawns 4+ subprocesses (~15s each) for the proxy; one direct POST is 4-10x faster.
-function isCursorProxyEnv(env) {
-    return !!env?.CURSOR_API_KEY && !env?.ANTHROPIC_API_KEY;
+// ── Direct HTTP bypass for non-Anthropic endpoints ──
+// The Claude Code CLI subprocess spawned by @anthropic-ai/claude-agent-sdk validates
+// model names against its built-in Anthropic list and rejects custom ids (qwen3.6-plus,
+// composer-2, etc.) pre-flight, even when ANTHROPIC_BASE_URL points at an Anthropic-
+// compatible proxy. Bypass the SDK with a direct POST for any non-anthropic.com base.
+function shouldUseDirectFetch(env) {
+    const base = env?.ANTHROPIC_BASE_URL;
+    if (!base)
+        return false;
+    return !/^https?:\/\/(api\.)?anthropic\.com/i.test(base);
 }
 async function runViaDirectFetch(prompt, opts, onLog) {
     const env = opts.env ?? _envResolver?.(opts.model);
@@ -39,30 +45,34 @@ async function runViaDirectFetch(prompt, opts, onLog) {
         await apiEndpointLimiter.waitIfNeeded();
         const waited = await rl.waitIfNeeded();
         if (waited > 0)
-            onLog(`Cursor proxy rate gate — waited ${Math.round(waited / 1000)}s`, "event");
+            onLog(`Planner proxy rate gate — waited ${Math.round(waited / 1000)}s`, "event");
         const res = await fetch(`${baseUrl}/v1/messages`, {
             method: "POST",
-            headers: { "Content-Type": "application/json", "Authorization": `Bearer ${authToken}` },
+            headers: {
+                "Content-Type": "application/json",
+                "Authorization": `Bearer ${authToken}`,
+                "anthropic-version": "2023-06-01",
+            },
             body: JSON.stringify({ model: opts.model, max_tokens: 8192, messages: [{ role: "user", content: prompt }] }),
         });
         if (res.status === 429 && attempt < MAX_RETRIES) {
             const waitMs = BACKOFF[attempt];
-            onLog(`Cursor proxy rate limited — waiting ${Math.round(waitMs / 1000)}s`, "event");
+            onLog(`Planner proxy rate limited — waiting ${Math.round(waitMs / 1000)}s`, "event");
             await sleep(waitMs);
             continue;
         }
         if (!res.ok)
-            throw new Error(`Cursor proxy ${res.status}: ${(await res.text().catch(() => ""))}`);
+            throw new Error(`Planner proxy ${res.status}: ${(await res.text().catch(() => ""))}`);
         rl.record();
         apiEndpointLimiter.record();
         const data = await res.json();
         return data.content?.[0]?.text ?? "";
     }
-    throw new Error("Cursor proxy direct fetch failed after retries");
+    throw new Error("Planner proxy direct fetch failed after retries");
 }
 export async function runPlannerQuery(prompt, opts, onLog) {
     const env = opts.env ?? _envResolver?.(opts.model);
-    if (isCursorProxyEnv(env))
+    if (shouldUseDirectFetch(env))
         return runViaDirectFetch(prompt, opts, onLog);
     const MAX_RETRIES = 3;
     const BACKOFF = [30_000, 60_000, 120_000];

package/dist/planner/steering.js CHANGED Viewed

@@ -27,7 +27,11 @@ export const STEER_SCHEMA = {
         required: ["done", "tasks", "reasoning", "statusUpdate", "estimatedSessionsRemaining"],
     },
 };
-const PROMPT_BUDGET = 6000;
+// The base 30-1_steer template alone is ~7 KB, so any budget below that is
+// unreachable no matter how aggressively we trim variables. 20 KB leaves room
+// for the template + moderate run memory while still being a tiny fraction of
+// any planner's context window.
+const PROMPT_BUDGET = 20_000;
 const DEFAULT_CAPS = {
     milestones: 2000, designs: 1500, reflections: 1000,
     verifications: 1000, previousRuns: 800, userGuidance: 4000,

package/dist/providers/index.js CHANGED Viewed

@@ -109,9 +109,6 @@ export function envFor(p) {
         base.ANTHROPIC_AUTH_TOKEN = key;
     }
     delete base.ANTHROPIC_API_KEY;
-    // Prevent CURSOR_API_KEY from leaking into non-proxy envs — would trip
-    // isCursorProxyEnv false-positive, silently rerouting through direct fetch
-    // which ignores outputFormat (no JSON schema enforcement).
     delete base.CURSOR_API_KEY;
     delete base.CURSOR_AUTH_TOKEN;
     return base;

package/dist/run/run.js CHANGED Viewed

@@ -545,10 +545,18 @@ export async function executeRun(cfg) {
     display.stop();
     // ── Finalize ──
     const trulyDone = objectiveComplete || (!flex && remaining <= 0);
-    // User-initiated quit (or abort via 'q' / SIGINT / stall-watchdog) ⇒ save as
-    // "stopped" so resume.ts offers the run and the incomplete work comes back.
     const userQuit = stopping || lastAborted;
     const wasCapped = lastCapped && !userQuit;
+    // Determine specific exit reason for the end brief
+    let exitReason;
+    if (trulyDone)
+        exitReason = "done";
+    else if (userQuit)
+        exitReason = "user-interrupted";
+    else if (wasCapped || remaining <= 0)
+        exitReason = "budget-exhausted";
+    else
+        exitReason = "planner-gave-up"; // steering returned false, planner couldn't produce tasks
     const finalPhase = trulyDone ? "done"
         : userQuit ? "stopped"
             : wasCapped ? "capped"
@@ -632,7 +640,7 @@ export async function executeRun(cfg) {
         runDir, runBranch, objective, waveNum, runStartedAt: cfg.runStartedAt,
         branches, waveHistory,
         accCost, accCompleted, accFailed, accTools, accIn, accOut,
-        remaining, lastCapped, lastAborted, stopping, trulyDone,
+        remaining, lastCapped, lastAborted, stopping, trulyDone, exitReason,
         peakWorkerCtxTokens, peakWorkerCtxPct,
         currentSwarmLogFile: currentSwarm?.logFile,
         narrativeDeps: {

package/dist/run/summary.d.ts CHANGED Viewed

@@ -11,6 +11,7 @@ export interface FinalNarrativeDeps {
 /** Generate a longer narrative summary at run end. Awaited (not fire-and-forget)
  *  because the caller wants the text inline in the final status block. */
 export declare function generateFinalNarrative(deps: FinalNarrativeDeps, phase: string): Promise<string>;
+export type ExitReason = "done" | "budget-exhausted" | "user-interrupted" | "planner-gave-up" | "circuit-breaker" | "stalled";
 export interface SummaryArgs {
     runDir: string;
     runBranch?: string;
@@ -30,6 +31,7 @@ export interface SummaryArgs {
     lastAborted: boolean;
     stopping: boolean;
     trulyDone: boolean;
+    exitReason: ExitReason;
     peakWorkerCtxTokens: number;
     peakWorkerCtxPct: number;
     currentSwarmLogFile?: string;

package/dist/run/summary.js CHANGED Viewed

@@ -32,7 +32,7 @@ export async function generateFinalNarrative(deps, phase) {
     }
 }
 export async function printFinalSummary(args) {
-    const { runDir, runBranch, objective, waveNum, runStartedAt, branches, waveHistory, accCost, accCompleted, accFailed, accTools, accIn, accOut, remaining, lastCapped, lastAborted, stopping, trulyDone, peakWorkerCtxTokens, peakWorkerCtxPct, currentSwarmLogFile, narrativeDeps, } = args;
+    const { runDir, runBranch, objective, waveNum, runStartedAt, branches, waveHistory, accCost, accCompleted, accFailed, accTools, accIn, accOut, remaining, lastCapped, exitReason, peakWorkerCtxTokens, peakWorkerCtxPct, currentSwarmLogFile, narrativeDeps, } = args;
     const waves = waveNum + 1;
     const elapsed = Math.round((Date.now() - runStartedAt) / 1000);
     const elapsedStr = elapsed < 60 ? `${elapsed}s` : elapsed < 3600 ? `${Math.floor(elapsed / 60)}m ${elapsed % 60}s` : `${Math.floor(elapsed / 3600)}h ${Math.floor((elapsed % 3600) / 60)}m`;
@@ -40,26 +40,31 @@ export async function printFinalSummary(args) {
     const totalConflicts = branches.filter(b => b.status === "merge-failed").length;
     const termW = Math.max((process.stdout.columns ?? 80) || 80, 50);
     const rule = (c = "─") => chalk.dim(`  ${c.repeat(Math.min(termW - 4, 60))}`);
-    const phaseWord = trulyDone ? "complete"
-        : remaining <= 0 || lastCapped ? "budget exhausted"
-            : stopping || lastAborted ? "interrupted"
-                : "stopped";
+    const bannerChar = accFailed === 0 ? "━" : "─";
+    // Banner: title + subtitle explaining why the run ended
+    const banner = {
+        done: { icon: "✓", title: "CLAUDE OVERNIGHT  -- COMPLETE", color: chalk.green, explain: "The planner determined the objective was achieved." },
+        "budget-exhausted": { icon: "⚠", title: "CLAUDE OVERNIGHT  -- BUDGET EXHAUSTED", color: chalk.yellow, explain: "All allocated sessions were consumed." },
+        "user-interrupted": { icon: "⚠", title: "CLAUDE OVERNIGHT  -- INTERRUPTED", color: chalk.yellow, explain: "You quit mid-run with [q] or a signal." },
+        "planner-gave-up": { icon: "⚠", title: "CLAUDE OVERNIGHT  -- PLANNER GAVE UP", color: chalk.magenta, explain: "The planner could not decompose the remaining work into actionable tasks." },
+        "circuit-breaker": { icon: "⚠", title: "CLAUDE OVERNIGHT  -- HALTED", color: chalk.red, explain: "2+ consecutive waves produced no merged changes." },
+        stalled: { icon: "⚠", title: "CLAUDE OVERNIGHT  -- STALLED", color: chalk.magenta, explain: "No progress detected; the run was halted to preserve budget." },
+    }[exitReason] ?? { icon: "⚠", title: "CLAUDE OVERNIGHT  -- STOPPED", color: chalk.magenta, explain: "The run ended without a clear reason." };
+    const narrativePhase = exitReason === "done" ? "complete"
+        : exitReason === "budget-exhausted" ? "budget exhausted"
+            : exitReason === "user-interrupted" ? "interrupted"
+                : exitReason === "planner-gave-up" ? "planner gave up"
+                    : exitReason === "circuit-breaker" ? "circuit breaker"
+                        : exitReason === "stalled" ? "stalled"
+                            : "stopped";
     process.stdout.write(chalk.dim(`\n  Writing final summary…`));
-    const narrative = await generateFinalNarrative(narrativeDeps, phaseWord);
+    const narrative = await generateFinalNarrative(narrativeDeps, narrativePhase);
     process.stdout.write("\r" + " ".repeat(40) + "\r");
     console.log("");
-    const bannerChar = accFailed === 0 ? "━" : "─";
-    const bannerColor = trulyDone ? chalk.green : (stopping || lastAborted) ? chalk.yellow : chalk.magenta;
-    console.log(bannerColor(`  ${bannerChar.repeat(Math.min(termW - 4, 60))}`));
-    if (trulyDone)
-        console.log(chalk.bold.green(`  ✓ CLAUDE OVERNIGHT  -- COMPLETE`));
-    else if (remaining <= 0 || lastCapped)
-        console.log(chalk.bold.yellow(`  ⚠ CLAUDE OVERNIGHT  -- BUDGET EXHAUSTED`));
-    else if (stopping || lastAborted)
-        console.log(chalk.bold.yellow(`  ⚠ CLAUDE OVERNIGHT  -- INTERRUPTED`));
-    else
-        console.log(chalk.bold.yellow(`  ⚠ CLAUDE OVERNIGHT  -- STOPPED`));
-    console.log(bannerColor(`  ${bannerChar.repeat(Math.min(termW - 4, 60))}`));
+    console.log(banner.color(`  ${bannerChar.repeat(Math.min(termW - 4, 60))}`));
+    console.log(chalk.bold(banner.color(`  ${banner.icon} ${banner.title}`)));
+    console.log(chalk.dim(`  ${banner.explain}`));
+    console.log(banner.color(`  ${bannerChar.repeat(Math.min(termW - 4, 60))}`));
     console.log("");
     if (objective) {
         console.log(chalk.bold("  Objective"));
@@ -162,15 +167,34 @@ export async function printFinalSummary(args) {
     if (currentSwarmLogFile)
         console.log(chalk.dim(`  Log: ${currentSwarmLogFile}`));
     console.log("");
-    console.log(bannerColor(`  ${bannerChar.repeat(Math.min(termW - 4, 60))}`));
-    if (trulyDone)
-        console.log(chalk.bold.green(`  Done. Review the diff, then ship it.`));
-    else if (remaining <= 0 || lastCapped)
-        console.log(chalk.bold.yellow(`  Paused on budget. Re-run with --resume to continue.`));
-    else if (stopping || lastAborted)
-        console.log(chalk.bold.yellow(`  Interrupted. --resume to pick up where this left off.`));
-    else
-        console.log(chalk.bold.yellow(`  Stopped. --resume to continue.`));
-    console.log(bannerColor(`  ${bannerChar.repeat(Math.min(termW - 4, 60))}`));
+    console.log(banner.color(`  ${bannerChar.repeat(Math.min(termW - 4, 60))}`));
+    // Actionable next-steps based on exit reason
+    const endMsg = (() => {
+        switch (exitReason) {
+            case "done":
+                return "Review the diff, then ship it.";
+            case "budget-exhausted":
+                return remaining > 0
+                    ? "Budget sessions remaining but usage cap hit. Raise the cap or re-run with --resume."
+                    : "All sessions spent. Re-run with --resume to continue, or raise the budget.";
+            case "user-interrupted":
+                return "Run preserved. Use --resume to pick up where this left off.";
+            case "planner-gave-up": {
+                const lines = ["Planner could not decompose remaining work."];
+                if (remaining > 0)
+                    lines.push(`${remaining} sessions unused — the work may be too vague or out of scope.`);
+                lines.push("Refine the objective or break it down manually, then re-run.");
+                return lines.join(" ");
+            }
+            case "circuit-breaker":
+                return "No changes landed in 2+ waves. Check for merge conflicts or agent errors in the log.";
+            case "stalled":
+                return "Run halted to preserve budget. Inspect status.md for blockers, then --resume.";
+            default:
+                return "Run preserved. --resume to continue.";
+        }
+    })();
+    console.log(chalk.bold(banner.color(`  ${endMsg}`)));
+    console.log(banner.color(`  ${bannerChar.repeat(Math.min(termW - 4, 60))}`));
     console.log("");
 }

package/dist/run/wave-loop.js CHANGED Viewed

@@ -362,12 +362,13 @@ export async function runWaveLoop(host, ctx) {
             const librarianStart = Date.now();
             let librarianPromoted = 0, librarianPatched = 0, librarianQuarantined = 0, librarianRejected = 0;
             try {
+                const librarianModel = host.fastModel ?? host.workerModel;
                 const lr = await runLibrarian({
                     fingerprint: host.repoFingerprint,
                     runId: host.runId,
                     wave: host.waveNum,
                     cwd: ctx.cwd,
-                    model: host.plannerModel,
+                    model: librarianModel,
                     envForModel: ctx.envForModel,
                 });
                 librarianPromoted = lr.promoted;

package/dist/skills/librarian.js CHANGED Viewed

@@ -1,4 +1,3 @@
-import { query } from "@anthropic-ai/claude-agent-sdk";
 import { readFileSync, writeFileSync, mkdirSync, renameSync, existsSync, readdirSync, appendFileSync, } from "node:fs";
 import { join } from "node:path";
 import { openSkillsDb } from "./index-db.js";
@@ -84,44 +83,44 @@ function buildSubagentInput(canon, candidates, abOutcomes) {
     return JSON.stringify({ canon, candidates, ab_outcomes: abOutcomes });
 }
 // ── Subagent call ──
+// Direct POST /v1/messages — no tools needed, so the Agent SDK's CLI subprocess
+// (with its multi-KB built-in system prompt and turn loop) is pure overhead and
+// also pre-flight-rejects non-Anthropic model ids (qwen, composer-2, ...) even
+// when routed through an Anthropic-compatible proxy.
 async function callLibrarianSubagent(input, data) {
     const env = input.envForModel?.(input.model);
     const prompt = renderPrompt("40_skills/40-3_librarian-wrap", { vars: { data } });
-    let timedOut = false;
-    const timer = setTimeout(() => { timedOut = true; }, LIBRARIAN_TIMEOUT_MS);
+    const baseUrl = (env?.ANTHROPIC_BASE_URL ?? process.env.ANTHROPIC_BASE_URL ?? "https://api.anthropic.com").replace(/\/$/, "");
+    const headers = {
+        "Content-Type": "application/json",
+        "anthropic-version": "2023-06-01",
+    };
+    const bearer = env?.ANTHROPIC_AUTH_TOKEN ?? process.env.ANTHROPIC_AUTH_TOKEN;
+    const apiKey = env?.ANTHROPIC_API_KEY ?? process.env.ANTHROPIC_API_KEY;
+    if (bearer)
+        headers["Authorization"] = `Bearer ${bearer}`;
+    else if (apiKey)
+        headers["x-api-key"] = apiKey;
     try {
-        const pq = query({
-            prompt,
-            options: {
-                cwd: input.cwd,
-                model: input.model,
-                permissionMode: "bypassPermissions",
-                allowDangerouslySkipPermissions: true,
-                maxTurns: 8,
-                ...(env && { env }),
-            },
+        const res = await fetch(`${baseUrl}/v1/messages`, {
+            method: "POST",
+            headers,
+            body: JSON.stringify({ model: input.model, max_tokens: 8192, messages: [{ role: "user", content: prompt }] }),
+            signal: AbortSignal.timeout(LIBRARIAN_TIMEOUT_MS),
         });
-        let resultText = "";
-        for await (const msg of pq) {
-            if (timedOut) {
-                pq.interrupt().catch(() => { });
-                break;
-            }
-            if (msg.type === "result" && msg.subtype === "success") {
-                resultText = msg.result || "";
-            }
-        }
-        pq.close();
-        if (timedOut) {
-            process.stderr.write("[librarian] subagent timed out\n");
+        if (!res.ok) {
+            process.stderr.write(`[librarian] HTTP ${res.status}: ${(await res.text().catch(() => "")).slice(0, 200)}\n`);
             return null;
         }
-        // Parse JSON — try direct parse first, then strip markdown fences
+        const body = await res.json();
+        const resultText = body.content?.map(c => c.text ?? "").join("") ?? "";
         const cleaned = resultText.replace(/^```(?:json)?\s*\n([\s\S]*?)\n```\s*$/, "$1").trim();
         return JSON.parse(cleaned);
     }
-    finally {
-        clearTimeout(timer);
+    catch (err) {
+        const msg = err instanceof Error ? err.message : String(err);
+        process.stderr.write(`[librarian] ${msg.includes("aborted") ? "timed out" : `error: ${msg}`}\n`);
+        return null;
     }
 }
 // ── Action application ──

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "claude-overnight",
-  "version": "1.50.5",
+  "version": "1.51.1",
   "description": "Parallel Claude agents in git worktrees with a usage cap that reserves headroom for your interactive Claude Code. Crash-safe resume. Provider-agnostic model catalog (Anthropic, Cursor, OpenAI, Gemini, DeepSeek, Llama, Qwen) with capability-based task scoping.",
   "type": "module",
   "bin": {

package/plugins/claude-overnight/.claude-plugin/plugin.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "claude-overnight",
-  "version": "1.50.5",
+  "version": "1.51.1",
   "description": "Claude Code skill for understanding, installing, and inspecting claude-overnight runs  -- parallel Claude agents in git worktrees with thinking waves, multi-wave steering, and crash-safe resume. Supports Cursor API Proxy, Qwen, OpenRouter.",
   "author": {
     "name": "Francesco Fornace"