npm - swarm-code - Versions diffs - 0.1.4 → 0.1.6 - Mend

swarm-code 0.1.4 → 0.1.6

This diff compares the contents of two publicly available versions of this package, as released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those versions exactly as they appear in their respective public registries.

Files changed (10)

package/dist/config.js +1 -1
package/dist/hooks/runner.d.ts +35 -0
package/dist/hooks/runner.js +95 -0
package/dist/interactive-swarm.js +1 -2
package/dist/interactive.js +65 -22
package/dist/main.d.ts +1 -1
package/dist/main.js +11 -8
package/dist/prompts/orchestrator.js +4 -3
package/dist/swarm.js +40 -0
package/package.json +1 -1

package/dist/config.js CHANGED Viewed

@@ -23,7 +23,7 @@ const DEFAULTS = {
     max_session_budget_usd: 10.0,
     default_agent: "opencode",
     default_model: "anthropic/claude-sonnet-4-6",
-    auto_model_selection: false,
+    auto_model_selection: true,
     compression_strategy: "structured",
     compression_max_tokens: 1000,
     worktree_base_dir: ".swarm-worktrees",

package/dist/hooks/runner.d.ts ADDED Viewed

@@ -0,0 +1,35 @@
+/**
+ * Hook runner — executes user-defined commands at lifecycle points.
+ *
+ * Hooks provide deterministic control flow (not LLM-decided).
+ * They run shell commands and surface only errors — success is silent.
+ *
+ * Lifecycle points:
+ *   - post_thread: After a thread commits (before compression)
+ *   - post_merge: After merge_threads() completes
+ *   - post_session: When the session ends
+ */
+export interface HookConfig {
+    command: string;
+    on_failure: "warn" | "block";
+}
+export interface HooksConfig {
+    post_thread: HookConfig[];
+    post_merge: HookConfig[];
+    post_session: HookConfig[];
+}
+export interface HookResult {
+    success: boolean;
+    output: string;
+    command: string;
+}
+/**
+ * Load hooks from swarm_config.yaml hooks section, or from .swarm/hooks.yaml.
+ */
+export declare function loadHooks(projectDir: string): HooksConfig;
+/**
+ * Run hooks for a lifecycle point.
+ * Returns results for each hook. On "block" failure, throws.
+ * Success output is swallowed — only errors are surfaced.
+ */
+export declare function runHooks(hooks: HookConfig[], cwd: string, label: string): HookResult[];

package/dist/hooks/runner.js ADDED Viewed

@@ -0,0 +1,95 @@
+/**
+ * Hook runner — executes user-defined commands at lifecycle points.
+ *
+ * Hooks provide deterministic control flow (not LLM-decided).
+ * They run shell commands and surface only errors — success is silent.
+ *
+ * Lifecycle points:
+ *   - post_thread: After a thread commits (before compression)
+ *   - post_merge: After merge_threads() completes
+ *   - post_session: When the session ends
+ */
+import { execSync } from "node:child_process";
+import * as fs from "node:fs";
+import * as path from "node:path";
+const DEFAULT_HOOKS = {
+    post_thread: [],
+    post_merge: [],
+    post_session: [],
+};
+/**
+ * Load hooks from swarm_config.yaml hooks section, or from .swarm/hooks.yaml.
+ */
+export function loadHooks(projectDir) {
+    const hooksFile = path.join(projectDir, ".swarm", "hooks.yaml");
+    if (!fs.existsSync(hooksFile))
+        return { ...DEFAULT_HOOKS };
+    try {
+        const raw = fs.readFileSync(hooksFile, "utf-8");
+        return parseHooksYaml(raw);
+    }
+    catch {
+        return { ...DEFAULT_HOOKS };
+    }
+}
+function parseHooksYaml(raw) {
+    const hooks = { post_thread: [], post_merge: [], post_session: [] };
+    let currentSection = null;
+    for (const line of raw.split("\n")) {
+        const trimmed = line.trim();
+        if (!trimmed || trimmed.startsWith("#"))
+            continue;
+        if (trimmed === "post_thread:" || trimmed === "post_merge:" || trimmed === "post_session:") {
+            currentSection = trimmed.replace(":", "");
+            continue;
+        }
+        if (currentSection && trimmed.startsWith("- command:")) {
+            const command = trimmed
+                .replace("- command:", "")
+                .trim()
+                .replace(/^["']|["']$/g, "");
+            if (command) {
+                hooks[currentSection].push({ command, on_failure: "warn" });
+            }
+        }
+        if (currentSection && trimmed.startsWith("on_failure:")) {
+            const val = trimmed.replace("on_failure:", "").trim();
+            const last = hooks[currentSection][hooks[currentSection].length - 1];
+            if (last && (val === "warn" || val === "block")) {
+                last.on_failure = val;
+            }
+        }
+    }
+    return hooks;
+}
+/**
+ * Run hooks for a lifecycle point.
+ * Returns results for each hook. On "block" failure, throws.
+ * Success output is swallowed — only errors are surfaced.
+ */
+export function runHooks(hooks, cwd, label) {
+    const results = [];
+    for (const hook of hooks) {
+        try {
+            execSync(hook.command, {
+                cwd,
+                stdio: ["ignore", "pipe", "pipe"],
+                timeout: 60_000,
+                encoding: "utf-8",
+            });
+            // Success — silent (context-efficient per harness engineering best practice)
+            results.push({ success: true, output: "", command: hook.command });
+        }
+        catch (err) {
+            const stderr = err.stderr || err.stdout || err.message || "unknown error";
+            // Only surface error output
+            const output = `[${label}] Hook failed: ${hook.command}\n${stderr}`.trim();
+            results.push({ success: false, output, command: hook.command });
+            if (hook.on_failure === "block") {
+                throw new Error(output);
+            }
+        }
+    }
+    return results;
+}
+//# sourceMappingURL=runner.js.map

package/dist/interactive-swarm.js CHANGED Viewed

@@ -80,8 +80,7 @@ function parseInteractiveArgs(args) {
         // Silently ignore unknown flags and positional args
     }
     if (!dir) {
-        logError("--dir <path> is required for interactive swarm mode");
-        process.exit(1);
+        dir = process.cwd();
     }
     return {
         dir: path.resolve(dir),

package/dist/interactive.js CHANGED Viewed

@@ -1582,30 +1582,73 @@ async function interactive() {
                 console.log();
             }
             else {
-                // Agent works without keys (e.g. OpenCode) — set up Ollama directly
-                console.log(`  ${c.bold}${agent.name}${c.reset} ${c.dim}— setting up Ollama for local models:${c.reset}\n`);
-                const ok = await ensureOllamaSetup(setupRl, "ollama/deepseek-coder-v2");
-                if (ok)
-                    usesOllama = true;
+                // Agent works without keys (e.g. OpenCode) — choose backend
+                console.log(`  ${c.bold}${agent.name}${c.reset} ${c.dim}— choose your backend:${c.reset}\n`);
+                console.log(`  ${c.dim}1${c.reset}  Ollama       ${c.dim}Run models locally (free, requires download)${c.reset}`);
+                console.log(`  ${c.dim}2${c.reset}  OpenRouter   ${c.dim}Cloud API for 200+ models (requires API key)${c.reset}`);
+                console.log();
+                const backendChoice = await questionWithEsc(setupRl, `  ${c.cyan}Backend [1-2]:${c.reset} `);
+                const pickedOpenRouter = backendChoice !== null && backendChoice.trim() === "2";
+                if (pickedOpenRouter) {
+                    // OpenRouter setup
+                    console.log();
+                    const orKey = await questionWithEsc(setupRl, `  ${c.cyan}OPENROUTER_API_KEY:${c.reset} `);
+                    if (orKey?.trim()) {
+                        process.env.OPENROUTER_API_KEY = orKey.trim();
+                        try {
+                            const envPath = path.join(process.cwd(), ".env");
+                            let envContent = "";
+                            try {
+                                envContent = fs.readFileSync(envPath, "utf-8");
+                            }
+                            catch { }
+                            if (!envContent.includes("OPENROUTER_API_KEY")) {
+                                fs.appendFileSync(envPath, `\nOPENROUTER_API_KEY=${orKey.trim()}\n`);
+                            }
+                            console.log(`  ${c.green}✓${c.reset} OpenRouter configured`);
+                        }
+                        catch {
+                            console.log(`  ${c.green}✓${c.reset} OpenRouter key set for this session`);
+                        }
+                        currentModelId = "openrouter/auto";
+                        saveModelPreference(currentModelId);
+                    }
+                    else {
+                        console.log(`  ${c.dim}No key provided — you can set OPENROUTER_API_KEY in .env later${c.reset}`);
+                    }
+                }
+                else {
+                    // Ollama setup
+                    console.log();
+                    const ok = await ensureOllamaSetup(setupRl, "ollama/deepseek-coder-v2");
+                    if (ok)
+                        usesOllama = true;
+                }
                 console.log();
             }
         }
         // ── Step 3: Set default model ────────────────────────────────
-        const activeProvider = Object.keys(PROVIDER_KEYS).find((p) => process.env[providerEnvKey(p)]);
-        if (activeProvider) {
-            currentProviderName = activeProvider;
-            const defaultModel = getDefaultModelForProvider(activeProvider);
-            if (defaultModel) {
-                currentModelId = defaultModel;
+        if (currentModelId.startsWith("openrouter/")) {
+            // Already set during OpenRouter setup
+            console.log(`  ${c.green}✓${c.reset} Default model: ${c.bold}${currentModelId}${c.reset} ${c.dim}(OpenRouter)${c.reset}`);
+        }
+        else {
+            const activeProvider = Object.keys(PROVIDER_KEYS).find((p) => process.env[providerEnvKey(p)]);
+            if (activeProvider) {
+                currentProviderName = activeProvider;
+                const defaultModel = getDefaultModelForProvider(activeProvider);
+                if (defaultModel) {
+                    currentModelId = defaultModel;
+                    saveModelPreference(currentModelId);
+                    console.log(`  ${c.green}✓${c.reset} Default model: ${c.bold}${currentModelId}${c.reset}`);
+                }
+            }
+            else if (usesOllama) {
+                currentModelId = "ollama/deepseek-coder-v2";
                 saveModelPreference(currentModelId);
-                console.log(`  ${c.green}✓${c.reset} Default model: ${c.bold}${currentModelId}${c.reset}`);
+                console.log(`  ${c.green}✓${c.reset} Default model: ${c.bold}${currentModelId}${c.reset} ${c.dim}(local)${c.reset}`);
             }
         }
-        else if (usesOllama) {
-            currentModelId = "ollama/deepseek-coder-v2";
-            saveModelPreference(currentModelId);
-            console.log(`  ${c.green}✓${c.reset} Default model: ${c.bold}${currentModelId}${c.reset} ${c.dim}(local)${c.reset}`);
-        }
         console.log();
         setupRl.close();
     }
@@ -1637,12 +1680,12 @@ async function interactive() {
         }
     }
     if (!currentModel) {
-        if (currentModelId.startsWith("ollama/")) {
-            // Ollama model selected — this interactive REPL mode needs a cloud API.
-            // Redirect to swarm mode which works with OpenCode + Ollama.
-            console.log(`\n  ${c.green}✓${c.reset} Ollama model selected: ${c.bold}${currentModelId}${c.reset}`);
+        if (currentModelId.startsWith("ollama/") || currentModelId.startsWith("openrouter/")) {
+            // Non-pi-ai model — redirect to swarm mode which uses OpenCode natively.
+            const backend = currentModelId.startsWith("ollama/") ? "Ollama" : "OpenRouter";
+            console.log(`\n  ${c.green}✓${c.reset} ${backend} model selected: ${c.bold}${currentModelId}${c.reset}`);
             console.log(`\n  ${c.dim}This interactive REPL uses direct LLM API calls.${c.reset}`);
-            console.log(`  ${c.dim}To use Ollama models with OpenCode, run:${c.reset}\n`);
+            console.log(`  ${c.dim}To use ${backend} with OpenCode, run:${c.reset}\n`);
             console.log(`  ${c.bold}swarm --dir ./your-project "your task"${c.reset}\n`);
             process.exit(0);
         }

package/dist/main.d.ts CHANGED Viewed

@@ -10,6 +10,6 @@
  *   swarm run                    → single-shot RLM CLI run
  *   swarm viewer                 → browse trajectory files
  *   swarm benchmark              → run benchmarks
- *   swarm                        → interactive terminal (RLM mode, default)
+ *   swarm                        → interactive REPL (uses current directory)
  */
 export declare function buildHelp(): string;

package/dist/main.js CHANGED Viewed

@@ -10,7 +10,7 @@
  *   swarm run                    → single-shot RLM CLI run
  *   swarm viewer                 → browse trajectory files
  *   swarm benchmark              → run benchmarks
- *   swarm                        → interactive terminal (RLM mode, default)
+ *   swarm                        → interactive REPL (uses current directory)
  */
 import { bold, coral, cyan, dim, isTTY, symbols, termWidth, yellow } from "./ui/theme.js";
 export function buildHelp() {
@@ -45,8 +45,10 @@ export function buildHelp() {
     lines.push(`    ${yellow("swarm mcp")}                       ${dim("Start MCP server (stdio)")}`);
     lines.push(`    ${yellow("swarm mcp")} --dir ./project       ${dim("Start with default directory")}`);
     lines.push("");
+    lines.push(`  ${bold("INTERACTIVE")} ${dim("(default — uses current directory)")}`);
+    lines.push(`    ${yellow("swarm")}                          ${dim("Interactive REPL in current dir")}`);
+    lines.push("");
     lines.push(`  ${bold("RLM MODE")} ${dim("(text processing, inherited from rlm-cli)")}`);
-    lines.push(`    ${yellow("swarm")}                          ${dim("Interactive terminal (default)")}`);
     lines.push(`    ${yellow("swarm run")} [options] "<query>"  ${dim("Run a single query")}`);
     lines.push(`    ${yellow("swarm viewer")}                    ${dim("Browse saved trajectory files")}`);
     lines.push(`    ${yellow("swarm benchmark")} <name> [--idx]  ${dim("Run benchmark")}`);
@@ -125,13 +127,14 @@ async function main() {
         }
         return;
     }
-    const command = args[0] || "interactive";
+    const command = args[0] || "";
+    // Default: no command → interactive swarm mode using current directory
+    if (!command || command === "interactive" || command === "i") {
+        const { runInteractiveSwarm } = await import("./interactive-swarm.js");
+        await runInteractiveSwarm(["--dir", process.cwd(), ...args.slice(command ? 1 : 0)]);
+        return;
+    }
     switch (command) {
-        case "interactive":
-        case "i": {
-            await import("./interactive.js");
-            break;
-        }
         case "viewer":
         case "view": {
             process.argv = [process.argv[0], process.argv[1], ...args.slice(1)];

package/dist/prompts/orchestrator.js CHANGED Viewed

@@ -56,11 +56,11 @@ ${agentDescriptions}
 1. **Analyze first**: Use \`llm_query()\` or direct Python to understand the codebase/task
 2. **Decompose**: Break the task into independent, parallelizable units
-3. **Extract context**: For each thread, extract ONLY the relevant code/context — don't send everything
+3. **Extract context**: For each thread, extract ONLY the relevant code/context — don't send everything. Keep thread context under 5000 chars; agents have access to the full worktree
 4. **Spawn threads**: Use \`async_thread()\` + \`asyncio.gather()\` for parallel work
 5. **Inspect results**: Check each thread's result for success/failure
 6. **Merge**: Call \`merge_threads()\` to integrate changes
-7. **Verify**: Optionally spawn a test thread to verify the merged result
+7. **Verify**: ALWAYS spawn a verification thread after merging — run the project's test/typecheck/lint commands. If verification fails, fix before calling FINAL()
 8. **Report**: Call \`FINAL()\` with a summary
 ## Episode Quality & Caching
@@ -77,7 +77,8 @@ ${agentDescriptions}
 4. Use \`print()\` for intermediate output visible in the next iteration
 5. Max ${config.max_threads} concurrent threads, ${config.max_total_threads} total per session
 6. Thread timeout: ${config.thread_timeout_ms / 1000}s per thread
-7. Don't call FINAL prematurely — verify thread results first
+7. Don't call FINAL prematurely — verify thread results first. Always run verification after merge.
+8. Prefer cheap models for sub-agent threads (haiku, gpt-4o-mini) — save premium models for complex work
 8. The REPL persists state — variables survive across iterations
 ## Examples

package/dist/swarm.js CHANGED Viewed

@@ -25,6 +25,7 @@ await import("./agents/claude-code.js");
 await import("./agents/codex.js");
 await import("./agents/aider.js");
 import { randomBytes } from "node:crypto";
+import { loadHooks, runHooks } from "./hooks/runner.js";
 import { EpisodicMemory } from "./memory/episodic.js";
 import { buildSwarmSystemPrompt } from "./prompts/orchestrator.js";
 import { classifyTaskComplexity, describeAvailableAgents, FailureTracker, routeTask } from "./routing/model-router.js";
@@ -296,6 +297,7 @@ function resolveModel(modelId) {
 export async function runSwarmMode(rawArgs) {
     const args = parseSwarmArgs(rawArgs);
     const config = loadConfig();
+    const hooks = loadHooks(args.dir);
     // Configure UI
     if (args.json)
         setJsonMode(true);
@@ -420,6 +422,12 @@ export async function runSwarmMode(rawArgs) {
         }
         // Thread handler
         const threadHandler = async (task, threadContext, agentBackend, model, files) => {
+            // Context-size guard: warn and truncate if orchestrator sends too much context
+            const MAX_THREAD_CONTEXT = 50_000;
+            if (threadContext.length > MAX_THREAD_CONTEXT) {
+                logWarn(`Thread context too large (${(threadContext.length / 1024).toFixed(0)}KB) — truncating to ${MAX_THREAD_CONTEXT / 1000}KB. Agents have full worktree access; pass only relevant excerpts.`);
+                threadContext = `${threadContext.slice(0, MAX_THREAD_CONTEXT)}\n\n[... truncated — ${threadContext.length - MAX_THREAD_CONTEXT} chars removed ...]`;
+            }
             let resolvedAgent = agentBackend || config.default_agent;
             let resolvedModel = model || config.default_model;
             let routeSlot = "";
@@ -449,6 +457,18 @@ export async function runSwarmMode(rawArgs) {
                 },
                 files,
             });
+            // Run post-thread hooks (typecheck, lint, etc.) — success is silent, only errors surface
+            if (result.success && hooks.post_thread.length > 0) {
+                try {
+                    const worktreePath = path.join(args.dir, config.worktree_base_dir, `wt-${threadId}`);
+                    if (fs.existsSync(worktreePath)) {
+                        runHooks(hooks.post_thread, worktreePath, "post_thread");
+                    }
+                }
+                catch (hookErr) {
+                    logWarn(`Post-thread hook failed: ${hookErr.message}`);
+                }
+            }
             // Track failure in the failure tracker for routing adjustments
             if (!result.success) {
                 failureTracker.recordFailure(resolvedAgent, resolvedModel, task, result.summary || "unknown error");
@@ -494,6 +514,26 @@ export async function runSwarmMode(rawArgs) {
             const summary = results
                 .map((r) => (r.success ? `Merged ${r.branch}: ${r.message}` : `FAILED ${r.branch}: ${r.message}`))
                 .join("\n");
+            // Run post-merge hooks (tests, etc.) — success is silent
+            if (merged > 0 && hooks.post_merge.length > 0) {
+                try {
+                    const hookResults = runHooks(hooks.post_merge, args.dir, "post_merge");
+                    const hookFailures = hookResults.filter((r) => !r.success);
+                    if (hookFailures.length > 0) {
+                        const hookOutput = hookFailures.map((r) => r.output).join("\n");
+                        return {
+                            result: `${summary}\n\nPost-merge verification failed:\n${hookOutput}`,
+                            success: false,
+                        };
+                    }
+                }
+                catch (hookErr) {
+                    return {
+                        result: `${summary}\n\nPost-merge hook blocked: ${hookErr.message}`,
+                        success: false,
+                    };
+                }
+            }
             return {
                 result: summary || "No threads to merge",
                 success: results.every((r) => r.success),

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "swarm-code",
-  "version": "0.1.4",
+  "version": "0.1.6",
   "description": "Open-source swarm-native coding agent orchestrator — spawns parallel coding agents in isolated git worktrees, built on RLM (arXiv:2512.24601)",
   "type": "module",
   "bin": {