npm - @desplega.ai/agent-swarm - Versions diffs - 1.91.0 → 1.92.0 - Mend

@desplega.ai/agent-swarm 1.91.0 → 1.92.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (58) hide show

package/README.md +2 -1
package/openapi.json +585 -5
package/package.json +1 -1
package/src/be/db.ts +337 -1
package/src/be/migrations/083_script_workflows.sql +51 -0
package/src/be/modelsdev-cache.json +42352 -38595
package/src/be/scripts/typecheck.ts +49 -0
package/src/be/seed-scripts/catalog/compound-insights.ts +216 -6
package/src/be/seed-scripts/catalog/ops-catalog-audit.ts +911 -0
package/src/be/seed-scripts/catalog/task-context-gathering.ts +92 -0
package/src/be/seed-scripts/catalog/tool-usage.ts +6 -3
package/src/be/seed-scripts/index.ts +20 -2
package/src/be/seed-skills/index.ts +7 -0
package/src/be/swarm-config-guard.ts +17 -0
package/src/commands/runner.ts +43 -2
package/src/http/db-query.ts +20 -5
package/src/http/index.ts +10 -0
package/src/http/script-runs.ts +555 -0
package/src/prompts/session-templates.ts +24 -4
package/src/providers/claude-adapter.ts +60 -13
package/src/script-workflows/executor.ts +110 -0
package/src/script-workflows/harness.ts +73 -0
package/src/script-workflows/label-lint.ts +51 -0
package/src/script-workflows/limits.ts +22 -0
package/src/script-workflows/supervisor.ts +139 -0
package/src/script-workflows/workflow-ctx.ts +205 -0
package/src/scripts-runtime/sdk-allowlist.ts +3 -0
package/src/scripts-runtime/types/stdlib.d.ts +60 -0
package/src/scripts-runtime/types/swarm-sdk.d.ts +60 -0
package/src/server.ts +2 -0
package/src/slack/handlers.ts +11 -4
package/src/slack/message-text.ts +98 -0
package/src/slack/thread-buffer.ts +5 -3
package/src/tests/claude-adapter-binary.test.ts +147 -4
package/src/tests/db-query.test.ts +28 -0
package/src/tests/error-tracker.test.ts +121 -0
package/src/tests/harness-provider-resolution.test.ts +33 -0
package/src/tests/mcp-tools.test.ts +6 -0
package/src/tests/prompt-template-session.test.ts +34 -5
package/src/tests/script-runs-http.test.ts +278 -0
package/src/tests/script-workflows-label-lint.test.ts +43 -0
package/src/tests/script-workflows-runtime-e2e.test.ts +170 -0
package/src/tests/scripts-mcp-e2e.test.ts +49 -2
package/src/tests/seed-scripts.test.ts +347 -2
package/src/tests/slack-message-text.test.ts +250 -0
package/src/tests/system-default-skills.test.ts +40 -0
package/src/tools/db-query.ts +16 -6
package/src/tools/script-runs.ts +123 -0
package/src/tools/slack-read.ts +12 -3
package/src/tools/tool-config.ts +4 -1
package/src/types.ts +52 -0
package/src/utils/error-tracker.ts +40 -1
package/src/utils/internal-ai/complete-structured.ts +10 -4
package/src/workflows/executors/raw-llm.ts +76 -59
package/templates/skills/pages/content.md +205 -55
package/templates/skills/script-workflows/config.json +14 -0
package/templates/skills/script-workflows/content.md +68 -0
package/templates/skills/swarm-scripts/content.md +2 -3

package/src/providers/claude-adapter.ts CHANGED Viewed

@@ -108,6 +108,45 @@ export function resolveClaudeBinary(
   return candidate || "claude";
 }
/** Executable name substituted for the claude binary when the bridge toggle is on. */
const CLAUDE_BRIDGE_BINARY = "claude-bridge";

/**
 * Interpret a raw environment value as the claude-bridge on/off switch.
 *
 * After trimming and lower-casing, only `"true"` and `"1"` turn the toggle
 * on. Everything else — `"false"`, `"0"`, an unset variable, or any
 * unrecognised text — leaves it off.
 *
 * Exported for unit testing.
 *
 * @param raw - The env value as read, or `undefined` when the variable is unset.
 * @returns `true` only for an explicit enable value.
 */
export function parseClaudeBridgeEnabled(raw: string | undefined): boolean {
  if (raw == null) return false;
  switch (raw.trim().toLowerCase()) {
    case "true":
    case "1":
      return true;
    default:
      return false;
  }
}
/**
 * Decide whether the claude-bridge toggle is on, reading
 * `SWARM_USE_CLAUDE_BRIDGE` from the resolved-env overlay first and from the
 * fallback environment only when the overlay value is missing or blank.
 *
 * Exported for unit testing.
 *
 * @param resolvedEnv - Overlay environment consulted first.
 * @param fallbackEnv - Environment consulted when the overlay has no usable
 *   value; defaults to `process.env`.
 * @returns The parsed toggle state.
 */
export function resolveClaudeBridgeEnabled(
  resolvedEnv: Record<string, string | undefined>,
  fallbackEnv: Record<string, string | undefined> = process.env,
): boolean {
  const fromOverlay = resolvedEnv.SWARM_USE_CLAUDE_BRIDGE?.trim();
  if (fromOverlay) {
    return parseClaudeBridgeEnabled(fromOverlay);
  }
  const fromFallback = fallbackEnv.SWARM_USE_CLAUDE_BRIDGE?.trim();
  return parseClaudeBridgeEnabled(fromFallback);
}
/**
 * Work out which command line launches claude.
 *
 * When the claude-bridge toggle is enabled the bridge binary is used;
 * otherwise the binary is resolved via `resolveClaudeBinary`. The chosen raw
 * string is then split into an argv prefix by `parseClaudeBinary`.
 *
 * @param resolvedEnv - Overlay environment consulted first.
 * @param fallbackEnv - Environment used as fallback; defaults to `process.env`.
 * @returns The raw command string, its parsed argv, and whether the bridge
 *   toggle was enabled.
 */
function resolveClaudeBinaryArgv(
  resolvedEnv: Record<string, string | undefined>,
  fallbackEnv: Record<string, string | undefined> = process.env,
): { raw: string; argv: string[]; useClaudeBridge: boolean } {
  const useClaudeBridge = resolveClaudeBridgeEnabled(resolvedEnv, fallbackEnv);

  let raw: string;
  if (useClaudeBridge) {
    raw = CLAUDE_BRIDGE_BINARY;
  } else {
    raw = resolveClaudeBinary(resolvedEnv, fallbackEnv);
  }

  const argv = parseClaudeBinary(raw);
  return { raw, argv, useClaudeBridge };
}
 /**
  * Pre-seed `~/.claude.json` so the per-project trust-dialog ("Quick safety
  * check: Is this a project you trust?") doesn't block on first run.
@@ -797,12 +836,9 @@ export class ClaudeAdapter implements ProviderAdapter {
     console.log(`\x1b[2m[claude]\x1b[0m Using credential: ${credType}`);
     // Resolve the argv prefix. Same flags (`-p`, `--model`, ...) work across
-    // alternates; only argv[0..n] changes. `CLAUDE_BINARY` accepts a single
-    // binary (`"shannon"`, `"/usr/local/bin/shannon"`) or a whitespace-separated
-    // command string (`"bunx @dexh/shannon"`, `"npx -y @dexh/shannon"`).
-    // Setting it to anything containing `shannon` opts into the dexhorthy/shannon
-    // variant, which drives `claude` interactively in tmux to stay on the
-    // subscription credit pool after the 2026-06-15 programmatic-credit split.
+    // alternates; only argv[0..n] changes. Prefer SWARM_USE_CLAUDE_BRIDGE=true
+    // for the Desplega-owned bridge. CLAUDE_BINARY remains as the low-level
+    // override for custom binaries and the deprecated shannon path.
     //
     // `config.env` carries the swarm_config overlay (resolved repo > agent > global
     // by `fetchResolvedEnv` in src/commands/runner.ts), so operators can flip
@@ -811,19 +847,30 @@ export class ClaudeAdapter implements ProviderAdapter {
     //
     // See `docs-site/.../shannon-experimental.mdx` for the user-facing guide
     // and `runbooks/harness-providers.md` for engineering notes.
-    const claudeBinaryRaw = resolveClaudeBinary(config.env || process.env);
-    const claudeBinaryArgv = parseClaudeBinary(claudeBinaryRaw);
+    const {
+      raw: claudeBinaryRaw,
+      argv: claudeBinaryArgv,
+      useClaudeBridge,
+    } = resolveClaudeBinaryArgv(config.env || process.env);
     const isShannon = claudeBinaryRaw.toLowerCase().includes("shannon");
+    const configuredClaudeBinaryRaw = resolveClaudeBinary(config.env || process.env);
+    if (configuredClaudeBinaryRaw.toLowerCase().includes("shannon")) {
+      console.warn(
+        "\x1b[33m[claude]\x1b[0m CLAUDE_BINARY=shannon is deprecated; set SWARM_USE_CLAUDE_BRIDGE=true to use @desplega.ai/claude-bridge.",
+      );
+    }
     console.log(
-      `\x1b[2m[${config.role}]\x1b[0m Resolved CLAUDE_BINARY: ${claudeBinaryArgv.join(" ")} (isShannon: ${isShannon})`,
+      `\x1b[2m[${config.role}]\x1b[0m Resolved claude binary: ${claudeBinaryArgv.join(" ")} (useClaudeBridge: ${useClaudeBridge}, isShannon: ${isShannon})`,
     );
-    // Fail fast: shannon shells out to tmux. If it's missing, surface a
-    // clear error here rather than letting the spawn fail opaquely.
-    if (isShannon && !Bun.which("tmux")) {
+    // Fail fast: shannon and claude-bridge both shell out to tmux. If it's
+    // missing, surface a clear error here rather than letting startup fail
+    // opaquely.
+    if ((isShannon || useClaudeBridge) && !Bun.which("tmux")) {
+      const label = useClaudeBridge ? "SWARM_USE_CLAUDE_BRIDGE=true" : "CLAUDE_BINARY=shannon";
       throw new Error(
-        "CLAUDE_BINARY=shannon requires 'tmux' on PATH (install via apt/brew). See runbooks/harness-providers.md.",
+        `${label} requires 'tmux' on PATH (install via apt/brew). See runbooks/harness-providers.md.`,
       );
     }

package/src/script-workflows/executor.ts ADDED Viewed

@@ -0,0 +1,110 @@
+import { existsSync } from "node:fs";
+import { mkdir, rm } from "node:fs/promises";
+import { resolve } from "node:path";
+import type { ScriptRun } from "../types";
/** Outcome reported once a script workflow execution has exited. */
export type ScriptExecutionResult = {
  /** Exit code of the execution, or `null` when no numeric code is available. */
  exitCode: number | null;
  /** Text captured from the execution's standard error stream. */
  stderr: string;
};

/** Live handle for one started script workflow execution. */
export type ScriptExecutionHandle = {
  /** Process id of the execution, or `null` when the executor has none to report. */
  pid: number | null;
  /** Scratch directory associated with this execution. */
  tmpdir: string;
  /** Epoch milliseconds recorded when the execution was started. */
  startedAtMs: number;
  /** Settles with the exit code and captured stderr once the execution ends. */
  exited: Promise<ScriptExecutionResult>;
  /** Ask the execution to stop by sending it `signal`. */
  terminate(signal?: NodeJS.Signals): void;
  /** Release resources held for this execution (such as its scratch directory). */
  cleanup(): Promise<void>;
};

/** Everything an executor needs to launch one script run. */
export type StartScriptExecutionInput = {
  /** The script run to execute. */
  run: ScriptRun;
  /** Base URL handed to the execution for calling back into the server. */
  baseUrl: string;
  /** API key handed to the execution for authenticating its callbacks. */
  apiKey: string;
};

/** Strategy for launching and signalling script workflow executions. */
export interface ScriptExecutor {
  /** Launch an execution for the given run and return a handle to it. */
  start(input: StartScriptExecutionInput): Promise<ScriptExecutionHandle>;
  /** Report whether a process with the given pid is currently alive. */
  isRunning(pid: number): boolean;
  /** Send `signal` to the process with the given pid. */
  terminatePid(pid: number, signal?: NodeJS.Signals): void;
}
/**
 * Locate the harness entry point that is handed to `bun run` for each
 * script workflow subprocess.
 *
 * - When `SCRIPT_WORKFLOW_RUNTIME_DIR` is unset, the `harness.ts` file that
 *   sits next to this module is used.
 * - When it is set, `harness.bundle.js` inside that directory is required to
 *   exist and is used instead.
 *
 * @returns Filesystem path of the harness.
 * @throws Error when `SCRIPT_WORKFLOW_RUNTIME_DIR` is set but the bundle is
 *   missing from it.
 */
export function getScriptWorkflowHarnessPath(): string {
  const runtimeDir = process.env.SCRIPT_WORKFLOW_RUNTIME_DIR;
  if (!runtimeDir) {
    // `URL#pathname` is percent-encoded (a space becomes `%20`), so it is not
    // a usable filesystem path when the install location contains spaces or
    // non-ASCII characters. Convert the file URL properly instead.
    return Bun.fileURLToPath(new URL("./harness.ts", import.meta.url));
  }

  const bundledHarness = resolve(runtimeDir, "harness.bundle.js");
  if (!existsSync(bundledHarness)) {
    throw new Error(
      `Script workflow harness bundle not found at ${bundledHarness}. ` +
        "Build/copy harness.bundle.js and set SCRIPT_WORKFLOW_RUNTIME_DIR to its directory.",
    );
  }
  return bundledHarness;
}
/** Read the errno-style `code` (e.g. `"ESRCH"`) off a thrown value, if it has one. */
function errnoCodeOf(err: unknown): string | undefined {
  if (typeof err !== "object" || err === null || !("code" in err)) return undefined;
  const code = (err as { code?: unknown }).code;
  return typeof code === "string" ? code : undefined;
}

/** A pid is only safe to signal when it names a single process (positive integer). */
function isSignalablePid(pid: number): boolean {
  return Number.isInteger(pid) && pid > 0;
}

/**
 * Executes script workflows as local `bun run <harness>` subprocesses.
 *
 * Each run gets a scratch directory holding `source.ts` and `args.json`; the
 * subprocess receives a minimal, explicitly listed environment.
 */
export class LocalProcessScriptExecutor implements ScriptExecutor {
  /**
   * Write the run's source and args to a scratch directory and spawn the
   * harness subprocess.
   *
   * @param input - The run to execute plus the base URL and API key passed to
   *   the subprocess via its environment.
   * @returns A handle exposing the pid, exit promise, and terminate/cleanup hooks.
   * @throws Whatever the file writes, harness lookup, or spawn throw; the
   *   scratch directory is removed before the error is re-thrown.
   */
  async start(input: StartScriptExecutionInput): Promise<ScriptExecutionHandle> {
    const { run, baseUrl, apiKey } = input;
    const tmpdir = `${process.env.TMPDIR ?? "/tmp"}/script-workflow-${run.id}`;
    await mkdir(tmpdir, { recursive: true });
    try {
      const sourceFile = `${tmpdir}/source.ts`;
      const argsFile = `${tmpdir}/args.json`;
      await Bun.write(sourceFile, run.source);
      await Bun.write(argsFile, JSON.stringify(run.args ?? null));
      const proc = Bun.spawn(["bun", "run", getScriptWorkflowHarnessPath()], {
        cwd: tmpdir,
        stdin: "ignore",
        stdout: "ignore",
        stderr: "pipe",
        // Only these variables are passed on; the parent environment is not inherited.
        env: {
          PATH: process.env.PATH ?? "/usr/bin:/bin",
          HOME: process.env.HOME ?? "/tmp",
          LANG: process.env.LANG ?? "C.UTF-8",
          LC_ALL: process.env.LC_ALL ?? "C.UTF-8",
          TMPDIR: tmpdir,
          AGENT_SWARM_API_KEY: apiKey,
          MCP_BASE_URL: baseUrl,
          SCRIPT_RUN_ID: run.id,
          SCRIPT_RUN_AGENT_ID: run.agentId,
          SCRIPT_RUN_TMPDIR: tmpdir,
          SCRIPT_RUN_SOURCE_FILE: sourceFile,
          SCRIPT_RUN_ARGS_FILE: argsFile,
        },
      });
      // Start draining stderr immediately; a read failure degrades to "".
      const stderrPromise = new Response(proc.stderr).text().catch(() => "");
      return {
        pid: proc.pid,
        tmpdir,
        startedAtMs: Date.now(),
        exited: proc.exited.then(async (exitCode) => ({
          exitCode,
          stderr: await stderrPromise,
        })),
        terminate: (signal = "SIGTERM") => {
          proc.kill(signal);
        },
        cleanup: async () => {
          await rm(tmpdir, { recursive: true, force: true });
        },
      };
    } catch (err) {
      // No handle is returned on failure, so nobody else could call cleanup():
      // remove the scratch directory here (best effort) and surface the
      // original error.
      await rm(tmpdir, { recursive: true, force: true }).catch(() => {});
      throw err;
    }
  }

  /**
   * Probe whether a process with the given pid exists and can be signalled
   * by this process.
   *
   * @param pid - Process id to probe.
   * @returns `false` for non-positive or non-integer pids and whenever the
   *   probe signal cannot be delivered; `true` otherwise.
   */
  isRunning(pid: number): boolean {
    // pid 0 and negative pids address process groups, not a single process,
    // so they can never identify one script run.
    if (!isSignalablePid(pid)) return false;
    try {
      // Signal 0 performs the existence/permission check without delivering anything.
      process.kill(pid, 0);
      return true;
    } catch {
      return false;
    }
  }

  /**
   * Send `signal` to the process with the given pid.
   *
   * A process that has already exited is treated as successfully terminated.
   *
   * @param pid - Process id to signal.
   * @param signal - Signal to send; defaults to `SIGTERM`.
   * @throws RangeError when `pid` is not a positive integer (signalling it
   *   would target a process group rather than one process).
   * @throws Any other error raised by `process.kill` (e.g. `EPERM`).
   */
  terminatePid(pid: number, signal: NodeJS.Signals = "SIGTERM"): void {
    if (!isSignalablePid(pid)) {
      throw new RangeError(`Refusing to signal invalid pid ${pid}`);
    }
    try {
      process.kill(pid, signal);
    } catch (err) {
      // ESRCH: the process exited between the caller's liveness check and now.
      if (errnoCodeOf(err) === "ESRCH") return;
      throw err;
    }
  }
}

/** Shared executor instance used by default. */
export const localProcessScriptExecutor = new LocalProcessScriptExecutor();

package/src/script-workflows/harness.ts ADDED Viewed

@@ -0,0 +1,73 @@
+import { buildWorkflowCtx } from "./workflow-ctx";
/**
 * Read an environment variable that the harness cannot run without.
 *
 * @param name - Name of the environment variable.
 * @returns The variable's value.
 * @throws Error when the variable is unset or empty.
 */
function requiredEnv(name: string): string {
  const found = process.env[name];
  if (found) {
    return found;
  }
  throw new Error(`Missing required env ${name}`);
}
/**
 * Report a status update for a script run to the server's internal API.
 *
 * @param runId - Id of the script run being reported on.
 * @param baseUrl - Server base URL (no trailing slash expected).
 * @param agentId - Sent as the `X-Agent-ID` header.
 * @param apiKey - Sent as a bearer token.
 * @param body - JSON-serialisable payload describing the status.
 * @throws Error when the server answers with a non-OK response; the message
 *   carries the HTTP status and response text.
 */
async function postStatus(
  runId: string,
  baseUrl: string,
  agentId: string,
  apiKey: string,
  body: Record<string, unknown>,
): Promise<void> {
  const endpoint = `${baseUrl}/api/internal/script-runs/${runId}/status`;
  const headers = {
    Authorization: `Bearer ${apiKey}`,
    "X-Agent-ID": agentId,
    "Content-Type": "application/json",
  };
  const payload = JSON.stringify(body);

  const response = await fetch(endpoint, { method: "POST", headers, body: payload });
  if (response.ok) {
    return;
  }

  const detail = await response.text();
  throw new Error(`status callback failed with ${response.status}: ${detail}`);
}
// ---------------------------------------------------------------------------
// Harness entry point: runs one user script and reports its outcome.
// All inputs arrive through environment variables set by the spawning side.
// ---------------------------------------------------------------------------
const runId = requiredEnv("SCRIPT_RUN_ID");
const agentId = requiredEnv("SCRIPT_RUN_AGENT_ID");
const apiKey = requiredEnv("AGENT_SWARM_API_KEY");
// Drop a single trailing slash so URL templates below never produce "//".
const baseUrl = requiredEnv("MCP_BASE_URL").replace(/\/$/, "");
const sourceFile = requiredEnv("SCRIPT_RUN_SOURCE_FILE");
const argsFile = requiredEnv("SCRIPT_RUN_ARGS_FILE");
const userModulePath = `${requiredEnv("SCRIPT_RUN_TMPDIR")}/user-script.ts`;

// Fire-and-forget heartbeat every 10 seconds; failures are deliberately
// ignored so a flaky network never kills the user script.
const heartbeat = setInterval(() => {
  fetch(`${baseUrl}/api/internal/script-runs/${runId}/heartbeat`, {
    method: "POST",
    headers: {
      Authorization: `Bearer ${apiKey}`,
      "X-Agent-ID": agentId,
    },
  }).catch(() => {});
}, 10_000);
// The timer alone must not keep the process alive.
heartbeat.unref?.();

let exitCode = 0;
try {
  const source = await Bun.file(sourceFile).text();
  const args = JSON.parse(await Bun.file(argsFile).text());
  // Copy the source to a module path inside the scratch directory and import it.
  await Bun.write(userModulePath, source);
  const mod = await import(userModulePath);
  if (typeof mod.default !== "function") {
    throw new Error("Script workflow must export a default function");
  }
  const ctx = buildWorkflowCtx({ runId, agentId, apiKey, baseUrl, args });
  const output = await mod.default(args, ctx);
  await postStatus(runId, baseUrl, agentId, apiKey, {
    status: "completed",
    output: output ?? null,
  });
} catch (err) {
  exitCode = 1;
  console.error(err instanceof Error ? err.stack || err.message : String(err));
  try {
    await postStatus(runId, baseUrl, agentId, apiKey, {
      status: "failed",
      error: err instanceof Error ? err.message : String(err),
    });
  } catch (reportErr) {
    // The failure report itself failed (e.g. server unreachable). Log it, but
    // keep the original error as the primary message and still exit with 1
    // instead of dying on a second, unrelated exception.
    console.error(
      `[script-workflows] failed to report failure for run ${runId}: ${
        reportErr instanceof Error ? reportErr.message : String(reportErr)
      }`,
    );
  }
} finally {
  clearInterval(heartbeat);
}
// Exit explicitly, after the heartbeat timer has been cleared.
process.exit(exitCode);

package/src/script-workflows/label-lint.ts ADDED Viewed

@@ -0,0 +1,51 @@
/** One literal step label that was found in a loop-like context. */
export type LabelLintError = {
  /** The literal label text. */
  label: string;
  /** 1-based line number of the offending call, when known. */
  lineNumber: number | null;
  /** Human-readable explanation of the problem. */
  detail: string;
};

/** Lint outcome: either clean, or a list of offending labels. */
export type LabelLintResult = { ok: true } | { ok: false; errors: LabelLintError[] };

// Matches `ctx.step.<method>(` followed by a plain string literal as first
// argument. Both double- and single-quoted literals are captured (groups 1
// and 2); template literals are intentionally not matched because they are the
// recommended way to build per-iteration labels.
const CTX_STEP_LITERAL_LABEL_PATTERN = /ctx\.step\.\w+\(\s*(?:"([^"]+)"|'([^']+)')/g;

// Textual hints that code is running inside a loop or an iterating callback.
const LOOP_PATTERNS = [
  /\bfor\s*\(/,
  /\bwhile\s*\(/,
  /\.map\s*\(/,
  /\.forEach\s*\(/,
  /\.reduce\s*\(/,
  /\.flatMap\s*\(/,
];

// How many preceding lines are searched for a loop hint.
const LOOP_CONTEXT_LINES = 10;

/**
 * Heuristically flag `ctx.step.*("literal")` calls that appear inside a loop.
 *
 * A call is reported when its own line or any of the 10 lines before it
 * contains a loop-like construct (`for (`, `while (`, `.map(`, `.forEach(`,
 * `.reduce(`, `.flatMap(`). This is a line-based text scan, not a parse, so it
 * can both over- and under-report.
 *
 * @param source - Script source text to scan.
 * @returns `{ ok: true }` when nothing was flagged, otherwise
 *   `{ ok: false, errors }` with one entry per offending call.
 */
export function lintWorkflowLabels(source: string): LabelLintResult {
  const errors: LabelLintError[] = [];
  const lines = source.split("\n");

  for (const [index, line] of lines.entries()) {
    // matchAll works on a private copy of the regex, so no lastIndex bookkeeping.
    const calls = [...line.matchAll(CTX_STEP_LITERAL_LABEL_PATTERN)];
    if (calls.length === 0) continue;

    // The loop context is identical for every call on this line; compute it once.
    const windowStart = Math.max(0, index - LOOP_CONTEXT_LINES);
    const context = lines.slice(windowStart, index + 1).join("\n");
    if (!LOOP_PATTERNS.some((pattern) => pattern.test(context))) continue;

    const lineNumber = index + 1;
    for (const call of calls) {
      const label = call[1] ?? call[2];
      if (!label) continue;
      errors.push({
        label,
        lineNumber,
        detail:
          `Literal string label "${label}" at line ${lineNumber} appears inside a loop. ` +
          "Labels must be unique per run; use a template literal that includes the loop variable.",
      });
    }
  }

  return errors.length > 0 ? { ok: false, errors } : { ok: true };
}

package/src/script-workflows/limits.ts ADDED Viewed

@@ -0,0 +1,22 @@
// Built-in limits used when the corresponding env override is absent or invalid.
const DEFAULT_MAX_STEPS = 1000;
const DEFAULT_MAX_WALL_MS = 24 * 60 * 60 * 1000; // 24 hours
const DEFAULT_MAX_AGENT_TASKS = 50;

/**
 * Read a positive integer from an environment variable.
 *
 * Fractional values are rounded down. The result must still be at least 1
 * after rounding, so values such as `"0.5"` fall back instead of yielding 0.
 *
 * @param name - Environment variable to read.
 * @param fallback - Value returned when the variable is unset, empty,
 *   non-numeric, non-finite, or rounds down to less than 1.
 * @returns The parsed positive integer, or `fallback`.
 */
function positiveIntEnv(name: string, fallback: number): number {
  const raw = process.env[name];
  if (!raw) return fallback;
  // Floor first, then validate: checking `> 0` before flooring would accept
  // 0 < x < 1 and then turn it into 0.
  const floored = Math.floor(Number(raw));
  return Number.isFinite(floored) && floored >= 1 ? floored : fallback;
}

/** Maximum number of steps per script run (`SCRIPT_RUN_MAX_STEPS`, default 1000). */
export function scriptRunMaxSteps(): number {
  return positiveIntEnv("SCRIPT_RUN_MAX_STEPS", DEFAULT_MAX_STEPS);
}

/** Maximum wall-clock time per script run in ms (`SCRIPT_RUN_MAX_WALL_MS`, default 24 h). */
export function scriptRunMaxWallMs(): number {
  return positiveIntEnv("SCRIPT_RUN_MAX_WALL_MS", DEFAULT_MAX_WALL_MS);
}

/** Maximum number of agent tasks per script run (`SCRIPT_RUN_MAX_AGENT_TASKS`, default 50). */
export function scriptRunMaxAgentTasks(): number {
  return positiveIntEnv("SCRIPT_RUN_MAX_AGENT_TASKS", DEFAULT_MAX_AGENT_TASKS);
}

package/src/script-workflows/supervisor.ts ADDED Viewed

@@ -0,0 +1,139 @@
+import { getRunningScriptRuns, getScriptRun, updateScriptRun } from "../be/db";
+import type { ScriptRun } from "../types";
+import { getApiKey } from "../utils/api-key";
+import {
+  localProcessScriptExecutor,
+  type ScriptExecutionHandle,
+  type ScriptExecutor,
+} from "./executor";
+import { scriptRunMaxWallMs } from "./limits";
/** Bookkeeping kept for each script run this process has started. */
interface ManagedRun {
  /** Handle returned by the executor for the run's current execution. */
  execution: ScriptExecutionHandle;
}

/** Runs started by this process, keyed by run id. */
const managed: Map<string, ManagedRun> = new Map();

/** Timer driving periodic reconciliation; `null` while the supervisor is stopped. */
let reconcileTimer: ReturnType<typeof setInterval> | null = null;

/** Executor used to launch and signal runs; replaceable via `setScriptRunExecutor`. */
let scriptExecutor: ScriptExecutor = localProcessScriptExecutor;
/**
 * Whether the supervisor is switched off via environment.
 *
 * @returns `true` only when `SCRIPT_RUN_SUPERVISOR_DISABLE` is exactly `"true"`.
 */
function supervisorDisabled(): boolean {
  const flag = process.env.SCRIPT_RUN_SUPERVISOR_DISABLE;
  return flag === "true";
}
/**
 * Swap the executor used for all subsequently started or signalled runs.
 *
 * @param executor - Replacement executor implementation.
 */
export function setScriptRunExecutor(executor: ScriptExecutor): void {
  const replacement = executor;
  scriptExecutor = replacement;
}
/**
 * Ids of runs whose executor start is still being awaited. Checked together
 * with `managed` so overlapping callers cannot spawn the same run twice.
 */
const startingRunIds = new Set<string>();

/**
 * Start the execution for a script run and wire up its exit handling.
 *
 * Does nothing when the supervisor is disabled, or when the run is already
 * managed or currently being started by this process. On success the run is
 * marked `running` with the new pid. When the execution later exits while the
 * run is still `running`, the run is marked `completed` (exit code 0) or
 * `failed` (anything else, with stderr as the error text).
 *
 * @param run - The script run to start.
 * @param baseUrl - Base URL passed to the execution for callbacks.
 * @param apiKeyOverride - API key to use instead of the configured one.
 * @throws Error when no API key is available, or whatever the executor's
 *   `start` throws.
 */
export async function startScriptRunProcess(
  run: ScriptRun,
  baseUrl: string,
  apiKeyOverride?: string,
): Promise<void> {
  if (supervisorDisabled()) return;
  if (managed.has(run.id) || startingRunIds.has(run.id)) return;
  const apiKey = apiKeyOverride ?? getApiKey();
  if (!apiKey) throw new Error("AGENT_SWARM_API_KEY is required to spawn script runs");
  if (process.env.SCRIPT_WORKFLOW_DEBUG === "true") {
    console.error(
      `[script-workflows] spawning ${run.id} auth override=${apiKeyOverride ? "yes" : "no"} len=${apiKey.length}`,
    );
  }

  // `managed` is only populated after the await below; without this marker a
  // second caller arriving in that window would pass the guard above and
  // spawn a duplicate execution for the same run.
  startingRunIds.add(run.id);
  let execution: ScriptExecutionHandle;
  try {
    execution = await scriptExecutor.start({ run, baseUrl, apiKey });
    managed.set(run.id, { execution });
  } finally {
    startingRunIds.delete(run.id);
  }

  updateScriptRun(run.id, {
    status: "running",
    pid: execution.pid,
    lastHeartbeatAt: new Date().toISOString(),
  });

  /** True when a newer execution has taken over this run id in `managed`. */
  const supersededBy = (): ScriptExecutionHandle | undefined => {
    const owner = managed.get(run.id);
    return owner && owner.execution !== execution ? owner.execution : undefined;
  };

  void execution.exited
    .then(({ exitCode, stderr }) => {
      // A newer execution now owns this run: the exit of this old one must
      // not rewrite the run's status.
      if (supersededBy()) return;
      const current = getScriptRun(run.id);
      if (!current || current.status !== "running") return;
      if (exitCode !== 0) {
        console.error(
          `[script-workflows] run ${run.id} subprocess exited ${exitCode}: ${stderr.trim() || "(no stderr)"}`,
        );
      }
      updateScriptRun(run.id, {
        status: exitCode === 0 ? "completed" : "failed",
        pid: null,
        finishedAt: new Date().toISOString(),
        error:
          exitCode === 0 ? null : stderr.trim() || `Script workflow subprocess exited ${exitCode}`,
      });
    })
    .catch((err) => {
      console.error(
        `[script-workflows] run ${run.id} exit handling failed: ${err instanceof Error ? err.message : String(err)}`,
      );
    })
    .finally(async () => {
      const newer = supersededBy();
      // Only drop the registry entry if it still belongs to this execution.
      if (!newer) managed.delete(run.id);
      // If a newer execution shares this scratch directory, leave it in place;
      // that execution's own cleanup will remove it.
      if (newer && newer.tmpdir === execution.tmpdir) return;
      await execution.cleanup();
    })
    .catch((err) => {
      console.error(
        `[script-workflows] run ${run.id} cleanup failed: ${err instanceof Error ? err.message : String(err)}`,
      );
    });
}
/**
 * Send SIGTERM to the execution behind a script run.
 *
 * Prefers the handle tracked in this process (which is then removed from the
 * registry); otherwise falls back to the pid stored on the run, provided the
 * executor reports that pid as alive.
 *
 * @param runId - Id of the run to terminate.
 * @returns `true` when a signal was sent, `false` when nothing was found to signal.
 */
export function terminateScriptRunProcess(runId: string): boolean {
  const tracked = managed.get(runId);
  const persisted = getScriptRun(runId);

  if (tracked !== undefined) {
    tracked.execution.terminate("SIGTERM");
    managed.delete(runId);
    return true;
  }

  const storedPid = persisted?.pid;
  if (!storedPid || !scriptExecutor.isRunning(storedPid)) {
    return false;
  }
  scriptExecutor.terminatePid(storedPid, "SIGTERM");
  return true;
}
/**
 * Pause a script run: terminate its execution (if any) and record the run as
 * `paused` with no pid.
 *
 * @param runId - Id of the run to pause.
 */
export function pauseScriptRunProcess(runId: string): void {
  terminateScriptRunProcess(runId);
  const pausedState = { status: "paused" as const, pid: null };
  updateScriptRun(runId, pausedState);
}
/**
 * Abort a script run because it exceeded a limit: terminate its execution (if
 * any) and record the run as `aborted_limit` with the given reason.
 *
 * @param runId - Id of the run to abort.
 * @param reason - Stored as the run's error text.
 */
export function abortScriptRunLimit(runId: string, reason: string): void {
  terminateScriptRunProcess(runId);
  const finishedAt = new Date().toISOString();
  updateScriptRun(runId, {
    status: "aborted_limit",
    pid: null,
    finishedAt,
    error: reason,
  });
}
/**
 * One reconciliation pass over the runs returned by `getRunningScriptRuns`.
 *
 * - Paused runs are left alone.
 * - A run tracked by this process is aborted once it has been running longer
 *   than the wall-clock limit.
 * - A run that is not tracked here and whose stored pid is missing or no
 *   longer alive is started again; a failed start marks the run `failed`.
 *
 * No-op while the supervisor is disabled.
 *
 * @param baseUrl - Base URL passed to any execution that gets started.
 */
export function reconcileScriptRuns(baseUrl: string): void {
  if (supervisorDisabled()) return;

  for (const run of getRunningScriptRuns()) {
    if (run.status === "paused") continue;

    const tracked = managed.get(run.id);
    if (tracked) {
      // Tracked runs only need the wall-clock check; they are never restarted here.
      const elapsedMs = Date.now() - tracked.execution.startedAtMs;
      if (elapsedMs > scriptRunMaxWallMs()) {
        abortScriptRunLimit(run.id, `SCRIPT_RUN_MAX_WALL_MS exceeded (${scriptRunMaxWallMs()})`);
      }
      continue;
    }

    // Untracked, but the recorded process is still alive: nothing to do.
    if (run.pid && scriptExecutor.isRunning(run.pid)) continue;

    startScriptRunProcess(run, baseUrl).catch((err) => {
      const message = err instanceof Error ? err.message : String(err);
      updateScriptRun(run.id, {
        status: "failed",
        pid: null,
        finishedAt: new Date().toISOString(),
        error: message,
      });
    });
  }
}
/**
 * Start the supervisor: reconcile once immediately, then every 15 seconds.
 *
 * No-op when the supervisor is disabled or already started. The timer is
 * unref'd so it does not keep the process alive on its own.
 *
 * @param baseUrl - Base URL forwarded to every reconciliation pass.
 */
export function startScriptRunSupervisor(baseUrl: string): void {
  if (supervisorDisabled()) return;
  if (reconcileTimer) return;

  reconcileScriptRuns(baseUrl);
  const timer = setInterval(() => reconcileScriptRuns(baseUrl), 15_000);
  reconcileTimer = timer;
  timer.unref?.();
}
/**
 * Stop the supervisor: cancel periodic reconciliation and terminate every
 * execution tracked by this process.
 */
export function stopScriptRunSupervisor(): void {
  if (reconcileTimer) {
    clearInterval(reconcileTimer);
  }
  reconcileTimer = null;

  // Snapshot the ids first: terminating a run removes it from `managed`.
  const trackedIds = Array.from(managed.keys());
  for (const id of trackedIds) {
    terminateScriptRunProcess(id);
  }
}