npm - @desplega.ai/agent-swarm - Versions diffs - 1.85.0 → 1.87.0 - Mend

@desplega.ai/agent-swarm 1.85.0 → 1.87.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (129)

package/README.md +1 -0
package/openapi.json +72 -1
package/package.json +10 -6
package/src/be/db-queries/tracker.ts +21 -0
package/src/be/db.ts +279 -14
package/src/be/migrations/078_backfill_gpt_5_5_pricing.sql +15 -0
package/src/be/migrations/079_task_followup_config.sql +1 -0
package/src/be/modelsdev-cache.json +155618 -0
package/src/be/modelsdev-cache.ts +46 -0
package/src/be/seed-pricing.ts +7 -44
package/src/cli.tsx +38 -2
package/src/commands/codex-session-runner.ts +132 -0
package/src/commands/context-preamble.ts +272 -0
package/src/commands/credential-wait.ts +2 -2
package/src/commands/e2b.ts +728 -0
package/src/commands/provider-credentials.ts +10 -5
package/src/commands/resume-session.ts +35 -78
package/src/commands/runner.ts +128 -16
package/src/e2b/dispatch.ts +429 -0
package/src/e2b/env.ts +206 -0
package/src/heartbeat/heartbeat.ts +145 -30
package/src/heartbeat/templates.ts +11 -7
package/src/http/session-data.ts +8 -1
package/src/http/tasks.ts +152 -3
package/src/jira/sync.ts +4 -4
package/src/linear/sync.ts +6 -5
package/src/prompts/base-prompt.ts +49 -3
package/src/providers/claude-adapter.ts +76 -61
package/src/providers/claude-managed-adapter.ts +61 -75
package/src/providers/claude-managed-models.ts +18 -2
package/src/providers/codex-adapter.ts +429 -112
package/src/providers/codex-models.ts +9 -2
package/src/providers/codex-oauth/auth-json.ts +18 -1
package/src/providers/codex-oauth/flow.ts +24 -1
package/src/providers/index.ts +28 -19
package/src/providers/pricing-sources.md +7 -4
package/src/providers/swarm-events-shared.ts +14 -0
package/src/providers/types.ts +6 -0
package/src/slack/HEURISTICS.md +5 -1
package/src/slack/handlers.test.ts +35 -0
package/src/slack/handlers.ts +79 -2
package/src/tasks/worker-follow-up.ts +162 -2
package/src/telemetry.ts +11 -1
package/src/tests/base-prompt.test.ts +46 -8
package/src/tests/claude-adapter.test.ts +5 -27
package/src/tests/claude-managed-adapter.test.ts +42 -56
package/src/tests/codex-adapter-otel.test.ts +4 -4
package/src/tests/codex-adapter.test.ts +25 -37
package/src/tests/codex-oauth.test.ts +149 -3
package/src/tests/codex-pool.test.ts +14 -3
package/src/tests/codex-swarm-events.test.ts +35 -0
package/src/tests/context-window.test.ts +1 -0
package/src/tests/credential-check.test.ts +48 -29
package/src/tests/e2b-dispatch.test.ts +330 -0
package/src/tests/entrypoint-config-env-export.test.ts +81 -0
package/src/tests/follow-up-redelivery-guard.test.ts +165 -0
package/src/tests/heartbeat-supersede-resume.test.ts +285 -0
package/src/tests/heartbeat.test.ts +26 -16
package/src/tests/migration-046-budgets.test.ts +6 -5
package/src/tests/pricing-routes.test.ts +6 -5
package/src/tests/prompt-template-remaining.test.ts +4 -0
package/src/tests/provider-adapter.test.ts +10 -10
package/src/tests/provider-command-format.test.ts +4 -4
package/src/tests/resume-session.test.ts +42 -50
package/src/tests/session-costs-codex-recompute.test.ts +25 -0
package/src/tests/structured-output.test.ts +69 -0
package/src/tests/task-completion-idempotency.test.ts +185 -2
package/src/tests/task-supersede-resume.test.ts +722 -0
package/src/tests/telemetry-init.test.ts +69 -0
package/src/tests/vcs-tracking.test.ts +39 -0
package/src/tools/send-task.ts +42 -10
package/src/tools/store-progress.ts +2 -2
package/src/tools/templates.ts +14 -2
package/src/types.ts +46 -1
package/src/utils/context-window.ts +1 -0
package/src/workflows/executors/agent-task.ts +3 -0
package/templates/schedules/daily-blocker-digest/config.json +13 -0
package/templates/schedules/daily-blocker-digest/content.md +150 -0
package/templates/schedules/daily-compounding-reflection/config.json +21 -0
package/templates/schedules/daily-compounding-reflection/content.md +210 -0
package/templates/schedules/daily-hn-briefing/config.json +13 -0
package/templates/schedules/daily-hn-briefing/content.md +97 -0
package/templates/schedules/daily-workflow-health-audit/config.json +13 -0
package/templates/schedules/daily-workflow-health-audit/content.md +189 -0
package/templates/schedules/gtm-weekly-review/config.json +13 -0
package/templates/schedules/gtm-weekly-review/content.md +58 -0
package/templates/schedules/weekly-dependabot-triage/config.json +13 -0
package/templates/schedules/weekly-dependabot-triage/content.md +45 -0
package/templates/schema.ts +26 -0
package/templates/skills/agentmail-sending/config.json +13 -0
package/templates/skills/agentmail-sending/content.md +48 -0
package/templates/skills/artifacts/config.json +13 -0
package/templates/skills/artifacts/content.md +87 -0
package/templates/skills/browser-use-cloud/config.json +13 -0
package/templates/skills/browser-use-cloud/content.md +155 -0
package/templates/skills/desloppify/config.json +13 -0
package/templates/skills/desloppify/content.md +201 -0
package/templates/skills/exa-search/config.json +13 -0
package/templates/skills/exa-search/content.md +106 -0
package/templates/skills/jira-interaction/config.json +13 -0
package/templates/skills/jira-interaction/content.md +252 -0
package/templates/skills/kapso-whatsapp/config.json +13 -0
package/templates/skills/kapso-whatsapp/content.md +369 -0
package/templates/skills/kv-storage/config.json +13 -0
package/templates/skills/kv-storage/content.md +111 -0
package/templates/skills/linear-interaction/config.json +20 -0
package/templates/skills/linear-interaction/content.md +230 -0
package/templates/skills/pages/config.json +18 -0
package/templates/skills/pages/content.md +85 -0
package/templates/skills/profile-corruption-escalation/config.json +13 -0
package/templates/skills/profile-corruption-escalation/content.md +105 -0
package/templates/skills/scheduled-task-resilience/config.json +13 -0
package/templates/skills/scheduled-task-resilience/content.md +95 -0
package/templates/skills/sprite-cli/config.json +13 -0
package/templates/skills/sprite-cli/content.md +133 -0
package/templates/skills/turso-interaction/config.json +13 -0
package/templates/skills/turso-interaction/content.md +192 -0
package/templates/skills/workflow-iterate/config.json +18 -0
package/templates/skills/workflow-iterate/content.md +399 -0
package/templates/skills/workflow-structured-output/config.json +13 -0
package/templates/skills/workflow-structured-output/content.md +101 -0
package/templates/skills/x-api-interactions/config.json +13 -0
package/templates/skills/x-api-interactions/content.md +109 -0
package/templates/workflows/autopilot/config.json +13 -0
package/templates/workflows/autopilot/content.md +58 -0
package/templates/workflows/linear-drain-loop/config.json +21 -0
package/templates/workflows/linear-drain-loop/content.md +72 -0
package/templates/workflows/ralph-loop/config.json +13 -0
package/templates/workflows/ralph-loop/content.md +75 -0

package/README.md CHANGED Viewed

@@ -124,6 +124,7 @@ Check [our templates](https://templates.agent-swarm.dev) for a quick start.
 - **Workflow engine with Human-in-the-Loop** — DAG-based automation with approval gates, retries, and structured I/O. [Workflows →](https://docs.agent-swarm.dev/docs/concepts/workflows)
 - **Scheduled & recurring tasks** — cron-based automation for standing work. [Scheduling →](https://docs.agent-swarm.dev/docs/concepts/scheduling)
 - **Harness & LLM agnostic** — run with Claude Code, OpenAI Codex, pi-mono, Devin, Claude Managed Agents, raw LLMs, or opencode. [Harness config →](https://docs.agent-swarm.dev/docs/guides/harness-configuration) · [Add a new provider →](https://docs.agent-swarm.dev/docs/guides/harness-providers)
+- **Follow-up continuity across all harnesses** — child tasks inherit bounded prior-task context even on providers without native session resume, while resumable providers still reuse prior sessions when possible. [Task lifecycle →](https://docs.agent-swarm.dev/docs/concepts/task-lifecycle)
 - **Skills & MCP servers** — reusable procedural knowledge and per-agent MCP servers with scope cascade. [MCP tools →](https://docs.agent-swarm.dev/docs/reference/mcp-tools)
 - **DB-backed pages** — agents publish HTML or JSON pages (reports, dashboards, action specs) via the `create_page` MCP tool with public / authed / password modes, version history, view counters, diff helpers, and PDF export. [MCP tools → Pages](https://docs.agent-swarm.dev/docs/reference/mcp-tools#pages-tools)
 - **KV store** — Redis-like namespaced key/value store with auto-scoped context (Slack thread / PR / Linear issue / page). [MCP tools → KV](https://docs.agent-swarm.dev/docs/reference/mcp-tools#kv-tools)

package/openapi.json CHANGED Viewed

@@ -2,7 +2,7 @@
   "openapi": "3.1.0",
   "info": {
     "title": "Agent Swarm API",
-    "version": "1.85.0",
+    "version": "1.87.0",
     "description": "Multi-agent orchestration API for Claude Code, Codex, and Gemini CLI. Enables task distribution, agent communication, and service discovery.\n\nMCP tools are documented separately in [MCP.md](./MCP.md)."
   },
   "servers": [
@@ -7139,6 +7139,16 @@
             "required": true,
             "name": "taskId",
             "in": "path"
+          },
+          {
+            "schema": {
+              "type": "integer",
+              "minimum": 1,
+              "maximum": 1000
+            },
+            "required": false,
+            "name": "limit",
+            "in": "query"
           }
         ],
         "responses": {
@@ -10114,6 +10124,67 @@
         }
       }
     },
+    "/api/tasks/{id}/supersede": {
+      "post": {
+        "summary": "Supersede an in-progress task (terminate + spawn resume follow-up)",
+        "description": "Marks the original task `superseded` (terminal) and creates a fresh `taskType=\"resume\"` follow-up so a worker can pick up the work in a new provider session. Workflow-step tasks (those with `workflowRunStepId`) are carved out: the original is marked `failed` with reason `superseded_workflow_task` and no follow-up is created — the workflow engine's retry/failure policy applies.",
+        "tags": [
+          "Tasks"
+        ],
+        "security": [
+          {
+            "bearerAuth": []
+          }
+        ],
+        "parameters": [
+          {
+            "schema": {
+              "type": "string"
+            },
+            "required": true,
+            "name": "id",
+            "in": "path"
+          }
+        ],
+        "requestBody": {
+          "content": {
+            "application/json": {
+              "schema": {
+                "type": "object",
+                "properties": {
+                  "reason": {
+                    "type": "string",
+                    "enum": [
+                      "graceful_shutdown",
+                      "context_limits",
+                      "manual_supersede",
+                      "crash_recovery"
+                    ]
+                  }
+                },
+                "required": [
+                  "reason"
+                ]
+              }
+            }
+          }
+        },
+        "responses": {
+          "200": {
+            "description": "Task superseded (or workflow-failed)"
+          },
+          "400": {
+            "description": "Task not in_progress"
+          },
+          "403": {
+            "description": "Task belongs to another agent"
+          },
+          "404": {
+            "description": "Task not found"
+          }
+        }
+      }
+    },
     "/api/tasks/{id}/vcs": {
       "patch": {
         "summary": "Update VCS (PR/MR) info for a task",

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@desplega.ai/agent-swarm",
-  "version": "1.85.0",
+  "version": "1.87.0",
   "description": "Multi-agent orchestration for Claude Code, Codex, Gemini CLI, and other AI coding assistants",
   "license": "MIT",
   "author": "desplega.sh <contact@desplega.sh>",
@@ -45,6 +45,9 @@
     "tsc:check": "bun tsc --noEmit",
     "check:db-boundary": "bash scripts/check-db-boundary.sh",
     "check:api-key-boundary": "bash scripts/check-api-key-boundary.sh",
+    "prepare-release": "bun scripts/prepare-release.ts",
+    "sync-chart-version": "bun scripts/sync-chart-version.ts",
+    "check-chart-version": "bun scripts/sync-chart-version.ts --check-if-package-version-changed",
     "cli": "bun src/cli.tsx",
     "hook": "bun src/hooks/hook.ts",
     "claude": "bun src/cli.tsx claude",
@@ -108,12 +111,12 @@
     "@desplega.ai/localtunnel": "^2.2.0",
     "@inkjs/ui": "^2.0.0",
     "@linear/sdk": "^77.0.0",
-    "@earendil-works/pi-agent-core": "^0.75.5",
-    "@earendil-works/pi-ai": "^0.75.5",
-    "@earendil-works/pi-coding-agent": "^0.75.5",
+    "@earendil-works/pi-agent-core": "^0.76.0",
+    "@earendil-works/pi-ai": "^0.76.0",
+    "@earendil-works/pi-coding-agent": "^0.76.0",
     "@modelcontextprotocol/sdk": "^1.25.1",
-    "@openai/codex-sdk": "^0.133.0",
-    "@opencode-ai/sdk": "^1.15.10",
+    "@openai/codex-sdk": "^0.135.0",
+    "@opencode-ai/sdk": "^1.15.12",
     "@openfort/openfort-node": "^0.9.1",
     "@opentelemetry/api": "^1.9.1",
     "@opentelemetry/exporter-trace-otlp-http": "^0.218.0",
@@ -128,6 +131,7 @@
     "ai": "^6.0.116",
     "cron-parser": "^5.4.0",
     "date-fns": "^4.1.0",
+    "e2b": "2.26.0",
     "hono": "^4.12.3",
     "ink": "^6.5.1",
     "oauth4webapi": "^3.8.5",

package/src/be/db-queries/tracker.ts CHANGED Viewed

@@ -110,6 +110,27 @@ export function updateTrackerSyncSwarmId(id: string, swarmId: string): void {
   getDb().query("UPDATE tracker_sync SET swarmId = ? WHERE id = ?").run(swarmId, id);
 }
+/**
+ * Repoint ALL `tracker_sync` rows currently keyed to `oldSwarmId` to
+ * `newSwarmId`. Returns the number of rows updated.
+ *
+ * Used when a task is superseded (PR #594): the supersede parent becomes
+ * terminal but the Linear/Jira issue is still active, and outbound
+ * completion posts + inbound webhooks lookup by swarmId. Without
+ * repointing, the resume child's completion never makes it back to the
+ * tracker and subsequent inbound events load the terminal parent and
+ * create duplicates.
+ *
+ * Safe to call when no rows match (no-op, returns 0). Repoints across
+ * all providers (Linear AND Jira) and all entity types in one call.
+ */
+export function repointTrackerSyncBySwarmId(oldSwarmId: string, newSwarmId: string): number {
+  const result = getDb()
+    .query("UPDATE tracker_sync SET swarmId = ? WHERE swarmId = ?")
+    .run(newSwarmId, oldSwarmId);
+  return Number(result.changes ?? 0);
+}
 export function createTrackerSync(data: {
   provider: string;
   entityType: "task";

package/src/be/db.ts CHANGED Viewed

@@ -29,6 +29,7 @@ import type {
   ContextSnapshotEventType,
   ContextVersion,
   CooldownConfig,
+  FollowUpConfig,
   InboxItemState,
   InboxItemStatus,
   InboxItemType,
@@ -87,6 +88,7 @@ import type {
   WorkflowSummary,
   WorkflowVersion,
 } from "../types";
+import { FollowUpConfigSchema, isTerminalTaskStatus } from "../types";
 import { deriveProviderFromKeyType } from "../utils/credentials";
 import { scrubSecrets } from "../utils/secret-scrubber";
 import { decryptSecret, encryptSecret, getEncryptionKey, resolveEncryptionKey } from "./crypto";
@@ -993,6 +995,7 @@ type AgentTaskRow = {
   workflowRunId: string | null;
   workflowRunStepId: string | null;
   outputSchema: string | null;
+  followUpConfig: string | null;
   contextKey: string | null;
   createdAt: string;
   lastUpdatedAt: string;
@@ -1016,6 +1019,27 @@ type AgentTaskRow = {
 };
 function rowToAgentTask(row: AgentTaskRow): AgentTask {
+  let followUpConfig: FollowUpConfig | undefined;
+  if (row.followUpConfig) {
+    try {
+      const parsed = FollowUpConfigSchema.safeParse(JSON.parse(row.followUpConfig));
+      if (parsed.success) {
+        followUpConfig = parsed.data;
+      } else {
+        console.warn(
+          `[db] Ignoring invalid agent_tasks.followUpConfig for task ${row.id}:`,
+          parsed.error.message,
+        );
+      }
+    } catch (error) {
+      console.warn(
+        `[db] Ignoring malformed agent_tasks.followUpConfig for task ${row.id}:`,
+        error instanceof Error ? error.message : String(error),
+      );
+      followUpConfig = undefined;
+    }
+  }
   return {
     id: row.id,
     agentId: row.agentId,
@@ -1057,6 +1081,7 @@ function rowToAgentTask(row: AgentTaskRow): AgentTask {
     workflowRunId: row.workflowRunId ?? undefined,
     workflowRunStepId: row.workflowRunStepId ?? undefined,
     outputSchema: row.outputSchema ? JSON.parse(row.outputSchema) : undefined,
+    followUpConfig,
     contextKey: row.contextKey ?? undefined,
     compactionCount: row.compactionCount ?? undefined,
     peakContextPercent: row.peakContextPercent ?? undefined,
@@ -1173,7 +1198,7 @@ export const taskQueries = {
   setProgress: () =>
     getDb().prepare<AgentTaskRow, [string, string]>(
       `UPDATE agent_tasks SET progress = ?,
-       status = CASE WHEN status IN ('completed', 'failed', 'cancelled') THEN status ELSE 'in_progress' END,
+       status = CASE WHEN status IN ('completed', 'failed', 'cancelled', 'superseded') THEN status ELSE 'in_progress' END,
        lastUpdatedAt = strftime('%Y-%m-%dT%H:%M:%fZ', 'now')
        WHERE id = ? RETURNING *`,
     ),
@@ -1244,14 +1269,14 @@ export function startTask(taskId: string): AgentTask | null {
   if (!oldTask) return null;
   // Guard: never revive tasks that are already in a terminal state
-  if (["completed", "failed", "cancelled"].includes(oldTask.status)) {
+  if (isTerminalTaskStatus(oldTask.status)) {
     return null;
   }
   const row = getDb()
     .prepare<AgentTaskRow, [string]>(
       `UPDATE agent_tasks SET status = 'in_progress', lastUpdatedAt = strftime('%Y-%m-%dT%H:%M:%fZ', 'now')
-       WHERE id = ? AND status NOT IN ('completed', 'failed', 'cancelled') RETURNING *`,
+       WHERE id = ? AND status NOT IN ('completed', 'failed', 'cancelled', 'superseded') RETURNING *`,
     )
     .get(taskId);
   if (row && oldTask) {
@@ -1291,6 +1316,31 @@ export function getChildTasks(parentTaskId: string): AgentTask[] {
     .map(rowToAgentTask);
 }
+/**
+ * Returns true if `parentId` has at least one non-terminal child task with
+ * `taskType = 'resume'`. Used by the heartbeat sweep as an idempotency guard:
+ * if a prior sweep tick already created a resume follow-up for this parent,
+ * don't create a duplicate.
+ *
+ * **Filters by taskType = 'resume'** specifically. A parent task can also
+ * have ordinary non-terminal delegation children (`send-task` auto-defaults
+ * `parentTaskId` to the caller's current task — see src/tools/send-task.ts).
+ * Treating those as "already resumed" would incorrectly skip the resume
+ * path for a crashed worker that had delegated subtasks (PR #594 review).
+ */
+export function hasNonTerminalResumeChild(parentId: string): boolean {
+  const row = getDb()
+    .prepare(
+      `SELECT 1 FROM agent_tasks
+       WHERE parentTaskId = ?
+         AND taskType = 'resume'
+         AND status NOT IN ('completed', 'failed', 'cancelled', 'superseded')
+       LIMIT 1`,
+    )
+    .get(parentId);
+  return row !== undefined && row !== null;
+}
 export function updateTaskClaudeSessionId(
   taskId: string,
   claudeSessionId: string,
@@ -1370,14 +1420,18 @@ export function getTasksByStatus(status: AgentTaskStatus): AgentTask[] {
 /**
  * Find a task by VCS repo and issue/PR/MR number.
- * Returns the most recent non-completed/failed task for this VCS entity.
+ * Returns the most recent non-terminal task for this VCS entity.
+ *
+ * Terminal exclusion MUST stay in lock-step with `TERMINAL_TASK_STATUSES`
+ * in `src/types.ts`. SQL strings can't import a TS const — if you add a
+ * new terminal status, grep for `NOT IN ('completed'` across this file.
  */
 export function findTaskByVcs(vcsRepo: string, vcsNumber: number): AgentTask | null {
   const row = getDb()
     .prepare<AgentTaskRow, [string, number]>(
       `SELECT * FROM agent_tasks
        WHERE vcsRepo = ? AND vcsNumber = ?
-       AND status NOT IN ('completed', 'failed')
+       AND status NOT IN ('completed', 'failed', 'cancelled', 'superseded')
        ORDER BY createdAt DESC
        LIMIT 1`,
     )
@@ -1875,6 +1929,50 @@ export function findCompletedTaskInThread(
   return row ? rowToAgentTask(row) : null;
 }
+/**
+ * Find the most recent CANCELLED task in a Slack thread. Used by the
+ * follow-up re-delegation guard so a cancellation (worker SIGTERM,
+ * runner-side abort, swarm-events tool-loop abort) doesn't permanently
+ * jam re-dispatch when an earlier sibling task in the same thread also
+ * completed.
+ *
+ * Matches both:
+ *   - `status = 'cancelled'` (the canonical terminal state from cancelTask)
+ *   - `status = 'failed'` with a failureReason that starts with "cancelled"
+ *     or "exit 130" or contains "cancelled" (the codex-adapter abort path
+ *     emits `failureReason: "cancelled"` and exits 130).
+ */
+export function findRecentCancelledTaskInThread(
+  channelId: string,
+  threadTs: string,
+  windowMinutes: number,
+): AgentTask | null {
+  const since = new Date(Date.now() - windowMinutes * 60 * 1000).toISOString();
+  const row = getDb()
+    .prepare<AgentTaskRow, [string, string, string]>(
+      `SELECT * FROM agent_tasks
+       WHERE slackChannelId = ?
+       AND slackThreadTs = ?
+       AND lastUpdatedAt > ?
+       AND (
+         status = 'cancelled'
+         OR (
+           status = 'failed'
+           AND failureReason IS NOT NULL
+           AND (
+             failureReason LIKE 'cancelled%'
+             OR failureReason LIKE 'exit 130%'
+             OR failureReason LIKE '%cancelled%'
+           )
+         )
+       )
+       ORDER BY lastUpdatedAt DESC
+       LIMIT 1`,
+    )
+    .get(channelId, threadTs, since);
+  return row ? rowToAgentTask(row) : null;
+}
 export function completeTask(id: string, output?: string): AgentTask | null {
   const oldTask = getTaskById(id);
   if (!oldTask) return null;
@@ -1882,7 +1980,7 @@ export function completeTask(id: string, output?: string): AgentTask | null {
   // Idempotency guard: don't re-complete a task already in a terminal state.
   // Mirrors cancelTask. Prevents duplicate task.completed events, duplicate
   // log entries, and duplicate follow-up tasks when multiple sessions race.
-  if (["completed", "failed", "cancelled"].includes(oldTask.status)) {
+  if (isTerminalTaskStatus(oldTask.status)) {
     return null;
   }
@@ -1927,7 +2025,7 @@ export function failTask(id: string, reason: string): AgentTask | null {
   // Idempotency guard: don't re-fail a task already in a terminal state.
   // Mirrors cancelTask / completeTask. Prevents duplicate task.failed events
   // and duplicate follow-up tasks when multiple sessions race.
-  if (["completed", "failed", "cancelled"].includes(oldTask.status)) {
+  if (isTerminalTaskStatus(oldTask.status)) {
     return null;
   }
@@ -1964,8 +2062,7 @@ export function cancelTask(id: string, reason?: string): AgentTask | null {
   if (!oldTask) return null;
   // Only cancel tasks that are not already in a terminal state
-  const terminalStatuses = ["completed", "failed", "cancelled"];
-  if (terminalStatuses.includes(oldTask.status)) {
+  if (isTerminalTaskStatus(oldTask.status)) {
     return null;
   }
@@ -1999,6 +2096,69 @@ export function cancelTask(id: string, reason?: string): AgentTask | null {
   return row ? rowToAgentTask(row) : null;
 }
+/**
+ * Supersede a task: mark it as `superseded` (terminal) so a fresh "resume"
+ * follow-up task can pick up where it left off. Used by the graceful-shutdown
+ * path and the `POST /api/tasks/:id/supersede` route. Returns null if the task
+ * is already terminal (mirrors `completeTask` / `cancelTask` idempotency).
+ *
+ * Writes a `task_superseded` agent_log with `{ reason, resumeTaskId }` payload
+ * and emits a `task.superseded` workflow event. The caller is responsible for
+ * creating the resume follow-up (via `createResumeFollowUp`) and passing the
+ * resulting id as `resumeTaskId`.
+ */
+export function supersedeTask(
+  id: string,
+  args: { reason: string; resumeTaskId: string | null },
+): AgentTask | null {
+  const oldTask = getTaskById(id);
+  if (!oldTask) return null;
+  // Idempotency guard: don't re-supersede a task already in a terminal state.
+  if (isTerminalTaskStatus(oldTask.status)) {
+    return null;
+  }
+  const finishedAt = new Date().toISOString();
+  const row = getDb()
+    .prepare<AgentTaskRow, [string, string]>(
+      `UPDATE agent_tasks
+       SET status = 'superseded',
+           finishedAt = ?,
+           lastUpdatedAt = strftime('%Y-%m-%dT%H:%M:%fZ', 'now')
+       WHERE id = ? AND status NOT IN ('completed', 'failed', 'cancelled', 'superseded')
+       RETURNING *`,
+    )
+    .get(finishedAt, id);
+  if (row && oldTask) {
+    try {
+      createLogEntry({
+        eventType: "task_superseded",
+        taskId: id,
+        agentId: row.agentId ?? undefined,
+        oldValue: oldTask.status,
+        newValue: "superseded",
+        metadata: { reason: args.reason, resumeTaskId: args.resumeTaskId },
+      });
+    } catch {}
+    try {
+      import("../workflows/event-bus").then(({ workflowEventBus }) => {
+        workflowEventBus.emit("task.superseded", {
+          taskId: id,
+          reason: args.reason,
+          resumeTaskId: args.resumeTaskId,
+          agentId: row.agentId,
+          workflowRunId: row.workflowRunId,
+          workflowRunStepId: row.workflowRunStepId,
+        });
+      });
+    } catch {}
+  }
+  return row ? rowToAgentTask(row) : null;
+}
 /**
  * Pause a task that is currently in progress.
  * Used during graceful shutdown to allow tasks to resume after container restart.
@@ -2516,6 +2676,7 @@ export interface CreateTaskOptions {
    * a schema'd task should be defensive about JSON parsing.
    */
   outputSchema?: Record<string, unknown>;
+  followUpConfig?: FollowUpConfig;
   requestedByUserId?: string;
   contextKey?: string;
 }
@@ -2534,8 +2695,9 @@ export function findRecentSimilarTasks(opts: {
   const conditions: string[] = ["createdAt > ?"];
   const params: (string | number)[] = [since];
-  // Exclude completed/failed/cancelled tasks — only active or recently created
-  conditions.push("status NOT IN ('completed', 'failed', 'cancelled')");
+  // Exclude all terminal statuses — only active or recently created.
+  // Keep in lock-step with `TERMINAL_TASK_STATUSES` in src/types.ts.
+  conditions.push("status NOT IN ('completed', 'failed', 'cancelled', 'superseded')");
   if (opts.creatorAgentId) {
     conditions.push("creatorAgentId = ?");
@@ -2570,6 +2732,16 @@ export function createTaskExtended(task: string, options?: CreateTaskOptions): A
   if (options?.parentTaskId) {
     const parent = getTaskById(options.parentTaskId);
     if (parent) {
+      // Identity & routing — anything that says "what work is this, who asked
+      // for it, where does it run" carries forward to every child (follow-ups,
+      // reboot retries, resume tasks). Explicit options always win.
+      //
+      // When adding a new identity-shaped column to `agent_tasks`, ADD IT HERE
+      // unless you have a specific reason a child should NOT inherit it. This
+      // is the single source of truth — `createResumeFollowUp` and the other
+      // follow-up creators rely on this block instead of re-listing fields.
+      // Slack context
       if (parent.slackChannelId && !options.slackChannelId) {
         options.slackChannelId = parent.slackChannelId;
       }
@@ -2579,18 +2751,98 @@ export function createTaskExtended(task: string, options?: CreateTaskOptions): A
       if (parent.slackUserId && !options.slackUserId) {
         options.slackUserId = parent.slackUserId;
       }
+      // AgentMail context
       if (parent.agentmailInboxId && !options.agentmailInboxId) {
         options.agentmailInboxId = parent.agentmailInboxId;
       }
+      if (parent.agentmailMessageId && !options.agentmailMessageId) {
+        options.agentmailMessageId = parent.agentmailMessageId;
+      }
       if (parent.agentmailThreadId && !options.agentmailThreadId) {
         options.agentmailThreadId = parent.agentmailThreadId;
       }
+      // Mention context (Slack @-mentions)
+      if (parent.mentionMessageId && !options.mentionMessageId) {
+        options.mentionMessageId = parent.mentionMessageId;
+      }
+      if (parent.mentionChannelId && !options.mentionChannelId) {
+        options.mentionChannelId = parent.mentionChannelId;
+      }
+      // VCS identity (GitHub / GitLab issue / PR / MR + webhook routing)
+      // Webhook handlers locate active work via `findTaskByVcs(repo, number)`,
+      // so a resume / follow-up child MUST carry the full VCS identity or
+      // subsequent review/update events get dropped.
+      if (parent.vcsProvider && !options.vcsProvider) {
+        options.vcsProvider = parent.vcsProvider;
+      }
+      if (parent.vcsRepo && !options.vcsRepo) {
+        options.vcsRepo = parent.vcsRepo;
+      }
+      if (parent.vcsNumber != null && options.vcsNumber == null) {
+        options.vcsNumber = parent.vcsNumber;
+      }
+      if (parent.vcsEventType && !options.vcsEventType) {
+        options.vcsEventType = parent.vcsEventType;
+      }
+      if (parent.vcsCommentId != null && options.vcsCommentId == null) {
+        options.vcsCommentId = parent.vcsCommentId;
+      }
+      if (parent.vcsAuthor && !options.vcsAuthor) {
+        options.vcsAuthor = parent.vcsAuthor;
+      }
+      if (parent.vcsUrl && !options.vcsUrl) {
+        options.vcsUrl = parent.vcsUrl;
+      }
+      if (parent.vcsInstallationId != null && options.vcsInstallationId == null) {
+        options.vcsInstallationId = parent.vcsInstallationId;
+      }
+      if (parent.vcsNodeId && !options.vcsNodeId) {
+        options.vcsNodeId = parent.vcsNodeId;
+      }
+      // Execution context (per-task overrides)
+      //
+      // `model` is DELIBERATELY NOT inherited. A parent task's `model` is a
+      // concrete, provider-specific resolved string (e.g. `claude-opus-4-8`,
+      // `openrouter/moonshotai/kimi-k2.6`). Derived tasks (resume follow-ups,
+      // completion/review follow-ups, re-dispatches) routinely land on a
+      // DIFFERENT agent — and therefore a different harness/provider — than the
+      // parent. Carrying the parent's concrete model across that boundary makes
+      // the child die at session-init with a model-incompatibility error before
+      // any worker code runs (e.g. a `claude-opus-4-8` resume claimed by a Codex
+      // worker → `400 model is not supported when using Codex`, or a
+      // `kimi-k2.6` review follow-up routed to a Claude-harness Lead → session
+      // exit 1). Per Taras's directive (2026-05-29): derived tasks must never
+      // set the model — it resolves from the ASSIGNEE agent's own provider /
+      // `MODEL_OVERRIDE` config at session-init (see
+      // `src/commands/runner.ts` — `opts.model || configModel`). A null `model`
+      // here is the correct, intended state. Do NOT re-add inheritance here; if
+      // a same-provider child genuinely needs a specific model, the creator must
+      // pass it explicitly.
+      if (parent.dir && !options.dir) {
+        options.dir = parent.dir;
+      }
+      // Contract (schema validation) — `store-progress` validates completion
+      // output against `outputSchema`, runner injects structured-output
+      // instructions only when it's present.
+      if (parent.outputSchema && !options.outputSchema) {
+        options.outputSchema = parent.outputSchema;
+      }
+      // Attribution
       if (parent.requestedByUserId && !options.requestedByUserId) {
         options.requestedByUserId = parent.requestedByUserId;
       }
       if (parent.contextKey && !options.contextKey) {
         options.contextKey = parent.contextKey;
       }
+      if (parent.followUpConfig && !options.followUpConfig) {
+        options.followUpConfig = parent.followUpConfig;
+      }
     }
   }
@@ -2616,8 +2868,8 @@ export function createTaskExtended(task: string, options?: CreateTaskOptions): A
         vcsInstallationId, vcsNodeId,
         agentmailInboxId, agentmailMessageId, agentmailThreadId,
         mentionMessageId, mentionChannelId, dir, parentTaskId, model, scheduleId,
-        workflowRunId, workflowRunStepId, outputSchema, requestedByUserId, contextKey, swarmVersion, createdAt, lastUpdatedAt
-      ) VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?) RETURNING *`,
+        workflowRunId, workflowRunStepId, outputSchema, followUpConfig, requestedByUserId, contextKey, swarmVersion, createdAt, lastUpdatedAt
+      ) VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?) RETURNING *`,
     )
     .get(
       id,
@@ -2656,6 +2908,7 @@ export function createTaskExtended(task: string, options?: CreateTaskOptions): A
       options?.workflowRunId ?? null,
       options?.workflowRunStepId ?? null,
       options?.outputSchema ? JSON.stringify(options.outputSchema) : null,
+      options?.followUpConfig ? JSON.stringify(options.followUpConfig) : null,
       options?.requestedByUserId ?? null,
       options?.contextKey ?? null,
       pkg.version,
@@ -3973,6 +4226,15 @@ export const sessionLogQueries = {
       "SELECT * FROM session_logs WHERE taskId = ? ORDER BY iteration ASC, lineNumber ASC",
     ),
+  getRecentByTaskId: () =>
+    getDb().prepare<SessionLogRow, [string, number]>(
+      `SELECT * FROM (
+         SELECT * FROM session_logs WHERE taskId = ?
+         ORDER BY iteration DESC, lineNumber DESC
+         LIMIT ?
+       ) ORDER BY iteration ASC, lineNumber ASC`,
+    ),
   getBySessionId: () =>
     getDb().prepare<SessionLogRow, [string, number]>(
       "SELECT * FROM session_logs WHERE sessionId = ? AND iteration = ? ORDER BY lineNumber ASC",
@@ -4008,7 +4270,10 @@ export function createSessionLogs(logs: {
   })();
 }
-export function getSessionLogsByTaskId(taskId: string): SessionLog[] {
+export function getSessionLogsByTaskId(taskId: string, limit?: number): SessionLog[] {
+  if (typeof limit === "number" && limit > 0) {
+    return sessionLogQueries.getRecentByTaskId().all(taskId, limit).map(rowToSessionLog);
+  }
   return sessionLogQueries.getByTaskId().all(taskId).map(rowToSessionLog);
 }

package/src/be/migrations/078_backfill_gpt_5_5_pricing.sql ADDED Viewed

@@ -0,0 +1,15 @@
+-- 078_backfill_gpt_5_5_pricing.sql
+-- Backfill Codex GPT-5.5 pricing into existing databases.
+--
+-- The vendored models.dev cache already contains gpt-5.5, and fresh server
+-- boots seed it from src/be/seed-pricing.ts. Existing long-lived DBs can still
+-- be missing those rows, which makes real gpt-5.5 Codex runs land as
+-- costSource='unpriced'. Keep this migration idempotent so every environment
+-- gets the baseline Standard-tier rates.
+INSERT OR IGNORE INTO pricing
+  (provider, model, token_class, effective_from, price_per_million_usd, createdAt, lastUpdatedAt)
+VALUES
+  ('codex', 'gpt-5.5', 'input',        0, 5.0,  0, 0),
+  ('codex', 'gpt-5.5', 'cached_input', 0, 0.5,  0, 0),
+  ('codex', 'gpt-5.5', 'output',       0, 30.0, 0, 0);

package/src/be/migrations/079_task_followup_config.sql ADDED Viewed

@@ -0,0 +1 @@
+ALTER TABLE agent_tasks ADD COLUMN followUpConfig TEXT;