npm - vellum - Versions diffs - 0.2.0 → 0.2.2 - Mend

vellum 0.2.0 → 0.2.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (361)

package/README.md +15 -2
package/bun.lock +5 -2
package/package.json +4 -2
package/scripts/capture-x-graphql.ts +562 -0
package/scripts/ipc/check-swift-decoder-drift.ts +2 -1
package/scripts/test.sh +5 -0
package/src/__tests__/__snapshots__/ipc-snapshot.test.ts.snap +161 -34
package/src/__tests__/account-registry.test.ts +2 -1
package/src/__tests__/agent-heartbeat-service.test.ts +250 -0
package/src/__tests__/app-bundler.test.ts +12 -33
package/src/__tests__/asset-materialize-tool.test.ts +16 -15
package/src/__tests__/asset-search-tool.test.ts +23 -22
package/src/__tests__/attachments-store.test.ts +56 -127
package/src/__tests__/browser-skill-baseline-tool-payload.test.ts +5 -4
package/src/__tests__/browser-skill-endstate.test.ts +5 -8
package/src/__tests__/call-bridge.test.ts +385 -0
package/src/__tests__/call-constants.test.ts +40 -0
package/src/__tests__/call-orchestrator.test.ts +454 -0
package/src/__tests__/call-recovery.test.ts +518 -0
package/src/__tests__/call-routes-http.test.ts +459 -0
package/src/__tests__/call-state-machine.test.ts +143 -0
package/src/__tests__/call-state.test.ts +133 -0
package/src/__tests__/call-store.test.ts +691 -0
package/src/__tests__/cli-discover.test.ts +1 -1
package/src/__tests__/commit-message-enrichment-service.test.ts +550 -0
package/src/__tests__/compaction.benchmark.test.ts +176 -0
package/src/__tests__/computer-use-tools.test.ts +250 -0
package/src/__tests__/config-schema.test.ts +348 -3
package/src/__tests__/conflict-store.test.ts +2 -1
package/src/__tests__/contacts-tools.test.ts +331 -0
package/src/__tests__/conversation-store.test.ts +30 -32
package/src/__tests__/credential-security-invariants.test.ts +4 -0
package/src/__tests__/date-context.test.ts +373 -0
package/src/__tests__/db-schedule-syntax-migration.test.ts +129 -0
package/src/__tests__/doordash-session.test.ts +9 -0
package/src/__tests__/fixtures/media-reuse-fixtures.ts +3 -3
package/src/__tests__/followup-tools.test.ts +303 -0
package/src/__tests__/handlers-twitter-config.test.ts +718 -0
package/src/__tests__/intent-routing.test.ts +64 -57
package/src/__tests__/ipc-roundtrip.benchmark.test.ts +237 -0
package/src/__tests__/ipc-snapshot.test.ts +96 -28
package/src/__tests__/llm-usage-store.test.ts +3 -8
package/src/__tests__/media-generate-image.test.ts +1 -1
package/src/__tests__/media-reuse-story.e2e.test.ts +7 -7
package/src/__tests__/memory-retrieval.benchmark.test.ts +430 -0
package/src/__tests__/parallel-tool.benchmark.test.ts +294 -0
package/src/__tests__/playbook-tools.test.ts +342 -0
package/src/__tests__/profile-compiler.test.ts +2 -1
package/src/__tests__/provider-streaming.benchmark.test.ts +773 -0
package/src/__tests__/recurrence-engine-rruleset.test.ts +78 -0
package/src/__tests__/recurrence-engine.test.ts +69 -0
package/src/__tests__/recurrence-types.test.ts +71 -0
package/src/__tests__/registry.test.ts +17 -10
package/src/__tests__/relay-server.test.ts +633 -0
package/src/__tests__/reminder-store.test.ts +6 -3
package/src/__tests__/reminder.test.ts +43 -77
package/src/__tests__/run-orchestrator-assistant-events.test.ts +222 -0
package/src/__tests__/run-orchestrator.test.ts +7 -7
package/src/__tests__/runtime-attachment-metadata.test.ts +19 -20
package/src/__tests__/runtime-runs-http.test.ts +5 -23
package/src/__tests__/runtime-runs.test.ts +11 -11
package/src/__tests__/schedule-store.test.ts +482 -0
package/src/__tests__/schedule-tools.test.ts +700 -0
package/src/__tests__/scheduler-recurrence.test.ts +329 -0
package/src/__tests__/server-history-render.test.ts +14 -13
package/src/__tests__/session-error.test.ts +28 -0
package/src/__tests__/session-init.benchmark.test.ts +462 -0
package/src/__tests__/session-queue.test.ts +89 -16
package/src/__tests__/session-runtime-assembly.test.ts +161 -0
package/src/__tests__/session-surfaces-task-progress.test.ts +104 -0
package/src/__tests__/signup-e2e.test.ts +2 -1
package/src/__tests__/skill-projection.benchmark.test.ts +328 -0
package/src/__tests__/skill-script-runner.test.ts +159 -0
package/src/__tests__/speaker-identification.test.ts +52 -0
package/src/__tests__/subagent-manager-notify.test.ts +42 -10
package/src/__tests__/subagent-tools.test.ts +141 -41
package/src/__tests__/task-compiler.test.ts +2 -1
package/src/__tests__/task-runner.test.ts +2 -1
package/src/__tests__/task-scheduler.test.ts +2 -1
package/src/__tests__/task-tools.test.ts +49 -56
package/src/__tests__/tool-audit-listener.test.ts +1 -0
package/src/__tests__/tool-domain-event-publisher.test.ts +2 -0
package/src/__tests__/tool-execution-pipeline.benchmark.test.ts +500 -0
package/src/__tests__/tool-executor.test.ts +13 -17
package/src/__tests__/turn-commit.test.ts +273 -2
package/src/__tests__/twilio-provider.test.ts +143 -0
package/src/__tests__/twilio-routes.test.ts +789 -0
package/src/__tests__/twitter-auth-handler.test.ts +581 -0
package/src/__tests__/view-image-tool.test.ts +217 -0
package/src/__tests__/workspace-git-service.test.ts +403 -0
package/src/__tests__/workspace-heartbeat-service.test.ts +141 -2
package/src/agent-heartbeat/agent-heartbeat-service.ts +155 -0
package/src/bundler/app-bundler.ts +35 -14
package/src/calls/call-bridge.ts +95 -0
package/src/calls/call-constants.ts +48 -0
package/src/calls/call-domain.ts +276 -0
package/src/calls/call-orchestrator.ts +390 -0
package/src/calls/call-recovery.ts +207 -0
package/src/calls/call-state-machine.ts +68 -0
package/src/calls/call-state.ts +64 -0
package/src/calls/call-store.ts +416 -0
package/src/calls/relay-server.ts +335 -0
package/src/calls/speaker-identification.ts +213 -0
package/src/calls/twilio-config.ts +34 -0
package/src/calls/twilio-provider.ts +173 -0
package/src/calls/twilio-routes.ts +250 -0
package/src/calls/types.ts +37 -0
package/src/calls/voice-provider.ts +14 -0
package/src/cli/config-commands.ts +334 -0
package/src/cli/core-commands.ts +776 -0
package/src/cli/doordash.ts +256 -25
package/src/cli/ipc-client.ts +82 -0
package/src/cli/map.ts +246 -0
package/src/cli/twitter.ts +575 -0
package/src/cli.ts +7 -5
package/src/commands/__tests__/cc-command-registry.test.ts +319 -0
package/src/commands/cc-command-registry.ts +209 -0
package/src/config/bundled-skills/contacts/SKILL.md +39 -0
package/src/config/bundled-skills/contacts/TOOLS.json +122 -0
package/src/config/bundled-skills/contacts/tools/contact-merge.ts +9 -0
package/src/config/bundled-skills/contacts/tools/contact-search.ts +9 -0
package/src/config/bundled-skills/contacts/tools/contact-upsert.ts +9 -0
package/src/config/bundled-skills/document/SKILL.md +18 -0
package/src/config/bundled-skills/document/TOOLS.json +53 -0
package/src/config/bundled-skills/document/tools/document-create.ts +9 -0
package/src/config/bundled-skills/document/tools/document-update.ts +9 -0
package/src/config/bundled-skills/doordash/SKILL.md +163 -0
package/src/config/bundled-skills/followups/SKILL.md +32 -0
package/src/config/bundled-skills/followups/TOOLS.json +100 -0
package/src/config/bundled-skills/followups/tools/followup-create.ts +9 -0
package/src/config/bundled-skills/followups/tools/followup-list.ts +9 -0
package/src/config/bundled-skills/followups/tools/followup-resolve.ts +9 -0
package/src/config/bundled-skills/image-studio/TOOLS.json +2 -2
package/src/config/bundled-skills/image-studio/tools/media-generate-image.ts +2 -24
package/src/config/bundled-skills/messaging/tools/messaging-analyze-style.ts +2 -1
package/src/config/bundled-skills/playbooks/SKILL.md +31 -0
package/src/config/bundled-skills/playbooks/TOOLS.json +126 -0
package/src/config/bundled-skills/playbooks/tools/playbook-create.ts +9 -0
package/src/config/bundled-skills/playbooks/tools/playbook-delete.ts +9 -0
package/src/config/bundled-skills/playbooks/tools/playbook-list.ts +9 -0
package/src/config/bundled-skills/playbooks/tools/playbook-update.ts +9 -0
package/src/config/bundled-skills/reminder/SKILL.md +20 -0
package/src/config/bundled-skills/reminder/TOOLS.json +67 -0
package/src/config/bundled-skills/reminder/tools/reminder-cancel.ts +9 -0
package/src/config/bundled-skills/reminder/tools/reminder-create.ts +9 -0
package/src/config/bundled-skills/reminder/tools/reminder-list.ts +9 -0
package/src/config/bundled-skills/schedule/SKILL.md +74 -0
package/src/config/bundled-skills/schedule/TOOLS.json +135 -0
package/src/config/bundled-skills/schedule/tools/schedule-create.ts +9 -0
package/src/config/bundled-skills/schedule/tools/schedule-delete.ts +9 -0
package/src/config/bundled-skills/schedule/tools/schedule-list.ts +9 -0
package/src/config/bundled-skills/schedule/tools/schedule-update.ts +9 -0
package/src/config/bundled-skills/subagent/SKILL.md +25 -0
package/src/config/bundled-skills/subagent/TOOLS.json +107 -0
package/src/config/bundled-skills/subagent/tools/subagent-abort.ts +9 -0
package/src/config/bundled-skills/subagent/tools/subagent-message.ts +9 -0
package/src/config/bundled-skills/subagent/tools/subagent-read.ts +9 -0
package/src/config/bundled-skills/subagent/tools/subagent-spawn.ts +9 -0
package/src/config/bundled-skills/subagent/tools/subagent-status.ts +9 -0
package/src/config/bundled-skills/tasks/SKILL.md +28 -0
package/src/config/bundled-skills/tasks/TOOLS.json +256 -0
package/src/config/bundled-skills/tasks/tools/task-delete.ts +9 -0
package/src/config/bundled-skills/tasks/tools/task-list-add.ts +9 -0
package/src/config/bundled-skills/tasks/tools/task-list-remove.ts +9 -0
package/src/config/bundled-skills/tasks/tools/task-list-show.ts +9 -0
package/src/config/bundled-skills/tasks/tools/task-list-update.ts +9 -0
package/src/config/bundled-skills/tasks/tools/task-list.ts +9 -0
package/src/config/bundled-skills/tasks/tools/task-run.ts +9 -0
package/src/config/bundled-skills/tasks/tools/task-save.ts +9 -0
package/src/config/bundled-skills/twitter/SKILL.md +134 -0
package/src/config/bundled-skills/watcher/SKILL.md +27 -0
package/src/config/bundled-skills/watcher/TOOLS.json +147 -0
package/src/config/bundled-skills/watcher/tools/watcher-create.ts +9 -0
package/src/config/bundled-skills/watcher/tools/watcher-delete.ts +9 -0
package/src/config/bundled-skills/watcher/tools/watcher-digest.ts +9 -0
package/src/config/bundled-skills/watcher/tools/watcher-list.ts +9 -0
package/src/config/bundled-skills/watcher/tools/watcher-update.ts +9 -0
package/src/config/defaults.ts +44 -0
package/src/config/loader.ts +4 -1
package/src/config/schema.ts +218 -1
package/src/config/system-prompt.ts +100 -6
package/src/config/templates/IDENTITY.md +7 -0
package/src/config/types.ts +5 -0
package/src/contacts/contact-store.ts +4 -4
package/src/daemon/assistant-attachments.ts +10 -0
package/src/daemon/classifier.ts +3 -1
package/src/daemon/computer-use-session.ts +3 -1
package/src/daemon/date-context.ts +136 -0
package/src/daemon/handlers/apps.ts +16 -1
package/src/daemon/handlers/browser.ts +54 -0
package/src/daemon/handlers/computer-use.ts +7 -1
package/src/daemon/handlers/config.ts +192 -4
package/src/daemon/handlers/diagnostics.ts +5 -1
package/src/daemon/handlers/documents.ts +18 -29
package/src/daemon/handlers/home-base.ts +5 -1
package/src/daemon/handlers/index.ts +40 -271
package/src/daemon/handlers/misc.ts +9 -1
package/src/daemon/handlers/publish.ts +6 -1
package/src/daemon/handlers/sessions.ts +65 -12
package/src/daemon/handlers/shared.ts +36 -1
package/src/daemon/handlers/signing.ts +37 -0
package/src/daemon/handlers/skills.ts +20 -6
package/src/daemon/handlers/subagents.ts +8 -3
package/src/daemon/handlers/twitter-auth.ts +169 -0
package/src/daemon/handlers/work-items.ts +495 -39
package/src/daemon/ipc-contract-inventory.json +40 -4
package/src/daemon/ipc-contract.ts +185 -37
package/src/daemon/ipc-protocol.ts +7 -2
package/src/daemon/lifecycle.ts +48 -5
package/src/daemon/main.ts +10 -4
package/src/daemon/ride-shotgun-handler.ts +74 -10
package/src/daemon/server.ts +144 -29
package/src/daemon/session-agent-loop.ts +887 -0
package/src/daemon/session-attachments.ts +28 -5
package/src/daemon/session-error.ts +24 -3
package/src/daemon/session-lifecycle.ts +147 -0
package/src/daemon/session-media-retry.ts +147 -0
package/src/daemon/session-messaging.ts +145 -0
package/src/daemon/session-notifiers.ts +164 -0
package/src/daemon/session-process.ts +2 -2
package/src/daemon/session-queue-manager.ts +1 -0
package/src/daemon/session-runtime-assembly.ts +52 -0
package/src/daemon/session-skill-tools.ts +124 -5
package/src/daemon/session-slash.ts +3 -0
package/src/daemon/session-surfaces.ts +77 -2
package/src/daemon/session-tool-setup.ts +222 -2
package/src/daemon/session-usage.ts +0 -2
package/src/daemon/session.ts +114 -1365
package/src/daemon/video-thumbnail.ts +60 -0
package/src/doordash/client.ts +121 -27
package/src/doordash/queries.ts +1 -2
package/src/export/formatter.ts +3 -1
package/src/followups/followup-store.ts +4 -2
package/src/followups/types.ts +6 -0
package/src/hooks/templates.ts +1 -1
package/src/index.ts +32 -1151
package/src/media/gemini-image-service.ts +1 -1
package/src/memory/attachments-store.ts +28 -83
package/src/memory/channel-delivery-store.ts +7 -21
package/src/memory/clarification-resolver.ts +6 -5
package/src/memory/contradiction-checker.ts +3 -2
package/src/memory/conversation-key-store.ts +10 -29
package/src/memory/conversation-store.ts +2 -1
package/src/memory/db.ts +362 -2
package/src/memory/entity-extractor.ts +6 -3
package/src/memory/items-extractor.ts +5 -4
package/src/memory/jobs-store.ts +3 -2
package/src/memory/llm-usage-store.ts +1 -2
package/src/memory/runs-store.ts +1 -2
package/src/memory/schema.ts +65 -2
package/src/messaging/style-analyzer.ts +3 -2
package/src/messaging/thread-summarizer.ts +8 -12
package/src/messaging/triage-engine.ts +4 -2
package/src/providers/openrouter/client.ts +20 -0
package/src/providers/registry.ts +8 -0
package/src/runtime/http-server.ts +277 -25
package/src/runtime/http-types.ts +0 -2
package/src/runtime/routes/attachment-routes.ts +5 -6
package/src/runtime/routes/call-routes.ts +140 -0
package/src/runtime/routes/channel-routes.ts +12 -19
package/src/runtime/routes/conversation-routes.ts +5 -9
package/src/runtime/routes/run-routes.ts +4 -8
package/src/runtime/run-orchestrator.ts +39 -6
package/src/schedule/recurrence-engine.ts +138 -0
package/src/schedule/recurrence-types.ts +67 -0
package/src/schedule/schedule-store.ts +102 -57
package/src/schedule/scheduler.ts +9 -6
package/src/security/oauth2.ts +29 -4
package/src/security/secret-allowlist.ts +46 -0
package/src/skills/clawhub.ts +1 -1
package/src/subagent/manager.ts +40 -8
package/src/swarm/backend-claude-code.ts +64 -9
package/src/swarm/worker-prompts.ts +2 -1
package/src/tasks/SPEC.md +34 -28
package/src/tasks/ephemeral-permissions.ts +16 -7
package/src/tasks/task-compiler.ts +5 -4
package/src/tasks/task-runner.ts +10 -5
package/src/tasks/task-scheduler.ts +1 -1
package/src/tasks/tool-sanitizer.ts +36 -0
package/src/tools/assets/search.ts +4 -4
package/src/tools/browser/api-map.ts +220 -0
package/src/tools/browser/auto-navigate.ts +270 -0
package/src/tools/browser/browser-execution.ts +2 -1
package/src/tools/browser/browser-manager.ts +2 -2
package/src/tools/browser/network-recorder.ts +5 -4
package/src/tools/browser/x-auto-navigate.ts +207 -0
package/src/tools/calls/call-end.ts +67 -0
package/src/tools/calls/call-start.ts +73 -0
package/src/tools/calls/call-status.ts +81 -0
package/src/tools/claude-code/claude-code.ts +77 -11
package/src/tools/contacts/contact-merge.ts +46 -78
package/src/tools/contacts/contact-search.ts +35 -79
package/src/tools/contacts/contact-upsert.ts +35 -108
package/src/tools/credentials/vault.ts +21 -5
package/src/tools/document/document-tool.ts +71 -144
package/src/tools/executor.ts +129 -10
package/src/tools/followups/followup_create.ts +46 -88
package/src/tools/followups/followup_list.ts +34 -74
package/src/tools/followups/followup_resolve.ts +31 -66
package/src/tools/host-terminal/cli-discover.ts +2 -1
package/src/tools/host-terminal/host-shell.ts +10 -0
package/src/tools/memory/handlers.ts +5 -4
package/src/tools/network/__tests__/web-search.test.ts +427 -0
package/src/tools/network/script-proxy/__tests__/logging.test.ts +248 -0
package/src/tools/network/script-proxy/__tests__/policy.test.ts +234 -0
package/src/tools/network/script-proxy/__tests__/router.test.ts +76 -0
package/src/tools/network/web-fetch.ts +18 -6
package/src/tools/playbooks/index.ts +4 -5
package/src/tools/playbooks/playbook-create.ts +3 -47
package/src/tools/playbooks/playbook-delete.ts +1 -25
package/src/tools/playbooks/playbook-list.ts +1 -28
package/src/tools/playbooks/playbook-update.ts +3 -51
package/src/tools/registry.ts +2 -4
package/src/tools/reminder/reminder.ts +5 -78
package/src/tools/schedule/create.ts +69 -74
package/src/tools/schedule/delete.ts +21 -47
package/src/tools/schedule/list.ts +55 -74
package/src/tools/schedule/update.ts +77 -84
package/src/tools/subagent/abort.ts +29 -58
package/src/tools/subagent/message.ts +30 -63
package/src/tools/subagent/read.ts +53 -84
package/src/tools/subagent/spawn.ts +43 -82
package/src/tools/subagent/status.ts +42 -71
package/src/tools/swarm/delegate.ts +2 -1
package/src/tools/tasks/index.ts +8 -6
package/src/tools/tasks/task-delete.ts +69 -56
package/src/tools/tasks/task-list.ts +31 -52
package/src/tools/tasks/task-run.ts +74 -102
package/src/tools/tasks/task-save.ts +33 -65
package/src/tools/tasks/work-item-enqueue.ts +192 -134
package/src/tools/tasks/work-item-list.ts +33 -78
package/src/tools/tasks/work-item-remove.ts +60 -0
package/src/tools/tasks/work-item-update.ts +114 -0
package/src/tools/terminal/backends/native.ts +3 -1
package/src/tools/tool-manifest.ts +20 -74
package/src/tools/types.ts +6 -0
package/src/tools/ui-surface/definitions.ts +6 -1
package/src/tools/watch/screen-watch.ts +3 -1
package/src/tools/watcher/create.ts +52 -98
package/src/tools/watcher/delete.ts +20 -46
package/src/tools/watcher/digest.ts +36 -70
package/src/tools/watcher/list.ts +49 -79
package/src/tools/watcher/update.ts +45 -91
package/src/twitter/client.ts +690 -0
package/src/twitter/session.ts +91 -0
package/src/usage/types.ts +0 -1
package/src/util/truncate.ts +6 -0
package/src/watcher/providers/slack.ts +2 -1
package/src/watcher/watcher-store.ts +3 -2
package/src/work-items/work-item-store.ts +236 -2
package/src/workspace/commit-message-enrichment-service.ts +284 -0
package/src/workspace/commit-message-provider.ts +95 -0
package/src/workspace/git-service.ts +272 -52
package/src/workspace/heartbeat-service.ts +70 -13
package/src/workspace/provider-commit-message-generator.ts +242 -0
package/src/workspace/turn-commit.ts +100 -51
package/src/tools/contacts/index.ts +0 -4
package/src/tools/document/index.ts +0 -5
package/src/tools/followups/index.ts +0 -3
package/src/tools/subagent/index.ts +0 -5
package/src/__tests__/{memory-context-benchmark.test.ts → memory-context-benchmark.benchmark.test.ts} +0 -0

package/src/security/secret-allowlist.ts CHANGED Viewed

@@ -104,6 +104,52 @@ export function isAllowlisted(value: string): boolean {
   return false;
 }
+export interface AllowlistValidationError {
+  index: number;
+  pattern: string;
+  message: string;
+}
+/**
+ * Validate all regex patterns in an allowlist config without loading them.
+ * Returns an array of validation errors (empty = all valid).
+ */
+export function validateAllowlist(config: AllowlistConfig): AllowlistValidationError[] {
+  const errors: AllowlistValidationError[] = [];
+  if (!config.patterns) return errors;
+  if (!Array.isArray(config.patterns)) {
+    errors.push({ index: -1, pattern: String(config.patterns), message: '"patterns" must be an array' });
+    return errors;
+  }
+  for (let i = 0; i < config.patterns.length; i++) {
+    const p = config.patterns[i];
+    if (typeof p !== 'string') {
+      errors.push({ index: i, pattern: String(p), message: 'Pattern is not a string' });
+      continue;
+    }
+    try {
+      new RegExp(p);
+    } catch (err) {
+      errors.push({ index: i, pattern: p, message: (err as Error).message });
+    }
+  }
+  return errors;
+}
+/**
+ * Read secret-allowlist.json from disk and validate it.
+ * Returns validation errors, or null if the file doesn't exist.
+ */
+export function validateAllowlistFile(): AllowlistValidationError[] | null {
+  const filePath = join(getRootDir(), 'protected', 'secret-allowlist.json');
+  if (!existsSync(filePath)) return null;
+  const raw = readFileSync(filePath, 'utf-8');
+  const config: AllowlistConfig = JSON.parse(raw);
+  return validateAllowlist(config);
+}
 /**
  * Reset cached state so the allowlist is reloaded on next check.
  * Called by the daemon file watcher when secret-allowlist.json changes,

package/src/skills/clawhub.ts CHANGED Viewed

@@ -395,7 +395,7 @@ export async function clawhubInspect(slug: string): Promise<{ data?: ClawhubInsp
           size: (f.size as number) ?? 0,
           contentType: (f.contentType as string) ?? undefined,
         })) : null,
-        skillMdContent: parsed.skillMdContent ?? parsed.fileContents?.['SKILL.md'] ?? null,
+        skillMdContent: parsed.skillMdContent ?? parsed.fileContents?.['SKILL.md'] ?? parsed.file?.content ?? null,
       };
       return { data };
     } catch {

package/src/subagent/manager.ts CHANGED Viewed

@@ -52,10 +52,18 @@ interface ManagedSubagent {
   parentSendToClient: (msg: ServerMessage) => void;
 }
+export interface SubagentNotificationInfo {
+  subagentId: string;
+  label: string;
+  status: 'completed' | 'failed' | 'aborted';
+  error?: string;
+}
 export type ParentNotifyCallback = (
   parentSessionId: string,
   message: string,
   sendToClient: (msg: ServerMessage) => void,
+  notification: SubagentNotificationInfo,
 ) => void;
 export class SubagentManager {
@@ -221,6 +229,8 @@ export class SubagentManager {
       await managed.session.runAgentLoop(objective, messageId, onEvent);
       // Agent loop completed successfully.
+      // Copy usage stats from the session before sending status (which includes usage).
+      managed.state.usage = { ...managed.session.usageStats };
       // Only update state + notify if still non-terminal (guards against abort race).
       if (!TERMINAL_STATUSES.has(managed.state.status)) {
         managed.state.completedAt = Date.now();
@@ -235,6 +245,7 @@ export class SubagentManager {
       const errorMsg = err instanceof Error ? err.message : String(err);
       managed.state.error = errorMsg;
       managed.state.completedAt = Date.now();
+      managed.state.usage = { ...managed.session.usageStats };
       // Only update status if not already terminal (e.g. aborted).
       if (!TERMINAL_STATUSES.has(managed.state.status)) {
@@ -267,16 +278,28 @@ export class SubagentManager {
     managed.session.abort();
     managed.state.completedAt = Date.now();
     if (parentSendToClient) {
-      this.setStatus(subagentId, 'aborted', parentSendToClient);
-      // Notify parent about the abort — skip when the parent already has the
-      // tool result (e.g. subagent_abort tool) to avoid duplicate turns.
+      // Route the status update through the stored parent sender so the
+      // owning session's UI chip updates, even when the abort comes from a
+      // different socket (e.g. after thread switching). Fall back to the
+      // caller-provided sender if no stored sender exists.
+      const statusSender = managed.parentSendToClient ?? parentSendToClient;
+      this.setStatus(subagentId, 'aborted', statusSender);
+      // Notify parent that the subagent was explicitly aborted — tell it NOT to re-spawn.
+      // Skip when the parent LLM itself called subagent_abort (it already has the tool result).
       if (this.onSubagentFinished && !options?.suppressNotification) {
         const label = managed.state.config.label;
+        const message =
+          `[Subagent "${label}" was explicitly aborted]\n\n` +
+          `This subagent was cancelled on purpose. Do NOT re-spawn or retry it.`;
         try {
+          // Use the managed subagent's stored parentSendToClient so the
+          // notification routes to the parent session's socket, not the
+          // aborting socket (which may be a different thread after switching).
           this.onSubagentFinished(
             managed.state.config.parentSessionId,
-            `[Subagent "${label}" was aborted]`,
-            parentSendToClient,
+            message,
+            managed.parentSendToClient,
+            { subagentId, label, status: 'aborted' },
           );
         } catch (err) {
           log.error({ subagentId, err }, 'Failed to notify parent about abort');
@@ -460,16 +483,25 @@ export class SubagentManager {
     if (outcome === 'completed') {
       message =
         `[Subagent "${config.label}" completed]\n\n` +
-        `Use subagent_read with subagent_id "${config.id}" to retrieve the full output.`;
+        `Use subagent_read with subagent_id "${config.id}" to retrieve the full output.\n` +
+        `Do NOT re-spawn this subagent — just read and share the results.`;
     } else {
       const error = managed.state.error ?? 'Unknown error';
       message =
         `[Subagent "${config.label}" failed]\n\n` +
-        `Error: ${error}`;
+        `Error: ${error}\n` +
+        `Do NOT re-spawn or retry this subagent unless the user explicitly asks.`;
     }
+    const notification: SubagentNotificationInfo = {
+      subagentId: config.id,
+      label: config.label,
+      status: outcome,
+      ...(outcome === 'failed' ? { error: managed.state.error ?? 'Unknown error' } : {}),
+    };
     try {
-      this.onSubagentFinished(config.parentSessionId, message, parentSendToClient);
+      this.onSubagentFinished(config.parentSessionId, message, parentSendToClient, notification);
     } catch (err) {
       log.error({ subagentId: config.id, err }, 'Failed to notify parent session');
     }

package/src/swarm/backend-claude-code.ts CHANGED Viewed

@@ -12,6 +12,9 @@ import { getProfilePolicy } from './worker-backend.js';
 const log = getLogger('swarm-backend-claude-code');
+const MAX_CLAUDE_CODE_DEPTH = 1;
+const DEPTH_ENV_VAR = 'VELLUM_CLAUDE_CODE_DEPTH';
 /**
  * Create a Claude Code worker backend that enforces profile-based tool policies.
  * Uses the Claude Agent SDK to run autonomous worker tasks.
@@ -28,6 +31,7 @@ export function createClaudeCodeBackend(): SwarmWorkerBackend {
     async runTask(input: SwarmWorkerBackendInput) {
       const start = Date.now();
+      const stderrLines: string[] = [];
       try {
         const { query } = await import('@anthropic-ai/claude-agent-sdk');
         const config = getConfig();
@@ -49,6 +53,22 @@ export function createClaudeCodeBackend(): SwarmWorkerBackend {
           return { behavior: 'allow' as const };
         };
+        // Enforce nesting depth limit
+        const currentDepth = parseInt(process.env[DEPTH_ENV_VAR] ?? '0', 10);
+        if (currentDepth >= MAX_CLAUDE_CODE_DEPTH) {
+          log.warn({ currentDepth, max: MAX_CLAUDE_CODE_DEPTH }, 'Swarm worker nesting depth exceeded');
+          return { success: false, output: `Nesting depth exceeded (depth ${currentDepth}, max ${MAX_CLAUDE_CODE_DEPTH})`, failureReason: 'backend_unavailable' as const, durationMs: Date.now() - start };
+        }
+        // Strip the SDK's nesting guard but set our own depth counter.
+        const subprocessEnv: Record<string, string | undefined> = {
+          ...process.env,
+          ANTHROPIC_API_KEY: apiKey,
+          [DEPTH_ENV_VAR]: String(currentDepth + 1),
+        };
+        delete subprocessEnv.CLAUDECODE;
+        delete subprocessEnv.CLAUDE_CODE_ENTRYPOINT;
         const conversation = query({
           prompt: input.prompt,
           options: {
@@ -57,20 +77,48 @@ export function createClaudeCodeBackend(): SwarmWorkerBackend {
             canUseTool,
             permissionMode: 'default',
             maxTurns: 30,
-            env: { ...process.env, ANTHROPIC_API_KEY: apiKey },
+            env: subprocessEnv,
+            stderr: (data: string) => {
+              const trimmed = data.trimEnd();
+              if (trimmed) {
+                stderrLines.push(trimmed);
+                log.debug({ stderr: trimmed }, 'Swarm worker subprocess stderr');
+              }
+            },
           },
         });
         let resultText = '';
+        let hasError = false;
         for await (const message of conversation) {
           if (input.signal?.aborted) break;
-          if (message.type === 'assistant' && message.message?.content) {
-            for (const block of message.message.content) {
-              if (block.type === 'text') resultText += block.text;
+          if (message.type === 'assistant') {
+            if (message.error) {
+              log.error({ error: message.error, sessionId: message.session_id }, 'Swarm worker assistant message error');
+              hasError = true;
+              resultText += `\n[Claude Code error: ${message.error}]`;
+            }
+            if (message.message?.content) {
+              for (const block of message.message.content) {
+                if (block.type === 'text') resultText += block.text;
+              }
             }
           } else if (message.type === 'result') {
-            if (message.subtype === 'success' && message.result && !resultText) {
-              resultText = message.result;
+            if (message.subtype === 'success') {
+              log.info({ numTurns: message.num_turns, durationMs: message.duration_ms, costUsd: message.total_cost_usd }, 'Swarm worker completed');
+              if (message.result && !resultText) {
+                resultText = message.result;
+              }
+            } else {
+              hasError = true;
+              const errors = message.errors ?? [];
+              const denials = message.permission_denials ?? [];
+              log.error({ subtype: message.subtype, errors, permissionDenials: denials.length, numTurns: message.num_turns, durationMs: message.duration_ms }, 'Swarm worker session failed');
+              const parts: string[] = [`[${message.subtype}] (${message.num_turns} turns, ${(message.duration_ms / 1000).toFixed(1)}s)`];
+              if (errors.length > 0) parts.push(`Errors: ${errors.join('; ')}`);
+              if (denials.length > 0) parts.push(`Permission denied: ${denials.map(d => d.tool_name).join(', ')}`);
+              resultText += `\n${parts.join('\n')}`;
             }
           }
         }
@@ -80,10 +128,17 @@ export function createClaudeCodeBackend(): SwarmWorkerBackend {
           return { success: false, output: 'Cancelled (aborted)', failureReason: 'cancelled' as const, durationMs: Date.now() - start };
         }
-        return { success: true, output: resultText || 'Completed', durationMs: Date.now() - start };
+        return { success: !hasError, output: resultText || 'Completed', durationMs: Date.now() - start };
       } catch (err) {
-        const message = err instanceof Error ? err.message : String(err);
-        return { success: false, output: message, failureReason: 'backend_unavailable' as const, durationMs: Date.now() - start };
+        const errMessage = err instanceof Error ? err.message : String(err);
+        const recentStderr = stderrLines.slice(-20);
+        log.error({ err, stderrTail: recentStderr }, 'Swarm worker execution failed');
+        const parts = [errMessage];
+        if (recentStderr.length > 0) {
+          parts.push(`\nSubprocess stderr (last ${recentStderr.length} lines):\n${recentStderr.join('\n')}`);
+        }
+        return { success: false, output: parts.join(''), failureReason: 'backend_unavailable' as const, durationMs: Date.now() - start };
       }
     },
   };

package/src/swarm/worker-prompts.ts CHANGED Viewed

@@ -1,4 +1,5 @@
 import type { SwarmRole, SwarmTaskResult } from './types.js';
+import { truncate } from '../util/truncate.js';
 /**
  * Build a role-specific worker prompt for a swarm task.
@@ -70,7 +71,7 @@ export function parseWorkerOutput(raw: string): Pick<SwarmTaskResult, 'summary'
   }
   return {
-    summary: raw.slice(0, 500),
+    summary: truncate(raw, 500, ''),
     artifacts: [],
     issues: [],
     nextSteps: [],

package/src/tasks/SPEC.md CHANGED Viewed

@@ -87,18 +87,23 @@ Each task run creates a new conversation thread with `threadType: 'background'`.
 ### Lifecycle
-1. **Start**: The daemon creates a `background` thread, substitutes template
-   placeholders, and sends the prompt to the LLM. An IPC notification
-   (`task_run_started`) is broadcast to all connected clients with the run ID,
-   task ID, and thread ID.
-2. **Completion**: When the LLM response is received and stored, the daemon
-   broadcasts a `task_run_completed` notification with the run ID, task ID,
-   thread ID, and a status (`success` | `error`).
-3. **Visibility**: Background threads are excluded from the default thread list
-   (existing behavior in `conversation-store.ts`). Clients can query for them
-   explicitly to surface task results in a dedicated UI.
-**Why background threads:** Reuses the existing `threadType: 'background'`
+1. **Preflight**: The client requests a permission preflight for the work item.
+   The daemon classifies risk for each required tool and returns the permission
+   set. The client displays an approval dialog; approved tools are stored on
+   the work item.
+2. **Start**: The daemon creates a `background` conversation, substitutes
+   template placeholders, sets up ephemeral permission rules for the approved
+   tools, and processes the rendered prompt through a daemon `Session`. Status
+   updates are broadcast to all connected clients via `work_item_status_changed`
+   and `tasks_changed` IPC messages.
+3. **Completion**: When the session finishes, the work item transitions to
+   `awaiting_review` (on success) or `failed` (on error). The daemon broadcasts
+   the final status to all clients.
+4. **Visibility**: Background conversations are excluded from the default thread
+   list (existing behavior in `conversation-store.ts`). Clients can query for
+   them explicitly to surface task results in a dedicated UI.
+**Why background conversations:** Reuses the existing `threadType: 'background'`
 infrastructure. Task runs don't interrupt the user's current conversation, and
 clients can choose how and when to display results (toast, panel, separate
 tab).
@@ -107,27 +112,28 @@ tab).
 ## 4. Safety Invariants
-- **No auto-execution**: Tasks are never triggered automatically. Every run
-  requires an explicit user action (CLI command, API call, or UI button press).
+- **Explicit trigger required**: Task runs are triggered either by an explicit
+  user action (UI button press, API call) or by a user-configured schedule
+  (`run_task:<task_id>` via the scheduler).
 - **Ephemeral permission bundles**: If a task is configured with tool access,
   the permission grants are scoped to the single run and discarded afterward.
   No persistent allowlist entries are created on behalf of a task.
-- **High-risk tools always prompt**: Regardless of any task-level permission
-  configuration, tools classified as `RiskLevel.High` (destructive shell
-  commands, private-network fetches, etc.) always require interactive user
-  confirmation. This invariant cannot be overridden by task definitions.
+- **High-risk tools require upfront approval**: Tools classified as
+  `RiskLevel.High` (destructive shell commands, private-network fetches, etc.)
+  are surfaced in the preflight dialog so the user can explicitly approve or
+  deny them before execution begins. During the run itself, approved tools
+  (including high-risk ones) execute without further prompting.
 ---
-## 5. PR Dependency Chain
+## 5. Implementation Notes
-Implementation is split into sequential PRs, each building on the previous:
+The implementation is complete. Key modules:
-| PR | Title | What it delivers |
-|----|-------|------------------|
-| 0  | Spec decisions | This document. |
-| 1  | Schema + storage | `tasks` and `task_runs` tables, Drizzle schema, migration in `db.ts`, CRUD functions in `task-store.ts`. |
-| 2  | Template engine | `renderTemplate()` — placeholder substitution with input validation against the JSON Schema. |
-| 3  | Run executor | `executeTaskRun()` — creates background thread, calls LLM, writes result, broadcasts IPC notifications (`task_run_started`, `task_run_completed`). |
-| 4  | CLI surface | `vellum task create`, `vellum task run`, `vellum task list` commands. |
-| 5  | IPC + macOS integration | Wire up IPC message types; macOS client displays task run results. |
+| Module | What it delivers |
+|--------|------------------|
+| `task-store.ts` | `tasks` and `task_runs` tables, CRUD functions. |
+| `task-runner.ts` | `runTask()` — creates background conversation, renders template, processes through daemon Session. |
+| `ephemeral-permissions.ts` | Scoped permission rules for the duration of a single task run. |
+| `work-items.ts` (daemon handler) | IPC handlers for preflight, run, cancel, and status queries. |
+| Bundled skill (`tasks/`) | Tool definitions (`task_save`, `task_run`, `task_list`, `task_delete`, `task_list_*`) for the LLM. |

package/src/tasks/ephemeral-permissions.ts CHANGED Viewed

@@ -21,19 +21,28 @@ export function clearTaskRunRules(taskRunId: string): void {
 /**
  * Build ephemeral TrustRule entries from a task's required_tools list.
  *
- * Each rule allows the specified tool with a wildcard pattern scoped to the
- * given working directory. Priority is set to 50 — lower than user rules (100)
- * so that user deny rules still take precedence. `allowHighRisk` is NOT set,
- * so high-risk operations continue to prompt for approval.
+ * Each rule allows the specified tool with a wildcard pattern scoped
+ * globally ('everywhere'). The scope is intentionally broad because the
+ * session's workingDir (sandbox path like ~/.vellum/workspace) differs
+ * from process.cwd() — using a directory-scoped rule would fail
+ * matchesScope() and silently miss. Priority is set to 75 — above
+ * default rules (50) so pre-approved tools aren't shadowed by default
+ * `ask` rules (which would trigger prompting and auto-deny in
+ * non-interactive task runs), but below user rules (100) so user deny
+ * rules still take precedence. `allowHighRisk` is set because task runs
+ * execute asynchronously without interactive confirmation — the client
+ * pre-approves tools via the preflight flow before execution begins,
+ * so there is no interactive prompt during the run itself.
  */
-export function buildTaskRules(taskRunId: string, requiredTools: string[], workingDir: string): TrustRule[] {
+export function buildTaskRules(taskRunId: string, requiredTools: string[], _workingDir: string): TrustRule[] {
   return requiredTools.map((tool) => ({
     id: `ephemeral:${taskRunId}:${tool}`,
     tool,
     pattern: '**',
-    scope: workingDir,
+    scope: 'everywhere',
     decision: 'allow' as const,
-    priority: 50,
+    allowHighRisk: true,
+    priority: 75,
     createdAt: Date.now(),
     principalKind: 'task',
     principalId: taskRunId,

package/src/tasks/task-compiler.ts CHANGED Viewed

@@ -3,6 +3,8 @@ import { getDb } from '../memory/db.js';
 import { messages as messagesTable } from '../memory/schema.js';
 import { createTask } from './task-store.js';
 import type { Task } from './task-store.js';
+import { truncate } from '../util/truncate.js';
+import { sanitizeToolList } from './tool-sanitizer.js';
 /** Output schema for the task compiler. */
 export interface CompiledTask {
@@ -44,8 +46,8 @@ export function compileTaskFromConversation(conversationId: string): CompiledTas
   // Extract user message text content
   const userText = extractTextContent(firstUserMsg.content);
-  // Extract unique tool names from assistant messages
-  const requiredTools = extractToolNames(msgs);
+  // Extract unique tool names from assistant messages.
+  const requiredTools = sanitizeToolList(extractToolNames(msgs));
   // Build template with placeholder substitutions
   const { template, properties } = buildTemplate(userText);
@@ -193,6 +195,5 @@ function buildTemplate(text: string): {
 function deriveTitle(text: string): string {
   // Take the first line and trim whitespace
   const firstLine = text.split('\n')[0].trim();
-  if (firstLine.length <= 60) return firstLine;
-  return firstLine.slice(0, 57) + '...';
+  return truncate(firstLine, 60);
 }

package/src/tasks/task-runner.ts CHANGED Viewed

@@ -2,6 +2,7 @@ import { getLogger } from '../util/logger.js';
 import { createConversation } from '../memory/conversation-store.js';
 import { getTask, createTaskRun, updateTaskRun } from './task-store.js';
 import { buildTaskRules, setTaskRunRules, clearTaskRunRules } from './ephemeral-permissions.js';
+import { sanitizeToolList } from './tool-sanitizer.js';
 const log = getLogger('task-runner');
@@ -9,6 +10,8 @@ export interface TaskRunOptions {
   taskId: string;
   inputs?: Record<string, string>;
   workingDir: string;
+  /** Pre-approved tools from the permission preflight flow. When set, only these tools get ephemeral allow rules. */
+  approvedTools?: string[];
 }
 export interface TaskRunResult {
@@ -32,7 +35,7 @@ export function renderTemplate(template: string, inputs: Record<string, string>)
  */
 export async function runTask(
   opts: TaskRunOptions,
-  processMessage: (conversationId: string, message: string) => Promise<void>,
+  processMessage: (conversationId: string, message: string, taskRunId: string) => Promise<void>,
 ): Promise<TaskRunResult> {
   const task = getTask(opts.taskId);
   if (!task) {
@@ -47,9 +50,11 @@ export async function runTask(
     memoryScopeId: `task:${task.id}`,
   });
-  // Build and register ephemeral permission rules from the task's required tools
-  const requiredTools: string[] = task.requiredTools ? JSON.parse(task.requiredTools) : [];
-  const rules = buildTaskRules(run.id, requiredTools, opts.workingDir);
+  // Build and register ephemeral permission rules. If the user pre-approved
+  // specific tools via the preflight flow, use those instead of all requiredTools.
+  const requiredTools = sanitizeToolList(task.requiredTools ? JSON.parse(task.requiredTools) : []);
+  const toolsForRules = opts.approvedTools ? sanitizeToolList(opts.approvedTools) : requiredTools;
+  const rules = buildTaskRules(run.id, toolsForRules, opts.workingDir);
   setTaskRunRules(run.id, rules);
   try {
@@ -58,7 +63,7 @@ export async function runTask(
     updateTaskRun(run.id, { status: 'running', startedAt: Date.now() });
     log.info({ taskId: task.id, taskRunId: run.id, conversationId: conversation.id }, 'Executing task');
-    await processMessage(conversation.id, renderedTemplate);
+    await processMessage(conversation.id, renderedTemplate, run.id);
     updateTaskRun(run.id, { status: 'completed', finishedAt: Date.now() });

package/src/tasks/task-scheduler.ts CHANGED Viewed

@@ -1,7 +1,7 @@
 import { createSchedule } from '../schedule/schedule-store.js';
 /**
- * Create a schedule that runs a task on a cron expression.
+ * Create a recurrence schedule that runs a task on a cron or RRULE expression.
  * The scheduler detects the `run_task:<taskId>` message format
  * and delegates to runTask() instead of processMessage().
  */

package/src/tasks/tool-sanitizer.ts ADDED Viewed

@@ -0,0 +1,36 @@
+import { getTool, getAllTools } from '../tools/registry.js';
+/**
+ * Deduplicate and sort a list of tool names.
+ *
+ * Entries that are falsy (for example empty strings) or that are not strings
+ * are dropped. Names are NOT checked against the tool registry in this
+ * function and nothing is logged, so unknown tool names are kept as-is
+ * (presumably so that skill tools loaded later at runtime are not lost).
+ * NOTE(review): if registry validation or warn-level logging of unknown
+ * names is desired, it is not implemented here — confirm the intent.
+ *
+ * The returned array is deterministic: it has no duplicates and is ordered
+ * by the default Array.prototype.sort() comparison (UTF-16 code unit order).
+ *
+ * @param tools - Candidate tool names; may contain duplicates or invalid entries.
+ * @returns A new array of the unique, valid tool names in sorted order.
+ */
+export function sanitizeToolList(tools: string[]): string[] {
+  const seen = new Set<string>();
+  for (const tool of tools) {
+    if (!tool || typeof tool !== 'string') continue;
+    seen.add(tool);
+  }
+  return [...seen].sort();
+}
+/**
+ * Get registered tool names from the live tool registry, excluding tools
+ * whose executionMode is 'proxy' and tools whose origin is 'skill'.
+ * Used as the fallback when a task/work-item has no explicit requiredTools.
+ *
+ * @returns The remaining tool names, sorted with the default sort() ordering.
+ */
+export function getRegisteredToolNames(): string[] {
+  return getAllTools()
+    .filter((t) => t.executionMode !== 'proxy' && t.origin !== 'skill')
+    .map((t) => t.name)
+    .sort();
+}
+/**
+ * Look up the human-readable description for a tool from the registry.
+ *
+ * @param tool - Name of the tool to look up.
+ * @returns The registered description, or the tool name itself when the
+ *   tool is not registered or its description is null/undefined.
+ */
+export function getToolDescription(tool: string): string {
+  const registered = getTool(tool);
+  return registered?.description ?? tool;
+}

package/src/tools/assets/search.ts CHANGED Viewed

@@ -214,7 +214,7 @@ export function searchAttachments(params: AssetSearchParams): StoredAttachment[]
     const limit = Math.min(params.limit ?? DEFAULT_LIMIT, MAX_RESULTS);
     const stmt = raw.prepare(
-      `SELECT a.id, a.assistant_id, a.original_filename, a.mime_type, a.size_bytes, a.kind, a.created_at
+      `SELECT a.id, a.original_filename, a.mime_type, a.size_bytes, a.kind, a.thumbnail_base64, a.created_at
        FROM attachments a
        WHERE ${whereParts.join(' AND ')}
        ORDER BY a.created_at DESC
@@ -223,21 +223,21 @@ export function searchAttachments(params: AssetSearchParams): StoredAttachment[]
     const rows = stmt.all(...bindValues, limit) as Array<{
       id: string;
-      assistant_id: string;
       original_filename: string;
       mime_type: string;
       size_bytes: number;
       kind: string;
+      thumbnail_base64: string | null;
       created_at: number;
     }>;
     return rows.map((r) => ({
       id: r.id,
-      assistantId: r.assistant_id,
       originalFilename: r.original_filename,
       mimeType: r.mime_type,
       sizeBytes: r.size_bytes,
       kind: r.kind,
+      thumbnailBase64: r.thumbnail_base64,
       createdAt: r.created_at,
     }));
   }
@@ -249,11 +249,11 @@ export function searchAttachments(params: AssetSearchParams): StoredAttachment[]
   const query = db
     .select({
       id: attachments.id,
-      assistantId: attachments.assistantId,
       originalFilename: attachments.originalFilename,
       mimeType: attachments.mimeType,
       sizeBytes: attachments.sizeBytes,
       kind: attachments.kind,
+      thumbnailBase64: attachments.thumbnailBase64,
       createdAt: attachments.createdAt,
     })
     .from(attachments)