npm - @swarmclawai/swarmclaw - Versions diffs - 0.6.7 → 0.7.0 - Mend

@swarmclawai/swarmclaw 0.6.7 → 0.7.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (203)

package/README.md +82 -39
package/next.config.ts +31 -6
package/package.json +3 -2
package/src/app/api/agents/[id]/thread/route.ts +1 -0
package/src/app/api/agents/route.ts +19 -5
package/src/app/api/approvals/route.ts +22 -0
package/src/app/api/chatrooms/[id]/chat/route.ts +4 -0
package/src/app/api/clawhub/install/route.ts +2 -2
package/src/app/api/eval/run/route.ts +37 -0
package/src/app/api/eval/scenarios/route.ts +24 -0
package/src/app/api/eval/suite/route.ts +29 -0
package/src/app/api/mcp-servers/[id]/conformance/route.ts +26 -0
package/src/app/api/mcp-servers/[id]/invoke/route.ts +81 -0
package/src/app/api/memory/graph/route.ts +46 -0
package/src/app/api/memory/route.ts +36 -5
package/src/app/api/notifications/route.ts +3 -0
package/src/app/api/plugins/install/route.ts +57 -5
package/src/app/api/plugins/marketplace/route.ts +73 -22
package/src/app/api/plugins/route.ts +61 -1
package/src/app/api/plugins/ui/route.ts +34 -0
package/src/app/api/sessions/[id]/checkpoints/route.ts +31 -0
package/src/app/api/sessions/[id]/restore/route.ts +36 -0
package/src/app/api/settings/route.ts +62 -0
package/src/app/api/setup/doctor/route.ts +22 -5
package/src/app/api/souls/[id]/route.ts +65 -0
package/src/app/api/souls/route.ts +70 -0
package/src/app/api/tasks/[id]/approve/route.ts +4 -3
package/src/app/api/tasks/[id]/route.ts +16 -3
package/src/app/api/tasks/route.ts +10 -2
package/src/app/api/usage/route.ts +9 -2
package/src/app/globals.css +27 -0
package/src/app/page.tsx +10 -5
package/src/cli/index.js +37 -0
package/src/components/activity/activity-feed.tsx +9 -2
package/src/components/agents/agent-avatar.tsx +5 -1
package/src/components/agents/agent-card.tsx +55 -9
package/src/components/agents/agent-sheet.tsx +112 -34
package/src/components/agents/inspector-panel.tsx +1 -1
package/src/components/agents/soul-library-picker.tsx +84 -13
package/src/components/auth/access-key-gate.tsx +63 -54
package/src/components/auth/user-picker.tsx +37 -32
package/src/components/chat/activity-moment.tsx +2 -0
package/src/components/chat/chat-area.tsx +11 -0
package/src/components/chat/chat-header.tsx +69 -25
package/src/components/chat/chat-tool-toggles.tsx +2 -2
package/src/components/chat/checkpoint-timeline.tsx +112 -0
package/src/components/chat/code-block.tsx +3 -1
package/src/components/chat/exec-approval-card.tsx +8 -1
package/src/components/chat/message-bubble.tsx +164 -4
package/src/components/chat/message-list.tsx +46 -4
package/src/components/chat/session-approval-card.tsx +80 -0
package/src/components/chat/session-debug-panel.tsx +106 -84
package/src/components/chat/streaming-bubble.tsx +6 -5
package/src/components/chat/task-approval-card.tsx +78 -0
package/src/components/chat/thinking-indicator.tsx +48 -12
package/src/components/chat/tool-call-bubble.tsx +3 -0
package/src/components/chat/tool-request-banner.tsx +39 -20
package/src/components/chatrooms/chatroom-list.tsx +11 -4
package/src/components/chatrooms/chatroom-sheet.tsx +7 -2
package/src/components/connectors/connector-list.tsx +33 -11
package/src/components/connectors/connector-sheet.tsx +37 -7
package/src/components/home/home-view.tsx +54 -24
package/src/components/input/chat-input.tsx +22 -1
package/src/components/knowledge/knowledge-list.tsx +17 -18
package/src/components/knowledge/knowledge-sheet.tsx +9 -5
package/src/components/layout/app-layout.tsx +87 -19
package/src/components/mcp-servers/mcp-server-list.tsx +352 -50
package/src/components/mcp-servers/mcp-server-sheet.tsx +25 -9
package/src/components/memory/memory-browser.tsx +73 -45
package/src/components/memory/memory-graph-view.tsx +203 -0
package/src/components/memory/memory-list.tsx +20 -13
package/src/components/plugins/plugin-list.tsx +214 -60
package/src/components/plugins/plugin-sheet.tsx +119 -24
package/src/components/projects/project-list.tsx +17 -9
package/src/components/providers/provider-list.tsx +21 -6
package/src/components/providers/provider-sheet.tsx +42 -25
package/src/components/runs/run-list.tsx +17 -13
package/src/components/schedules/schedule-card.tsx +10 -3
package/src/components/schedules/schedule-list.tsx +2 -2
package/src/components/schedules/schedule-sheet.tsx +28 -9
package/src/components/secrets/secret-sheet.tsx +7 -2
package/src/components/secrets/secrets-list.tsx +18 -5
package/src/components/sessions/new-session-sheet.tsx +183 -376
package/src/components/sessions/session-card.tsx +10 -2
package/src/components/settings/gateway-connection-panel.tsx +9 -8
package/src/components/shared/command-palette.tsx +13 -5
package/src/components/shared/empty-state.tsx +20 -8
package/src/components/shared/hint-tip.tsx +31 -0
package/src/components/shared/notification-center.tsx +134 -86
package/src/components/shared/profile-sheet.tsx +4 -0
package/src/components/shared/settings/plugin-manager.tsx +360 -135
package/src/components/shared/settings/section-capability-policy.tsx +3 -3
package/src/components/shared/settings/section-runtime-loop.tsx +149 -4
package/src/components/skills/clawhub-browser.tsx +1 -0
package/src/components/skills/skill-list.tsx +31 -12
package/src/components/skills/skill-sheet.tsx +20 -7
package/src/components/tasks/approvals-panel.tsx +224 -0
package/src/components/tasks/task-board.tsx +20 -12
package/src/components/tasks/task-card.tsx +21 -7
package/src/components/tasks/task-column.tsx +4 -3
package/src/components/tasks/task-list.tsx +1 -1
package/src/components/tasks/task-sheet.tsx +130 -1
package/src/components/ui/dialog.tsx +1 -0
package/src/components/ui/sheet.tsx +1 -0
package/src/components/usage/metrics-dashboard.tsx +72 -48
package/src/components/wallets/wallet-panel.tsx +65 -41
package/src/components/wallets/wallet-section.tsx +9 -3
package/src/components/webhooks/webhook-list.tsx +21 -12
package/src/components/webhooks/webhook-sheet.tsx +13 -3
package/src/lib/approval-display.test.ts +45 -0
package/src/lib/approval-display.ts +62 -0
package/src/lib/clipboard.ts +38 -0
package/src/lib/memory.ts +8 -0
package/src/lib/providers/claude-cli.ts +5 -3
package/src/lib/providers/index.ts +67 -21
package/src/lib/runtime-loop.ts +3 -2
package/src/lib/server/approvals.ts +150 -0
package/src/lib/server/chat-execution.ts +319 -74
package/src/lib/server/chatroom-helpers.ts +63 -5
package/src/lib/server/chatroom-orchestration.ts +74 -0
package/src/lib/server/clawhub-client.ts +82 -6
package/src/lib/server/connectors/manager.ts +27 -1
package/src/lib/server/context-manager.ts +132 -50
package/src/lib/server/cost.test.ts +73 -0
package/src/lib/server/cost.ts +165 -34
package/src/lib/server/daemon-state.ts +112 -1
package/src/lib/server/data-dir.ts +18 -1
package/src/lib/server/eval/runner.ts +126 -0
package/src/lib/server/eval/scenarios.ts +218 -0
package/src/lib/server/eval/scorer.ts +96 -0
package/src/lib/server/eval/store.ts +37 -0
package/src/lib/server/eval/types.ts +48 -0
package/src/lib/server/execution-log.ts +12 -8
package/src/lib/server/guardian.ts +34 -0
package/src/lib/server/heartbeat-service.ts +53 -1
package/src/lib/server/integrity-monitor.ts +208 -0
package/src/lib/server/langgraph-checkpoint.ts +10 -0
package/src/lib/server/link-understanding.ts +55 -0
package/src/lib/server/llm-response-cache.test.ts +102 -0
package/src/lib/server/llm-response-cache.ts +227 -0
package/src/lib/server/main-agent-loop.ts +115 -16
package/src/lib/server/main-session.ts +6 -3
package/src/lib/server/mcp-conformance.test.ts +18 -0
package/src/lib/server/mcp-conformance.ts +233 -0
package/src/lib/server/memory-db.ts +193 -19
package/src/lib/server/memory-retrieval.test.ts +56 -0
package/src/lib/server/mmr.ts +73 -0
package/src/lib/server/orchestrator-lg.ts +7 -1
package/src/lib/server/orchestrator.ts +4 -3
package/src/lib/server/plugins.ts +662 -132
package/src/lib/server/process-manager.ts +18 -0
package/src/lib/server/query-expansion.ts +57 -0
package/src/lib/server/queue.ts +280 -11
package/src/lib/server/runtime-settings.ts +9 -0
package/src/lib/server/session-run-manager.test.ts +23 -0
package/src/lib/server/session-run-manager.ts +32 -2
package/src/lib/server/session-tools/canvas.ts +85 -50
package/src/lib/server/session-tools/chatroom.ts +130 -127
package/src/lib/server/session-tools/connector.ts +233 -454
package/src/lib/server/session-tools/context-mgmt.ts +87 -105
package/src/lib/server/session-tools/crud.ts +84 -7
package/src/lib/server/session-tools/delegate.ts +351 -752
package/src/lib/server/session-tools/discovery.ts +198 -0
package/src/lib/server/session-tools/edit_file.ts +82 -0
package/src/lib/server/session-tools/file-send.test.ts +39 -0
package/src/lib/server/session-tools/file.ts +257 -425
package/src/lib/server/session-tools/git.ts +87 -47
package/src/lib/server/session-tools/http.ts +95 -33
package/src/lib/server/session-tools/index.ts +217 -138
package/src/lib/server/session-tools/memory.ts +154 -239
package/src/lib/server/session-tools/monitor.ts +126 -0
package/src/lib/server/session-tools/normalize-tool-args.test.ts +61 -0
package/src/lib/server/session-tools/normalize-tool-args.ts +48 -0
package/src/lib/server/session-tools/openclaw-nodes.ts +82 -99
package/src/lib/server/session-tools/openclaw-workspace.ts +103 -93
package/src/lib/server/session-tools/platform.ts +86 -0
package/src/lib/server/session-tools/plugin-creator.ts +239 -0
package/src/lib/server/session-tools/sample-ui.ts +97 -0
package/src/lib/server/session-tools/sandbox.ts +175 -148
package/src/lib/server/session-tools/schedule.ts +78 -0
package/src/lib/server/session-tools/session-info.ts +104 -410
package/src/lib/server/session-tools/shell-normalize.test.ts +43 -0
package/src/lib/server/session-tools/shell.ts +171 -143
package/src/lib/server/session-tools/subagent.ts +77 -77
package/src/lib/server/session-tools/wallet.ts +182 -106
package/src/lib/server/session-tools/web.ts +181 -327
package/src/lib/server/storage.ts +36 -0
package/src/lib/server/stream-agent-chat.ts +348 -242
package/src/lib/server/task-quality-gate.test.ts +44 -0
package/src/lib/server/task-quality-gate.ts +67 -0
package/src/lib/server/task-validation.test.ts +78 -0
package/src/lib/server/task-validation.ts +67 -2
package/src/lib/server/tool-aliases.ts +68 -0
package/src/lib/server/tool-capability-policy.ts +24 -5
package/src/lib/server/tool-retry.ts +62 -0
package/src/lib/server/transcript-repair.ts +72 -0
package/src/lib/setup-defaults.ts +1 -0
package/src/lib/tasks.ts +7 -1
package/src/lib/tool-definitions.ts +24 -23
package/src/lib/validation/schemas.ts +13 -0
package/src/lib/view-routes.ts +2 -23
package/src/stores/use-app-store.ts +23 -1
package/src/types/index.ts +155 -10

package/src/lib/server/process-manager.ts CHANGED

@@ -5,6 +5,7 @@ const MAX_LOG_CHARS = 200_000
 const DEFAULT_BACKGROUND_YIELD_MS = 10_000
 const DEFAULT_TIMEOUT_MS = 30 * 60_000
 const DEFAULT_TTL_MS = 30 * 60_000
+const BACKGROUND_STARTUP_GRACE_MS = 500
 export type ProcessStatus = 'running' | 'exited' | 'killed' | 'failed' | 'timeout'
@@ -170,6 +171,23 @@ export async function startManagedProcess(opts: StartProcessOptions): Promise<St
   state.exitWaiters.set(id, exitPromise)
   if (opts.background) {
+    // Give background processes a brief grace window so immediate crashes
+    // (e.g., bind/permission errors) are surfaced instead of misreported as running.
+    const startupWaitMs = Math.min(
+      Math.max(100, BACKGROUND_STARTUP_GRACE_MS),
+      Math.max(200, timeoutMs),
+    )
+    await wait(startupWaitMs)
+    const rec = state.records.get(id)
+    if (rec && rec.status !== 'running') {
+      return {
+        status: 'completed',
+        processId: id,
+        output: rec.log,
+        exitCode: rec.exitCode,
+        signal: rec.signal,
+      }
+    }
     return {
       status: 'running',
       processId: id,

package/src/lib/server/query-expansion.ts ADDED

@@ -0,0 +1,57 @@
+import { loadAgents, loadSettings, loadCredentials, decryptKey } from './storage'
+import { getProvider } from '../providers'
+/**
+ * Expands a single user query into multiple semantic search variants
+ * to improve vector database recall (OpenClaw-style).
+ */
+export async function expandQuery(query: string): Promise<string[]> {
+  const agents = loadAgents()
+  const settings = loadSettings()
+  const defaultAgent = agents[settings.defaultAgentId]
+  if (!defaultAgent) return [query]
+  const providerEntry = getProvider(defaultAgent.provider)
+  if (!providerEntry?.handler?.streamChat) return [query]
+  const creds = loadCredentials()
+  const cred = creds[defaultAgent.credentialId || '']
+  const apiKey = cred ? decryptKey(cred.encryptedKey) : undefined
+  const systemPrompt = `You are a search query expansion assistant.
+Given a user's question, generate 3 different semantic search queries that would help find the answer in a vector database.
+Use different vocabulary and focus on different aspects of the intent.
+Format your response as a simple newline-separated list. No numbering, no bullets, no introduction.`
+  let expanded = ''
+  try {
+    await providerEntry.handler.streamChat({
+      session: { id: 'expansion', messages: [], model: defaultAgent.model, provider: defaultAgent.provider },
+      message: query,
+      apiKey,
+      systemPrompt,
+      write: (raw: string) => {
+        const lines = raw.split('\n').filter(Boolean)
+        for (const line of lines) {
+          if (!line.startsWith('data: ')) continue
+          try {
+            const ev = JSON.parse(line.slice(6))
+            if (ev.t === 'd' && ev.text) expanded += ev.text
+          } catch { /* skip */ }
+        }
+      },
+      active: new Map(),
+      loadHistory: () => [],
+    })
+    const variants = expanded.split('\n').map(l => l.trim()).filter(Boolean)
+    if (variants.length > 0) {
+      // Return original query + variants
+      return [query, ...variants.slice(0, 3)]
+    }
+  } catch (err) {
+    console.error('[query-expansion] Failed to expand query:', err)
+  }
+  return [query]
+}

package/src/lib/server/queue.ts CHANGED

@@ -13,6 +13,7 @@ import { extractTaskResult, formatResultBody } from './task-result'
 import { getCheckpointSaver } from './langgraph-checkpoint'
 import { isProtectedMainSession } from './main-session'
 import { cascadeUnblock } from './dag-validation'
+import { performGuardianRollback } from './guardian'
 import type { Agent, BoardTask, Connector, Message } from '@/types'
 // HMR-safe: pin processing flag to globalThis so hot reloads don't reset it
@@ -22,12 +23,14 @@ interface SessionMessageLike {
   role?: string
   text?: string
   time?: number
-  kind?: 'chat' | 'heartbeat' | 'system' | 'context-clear'
+  kind?: string
   source?: {
     connectorId?: string
     channelId?: string
   }
   toolEvents?: Array<{ name?: string; output?: string }>
+  streaming?: boolean
+  imageUrl?: string
 }
 interface SessionLike {
@@ -96,6 +99,181 @@ function applyTaskPolicyDefaults(task: BoardTask): void {
   if (task.deadLetteredAt === undefined) task.deadLetteredAt = null
 }
+const DEV_TASK_HINT = /\b(dev(?:\s+server)?|start(?:ing)?\s+(?:the\s+)?server|run(?:ning)?\s+(?:the\s+)?(?:app|project|site)|serve|localhost|http\s+server|web\s+server|npm\b|pnpm\b|yarn\b|bun\b|vite|next(?:\.js)?|react|build|compile)\b/i
+const TASK_CWD_NOISE_DIRS = new Set([
+  'uploads',
+  'data',
+  'projects',
+  'tasks',
+  '.swarm-data-test',
+  '.git',
+  '.next',
+  'node_modules',
+])
+const PROJECT_MARKER_FILES = ['package.json', 'pyproject.toml', 'Cargo.toml', 'go.mod', '.git']
+const SOURCE_MARKER_DIRS = ['src', 'app', 'public', 'pages']
+const WORKSPACE_PROJECTS_DIR = path.join(WORKSPACE_DIR, 'projects')
+interface WorkspaceDirCandidate {
+  dir: string
+  name: string
+  hasProjectMarker: boolean
+  hasSourceMarker: boolean
+}
+let workspaceDirCache: { expiresAt: number; candidates: WorkspaceDirCandidate[] } | null = null
+function isExistingDirectory(dirPath: string): boolean {
+  try {
+    return fs.statSync(dirPath).isDirectory()
+  } catch {
+    return false
+  }
+}
+function isWithinDirectory(parent: string, child: string): boolean {
+  const parentResolved = path.resolve(parent)
+  const childResolved = path.resolve(child)
+  const rel = path.relative(parentResolved, childResolved)
+  return rel === '' || (!rel.startsWith('..') && !path.isAbsolute(rel))
+}
+function normalizeForMatch(value: string): string {
+  return value.toLowerCase().replace(/[^a-z0-9]+/g, ' ').trim()
+}
+function hasAnyMarker(dirPath: string, markers: string[]): boolean {
+  return markers.some((marker) => fs.existsSync(path.join(dirPath, marker)))
+}
+function normalizeDirCandidate(raw: unknown, baseDir: string): string | null {
+  if (typeof raw !== 'string') return null
+  const trimmed = raw.trim()
+  if (!trimmed) return null
+  const homeDir = process.env.HOME || ''
+  const expanded = trimmed === '~'
+    ? homeDir
+    : trimmed.startsWith('~/')
+      ? path.join(homeDir, trimmed.slice(2))
+      : trimmed
+  const resolved = path.isAbsolute(expanded) ? path.resolve(expanded) : path.resolve(baseDir, expanded)
+  return isExistingDirectory(resolved) ? resolved : null
+}
+function looksLikeDevTask(task: Pick<BoardTask, 'title' | 'description'>): boolean {
+  const text = `${task.title || ''} ${task.description || ''}`.trim()
+  return DEV_TASK_HINT.test(text)
+}
+function listWorkspaceDirCandidates(): WorkspaceDirCandidate[] {
+  const now = Date.now()
+  if (workspaceDirCache && workspaceDirCache.expiresAt > now) return workspaceDirCache.candidates
+  const candidates: WorkspaceDirCandidate[] = []
+  const seen = new Set<string>()
+  const roots = [WORKSPACE_DIR, WORKSPACE_PROJECTS_DIR]
+  for (const root of roots) {
+    if (!isExistingDirectory(root)) continue
+    let entries: fs.Dirent[] = []
+    try {
+      entries = fs.readdirSync(root, { withFileTypes: true })
+    } catch {
+      continue
+    }
+    for (const entry of entries) {
+      if (!entry.isDirectory()) continue
+      const name = entry.name
+      if (!name || name.startsWith('.')) continue
+      if (TASK_CWD_NOISE_DIRS.has(name)) continue
+      const dir = path.join(root, name)
+      const key = path.resolve(dir)
+      if (seen.has(key)) continue
+      seen.add(key)
+      candidates.push({
+        dir: key,
+        name,
+        hasProjectMarker: hasAnyMarker(key, PROJECT_MARKER_FILES),
+        hasSourceMarker: hasAnyMarker(key, SOURCE_MARKER_DIRS),
+      })
+    }
+  }
+  candidates.sort((a, b) => a.name.localeCompare(b.name))
+  workspaceDirCache = {
+    expiresAt: now + 15_000,
+    candidates,
+  }
+  return candidates
+}
+function inferWorkspaceProjectCwd(task: Pick<BoardTask, 'title' | 'description' | 'file'>): string | null {
+  const candidates = listWorkspaceDirCandidates()
+  if (!candidates.length) return null
+  const taskText = normalizeForMatch(`${task.title || ''} ${task.description || ''} ${task.file || ''}`)
+  const devTask = looksLikeDevTask(task)
+  const markerCandidates = candidates.filter((candidate) => candidate.hasProjectMarker)
+  let best: { dir: string; score: number } | null = null
+  for (const candidate of candidates) {
+    const nameNorm = normalizeForMatch(candidate.name)
+    if (!nameNorm) continue
+    let score = 0
+    if (taskText.includes(nameNorm)) score += 8
+    for (const token of nameNorm.split(' ')) {
+      if (token.length < 3) continue
+      if (taskText.includes(token)) score += 1
+    }
+    if (candidate.hasProjectMarker) score += devTask ? 3 : 1
+    if (candidate.hasSourceMarker) score += 1
+    if (!best || score > best.score) best = { dir: candidate.dir, score }
+  }
+  if (best && best.score >= 4) return best.dir
+  if (devTask && markerCandidates.length === 1) return markerCandidates[0].dir
+  return null
+}
+function resolveTaskExecutionCwd(task: ScheduleTaskMeta, sessions: Record<string, SessionLike>): string {
+  const workspaceRoot = path.resolve(WORKSPACE_DIR)
+  const explicitCwd = normalizeDirCandidate(task.cwd, workspaceRoot)
+  if (explicitCwd) return explicitCwd
+  const projectId = typeof task.projectId === 'string' ? task.projectId.trim() : ''
+  if (projectId) {
+    const projectDir = path.join(WORKSPACE_PROJECTS_DIR, projectId)
+    if (isExistingDirectory(projectDir)) return projectDir
+  }
+  const fileRef = typeof task.file === 'string' ? task.file.trim() : ''
+  if (fileRef) {
+    const filePath = path.isAbsolute(fileRef) ? fileRef : path.resolve(workspaceRoot, fileRef)
+    const fileDir = isExistingDirectory(filePath) ? filePath : path.dirname(filePath)
+    if (isExistingDirectory(fileDir) && isWithinDirectory(workspaceRoot, fileDir)) return fileDir
+  }
+  const inferredCwd = inferWorkspaceProjectCwd(task)
+  if (inferredCwd) return inferredCwd
+  const sourceSessionId = typeof task.createdInSessionId === 'string' ? task.createdInSessionId.trim() : ''
+  const sourceSessionCwd = sourceSessionId
+    ? normalizeDirCandidate(sessions[sourceSessionId]?.cwd, workspaceRoot)
+    : null
+  if (sourceSessionCwd && path.resolve(sourceSessionCwd) !== workspaceRoot) return sourceSessionCwd
+  const runSessionId = typeof task.sessionId === 'string' ? task.sessionId.trim() : ''
+  const runSessionCwd = runSessionId
+    ? normalizeDirCandidate(sessions[runSessionId]?.cwd, workspaceRoot)
+    : null
+  if (runSessionCwd && path.resolve(runSessionCwd) !== workspaceRoot) return runSessionCwd
+  const sandboxDir = path.join(workspaceRoot, 'tasks', task.id)
+  fs.mkdirSync(sandboxDir, { recursive: true })
+  return sandboxDir
+}
 function queueContains(queue: string[], id: string): boolean {
   return queue.includes(id)
 }
@@ -315,12 +493,34 @@ export function resolveTaskOriginConnectorFollowupTarget(params: {
 // Task result extraction now uses Zod-validated structured data
 // from ./task-result.ts (extractTaskResult, formatResultBody)
+/** Check if a task result looks incomplete (agent stopped mid-objective). */
+function looksIncomplete(text: string): boolean {
+  if (!text) return false
+  const trimmed = text.trim()
+  // Ends with ellipsis or continuation signal
+  if (trimmed.endsWith('...') || trimmed.endsWith('…')) return true
+  // Ends with a step/phase header (agent was listing next steps)
+  if (/(?:^|\n)#{1,3}\s+(?:Step|Phase|Next)\s+\d/i.test(trimmed.slice(-200))) return true
+  // Contains forward-looking language at the end
+  const lastChunk = trimmed.slice(-300).toLowerCase()
+  if (/\b(?:next i(?:'ll| will)|now i(?:'ll| will)|let me (?:now|next)|moving on to|proceeding to)\b/.test(lastChunk)) return true
+  return false
+}
 async function executeTaskRun(
   task: BoardTask,
   agent: Agent,
   sessionId: string,
 ): Promise<string> {
-  const prompt = task.description || task.title
+  const basePrompt = task.description || task.title
+  const prompt = [
+    basePrompt,
+    '',
+    'Completion requirements:',
+    '- Execute the task before replying; do not reply with only a plan.',
+    '- Include concrete evidence in your final summary: changed file paths, commands run, and verification results.',
+    '- If blocked, state the blocker explicitly and what input or permission is missing.',
+  ].join('\n')
   if (agent?.isOrchestrator) {
     return executeOrchestrator(agent, prompt, sessionId, task.id)
   }
@@ -330,11 +530,24 @@ async function executeTaskRun(
     message: prompt,
     internal: false,
     source: 'task',
+    runId: task.id,
   })
-  const text = typeof run.text === 'string' ? run.text.trim() : ''
-  if (text) return text
-  if (run.error) return `Error: ${run.error}`
-  return ''
+  let text = typeof run.text === 'string' ? run.text.trim() : ''
+  if (run.error) return text ? text : `Error: ${run.error}`
+  // Auto-continue if the result looks incomplete
+  if (text && looksIncomplete(text)) {
+    const followUp = await executeSessionChatTurn({
+      sessionId,
+      message: 'Continue and complete the remaining steps. Provide a final summary when done.',
+      internal: false,
+      source: 'task',
+    })
+    const contText = typeof followUp.text === 'string' ? followUp.text.trim() : ''
+    if (contText) text = contText
+  }
+  return text
 }
 function notifyMainChatScheduleResult(task: BoardTask): void {
@@ -377,8 +590,8 @@ function notifyMainChatScheduleResult(task: BoardTask): void {
   const now = Date.now()
   let changed = false
-  const buildMsg = (): Message => {
-    const msg: Message = { role: 'assistant', text: body, time: now, kind: 'system' }
+  const buildMsg = (): SessionMessageLike => {
+    const msg: SessionMessageLike = { role: 'assistant', text: body, time: now, kind: 'system' }
     if (firstImage) msg.imageUrl = firstImage.url
     return msg
   }
@@ -701,6 +914,7 @@ export function enqueueTask(taskId: string) {
 export function validateCompletedTasksQueue() {
   const tasks = loadTasks()
   const sessions = loadSessions()
+  const settings = loadSettings()
   const now = Date.now()
   let checked = 0
   let demoted = 0
@@ -717,7 +931,7 @@ export function validateCompletedTasksQueue() {
       tasksDirty = true
     }
-    const validation = validateTaskCompletion(task, { report })
+    const validation = validateTaskCompletion(task, { report, settings })
     const prevValidation = task.validation || null
     const validationChanged = !prevValidation
       || prevValidation.ok !== validation.ok
@@ -802,6 +1016,32 @@ function scheduleRetryOrDeadLetter(task: BoardTask, reason: string): 'retry' | '
     text: `Task moved to dead-letter after ${task.attempts}/${task.maxAttempts} attempts.\n\nReason: ${reason}`,
     createdAt: now,
   })
+  // Guardian Auto-Rollback
+  const agents = loadAgents()
+  const agent = task.agentId ? agents[task.agentId] : null
+  if (agent?.autoRecovery) {
+    const cwd = task.projectId
+      ? path.join(WORKSPACE_DIR, 'projects', task.projectId)
+      : WORKSPACE_DIR
+    const rollback = performGuardianRollback(cwd)
+    if (rollback.ok) {
+      task.comments.push({
+        id: genId(),
+        author: 'Guardian',
+        text: `Auto-recovery triggered: Workspace successfully rolled back to last clean state.`,
+        createdAt: now + 1,
+      })
+    } else {
+      task.comments.push({
+        id: genId(),
+        author: 'Guardian',
+        text: `Auto-recovery failed: ${rollback.reason}`,
+        createdAt: now + 1,
+      })
+    }
+  }
   return 'dead_lettered'
 }
@@ -903,7 +1143,9 @@ export async function processNext() {
       task.validation = null
       task.updatedAt = Date.now()
-      const taskCwd = task.cwd || WORKSPACE_DIR
+      const sessionsForCwd = loadSessions() as Record<string, SessionLike>
+      const taskCwd = resolveTaskExecutionCwd(task as ScheduleTaskMeta, sessionsForCwd)
+      task.cwd = taskCwd
       let sessionId = ''
       const scheduleTask = task as ScheduleTaskMeta
       const isScheduleTask = scheduleTask.sourceType === 'schedule'
@@ -1002,6 +1244,7 @@ export async function processNext() {
       try {
         const result = await executeTaskRun(task, agent, sessionId)
         const t2 = loadTasks()
+        const settings = loadSettings()
         if (t2[taskId]) {
           applyTaskPolicyDefaults(t2[taskId])
           // Structured extraction: Zod-validated result with typed artifacts
@@ -1018,7 +1261,7 @@ export async function processNext() {
           t2[taskId].updatedAt = Date.now()
           const report = ensureTaskCompletionReport(t2[taskId])
           if (report?.relativePath) t2[taskId].completionReportPath = report.relativePath
-          const validation = validateTaskCompletion(t2[taskId], { report })
+          const validation = validateTaskCompletion(t2[taskId], { report, settings })
           t2[taskId].validation = validation
           const now = Date.now()
@@ -1233,6 +1476,29 @@ export function recoverStalledRunningTasks(): { recovered: number; deadLettered:
   for (const task of Object.values(tasks) as BoardTask[]) {
     if (task.status !== 'running') continue
+    if (!task.startedAt) {
+      const recoveredAt = Date.now()
+      task.status = 'queued'
+      task.queuedAt = task.queuedAt || recoveredAt
+      task.retryScheduledAt = null
+      task.updatedAt = recoveredAt
+      task.error = 'Recovered inconsistent running state (missing startedAt); requeued.'
+      if (!task.comments) task.comments = []
+      task.comments.push({
+        id: genId(),
+        author: 'System',
+        text: 'Recovered inconsistent running state (missing startedAt). Task requeued.',
+        createdAt: recoveredAt,
+      })
+      pushQueueUnique(queue, task.id)
+      recovered++
+      changed = true
+      pushMainLoopEventToMainSessions({
+        type: 'task_stall_recovered',
+        text: `Recovered inconsistent running task "${task.title}" (${task.id}) and requeued it.`,
+      })
+      continue
+    }
     const since = Math.max(task.updatedAt || 0, task.startedAt || 0)
     if (!since || (now - since) < staleMs) continue
@@ -1259,6 +1525,9 @@ export function recoverStalledRunningTasks(): { recovered: number; deadLettered:
   if (changed) {
     saveTasks(tasks)
     saveQueue(queue)
+    if (recovered > 0) {
+      setTimeout(() => processNext(), 250)
+    }
   }
   return { recovered, deadLettered }

package/src/lib/server/runtime-settings.ts CHANGED

@@ -3,6 +3,7 @@ import {
   DEFAULT_AGENT_LOOP_RECURSION_LIMIT,
   DEFAULT_CLAUDE_CODE_TIMEOUT_SEC,
   DEFAULT_CLI_PROCESS_TIMEOUT_SEC,
+  DEFAULT_DELEGATION_MAX_DEPTH,
   DEFAULT_LEGACY_ORCHESTRATOR_MAX_TURNS,
   DEFAULT_LOOP_MODE,
   DEFAULT_ONGOING_LOOP_MAX_ITERATIONS,
@@ -17,6 +18,7 @@ export interface RuntimeSettings {
   agentLoopRecursionLimit: number
   orchestratorLoopRecursionLimit: number
   legacyOrchestratorMaxTurns: number
+  delegationMaxDepth: number
   ongoingLoopMaxIterations: number
   ongoingLoopMaxRuntimeMs: number | null
   shellCommandTimeoutMs: number
@@ -61,6 +63,12 @@ export function loadRuntimeSettings(): RuntimeSettings {
     1,
     300,
   )
+  const delegationMaxDepth = parseIntSetting(
+    settings.delegationMaxDepth,
+    DEFAULT_DELEGATION_MAX_DEPTH,
+    1,
+    12,
+  )
   const ongoingLoopMaxIterations = parseIntSetting(
     settings.ongoingLoopMaxIterations,
     DEFAULT_ONGOING_LOOP_MAX_ITERATIONS,
@@ -98,6 +106,7 @@ export function loadRuntimeSettings(): RuntimeSettings {
     agentLoopRecursionLimit,
     orchestratorLoopRecursionLimit,
     legacyOrchestratorMaxTurns,
+    delegationMaxDepth,
     ongoingLoopMaxIterations,
     ongoingLoopMaxRuntimeMs: ongoingLoopMaxRuntimeMinutes > 0 ? ongoingLoopMaxRuntimeMinutes * 60_000 : null,
     shellCommandTimeoutMs: shellCommandTimeoutSec * 1000,

package/src/lib/server/session-run-manager.test.ts ADDED

@@ -0,0 +1,23 @@
+import { describe, it } from 'node:test'
+import assert from 'node:assert/strict'
+import { isMainMissionSession } from './session-run-manager'
+describe('isMainMissionSession', () => {
+  it('accepts explicit main sessions', () => {
+    assert.equal(isMainMissionSession({ id: 'main-user', name: '__main__' }), true)
+  })
+  it('rejects human agent-thread sessions', () => {
+    assert.equal(
+      isMainMissionSession({ id: 'agent-thread-agent_coder-123', name: 'agent-thread:agent_coder', sessionType: 'human' }),
+      false,
+    )
+  })
+  it('accepts orchestrated sessions', () => {
+    assert.equal(
+      isMainMissionSession({ id: 'agent-thread-worker-1', name: 'agent-thread:worker', sessionType: 'orchestrated' }),
+      true,
+    )
+  })
+})

package/src/lib/server/session-run-manager.ts CHANGED

@@ -203,7 +203,7 @@ function scheduleMainLoopFollowup(sessionId: string, followup: MainLoopFollowupR
     try {
       const sessions = loadSessions()
       const session = sessions[sessionId]
-      if (!session || session.name !== '__main__') return
+      if (!session || !isMainMissionSession(session)) return
       enqueueSessionRun({
         sessionId,
         message: followup.message,
@@ -218,6 +218,16 @@ function scheduleMainLoopFollowup(sessionId: string, followup: MainLoopFollowupR
   }, delayMs)
 }
+export function isMainMissionSession(session: Record<string, unknown>): boolean {
+  const id = typeof session.id === 'string' ? session.id.trim() : ''
+  const name = typeof session.name === 'string' ? session.name.trim() : ''
+  const sessionType = typeof session.sessionType === 'string' ? session.sessionType : ''
+  if (id.startsWith('main-') || name === '__main__') return true
+  // Only orchestrated thread sessions should receive autonomous main-loop followups.
+  if (sessionType === 'orchestrated') return true
+  return false
+}
 async function drainExecution(executionKey: string): Promise<void> {
   if (state.runningByExecution.has(executionKey)) return
   const q = queueForExecution(executionKey)
@@ -271,6 +281,9 @@ async function drainExecution(executionKey: string): Promise<void> {
         resultText: result.text,
         error: result.error,
         toolEvents: result.toolEvents,
+        inputTokens: result.inputTokens,
+        outputTokens: result.outputTokens,
+        estimatedCost: result.estimatedCost,
       })
     } catch (mainLoopErr: any) {
       log.warn('session-run', `Main-loop update failed for ${next.run.id}`, mainLoopErr?.message || String(mainLoopErr))
@@ -372,6 +385,19 @@ export interface EnqueueSessionRunResult {
   abort: () => void
 }
+const LONG_TOOL_NAMES: ReadonlySet<string> = new Set(['claude_code', 'codex_cli', 'opencode_cli'])
+function computeEffectiveRunTimeoutMs(
+  baseTimeoutMs: number,
+  sessionTools: string[],
+  runtime: { claudeCodeTimeoutMs: number },
+): number {
+  const hasLongTool = sessionTools.some(t => LONG_TOOL_NAMES.has(t))
+  if (!hasLongTool) return baseTimeoutMs
+  const toolTimeout = runtime.claudeCodeTimeoutMs + 120_000
+  return Math.max(baseTimeoutMs, toolTimeout)
+}
 export function enqueueSessionRun(input: EnqueueSessionRunInput): EnqueueSessionRunResult {
   const internal = input.internal === true
   const mode = normalizeMode(input.mode, internal)
@@ -379,9 +405,13 @@ export function enqueueSessionRun(input: EnqueueSessionRunInput): EnqueueSession
   const executionKey = executionKeyForSession(input.sessionId)
   const runtime = loadRuntimeSettings()
   const defaultMaxRuntimeMs = runtime.ongoingLoopMaxRuntimeMs ?? (10 * 60_000)
+  const sessions = loadSessions()
+  const sessionData = sessions[input.sessionId]
+  const sessionTools: string[] = sessionData?.tools || []
+  const adjustedDefaultMs = computeEffectiveRunTimeoutMs(defaultMaxRuntimeMs, sessionTools, runtime)
   const effectiveMaxRuntimeMs = typeof input.maxRuntimeMs === 'number'
     ? input.maxRuntimeMs
-    : defaultMaxRuntimeMs
+    : adjustedDefaultMs
   const dedupe = findDedupeMatch(input.sessionId, input.dedupeKey)
   if (dedupe) {