npm - bosun - Versions diffs - 0.36.8 → 0.37.0 - Mend

bosun 0.36.8 → 0.37.0

This diff shows the changes between two publicly available versions of the package, as released to one of the supported registries. It is provided for informational purposes only and reflects the differences between the package versions as they appear in their respective public registries.

Files changed (58)

package/.env.example +2 -32
package/README.md +19 -3
package/agent-prompts.mjs +0 -91
package/bosun.config.example.json +3 -0
package/bosun.schema.json +10 -0
package/config.mjs +6 -75
package/copilot-shell.mjs +18 -1
package/desktop/desktop-shortcuts.mjs +200 -27
package/desktop/main.mjs +734 -113
package/desktop/package.json +1 -2
package/desktop/preload.mjs +39 -0
package/desktop-shortcut.mjs +106 -13
package/fleet-coordinator.mjs +4 -16
package/maintenance.mjs +1 -2
package/monitor.mjs +234 -3261
package/package.json +8 -5
package/primary-agent.mjs +47 -8
package/session-tracker.mjs +30 -1
package/setup-web-server.mjs +208 -0
package/task-cli.mjs +4 -38
package/task-executor.mjs +153 -2838
package/telegram-bot.mjs +55 -140
package/ui/app.js +237 -29
package/ui/components/agent-selector.js +26 -4
package/ui/components/workspace-switcher.js +18 -6
package/ui/demo.html +115 -0
package/ui/index.html +17 -3
package/ui/modules/icon-utils.js +57 -0
package/ui/modules/settings-schema.js +4 -4
package/ui/modules/streaming.js +15 -0
package/ui/modules/vision-stream.js +196 -22
package/ui/modules/voice-client-sdk.js +567 -60
package/ui/modules/voice-client.js +740 -15
package/ui/modules/voice-fallback.js +28 -6
package/ui/modules/voice-overlay.js +1505 -494
package/ui/setup.html +618 -106
package/ui/styles/components.css +65 -0
package/ui/styles/layout.css +4 -0
package/ui/styles/sessions.css +24 -0
package/ui/tabs/agents.js +125 -28
package/ui/tabs/chat.js +233 -21
package/ui/tabs/settings.js +318 -109
package/ui/tabs/tasks.js +5 -11
package/ui-server.mjs +458 -123
package/vision-session-state.mjs +35 -0
package/voice-action-dispatcher.mjs +163 -20
package/voice-agents-sdk.mjs +32 -10
package/voice-auth-manager.mjs +95 -28
package/voice-relay.mjs +555 -81
package/voice-tools.mjs +1565 -92
package/workflow-engine.mjs +38 -0
package/workflow-migration.mjs +2 -0
package/workflow-nodes.mjs +1101 -0
package/workflow-templates/agents.mjs +1 -0
package/workflow-templates/github.mjs +2 -1
package/workflow-templates/reliability.mjs +2 -0
package/workflow-templates/task-lifecycle.mjs +595 -0
package/workflow-templates.mjs +144 -3

package/.env.example CHANGED Viewed

@@ -4,8 +4,8 @@
 # All variables are optional unless marked [REQUIRED].
 # Boolean flags use true/false (preferred). Legacy 1/0 is still accepted.
 # Profile guidance:
-#  - Local development: DEVMODE=true, DEVMODE_MONITOR_MONITOR_ENABLED=true, *_TRANSPORT=sdk
-#  - End-user stable:  DEVMODE=false, DEVMODE_MONITOR_MONITOR_ENABLED=false, *_TRANSPORT=sdk
+#  - Local development: DEVMODE=true, *_TRANSPORT=sdk
+#  - End-user stable:  DEVMODE=false, *_TRANSPORT=sdk
 # ─── Task Claims and Coordination ─────────────────────────────────────────────
 # Shared state manager enables distributed task coordination across multiple
@@ -222,10 +222,6 @@ VOICE_DELEGATE_EXECUTOR=codex-sdk
 # SENTINEL_RESTART_BACKOFF_SEC=5
 # After manual /stop, suppress auto-restart for this many minutes (default: 10)
 # SENTINEL_MANUAL_STOP_HOLD_MIN=10
-# In devmode, validate monitor-monitor freshness before restart decisions (default: 1)
-# SENTINEL_MONITOR_MONITOR_CHECK_ENABLED=true
-# Max acceptable monitor-monitor age in minutes (default: 20)
-# SENTINEL_MONITOR_MONITOR_MAX_AGE_MIN=20
 # ─── Notification Batching (RECOMMENDED) ─────────────────────────────────────
 # Batch notifications into periodic summaries instead of spamming individual messages
@@ -776,31 +772,6 @@ VK_RECOVERY_PORT=54089
 # scripts check for this and exit silently if not present, preventing
 # hooks from firing in standalone Copilot/Codex/Claude sessions.
-# ─── Devmode Monitor-Monitor (24/7 reliability guardian) ───────────────────
-# Prompt is injected directly from bosun source (no .github/agents file required).
-# Enabled by default in devmode source checkouts. Set to false to disable.
-# DEVMODE_MONITOR_MONITOR_ENABLED=true
-# Poll interval for monitor-monitor runs (milliseconds). Default: 300000 (5 min)
-# DEVMODE_MONITOR_MONITOR_INTERVAL_MS=300000
-# Status stream update interval (milliseconds). Default: 1800000 (30 min)
-# DEVMODE_MONITOR_MONITOR_STATUS_INTERVAL_MS=1800000
-# Per-run timeout before watchdog abort/failover (milliseconds).
-# Default is 21600000 (6h) for long-running reliability analysis sessions.
-# 30 minutes (1800000) is safe if you prefer faster failover on stuck runs.
-# Watchdog abort triggers at timeout+60s, then accelerated force-reset at +120s.
-# Set this explicitly to avoid inherited shell
-# defaults (for example DEVMODE_AUTO_CODE_FIX_TIMEOUT_MS=300000).
-# DEVMODE_MONITOR_MONITOR_TIMEOUT_MS=1800000
-# Optional timeout bounds (applied only when set):
-# DEVMODE_MONITOR_MONITOR_TIMEOUT_MIN_MS=600000
-# DEVMODE_MONITOR_MONITOR_TIMEOUT_MAX_MS=7200000
-# Optional override for Claude tool access (comma-separated)
-# DEVMODE_MONITOR_MONITOR_CLAUDE_ALLOWED_TOOLS=Read,Write,Edit,Grep,Glob,Bash,WebSearch,Task,Skill
-# Legacy alias: DEVMODE_AUTO_CODE_FIX=true also enables this subsystem.
-# Legacy timeout fallback: if DEVMODE_MONITOR_MONITOR_TIMEOUT_MS is unset and
-# DEVMODE_AUTO_CODE_FIX_TIMEOUT_MS is set, monitor-monitor will use it (and
-# still apply DEVMODE_MONITOR_MONITOR_TIMEOUT_MIN_MS/MAX_MS bounds if provided).
 # ─── Copilot SDK (Primary Agent) ─────────────────────────────────────────────
 # Requires GitHub Copilot CLI installed and authenticated.
 # Set to true to disable Copilot SDK (primary agent) usage.
@@ -1046,7 +1017,6 @@ COPILOT_CLOUD_DISABLED=true
 # Files in that folder are loaded automatically and are intended for per-project customization.
 # You can also override any prompt path explicitly with env vars:
 # BOSUN_PROMPT_PLANNER=.bosun/agents/task-planner.md
-# BOSUN_PROMPT_MONITOR_MONITOR=.bosun/agents/monitor-monitor.md
 # BOSUN_PROMPT_TASK_EXECUTOR=.bosun/agents/task-executor.md
 # BOSUN_PROMPT_REVIEWER=.bosun/agents/reviewer.md
 # BOSUN_PROMPT_SDK_CONFLICT_RESOLVER=.bosun/agents/sdk-conflict-resolver.md

package/README.md CHANGED Viewed

@@ -3,10 +3,10 @@
 </p>
 <h1 align="center">bosun</h1>
-Bosun is a production-grade supervisor for AI coding agents. It routes tasks across executors, automates PR lifecycles, and keeps operators in control through Telegram, the Mini App dashboard, and optional WhatsApp notifications.
+Bosun is a production-grade control plane for an autonomous software engineer. It plans and routes work across executors, automates PR lifecycles, and keeps operators in control through Telegram, the Mini App dashboard, and optional WhatsApp notifications.
 <p align="center">
-  <a href="https://bosun.virtengine.com">Website</a> · <a href="https://bosun.virtengine.com/docs/">Docs</a> · <a href="https://github.com/virtengine/bosun?tab=readme-ov-file#bosun">GitHub</a> · <a href="https://www.npmjs.com/package/bosun">npm</a> · <a href="https://github.com/virtengine/bosun/issues">Issues</a>
+  <a href="https://bosun.engineer">Website</a> · <a href="https://bosun.engineer/docs/">Docs</a> · <a href="https://github.com/virtengine/bosun?tab=readme-ov-file#bosun">GitHub</a> · <a href="https://www.npmjs.com/package/bosun">npm</a> · <a href="https://github.com/virtengine/bosun/issues">Issues</a>
 </p>
 <p align="center">
@@ -82,6 +82,22 @@ Fallback admin auth (secondary path) is available and stores only Argon2id hash
 - Provides Telegram control and a Mini App dashboard
 - Integrates with GitHub, Jira, and Vibe-Kanban boards
+## Autonomous Engineer Workflow Capabilities
+Bosun workflows provide a professional, end-to-end execution loop for autonomous delivery:
+- Trigger intake: consume issues, comments, schedules, and webhook events
+- Planning and decomposition: convert goals into scoped tasks with execution context
+- Routed execution: dispatch tasks to the best executor profile with retries and failover
+- Quality gates: enforce test/build/review checks before merge decisions
+- Recovery and escalation: auto-heal stalled runs, then escalate with clear operator signals
+Setup profiles for default workflow behavior:
+- Manual Dispatch: human-directed flow with guardrails and review automations
+- Balanced (Recommended): daily default with PR quality gates and targeted self-healing
+- Autonomous: expanded end-to-end automation for planning, recovery, and maintenance
 ### Executor quick-start
 | Executor          | `primaryAgent` value | Key env vars                                                                          |
@@ -103,7 +119,7 @@ Set `primaryAgent` in `.bosun/bosun.config.json` or choose an executor preset du
 ## Documentation
-**Published docs (website):** https://bosun.virtengine.com/docs/
+**Published docs (website):** https://bosun.engineer/docs/
 **Source docs (markdown):** `_docs/` is the source of truth for long-form documentation. The website should be generated from the same markdown content so docs stay in sync.

package/agent-prompts.mjs CHANGED Viewed

@@ -17,16 +17,6 @@ const PROMPT_DEFS = [
     filename: "orchestrator.md",
     description: "Primary task execution prompt for autonomous task agents.",
   },
-  {
-    key: "planner",
-    filename: "task-planner.md",
-    description: "Backlog planning prompt used by task planner runs.",
-  },
-  {
-    key: "monitorMonitor",
-    filename: "monitor-monitor.md",
-    description: "Long-running reliability monitor prompt used in devmode.",
-  },
   {
     key: "taskExecutor",
     filename: "task-executor.md",
@@ -199,68 +189,6 @@ apply patterns discovered by previous agents:
 After completing a task, if you discovered a non-obvious pattern, workaround, or
 domain-specific fact, write or update a skill file at \`.bosun/skills/<module>.md\`
 so the next agent benefits from your investigation.
-`,
-  planner: `# Codex-Task-Planner Agent
-You generate production-grade backlog tasks for autonomous executors.
-## Mission
-1. Analyze current repo and delivery state.
-2. Identify highest-value next work.
-3. Create concrete, execution-ready tasks.
-## Requirements
-- Avoid vague tasks and duplicate work.
-- Balance reliability fixes, feature delivery, and debt reduction.
-- Every task includes implementation steps, acceptance criteria, and verification plan.
-- Every task title starts with one size label: [xs], [s], [m], [l], [xl], [xxl].
-- Prefer task sets that can run in parallel with low file overlap.
-- Do not call any kanban API, CLI, or external service to create tasks.
-  The workflow will automatically materialize your output into kanban tasks.
-- Output must be machine-parseable JSON — see Output Contract below.
-- Task objects must be valid for Bosun backlog creation with fields:
-  \'title\', \'description\', \'implementation_steps\', \'acceptance_criteria\',
-  \'verification\', optional \'base_branch\'.
-- Do not emit empty or placeholder tasks. Every task must be actionable and execution-ready.
-## Output Contract (MANDATORY — STRICT)
-Your ENTIRE response must be a single fenced JSON block. Do NOT include any
-text, commentary, explanations, or markdown before or after the JSON block.
-The downstream parser extracts JSON from fenced blocks — any deviation causes
-task creation to hard-fail.
-Return exactly this shape:
-\`\`\`json
-{
-  "tasks": [
-    {
-      "title": "[m] feat(veid): example task title",
-      "description": "Problem statement and scope",
-      "implementation_steps": ["step 1", "step 2"],
-      "acceptance_criteria": ["criterion 1", "criterion 2"],
-      "verification": ["test/check 1", "test/check 2"],
-      "base_branch": "origin/veid"
-    }
-  ]
-}
-\`\`\`
-Rules:
-- The \`tasks\` array MUST contain at least the requested task count.
-- Do NOT output partial JSON, truncated arrays, or commentary mixed with JSON.
-- Keep titles unique and specific.
-- Keep file overlap low across tasks to maximize parallel execution.
-- Descriptions must include concrete implementation details, not generic intent text.
-- Include verification commands/checks that a worker can run without additional planning.
-- **Module branch routing:** When the task title follows conventional commit format
-  \`feat(module):\` or \`fix(module):\`, set \`base_branch\` to \`origin/<module>\`.
-  This routes the task to the module's dedicated branch for parallel, isolated development.
-  Examples: \`feat(veid):\` → \`"base_branch": "origin/veid"\`, \`fix(market):\` → \`"base_branch": "origin/market"\`.
-  Omit \`base_branch\` for cross-cutting tasks that span multiple modules.
 `,
   taskManager: `# Bosun Task Manager Agent
@@ -305,8 +233,6 @@ bosun task stats --json
 # Bulk import from JSON file
 bosun task import ./backlog.json
-# Trigger AI task planner
-bosun task plan --count 5 --reason "Sprint planning"
 \`\`\`
 ### 2. REST API (port 18432 — always available when bosun daemon runs)
@@ -440,23 +366,6 @@ draft → todo → inprogress → inreview → done
 7. **Module branch routing** — When a task title follows conventional commit format
    \`feat(module):\` or \`fix(module):\`, set \`baseBranch\` to \`origin/<module>\` to route the task
    to the module's dedicated branch for parallel, isolated development.
-`,
-  monitorMonitor: `# Bosun-Monitor Agent
-You are the always-on reliability guardian for bosun in devmode.
-## Core Role
-- Monitor logs, failures, and agent/orchestrator behavior continuously.
-- Immediately fix reliability regressions and execution blockers.
-- Improve prompt/tool/executor reliability to reduce failure loops.
-- Only when runtime is healthy, perform code-analysis improvements.
-## Constraints
-- Operate only in devmode.
-- Do not commit/push/initiate PR lifecycle changes in this context.
-- Apply focused fixes, run focused validation, and keep monitoring.
 `,
   taskExecutor: `# {{TASK_ID}} — {{TASK_TITLE}}

package/bosun.config.example.json CHANGED Viewed

@@ -2,6 +2,9 @@
   "$schema": "./bosun.schema.json",
   "projectName": "my-project",
   "primaryAgent": "codex-sdk",
+  "_comment_workflowFirst": "Set to true to run everything as workflows (task lifecycle, PR management, etc.)",
+  "workflowFirst": false,
   "kanban": {
     "backend": "vk"
   },

package/bosun.schema.json CHANGED Viewed

@@ -33,6 +33,16 @@
     "watchEnabled": { "type": "boolean" },
     "echoLogs": { "type": "boolean" },
     "autoFixEnabled": { "type": "boolean" },
+    "workflowFirst": {
+      "type": "boolean",
+      "default": false,
+      "description": "When true, all modules start in WORKFLOW mode by default. The task executor lifecycle is fully delegated to workflow templates (workflowOwnsTaskLifecycle). Bosun acts as a thin shell around the workflow engine."
+    },
+    "workflowOwnsTaskLifecycle": {
+      "type": "boolean",
+      "default": false,
+      "description": "Delegate task finalization and recovery to workflow automation instead of the legacy TaskExecutor. Automatically set to true when workflowFirst is enabled."
+    },
     "interactiveShellEnabled": { "type": "boolean" },
     "shellEnabled": { "type": "boolean" },
     "codexEnabled": { "type": "boolean" },

package/config.mjs CHANGED Viewed

@@ -506,7 +506,9 @@ function normalizeExecutorModels(executor, models, variant = "DEFAULT") {
     );
     return inferred.length > 0 ? inferred : [...known];
   }
-  return input.filter((model) => known.has(model));
+  // Preserve custom/deployment slugs in addition to known models so user-provided
+  // model routing survives normalization (for example Azure deployment names).
+  return [...new Set(input.filter(Boolean))];
 }
 function normalizeExecutorEntry(entry, index = 0, total = 1) {
@@ -540,49 +542,8 @@ function normalizeExecutorEntry(entry, index = 0, total = 1) {
   };
 }
-function buildDefaultTriggerTemplates({
-  plannerMode,
-  plannerPerCapitaThreshold,
-  plannerIdleSlotThreshold,
-  plannerDedupHours,
-} = {}) {
+function buildDefaultTriggerTemplates() {
   return [
-    {
-      id: "task-planner",
-      name: "Task Planner",
-      description: "Create planning tasks when backlog/slot metrics indicate replenishment.",
-      enabled: false,
-      action: "task-planner",
-      trigger: {
-        anyOf: [
-          {
-            kind: "metric",
-            metric: "backlogPerCapita",
-            operator: "lt",
-            value: plannerPerCapitaThreshold,
-          },
-          {
-            kind: "metric",
-            metric: "idleSlots",
-            operator: "gte",
-            value: plannerIdleSlotThreshold,
-          },
-          {
-            kind: "metric",
-            metric: "backlogRemaining",
-            operator: "eq",
-            value: 0,
-          },
-        ],
-      },
-      minIntervalMinutes: Math.max(1, Number(plannerDedupHours || 6) * 60),
-      config: {
-        plannerMode,
-        defaultTaskCount: Number(process.env.TASK_PLANNER_DEFAULT_COUNT || "30"),
-        executor: "auto",
-        model: "auto",
-      },
-    },
     {
       id: "daily-review-digest",
       name: "Daily Review Digest",
@@ -1990,32 +1951,8 @@ export function loadConfig(argv = process.argv, options = {}) {
     "summary"
   ).toLowerCase();
-  // ── Task Planner ─────────────────────────────────────────
-  // Mode: "codex-sdk" (default) runs Codex directly, "kanban" creates a VK
-  // task for a real agent to plan, "disabled" turns off the planner entirely.
-  const plannerMode = (
-    process.env.TASK_PLANNER_MODE ||
-    configData.plannerMode ||
-    (mode === "generic" ? "disabled" : "codex-sdk")
-  ).toLowerCase();
-  const plannerPerCapitaThreshold = Number(
-    process.env.TASK_PLANNER_PER_CAPITA_THRESHOLD || "1",
-  );
-  const plannerIdleSlotThreshold = Number(
-    process.env.TASK_PLANNER_IDLE_SLOT_THRESHOLD || "1",
-  );
-  const plannerDedupHours = Number(process.env.TASK_PLANNER_DEDUP_HOURS || "6");
-  const plannerDedupMs = Number.isFinite(plannerDedupHours)
-    ? plannerDedupHours * 60 * 60 * 1000
-    : 24 * 60 * 60 * 1000;
   const triggerSystemDefaults = Object.freeze({
-    templates: buildDefaultTriggerTemplates({
-      plannerMode,
-      plannerPerCapitaThreshold,
-      plannerIdleSlotThreshold,
-      plannerDedupHours,
-    }),
+    templates: buildDefaultTriggerTemplates(),
     defaults: Object.freeze({
       executor: "auto",
       model: "auto",
@@ -2290,12 +2227,6 @@ export function loadConfig(argv = process.argv, options = {}) {
     telegramCommandEnabled,
     telegramVerbosity,
-    // Task Planner
-    plannerMode,
-    plannerPerCapitaThreshold,
-    plannerIdleSlotThreshold,
-    plannerDedupHours,
-    plannerDedupMs,
     triggerSystem,
     // GitHub Reconciler
@@ -2349,7 +2280,7 @@ export function loadConfig(argv = process.argv, options = {}) {
         configData.trustedCreators ||
         process.env.BOSUN_TRUSTED_CREATORS?.split(",") ||
         [],
-      // Enforce all new tasks go to backlog unless planner config allows auto-push
+      // Enforce all new tasks go to backlog
       enforceBacklog:
         typeof configData.enforceBacklog === "boolean"
           ? configData.enforceBacklog

package/copilot-shell.mjs CHANGED Viewed

@@ -469,9 +469,26 @@ async function ensureClientStarted() {
   const modeLabel = clientOptions.cliUrl ? "remote" : "local (stdio)";
   console.log(`[copilot-shell] starting client in ${modeLabel} mode`);
+  const START_TIMEOUT_MS =
+    Number(process.env.COPILOT_START_TIMEOUT_MS) || 20_000;
   await withSanitizedOpenAiEnv(async () => {
     copilotClient = new Cls(clientOptions);
-    await copilotClient.start();
+    await Promise.race([
+      copilotClient.start(),
+      new Promise((_, reject) =>
+        setTimeout(
+          () =>
+            reject(
+              new Error(
+                `Copilot CLI failed to start within ${START_TIMEOUT_MS / 1000}s — ` +
+                  `verify COPILOT_CLI_PATH or run \`gh auth login\``,
+              ),
+            ),
+          START_TIMEOUT_MS,
+        ),
+      ),
+    ]);
   });
   clientStarted = true;
   console.log("[copilot-shell] client started");