npm - opencode-swarm-plugin - Versions diffs - 0.35.0 → 0.36.1 - Mend

opencode-swarm-plugin 0.35.0 → 0.36.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (52)

package/.hive/issues.jsonl +4 -4
package/.hive/memories.jsonl +274 -1
package/.turbo/turbo-build.log +4 -4
package/.turbo/turbo-test.log +307 -307
package/CHANGELOG.md +133 -0
package/bin/swarm.ts +234 -179
package/dist/compaction-hook.d.ts +54 -4
package/dist/compaction-hook.d.ts.map +1 -1
package/dist/eval-capture.d.ts +122 -17
package/dist/eval-capture.d.ts.map +1 -1
package/dist/index.d.ts +1 -7
package/dist/index.d.ts.map +1 -1
package/dist/index.js +1278 -619
package/dist/planning-guardrails.d.ts +121 -0
package/dist/planning-guardrails.d.ts.map +1 -1
package/dist/plugin.d.ts +9 -9
package/dist/plugin.d.ts.map +1 -1
package/dist/plugin.js +1283 -329
package/dist/schemas/task.d.ts +0 -1
package/dist/schemas/task.d.ts.map +1 -1
package/dist/swarm-decompose.d.ts +0 -8
package/dist/swarm-decompose.d.ts.map +1 -1
package/dist/swarm-orchestrate.d.ts.map +1 -1
package/dist/swarm-prompts.d.ts +0 -4
package/dist/swarm-prompts.d.ts.map +1 -1
package/dist/swarm-review.d.ts.map +1 -1
package/dist/swarm.d.ts +0 -6
package/dist/swarm.d.ts.map +1 -1
package/evals/README.md +38 -0
package/evals/coordinator-session.eval.ts +154 -0
package/evals/fixtures/coordinator-sessions.ts +328 -0
package/evals/lib/data-loader.ts +69 -0
package/evals/scorers/coordinator-discipline.evalite-test.ts +536 -0
package/evals/scorers/coordinator-discipline.ts +315 -0
package/evals/scorers/index.ts +12 -0
package/examples/plugin-wrapper-template.ts +747 -34
package/package.json +2 -2
package/src/compaction-hook.test.ts +234 -281
package/src/compaction-hook.ts +221 -63
package/src/eval-capture.test.ts +390 -0
package/src/eval-capture.ts +168 -10
package/src/index.ts +89 -2
package/src/learning.integration.test.ts +0 -2
package/src/planning-guardrails.test.ts +387 -2
package/src/planning-guardrails.ts +289 -0
package/src/plugin.ts +10 -10
package/src/schemas/task.ts +0 -1
package/src/swarm-decompose.ts +21 -8
package/src/swarm-orchestrate.ts +44 -0
package/src/swarm-prompts.ts +20 -0
package/src/swarm-review.ts +41 -0
package/src/swarm.integration.test.ts +0 -40

package/src/compaction-hook.ts CHANGED

@@ -68,11 +68,31 @@ function getLog() {
  * This is NOT about preserving state for a human - it's about the swarm continuing
  * autonomously after context compression.
  */
-export const SWARM_COMPACTION_CONTEXT = `## 🐝 SWARM ACTIVE - Keep Cooking
+export const SWARM_COMPACTION_CONTEXT = `## 🐝 SWARM ACTIVE - You Are The COORDINATOR
-You are the **COORDINATOR** of an active swarm. Context was compacted but the swarm is still running.
+Context was compacted but the swarm is still running. You are the **COORDINATOR**.
-**YOUR JOB:** Keep orchestrating. Spawn agents. Monitor progress. Unblock work. Ship it.
+### ⛔ NEVER DO THESE (Coordinator Anti-Patterns)
+**CRITICAL: Coordinators NEVER do implementation work. ALWAYS spawn workers.**
+- ❌ **NEVER** use \`edit\` or \`write\` tools - SPAWN A WORKER
+- ❌ **NEVER** run tests with \`bash\` - SPAWN A WORKER
+- ❌ **NEVER** implement features yourself - SPAWN A WORKER
+- ❌ **NEVER** "just do it myself to save time" - NO. SPAWN A WORKER.
+- ❌ **NEVER** reserve files with \`swarmmail_reserve\` - Workers reserve files
+**If you catch yourself about to edit a file, STOP. Use \`swarm_spawn_subtask\` instead.**
+### ✅ ALWAYS DO THESE (Coordinator Checklist)
+On resume, execute this checklist IN ORDER:
+1. \`swarm_status(epic_id="<epic>", project_key="<path>")\` - Get current state
+2. \`swarmmail_inbox(limit=5)\` - Check for agent messages
+3. For completed work: \`swarm_review\` → \`swarm_review_feedback\`
+4. For open subtasks: \`swarm_spawn_subtask\` (NOT "do it yourself")
+5. For blocked work: Investigate, unblock, reassign
 ### Preserve in Summary
@@ -89,41 +109,31 @@ Extract from session context:
 \`\`\`
 ## 🐝 Swarm State
-**Epic:** <bd-xxx> - <title>
+**Epic:** <cell-xxx> - <title>
 **Project:** <path>
 **Progress:** X/Y subtasks complete
 **Active:**
-- <bd-xxx>: <title> [in_progress] → <agent> working on <files>
+- <cell-xxx>: <title> [in_progress] → <agent> working on <files>
 **Blocked:**
-- <bd-xxx>: <title> - BLOCKED: <reason>
+- <cell-xxx>: <title> - BLOCKED: <reason>
 **Completed:**
-- <bd-xxx>: <title> ✓
+- <cell-xxx>: <title> ✓
 **Ready to Spawn:**
-- <bd-xxx>: <title> (files: <...>)
+- <cell-xxx>: <title> (files: <...>)
 \`\`\`
-### On Resume - IMMEDIATELY
-1. \`swarm_status(epic_id="<epic>", project_key="<path>")\` - Get current state
-2. \`swarmmail_inbox(limit=5)\` - Check for agent messages
-3. \`swarm_review(project_key, epic_id, task_id, files_touched)\` - Review any completed work
-4. \`swarm_review_feedback(project_key, task_id, worker_id, status, issues)\` - Approve or request changes
-5. **Spawn ready subtasks** - Don't wait, fire them off
-6. **Unblock blocked work** - Resolve dependencies, reassign if needed
-7. **Collect completed work** - Close done subtasks, verify quality
-### Keep the Swarm Cooking
+### Your Role
 - **Spawn aggressively** - If a subtask is ready and unblocked, spawn an agent
 - **Monitor actively** - Check status, read messages, respond to blockers
+- **Review work** - Use \`swarm_review\` and \`swarm_review_feedback\` for completed work
 - **Close the loop** - When all subtasks done, verify and close the epic
-- **Don't stop** - The swarm runs until the epic is closed
-**You are not waiting for instructions. You are the coordinator. Coordinate.**
+**You are the COORDINATOR. You orchestrate. You do NOT implement. Spawn workers.**
 `;
 /**
@@ -236,29 +246,30 @@ interface ToolPart {
 /**
  * Tool state (completed tools have input/output we need)
  */
-type ToolState = {
-  status: "completed";
-  input: { [key: string]: unknown };
-  output: string;
-  title: string;
-  metadata: { [key: string]: unknown };
-  time: { start: number; end: number };
-} | {
-  status: string;
-  [key: string]: unknown;
-};
+type ToolState =
+  | {
+      status: "completed";
+      input: { [key: string]: unknown };
+      output: string;
+      title: string;
+      metadata: { [key: string]: unknown };
+      time: { start: number; end: number };
+    }
+  | {
+      status: string;
+      [key: string]: unknown;
+    };
 /**
  * SDK Client type (minimal interface for scanSessionMessages)
+ *
+ * The actual SDK client uses a more complex Options-based API:
+ * client.session.messages({ path: { id: sessionID }, query: { limit } })
+ *
+ * We accept `unknown` and handle the type internally to avoid
+ * tight coupling to SDK internals.
  */
-interface OpencodeClient {
-  session: {
-    messages: (opts: { sessionID: string; limit?: number }) => Promise<{
-      info: { id: string; sessionID: string };
-      parts: ToolPart[];
-    }[]>;
-  };
-}
+export type OpencodeClient = unknown;
 /**
  * Scanned swarm state extracted from session messages
@@ -268,29 +279,32 @@ export interface ScannedSwarmState {
   epicTitle?: string;
   projectPath?: string;
   agentName?: string;
-  subtasks: Map<string, { title: string; status: string; worker?: string; files?: string[] }>;
+  subtasks: Map<
+    string,
+    { title: string; status: string; worker?: string; files?: string[] }
+  >;
   lastAction?: { tool: string; args: unknown; timestamp: number };
 }
 /**
  * Scan session messages for swarm state using SDK client
- *
+ *
  * Extracts swarm coordination state from actual tool calls:
  * - swarm_spawn_subtask → subtask tracking
  * - swarmmail_init → agent name, project path
  * - hive_create_epic → epic ID and title
  * - swarm_status → epic reference
  * - swarm_complete → subtask completion
- *
+ *
  * @param client - OpenCode SDK client (undefined if not available)
  * @param sessionID - Session to scan
  * @param limit - Max messages to fetch (default 100)
  * @returns Extracted swarm state
  */
 export async function scanSessionMessages(
-  client: OpencodeClient | undefined,
+  client: OpencodeClient,
   sessionID: string,
-  limit: number = 100
+  limit: number = 100,
 ): Promise<ScannedSwarmState> {
   const state: ScannedSwarmState = {
     subtasks: new Map(),
@@ -301,7 +315,22 @@ export async function scanSessionMessages(
   }
   try {
-    const messages = await client.session.messages({ sessionID, limit });
+    // SDK client uses Options-based API: { path: { id }, query: { limit } }
+    const sdkClient = client as {
+      session: {
+        messages: (opts: {
+          path: { id: string };
+          query?: { limit?: number };
+        }) => Promise<{ data?: Array<{ info: unknown; parts: ToolPart[] }> }>;
+      };
+    };
+    const response = await sdkClient.session.messages({
+      path: { id: sessionID },
+      query: { limit },
+    });
+    const messages = response.data || [];
     for (const message of messages) {
       for (const part of message.parts) {
@@ -310,7 +339,10 @@ export async function scanSessionMessages(
         }
         const { tool, state: toolState } = part;
-        const { input, output, time } = toolState as Extract<ToolState, { status: "completed" }>;
+        const { input, output, time } = toolState as Extract<
+          ToolState,
+          { status: "completed" }
+        >;
         // Track last action
         state.lastAction = {
@@ -407,12 +439,102 @@ export async function scanSessionMessages(
       }
     }
   } catch (error) {
+    getLog().debug(
+      {
+        error: error instanceof Error ? error.message : String(error),
+      },
+      "SDK message scanning failed",
+    );
     // SDK not available or error fetching messages - return what we have
   }
   return state;
 }
+/**
+ * Build dynamic swarm state from scanned messages (more precise than hive detection)
+ *
+ * Produces a markdown section headed "## 🐝 Current Swarm State" and returns it
+ * as a single string with the individual lines joined by "\n".
+ *
+ * Field resolution: epic ID, epic title and project path are taken from
+ * `scanned` first and fall back to `detected` via `||`, so an empty string in
+ * `scanned` also triggers the fallback.
+ *
+ * Output layout, in order:
+ * - "**Epic:**" line, only when an epic ID was resolved (title appended if known)
+ * - "**Coordinator:**" line, only when `scanned.agentName` is set
+ * - "**Project:**" line, always emitted
+ *   (NOTE(review): SwarmState is declared elsewhere - confirm its projectPath
+ *   is always populated, otherwise this line interpolates `undefined`)
+ * - "**Subtasks:**" block:
+ *   - when `scanned.subtasks` is non-empty: one line per subtask with its id,
+ *     title, "✓" for status "completed" or "[status]" otherwise, plus the
+ *     worker and file list when present
+ *   - otherwise, when `detected.subtasks` exists and its closed / in_progress /
+ *     open / blocked counts sum to more than zero: one line per non-zero count
+ * - "**Last Action:**" line with the tool name only, when `scanned.lastAction` is set
+ * - when an epic ID was resolved: a "YOU ARE THE COORDINATOR" reminder followed
+ *   by five resume steps; step 1 embeds the resolved epic ID and project path
+ *   in a `swarm_status(...)` call
+ *
+ * @param scanned - Swarm state extracted from session messages; preferred source
+ * @param detected - Swarm state from heuristic detection; used as fallback for
+ *                   epic/project fields and for subtask counts
+ * @returns Markdown text describing the current swarm state
+ */
+function buildDynamicSwarmStateFromScanned(
+  scanned: ScannedSwarmState,
+  detected: SwarmState,
+): string {
+  const parts: string[] = [];
+  parts.push("## 🐝 Current Swarm State\n");
+  // Prefer scanned data over detected
+  const epicId = scanned.epicId || detected.epicId;
+  const epicTitle = scanned.epicTitle || detected.epicTitle;
+  const projectPath = scanned.projectPath || detected.projectPath;
+  if (epicId) {
+    parts.push(`**Epic:** ${epicId}${epicTitle ? ` - ${epicTitle}` : ""}`);
+  }
+  if (scanned.agentName) {
+    parts.push(`**Coordinator:** ${scanned.agentName}`);
+  }
+  parts.push(`**Project:** ${projectPath}`);
+  // Show detailed subtask info from scanned state
+  if (scanned.subtasks.size > 0) {
+    parts.push(`\n**Subtasks:**`);
+    for (const [id, subtask] of scanned.subtasks) {
+      const status = subtask.status === "completed" ? "✓" : `[${subtask.status}]`;
+      const worker = subtask.worker ? ` → ${subtask.worker}` : "";
+      const files = subtask.files?.length ? ` (${subtask.files.join(", ")})` : "";
+      parts.push(`  - ${id}: ${subtask.title} ${status}${worker}${files}`);
+    }
+  } else if (detected.subtasks) {
+    // Fall back to counts from hive detection
+    const total =
+      detected.subtasks.closed +
+      detected.subtasks.in_progress +
+      detected.subtasks.open +
+      detected.subtasks.blocked;
+    if (total > 0) {
+      parts.push(`**Subtasks:**`);
+      if (detected.subtasks.closed > 0)
+        parts.push(`  - ${detected.subtasks.closed} closed`);
+      if (detected.subtasks.in_progress > 0)
+        parts.push(`  - ${detected.subtasks.in_progress} in_progress`);
+      if (detected.subtasks.open > 0)
+        parts.push(`  - ${detected.subtasks.open} open`);
+      if (detected.subtasks.blocked > 0)
+        parts.push(`  - ${detected.subtasks.blocked} blocked`);
+    }
+  }
+  // Show last action if available
+  if (scanned.lastAction) {
+    parts.push(`\n**Last Action:** \`${scanned.lastAction.tool}\``);
+  }
+  if (epicId) {
+    parts.push(`\n## 🎯 YOU ARE THE COORDINATOR`);
+    parts.push(``);
+    parts.push(
+      `**Primary role:** Orchestrate workers, review their output, unblock dependencies.`,
+    );
+    parts.push(`**Spawn workers** for implementation tasks - don't do them yourself.`);
+    parts.push(``);
+    parts.push(`**RESUME STEPS:**`);
+    parts.push(
+      `1. Check swarm status: \`swarm_status(epic_id="${epicId}", project_key="${projectPath}")\``,
+    );
+    parts.push(`2. Check inbox for worker messages: \`swarmmail_inbox(limit=5)\``);
+    parts.push(
+      `3. For in_progress subtasks: Review worker results with \`swarm_review\``,
+    );
+    parts.push(`4. For open subtasks: Spawn workers with \`swarm_spawn_subtask\``);
+    parts.push(`5. For blocked subtasks: Investigate and unblock`);
+  }
+  return parts.join("\n");
+}
 // ============================================================================
 // Swarm Detection
 // ============================================================================
@@ -678,17 +800,21 @@ async function detectSwarm(): Promise<SwarmDetection> {
  * Philosophy: Err on the side of continuation. A false positive costs
  * a bit of context space. A false negative loses the swarm.
  *
+ * @param client - Optional OpenCode SDK client for scanning session messages.
+ *                 When provided, extracts PRECISE swarm state from actual tool calls.
+ *                 When undefined, falls back to hive/swarm-mail heuristic detection.
+ *
  * @example
  * ```typescript
  * import { createCompactionHook } from "opencode-swarm-plugin";
  *
- * export const SwarmPlugin: Plugin = async () => ({
+ * export const SwarmPlugin: Plugin = async (input) => ({
  *   tool: { ... },
- *   "experimental.session.compacting": createCompactionHook(),
+ *   "experimental.session.compacting": createCompactionHook(input.client),
  * });
  * ```
  */
-export function createCompactionHook() {
+export function createCompactionHook(client?: OpencodeClient) {
   return async (
     input: { sessionID: string },
     output: { context: string[] },
@@ -699,41 +825,73 @@ export function createCompactionHook() {
       {
         session_id: input.sessionID,
         trigger: "session_compaction",
+        has_sdk_client: !!client,
       },
       "compaction started",
     );
     try {
+      // Scan session messages for precise swarm state (if client available)
+      const scannedState = await scanSessionMessages(client, input.sessionID);
+      // Also run heuristic detection from hive/swarm-mail
       const detection = await detectSwarm();
+      // Boost confidence if we found swarm evidence in session messages
+      let effectiveConfidence = detection.confidence;
+      if (scannedState.epicId || scannedState.subtasks.size > 0) {
+        // Session messages show swarm activity - raise confidence to at least "medium" ("high" once subtasks are found)
+        if (effectiveConfidence === "none" || effectiveConfidence === "low") {
+          effectiveConfidence = "medium";
+          detection.reasons.push("swarm tool calls found in session");
+        }
+        if (scannedState.subtasks.size > 0) {
+          effectiveConfidence = "high";
+          detection.reasons.push(`${scannedState.subtasks.size} subtasks spawned`);
+        }
+      }
       if (
-        detection.confidence === "high" ||
-        detection.confidence === "medium"
+        effectiveConfidence === "high" ||
+        effectiveConfidence === "medium"
       ) {
         // Definite or probable swarm - inject full context
         const header = `[Swarm detected: ${detection.reasons.join(", ")}]\n\n`;
-        // Build dynamic state section if we have specific data
+        // Build dynamic state section - prefer scanned state (ground truth) over detected
         let dynamicState = "";
-        if (detection.state && detection.state.epicId) {
+        if (scannedState.epicId || scannedState.subtasks.size > 0) {
+          // Use scanned state (more precise)
+          dynamicState =
+            buildDynamicSwarmStateFromScanned(
+              scannedState,
+              detection.state || {
+                projectPath: scannedState.projectPath || process.cwd(),
+                subtasks: { closed: 0, in_progress: 0, open: 0, blocked: 0 },
+              },
+            ) + "\n\n";
+        } else if (detection.state && detection.state.epicId) {
+          // Fall back to hive-detected state
           dynamicState = buildDynamicSwarmState(detection.state) + "\n\n";
         }
         const contextContent = header + dynamicState + SWARM_COMPACTION_CONTEXT;
         output.context.push(contextContent);
         getLog().info(
           {
-            confidence: detection.confidence,
+            confidence: effectiveConfidence,
             context_length: contextContent.length,
             context_type: "full",
             reasons: detection.reasons,
             has_dynamic_state: !!dynamicState,
-            epic_id: detection.state?.epicId,
+            epic_id: scannedState.epicId || detection.state?.epicId,
+            scanned_subtasks: scannedState.subtasks.size,
+            scanned_agent: scannedState.agentName,
           },
           "injected swarm context",
         );
-      } else if (detection.confidence === "low") {
+      } else if (effectiveConfidence === "low") {
         // Possible swarm - inject fallback detection prompt
         const header = `[Possible swarm: ${detection.reasons.join(", ")}]\n\n`;
         const contextContent = header + SWARM_DETECTION_FALLBACK;
@@ -741,7 +899,7 @@ export function createCompactionHook() {
         getLog().info(
           {
-            confidence: detection.confidence,
+            confidence: effectiveConfidence,
             context_length: contextContent.length,
             context_type: "fallback",
             reasons: detection.reasons,
@@ -751,7 +909,7 @@ export function createCompactionHook() {
       } else {
         getLog().debug(
           {
-            confidence: detection.confidence,
+            confidence: effectiveConfidence,
             context_type: "none",
           },
           "no swarm detected, skipping injection",
@@ -764,8 +922,8 @@ export function createCompactionHook() {
         {
           duration_ms: duration,
           success: true,
-          detected: detection.detected,
-          confidence: detection.confidence,
+          detected: detection.detected || scannedState.epicId !== undefined,
+          confidence: effectiveConfidence,
           context_injected: output.context.length > 0,
         },
         "compaction complete",