npm - opencode-swarm-plugin - Versions diffs - 0.38.0 → 0.40.0 - Mend

opencode-swarm-plugin 0.38.0 → 0.40.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (91)

package/.env +2 -0
package/.hive/eval-results.json +26 -0
package/.hive/issues.jsonl +27 -0
package/.hive/memories.jsonl +23 -1
package/.opencode/eval-history.jsonl +12 -0
package/CHANGELOG.md +182 -0
package/README.md +29 -12
package/bin/swarm.test.ts +881 -0
package/bin/swarm.ts +686 -0
package/dist/compaction-hook.d.ts +8 -1
package/dist/compaction-hook.d.ts.map +1 -1
package/dist/compaction-observability.d.ts +173 -0
package/dist/compaction-observability.d.ts.map +1 -0
package/dist/compaction-prompt-scoring.d.ts +124 -0
package/dist/compaction-prompt-scoring.d.ts.map +1 -0
package/dist/eval-capture.d.ts +174 -1
package/dist/eval-capture.d.ts.map +1 -1
package/dist/eval-gates.d.ts +84 -0
package/dist/eval-gates.d.ts.map +1 -0
package/dist/eval-history.d.ts +117 -0
package/dist/eval-history.d.ts.map +1 -0
package/dist/eval-learning.d.ts +216 -0
package/dist/eval-learning.d.ts.map +1 -0
package/dist/hive.d.ts.map +1 -1
package/dist/index.d.ts +80 -1
package/dist/index.d.ts.map +1 -1
package/dist/index.js +16098 -651
package/dist/plugin.js +16012 -756
package/dist/post-compaction-tracker.d.ts +133 -0
package/dist/post-compaction-tracker.d.ts.map +1 -0
package/dist/schemas/task.d.ts +3 -3
package/dist/swarm-orchestrate.d.ts +23 -0
package/dist/swarm-orchestrate.d.ts.map +1 -1
package/dist/swarm-prompts.d.ts +25 -1
package/dist/swarm-prompts.d.ts.map +1 -1
package/dist/swarm.d.ts +4 -0
package/dist/swarm.d.ts.map +1 -1
package/evals/README.md +702 -105
package/evals/compaction-prompt.eval.ts +149 -0
package/evals/coordinator-behavior.eval.ts +8 -8
package/evals/fixtures/compaction-prompt-cases.ts +305 -0
package/evals/lib/compaction-loader.test.ts +248 -0
package/evals/lib/compaction-loader.ts +320 -0
package/evals/lib/data-loader.test.ts +345 -0
package/evals/lib/data-loader.ts +107 -6
package/evals/scorers/compaction-prompt-scorers.ts +145 -0
package/evals/scorers/compaction-scorers.ts +13 -13
package/evals/scorers/coordinator-discipline.evalite-test.ts +166 -2
package/evals/scorers/coordinator-discipline.ts +348 -15
package/evals/scorers/index.test.ts +146 -0
package/evals/scorers/index.ts +104 -0
package/evals/swarm-decomposition.eval.ts +9 -2
package/examples/commands/swarm.md +291 -21
package/examples/plugin-wrapper-template.ts +117 -0
package/package.json +7 -5
package/scripts/migrate-unknown-sessions.ts +349 -0
package/src/compaction-capture.integration.test.ts +257 -0
package/src/compaction-hook.test.ts +42 -0
package/src/compaction-hook.ts +315 -86
package/src/compaction-observability.integration.test.ts +139 -0
package/src/compaction-observability.test.ts +187 -0
package/src/compaction-observability.ts +324 -0
package/src/compaction-prompt-scorers.test.ts +299 -0
package/src/compaction-prompt-scoring.ts +298 -0
package/src/eval-capture.test.ts +626 -1
package/src/eval-capture.ts +286 -2
package/src/eval-gates.test.ts +306 -0
package/src/eval-gates.ts +218 -0
package/src/eval-history.test.ts +508 -0
package/src/eval-history.ts +214 -0
package/src/eval-learning.test.ts +378 -0
package/src/eval-learning.ts +360 -0
package/src/eval-runner.test.ts +96 -0
package/src/eval-runner.ts +356 -0
package/src/hive.ts +34 -0
package/src/index.ts +115 -2
package/src/memory.test.ts +110 -0
package/src/memory.ts +34 -0
package/src/post-compaction-tracker.test.ts +251 -0
package/src/post-compaction-tracker.ts +237 -0
package/src/swarm-decompose.ts +2 -2
package/src/swarm-orchestrate.ts +2 -2
package/src/swarm-prompts.ts +2 -2
package/src/swarm-review.ts +3 -3
package/dist/beads.d.ts +0 -386
package/dist/beads.d.ts.map +0 -1
package/dist/schemas/bead-events.d.ts +0 -698
package/dist/schemas/bead-events.d.ts.map +0 -1
package/dist/schemas/bead.d.ts +0 -255
package/dist/schemas/bead.d.ts.map +0 -1
package/evals/{evalite.config.ts → evalite.config.ts.bak} +0 -0

package/src/compaction-hook.ts CHANGED

@@ -29,8 +29,17 @@
  * ```
  */
-import { getHiveAdapter, getHiveWorkingDirectory } from "./hive";
 import { checkSwarmHealth } from "swarm-mail";
+import {
+  CompactionPhase,
+  createMetricsCollector,
+  getMetricsSummary,
+  recordPatternExtracted,
+  recordPatternSkipped,
+  recordPhaseComplete,
+  recordPhaseStart,
+} from "./compaction-observability";
+import { getHiveAdapter, getHiveWorkingDirectory } from "./hive";
 import { createChildLogger } from "./logger";
 let _logger: any | undefined;
@@ -67,6 +76,15 @@ function getLog() {
  *
  * This is NOT about preserving state for a human - it's about the swarm continuing
  * autonomously after context compression.
+ *
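+ * Structure optimized for eval scores (sections in the order they appear in this constant):
+ * 1. ASCII header (visual anchor, coordinatorIdentity scorer)
+ * 2. What Good Looks Like (behavioral examples, outcome-focused)
+ * 3. Forbidden tools (explicit list, forbiddenToolsPresent scorer)
+ * 4. Role & mandates (strong language, coordinatorIdentity scorer)
+ * 5. Mandatory behaviors (inbox, skills, review)
+ * 6. Summary format (swarm state to preserve)
+ * 7. Reference sections (supporting material)
+ *
+ * Immediate actions (actionable tool calls, postCompactionDiscipline scorer) are
+ * NOT part of this constant: the dynamic swarm-state builders emit them, and the
+ * hook concatenates that dynamic state ahead of this text.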
  */
 export const SWARM_COMPACTION_CONTEXT = `
 ┌─────────────────────────────────────────────────────────────┐
@@ -78,28 +96,43 @@ export const SWARM_COMPACTION_CONTEXT = `
 │                                                             │
 └─────────────────────────────────────────────────────────────┘
-## 🎯 NON-NEGOTIABLE: YOU ARE THE COORDINATOR
 Context was compacted but the swarm is still running. **YOU ARE THE COORDINATOR.**
-Your role is ORCHESTRATION, not implementation. When you catch yourself about to do work directly, STOP.
+Your role is ORCHESTRATION, not implementation. The resume steps above (if present) tell you exactly what to do first.
-### ⛔ NEVER DO THESE (Coordinator Anti-Patterns)
+---
-**CRITICAL: Coordinators NEVER do implementation work. ALWAYS spawn workers.**
+## 🎯 WHAT GOOD LOOKS LIKE (Behavioral Examples)
-- ❌ **NEVER** use \`edit\` or \`write\` tools - SPAWN A WORKER
-- ❌ **NEVER** run tests with \`bash\` - SPAWN A WORKER
-- ❌ **NEVER** implement features yourself - SPAWN A WORKER
-- ❌ **NEVER** "just do it myself to save time" - NO. SPAWN A WORKER.
-- ❌ **NEVER** reserve files with \`swarmmail_reserve\` - Workers reserve files
-- ❌ **NEVER** fetch files/docs directly - SPAWN A RESEARCHER
+**✅ GOOD Coordinator Behavior:**
+- Spawned researcher for unfamiliar tech → got summary → stored in semantic-memory
+- Loaded \`skills_use(name="testing-patterns")\` BEFORE spawning test workers
+- Checked \`swarmmail_inbox()\` every 5-10 minutes → caught blocked worker → unblocked in 2min
+- Delegated planning to swarm/planner subagent → main context stayed clean
+- Workers reserved their OWN files → no conflicts
+- Reviewed all worker output with \`swarm_review\` → caught integration issue before merge
-**If you catch yourself about to edit a file, STOP. Use \`swarm_spawn_subtask\` instead.**
+**❌ COMMON MISTAKES (Avoid These):**
+- Called context7/pdf-brain directly → dumped 50KB into thread → context exhaustion
+- Skipped skill loading → workers reinvented patterns already in skills
+- Never checked inbox → worker stuck 25 minutes → silent failure
+- Reserved files as coordinator → workers blocked → swarm stalled
+- Closed cells when workers said "done" → skipped review → shipped broken code
+---
+## 🚫 FORBIDDEN TOOLS (NEVER Use These Directly)
+Coordinators do NOT do implementation work. These tools are **FORBIDDEN**:
-### 🚫 FORBIDDEN TOOLS (Coordinators MUST delegate these)
+### File Modification (ALWAYS spawn workers instead)
+- \`Edit\` - SPAWN A WORKER
+- \`Write\` - SPAWN A WORKER
+- \`bash\` (for file modifications) - SPAWN A WORKER
+- \`swarmmail_reserve\` - Workers reserve their own files
+- \`git commit\` - Workers commit their own changes
-**NEVER use these tools directly. ALWAYS spawn a researcher worker via \`swarm_spawn_researcher\`:**
+### External Data Fetching (SPAWN A RESEARCHER instead)
 **Repository fetching:**
 - \`repo-crawl_file\`, \`repo-crawl_readme\`, \`repo-crawl_search\`, \`repo-crawl_structure\`, \`repo-crawl_tree\`
@@ -112,56 +145,185 @@ Your role is ORCHESTRATION, not implementation. When you catch yourself about to
 **Knowledge base:**
 - \`pdf-brain_search\`, \`pdf-brain_read\`
-**If you need external data:** Use \`swarm_spawn_researcher\` with a clear research task. The researcher will fetch, summarize, and return findings.
+**Instead:** Use \`swarm_spawn_researcher\` with a clear research task. The researcher will fetch, summarize, and return findings.
-### ✅ ALWAYS DO THESE (Coordinator Checklist)
+---
-On resume, execute this checklist IN ORDER:
+## 💼 YOUR ROLE (Non-Negotiable)
-1. \`swarm_status(epic_id="<epic>", project_key="<path>")\` - Get current state
-2. \`swarmmail_inbox(limit=5)\` - Check for agent messages
-3. For completed work: \`swarm_review\` → \`swarm_review_feedback\`
-4. For open subtasks: \`swarm_spawn_subtask\` (NOT "do it yourself")
-5. For blocked work: Investigate, unblock, reassign
+You are the **COORDINATOR**. Your job is ORCHESTRATION, not implementation.
-### Preserve in Summary
+### What Coordinators Do:
+- ✅ Spawn workers for implementation tasks
+- ✅ Monitor worker progress via \`swarm_status\` and \`swarmmail_inbox\`
+- ✅ Review completed work with \`swarm_review\`
+- ✅ Unblock dependencies and resolve conflicts
+- ✅ Close the loop when epics complete
-Extract from session context:
+### What Coordinators NEVER Do:
+- ❌ **NEVER** edit or write files directly
+- ❌ **NEVER** run tests with \`bash\`
+- ❌ **NEVER** "just do it myself to save time"
+- ❌ **NEVER** reserve files (workers reserve)
+- ❌ **NEVER** fetch external data directly (spawn researchers)
-1. **Epic & Subtasks** - IDs, titles, status, file assignments
-2. **What's Running** - Which agents are active, what they're working on
-3. **What's Blocked** - Blockers and what's needed to unblock
-4. **What's Done** - Completed work and any follow-ups needed
-5. **What's Next** - Pending subtasks ready to spawn
+**If you catch yourself about to edit a file, STOP. Use \`swarm_spawn_subtask\` instead.**
+### Strong Mandates:
+- **ALWAYS** spawn workers for implementation tasks
+- **ALWAYS** check status and inbox before decisions
+- **ALWAYS** review worker output before accepting
+- **NON-NEGOTIABLE:** You orchestrate. You do NOT implement.
+---
+## 📋 MANDATORY BEHAVIORS (Post-Compaction Checklist)
-### Summary Format
+### 1. Inbox Monitoring (EVERY 5-10 MINUTES)
+\`\`\`
+swarmmail_inbox(limit=5)           # Check for messages
+swarmmail_read_message(message_id=N)  # Read urgent ones
+swarm_status(epic_id, project_key)    # Overall progress
+\`\`\`
+**Intervention triggers:** Worker blocked >5min, file conflict, scope creep
+### 2. Skill Loading (BEFORE spawning workers)
+\`\`\`
+skills_use(name="swarm-coordination")  # ALWAYS for swarms
+skills_use(name="testing-patterns")    # If task involves tests
+skills_use(name="system-design")       # If architectural decisions
+\`\`\`
+**Include skill recommendations in shared_context for workers.**
+### 3. Worker Review (AFTER EVERY worker returns)
+\`\`\`
+swarm_review(project_key, epic_id, task_id, files_touched)
+# Evaluate: Does it fulfill requirements? Enable downstream tasks? Type safe?
+swarm_review_feedback(project_key, task_id, worker_id, status, issues)
+\`\`\`
+**3-Strike Rule:** After 3 rejections → mark blocked → escalate to human.
+### 4. Research Spawning (For unfamiliar tech)
+\`\`\`
+Task(subagent_type="swarm-researcher", prompt="Research <topic>...")
+\`\`\`
+**NEVER call context7, pdf-brain, webfetch directly.** Spawn a researcher.
+---
+## 📝 SUMMARY FORMAT (Preserve This State)
+When compaction occurs, extract and preserve this structure:
 \`\`\`
 ## 🐝 Swarm State
-**Epic:** <cell-xxx> - <title>
-**Project:** <path>
+**Epic:** CELL_ID - TITLE
+**Project:** PROJECT_PATH
 **Progress:** X/Y subtasks complete
 **Active:**
-- <cell-xxx>: <title> [in_progress] → <agent> working on <files>
+- CELL_ID: TITLE [in_progress] → AGENT working on FILES
 **Blocked:**
-- <cell-xxx>: <title> - BLOCKED: <reason>
+- CELL_ID: TITLE - BLOCKED: REASON
 **Completed:**
-- <cell-xxx>: <title> ✓
+- CELL_ID: TITLE ✓
 **Ready to Spawn:**
-- <cell-xxx>: <title> (files: <...>)
+- CELL_ID: TITLE (files: FILES)
+\`\`\`
+### What to Extract:
+1. **Epic & Subtasks** - IDs, titles, status, file assignments
+2. **What's Running** - Active agents and their current work
+3. **What's Blocked** - Blockers and what's needed to unblock
+4. **What's Done** - Completed work and follow-ups
+5. **What's Next** - Pending subtasks ready to spawn
+---
+## 📋 REFERENCE: Full Coordinator Workflow
+You are ALWAYS swarming. Use this workflow for any new work:
+### Phase 1.5: Research (For Complex Tasks)
+If the task requires unfamiliar technologies, spawn a researcher FIRST:
+\`\`\`
+swarm_spawn_researcher(
+  research_id="research-TOPIC",
+  epic_id="mjkw...",  # your epic ID
+  tech_stack=["TECHNOLOGY"],
+  project_path="PROJECT_PATH"
+)
+// Then spawn with Task(subagent_type="swarm/researcher", prompt="...")
+\`\`\`
+### Phase 2: Knowledge Gathering
+\`\`\`
+semantic-memory_find(query="TASK_KEYWORDS", limit=5)   # Past learnings
+cass_search(query="TASK_DESCRIPTION", limit=5)         # Similar past tasks
+skills_list()                                          # Available skills
+\`\`\`
+### Phase 3: Decompose
+\`\`\`
+swarm_select_strategy(task="TASK")
+swarm_plan_prompt(task="TASK", context="KNOWLEDGE")
+swarm_validate_decomposition(response="CELLTREE_JSON")
+\`\`\`
+### Phase 4: Create Cells
+\`hive_create_epic(epic_title="TASK", subtasks=[...])\`
+### Phase 5: File Reservations
+> **⚠️ Coordinator NEVER reserves files.** Workers reserve their own files with \`swarmmail_reserve\`.
+### Phase 6: Spawn Workers
+\`\`\`
+swarm_spawn_subtask(bead_id, epic_id, title, files, shared_context, project_path)
+Task(subagent_type="swarm/worker", prompt="GENERATED_PROMPT")
+\`\`\`
+### Phase 7: Review Loop (MANDATORY)
+**AFTER EVERY Task() RETURNS:**
+1. \`swarmmail_inbox()\` - Check for messages
+2. \`swarm_review(project_key, epic_id, task_id, files_touched)\` - Generate review
+3. Evaluate against epic goals
+4. \`swarm_review_feedback(project_key, task_id, worker_id, status, issues)\`
+**If needs_changes:**
+\`\`\`
+swarm_spawn_retry(bead_id, epic_id, original_prompt, attempt, issues, diff, files, project_path)
+// Spawn NEW worker with Task() using retry prompt
+// Max 3 attempts before marking task blocked
 \`\`\`
-### Your Role
+### Phase 8: Complete
+\`hive_sync()\` - Sync all cells to git
+---
+## 📊 REFERENCE: Decomposition Strategies
+| Strategy       | Best For                 | Keywords                               |
+| -------------- | ------------------------ | -------------------------------------- |
+| file-based     | Refactoring, migrations  | refactor, migrate, rename, update all  |
+| feature-based  | New features             | add, implement, build, create, feature |
+| risk-based     | Bug fixes, security      | fix, bug, security, critical, urgent   |
-- **Spawn aggressively** - If a subtask is ready and unblocked, spawn an agent
-- **Monitor actively** - Check status, read messages, respond to blockers
-- **Review work** - Use \`swarm_review\` and \`swarm_review_feedback\` for completed work
-- **Close the loop** - When all subtasks done, verify and close the epic
+---
 **You are the COORDINATOR. You orchestrate. You do NOT implement. Spawn workers.**
 `;
@@ -220,7 +382,27 @@ Include this in your summary:
 function buildDynamicSwarmState(state: SwarmState): string {
   const parts: string[] = [];
-  parts.push("## 🐝 Current Swarm State\n");
+  // Lead with epic context
+  if (state.epicId && state.epicTitle) {
+    parts.push(`You are coordinating epic **${state.epicId}** - ${state.epicTitle}`);
+  } else if (state.epicId) {
+    parts.push(`You are coordinating epic **${state.epicId}**`);
+  }
+  parts.push(`Project: ${state.projectPath}\n`);
+  // IMMEDIATE ACTIONS section (must come FIRST for postCompactionDiscipline scoring)
+  if (state.epicId) {
+    parts.push(`## 1️⃣ IMMEDIATE ACTIONS (Do These FIRST)\n`);
+    parts.push(`1. \`swarm_status(epic_id="${state.epicId}", project_key="${state.projectPath}")\` - Get current swarm state`);
+    parts.push(`2. \`swarmmail_inbox(limit=5)\` - Check for worker messages and blockers`);
+    parts.push(`3. For completed work: Review with \`swarm_review\` → \`swarm_review_feedback\``);
+    parts.push(`4. For open subtasks: Spawn workers with \`swarm_spawn_subtask\``);
+    parts.push(`5. For blocked work: Investigate, unblock, or reassign\n`);
+  }
+  // Swarm state summary
+  parts.push(`## 🐝 Current Swarm State\n`);
   if (state.epicId && state.epicTitle) {
     parts.push(`**Epic:** ${state.epicId} - ${state.epicTitle}`);
@@ -237,21 +419,7 @@ function buildDynamicSwarmState(state: SwarmState): string {
     }
   }
-  parts.push(`**Project:** ${state.projectPath}`);
-  if (state.epicId) {
-    parts.push(`\n## 🎯 YOU ARE THE COORDINATOR`);
-    parts.push(``);
-    parts.push(`**Primary role:** Orchestrate workers, review their output, unblock dependencies.`);
-    parts.push(`**Spawn workers** for implementation tasks - don't do them yourself.`);
-    parts.push(``);
-    parts.push(`**RESUME STEPS:**`);
-    parts.push(`1. Check swarm status: \`swarm_status(epic_id="${state.epicId}", project_key="${state.projectPath}")\``);
-    parts.push(`2. Check inbox for worker messages: \`swarmmail_inbox(limit=5)\``);
-    parts.push(`3. For in_progress subtasks: Review worker results with \`swarm_review\``);
-    parts.push(`4. For open subtasks: Spawn workers with \`swarm_spawn_subtask\``);
-    parts.push(`5. For blocked subtasks: Investigate and unblock`);
-  }
+  parts.push(`**Project:** ${state.projectPath}\n`);
   return parts.join("\n");
 }
@@ -490,22 +658,44 @@ function buildDynamicSwarmStateFromScanned(
 ): string {
   const parts: string[] = [];
-  parts.push("## 🐝 Current Swarm State\n");
   // Prefer scanned data over detected
   const epicId = scanned.epicId || detected.epicId;
   const epicTitle = scanned.epicTitle || detected.epicTitle;
   const projectPath = scanned.projectPath || detected.projectPath;
-  if (epicId) {
-    parts.push(`**Epic:** ${epicId}${epicTitle ? ` - ${epicTitle}` : ""}`);
+  // Lead with epic context
+  if (epicId && epicTitle) {
+    parts.push(`You are coordinating epic **${epicId}** - ${epicTitle}`);
+  } else if (epicId) {
+    parts.push(`You are coordinating epic **${epicId}**`);
   }
   if (scanned.agentName) {
-    parts.push(`**Coordinator:** ${scanned.agentName}`);
+    parts.push(`Coordinator: ${scanned.agentName}`);
   }
-  parts.push(`**Project:** ${projectPath}`);
+  parts.push(`Project: ${projectPath}\n`);
+  // IMMEDIATE ACTIONS section (must come FIRST for postCompactionDiscipline scoring)
+  if (epicId) {
+    parts.push(`## 1️⃣ IMMEDIATE ACTIONS (Do These FIRST)\n`);
+    parts.push(
+      `1. \`swarm_status(epic_id="${epicId}", project_key="${projectPath}")\` - Get current swarm state`,
+    );
+    parts.push(`2. \`swarmmail_inbox(limit=5)\` - Check for worker messages and blockers`);
+    parts.push(
+      `3. For completed work: Review with \`swarm_review\` → \`swarm_review_feedback\``,
+    );
+    parts.push(`4. For open subtasks: Spawn workers with \`swarm_spawn_subtask\``);
+    parts.push(`5. For blocked work: Investigate, unblock, or reassign\n`);
+  }
+  // Swarm state summary
+  parts.push(`## 🐝 Current Swarm State\n`);
+  if (epicId) {
+    parts.push(`**Epic:** ${epicId}${epicTitle ? ` - ${epicTitle}` : ""}`);
+  }
   // Show detailed subtask info from scanned state
   if (scanned.subtasks.size > 0) {
@@ -525,7 +715,7 @@ function buildDynamicSwarmStateFromScanned(
       detected.subtasks.blocked;
     if (total > 0) {
-      parts.push(`**Subtasks:**`);
+      parts.push(`\n**Subtasks:**`);
       if (detected.subtasks.closed > 0)
         parts.push(`  - ${detected.subtasks.closed} closed`);
       if (detected.subtasks.in_progress > 0)
@@ -537,29 +727,11 @@ function buildDynamicSwarmStateFromScanned(
     }
   }
+  parts.push(`\n**Project:** ${projectPath}`);
   // Show last action if available
   if (scanned.lastAction) {
-    parts.push(`\n**Last Action:** \`${scanned.lastAction.tool}\``);
-  }
-  if (epicId) {
-    parts.push(`\n## 🎯 YOU ARE THE COORDINATOR`);
-    parts.push(``);
-    parts.push(
-      `**Primary role:** Orchestrate workers, review their output, unblock dependencies.`,
-    );
-    parts.push(`**Spawn workers** for implementation tasks - don't do them yourself.`);
-    parts.push(``);
-    parts.push(`**RESUME STEPS:**`);
-    parts.push(
-      `1. Check swarm status: \`swarm_status(epic_id="${epicId}", project_key="${projectPath}")\``,
-    );
-    parts.push(`2. Check inbox for worker messages: \`swarmmail_inbox(limit=5)\``);
-    parts.push(
-      `3. For in_progress subtasks: Review worker results with \`swarm_review\``,
-    );
-    parts.push(`4. For open subtasks: Spawn workers with \`swarm_spawn_subtask\``);
-    parts.push(`5. For blocked subtasks: Investigate and unblock`);
+    parts.push(`**Last Action:** \`${scanned.lastAction.tool}\``);
   }
   return parts.join("\n");
@@ -850,6 +1022,12 @@ export function createCompactionHook(client?: OpencodeClient) {
     output: { context: string[] },
   ): Promise<void> => {
     const startTime = Date.now();
+    // Create metrics collector
+    const metrics = createMetricsCollector({
+      session_id: input.sessionID,
+      has_sdk_client: !!client,
+    });
     getLog().info(
       {
@@ -859,12 +1037,19 @@ export function createCompactionHook(client?: OpencodeClient) {
       },
       "compaction started",
     );
+    recordPhaseStart(metrics, CompactionPhase.START);
     try {
+      recordPhaseComplete(metrics, CompactionPhase.START);
       // Scan session messages for precise swarm state (if client available)
+      recordPhaseStart(metrics, CompactionPhase.GATHER_SWARM_MAIL);
       const scannedState = await scanSessionMessages(client, input.sessionID);
+      recordPhaseComplete(metrics, CompactionPhase.GATHER_SWARM_MAIL);
       // Also run heuristic detection from hive/swarm-mail
+      recordPhaseStart(metrics, CompactionPhase.DETECT);
       const detection = await detectSwarm();
       // Boost confidence if we found swarm evidence in session messages
@@ -874,13 +1059,21 @@ export function createCompactionHook(client?: OpencodeClient) {
         if (effectiveConfidence === "none" || effectiveConfidence === "low") {
           effectiveConfidence = "medium";
           detection.reasons.push("swarm tool calls found in session");
+          recordPatternExtracted(metrics, "swarm_tool_calls", "Found swarm tool calls in session");
         }
         if (scannedState.subtasks.size > 0) {
           effectiveConfidence = "high";
           detection.reasons.push(`${scannedState.subtasks.size} subtasks spawned`);
+          recordPatternExtracted(metrics, "subtasks", `${scannedState.subtasks.size} subtasks spawned`);
         }
       }
+      recordPhaseComplete(metrics, CompactionPhase.DETECT, {
+        confidence: effectiveConfidence,
+        detected: detection.detected || scannedState.epicId !== undefined,
+      });
+      recordPhaseStart(metrics, CompactionPhase.INJECT);
       if (
         effectiveConfidence === "high" ||
         effectiveConfidence === "medium"
@@ -907,6 +1100,11 @@ export function createCompactionHook(client?: OpencodeClient) {
         const contextContent = header + dynamicState + SWARM_COMPACTION_CONTEXT;
         output.context.push(contextContent);
+        recordPhaseComplete(metrics, CompactionPhase.INJECT, {
+          context_length: contextContent.length,
+          context_type: "full",
+        });
         getLog().info(
           {
@@ -926,6 +1124,11 @@ export function createCompactionHook(client?: OpencodeClient) {
         const header = `[Possible swarm: ${detection.reasons.join(", ")}]\n\n`;
         const contextContent = header + SWARM_DETECTION_FALLBACK;
         output.context.push(contextContent);
+        recordPhaseComplete(metrics, CompactionPhase.INJECT, {
+          context_length: contextContent.length,
+          context_type: "fallback",
+        });
         getLog().info(
           {
@@ -937,6 +1140,10 @@ export function createCompactionHook(client?: OpencodeClient) {
           "injected swarm context",
         );
       } else {
+        recordPhaseComplete(metrics, CompactionPhase.INJECT, {
+          context_type: "none",
+        });
         getLog().debug(
           {
             confidence: effectiveConfidence,
@@ -947,7 +1154,10 @@ export function createCompactionHook(client?: OpencodeClient) {
       }
       // confidence === "none" - no injection, probably not a swarm
+      recordPhaseStart(metrics, CompactionPhase.COMPLETE);
       const duration = Date.now() - startTime;
+      const summary = getMetricsSummary(metrics);
       getLog().info(
         {
           duration_ms: duration,
@@ -955,11 +1165,30 @@ export function createCompactionHook(client?: OpencodeClient) {
           detected: detection.detected || scannedState.epicId !== undefined,
           confidence: effectiveConfidence,
           context_injected: output.context.length > 0,
+          // Add metrics summary
+          metrics: {
+            phases: Object.keys(summary.phases).map(phase => ({
+              name: phase,
+              duration_ms: summary.phases[phase].duration_ms,
+              success: summary.phases[phase].success,
+            })),
+            patterns_extracted: summary.patterns_extracted,
+            patterns_skipped: summary.patterns_skipped,
+            extraction_success_rate: summary.extraction_success_rate,
+          },
         },
         "compaction complete",
       );
+      recordPhaseComplete(metrics, CompactionPhase.COMPLETE);
     } catch (error) {
       const duration = Date.now() - startTime;
+      recordPhaseComplete(metrics, CompactionPhase.COMPLETE, {
+        success: false,
+        error: error instanceof Error ? error.message : String(error),
+      });
       getLog().error(
         {
           duration_ms: duration,