opencode-swarm-plugin 0.36.0 → 0.37.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (54)
  1. package/.hive/issues.jsonl +16 -4
  2. package/.hive/memories.jsonl +274 -1
  3. package/.turbo/turbo-build.log +4 -4
  4. package/.turbo/turbo-test.log +318 -318
  5. package/CHANGELOG.md +113 -0
  6. package/bin/swarm.test.ts +106 -0
  7. package/bin/swarm.ts +413 -179
  8. package/dist/compaction-hook.d.ts +54 -4
  9. package/dist/compaction-hook.d.ts.map +1 -1
  10. package/dist/eval-capture.d.ts +122 -17
  11. package/dist/eval-capture.d.ts.map +1 -1
  12. package/dist/index.d.ts +1 -7
  13. package/dist/index.d.ts.map +1 -1
  14. package/dist/index.js +1278 -619
  15. package/dist/planning-guardrails.d.ts +121 -0
  16. package/dist/planning-guardrails.d.ts.map +1 -1
  17. package/dist/plugin.d.ts +9 -9
  18. package/dist/plugin.d.ts.map +1 -1
  19. package/dist/plugin.js +1283 -329
  20. package/dist/schemas/task.d.ts +0 -1
  21. package/dist/schemas/task.d.ts.map +1 -1
  22. package/dist/swarm-decompose.d.ts +0 -8
  23. package/dist/swarm-decompose.d.ts.map +1 -1
  24. package/dist/swarm-orchestrate.d.ts.map +1 -1
  25. package/dist/swarm-prompts.d.ts +0 -4
  26. package/dist/swarm-prompts.d.ts.map +1 -1
  27. package/dist/swarm-review.d.ts.map +1 -1
  28. package/dist/swarm.d.ts +0 -6
  29. package/dist/swarm.d.ts.map +1 -1
  30. package/evals/README.md +38 -0
  31. package/evals/coordinator-session.eval.ts +154 -0
  32. package/evals/fixtures/coordinator-sessions.ts +328 -0
  33. package/evals/lib/data-loader.ts +69 -0
  34. package/evals/scorers/coordinator-discipline.evalite-test.ts +536 -0
  35. package/evals/scorers/coordinator-discipline.ts +315 -0
  36. package/evals/scorers/index.ts +12 -0
  37. package/examples/plugin-wrapper-template.ts +303 -4
  38. package/package.json +2 -2
  39. package/src/compaction-hook.test.ts +8 -1
  40. package/src/compaction-hook.ts +31 -21
  41. package/src/eval-capture.test.ts +390 -0
  42. package/src/eval-capture.ts +163 -4
  43. package/src/hive.integration.test.ts +148 -0
  44. package/src/hive.ts +89 -0
  45. package/src/index.ts +68 -1
  46. package/src/planning-guardrails.test.ts +387 -2
  47. package/src/planning-guardrails.ts +289 -0
  48. package/src/plugin.ts +10 -10
  49. package/src/swarm-decompose.test.ts +195 -0
  50. package/src/swarm-decompose.ts +72 -1
  51. package/src/swarm-orchestrate.ts +44 -0
  52. package/src/swarm-prompts.ts +20 -0
  53. package/src/swarm-review.integration.test.ts +24 -29
  54. package/src/swarm-review.ts +41 -0
@@ -0,0 +1,315 @@
1
+ /**
2
+ * Coordinator Discipline Scorers - Evaluate coordinator behavior
3
+ *
4
+ * These scorers measure whether a coordinator follows the protocol:
5
+ * 1. Don't edit files directly (spawn workers)
6
+ * 2. Don't run tests directly (workers do verification)
7
+ * 3. Spawn workers for all subtasks
8
+ * 4. Review worker output before accepting
9
+ * 5. Minimize time to first spawn (don't overthink)
10
+ *
11
+ * Inputs: CoordinatorSession from eval-capture
12
+ */
13
+
14
+ import { createScorer } from "evalite";
15
+ import type { CoordinatorSession } from "../../src/eval-capture.js";
16
+
17
+ /**
18
+ * Violation Count Scorer
19
+ *
20
+ * Counts VIOLATION events in the session.
21
+ * Each violation reduces score by 0.2.
22
+ *
23
+ * Violations tracked:
24
+ * - coordinator_edited_file (should spawn worker instead)
25
+ * - coordinator_ran_tests (workers do verification)
26
+ * - coordinator_reserved_files (only workers reserve)
27
+ * - no_worker_spawned (subtask exists but no worker)
28
+ *
29
+ * Score: 1.0 - (0.2 * violation_count), floored at 0.0
30
+ */
31
+ export const violationCount = createScorer({
32
+ name: "Violation Count",
33
+ description: "Coordinator followed protocol (no direct edits, tests, or reservations)",
34
+ scorer: ({ output }) => {
35
+ try {
36
+ const session = JSON.parse(String(output)) as CoordinatorSession;
37
+
38
+ // Count violations
39
+ const violations = session.events.filter(
40
+ (e) => e.event_type === "VIOLATION"
41
+ );
42
+
43
+ const count = violations.length;
44
+ const score = Math.max(0, 1.0 - count * 0.2);
45
+
46
+ if (count === 0) {
47
+ return {
48
+ score: 1.0,
49
+ message: "Perfect - 0 violations",
50
+ };
51
+ }
52
+
53
+ return {
54
+ score,
55
+ message: `${count} violations detected`,
56
+ };
57
+ } catch (error) {
58
+ return {
59
+ score: 0,
60
+ message: `Failed to parse CoordinatorSession: ${error}`,
61
+ };
62
+ }
63
+ },
64
+ });
65
+
66
+ /**
67
+ * Spawn Efficiency Scorer
68
+ *
69
+ * Measures whether workers were spawned for all subtasks.
70
+ * Coordinators should delegate work, not do it themselves.
71
+ *
72
+ * Score: workers_spawned / subtasks_planned
73
+ */
74
+ export const spawnEfficiency = createScorer({
75
+ name: "Spawn Efficiency",
76
+ description: "Workers spawned for all subtasks (delegation ratio)",
77
+ scorer: ({ output }) => {
78
+ try {
79
+ const session = JSON.parse(String(output)) as CoordinatorSession;
80
+
81
+ // Find decomposition_complete event (has subtask count)
82
+ const decomp = session.events.find(
83
+ (e) =>
84
+ e.event_type === "DECISION" &&
85
+ e.decision_type === "decomposition_complete"
86
+ );
87
+
88
+ if (!decomp) {
89
+ return {
90
+ score: 0,
91
+ message: "No decomposition event found",
92
+ };
93
+ }
94
+
95
+ const subtaskCount = (decomp.payload as { subtask_count?: number })?.subtask_count || 0;
96
+
97
+ if (subtaskCount === 0) {
98
+ return {
99
+ score: 0,
100
+ message: "No subtasks planned",
101
+ };
102
+ }
103
+
104
+ // Count worker_spawned events
105
+ const spawned = session.events.filter(
106
+ (e) =>
107
+ e.event_type === "DECISION" && e.decision_type === "worker_spawned"
108
+ ).length;
109
+
110
+ const score = spawned / subtaskCount;
111
+
112
+ return {
113
+ score,
114
+ message: `${spawned}/${subtaskCount} workers spawned (${(score * 100).toFixed(0)}%)`,
115
+ };
116
+ } catch (error) {
117
+ return {
118
+ score: 0,
119
+ message: `Failed to parse CoordinatorSession: ${error}`,
120
+ };
121
+ }
122
+ },
123
+ });
124
+
125
+ /**
126
+ * Review Thoroughness Scorer
127
+ *
128
+ * Measures whether coordinator reviewed worker output.
129
+ * Should have review_completed events for all finished subtasks.
130
+ *
131
+ * Score: reviews_completed / workers_finished
132
+ */
133
+ export const reviewThoroughness = createScorer({
134
+ name: "Review Thoroughness",
135
+ description: "Coordinator reviewed all worker output",
136
+ scorer: ({ output }) => {
137
+ try {
138
+ const session = JSON.parse(String(output)) as CoordinatorSession;
139
+
140
+ // Count finished workers (subtask_success or subtask_failed)
141
+ const finished = session.events.filter(
142
+ (e) =>
143
+ e.event_type === "OUTCOME" &&
144
+ (e.outcome_type === "subtask_success" ||
145
+ e.outcome_type === "subtask_failed")
146
+ ).length;
147
+
148
+ if (finished === 0) {
149
+ return {
150
+ score: 1.0,
151
+ message: "No finished workers to review",
152
+ };
153
+ }
154
+
155
+ // Count review_completed events
156
+ const reviewed = session.events.filter(
157
+ (e) =>
158
+ e.event_type === "DECISION" && e.decision_type === "review_completed"
159
+ ).length;
160
+
161
+ const score = reviewed / finished;
162
+
163
+ return {
164
+ score,
165
+ message: `${reviewed}/${finished} workers reviewed (${(score * 100).toFixed(0)}%)`,
166
+ };
167
+ } catch (error) {
168
+ return {
169
+ score: 0,
170
+ message: `Failed to parse CoordinatorSession: ${error}`,
171
+ };
172
+ }
173
+ },
174
+ });
175
+
176
/**
 * Time to First Spawn Scorer
 *
 * Measures how fast the coordinator spawned the first worker after
 * decomposition completed. Overthinking and perfectionism delays workers
 * and blocks progress.
 *
 * Normalization:
 * - < 60s: 1.0 (excellent)
 * - 60-300s: linear decay from 1.0 down to 0.0
 * - > 300s: 0.0 (way too slow)
 *
 * Score: normalized to 0-1 (faster is better)
 *
 * Returns 0 when either the decomposition event or a worker_spawned event
 * is missing, and 0 on parse failure. A negative delta (spawn event
 * timestamped before decomposition) falls into the < 60s branch and
 * scores 1.0.
 */
export const timeToFirstSpawn = createScorer({
  name: "Time to First Spawn",
  description: "Coordinator spawned workers quickly (no overthinking)",
  scorer: ({ output }) => {
    try {
      const session = JSON.parse(String(output)) as CoordinatorSession;

      // Find decomposition_complete event
      const decomp = session.events.find(
        (e) =>
          e.event_type === "DECISION" &&
          e.decision_type === "decomposition_complete"
      );

      if (!decomp) {
        return {
          score: 0,
          message: "No decomposition event found",
        };
      }

      // Find first worker_spawned event (events assumed in session order)
      const firstSpawn = session.events.find(
        (e) =>
          e.event_type === "DECISION" && e.decision_type === "worker_spawned"
      );

      if (!firstSpawn) {
        return {
          score: 0,
          message: "No worker spawned",
        };
      }

      // Calculate time delta between decomposition and first spawn
      const decompTime = new Date(decomp.timestamp).getTime();
      const spawnTime = new Date(firstSpawn.timestamp).getTime();
      const deltaMs = spawnTime - decompTime;

      // Normalize: < 60s = 1.0, > 300s = 0.0, linear in between
      const EXCELLENT_MS = 60_000;
      const POOR_MS = 300_000;

      let score: number;
      if (deltaMs < EXCELLENT_MS) {
        score = 1.0;
      } else if (deltaMs > POOR_MS) {
        score = 0.0;
      } else {
        // Linear decay from 1.0 to 0.0 across the 60s-300s window
        score = 1.0 - (deltaMs - EXCELLENT_MS) / (POOR_MS - EXCELLENT_MS);
      }

      const seconds = Math.round(deltaMs / 1000);

      return {
        score,
        message: `First spawn after ${deltaMs}ms (${seconds}s)`,
      };
    } catch (error) {
      return {
        score: 0,
        message: `Failed to parse CoordinatorSession: ${error}`,
      };
    }
  },
});
256
+
257
+ /**
258
+ * Overall Discipline Scorer
259
+ *
260
+ * Weighted composite of all coordinator discipline metrics.
261
+ *
262
+ * Weights:
263
+ * - Violations: 30% (most critical - breaking protocol)
264
+ * - Spawn efficiency: 25% (delegation is key)
265
+ * - Review thoroughness: 25% (quality gate)
266
+ * - Time to first spawn: 20% (bias toward action)
267
+ *
268
+ * Score: 0.0 to 1.0
269
+ */
270
+ export const overallDiscipline = createScorer({
271
+ name: "Overall Coordinator Discipline",
272
+ description: "Composite score for coordinator protocol adherence",
273
+ scorer: ({ output, expected }) => {
274
+ try {
275
+ // Run all scorers
276
+ const scores = {
277
+ violations: violationCount.scorer({ output, expected }),
278
+ spawn: spawnEfficiency.scorer({ output, expected }),
279
+ review: reviewThoroughness.scorer({ output, expected }),
280
+ speed: timeToFirstSpawn.scorer({ output, expected }),
281
+ };
282
+
283
+ // Weighted average
284
+ const weights = {
285
+ violations: 0.3,
286
+ spawn: 0.25,
287
+ review: 0.25,
288
+ speed: 0.2,
289
+ };
290
+
291
+ const totalScore =
292
+ scores.violations.score * weights.violations +
293
+ scores.spawn.score * weights.spawn +
294
+ scores.review.score * weights.review +
295
+ scores.speed.score * weights.speed;
296
+
297
+ const details = [
298
+ `Violations: ${(scores.violations.score * 100).toFixed(0)}%`,
299
+ `Spawn: ${(scores.spawn.score * 100).toFixed(0)}%`,
300
+ `Review: ${(scores.review.score * 100).toFixed(0)}%`,
301
+ `Speed: ${(scores.speed.score * 100).toFixed(0)}%`,
302
+ ].join(", ");
303
+
304
+ return {
305
+ score: totalScore,
306
+ message: `Overall: ${(totalScore * 100).toFixed(0)}% (${details})`,
307
+ };
308
+ } catch (error) {
309
+ return {
310
+ score: 0,
311
+ message: `Failed to compute composite score: ${error}`,
312
+ };
313
+ }
314
+ },
315
+ });
@@ -78,6 +78,18 @@ export {
78
78
  compactionQuality,
79
79
  } from "./compaction-scorers.js";
80
80
 
81
+ // ============================================================================
82
+ // Coordinator discipline scorers
83
+ // ============================================================================
84
+
85
+ export {
86
+ violationCount,
87
+ spawnEfficiency,
88
+ reviewThoroughness,
89
+ timeToFirstSpawn,
90
+ overallDiscipline,
91
+ } from "./coordinator-discipline.js";
92
+
81
93
  /**
82
94
  * Checks that subtasks cover the full task scope
83
95
  *
@@ -14,6 +14,7 @@
14
14
  * - SWARM_PROJECT_DIR: Project directory (critical for database path)
15
15
  */
16
16
  import type { Plugin, PluginInput, Hooks } from "@opencode-ai/plugin";
17
+ import type { ToolPart } from "@opencode-ai/sdk";
17
18
  import { tool } from "@opencode-ai/plugin";
18
19
  import { spawn } from "child_process";
19
20
  import { appendFileSync, mkdirSync, existsSync } from "node:fs";
@@ -68,6 +69,10 @@ function logCompaction(
68
69
  // This is CRITICAL: without it, the CLI uses process.cwd() which may be wrong
69
70
  let projectDirectory: string = process.cwd();
70
71
 
72
+ // Module-level SDK client - set during plugin initialization
73
+ // Used for scanning session messages during compaction
74
+ let sdkClient: any = null;
75
+
71
76
  // =============================================================================
72
77
  // CLI Execution Helper
73
78
  // =============================================================================
@@ -1039,7 +1044,9 @@ async function querySwarmState(sessionID: string): Promise<SwarmStateSnapshot> {
1039
1044
  let cells: any[] = [];
1040
1045
  if (cellsResult.exitCode === 0) {
1041
1046
  try {
1042
- cells = JSON.parse(cellsResult.stdout);
1047
+ const parsed = JSON.parse(cellsResult.stdout);
1048
+ // Handle wrapped response: { success: true, data: [...] }
1049
+ cells = Array.isArray(parsed) ? parsed : (parsed?.data ?? []);
1043
1050
  } catch (parseErr) {
1044
1051
  logCompaction("error", "query_swarm_state_parse_failed", {
1045
1052
  session_id: sessionID,
@@ -1175,7 +1182,7 @@ async function generateCompactionPrompt(
1175
1182
  snapshot: SwarmStateSnapshot,
1176
1183
  ): Promise<string | null> {
1177
1184
  const startTime = Date.now();
1178
- const liteModel = process.env.OPENCODE_LITE_MODEL || "claude-3-5-haiku-20241022";
1185
+ const liteModel = process.env.OPENCODE_LITE_MODEL || "__SWARM_LITE_MODEL__";
1179
1186
 
1180
1187
  logCompaction("debug", "generate_compaction_prompt_start", {
1181
1188
  session_id: snapshot.sessionID,
@@ -1324,6 +1331,226 @@ Keep the prompt concise but actionable. Use actual data from the snapshot, not p
1324
1331
  }
1325
1332
  }
1326
1333
 
1334
+ /**
1335
+ * Session message scan result
1336
+ */
1337
+ interface SessionScanResult {
1338
+ messageCount: number;
1339
+ toolCalls: Array<{
1340
+ toolName: string;
1341
+ args: Record<string, unknown>;
1342
+ output?: string;
1343
+ }>;
1344
+ swarmDetected: boolean;
1345
+ reasons: string[];
1346
+ }
1347
+
1348
+ /**
1349
+ * Scan session messages for swarm tool calls
1350
+ *
1351
+ * Uses SDK client to fetch messages and look for swarm activity.
1352
+ * This can detect swarm work even if no cells exist yet.
1353
+ */
1354
+ async function scanSessionMessages(sessionID: string): Promise<SessionScanResult> {
1355
+ const startTime = Date.now();
1356
+ const result: SessionScanResult = {
1357
+ messageCount: 0,
1358
+ toolCalls: [],
1359
+ swarmDetected: false,
1360
+ reasons: [],
1361
+ };
1362
+
1363
+ logCompaction("debug", "session_scan_start", {
1364
+ session_id: sessionID,
1365
+ has_sdk_client: !!sdkClient,
1366
+ });
1367
+
1368
+ if (!sdkClient) {
1369
+ logCompaction("warn", "session_scan_no_sdk_client", {
1370
+ session_id: sessionID,
1371
+ });
1372
+ return result;
1373
+ }
1374
+
1375
+ try {
1376
+ // Fetch session messages
1377
+ const messagesStart = Date.now();
1378
+ const rawResponse = await sdkClient.session.messages({ path: { id: sessionID } });
1379
+ const messagesDuration = Date.now() - messagesStart;
1380
+
1381
+ // Log the RAW response to understand its shape
1382
+ logCompaction("debug", "session_scan_raw_response", {
1383
+ session_id: sessionID,
1384
+ response_type: typeof rawResponse,
1385
+ is_array: Array.isArray(rawResponse),
1386
+ is_null: rawResponse === null,
1387
+ is_undefined: rawResponse === undefined,
1388
+ keys: rawResponse && typeof rawResponse === 'object' ? Object.keys(rawResponse) : [],
1389
+ raw_preview: JSON.stringify(rawResponse)?.slice(0, 500),
1390
+ });
1391
+
1392
+ // The response might be wrapped - check common patterns
1393
+ const messages = Array.isArray(rawResponse)
1394
+ ? rawResponse
1395
+ : rawResponse?.data
1396
+ ? rawResponse.data
1397
+ : rawResponse?.messages
1398
+ ? rawResponse.messages
1399
+ : rawResponse?.items
1400
+ ? rawResponse.items
1401
+ : [];
1402
+
1403
+ result.messageCount = messages?.length ?? 0;
1404
+
1405
+ logCompaction("debug", "session_scan_messages_fetched", {
1406
+ session_id: sessionID,
1407
+ duration_ms: messagesDuration,
1408
+ message_count: result.messageCount,
1409
+ extraction_method: Array.isArray(rawResponse) ? 'direct_array' : rawResponse?.data ? 'data_field' : rawResponse?.messages ? 'messages_field' : rawResponse?.items ? 'items_field' : 'fallback_empty',
1410
+ });
1411
+
1412
+ if (!Array.isArray(messages) || messages.length === 0) {
1413
+ logCompaction("debug", "session_scan_no_messages", {
1414
+ session_id: sessionID,
1415
+ });
1416
+ return result;
1417
+ }
1418
+
1419
+ // Swarm-related tool patterns
1420
+ const swarmTools = [
1421
+ // High confidence - active swarm coordination
1422
+ "hive_create_epic",
1423
+ "swarm_decompose",
1424
+ "swarm_spawn_subtask",
1425
+ "swarm_complete",
1426
+ "swarmmail_init",
1427
+ "swarmmail_reserve",
1428
+ // Medium confidence - swarm activity
1429
+ "hive_start",
1430
+ "hive_close",
1431
+ "swarm_status",
1432
+ "swarm_progress",
1433
+ "swarmmail_send",
1434
+ // Low confidence - possible swarm
1435
+ "hive_create",
1436
+ "hive_query",
1437
+ ];
1438
+
1439
+ const highConfidenceTools = new Set([
1440
+ "hive_create_epic",
1441
+ "swarm_decompose",
1442
+ "swarm_spawn_subtask",
1443
+ "swarmmail_init",
1444
+ "swarmmail_reserve",
1445
+ ]);
1446
+
1447
+ // Scan messages for tool calls
1448
+ let swarmToolCount = 0;
1449
+ let highConfidenceCount = 0;
1450
+
1451
+ // Debug: collect part types to understand message structure
1452
+ const partTypeCounts: Record<string, number> = {};
1453
+ let messagesWithParts = 0;
1454
+ let messagesWithoutParts = 0;
1455
+ let samplePartTypes: string[] = [];
1456
+
1457
+ for (const message of messages) {
1458
+ if (!message.parts || !Array.isArray(message.parts)) {
1459
+ messagesWithoutParts++;
1460
+ continue;
1461
+ }
1462
+ messagesWithParts++;
1463
+
1464
+ for (const part of message.parts) {
1465
+ const partType = part.type || "unknown";
1466
+ partTypeCounts[partType] = (partTypeCounts[partType] || 0) + 1;
1467
+
1468
+ // Collect first 10 unique part types for debugging
1469
+ if (samplePartTypes.length < 10 && !samplePartTypes.includes(partType)) {
1470
+ samplePartTypes.push(partType);
1471
+ }
1472
+
1473
+ // Check if this is a tool call part
1474
+ // OpenCode SDK: ToolPart has type="tool", tool=<string name>, state={...}
1475
+ if (part.type === "tool") {
1476
+ const toolPart = part as ToolPart;
1477
+ const toolName = toolPart.tool; // tool name is a string directly
1478
+
1479
+ if (toolName && swarmTools.includes(toolName)) {
1480
+ swarmToolCount++;
1481
+
1482
+ if (highConfidenceTools.has(toolName)) {
1483
+ highConfidenceCount++;
1484
+ }
1485
+
1486
+ // Extract args/output from state if available
1487
+ const state = toolPart.state;
1488
+ const args = state && "input" in state ? state.input : {};
1489
+ const output = state && "output" in state ? state.output : undefined;
1490
+
1491
+ result.toolCalls.push({
1492
+ toolName,
1493
+ args,
1494
+ output,
1495
+ });
1496
+
1497
+ logCompaction("debug", "session_scan_tool_found", {
1498
+ session_id: sessionID,
1499
+ tool_name: toolName,
1500
+ is_high_confidence: highConfidenceTools.has(toolName),
1501
+ });
1502
+ }
1503
+ }
1504
+ }
1505
+ }
1506
+
1507
+ // Determine if swarm detected based on tool calls
1508
+ if (highConfidenceCount > 0) {
1509
+ result.swarmDetected = true;
1510
+ result.reasons.push(`${highConfidenceCount} high-confidence swarm tools (${Array.from(new Set(result.toolCalls.filter(tc => highConfidenceTools.has(tc.toolName)).map(tc => tc.toolName))).join(", ")})`);
1511
+ }
1512
+
1513
+ if (swarmToolCount > 0 && !result.swarmDetected) {
1514
+ result.swarmDetected = true;
1515
+ result.reasons.push(`${swarmToolCount} swarm-related tools used`);
1516
+ }
1517
+
1518
+ const totalDuration = Date.now() - startTime;
1519
+
1520
+ // Debug: log part type distribution to understand message structure
1521
+ logCompaction("debug", "session_scan_part_types", {
1522
+ session_id: sessionID,
1523
+ messages_with_parts: messagesWithParts,
1524
+ messages_without_parts: messagesWithoutParts,
1525
+ part_type_counts: partTypeCounts,
1526
+ sample_part_types: samplePartTypes,
1527
+ });
1528
+
1529
+ logCompaction("info", "session_scan_complete", {
1530
+ session_id: sessionID,
1531
+ duration_ms: totalDuration,
1532
+ message_count: result.messageCount,
1533
+ tool_call_count: result.toolCalls.length,
1534
+ swarm_tool_count: swarmToolCount,
1535
+ high_confidence_count: highConfidenceCount,
1536
+ swarm_detected: result.swarmDetected,
1537
+ reasons: result.reasons,
1538
+ unique_tools: Array.from(new Set(result.toolCalls.map(tc => tc.toolName))),
1539
+ });
1540
+
1541
+ return result;
1542
+ } catch (err) {
1543
+ const totalDuration = Date.now() - startTime;
1544
+ logCompaction("error", "session_scan_exception", {
1545
+ session_id: sessionID,
1546
+ error: err instanceof Error ? err.message : String(err),
1547
+ stack: err instanceof Error ? err.stack : undefined,
1548
+ duration_ms: totalDuration,
1549
+ });
1550
+ return result;
1551
+ }
1552
+ }
1553
+
1327
1554
  /**
1328
1555
  * Check for swarm sign - evidence a swarm passed through
1329
1556
  *
@@ -1647,13 +1874,18 @@ type ExtendedHooks = Hooks & {
1647
1874
  ) => Promise<void>;
1648
1875
  };
1649
1876
 
1650
- export const SwarmPlugin: Plugin = async (
1877
+ // NOTE: Only default export - named exports cause double registration!
1878
+ // OpenCode's plugin loader calls ALL exports as functions.
1879
+ const SwarmPlugin: Plugin = async (
1651
1880
  input: PluginInput,
1652
1881
  ): Promise<ExtendedHooks> => {
1653
1882
  // CRITICAL: Set project directory from OpenCode input
1654
1883
  // Without this, CLI uses wrong database path
1655
1884
  projectDirectory = input.directory;
1656
1885
 
1886
+ // Store SDK client for session message scanning during compaction
1887
+ sdkClient = input.client;
1888
+
1657
1889
  return {
1658
1890
  tool: {
1659
1891
  // Beads
@@ -1751,7 +1983,23 @@ export const SwarmPlugin: Plugin = async (
1751
1983
  });
1752
1984
 
1753
1985
  // =======================================================================
1754
- // STEP 1: Detect swarm state from hive
1986
+ // STEP 1: Scan session messages for swarm tool calls
1987
+ // =======================================================================
1988
+ const sessionScanStart = Date.now();
1989
+ const sessionScan = await scanSessionMessages(input.sessionID);
1990
+ const sessionScanDuration = Date.now() - sessionScanStart;
1991
+
1992
+ logCompaction("info", "session_scan_results", {
1993
+ session_id: input.sessionID,
1994
+ duration_ms: sessionScanDuration,
1995
+ message_count: sessionScan.messageCount,
1996
+ tool_call_count: sessionScan.toolCalls.length,
1997
+ swarm_detected_from_messages: sessionScan.swarmDetected,
1998
+ reasons: sessionScan.reasons,
1999
+ });
2000
+
2001
+ // =======================================================================
2002
+ // STEP 2: Detect swarm state from hive cells
1755
2003
  // =======================================================================
1756
2004
  const detectionStart = Date.now();
1757
2005
  const detection = await detectSwarm();
@@ -1766,6 +2014,57 @@ export const SwarmPlugin: Plugin = async (
1766
2014
  reason_count: detection.reasons.length,
1767
2015
  });
1768
2016
 
2017
+ // =======================================================================
2018
+ // STEP 3: Merge session scan with hive detection for final confidence
2019
+ // =======================================================================
2020
+ // If session messages show high-confidence swarm tools, boost confidence
2021
+ if (sessionScan.swarmDetected && sessionScan.reasons.some(r => r.includes("high-confidence"))) {
2022
+ if (detection.confidence === "none" || detection.confidence === "low") {
2023
+ detection.confidence = "high";
2024
+ detection.detected = true;
2025
+ detection.reasons.push(...sessionScan.reasons);
2026
+
2027
+ logCompaction("info", "confidence_boost_from_session_scan", {
2028
+ session_id: input.sessionID,
2029
+ original_confidence: detection.confidence,
2030
+ boosted_to: "high",
2031
+ session_reasons: sessionScan.reasons,
2032
+ });
2033
+ }
2034
+ } else if (sessionScan.swarmDetected) {
2035
+ // Medium boost for any swarm tools found
2036
+ if (detection.confidence === "none") {
2037
+ detection.confidence = "medium";
2038
+ detection.detected = true;
2039
+ detection.reasons.push(...sessionScan.reasons);
2040
+
2041
+ logCompaction("info", "confidence_boost_from_session_scan", {
2042
+ session_id: input.sessionID,
2043
+ original_confidence: "none",
2044
+ boosted_to: "medium",
2045
+ session_reasons: sessionScan.reasons,
2046
+ });
2047
+ } else if (detection.confidence === "low") {
2048
+ detection.confidence = "medium";
2049
+ detection.reasons.push(...sessionScan.reasons);
2050
+
2051
+ logCompaction("info", "confidence_boost_from_session_scan", {
2052
+ session_id: input.sessionID,
2053
+ original_confidence: "low",
2054
+ boosted_to: "medium",
2055
+ session_reasons: sessionScan.reasons,
2056
+ });
2057
+ }
2058
+ }
2059
+
2060
+ logCompaction("info", "final_swarm_detection", {
2061
+ session_id: input.sessionID,
2062
+ confidence: detection.confidence,
2063
+ detected: detection.detected,
2064
+ combined_reasons: detection.reasons,
2065
+ message_scan_contributed: sessionScan.swarmDetected,
2066
+ });
2067
+
1769
2068
  if (detection.confidence === "high" || detection.confidence === "medium") {
1770
2069
  // Definite or probable swarm - try LLM-powered compaction
1771
2070
  logCompaction("info", "swarm_detected_attempting_llm", {