opencode-swarm-plugin 0.40.0 → 0.42.0

This diff shows the content of publicly available package versions as released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
Files changed (59)
  1. package/.hive/analysis/eval-failure-analysis-2025-12-25.md +331 -0
  2. package/.hive/analysis/session-data-quality-audit.md +320 -0
  3. package/.hive/eval-results.json +481 -24
  4. package/.hive/issues.jsonl +65 -16
  5. package/.hive/memories.jsonl +159 -1
  6. package/.opencode/eval-history.jsonl +315 -0
  7. package/.turbo/turbo-build.log +5 -5
  8. package/CHANGELOG.md +155 -0
  9. package/README.md +2 -0
  10. package/SCORER-ANALYSIS.md +598 -0
  11. package/bin/eval-gate.test.ts +158 -0
  12. package/bin/eval-gate.ts +74 -0
  13. package/bin/swarm.test.ts +661 -732
  14. package/bin/swarm.ts +274 -0
  15. package/dist/compaction-hook.d.ts +7 -5
  16. package/dist/compaction-hook.d.ts.map +1 -1
  17. package/dist/compaction-prompt-scoring.d.ts +1 -0
  18. package/dist/compaction-prompt-scoring.d.ts.map +1 -1
  19. package/dist/eval-runner.d.ts +134 -0
  20. package/dist/eval-runner.d.ts.map +1 -0
  21. package/dist/hive.d.ts.map +1 -1
  22. package/dist/index.d.ts +29 -0
  23. package/dist/index.d.ts.map +1 -1
  24. package/dist/index.js +99741 -58858
  25. package/dist/memory-tools.d.ts +70 -2
  26. package/dist/memory-tools.d.ts.map +1 -1
  27. package/dist/memory.d.ts +37 -0
  28. package/dist/memory.d.ts.map +1 -1
  29. package/dist/observability-tools.d.ts +64 -0
  30. package/dist/observability-tools.d.ts.map +1 -1
  31. package/dist/plugin.js +99356 -58318
  32. package/dist/swarm-orchestrate.d.ts.map +1 -1
  33. package/dist/swarm-prompts.d.ts +32 -1
  34. package/dist/swarm-prompts.d.ts.map +1 -1
  35. package/docs/planning/ADR-009-oh-my-opencode-patterns.md +353 -0
  36. package/evals/ARCHITECTURE.md +1189 -0
  37. package/evals/example.eval.ts +3 -4
  38. package/evals/fixtures/compaction-prompt-cases.ts +6 -0
  39. package/evals/scorers/coordinator-discipline.ts +0 -253
  40. package/evals/swarm-decomposition.eval.ts +4 -2
  41. package/package.json +4 -3
  42. package/src/compaction-prompt-scorers.test.ts +10 -9
  43. package/src/compaction-prompt-scoring.ts +7 -5
  44. package/src/eval-runner.test.ts +128 -1
  45. package/src/eval-runner.ts +46 -0
  46. package/src/hive.ts +43 -42
  47. package/src/memory-tools.test.ts +84 -0
  48. package/src/memory-tools.ts +68 -3
  49. package/src/memory.test.ts +2 -112
  50. package/src/memory.ts +88 -49
  51. package/src/observability-tools.test.ts +13 -0
  52. package/src/observability-tools.ts +277 -0
  53. package/src/swarm-orchestrate.test.ts +162 -0
  54. package/src/swarm-orchestrate.ts +7 -5
  55. package/src/swarm-prompts.test.ts +168 -4
  56. package/src/swarm-prompts.ts +228 -7
  57. package/.env +0 -2
  58. package/.turbo/turbo-test.log +0 -481
  59. package/.turbo/turbo-typecheck.log +0 -1
package/bin/eval-gate.test.ts
@@ -0,0 +1,158 @@
+#!/usr/bin/env bun
+/**
+ * Tests for eval-gate CLI
+ *
+ * TDD: Write tests first to verify behavior before implementing.
+ */
+
+import { describe, test, expect, beforeEach, mock } from "bun:test";
+import type { RunEvalsResult } from "../src/eval-runner.js";
+
+// Mock process.exit to prevent test from actually exiting
+const mockExit = mock((code?: number) => {
+  throw new Error(`EXIT:${code ?? 0}`);
+});
+
+beforeEach(() => {
+  mockExit.mockClear();
+});
+
+describe("eval-gate CLI", () => {
+  test("exits 0 when all gates pass", async () => {
+    const mockResult: RunEvalsResult = {
+      success: true,
+      totalSuites: 2,
+      totalEvals: 10,
+      averageScore: 0.95,
+      suites: [],
+      gateResults: [
+        {
+          suite: "example",
+          passed: true,
+          phase: "production",
+          message: "Passed",
+          currentScore: 0.95,
+        },
+      ],
+    };
+
+    // Simulate main() execution with mocked runEvals
+    let exitCode: number | undefined;
+    try {
+      // Would call main() here if we extract it to a function
+      // For now, verify exit logic manually
+      const failedGates = mockResult.gateResults?.filter((g) => !g.passed) || [];
+      if (failedGates.length > 0 || !mockResult.success) {
+        exitCode = 1;
+      } else {
+        exitCode = 0;
+      }
+    } catch (e) {
+      // Extract exit code from mocked error
+      if (e instanceof Error && e.message.startsWith("EXIT:")) {
+        exitCode = parseInt(e.message.split(":")[1]);
+      }
+    }
+
+    expect(exitCode).toBe(0);
+  });
+
+  test("exits 1 when gates fail", async () => {
+    const mockResult: RunEvalsResult = {
+      success: false,
+      totalSuites: 2,
+      totalEvals: 10,
+      averageScore: 0.45,
+      suites: [],
+      gateResults: [
+        {
+          suite: "coordinator",
+          passed: false,
+          phase: "production",
+          message: "Regression detected",
+          currentScore: 0.45,
+          baseline: 0.85,
+          regressionPercent: -47,
+        },
+      ],
+    };
+
+    let exitCode: number | undefined;
+    const failedGates = mockResult.gateResults?.filter((g) => !g.passed) || [];
+    if (failedGates.length > 0 || !mockResult.success) {
+      exitCode = 1;
+    } else {
+      exitCode = 0;
+    }
+
+    expect(exitCode).toBe(1);
+  });
+
+  test("exits 1 when threshold check fails", async () => {
+    const mockResult: RunEvalsResult = {
+      success: false, // Threshold failed
+      totalSuites: 2,
+      totalEvals: 10,
+      averageScore: 0.65, // Below threshold of 80
+      suites: [],
+      gateResults: [],
+    };
+
+    let exitCode: number | undefined;
+    const failedGates = mockResult.gateResults?.filter((g) => !g.passed) || [];
+    if (failedGates.length > 0 || !mockResult.success) {
+      exitCode = 1;
+    } else {
+      exitCode = 0;
+    }
+
+    expect(exitCode).toBe(1);
+  });
+
+  test("parses --suite argument", () => {
+    const args = ["--suite", "coordinator"];
+    let suiteFilter: string | undefined;
+
+    for (let i = 0; i < args.length; i++) {
+      if (args[i] === "--suite" && args[i + 1]) {
+        suiteFilter = args[i + 1];
+        i++;
+      }
+    }
+
+    expect(suiteFilter).toBe("coordinator");
+  });
+
+  test("parses --threshold argument", () => {
+    const args = ["--threshold", "85"];
+    let scoreThreshold: number | undefined;
+
+    for (let i = 0; i < args.length; i++) {
+      if (args[i] === "--threshold" && args[i + 1]) {
+        scoreThreshold = parseInt(args[i + 1], 10);
+        i++;
+      }
+    }
+
+    expect(scoreThreshold).toBe(85);
+  });
+
+  test("handles missing arguments gracefully", () => {
+    const args: string[] = [];
+    let suiteFilter: string | undefined;
+    let scoreThreshold: number | undefined;
+
+    for (let i = 0; i < args.length; i++) {
+      if (args[i] === "--suite" && args[i + 1]) {
+        suiteFilter = args[i + 1];
+        i++;
+      } else if (args[i] === "--threshold" && args[i + 1]) {
+        scoreThreshold = parseInt(args[i + 1], 10);
+        i++;
+      }
+    }
+
+    expect(suiteFilter).toBeUndefined();
+    expect(scoreThreshold).toBeUndefined();
+  });
+});
package/bin/eval-gate.ts
@@ -0,0 +1,74 @@
+#!/usr/bin/env bun
+/**
+ * Eval Gate CLI - Run evals and fail on regression
+ *
+ * Usage:
+ *   bun run bin/eval-gate.ts                      # Run all evals
+ *   bun run bin/eval-gate.ts --suite coordinator  # Run specific suite
+ *   bun run bin/eval-gate.ts --threshold 80       # Custom score threshold
+ */
+
+import { runEvals } from "../src/eval-runner.js";
+
+const args = process.argv.slice(2);
+
+// Parse args
+let suiteFilter: string | undefined;
+let scoreThreshold: number | undefined;
+
+for (let i = 0; i < args.length; i++) {
+  if (args[i] === "--suite" && args[i + 1]) {
+    suiteFilter = args[i + 1];
+    i++;
+  } else if (args[i] === "--threshold" && args[i + 1]) {
+    scoreThreshold = parseInt(args[i + 1], 10);
+    i++;
+  }
+}
+
+async function main() {
+  console.log("🔍 Running eval gates...\n");
+
+  const result = await runEvals({
+    cwd: process.cwd(),
+    suiteFilter,
+    scoreThreshold,
+  });
+
+  // Print results
+  console.log(`📊 Results:`);
+  console.log(`   Suites: ${result.totalSuites}`);
+  console.log(`   Evals: ${result.totalEvals}`);
+  console.log(`   Average Score: ${(result.averageScore * 100).toFixed(1)}%\n`);
+
+  // Print gate results
+  if (result.gateResults && result.gateResults.length > 0) {
+    console.log("🚦 Gate Results:");
+    for (const gate of result.gateResults) {
+      const icon = gate.passed ? "✅" : "❌";
+      console.log(`   ${icon} ${gate.suite}: ${gate.message}`);
+    }
+    console.log("");
+  }
+
+  // Check for gate failures
+  const failedGates = result.gateResults?.filter(g => !g.passed) || [];
+
+  if (failedGates.length > 0) {
+    console.error(`❌ ${failedGates.length} gate(s) failed!`);
+    process.exit(1);
+  }
+
+  if (!result.success) {
+    console.error(`❌ Evals failed threshold check`);
+    process.exit(1);
+  }
+
+  console.log("✅ All gates passed!");
+  process.exit(0);
+}
+
+main().catch((err) => {
+  console.error("Fatal error:", err);
+  process.exit(1);
+});
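
Note: the tests in bin/eval-gate.test.ts re-implement the CLI's exit-code decision inline because, as their comments state, main() is not yet extracted into an exportable function. A minimal sketch of how that decision could live in one shared, directly testable helper follows; the decideExitCode name and its placement are hypothetical and not part of the published package.

// Hypothetical helper (not in the published package): mirrors the exit logic
// that bin/eval-gate.ts applies and bin/eval-gate.test.ts currently duplicates.
import type { RunEvalsResult } from "../src/eval-runner.js";

export function decideExitCode(result: RunEvalsResult): 0 | 1 {
  // Exit 1 on any failed gate or a failed overall threshold check; otherwise 0.
  const failedGates = result.gateResults?.filter((g) => !g.passed) ?? [];
  return failedGates.length > 0 || !result.success ? 1 : 0;
}

With such a helper, both the CLI and the tests could call decideExitCode(result) instead of repeating the filter-and-branch logic, which is the direction the "Would call main() here if we extract it to a function" comment points.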