npm - workspace-maxxing - Versions diffs - 0.1.0 - Mend

workspace-maxxing 0.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (198)

package/.agents/skills/workspace-maxxing/.workspace-templates/CONTEXT.md +44 -0
package/.agents/skills/workspace-maxxing/.workspace-templates/SYSTEM.md +44 -0
package/.agents/skills/workspace-maxxing/.workspace-templates/references/anti-patterns.md +16 -0
package/.agents/skills/workspace-maxxing/.workspace-templates/references/iron-laws.md +26 -0
package/.agents/skills/workspace-maxxing/.workspace-templates/references/reporting-format.md +52 -0
package/.agents/skills/workspace-maxxing/.workspace-templates/scripts/benchmark.ts +171 -0
package/.agents/skills/workspace-maxxing/.workspace-templates/scripts/dispatch.ts +473 -0
package/.agents/skills/workspace-maxxing/.workspace-templates/scripts/generate-tests.ts +158 -0
package/.agents/skills/workspace-maxxing/.workspace-templates/scripts/install-tool.ts +82 -0
package/.agents/skills/workspace-maxxing/.workspace-templates/scripts/iterate.ts +265 -0
package/.agents/skills/workspace-maxxing/.workspace-templates/scripts/orchestrator.ts +539 -0
package/.agents/skills/workspace-maxxing/.workspace-templates/scripts/scaffold.ts +282 -0
package/.agents/skills/workspace-maxxing/.workspace-templates/scripts/validate.ts +452 -0
package/.agents/skills/workspace-maxxing/.workspace-templates/skills/architecture/SKILL.md +95 -0
package/.agents/skills/workspace-maxxing/.workspace-templates/skills/fixer/SKILL.md +109 -0
package/.agents/skills/workspace-maxxing/.workspace-templates/skills/iteration/SKILL.md +89 -0
package/.agents/skills/workspace-maxxing/.workspace-templates/skills/prompt-engineering/SKILL.md +87 -0
package/.agents/skills/workspace-maxxing/.workspace-templates/skills/research/SKILL.md +94 -0
package/.agents/skills/workspace-maxxing/.workspace-templates/skills/testing/SKILL.md +89 -0
package/.agents/skills/workspace-maxxing/.workspace-templates/skills/tooling/SKILL.md +87 -0
package/.agents/skills/workspace-maxxing/.workspace-templates/skills/validation/SKILL.md +103 -0
package/.agents/skills/workspace-maxxing/.workspace-templates/skills/worker/SKILL.md +79 -0
package/.agents/skills/workspace-maxxing/.workspace-templates/workspace/00-meta/CONTEXT.md +6 -0
package/.agents/skills/workspace-maxxing/.workspace-templates/workspace/00-meta/execution-log.md +27 -0
package/.agents/skills/workspace-maxxing/.workspace-templates/workspace/01-input/CONTEXT.md +29 -0
package/.agents/skills/workspace-maxxing/.workspace-templates/workspace/02-process/CONTEXT.md +29 -0
package/.agents/skills/workspace-maxxing/.workspace-templates/workspace/03-output/CONTEXT.md +29 -0
package/.agents/skills/workspace-maxxing/.workspace-templates/workspace/README.md +14 -0
package/.agents/skills/workspace-maxxing/SKILL.md +312 -0
package/.agents/skills/workspace-maxxing/scripts/benchmark.ts +171 -0
package/.agents/skills/workspace-maxxing/scripts/dispatch.ts +473 -0
package/.agents/skills/workspace-maxxing/scripts/generate-tests.ts +158 -0
package/.agents/skills/workspace-maxxing/scripts/install-tool.ts +82 -0
package/.agents/skills/workspace-maxxing/scripts/iterate.ts +265 -0
package/.agents/skills/workspace-maxxing/scripts/orchestrator.ts +539 -0
package/.agents/skills/workspace-maxxing/scripts/scaffold.ts +282 -0
package/.agents/skills/workspace-maxxing/scripts/validate.ts +452 -0
package/README.md +144 -0
package/dist/agent-creator.d.ts +9 -0
package/dist/agent-creator.d.ts.map +1 -0
package/dist/agent-creator.js +199 -0
package/dist/agent-creator.js.map +1 -0
package/dist/agent-iterator.d.ts +38 -0
package/dist/agent-iterator.d.ts.map +1 -0
package/dist/agent-iterator.js +327 -0
package/dist/agent-iterator.js.map +1 -0
package/dist/index.d.ts +3 -0
package/dist/index.d.ts.map +1 -0
package/dist/index.js +197 -0
package/dist/index.js.map +1 -0
package/dist/install.d.ts +18 -0
package/dist/install.d.ts.map +1 -0
package/dist/install.js +117 -0
package/dist/install.js.map +1 -0
package/dist/platforms/claude.d.ts +7 -0
package/dist/platforms/claude.d.ts.map +1 -0
package/dist/platforms/claude.js +70 -0
package/dist/platforms/claude.js.map +1 -0
package/dist/platforms/copilot.d.ts +7 -0
package/dist/platforms/copilot.d.ts.map +1 -0
package/dist/platforms/copilot.js +75 -0
package/dist/platforms/copilot.js.map +1 -0
package/dist/platforms/gemini.d.ts +7 -0
package/dist/platforms/gemini.d.ts.map +1 -0
package/dist/platforms/gemini.js +81 -0
package/dist/platforms/gemini.js.map +1 -0
package/dist/platforms/index.d.ts +8 -0
package/dist/platforms/index.d.ts.map +1 -0
package/dist/platforms/index.js +41 -0
package/dist/platforms/index.js.map +1 -0
package/dist/platforms/opencode.d.ts +7 -0
package/dist/platforms/opencode.d.ts.map +1 -0
package/dist/platforms/opencode.js +70 -0
package/dist/platforms/opencode.js.map +1 -0
package/dist/scripts/benchmark.d.ts +20 -0
package/dist/scripts/benchmark.d.ts.map +1 -0
package/dist/scripts/benchmark.js +170 -0
package/dist/scripts/benchmark.js.map +1 -0
package/dist/scripts/dispatch.d.ts +32 -0
package/dist/scripts/dispatch.d.ts.map +1 -0
package/dist/scripts/dispatch.js +386 -0
package/dist/scripts/dispatch.js.map +1 -0
package/dist/scripts/generate-tests.d.ts +11 -0
package/dist/scripts/generate-tests.d.ts.map +1 -0
package/dist/scripts/generate-tests.js +118 -0
package/dist/scripts/generate-tests.js.map +1 -0
package/dist/scripts/install-tool.d.ts +8 -0
package/dist/scripts/install-tool.d.ts.map +1 -0
package/dist/scripts/install-tool.js +98 -0
package/dist/scripts/install-tool.js.map +1 -0
package/dist/scripts/iterate.d.ts +44 -0
package/dist/scripts/iterate.d.ts.map +1 -0
package/dist/scripts/iterate.js +260 -0
package/dist/scripts/iterate.js.map +1 -0
package/dist/scripts/orchestrator.d.ts +40 -0
package/dist/scripts/orchestrator.d.ts.map +1 -0
package/dist/scripts/orchestrator.js +378 -0
package/dist/scripts/orchestrator.js.map +1 -0
package/dist/scripts/scaffold.d.ts +8 -0
package/dist/scripts/scaffold.d.ts.map +1 -0
package/dist/scripts/scaffold.js +279 -0
package/dist/scripts/scaffold.js.map +1 -0
package/dist/scripts/validate.d.ts +11 -0
package/dist/scripts/validate.d.ts.map +1 -0
package/dist/scripts/validate.js +472 -0
package/dist/scripts/validate.js.map +1 -0
package/docs/superpowers/plans/2026-04-07-autonomous-iteration-plan.md +1123 -0
package/docs/superpowers/plans/2026-04-07-autonomous-iteration-sub-agent-batches.md +1923 -0
package/docs/superpowers/plans/2026-04-07-autonomous-workflow-sub-skill-plan.md +1505 -0
package/docs/superpowers/plans/2026-04-07-benchmarking-multi-agent-plan.md +854 -0
package/docs/superpowers/plans/2026-04-07-workspace-builder-logic-plan.md +1426 -0
package/docs/superpowers/plans/2026-04-07-workspace-maxxing-plan.md +1299 -0
package/docs/superpowers/plans/2026-04-08-session-294c-subagent-invocation-plan.md +320 -0
package/docs/superpowers/plans/2026-04-08-workflow-prompt-hardening-plan.md +1025 -0
package/docs/superpowers/plans/2026-04-12-workspace-agent-creation-plan.md +992 -0
package/docs/superpowers/specs/2026-04-07-autonomous-iteration-design.md +214 -0
package/docs/superpowers/specs/2026-04-07-autonomous-iteration-sub-agent-batches-design.md +188 -0
package/docs/superpowers/specs/2026-04-07-autonomous-workflow-sub-skill-design.md +137 -0
package/docs/superpowers/specs/2026-04-07-benchmarking-multi-agent-design.md +105 -0
package/docs/superpowers/specs/2026-04-07-workspace-builder-logic-design.md +179 -0
package/docs/superpowers/specs/2026-04-07-workspace-maxxing-design.md +227 -0
package/docs/superpowers/specs/2026-04-08-session-294c-subagent-invocation-design.md +265 -0
package/docs/superpowers/specs/2026-04-08-workflow-prompt-hardening-design.md +146 -0
package/docs/superpowers/specs/2026-04-12-workspace-agent-creation-design.md +239 -0
package/jest.config.js +8 -0
package/package.json +32 -0
package/src/agent-creator.ts +180 -0
package/src/agent-iterator.ts +397 -0
package/src/index.ts +189 -0
package/src/install.ts +105 -0
package/src/platforms/claude.ts +40 -0
package/src/platforms/copilot.ts +50 -0
package/src/platforms/gemini.ts +55 -0
package/src/platforms/index.ts +45 -0
package/src/platforms/opencode.ts +41 -0
package/src/scripts/benchmark.ts +171 -0
package/src/scripts/dispatch.ts +473 -0
package/src/scripts/generate-tests.ts +112 -0
package/src/scripts/install-tool.ts +82 -0
package/src/scripts/iterate.ts +271 -0
package/src/scripts/orchestrator.ts +539 -0
package/src/scripts/scaffold.ts +282 -0
package/src/scripts/validate.ts +516 -0
package/templates/.workspace-templates/CONTEXT.md +44 -0
package/templates/.workspace-templates/SYSTEM.md +44 -0
package/templates/.workspace-templates/references/anti-patterns.md +16 -0
package/templates/.workspace-templates/references/iron-laws.md +26 -0
package/templates/.workspace-templates/references/reporting-format.md +52 -0
package/templates/.workspace-templates/scripts/benchmark.ts +171 -0
package/templates/.workspace-templates/scripts/dispatch.ts +473 -0
package/templates/.workspace-templates/scripts/generate-tests.ts +158 -0
package/templates/.workspace-templates/scripts/install-tool.ts +82 -0
package/templates/.workspace-templates/scripts/iterate.ts +265 -0
package/templates/.workspace-templates/scripts/orchestrator.ts +539 -0
package/templates/.workspace-templates/scripts/scaffold.ts +282 -0
package/templates/.workspace-templates/scripts/validate.ts +452 -0
package/templates/.workspace-templates/skills/architecture/SKILL.md +95 -0
package/templates/.workspace-templates/skills/fixer/SKILL.md +109 -0
package/templates/.workspace-templates/skills/iteration/SKILL.md +89 -0
package/templates/.workspace-templates/skills/prompt-engineering/SKILL.md +87 -0
package/templates/.workspace-templates/skills/research/SKILL.md +94 -0
package/templates/.workspace-templates/skills/testing/SKILL.md +89 -0
package/templates/.workspace-templates/skills/tooling/SKILL.md +87 -0
package/templates/.workspace-templates/skills/validation/SKILL.md +103 -0
package/templates/.workspace-templates/skills/worker/SKILL.md +79 -0
package/templates/.workspace-templates/workspace/00-meta/CONTEXT.md +6 -0
package/templates/.workspace-templates/workspace/00-meta/execution-log.md +27 -0
package/templates/.workspace-templates/workspace/01-input/CONTEXT.md +29 -0
package/templates/.workspace-templates/workspace/02-process/CONTEXT.md +29 -0
package/templates/.workspace-templates/workspace/03-output/CONTEXT.md +29 -0
package/templates/.workspace-templates/workspace/README.md +14 -0
package/templates/SKILL.md +347 -0
package/tests/benchmark.test.ts +158 -0
package/tests/cli.test.ts +109 -0
package/tests/dispatch-parallel.test.ts +124 -0
package/tests/dispatch.test.ts +218 -0
package/tests/fixer-skill.test.ts +203 -0
package/tests/generate-tests.test.ts +101 -0
package/tests/install-tool.test.ts +141 -0
package/tests/install.test.ts +144 -0
package/tests/integration.test.ts +324 -0
package/tests/iterate.test.ts +219 -0
package/tests/orchestrator.test.ts +710 -0
package/tests/scaffold.test.ts +238 -0
package/tests/templates-enhanced.test.ts +208 -0
package/tests/templates.test.ts +219 -0
package/tests/validate.test.ts +421 -0
package/tests/validation-enhanced.test.ts +303 -0
package/tests/worker-skill.test.ts +88 -0
package/tsconfig.json +19 -0
package/workspace/00-meta/CONTEXT.md +3 -0
package/workspace/00-meta/execution-log.md +17 -0
package/workspace/00-meta/tools.md +11 -0
package/workspace/01-input/CONTEXT.md +27 -0
package/workspace/CONTEXT.md +35 -0
package/workspace/README.md +14 -0
package/workspace/SYSTEM.md +36 -0
package/workspace-maxxing-0.1.0.tgz +0 -0

package/tests/orchestrator.test.ts ADDED

@@ -0,0 +1,710 @@
+import * as fs from 'fs';
+import * as path from 'path';
+import * as os from 'os';
+import { splitIntoBatches, createBatchDirectory, getBatchDirectory, createTestCaseDirectory, runBatchLifecycle } from '../src/scripts/orchestrator';
+import * as dispatch from '../src/scripts/dispatch';
+import * as generateTests from '../src/scripts/generate-tests';
+import * as benchmark from '../src/scripts/benchmark';
+describe('orchestrator', () => {
+  let tempDir: string; // per-test scratch directory; (re)assigned in beforeEach, removed in afterEach
+  beforeEach(() => { // fresh uniquely-named directory under the OS temp dir for every test
+    tempDir = fs.mkdtempSync(path.join(os.tmpdir(), 'orchestrator-test-'));
+  });
+  afterEach(() => { // teardown: delete the scratch directory and undo all spies
+    fs.rmSync(tempDir, { recursive: true, force: true }); // force: do not throw if the path no longer exists
+    jest.restoreAllMocks(); // restores every jest.spyOn target (dispatch, generateTests, benchmark, Date.now) to the real implementation
+  });
+  describe('splitIntoBatches', () => { // chunking of a flat list into fixed-size batches
+    it('splits items into batches of specified size', () => {
+      const items = ['tc-001', 'tc-002', 'tc-003', 'tc-004', 'tc-005'];
+      const result = splitIntoBatches(items, 3); // 5 items at size 3 -> one full batch plus a remainder of 2
+      expect(result).toHaveLength(2);
+      expect(result[0]).toEqual(['tc-001', 'tc-002', 'tc-003']);
+      expect(result[1]).toEqual(['tc-004', 'tc-005']);
+    });
+    it('returns single batch when items fit', () => {
+      const items = ['tc-001', 'tc-002'];
+      const result = splitIntoBatches(items, 3); // fewer items than the batch size -> one short batch
+      expect(result).toHaveLength(1);
+      expect(result[0]).toEqual(['tc-001', 'tc-002']);
+    });
+    it('returns empty array for empty input', () => {
+      const result = splitIntoBatches([], 3);
+      expect(result).toEqual([]); // no batches at all, rather than one empty batch
+    });
+    it('uses default batch size of 3 when not specified', () => {
+      const items = ['a', 'b', 'c', 'd', 'e', 'f', 'g'];
+      const result = splitIntoBatches(items); // batchSize deliberately omitted to exercise the default
+      expect(result).toHaveLength(3);
+      expect(result[0]).toHaveLength(3);
+      expect(result[1]).toHaveLength(3);
+      expect(result[2]).toHaveLength(1); // 7 items -> 3 + 3 + 1
+    });
+    it('throws for invalid batch sizes to prevent non-terminating loops', () => { // zero, negative, fractional and NaN must all be rejected
+      expect(() => splitIntoBatches(['tc-001'], 0)).toThrow(/Invalid batchSize/);
+      expect(() => splitIntoBatches(['tc-001'], -1)).toThrow(/Invalid batchSize/);
+      expect(() => splitIntoBatches(['tc-001'], 1.5)).toThrow(/Invalid batchSize/);
+      expect(() => splitIntoBatches(['tc-001'], Number.NaN)).toThrow(/Invalid batchSize/);
+    });
+  });
+  describe('batch directory management', () => { // on-disk layout helpers; all paths live under the per-test tempDir
+    it('creates batch directory structure', () => {
+      const baseDir = path.join(tempDir, '.agents', 'iteration'); // baseDir itself does not exist yet at this point
+      const result = createBatchDirectory(baseDir, 1);
+      expect(fs.existsSync(result)).toBe(true);
+      expect(result).toContain('batch-01'); // batch number 1 is expected to appear zero-padded in the directory name
+    });
+    it('returns existing batch directory path', () => {
+      const baseDir = path.join(tempDir, '.agents', 'iteration');
+      fs.mkdirSync(path.join(baseDir, 'batch-02'), { recursive: true }); // pre-create by hand; only the returned path is asserted below
+      const result = getBatchDirectory(baseDir, 2);
+      expect(result).toContain('batch-02');
+    });
+    it('creates test case directory within batch', () => {
+      const baseDir = path.join(tempDir, '.agents', 'iteration');
+      const batchDir = createBatchDirectory(baseDir, 1);
+      const tcDir = createTestCaseDirectory(batchDir, 'tc-001'); // test-case id is expected to appear in the created path
+      expect(fs.existsSync(tcDir)).toBe(true);
+      expect(tcDir).toContain('tc-001');
+    });
+  });
+  describe('batch lifecycle', () => {
+    it('rejects invalid numeric config values before running lifecycle', () => { // one bad value per call; each error message must name the offending key
+      expect(() => runBatchLifecycle(tempDir, { batchSize: 0 })).toThrow(/Invalid batchSize/);
+      expect(() => runBatchLifecycle(tempDir, { maxFixRetries: -1 })).toThrow(/Invalid maxFixRetries/);
+      expect(() => runBatchLifecycle(tempDir, { scoreThreshold: 101 })).toThrow(/Invalid scoreThreshold/);
+      expect(() => runBatchLifecycle(tempDir, { workerTimeout: 0 })).toThrow(/Invalid workerTimeout/);
+    });
+    it('prefers existing agent-generated test-cases.json over generate fallback', () => {
+      const iterationDir = path.join(tempDir, '.agents', 'iteration');
+      fs.mkdirSync(iterationDir, { recursive: true });
+      fs.writeFileSync( // seed a test-cases.json in the bare-array form with explicit ids
+        path.join(iterationDir, 'test-cases.json'),
+        JSON.stringify([
+          { id: 'tc-a', input: { payload: 'a' }, expected: { criteria: ['a'] } },
+          { id: 'tc-b', input: { payload: 'b' }, expected: { criteria: ['b'] } },
+        ], null, 2),
+      );
+      const generateSpy = jest.spyOn(generateTests, 'generateTestCases').mockReturnValue({ // stubbed only so an accidental call can be detected; asserted not called below
+        testCases: [
+          { stage: 'fallback', type: 'sample', input: 'x', expected: 'x' },
+        ],
+      });
+      const dispatchSpy = jest.spyOn(dispatch, 'dispatchParallel').mockImplementation((invocations) => { // echo every invocation back as a passed result
+        return invocations.map((inv) => ({
+          skill: inv.skill,
+          status: 'passed',
+          batchId: inv.batchId,
+          testCaseId: inv.testCaseId,
+          timestamp: '2026-04-07T00:00:00.000Z',
+          findings: [],
+          recommendations: ['continue'],
+          metrics: { latencyMs: 5 },
+          nextSkill: 'validation',
+        }));
+      });
+      jest.spyOn(benchmark, 'calculateBenchmark').mockReturnValue({ // fixed benchmark result; both scores are above the scoreThreshold of 85 used below
+        workspace: 'test',
+        agent: 'test-agent',
+        timestamp: '2026-04-07T00:00:00.000Z',
+        rawScore: 90,
+        weightedScore: 95,
+        stages: [],
+        fixSuggestions: [],
+        improvementPotential: false,
+      });
+      const result = runBatchLifecycle(tempDir, {
+        batchSize: 2,
+        scoreThreshold: 85,
+        maxFixRetries: 1,
+        workerTimeout: 300,
+      });
+      expect(result.totalBatches).toBe(1); // two seeded cases with batchSize 2 -> a single batch
+      expect(generateSpy).not.toHaveBeenCalled(); // the existing file must win over the generator
+      expect(dispatchSpy).toHaveBeenCalledTimes(1);
+      expect(dispatchSpy.mock.calls[0][0]).toEqual([ // ids come from the seeded file (tc-a / tc-b)
+        { skill: 'worker', batchId: 1, testCaseId: 'tc-a' },
+        { skill: 'worker', batchId: 1, testCaseId: 'tc-b' },
+      ]);
+    });
+    it('throws when existing test-cases.json has invalid top-level structure', () => {
+      const iterationDir = path.join(tempDir, '.agents', 'iteration');
+      fs.mkdirSync(iterationDir, { recursive: true });
+      fs.writeFileSync(path.join(iterationDir, 'test-cases.json'), JSON.stringify({ foo: 'bar' }, null, 2)); // an object that is neither an array nor has a testCases array
+      expect(() => runBatchLifecycle(tempDir, {
+        batchSize: 1,
+        scoreThreshold: 85,
+        maxFixRetries: 1,
+        workerTimeout: 300,
+      })).toThrow(/test-cases.json must be an array or an object with a testCases array/); // NOTE(review): the '.' in this regex is unescaped, so it matches any character
+    });
+    it('throws when any test-case is missing id/input/expected fields', () => {
+      const iterationDir = path.join(tempDir, '.agents', 'iteration');
+      fs.mkdirSync(iterationDir, { recursive: true });
+      fs.writeFileSync(
+        path.join(iterationDir, 'test-cases.json'),
+        JSON.stringify([
+          { id: 'tc-001', input: { payload: 'a' }, expected: { criteria: ['a'] } },
+          { id: 'tc-002', input: { payload: 'b' } }, // deliberately missing `expected`
+        ], null, 2),
+      );
+      jest.spyOn(dispatch, 'dispatchParallel').mockImplementation((invocations) => { // passing stub, so a throw can only come from test-case validation
+        return invocations.map((inv) => ({
+          skill: inv.skill,
+          status: 'passed',
+          batchId: inv.batchId,
+          testCaseId: inv.testCaseId,
+          timestamp: '2026-04-07T00:00:00.000Z',
+          findings: [],
+          recommendations: ['continue'],
+          metrics: { latencyMs: 5 },
+          nextSkill: 'validation',
+        }));
+      });
+      jest.spyOn(benchmark, 'calculateBenchmark').mockReturnValue({ // scores above the threshold for the same reason
+        workspace: 'test',
+        agent: 'test-agent',
+        timestamp: '2026-04-07T00:00:00.000Z',
+        rawScore: 90,
+        weightedScore: 95,
+        stages: [],
+        fixSuggestions: [],
+        improvementPotential: false,
+      });
+      expect(() => runBatchLifecycle(tempDir, {
+        batchSize: 1,
+        scoreThreshold: 85,
+        maxFixRetries: 1,
+        workerTimeout: 300,
+      })).toThrow(/must include id, input, and expected/);
+    });
+    it('throws when test-case ids are duplicated', () => {
+      const iterationDir = path.join(tempDir, '.agents', 'iteration');
+      fs.mkdirSync(iterationDir, { recursive: true });
+      fs.writeFileSync(
+        path.join(iterationDir, 'test-cases.json'),
+        JSON.stringify([
+          { id: 'tc-001', input: { payload: 'a' }, expected: { criteria: ['a'] } },
+          { id: 'tc-001', input: { payload: 'b' }, expected: { criteria: ['b'] } }, // same id as the entry above; otherwise well-formed
+        ], null, 2),
+      );
+      jest.spyOn(dispatch, 'dispatchParallel').mockImplementation((invocations) => { // passing stub, so a throw can only come from the duplicate-id check
+        return invocations.map((inv) => ({
+          skill: inv.skill,
+          status: 'passed',
+          batchId: inv.batchId,
+          testCaseId: inv.testCaseId,
+          timestamp: '2026-04-07T00:00:00.000Z',
+          findings: [],
+          recommendations: ['continue'],
+          metrics: { latencyMs: 5 },
+          nextSkill: 'validation',
+        }));
+      });
+      jest.spyOn(benchmark, 'calculateBenchmark').mockReturnValue({ // scores above the threshold for the same reason
+        workspace: 'test',
+        agent: 'test-agent',
+        timestamp: '2026-04-07T00:00:00.000Z',
+        rawScore: 90,
+        weightedScore: 95,
+        stages: [],
+        fixSuggestions: [],
+        improvementPotential: false,
+      });
+      expect(() => runBatchLifecycle(tempDir, {
+        batchSize: 1,
+        scoreThreshold: 85,
+        maxFixRetries: 1,
+        workerTimeout: 300,
+      })).toThrow(/Duplicate testCaseId/);
+    });
+    it('runs full lifecycle and writes summary for passing batches', () => { // no test-cases.json is seeded here, so the generator mock supplies the cases
+      jest.spyOn(generateTests, 'generateTestCases').mockImplementation((workspacePath, outputPath) => {
+        const payload = { // four generated cases; note they carry no `id` field
+          testCases: [
+            { stage: '01-input', type: 'sample' as const, input: 'a', expected: 'a' },
+            { stage: '02-output', type: 'sample' as const, input: 'b', expected: 'b' },
+            { stage: '03-review', type: 'sample' as const, input: 'c', expected: 'c' },
+            { stage: '04-wrap', type: 'sample' as const, input: 'd', expected: 'd' },
+          ],
+        };
+        if (outputPath) { // write the payload to disk when a path is supplied, so the file assertions below can read it
+          fs.writeFileSync(outputPath, JSON.stringify(payload, null, 2));
+        }
+        return payload;
+      });
+      const dispatchSpy = jest.spyOn(dispatch, 'dispatchParallel').mockImplementation((invocations) => { // echo every invocation back as a passed result
+        return invocations.map((inv) => ({
+          skill: inv.skill,
+          status: 'passed',
+          batchId: inv.batchId,
+          testCaseId: inv.testCaseId,
+          timestamp: '2026-04-07T00:00:00.000Z',
+          findings: [],
+          recommendations: ['continue'],
+          metrics: { latencyMs: 10 },
+          nextSkill: 'validation',
+        }));
+      });
+      jest.spyOn(benchmark, 'calculateBenchmark') // two queued results, consumed in call order
+        .mockReturnValueOnce({
+          workspace: 'test',
+          agent: 'test-agent',
+          timestamp: '2026-04-07T00:00:00.000Z',
+          rawScore: 80,
+          weightedScore: 92,
+          stages: [],
+          fixSuggestions: [],
+          improvementPotential: false,
+        })
+        .mockReturnValueOnce({
+          workspace: 'test',
+          agent: 'test-agent',
+          timestamp: '2026-04-07T00:00:00.000Z',
+          rawScore: 78,
+          weightedScore: 88,
+          stages: [],
+          fixSuggestions: [],
+          improvementPotential: false,
+        });
+      const result = runBatchLifecycle(tempDir, {
+        batchSize: 2,
+        maxFixRetries: 2,
+        scoreThreshold: 85,
+        workerTimeout: 300,
+      });
+      expect(result.totalBatches).toBe(2); // four cases at batchSize 2
+      expect(result.passedBatches).toBe(2); // NOTE(review): rawScore (80, 78) is below 85 while weightedScore (92, 88) is above, so the threshold presumably applies to weightedScore — confirm in orchestrator.ts
+      expect(result.failedBatches).toBe(0);
+      expect(result.escalatedBatches).toBe(0);
+      expect(result.overallScore).toBe(90); // equals the mean of the two weightedScore values (92 and 88)
+      expect(result.batchReports.map((r) => r.status)).toEqual(['passed', 'passed']);
+      expect(dispatchSpy).toHaveBeenCalledTimes(2); // one worker dispatch per batch, no fixer dispatch
+      expect(dispatchSpy.mock.calls[0][0]).toEqual([ // generated cases are expected to be addressed as tc-001..tc-004 in order
+        { skill: 'worker', batchId: 1, testCaseId: 'tc-001' },
+        { skill: 'worker', batchId: 1, testCaseId: 'tc-002' },
+      ]);
+      expect(dispatchSpy.mock.calls[1][0]).toEqual([
+        { skill: 'worker', batchId: 2, testCaseId: 'tc-003' },
+        { skill: 'worker', batchId: 2, testCaseId: 'tc-004' },
+      ]);
+      const summaryPath = path.join(tempDir, '.agents', 'iteration', 'summary.json');
+      expect(fs.existsSync(summaryPath)).toBe(true);
+      const testCasesPath = path.join(tempDir, '.agents', 'iteration', 'test-cases.json');
+      expect(fs.existsSync(testCasesPath)).toBe(true);
+      const savedTestCases = JSON.parse(fs.readFileSync(testCasesPath, 'utf-8'));
+      expect(Array.isArray(savedTestCases.testCases)).toBe(true); // persisted file keeps the { testCases: [...] } wrapper form
+      expect(savedTestCases.testCases).toHaveLength(4);
+      const savedSummary = JSON.parse(fs.readFileSync(summaryPath, 'utf-8'));
+      expect(savedSummary.totalBatches).toBe(2); // on-disk summary must agree with the returned result
+      expect(savedSummary.overallScore).toBe(90);
+    });
+    it('forwards sub-agent runner options to dispatch calls', () => {
+      jest.spyOn(generateTests, 'generateTestCases').mockReturnValue({ // a single generated case is enough to trigger one dispatch
+        testCases: [
+          { stage: '01-input', type: 'sample', input: 'a', expected: 'a' },
+        ],
+      });
+      const dispatchSpy = jest.spyOn(dispatch, 'dispatchParallel').mockImplementation((invocations) => { // echo every invocation back as a passed result
+        return invocations.map((inv) => ({
+          skill: inv.skill,
+          status: 'passed',
+          batchId: inv.batchId,
+          testCaseId: inv.testCaseId,
+          timestamp: '2026-04-07T00:00:00.000Z',
+          findings: [],
+          recommendations: ['continue'],
+          metrics: { latencyMs: 10 },
+          nextSkill: 'validation',
+        }));
+      });
+      jest.spyOn(benchmark, 'calculateBenchmark').mockReturnValue({ // scores above the threshold so no fixer path is taken
+        workspace: 'test',
+        agent: 'test-agent',
+        timestamp: '2026-04-07T00:00:00.000Z',
+        rawScore: 90,
+        weightedScore: 95,
+        stages: [],
+        fixSuggestions: [],
+        improvementPotential: false,
+      });
+      runBatchLifecycle(tempDir, {
+        batchSize: 1,
+        scoreThreshold: 85,
+        maxFixRetries: 1,
+        workerTimeout: 300,
+        subagentRunner: `${process.execPath} fake-runner.js {skill} {batchId} {testCaseId}`, // command template; the mock means fake-runner.js is never actually executed
+      });
+      expect(dispatchSpy).toHaveBeenCalled();
+      expect(dispatchSpy.mock.calls[0][2]).toEqual(expect.objectContaining({ // third argument of the first dispatch call is the options object
+        workspacePath: tempDir,
+        runnerCommand: `${process.execPath} fake-runner.js {skill} {batchId} {testCaseId}`, // subagentRunner arrives as runnerCommand, placeholders unexpanded
+        runnerTimeoutSeconds: 300, // workerTimeout arrives as runnerTimeoutSeconds
+      }));
+    });
+    it('uses worker timeout to treat long worker dispatch as failed and trigger fixer retry', () => {
+      jest.spyOn(generateTests, 'generateTestCases').mockReturnValue({
+        testCases: [
+          { stage: '01-input', type: 'sample', input: 'slow', expected: 'slow' },
+        ],
+      });
+      const dispatchSpy = jest.spyOn(dispatch, 'dispatchParallel').mockImplementation((invocations) => { // always reports 'passed', so only the elapsed-time check can mark the worker as failed
+        return invocations.map((inv) => ({
+          skill: inv.skill,
+          status: 'passed',
+          batchId: inv.batchId,
+          testCaseId: inv.testCaseId,
+          timestamp: '2026-04-07T00:00:00.000Z',
+          findings: [],
+          recommendations: ['continue'],
+          metrics: { latencyMs: 10 },
+          nextSkill: 'validation',
+        }));
+      });
+      const nowValues = [0, 2001, 3000, 3001]; // scripted clock: first pair of readings is 2001 ms apart, second pair only 1 ms apart
+      jest.spyOn(Date, 'now').mockImplementation(() => nowValues.shift() ?? 3001); // returns the scripted values in order, then 3001 once the list is exhausted
+      jest.spyOn(benchmark, 'calculateBenchmark') // three queued results, all with weightedScore 98 (above the threshold of 95)
+        .mockReturnValueOnce({
+          workspace: 'test',
+          agent: 'test-agent',
+          timestamp: '2026-04-07T00:00:00.000Z',
+          rawScore: 90,
+          weightedScore: 98,
+          stages: [],
+          fixSuggestions: [],
+          improvementPotential: false,
+        })
+        .mockReturnValueOnce({
+          workspace: 'test',
+          agent: 'test-agent',
+          timestamp: '2026-04-07T00:00:00.000Z',
+          rawScore: 91,
+          weightedScore: 98,
+          stages: [],
+          fixSuggestions: [],
+          improvementPotential: false,
+        })
+        .mockReturnValueOnce({
+          workspace: 'test',
+          agent: 'test-agent',
+          timestamp: '2026-04-07T00:00:00.000Z',
+          rawScore: 91,
+          weightedScore: 98,
+          stages: [],
+          fixSuggestions: [],
+          improvementPotential: false,
+        });
+      const result = runBatchLifecycle(tempDir, {
+        batchSize: 1,
+        maxFixRetries: 2,
+        scoreThreshold: 95,
+        workerTimeout: 1, // NOTE(review): presumably seconds (workerTimeout is forwarded as runnerTimeoutSeconds) — confirm; 2001 ms elapsed would then exceed it
+      });
+      expect(result.totalBatches).toBe(1);
+      expect(result.passedBatches).toBe(1); // the batch still ends up passed after the fixer round
+      expect(result.batchReports[0].status).toBe('passed');
+      expect(result.batchReports[0].findings.join(' ')).toMatch(/timeout|Timeout/); // the timeout must be recorded in the findings even though the batch recovered
+      expect(dispatchSpy).toHaveBeenCalledTimes(2); // one worker dispatch, then exactly one fixer dispatch
+      expect(dispatchSpy.mock.calls[0][0][0].skill).toBe('worker');
+      expect(dispatchSpy.mock.calls[1][0][0].skill).toBe('fixer');
+    });
+    it('marks batch as failed when fixes clear worker failures but score remains below threshold', () => {
+      jest.spyOn(generateTests, 'generateTestCases').mockReturnValue({
+        testCases: [
+          { stage: '01-input', type: 'sample', input: 'needs-work', expected: 'better' },
+        ],
+      });
+      const dispatchSpy = jest.spyOn(dispatch, 'dispatchParallel').mockImplementation((invocations) => {
+        if (invocations[0]?.skill === 'worker') { // worker dispatches always fail; any other skill falls through to the passing stub below
+          return [{
+            skill: 'worker',
+            status: 'failed',
+            batchId: 1,
+            testCaseId: 'tc-001',
+            timestamp: '2026-04-07T00:00:00.000Z',
+            findings: ['output missing'],
+            recommendations: ['run fixer'],
+            metrics: { latencyMs: 20 },
+            nextSkill: 'fixer',
+          }];
+        }
+        return invocations.map((inv) => ({ // non-worker (fixer) invocations are echoed back as passed
+          skill: inv.skill,
+          status: 'passed',
+          batchId: inv.batchId,
+          testCaseId: inv.testCaseId,
+          timestamp: '2026-04-07T00:00:00.000Z',
+          findings: ['fixed now'],
+          recommendations: ['re-run benchmark'],
+          metrics: { latencyMs: 15 },
+          nextSkill: 'validation',
+        }));
+      });
+      const benchmarkSpy = jest.spyOn(benchmark, 'calculateBenchmark') // three queued results; weightedScore stays at 80, below the threshold of 95, in all of them
+        .mockReturnValueOnce({
+          workspace: 'test',
+          agent: 'test-agent',
+          timestamp: '2026-04-07T00:00:00.000Z',
+          rawScore: 60,
+          weightedScore: 80,
+          stages: [],
+          fixSuggestions: ['improve output'],
+          improvementPotential: true,
+        })
+        .mockReturnValueOnce({
+          workspace: 'test',
+          agent: 'test-agent',
+          timestamp: '2026-04-07T00:00:00.000Z',
+          rawScore: 62,
+          weightedScore: 80,
+          stages: [],
+          fixSuggestions: ['keep improving'],
+          improvementPotential: true,
+        })
+        .mockReturnValueOnce({
+          workspace: 'test',
+          agent: 'test-agent',
+          timestamp: '2026-04-07T00:00:00.000Z',
+          rawScore: 62,
+          weightedScore: 80,
+          stages: [],
+          fixSuggestions: ['keep improving'],
+          improvementPotential: true,
+        });
+      const result = runBatchLifecycle(tempDir, {
+        batchSize: 1,
+        maxFixRetries: 3,
+        scoreThreshold: 95,
+        workerTimeout: 300,
+      });
+      expect(result.totalBatches).toBe(1);
+      expect(result.passedBatches).toBe(0);
+      expect(result.failedBatches).toBe(1);
+      expect(result.escalatedBatches).toBe(0); // a low score after a successful fix counts as failed, not escalated
+      expect(result.batchReports[0].status).toBe('failed');
+      expect(result.batchReports[0].findings.join(' ')).toMatch(/below threshold/);
+      expect(dispatchSpy).toHaveBeenCalledTimes(2); // only one fixer dispatch is expected even though maxFixRetries is 3
+      expect(dispatchSpy.mock.calls[0][0][0].skill).toBe('worker');
+      expect(dispatchSpy.mock.calls[1][0][0].skill).toBe('fixer');
+      expect(benchmarkSpy).toHaveBeenCalledTimes(3); // all three queued benchmark results are consumed
+    });
+    it('recovers from below-threshold batch after a successful fix attempt', () => {
+      jest.spyOn(generateTests, 'generateTestCases').mockReturnValue({
+        testCases: [
+          { stage: '01-input', type: 'sample', input: 'recover', expected: 'stable' },
+        ],
+      });
+      const dispatchSpy = jest.spyOn(dispatch, 'dispatchParallel').mockImplementation((invocations) => {
+        if (invocations[0]?.skill === 'worker') {
+          return [{
+            skill: 'worker',
+            status: 'failed',
+            batchId: 1,
+            testCaseId: 'tc-001',
+            timestamp: '2026-04-07T00:00:00.000Z',
+            findings: ['output missing'],
+            recommendations: ['run fixer'],
+            metrics: { latencyMs: 20 },
+            nextSkill: 'fixer',
+          }];
+        }
+        return invocations.map((inv) => ({
+          skill: inv.skill,
+          status: 'passed',
+          batchId: inv.batchId,
+          testCaseId: inv.testCaseId,
+          timestamp: '2026-04-07T00:00:00.000Z',
+          findings: ['fixed now'],
+          recommendations: ['continue'],
+          metrics: { latencyMs: 15 },
+          nextSkill: 'validation',
+        }));
+      });
+      jest.spyOn(benchmark, 'calculateBenchmark')
+        .mockReturnValueOnce({
+          workspace: 'test',
+          agent: 'test-agent',
+          timestamp: '2026-04-07T00:00:00.000Z',
+          rawScore: 60,
+          weightedScore: 80,
+          stages: [],
+          fixSuggestions: ['improve output'],
+          improvementPotential: true,
+        })
+        .mockReturnValueOnce({
+          workspace: 'test',
+          agent: 'test-agent',
+          timestamp: '2026-04-07T00:00:00.000Z',
+          rawScore: 78,
+          weightedScore: 97,
+          stages: [],
+          fixSuggestions: [],
+          improvementPotential: false,
+        })
+        .mockReturnValueOnce({
+          workspace: 'test',
+          agent: 'test-agent',
+          timestamp: '2026-04-07T00:00:00.000Z',
+          rawScore: 78,
+          weightedScore: 97,
+          stages: [],
+          fixSuggestions: [],
+          improvementPotential: false,
+        });
+      const result = runBatchLifecycle(tempDir, {
+        batchSize: 1,
+        maxFixRetries: 3,
+        scoreThreshold: 95,
+        workerTimeout: 300,
+      });
+      expect(result.totalBatches).toBe(1);
+      expect(result.passedBatches).toBe(1);
+      expect(result.failedBatches).toBe(0);
+      expect(result.escalatedBatches).toBe(0);
+      expect(result.batchReports[0].status).toBe('passed');
+      expect(result.batchReports[0].findings).toContain('Fix attempt 1: 1 fixes applied');
+      expect(dispatchSpy).toHaveBeenCalledTimes(2);
+      expect(dispatchSpy.mock.calls[0][0][0].skill).toBe('worker');
+      expect(dispatchSpy.mock.calls[1][0][0].skill).toBe('fixer');
+    });
+    it('runs fix loop and escalates when retries are exhausted below score threshold', () => {
+      jest.spyOn(generateTests, 'generateTestCases').mockReturnValue({
+        testCases: [
+          { stage: '01-input', type: 'sample', input: 'needs-fix', expected: 'fixed' },
+        ],
+      });
+      const dispatchSpy = jest.spyOn(dispatch, 'dispatchParallel').mockImplementation((invocations) => {
+        if (invocations[0]?.skill === 'worker') {
+          return [{
+            skill: 'worker',
+            status: 'failed',
+            batchId: 1,
+            testCaseId: 'tc-001',
+            timestamp: '2026-04-07T00:00:00.000Z',
+            findings: ['output missing'],
+            recommendations: ['run fixer'],
+            metrics: { latencyMs: 20 },
+            nextSkill: 'fixer',
+          }];
+        }
+        return invocations.map((inv) => ({
+          skill: inv.skill,
+          status: 'failed',
+          batchId: inv.batchId,
+          testCaseId: inv.testCaseId,
+          timestamp: '2026-04-07T00:00:00.000Z',
+          findings: ['still failing'],
+          recommendations: ['retry'],
+          metrics: { latencyMs: 15 },
+          nextSkill: 'validation',
+        }));
+      });
+      const benchmarkSpy = jest.spyOn(benchmark, 'calculateBenchmark').mockReturnValue({
+        workspace: 'test',
+        agent: 'test-agent',
+        timestamp: '2026-04-07T00:00:00.000Z',
+        rawScore: 60,
+        weightedScore: 90,
+        stages: [],
+        fixSuggestions: ['improve output'],
+        improvementPotential: true,
+      });
+      const result = runBatchLifecycle(tempDir, {
+        batchSize: 1,
+        maxFixRetries: 2,
+        scoreThreshold: 95,
+        workerTimeout: 300,
+      });
+      expect(result.totalBatches).toBe(1);
+      expect(result.passedBatches).toBe(0);
+      expect(result.failedBatches).toBe(0);
+      expect(result.escalatedBatches).toBe(1);
+      expect(result.batchReports[0].status).toBe('escalated');
+      expect(result.batchReports[0].findings).toContain('Max retries exhausted');
+      expect(dispatchSpy).toHaveBeenCalledTimes(3);
+      expect(dispatchSpy.mock.calls[0][0][0].skill).toBe('worker');
+      expect(dispatchSpy.mock.calls[1][0][0].skill).toBe('fixer');
+      expect(dispatchSpy.mock.calls[2][0][0].skill).toBe('fixer');
+      expect(benchmarkSpy).toHaveBeenCalledTimes(4);
+    });
+  });
+});