npm - opencastle - Versions diffs - 0.31.6 → 0.32.0 - Mend

opencastle 0.31.6 → 0.32.0

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (210)

package/LICENSE +93 -21
package/README.md +9 -3
package/bin/cli.mjs +15 -0
package/dist/cli/agents.d.ts.map +1 -1
package/dist/cli/agents.js +19 -5
package/dist/cli/agents.js.map +1 -1
package/dist/cli/artifacts-cli.d.ts +3 -0
package/dist/cli/artifacts-cli.d.ts.map +1 -0
package/dist/cli/artifacts-cli.js +36 -0
package/dist/cli/artifacts-cli.js.map +1 -0
package/dist/cli/baselines.d.ts.map +1 -1
package/dist/cli/baselines.js +11 -0
package/dist/cli/baselines.js.map +1 -1
package/dist/cli/convoy/artifacts.d.ts +25 -0
package/dist/cli/convoy/artifacts.d.ts.map +1 -0
package/dist/cli/convoy/artifacts.js +129 -0
package/dist/cli/convoy/artifacts.js.map +1 -0
package/dist/cli/convoy/artifacts.test.d.ts +2 -0
package/dist/cli/convoy/artifacts.test.d.ts.map +1 -0
package/dist/cli/convoy/artifacts.test.js +169 -0
package/dist/cli/convoy/artifacts.test.js.map +1 -0
package/dist/cli/convoy/compaction.d.ts +23 -0
package/dist/cli/convoy/compaction.d.ts.map +1 -0
package/dist/cli/convoy/compaction.js +117 -0
package/dist/cli/convoy/compaction.js.map +1 -0
package/dist/cli/convoy/compaction.test.d.ts +2 -0
package/dist/cli/convoy/compaction.test.d.ts.map +1 -0
package/dist/cli/convoy/compaction.test.js +205 -0
package/dist/cli/convoy/compaction.test.js.map +1 -0
package/dist/cli/convoy/contracts.d.ts +22 -0
package/dist/cli/convoy/contracts.d.ts.map +1 -0
package/dist/cli/convoy/contracts.js +254 -0
package/dist/cli/convoy/contracts.js.map +1 -0
package/dist/cli/convoy/contracts.test.d.ts +2 -0
package/dist/cli/convoy/contracts.test.d.ts.map +1 -0
package/dist/cli/convoy/contracts.test.js +239 -0
package/dist/cli/convoy/contracts.test.js.map +1 -0
package/dist/cli/convoy/dag-analysis.d.ts +40 -0
package/dist/cli/convoy/dag-analysis.d.ts.map +1 -0
package/dist/cli/convoy/dag-analysis.js +282 -0
package/dist/cli/convoy/dag-analysis.js.map +1 -0
package/dist/cli/convoy/dag-analysis.test.d.ts +2 -0
package/dist/cli/convoy/dag-analysis.test.d.ts.map +1 -0
package/dist/cli/convoy/dag-analysis.test.js +289 -0
package/dist/cli/convoy/dag-analysis.test.js.map +1 -0
package/dist/cli/convoy/effort-scaling.d.ts +20 -0
package/dist/cli/convoy/effort-scaling.d.ts.map +1 -0
package/dist/cli/convoy/effort-scaling.js +82 -0
package/dist/cli/convoy/effort-scaling.js.map +1 -0
package/dist/cli/convoy/effort-scaling.test.d.ts +2 -0
package/dist/cli/convoy/effort-scaling.test.d.ts.map +1 -0
package/dist/cli/convoy/effort-scaling.test.js +120 -0
package/dist/cli/convoy/effort-scaling.test.js.map +1 -0
package/dist/cli/convoy/engine.d.ts.map +1 -1
package/dist/cli/convoy/engine.js +298 -11
package/dist/cli/convoy/engine.js.map +1 -1
package/dist/cli/convoy/engine.test.js +155 -18
package/dist/cli/convoy/engine.test.js.map +1 -1
package/dist/cli/convoy/event-schemas.d.ts.map +1 -1
package/dist/cli/convoy/event-schemas.js +55 -0
package/dist/cli/convoy/event-schemas.js.map +1 -1
package/dist/cli/convoy/isolation.d.ts +27 -0
package/dist/cli/convoy/isolation.d.ts.map +1 -0
package/dist/cli/convoy/isolation.js +120 -0
package/dist/cli/convoy/isolation.js.map +1 -0
package/dist/cli/convoy/isolation.test.d.ts +2 -0
package/dist/cli/convoy/isolation.test.d.ts.map +1 -0
package/dist/cli/convoy/isolation.test.js +105 -0
package/dist/cli/convoy/isolation.test.js.map +1 -0
package/dist/cli/convoy/review-stages.d.ts +9 -0
package/dist/cli/convoy/review-stages.d.ts.map +1 -0
package/dist/cli/convoy/review-stages.js +134 -0
package/dist/cli/convoy/review-stages.js.map +1 -0
package/dist/cli/convoy/review-stages.test.d.ts +2 -0
package/dist/cli/convoy/review-stages.test.d.ts.map +1 -0
package/dist/cli/convoy/review-stages.test.js +197 -0
package/dist/cli/convoy/review-stages.test.js.map +1 -0
package/dist/cli/convoy/skill-refinement.d.ts +39 -0
package/dist/cli/convoy/skill-refinement.d.ts.map +1 -0
package/dist/cli/convoy/skill-refinement.js +239 -0
package/dist/cli/convoy/skill-refinement.js.map +1 -0
package/dist/cli/convoy/skill-refinement.test.d.ts +2 -0
package/dist/cli/convoy/skill-refinement.test.d.ts.map +1 -0
package/dist/cli/convoy/skill-refinement.test.js +230 -0
package/dist/cli/convoy/skill-refinement.test.js.map +1 -0
package/dist/cli/convoy/spec-builder.d.ts +1 -0
package/dist/cli/convoy/spec-builder.d.ts.map +1 -1
package/dist/cli/convoy/spec-builder.js +11 -0
package/dist/cli/convoy/spec-builder.js.map +1 -1
package/dist/cli/convoy/spec-builder.test.js +54 -0
package/dist/cli/convoy/spec-builder.test.js.map +1 -1
package/dist/cli/convoy/store.d.ts +3 -2
package/dist/cli/convoy/store.d.ts.map +1 -1
package/dist/cli/convoy/store.js +20 -2
package/dist/cli/convoy/store.js.map +1 -1
package/dist/cli/convoy/store.test.js +15 -15
package/dist/cli/convoy/store.test.js.map +1 -1
package/dist/cli/convoy/tdd-gate.d.ts +15 -0
package/dist/cli/convoy/tdd-gate.d.ts.map +1 -0
package/dist/cli/convoy/tdd-gate.js +119 -0
package/dist/cli/convoy/tdd-gate.js.map +1 -0
package/dist/cli/convoy/tdd-gate.test.d.ts +2 -0
package/dist/cli/convoy/tdd-gate.test.d.ts.map +1 -0
package/dist/cli/convoy/tdd-gate.test.js +227 -0
package/dist/cli/convoy/tdd-gate.test.js.map +1 -0
package/dist/cli/convoy/types.d.ts +91 -0
package/dist/cli/convoy/types.d.ts.map +1 -1
package/dist/cli/convoy/types.js +8 -0
package/dist/cli/convoy/types.js.map +1 -1
package/dist/cli/dashboard.d.ts.map +1 -1
package/dist/cli/dashboard.js +54 -0
package/dist/cli/dashboard.js.map +1 -1
package/dist/cli/insights.d.ts +3 -0
package/dist/cli/insights.d.ts.map +1 -0
package/dist/cli/insights.js +94 -0
package/dist/cli/insights.js.map +1 -0
package/dist/cli/lesson.d.ts.map +1 -1
package/dist/cli/lesson.js +7 -0
package/dist/cli/lesson.js.map +1 -1
package/dist/cli/log.d.ts.map +1 -1
package/dist/cli/log.js +7 -0
package/dist/cli/log.js.map +1 -1
package/dist/cli/package-config.d.ts +12 -0
package/dist/cli/package-config.d.ts.map +1 -0
package/dist/cli/package-config.js +37 -0
package/dist/cli/package-config.js.map +1 -0
package/dist/cli/package.d.ts +23 -0
package/dist/cli/package.d.ts.map +1 -0
package/dist/cli/package.js +285 -0
package/dist/cli/package.js.map +1 -0
package/dist/cli/package.test.d.ts +2 -0
package/dist/cli/package.test.d.ts.map +1 -0
package/dist/cli/package.test.js +236 -0
package/dist/cli/package.test.js.map +1 -0
package/dist/cli/pipeline.d.ts +6 -0
package/dist/cli/pipeline.d.ts.map +1 -1
package/dist/cli/pipeline.js +15 -2
package/dist/cli/pipeline.js.map +1 -1
package/dist/cli/run/schema.d.ts.map +1 -1
package/dist/cli/run/schema.js +32 -0
package/dist/cli/run/schema.js.map +1 -1
package/dist/cli/run/schema.test.js +51 -0
package/dist/cli/run/schema.test.js.map +1 -1
package/dist/cli/run.d.ts.map +1 -1
package/dist/cli/run.js +10 -1
package/dist/cli/run.js.map +1 -1
package/dist/cli/skills.d.ts +3 -0
package/dist/cli/skills.d.ts.map +1 -0
package/dist/cli/skills.js +107 -0
package/dist/cli/skills.js.map +1 -0
package/dist/cli/types.d.ts +4 -1
package/dist/cli/types.d.ts.map +1 -1
package/dist/cli/update.js +2 -2
package/package.json +3 -2
package/src/cli/agents.ts +20 -5
package/src/cli/artifacts-cli.ts +41 -0
package/src/cli/baselines.ts +12 -0
package/src/cli/convoy/artifacts.test.ts +201 -0
package/src/cli/convoy/artifacts.ts +186 -0
package/src/cli/convoy/compaction.test.ts +245 -0
package/src/cli/convoy/compaction.ts +164 -0
package/src/cli/convoy/contracts.test.ts +279 -0
package/src/cli/convoy/contracts.ts +280 -0
package/src/cli/convoy/dag-analysis.test.ts +349 -0
package/src/cli/convoy/dag-analysis.ts +371 -0
package/src/cli/convoy/effort-scaling.test.ts +140 -0
package/src/cli/convoy/effort-scaling.ts +90 -0
package/src/cli/convoy/engine.test.ts +175 -18
package/src/cli/convoy/engine.ts +315 -12
package/src/cli/convoy/event-schemas.ts +55 -0
package/src/cli/convoy/isolation.test.ts +137 -0
package/src/cli/convoy/isolation.ts +165 -0
package/src/cli/convoy/review-stages.test.ts +235 -0
package/src/cli/convoy/review-stages.ts +166 -0
package/src/cli/convoy/skill-refinement.test.ts +277 -0
package/src/cli/convoy/skill-refinement.ts +306 -0
package/src/cli/convoy/spec-builder.test.ts +61 -0
package/src/cli/convoy/spec-builder.ts +9 -0
package/src/cli/convoy/store.test.ts +15 -15
package/src/cli/convoy/store.ts +26 -4
package/src/cli/convoy/tdd-gate.test.ts +281 -0
package/src/cli/convoy/tdd-gate.ts +154 -0
package/src/cli/convoy/types.ts +51 -0
package/src/cli/dashboard.ts +55 -0
package/src/cli/insights.ts +99 -0
package/src/cli/lesson.ts +8 -0
package/src/cli/log.ts +8 -0
package/src/cli/package-config.ts +48 -0
package/src/cli/package.test.ts +276 -0
package/src/cli/package.ts +329 -0
package/src/cli/pipeline.ts +21 -2
package/src/cli/run/schema.test.ts +58 -0
package/src/cli/run/schema.ts +33 -0
package/src/cli/run.ts +14 -1
package/src/cli/skills.ts +121 -0
package/src/cli/types.ts +4 -1
package/src/cli/update.ts +2 -2
package/src/dashboard/dist/_astro/{index.Je1YjU_y.css → index.BRDFmNzR.css} +1 -1
package/src/dashboard/dist/index.html +163 -2
package/src/dashboard/node_modules/.vite/deps/_metadata.json +6 -6
package/src/dashboard/src/pages/index.astro +162 -1
package/src/dashboard/src/styles/dashboard.css +85 -0
package/src/orchestrator/agents/developer.agent.md +8 -0
package/src/orchestrator/agents/ui-ux-expert.agent.md +7 -0
package/src/orchestrator/prompts/assess-complexity.prompt.md +13 -0
package/src/orchestrator/prompts/brainstorm.prompt.md +18 -0
package/src/orchestrator/prompts/generate-convoy.prompt.md +61 -0
package/src/orchestrator/skills/decomposition/SKILL.md +35 -0
package/src/orchestrator/skills/frontend-design/SKILL.md +27 -1
package/src/orchestrator/skills/project-consistency/SKILL.md +350 -0

package/src/cli/convoy/engine.ts CHANGED Viewed

@@ -22,7 +22,7 @@ import { createEventEmitter, ndjsonPathForConvoy, recoverNdjson, type ConvoyEven
 import { createWorktreeManager, type WorktreeManager } from './worktree.js'
 import { createMergeQueue, MergeConflictError, type MergeQueue } from './merge.js'
 import { createHealthMonitor, detectDrift } from './health.js'
-import type { TaskRecord, ConvoyStatus, ConvoyTaskStatus, GuardConfig, CircuitBreakerConfig, TaskStep, Hook, TaskOutput, TaskInput } from './types.js'
+import type { TaskRecord, ConvoyStatus, ConvoyTaskStatus, GuardConfig, CircuitBreakerConfig, TaskStep, Hook, TaskOutput, TaskInput, TDDGateConfig } from './types.js'
 import { buildPhases, formatDuration } from '../run/executor.js'
 import { parseTimeout, parseYaml } from '../run/schema.js'
 import { getAdapter, detectAdapter } from '../run/adapters/index.js'
@@ -33,6 +33,13 @@ import { readLessons, captureLessons, consolidateLessons } from './lessons.js'
 import { updateExpertise, feedCircuitBreaker } from './expertise.js'
 import { buildKnowledgeGraph } from './knowledge.js'
 import { injectDiscoveredIssuesInstruction, checkDiscoveredIssues, consolidateIssues } from './issues.js'
+import { validateOutput, buildContractInstruction, buildContractRetryPrompt } from './contracts.js'
+import { runTwoStageReview } from './review-stages.js'
+import { buildIsolationPreamble, resolveDependencyResults, detectPartitionViolations } from './isolation.js'
+import { checkTDD, formatTDDFailure, DEFAULT_TDD_CONFIG } from './tdd-gate.js'
+import { runSkillRefinementCheck } from './skill-refinement.js'
+import { getArtifactDir, extractArtifactRefs } from './artifacts.js'
+import { shouldCompact, parseCompactionSummary, saveCompaction, canCompact, getMaxCompactions, generateCompactionPrompt, buildContinuationPrompt } from './compaction.js'
 const execFile = promisify(execFileCb)
@@ -823,6 +830,7 @@ function pollInjectFile(
       dispute_id: null,
       drift_score: null,
       drift_retried: 0,
+      compaction_count: 0,
       outputs: null,
       inputs: null,
       discovered_issues: null,
@@ -1260,6 +1268,36 @@ async function runConvoy(
     const steps: TaskStep[] | undefined = specTask?.steps
     const taskHooks: Hook[] = specTask?.hooks ?? []
+    // ── Context isolation preamble (Phase 41) ────────────────────────────
+    try {
+      const taskFiles = taskRecord.files ? JSON.parse(taskRecord.files) as string[] : []
+      const depIds = taskRecord.depends_on ? JSON.parse(taskRecord.depends_on) as string[] : []
+      const depResults = resolveDependencyResults(store, convoyId, depIds)
+      const preamble = buildIsolationPreamble(
+        { id: taskRecord.id, description: taskRecord.prompt.slice(0, 200), prompt: taskRecord.prompt, files: taskFiles, agent: taskRecord.agent },
+        depResults,
+      )
+      task.prompt = preamble + '\n\n' + task.prompt
+    } catch { /* non-critical — isolation preamble is best-effort */ }
+    // ── Artifact output instructions (Phase 43) ────────────────────────────
+    try {
+      const artifactDir = getArtifactDir(convoyId, taskRecord.id)
+      const artifactInstructions = [
+        '',
+        '## Artifact Output (for large results)',
+        'If your output includes large content (>100 lines of code, full reports, data dumps),',
+        'write it to an artifact file instead of including it inline:',
+        '',
+        '1. Write the content to: ' + artifactDir + '{filename}',
+        '2. In your response, reference it: `[ARTIFACT: {filename}] {1-line summary}`',
+        '3. Keep your inline response focused on the summary and key decisions.',
+        '',
+        'Small outputs (< 100 lines) can remain inline.',
+      ].join('\n')
+      task.prompt = task.prompt + '\n' + artifactInstructions
+    } catch { /* non-critical */ }
     // ── Intelligence: inject lessons (Phase 18.1) ─────────────────────────
     if (spec.defaults?.inject_lessons !== false) {
       try {
@@ -1292,6 +1330,12 @@ async function runConvoy(
       task.prompt = injectDiscoveredIssuesInstruction(task.prompt)
     }
+    // ── Output contract injection ─────────────────────────────────────────
+    const contractInstruction = buildContractInstruction(taskRecord.agent)
+    if (contractInstruction) {
+      task.prompt = task.prompt + '\n\n' + contractInstruction
+    }
     // ── pre_task hooks ────────────────────────────────────────────────────────
     if (taskHooks.length > 0) {
       const preResult = await runHooks(taskHooks, 'pre_task', {
@@ -1439,11 +1483,11 @@ async function runConvoy(
           try {
             // SECURITY: Gate/hook commands come from the .convoy.yml spec file, which is operator-controlled.
             // They are NOT user-supplied and are part of the trusted build configuration.
-            await execFile('sh', ['-c', command], { cwd: worktreePath ?? basePath })
+            await execFile('sh', ['-c', command], { cwd: worktreePath ?? basePath, maxBuffer: 10 * 1024 * 1024 })
           } catch (err) {
             const execErr = err as Error & { code?: unknown; stderr?: string; stdout?: string }
             const code = typeof execErr.code === 'number' ? execErr.code : 1
-            const output = execErr.stderr || execErr.stdout || execErr.message || ''
+            const output = [execErr.stderr, execErr.stdout].filter(Boolean).join('\n').trim() || execErr.message || ''
             gateFailure = { command, exitCode: code, output }
             break
           }
@@ -1683,6 +1727,100 @@ async function runConvoy(
             return
           }
         }
+        // ── Partition violation check (Phase 41) ────────────────────────────
+        if (changedFiles.length > 0) {
+          try {
+            const taskFiles = taskRecord.files ? JSON.parse(taskRecord.files) as string[] : []
+            if (taskFiles.length > 0) {
+              const violation = detectPartitionViolations(taskRecord.id, taskFiles, changedFiles)
+              if (violation) {
+                events.emit('partition_violation', {
+                  task_id: taskRecord.id,
+                  allowed: violation.allowedFiles,
+                  actual: violation.actualFiles,
+                  violations: violation.violations,
+                }, { convoy_id: convoyId, task_id: taskRecord.id })
+                process.stdout.write(`  ${c.yellow('⚠')} ${c.bold(`[${taskRecord.id}]`)} partition violation: ${violation.violations.join(', ')}\n`)
+              }
+            }
+          } catch { /* non-critical */ }
+        }
+        // ── TDD gate ──────────────────────────────────────────────────────────
+        if (builtInGates.tdd_check && changedFiles.length > 0) {
+          const tddConfig: TDDGateConfig = typeof builtInGates.tdd_check === 'object'
+            ? { ...DEFAULT_TDD_CONFIG, ...builtInGates.tdd_check }
+            : DEFAULT_TDD_CONFIG
+          const specTaskForTDD = (spec.tasks ?? []).find(t => t.id === taskRecord.id)
+          const tddResult = checkTDD(changedFiles, changedFiles, tddConfig, specTaskForTDD?.agent ?? taskRecord.agent)
+          if (tddResult.skipped) {
+            events.emit('tdd_check_skipped', {
+              task_id: taskRecord.id,
+              reason: tddResult.skip_reason,
+              agent: specTaskForTDD?.agent ?? taskRecord.agent,
+            }, { convoy_id: convoyId, task_id: taskRecord.id })
+          } else if (tddResult.passed) {
+            events.emit('tdd_check_passed', {
+              task_id: taskRecord.id,
+              new_source_files: tddResult.new_source_files.length,
+              existing_test_files: tddResult.existing_test_files.length,
+            }, { convoy_id: convoyId, task_id: taskRecord.id })
+          } else {
+            const failureMsg = formatTDDFailure(tddResult)
+            events.emit('tdd_check_failed', {
+              task_id: taskRecord.id,
+              missing_test_files: tddResult.missing_test_files,
+              new_source_files: tddResult.new_source_files.length,
+            }, { convoy_id: convoyId, task_id: taskRecord.id })
+            if (tddConfig.mode === 'block') {
+              await removeWorktree()
+              const freshRecord = store.getTask(taskRecord.id, convoyId)!
+              if (freshRecord.retries < freshRecord.max_retries && spec.on_failure !== 'stop') {
+                store.updateTaskStatus(taskRecord.id, convoyId, 'pending', {
+                  retries: freshRecord.retries + 1,
+                  worker_id: null,
+                  worktree: null,
+                  started_at: null,
+                  finished_at: null,
+                  prompt: `TDD gate failed.\n${failureMsg}\n\nCreate the missing test files and try again.\n\n${taskRecord.prompt}`,
+                })
+                store.updateWorkerStatus(workerId, 'failed', { finished_at: finishedAt })
+                process.stdout.write(
+                  `  ${c.yellow('⟳')} ${c.bold(`[${taskRecord.id}]`)} TDD gate failed, retry ${freshRecord.retries + 1}/${freshRecord.max_retries}\n`,
+                )
+              } else {
+                store.withTransaction(() => {
+                  store.updateTaskStatus(taskRecord.id, convoyId, 'gate-failed', {
+                    finished_at: finishedAt,
+                    output: `Built-in gate (tdd_check) failed:\n${failureMsg}`,
+                    exit_code: 1,
+                  })
+                  store.updateWorkerStatus(workerId, 'failed', { finished_at: finishedAt })
+                })
+                completedCount++
+                process.stdout.write(
+                  `  ${c.red('✗')} ${c.bold(`[${taskRecord.id}]`)} TDD gate failed ${elapsed} ${c.dim(`[${completedCount}/${totalTasks}]`)}\n`,
+                )
+                events.emit(
+                  'task_failed',
+                  { reason: 'gate-failed', gate: 'tdd_check', worker_id: workerId },
+                  { convoy_id: convoyId, task_id: taskRecord.id, worker_id: workerId },
+                )
+                handleExhaustion(freshRecord, 'tdd-check', failureMsg)
+              }
+              taskAdapterMap.delete(taskRecord.id)
+              return
+            } else {
+              // warn mode — log but continue
+              process.stdout.write(
+                `  ${c.yellow('⚠')} ${c.bold(`[${taskRecord.id}]`)} TDD gate warning: ${tddResult.missing_test_files.length} source file(s) without tests\n`,
+              )
+            }
+          }
+        }
       }
       // ── Drift detection ──────────────────────────────────────────────────
@@ -1804,7 +1942,19 @@ async function runConvoy(
             await reviewSemaphore.acquire()
             let reviewResult: ReviewResult
             try {
-              if (reviewRunner) {
+              if (reviewRunner && spec.defaults?.review_stages !== false) {
+                // Two-stage review: spec compliance first, then code quality
+                const twoStageResult = await runTwoStageReview(taskRecord, reviewRunner, reviewerModel)
+                for (const stage of twoStageResult.stages) {
+                  events.emit('review_stage_completed', { stage: stage.stage, verdict: stage.verdict, tokens: stage.tokens_used, task_id: taskRecord.id, model: reviewerModel }, { convoy_id: convoyId, task_id: taskRecord.id })
+                }
+                reviewResult = {
+                  verdict: twoStageResult.overall_verdict,
+                  feedback: twoStageResult.stages.flatMap(s => s.issues).join('\n'),
+                  tokens: twoStageResult.total_tokens,
+                  model: reviewerModel,
+                }
+              } else if (reviewRunner) {
                 reviewResult = await reviewRunner(taskRecord, 'fast', reviewerModel)
               } else {
                 reviewResult = { verdict: 'pass', feedback: '', tokens: 0, model: reviewerModel }
@@ -1865,11 +2015,32 @@ async function runConvoy(
           try {
             const noopRunner = (_t: TaskRecord, _l: ReviewLevel, m: string) => Promise.resolve({ verdict: 'pass' as const, feedback: '', tokens: 0, model: m })
             const runner = reviewRunner ?? noopRunner
-            panelResults = await Promise.all([
-              runner(taskRecord, 'panel', reviewerModel),
-              runner(taskRecord, 'panel', reviewerModel),
-              runner(taskRecord, 'panel', reviewerModel),
-            ])
+            const twoStageEnabled = spec.defaults?.review_stages !== false
+            if (twoStageEnabled && reviewRunner) {
+              // Each panel reviewer runs both stages; majority vote on overall_verdict
+              const twoStageResults = await Promise.all([
+                runTwoStageReview(taskRecord, runner, reviewerModel),
+                runTwoStageReview(taskRecord, runner, reviewerModel),
+                runTwoStageReview(taskRecord, runner, reviewerModel),
+              ])
+              for (const tsr of twoStageResults) {
+                for (const stage of tsr.stages) {
+                  events.emit('review_stage_completed', { stage: stage.stage, verdict: stage.verdict, tokens: stage.tokens_used, task_id: taskRecord.id, model: reviewerModel }, { convoy_id: convoyId, task_id: taskRecord.id })
+                }
+              }
+              panelResults = twoStageResults.map(tsr => ({
+                verdict: tsr.overall_verdict,
+                feedback: tsr.stages.flatMap(s => s.issues).join('\n'),
+                tokens: tsr.total_tokens,
+                model: reviewerModel,
+              }))
+            } else {
+              panelResults = await Promise.all([
+                runner(taskRecord, 'panel', reviewerModel),
+                runner(taskRecord, 'panel', reviewerModel),
+                runner(taskRecord, 'panel', reviewerModel),
+              ])
+            }
           } finally {
             reviewSemaphore.release()
           }
@@ -2107,6 +2278,7 @@ async function runConvoy(
                 dispute_id: null,
                 drift_score: null,
                 drift_retried: 0,
+                compaction_count: 0,
                 outputs: null,
                 inputs: null,
                 discovered_issues: null,
@@ -2154,6 +2326,72 @@ async function runConvoy(
         if (result.usage.total_tokens != null) usageExtra.total_tokens = result.usage.total_tokens
       }
+      // ── Context compaction check (Phase 44) ─────────────────────────────
+      const compactionConfig = spec.defaults?.compaction
+      if (compactionConfig?.enabled && usageExtra.total_tokens != null && taskRecord.model) {
+        if (shouldCompact(usageExtra.total_tokens, taskRecord.model, compactionConfig)) {
+          if (canCompact(taskRecord.compaction_count)) {
+            const newCount = taskRecord.compaction_count + 1
+            store.updateTaskCompaction(taskRecord.id, convoyId, newCount)
+            const summaryFromOutput = parseCompactionSummary(result.output, taskRecord.id, convoyId)
+            let summaryPath: string | undefined
+            if (summaryFromOutput) {
+              try {
+                summaryPath = saveCompaction(convoyId, taskRecord.id, summaryFromOutput, newCount)
+              } catch { /* non-critical */ }
+            }
+            const compactionTaskFiles = taskRecord.files ? JSON.parse(taskRecord.files) as string[] : []
+            const compactionDepIds = taskRecord.depends_on ? JSON.parse(taskRecord.depends_on) as string[] : []
+            const compactionDepResults = resolveDependencyResults(store, convoyId, compactionDepIds)
+            const compactionPreamble = buildIsolationPreamble(
+              { id: taskRecord.id, description: taskRecord.prompt.slice(0, 200), prompt: taskRecord.prompt, files: compactionTaskFiles, agent: taskRecord.agent },
+              compactionDepResults,
+            )
+            const continuationPrompt = summaryPath
+              ? buildContinuationPrompt(taskRecord.prompt, summaryPath, compactionPreamble)
+              : compactionPreamble + '\n\n' + generateCompactionPrompt(taskRecord.id) + '\n\n' + taskRecord.prompt
+            store.updateTaskStatus(taskRecord.id, convoyId, 'pending', {
+              worker_id: null,
+              worktree: null,
+              started_at: null,
+              finished_at: null,
+              prompt: continuationPrompt,
+            })
+            store.updateWorkerStatus(workerId, 'failed', { finished_at: finishedAt })
+            events.emit('context_compacted', {
+              task_id: taskRecord.id,
+              compaction_count: newCount,
+              summary_path: summaryPath ?? '',
+              model: taskRecord.model,
+              tokens_used: usageExtra.total_tokens,
+            }, { convoy_id: convoyId, task_id: taskRecord.id })
+            taskAdapterMap.delete(taskRecord.id)
+            return
+          } else {
+            // Max compactions exceeded — fail the task
+            const exhaustedAt = new Date().toISOString()
+            store.updateTaskStatus(taskRecord.id, convoyId, 'failed', {
+              finished_at: exhaustedAt,
+              output: `Context exhausted: reached maximum ${getMaxCompactions()} compactions`,
+              exit_code: 1,
+            })
+            store.updateWorkerStatus(workerId, 'failed', { finished_at: exhaustedAt })
+            events.emit('task_failed', {
+              reason: 'context_exhausted',
+              worker_id: workerId,
+            }, { convoy_id: convoyId, task_id: taskRecord.id })
+            taskAdapterMap.delete(taskRecord.id)
+            return
+          }
+        }
+      }
       // ── Capture outputs as artifacts ────────────────────────────────────────
       if (taskRecord.outputs) {
         const outputs: TaskOutput[] = JSON.parse(taskRecord.outputs)
@@ -2190,6 +2428,48 @@ async function runConvoy(
         }
       }
+      // ── Extract filesystem artifacts (Phase 43) ────────────────────────
+      try {
+        const fsArtifactRefs = extractArtifactRefs(taskRecord.id, convoyId, result.output)
+        if (fsArtifactRefs.length > 0) {
+          events.emit('artifacts_extracted', {
+            task_id: taskRecord.id,
+            count: fsArtifactRefs.length,
+            artifacts: fsArtifactRefs.map(r => ({ filename: r.filename, summary: r.summary })),
+          }, { convoy_id: convoyId, task_id: taskRecord.id })
+        }
+      } catch (err) {
+        process.stderr.write(`[artifacts] Warning: extraction failed for task ${taskRecord.id}: ${(err as Error).message}\n`)
+      }
+      // ── Output contract validation ────────────────────────────────────────
+      const contractResult = validateOutput(taskRecord.agent, result.output)
+      if (!contractResult.valid) {
+        const freshRecordForContract = store.getTask(taskRecord.id, convoyId)!
+        if (freshRecordForContract.retries < freshRecordForContract.max_retries) {
+          const retryPrefix = buildContractRetryPrompt(contractResult) + '\n\n'
+          store.updateTaskStatus(taskRecord.id, convoyId, 'pending', {
+            retries: freshRecordForContract.retries + 1,
+            worker_id: null,
+            worktree: null,
+            started_at: null,
+            finished_at: null,
+            prompt: retryPrefix + taskRecord.prompt,
+          })
+          store.updateWorkerStatus(workerId, 'failed', { finished_at: finishedAt })
+          process.stdout.write(`  ${c.yellow('⟳')} ${c.bold(`[${taskRecord.id}]`)} contract retry ${freshRecordForContract.retries + 1}/${freshRecordForContract.max_retries}\n`)
+          taskAdapterMap.delete(taskRecord.id)
+          return
+        }
+        events.emit('contract_violation', {
+          task_id: taskRecord.id,
+          agent: taskRecord.agent,
+          missing: contractResult.missing,
+          warnings: contractResult.warnings,
+        }, { convoy_id: convoyId, task_id: taskRecord.id })
+        process.stdout.write(`  ${c.yellow('⚠')} ${c.bold(`[${taskRecord.id}]`)} contract violation: missing ${contractResult.missing.join(', ')}\n`)
+      }
       // ── Intelligence: capture persistent agent identity (Phase 17.2) ─────
       const specTaskForCapture = (spec.tasks ?? []).find(t => t.id === taskRecord.id)
       if (specTaskForCapture?.persistent && result.output) {
@@ -2231,6 +2511,7 @@ async function runConvoy(
           output: result.output,
           exit_code: result.exitCode,
           ...usageExtra,
+          contract_result: JSON.stringify(contractResult),
         })
         store.updateWorkerStatus(workerId, 'done', { finished_at: finishedAt })
       })
@@ -2430,13 +2711,13 @@ async function runConvoy(
       try {
         // SECURITY: Gate/hook commands come from the .convoy.yml spec file, which is operator-controlled.
         // They are NOT user-supplied and are part of the trusted build configuration.
-        await execFile('sh', ['-c', command], { cwd: basePath })
+        await execFile('sh', ['-c', command], { cwd: basePath, maxBuffer: 10 * 1024 * 1024 })
         gateResults.push({ command, exitCode: 0, passed: true })
         process.stdout.write(`  ${c.green('✓')} ${c.dim(command)}\n`)
       } catch (err) {
         const execErr = err as Error & { code?: unknown; stderr?: string; stdout?: string }
         const code = typeof execErr.code === 'number' ? execErr.code : 1
-        const output = execErr.stderr || execErr.stdout || execErr.message || ''
+        const output = [execErr.stderr, execErr.stdout].filter(Boolean).join('\n').trim() || execErr.message || ''
         gateResults.push({ command, exitCode: code, passed: false, output })
         process.stdout.write(`  ${c.red('✗')} ${c.dim(command)}\n`)
       }
@@ -2454,7 +2735,16 @@ async function runConvoy(
       .map(g => `Command: ${g.command}\nExit code: ${g.exitCode}\nOutput:\n${g.output ?? '(no output)'}`)
       .join('\n\n---\n\n')
-    const fixPrompt = `The following validation gates failed after all convoy tasks completed. Fix the issues so these commands pass.\n\n${failureSummary}`
+    // Gather files touched by convoy tasks to give the fix agent context
+    const allTasks = store.getTasksByConvoy(convoyId)
+    const touchedFiles = allTasks
+      .filter(t => t.files)
+      .flatMap(t => { try { return JSON.parse(t.files as string) as string[] } catch { return [] } })
+    const filesContext = touchedFiles.length > 0
+      ? `\n\nFiles modified by the convoy tasks:\n${touchedFiles.map(f => `- ${f}`).join('\n')}\n`
+      : ''
+    const fixPrompt = `The following validation gates failed after all convoy tasks completed. Fix the issues so these commands pass.${filesContext}\n\n${failureSummary}`
     const fixTaskId = `gate-fix-${gateAttempt}`
     process.stdout.write(`\n  ${c.yellow('⟳')} ${c.bold(`[${fixTaskId}]`)} fixing gate failures (attempt ${gateAttempt}/${maxGateRetries})\n`)
@@ -2506,6 +2796,18 @@ async function runConvoy(
     try { consolidateIssues(basePath) } catch { /* non-critical */ }
   }
+  // ── Intelligence: skill refinement check ───────────────────────────────
+  try {
+    const proposals = runSkillRefinementCheck(convoyId, basePath)
+    for (const p of proposals) {
+      events.emit('skill_refinement_proposed', {
+        skill_name: p.skill,
+        proposal_path: p.proposalPath,
+      }, { convoy_id: convoyId })
+      process.stdout.write(`  ${c.yellow('◆')} Skill refinement proposed for "${p.skill}". Review at ${p.proposalPath}\n`)
+    }
+  } catch { /* non-critical */ }
   // ── Final status & summary ────────────────────────────────────────────────
   const allTasksFinal = store.getTasksByConvoy(convoyId)
@@ -2991,6 +3293,7 @@ export function createConvoyEngine(options: ConvoyEngineOptions): ConvoyEngine {
         dispute_id: null,
         drift_score: null,
         drift_retried: 0,
+        compaction_count: 0,
         outputs: null,
         inputs: null,
         discovered_issues: null,

package/src/cli/convoy/event-schemas.ts CHANGED Viewed

@@ -178,6 +178,61 @@ export const EVENT_DATA_SCHEMAS: Record<string, AnySchema> = {
     description: v.optional(v.string()),
     severity: v.optional(v.string()),
   }),
+  contract_violation: v.looseObject({
+    task_id: v.optional(v.string()),
+    agent: v.optional(v.string()),
+    missing: v.optional(v.array(v.string())),
+    warnings: v.optional(v.array(v.string())),
+  }),
+  partition_violation: v.looseObject({
+    task_id: v.optional(v.string()),
+    allowed: v.optional(v.array(v.string())),
+    actual: v.optional(v.array(v.string())),
+    violations: v.optional(v.array(v.string())),
+  }),
+  context_compacted: v.looseObject({
+    task_id: v.optional(v.string()),
+    compaction_count: v.optional(v.number()),
+    summary_path: v.optional(v.string()),
+    model: v.optional(v.string()),
+    tokens_used: v.optional(v.number()),
+  }),
+  skill_refinement_proposed: v.looseObject({
+    skill_name: v.optional(v.string()),
+    proposal_path: v.optional(v.string()),
+    failure_count: v.optional(v.number()),
+    confidence: v.optional(v.string()),
+  }),
+  tdd_check_passed: v.looseObject({
+    task_id: v.optional(v.string()),
+    new_source_files: v.optional(v.number()),
+    existing_test_files: v.optional(v.number()),
+  }),
+  tdd_check_failed: v.looseObject({
+    task_id: v.optional(v.string()),
+    missing_test_files: v.optional(v.array(v.string())),
+    new_source_files: v.optional(v.number()),
+  }),
+  tdd_check_skipped: v.looseObject({
+    task_id: v.optional(v.string()),
+    reason: v.optional(v.string()),
+    agent: v.optional(v.string()),
+  }),
+  review_stage_completed: v.looseObject({
+    stage: v.string(),
+    verdict: v.string(),
+    tokens: v.number(),
+    task_id: v.optional(v.string()),
+    model: v.optional(v.string()),
+  }),
+  artifacts_extracted: v.looseObject({
+    task_id: v.optional(v.string()),
+    count: v.optional(v.number()),
+    artifacts: v.optional(v.array(v.looseObject({
+      filename: v.string(),
+      summary: v.optional(v.string()),
+    }))),
+  }),
 }
 export function validateEventData(
   type: string,

package/src/cli/convoy/isolation.test.ts ADDED Viewed

@@ -0,0 +1,137 @@
+import { describe, it, expect } from 'vitest'
+import {
+  buildIsolationPreamble,
+  formatDependencyResults,
+  detectPartitionViolations,
+  type DependencyResult,
+} from './isolation.js'
+describe('buildIsolationPreamble', () => { // Suite: text produced by buildIsolationPreamble(task, dependencyResults).
+  const baseTask = { // Shared task fixture; the last test spreads it and overrides description/prompt.
+    id: 'task-1',
+    description: 'Implement the auth service',
+    prompt: 'Please implement the auth service with JWT tokens',
+    files: ['src/auth/', 'src/services/auth.ts'],
+    agent: 'developer',
+  }
+  it('with no dependencies contains task ID, agent, description, file list, and no-dependency text', () => { // Empty dependency list: id, agent, description and every files entry must appear.
+    const result = buildIsolationPreamble(baseTask, [])
+    expect(result).toContain('task-1')
+    expect(result).toContain('developer')
+    expect(result).toContain('Implement the auth service')
+    expect(result).toContain('src/auth/')
+    expect(result).toContain('src/services/auth.ts')
+    expect(result).toContain('No dependencies') // Pins the wording used when the dependency list is empty.
+    expect(result).toContain('first phase')
+  })
+  it('with 2 completed dependencies includes dependency summaries and files', () => { // Two 'done' dependencies: their ids, summaries and changed files must appear.
+    const depResults: DependencyResult[] = [
+      { taskId: 'task-0', agent: 'architect', status: 'done', summary: 'Designed the auth schema', filesChanged: ['schema.ts', 'types.ts'] },
+      { taskId: 'task-0b', agent: 'developer', status: 'done', summary: 'Set up project structure', filesChanged: ['package.json'] },
+    ]
+    const result = buildIsolationPreamble(baseTask, depResults)
+    expect(result).toContain('task-0') // NOTE(review): 'task-0' is also a prefix of 'task-0b', so this alone does not prove the first dependency is rendered.
+    expect(result).toContain('Designed the auth schema')
+    expect(result).toContain('schema.ts, types.ts') // Changed files are expected joined with ', '.
+    expect(result).toContain('task-0b')
+    expect(result).toContain('package.json')
+    expect(result).not.toContain('No dependencies') // The empty-list wording must not appear once dependencies exist.
+  })
+  it('with failed dependency includes failure status', () => { // A dependency with status 'failed' must surface both its status and its summary.
+    const depResults: DependencyResult[] = [
+      { taskId: 'task-x', agent: 'developer', status: 'failed', summary: 'Build failed due to type errors', filesChanged: [] },
+    ]
+    const result = buildIsolationPreamble(baseTask, depResults)
+    expect(result).toContain('failed') // NOTE(review): the summary text also contains 'failed', so this passes even if the status field is not rendered.
+    expect(result).toContain('Build failed due to type errors')
+  })
+  it('uses prompt slice when no description', () => { // Empty description: a bounded slice of the prompt is expected in its place.
+    const longPrompt = 'A'.repeat(300) // 300 identical characters, so only the length of the included run can be checked.
+    const task = { ...baseTask, description: '', prompt: longPrompt }
+    const result = buildIsolationPreamble(task, [])
+    expect(result).toContain('A'.repeat(200)) // At least 200 consecutive prompt characters are included...
+    expect(result).not.toContain('A'.repeat(201)) // ...and never 201, i.e. the slice is capped at 200 characters.
+  })
+})
+describe('formatDependencyResults', () => { // Suite: rendering of a DependencyResult[] by formatDependencyResults(deps).
+  it('compact format includes summary and filesChanged but not full output', () => { // NOTE(review): title mentions "not full output", but the fixture has no output field and nothing below asserts its absence.
+    const deps: DependencyResult[] = [
+      {
+        taskId: 'dep-1',
+        agent: 'developer',
+        status: 'done',
+        summary: 'Completed auth setup',
+        filesChanged: ['src/auth.ts', 'src/index.ts'],
+      },
+    ]
+    const result = formatDependencyResults(deps)
+    expect(result).toContain('dep-1')
+    expect(result).toContain('developer')
+    expect(result).toContain('done')
+    expect(result).toContain('Completed auth setup')
+    expect(result).toContain('src/auth.ts, src/index.ts') // Changed files are expected joined with ', '.
+  })
+  it('shows no-summary placeholder when summary is null', () => { // Null summary and empty filesChanged must render fixed placeholder text.
+    const deps: DependencyResult[] = [
+      { taskId: 'dep-2', agent: 'architect', status: 'done', summary: null, filesChanged: [] },
+    ]
+    const result = formatDependencyResults(deps)
+    expect(result).toContain('No summary available.') // Placeholder expected for summary: null.
+    expect(result).toContain('Files changed: none') // Placeholder expected for an empty filesChanged array.
+  })
+})
+describe('detectPartitionViolations', () => { // Suite: detectPartitionViolations(taskId, allowed entries, actual files) returns null or a violation record.
+  it('returns null when all files are within partition', () => { // Every actual file is under an allowed directory or equals an allowed file.
+    const result = detectPartitionViolations(
+      'task-1',
+      ['src/auth/', 'src/types.ts'],
+      ['src/auth/service.ts', 'src/auth/utils.ts', 'src/types.ts'],
+    )
+    expect(result).toBeNull()
+  })
+  it('detects files outside partition', () => { // One in-partition file and one outside: only the outside file is reported.
+    const result = detectPartitionViolations(
+      'task-1',
+      ['src/auth/'],
+      ['src/auth/service.ts', 'src/other/unrelated.ts'],
+    )
+    expect(result).not.toBeNull()
+    expect(result!.violations).toContain('src/other/unrelated.ts') // Non-null assertions are backed by the not.toBeNull() check above.
+    expect(result!.violations).not.toContain('src/auth/service.ts')
+    expect(result!.taskId).toBe('task-1') // The record echoes the task id passed in...
+    expect(result!.allowedFiles).toEqual(['src/auth/']) // ...and the allowed entries passed in.
+  })
+  it('handles directory paths - src/auth/ allows src/auth/service.ts', () => { // An entry ending in '/' is expected to cover direct and nested files beneath it.
+    const result = detectPartitionViolations(
+      'task-1',
+      ['src/auth/'],
+      ['src/auth/service.ts', 'src/auth/utils/helper.ts'],
+    )
+    expect(result).toBeNull()
+  })
+  it('handles exact file matches - src/index.ts allows only that exact file', () => { // A file entry must not authorize a sibling file in the same directory.
+    const result = detectPartitionViolations(
+      'task-1',
+      ['src/index.ts'],
+      ['src/index.ts', 'src/other.ts'],
+    )
+    expect(result).not.toBeNull()
+    expect(result!.violations).toContain('src/other.ts')
+    expect(result!.violations).not.toContain('src/index.ts')
+  })
+  it('returns null for empty actualFiles', () => { // No touched files means nothing can violate the partition.
+    const result = detectPartitionViolations('task-1', ['src/auth/'], [])
+    expect(result).toBeNull()
+  })
+})