npm - @open-multi-agent/core - Versions diffs - 1.6.0 → 1.7.0 - Mend

@open-multi-agent/core 1.6.0 → 1.7.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (26) hide show

package/README.md +11 -2
package/dist/agent/pool.d.ts +1 -1
package/dist/agent/pool.d.ts.map +1 -1
package/dist/agent/pool.js +23 -1
package/dist/agent/pool.js.map +1 -1
package/dist/agent/runner.d.ts.map +1 -1
package/dist/agent/runner.js +37 -7
package/dist/agent/runner.js.map +1 -1
package/dist/cli/oma.js +1 -1
package/dist/cli/oma.js.map +1 -1
package/dist/index.d.ts +1 -1
package/dist/index.d.ts.map +1 -1
package/dist/index.js.map +1 -1
package/dist/llm/minimax.d.ts +2 -2
package/dist/llm/minimax.js +2 -2
package/dist/orchestrator/orchestrator.d.ts +14 -4
package/dist/orchestrator/orchestrator.d.ts.map +1 -1
package/dist/orchestrator/orchestrator.js +469 -19
package/dist/orchestrator/orchestrator.js.map +1 -1
package/dist/task/task.d.ts +4 -1
package/dist/task/task.d.ts.map +1 -1
package/dist/task/task.js +3 -0
package/dist/task/task.js.map +1 -1
package/dist/types.d.ts +122 -4
package/dist/types.d.ts.map +1 -1
package/package.json +1 -1

package/dist/orchestrator/orchestrator.js CHANGED Viewed

@@ -50,6 +50,7 @@ import { defaultWorkspaceDir } from '../tool/built-in/path-safety.js';
 import { Team } from '../team/team.js';
 import { TaskQueue } from '../task/queue.js';
 import { createTask, validateTaskDependencies } from '../task/task.js';
+import { extractJSON, validateOutput } from '../agent/structured-output.js';
 import { Scheduler } from './scheduler.js';
 import { TokenBudgetExceededError } from '../errors.js';
 import { extractKeywords, keywordScore } from '../utils/keywords.js';
@@ -195,6 +196,23 @@ function buildAgent(config, toolRegistration) {
     });
     return new Agent(config, registry, executor);
 }
+/**
+ * Apply the orchestrator's {@link OrchestratorConfig.defaultToolPreset} as a
+ * fallback grant for an agent that declares neither `tools` nor `toolPreset`.
+ *
+ * Built-in tools are opt-in (default-deny): an agent with no grant resolves to
+ * zero built-in tools. This fills that gap when the orchestrator opts in to a
+ * default. Per-agent grants always win — the default never widens an agent that
+ * already declares `tools` or `toolPreset`.
+ *
+ * Only `undefined` counts as "not declared": the checks are `!== undefined`, so
+ * any other value of `tools` / `toolPreset` (including `null`) is treated as an
+ * explicit per-agent grant and the config is returned untouched.
+ *
+ * @param config - Agent config to inspect; it is never mutated.
+ * @param defaultToolPreset - Orchestrator-level fallback preset, or `undefined`
+ *   when the orchestrator has not opted in to one.
+ * @returns The same `config` object when no fallback applies, otherwise a
+ *   shallow copy of `config` with `toolPreset` set to `defaultToolPreset`.
+ */
+function applyDefaultToolPreset(config, defaultToolPreset) {
+    if (defaultToolPreset === undefined
+        || config.tools !== undefined
+        || config.toolPreset !== undefined) {
+        return config;
+    }
+    return { ...config, toolPreset: defaultToolPreset };
+}
 /** Promise-based delay. */
 function sleep(ms) {
     return new Promise((resolve) => setTimeout(resolve, ms));
@@ -314,6 +332,10 @@ function parseTaskSpecs(raw) {
                 maxRetries: typeof obj['maxRetries'] === 'number' ? obj['maxRetries'] : undefined,
                 retryDelayMs: typeof obj['retryDelayMs'] === 'number' ? obj['retryDelayMs'] : undefined,
                 retryBackoff: typeof obj['retryBackoff'] === 'number' ? obj['retryBackoff'] : undefined,
+                role: typeof obj['role'] === 'string' ? obj['role'] : undefined,
+                priority: obj['priority'] === 'low' || obj['priority'] === 'normal' || obj['priority'] === 'high' || obj['priority'] === 'critical'
+                    ? obj['priority']
+                    : undefined,
             });
         }
         return specs.length > 0 ? specs : null;
@@ -322,6 +344,47 @@ function parseTaskSpecs(raw) {
         return null;
     }
 }
+function routeMatches(policy, selection) { // Returns the `route` of the first rule in `policy.rules` whose `match` criteria all fit `selection`; undefined when there is no policy or no rule fits.
+    if (!policy) // No routing policy supplied: nothing can match.
+        return undefined;
+    const task = selection.task; // May be undefined; task fields below are read through `?.`.
+    for (const rule of policy.rules) { // Rules are tried in array order; the first full match wins.
+        const match = rule.match; // A criterion left `undefined` is a wildcard; every defined criterion must strictly equal the selection's value.
+        if (match.phase !== undefined && match.phase !== selection.phase)
+            continue;
+        if (match.agent !== undefined && match.agent !== selection.agent)
+            continue;
+        if (match.taskRole !== undefined && match.taskRole !== task?.role) // A missing task (or a task without `role`) never satisfies a rule that names a role.
+            continue;
+        if (match.taskPriority !== undefined && match.taskPriority !== task?.priority) // Same for priority.
+            continue;
+        if (match.leaf !== undefined && match.leaf !== selection.leaf) // Strict comparison: `leaf: false` does not match a selection whose `leaf` is undefined.
+            continue;
+        if (match.hasDependencies !== undefined && match.hasDependencies !== ((task?.dependsOn?.length ?? 0) > 0)) // A missing task or a missing/empty `dependsOn` counts as "no dependencies".
+            continue;
+        return rule.route;
+    }
+    return undefined;
+}
+function withModelRoute(config, route) { // Returns `config` itself when `route` is falsy; otherwise a shallow copy with the route's model and endpoint settings applied.
+    if (!route)
+        return config;
+    return {
+        ...config,
+        model: route.model, // Always overwritten by the route, unlike the fields below.
+        provider: route.provider ?? config.provider, // `??`: the route's value wins unless it is null/undefined, in which case the config's value is kept.
+        baseURL: route.baseURL ?? config.baseURL,
+        apiKey: route.apiKey ?? config.apiKey,
+        region: route.region ?? config.region,
+    };
+}
+function isLeafTask(task, tasks) { // True when no entry in `tasks` lists `task.id` in its `dependsOn`, i.e. nothing in the list depends on this task.
+    for (const candidate of tasks) { // Linear scan over `tasks` on every call.
+        if (candidate.dependsOn?.includes(task.id)) // `?.` tolerates tasks that have no `dependsOn`.
+            return false;
+    }
+    return true;
+}
 function buildRevealCoordinatorLines(revealContext, assignee) {
     return [
         '## Team context',
@@ -376,13 +439,19 @@ function buildTaskAgentTeamInfo(ctx, taskId, traceBase, delegationDepth, delegat
         }
         // Apply orchestrator-level defaults just like buildPool, then construct a
         // one-shot Agent for this delegation only.
-        const effective = {
+        const route = routeMatches(ctx.modelRouting, {
+            phase: 'delegated',
+            agent: targetAgent,
+            task: ctx.taskById.get(taskId),
+            leaf: ctx.taskLeafById.get(taskId),
+        });
+        const effective = withModelRoute(applyDefaultToolPreset({
             ...targetConfig,
             provider: targetConfig.provider ?? ctx.config.defaultProvider,
             baseURL: targetConfig.baseURL ?? ctx.config.defaultBaseURL,
             apiKey: targetConfig.apiKey ?? ctx.config.defaultApiKey,
             cwd: targetConfig.cwd === undefined ? ctx.config.defaultCwd : targetConfig.cwd,
-        };
+        }, ctx.config.defaultToolPreset), route);
         const tempAgent = buildAgent(effective, { includeDelegateTool: true });
         const nestedTeam = buildTaskAgentTeamInfo(ctx, taskId, traceBase, delegationDepth + 1, [...delegationChain, targetAgent]);
         const childOpts = {
@@ -461,6 +530,18 @@ async function executeQueue(queue, ctx) {
                 });
                 return;
             }
+            const agentConfig = team.getAgent(assignee);
+            if (!agentConfig) {
+                const msg = `Agent "${assignee}" not found in team for task "${task.title}".`;
+                queue.fail(task.id, msg);
+                config.onProgress?.({
+                    type: 'error',
+                    task: task.id,
+                    agent: assignee,
+                    data: msg,
+                });
+                return;
+            }
             const agent = pool.get(assignee);
             if (!agent) {
                 const msg = `Agent "${assignee}" not found in pool for task "${task.title}".`;
@@ -503,9 +584,22 @@ async function executeQueue(queue, ctx) {
                 ...traceBase,
                 team: buildTaskAgentTeamInfo(ctx, task.id, traceBase, 0, [assignee]),
             };
-            const taskStartMs = Date.now();
-            let retryCount = 0;
-            const result = await executeWithRetry(() => pool.run(assignee, prompt, runOptions, config.onAgentStream
+            const workerRoute = routeMatches(ctx.modelRouting, {
+                phase: 'worker',
+                agent: assignee,
+                task,
+                leaf: ctx.taskLeafById.get(task.id),
+            });
+            const routedAgent = workerRoute
+                ? buildAgent(withModelRoute(applyDefaultToolPreset({
+                    ...agentConfig,
+                    provider: agentConfig.provider ?? config.defaultProvider,
+                    baseURL: agentConfig.baseURL ?? config.defaultBaseURL,
+                    apiKey: agentConfig.apiKey ?? config.defaultApiKey,
+                    cwd: agentConfig.cwd === undefined ? config.defaultCwd : agentConfig.cwd,
+                }, config.defaultToolPreset), workerRoute), { includeDelegateTool: true })
+                : undefined;
+            const streamCallback = config.onAgentStream
                 ? (event) => {
                     if (config.onTrace) {
                         const streamMs = Date.now();
@@ -522,7 +616,12 @@ async function executeQueue(queue, ctx) {
                     }
                     config.onAgentStream(assignee, event);
                 }
-                : undefined), task, (retryData) => {
+                : undefined;
+            const taskStartMs = Date.now();
+            let retryCount = 0;
+            const result = await executeWithRetry(() => routedAgent
+                ? pool.runEphemeral(routedAgent, prompt, runOptions, streamCallback)
+                : pool.run(assignee, prompt, runOptions, streamCallback), task, (retryData) => {
                 retryCount++;
                 config.onProgress?.({
                     type: 'task_retry',
@@ -571,27 +670,37 @@ async function executeQueue(queue, ctx) {
                 });
             }
             if (result.success) {
-                // Persist result into shared memory so other agents can read it
                 const sharedMem = team.getSharedMemoryInstance();
+                // Opt-in consensus verification runs *before* the task is finalised so the
+                // verified outcome (accepted → revised, rejected → original) flows into the
+                // queue, shared memory, progress events, and agentResults as one consistent
+                // result. Judge usage is charged to the same parent budget as the rest of the run.
+                let effective = result;
+                if (task.verify && !ctx.budgetExceededTriggered) {
+                    effective = await runTaskVerify(task, assignee, result, sharedMem, ctx);
+                }
+                // Reflect the verified result in the per-task record the caller receives.
+                ctx.agentResults.set(`${assignee}:${task.id}`, effective);
+                // Persist result into shared memory so other agents can read it
                 if (sharedMem) {
-                    await sharedMem.write(assignee, `task:${task.id}:result`, result.output);
+                    await sharedMem.write(assignee, `task:${task.id}:result`, effective.output);
                     // Advance the turn counter so any TTL-tagged entries written during
                     // this task can be expired by subsequent reads.
                     sharedMem.advanceTurn();
                 }
-                const completedTask = queue.complete(task.id, result.output);
+                const completedTask = queue.complete(task.id, effective.output);
                 completedThisRound.push(completedTask);
                 config.onProgress?.({
                     type: 'task_complete',
                     task: task.id,
                     agent: assignee,
-                    data: result,
+                    data: effective,
                 });
                 config.onProgress?.({
                     type: 'agent_complete',
                     agent: assignee,
                     task: task.id,
-                    data: result,
+                    data: effective,
                 });
             }
             else {
@@ -691,6 +800,251 @@ async function buildTaskPrompt(task, team, queue, revealContext) {
     }
     return lines.join('\n');
 }
+/**
+ * Skeptic framing applied to every judge (refute mode and lens-mode base).
+ *
+ * buildJudgePrompt uses this text as the judge instruction whenever the caller
+ * supplies no custom `judgePrompt`; in `lens` mode a per-judge focus sentence
+ * is appended to it.
+ */
+const DEFAULT_VERIFIER_INSTRUCTION = 'You are a rigorous skeptic reviewing a proposed answer to the question shown below. ' +
+    'Judge the answer against what that question actually asks: hunt for errors, unsupported ' +
+    'claims, gaps, and faulty reasoning, then decide whether it withstands scrutiny.';
+/**
+ * Per-judge review angles used in `lens` mode (assigned round-robin by index).
+ *
+ * buildJudgePrompt picks the entry at `judgeIndex % CONSENSUS_LENSES.length`,
+ * so when there are more judges than lenses the list wraps around and angles
+ * repeat.
+ */
+const CONSENSUS_LENSES = [
+    'factual correctness and logical soundness',
+    'completeness and coverage of the question',
+    'edge cases, failure modes, and counterexamples',
+    'clarity, precision, and freedom from ambiguity',
+    'hidden assumptions and unstated premises',
+    'evidence, citations, and verifiability',
+];
+/**
+ * Verdict contract appended to every judge prompt.
+ *
+ * The `accept` and `critique` keys named in this text are the keys that
+ * parseJudgeVerdict reads from the judge's JSON reply, so the wording here and
+ * that parser must stay in agreement.
+ */
+const VERDICT_INSTRUCTION = 'Respond ONLY with a JSON object {"accept": <true|false>, "critique": "<concise reason>"}. ' +
+    'Set "accept" to true only if the answer withstands scrutiny; otherwise set it false ' +
+    'and explain the problem in "critique".';
+/**
+ * Apply orchestrator defaults to a consensus agent config, mirroring buildPool.
+ *
+ * `provider`, `baseURL` and `apiKey` fall back to the matching `defaults.*`
+ * value when the config's own value is null or undefined (`??`). `cwd` falls
+ * back only when it is exactly `undefined`, so any other value (including
+ * `null`) is kept as the caller wrote it.
+ *
+ * Unlike buildPool, this helper does not apply a default tool preset.
+ *
+ * @param config - Proposer or judge agent config; it is not mutated.
+ * @param defaults - Object carrying `defaultProvider`, `defaultBaseURL`,
+ *   `defaultApiKey` and `defaultCwd`.
+ * @returns A new shallow copy of `config` with the fallbacks filled in.
+ */
+function applyConsensusDefaults(config, defaults) {
+    return {
+        ...config,
+        provider: config.provider ?? defaults.defaultProvider,
+        baseURL: config.baseURL ?? defaults.defaultBaseURL,
+        apiKey: config.apiKey ?? defaults.defaultApiKey,
+        cwd: config.cwd === undefined ? defaults.defaultCwd : config.cwd,
+    };
+}
+/**
+ * Build the user prompt sent to a single judge, always including the original question.
+ *
+ * The instruction at the top of the prompt is chosen in this order:
+ *  1. `p.judgePrompt`, when defined — a function is called with `p.judge` and
+ *     its return value is used; any other value is used as-is.
+ *  2. `p.mode === 'lens'` — the default skeptic instruction plus one review
+ *     angle from CONSENSUS_LENSES, picked by `p.judgeIndex` modulo the number
+ *     of lenses.
+ *  3. Otherwise — the default skeptic instruction alone.
+ *
+ * A custom `judgePrompt` replaces only the instruction: the question, the
+ * proposed answer and the JSON verdict contract are appended in every case.
+ *
+ * @param p - Prompt inputs: `judge` (handed to a `judgePrompt` function),
+ *   `answer` (the proposed answer), `prompt` (the original question), `mode`,
+ *   `judgeIndex` and an optional `judgePrompt`.
+ * @returns One newline-joined string: instruction, `## Question`,
+ *   `## Proposed answer`, then `## Your verdict` with the verdict contract.
+ */
+function buildJudgePrompt(p) {
+    let instruction;
+    if (p.judgePrompt !== undefined) {
+        instruction = typeof p.judgePrompt === 'function' ? p.judgePrompt(p.judge) : p.judgePrompt;
+    }
+    else if (p.mode === 'lens') {
+        const lens = CONSENSUS_LENSES[p.judgeIndex % CONSENSUS_LENSES.length]; // Round-robin: wraps when judgeIndex exceeds the lens count.
+        instruction = `${DEFAULT_VERIFIER_INSTRUCTION}\nFocus specifically on: ${lens}. ` +
+            'If that angle is irrelevant to this question, accept the answer rather than inventing objections.';
+    }
+    else {
+        instruction = DEFAULT_VERIFIER_INSTRUCTION;
+    }
+    return [
+        instruction,
+        '',
+        '## Question',
+        p.prompt,
+        '',
+        '## Proposed answer',
+        p.answer,
+        '',
+        '## Your verdict',
+        VERDICT_INSTRUCTION,
+    ].join('\n');
+}
+/**
+ * Build the proposer prompt for a revision round, feeding back the prior answer and the dissent.
+ *
+ * @param prompt - The original question, placed first and unchanged.
+ * @param answer - The answer the judges just reviewed.
+ * @param dissent - Array of critique strings; each becomes one `- ` bullet.
+ *   An empty array yields an empty critique section (no bullets).
+ * @returns One newline-joined string ending with the instruction to reply
+ *   with the improved answer only.
+ */
+function buildRevisePrompt(prompt, answer, dissent) {
+    return [
+        prompt,
+        '',
+        '## Your previous answer',
+        answer,
+        '',
+        '## Reviewer critiques to address',
+        ...dissent.map((d) => `- ${d}`),
+        '',
+        'Revise the previous answer to address every critique above. Respond with the improved answer only.',
+    ].join('\n');
+}
+/**
+ * Parse a judge's raw output into an accept/critique decision.
+ *
+ * The parser fails closed — anything it cannot read as an explicit acceptance
+ * becomes a rejection with an explanatory critique:
+ *  - `extractJSON` throwing → rejected, "Judge output was not valid JSON."
+ *  - `validateOutput` throwing (only run when `verdictSchema` is given) →
+ *    rejected, with the thrown message embedded in the critique.
+ *  - `accept` missing or not a boolean (e.g. the string "true") → rejected.
+ *
+ * @param output - Raw text returned by the judge agent.
+ * @param verdictSchema - Optional schema passed to `validateOutput`; skipped
+ *   when falsy.
+ * @returns `{ accept, critique }`. `critique` is the judge's non-empty string
+ *   when present; otherwise `''` for an acceptance and
+ *   `'No critique provided.'` for a rejection.
+ */
+function parseJudgeVerdict(output, verdictSchema) {
+    let parsed;
+    try {
+        parsed = extractJSON(output);
+    }
+    catch {
+        return { accept: false, critique: 'Judge output was not valid JSON.' };
+    }
+    if (verdictSchema) {
+        try {
+            validateOutput(verdictSchema, parsed);
+        }
+        catch (err) {
+            return { accept: false, critique: `Verdict failed schema validation: ${err instanceof Error ? err.message : String(err)}` };
+        }
+    }
+    const obj = (parsed && typeof parsed === 'object' ? parsed : {}); // Non-object JSON (number, string, null) is treated as an empty verdict, which rejects below.
+    const accept = typeof obj['accept'] === 'boolean' ? obj['accept'] : false;
+    const critique = typeof obj['critique'] === 'string' && obj['critique']
+        ? obj['critique']
+        : accept ? '' : 'No critique provided.';
+    return { accept, critique };
+}
+/**
+ * Run the judge/refutation loop over a proposed answer: judges run sequentially
+ * (so quorum and budget can stop the rest), dissent is recorded to shared memory
+ * and trace, and `onDissent` decides whether to revise, reject, or keep.
+ *
+ * Per round, each judge is prompted in list order and its usage is added to the
+ * running total. A round ends early when `quorum` judges accept or when the
+ * budget is crossed. If the round misses quorum and `onDissent === 'revise'`,
+ * another round remains, and a `reviseProposer` was supplied, the proposer is
+ * asked to revise using that round's critiques and the loop continues;
+ * otherwise the loop stops.
+ *
+ * Final verdict: `'accepted'` when quorum was reached, or when
+ * `onDissent === 'keep'` and the budget was not hit; `'rejected'` otherwise.
+ *
+ * @param params - Loop inputs read here: `team`, `prompt`, `judges`, `mode`,
+ *   `quorum`, `maxRounds`, `verdictSchema`, `onDissent`, `judgePrompt`,
+ *   `budget`, `budgetBaseTokens`, `reviseProposer`, `defaults`, `onTrace`,
+ *   `runId`, `initialAnswer`, `initialUsage` and an optional `pool`.
+ * @returns `{ answer, verdict, dissent, rounds, tokenUsage }`, where
+ *   `dissent` accumulates the labelled critiques from every round, `rounds`
+ *   is the number of the last round started (0 if the budget was already
+ *   exceeded on entry), and `tokenUsage` is `initialUsage` plus all judge and
+ *   revision usage.
+ */
+async function runConsensusCore(params) {
+    const { team, prompt, judges, mode, quorum, maxRounds, verdictSchema, onDissent, judgePrompt, budget, budgetBaseTokens, reviseProposer, defaults, onTrace, runId, } = params;
+    const pool = params.pool ?? new AgentPool(Math.max(1, defaults.maxConcurrency)); // Reuse the caller's pool when given; otherwise create one for this run.
+    const sharedMem = team.getSharedMemoryInstance();
+    let answer = params.initialAnswer;
+    let usage = params.initialUsage;
+    const dissent = [];
+    let rounds = 0;
+    let accepted = false;
+    const overBudget = () => budget !== undefined && budgetBaseTokens + usage.input_tokens + usage.output_tokens > budget; // Strictly greater than: landing exactly on the budget is still within it; no budget means never over.
+    const runEphemeral = (config, text) => pool.runEphemeral(buildAgent(applyConsensusDefaults(config, defaults)), text); // Judges and the revising proposer run as freshly built agents with consensus defaults applied; no run options are passed.
+    // Proposer usage was already accumulated by the caller; bail before judging if it blew the budget.
+    if (overBudget()) {
+        return { answer, verdict: 'rejected', dissent, rounds, tokenUsage: usage };
+    }
+    let budgetHit = false;
+    for (let round = 1; round <= maxRounds; round++) {
+        rounds = round;
+        let acceptCount = 0;
+        const roundDissent = []; // Only this round's critiques are fed to the revision prompt; `dissent` keeps the full history.
+        for (let j = 0; j < judges.length; j++) {
+            const judge = judges[j];
+            const judgeText = buildJudgePrompt({ judge: judge.name, answer, prompt, mode, judgeIndex: j, judgePrompt });
+            const r = await runEphemeral(judge, judgeText);
+            usage = addUsage(usage, r.tokenUsage);
+            if (overBudget()) { // The judge call that crosses the budget is still charged, but its verdict is discarded.
+                budgetHit = true;
+                break;
+            }
+            const verdict = parseJudgeVerdict(r.output, verdictSchema);
+            // Trace every verdict (accept or dissent); shared memory records dissent only.
+            if (onTrace) {
+                const now = Date.now(); // Taken after the judge call returned, so the event is a point-in-time marker (durationMs is 0), not the judge's run time.
+                emitTrace(onTrace, {
+                    type: 'consensus',
+                    runId: runId ?? '',
+                    agent: judge.name,
+                    round,
+                    accepted: verdict.accept,
+                    ...(verdict.accept ? {} : { dissent: verdict.critique }),
+                    startMs: now,
+                    endMs: now,
+                    durationMs: 0,
+                });
+            }
+            if (verdict.accept) {
+                acceptCount++;
+                if (acceptCount >= quorum) {
+                    accepted = true;
+                    break; // Quorum reached: remaining judges in this round are not consulted.
+                }
+            }
+            else {
+                const labelled = `${judge.name}: ${verdict.critique}`;
+                roundDissent.push(labelled);
+                dissent.push(labelled);
+                if (sharedMem) {
+                    await sharedMem.write(judge.name, `consensus:round:${round}:dissent`, verdict.critique); // NOTE(review): the key is per round, not per judge — whether several dissenting judges overwrite each other depends on how shared memory scopes keys by writer; confirm.
+                }
+            }
+        }
+        if (budgetHit || accepted)
+            break;
+        // Round missed quorum. Revise (if rounds remain) or stop.
+        if (onDissent === 'revise' && round < maxRounds && reviseProposer) {
+            const r = await runEphemeral(reviseProposer, buildRevisePrompt(prompt, answer, roundDissent));
+            usage = addUsage(usage, r.tokenUsage);
+            if (r.success && r.output) // A failed or empty revision keeps the previous answer, which is then judged again next round.
+                answer = r.output;
+            if (overBudget()) {
+                budgetHit = true;
+                break;
+            }
+            continue;
+        }
+        break; // No revision requested or possible: stop after this round.
+    }
+    const verdict = accepted || (!budgetHit && onDissent === 'keep') ? 'accepted' : 'rejected'; // 'keep' accepts the answer despite dissent, but never after a budget overrun.
+    return { answer, verdict, dissent, rounds, tokenUsage: usage };
+}
+/**
+ * Run the per-task `verify` hook before a task is finalised: feed the task
+ * result into the consensus loop, fold judge usage into the run's cumulative
+ * budget, surface the verdict, and return the effective result — the accepted
+ * revision when judges revise it, otherwise the original. The caller uses this
+ * to finalise the task so the queue, shared memory, events, and agentResults
+ * all agree on the verified outcome.
+ *
+ * Side effects: adds the verification usage to `ctx.cumulativeUsage`; writes
+ * `task:<id>:verdict` to shared memory when `sharedMem` is truthy; and, the
+ * first time the cumulative total exceeds `ctx.maxTokenBudget`, sets
+ * `ctx.budgetExceededTriggered` / `ctx.budgetExceededReason` and emits a
+ * `budget_exceeded` progress event.
+ *
+ * NOTE(review): an empty `verify.judges` array is not rejected here (unlike
+ * `runConsensus`). Quorum then clamps to 0, no judge runs, and with the default
+ * `onDissent` of 'revise' the proposer can be asked to revise against an empty
+ * critique list — confirm whether callers validate `judges` upstream.
+ *
+ * @param task - The task being verified; `task.verify` supplies the options.
+ * @param assignee - Name of the agent that produced `result`.
+ * @param result - The task's successful run result; not mutated.
+ * @param sharedMem - Shared memory instance, or a falsy value when absent.
+ * @param ctx - Run context providing `team`, `config`, `cumulativeUsage`,
+ *   `maxTokenBudget`, `runId` and the budget flags.
+ * @returns A copy of `result` whose `output` is the accepted revision (or the
+ *   original output) and whose `tokenUsage` includes the verification usage.
+ */
+async function runTaskVerify(task, assignee, result, sharedMem, ctx) {
+    const verify = task.verify;
+    const { team, config } = ctx;
+    const assigneeConfig = team.getAgents().find((a) => a.name === assignee); // May be undefined; the consensus loop then skips revision because `reviseProposer` is falsy.
+    const consensus = await runConsensusCore({
+        team,
+        prompt: task.description,
+        initialAnswer: result.output,
+        initialUsage: ZERO_USAGE, // Start from zero so `consensus.tokenUsage` holds verification usage only.
+        budgetBaseTokens: ctx.cumulativeUsage.input_tokens + ctx.cumulativeUsage.output_tokens, // Tokens already spent by the run count toward the budget check inside the loop.
+        judges: verify.judges,
+        mode: verify.mode ?? 'refute',
+        quorum: Math.min(verify.judges.length, Math.max(1, verify.quorum ?? Math.ceil(verify.judges.length / 2))), // Default is a simple majority; the value is clamped to at least 1 and at most the number of judges.
+        maxRounds: Math.max(1, verify.maxRounds ?? 2), // At least one round; two by default.
+        verdictSchema: verify.verdictSchema,
+        onDissent: verify.onDissent ?? 'revise',
+        judgePrompt: verify.judgePrompt,
+        budget: ctx.maxTokenBudget,
+        reviseProposer: assigneeConfig,
+        defaults: {
+            defaultProvider: config.defaultProvider,
+            defaultBaseURL: config.defaultBaseURL,
+            defaultApiKey: config.defaultApiKey,
+            defaultCwd: config.defaultCwd,
+            maxConcurrency: config.maxConcurrency ?? DEFAULT_MAX_CONCURRENCY,
+        },
+        onTrace: config.onTrace,
+        ...(ctx.runId ? { runId: ctx.runId } : {}),
+    });
+    ctx.cumulativeUsage = addUsage(ctx.cumulativeUsage, consensus.tokenUsage);
+    // Surface the verdict as a task-level outcome so downstream agents and the
+    // final synthesis can see whether the result survived scrutiny.
+    if (sharedMem) {
+        const summary = consensus.verdict === 'accepted'
+            ? 'accepted'
+            : `rejected${consensus.dissent.length ? `: ${consensus.dissent.join('; ')}` : ''}`;
+        await sharedMem.write(assignee, `task:${task.id}:verdict`, summary);
+    }
+    const total = ctx.cumulativeUsage.input_tokens + ctx.cumulativeUsage.output_tokens;
+    if (!ctx.budgetExceededTriggered && ctx.maxTokenBudget !== undefined && total > ctx.maxTokenBudget) { // The flag check makes the budget_exceeded event fire at most once per run.
+        ctx.budgetExceededTriggered = true;
+        const err = new TokenBudgetExceededError('orchestrator', total, ctx.maxTokenBudget);
+        ctx.budgetExceededReason = err.message;
+        config.onProgress?.({
+            type: 'budget_exceeded',
+            agent: assignee,
+            task: task.id,
+            data: err,
+        });
+    }
+    // Only an *accepted* revision supersedes the task result; a rejected revision is
+    // recorded as dissent but the caller finalises with the original output. Judge
+    // usage rolls into the per-task usage (mirrors how delegation usage rolls in).
+    const useRevision = consensus.verdict === 'accepted' && consensus.answer && consensus.answer !== result.output; // Truthy only for a non-empty accepted answer that differs from the original.
+    return {
+        ...result,
+        output: useRevision ? consensus.answer : result.output,
+        tokenUsage: addUsage(result.tokenUsage, consensus.tokenUsage),
+    };
+}
 // ---------------------------------------------------------------------------
 // OpenMultiAgent
 // ---------------------------------------------------------------------------
@@ -726,6 +1080,7 @@ export class OpenMultiAgent {
             // disable the filesystem sandbox; a string sets a custom sandbox root.
             defaultCwd: config.defaultCwd === undefined ? defaultWorkspaceDir() : config.defaultCwd,
             maxTokenBudget: config.maxTokenBudget,
+            defaultToolPreset: config.defaultToolPreset,
             onApproval: config.onApproval,
             onPlanReady: config.onPlanReady,
             onAgentStream: config.onAgentStream,
@@ -770,14 +1125,14 @@ export class OpenMultiAgent {
      */
     async runAgent(config, prompt, options) {
         const effectiveBudget = resolveTokenBudget(config.maxTokenBudget, this.config.maxTokenBudget);
-        const effective = {
+        const effective = applyDefaultToolPreset({
             ...config,
             provider: config.provider ?? this.config.defaultProvider,
             baseURL: config.baseURL ?? this.config.defaultBaseURL,
             apiKey: config.apiKey ?? this.config.defaultApiKey,
             cwd: config.cwd === undefined ? this.config.defaultCwd : config.cwd,
             maxTokenBudget: effectiveBudget,
-        };
+        }, this.config.defaultToolPreset);
         const agent = buildAgent(effective);
         this.config.onProgress?.({
             type: 'agent_start',
@@ -858,14 +1213,14 @@ export class OpenMultiAgent {
             // to avoid duplicate progress events and double completedTaskCount.
             // Events are emitted here; counting is handled by buildTeamRunResult().
             const effectiveBudget = resolveTokenBudget(bestAgent.maxTokenBudget, this.config.maxTokenBudget);
-            const effective = {
+            const effective = withModelRoute(applyDefaultToolPreset({
                 ...bestAgent,
                 provider: bestAgent.provider ?? this.config.defaultProvider,
                 baseURL: bestAgent.baseURL ?? this.config.defaultBaseURL,
                 apiKey: bestAgent.apiKey ?? this.config.defaultApiKey,
                 cwd: bestAgent.cwd === undefined ? this.config.defaultCwd : bestAgent.cwd,
                 maxTokenBudget: effectiveBudget,
-            };
+            }, this.config.defaultToolPreset), routeMatches(options?.modelRouting, { phase: 'short-circuit', agent: bestAgent.name }));
             const agent = buildAgent(effective);
             this.config.onProgress?.({
                 type: 'agent_start',
@@ -915,7 +1270,7 @@ export class OpenMultiAgent {
         // ------------------------------------------------------------------
         // Step 1: Coordinator decomposes goal into tasks
         // ------------------------------------------------------------------
-        const coordinatorConfig = {
+        const coordinatorBaseConfig = {
             name: 'coordinator',
             model: coordinatorOverrides?.model ?? this.config.defaultModel,
             ...(coordinatorOverrides?.adapter !== undefined ? { adapter: coordinatorOverrides.adapter } : {}),
@@ -942,6 +1297,7 @@ export class OpenMultiAgent {
             loopDetection: coordinatorOverrides?.loopDetection,
             timeoutMs: coordinatorOverrides?.timeoutMs,
         };
+        const coordinatorConfig = withModelRoute(coordinatorBaseConfig, routeMatches(options?.modelRouting, { phase: 'coordinator', agent: 'coordinator' }));
         const decompositionPrompt = this.buildDecompositionPrompt(goal, agentConfigs);
         const coordinatorAgent = buildAgent(coordinatorConfig);
         const runId = this.config.onTrace ? generateRunId() : undefined;
@@ -1020,6 +1376,9 @@ export class OpenMultiAgent {
                     },
                 }
                 : {}),
+            modelRouting: options?.modelRouting,
+            taskById: new Map(queue.list().map((task) => [task.id, task])),
+            taskLeafById: new Map(queue.list().map((task) => [task.id, isLeafTask(task, queue.list())])),
         };
         const planTasks = queue.list();
         const planReadyStartMs = Date.now();
@@ -1098,10 +1457,11 @@ export class OpenMultiAgent {
             return this.buildTeamRunResult(agentResults, goal, taskRecords);
         }
         const synthesisPrompt = await this.buildSynthesisPrompt(goal, queue.list(), team);
+        const synthesisAgent = buildAgent(withModelRoute(coordinatorBaseConfig, routeMatches(options?.modelRouting, { phase: 'synthesis', agent: 'coordinator' })));
         const synthTraceOptions = this.config.onTrace
             ? { onTrace: this.config.onTrace, runId: runId ?? '', traceAgent: 'coordinator' }
             : undefined;
-        const synthesisResult = await coordinatorAgent.run(synthesisPrompt, synthTraceOptions);
+        const synthesisResult = await synthesisAgent.run(synthesisPrompt, synthTraceOptions);
         agentResults.set('coordinator', synthesisResult);
         cumulativeUsage = addUsage(cumulativeUsage, synthesisResult.tokenUsage);
         if (maxTokenBudget !== undefined
@@ -1200,10 +1560,94 @@ export class OpenMultiAgent {
             maxRetries: t.maxRetries,
             retryDelayMs: t.retryDelayMs,
             retryBackoff: t.retryBackoff,
+            role: t.role,
+            priority: t.priority,
+            verify: t.verify,
         })), agentConfigs, queue);
         return this.executeExplicitTaskQueue(team, queue, options);
     }
     // -------------------------------------------------------------------------
+    // Consensus
+    // -------------------------------------------------------------------------
+    /**
+     * Run a proposer→judge consensus over a single prompt.
+     *
+     * The proposer emits an answer; judges try to refute it over up to
+     * `maxRounds`, exiting early once `quorum` accept. Proposer and judge token
+     * usage all count against the orchestrator's `maxTokenBudget` — crossing it
+     * stops issuing further judge calls, exactly like delegation and `runTasks`.
+     *
+     * Budget accounting here starts from zero for each call
+     * (`budgetBaseTokens: 0`), so only this call's own proposer, judge and
+     * revision usage is compared against the budget.
+     *
+     * With several proposers, every non-empty successful output is kept and the
+     * candidates are joined with a `---` separator into one answer for the
+     * judges; revisions are always requested from the first proposer.
+     *
+     * @param team - Team whose shared memory (if any) receives judge dissent.
+     * @param prompt - The question put to the proposer(s) and shown to judges.
+     * @param options - `proposer` (one config or an array), `judges`, and the
+     *   optional `mode` (default 'refute'), `maxRounds` (default 2, minimum 1),
+     *   `quorum` (default majority, clamped to 1..judges.length), `onDissent`
+     *   (default 'revise'), `verdictSchema` and `judgePrompt`.
+     * @returns `{ answer, verdict, dissent, rounds, tokenUsage }`. The verdict
+     *   is 'rejected' with `rounds: 0` when the proposer stage exceeds the
+     *   budget or yields no usable answer.
+     * @throws Error when `options.proposer` is an empty array or
+     *   `options.judges` is empty.
+     */
+    async runConsensus(team, prompt, options) {
+        const proposers = Array.isArray(options.proposer) ? options.proposer : [options.proposer];
+        if (proposers.length === 0) {
+            throw new Error('runConsensus: at least one proposer is required.');
+        }
+        if (options.judges.length === 0) {
+            throw new Error('runConsensus: at least one judge is required.');
+        }
+        const mode = options.mode ?? 'refute';
+        const maxRounds = Math.max(1, options.maxRounds ?? 2);
+        const quorum = Math.min(options.judges.length, Math.max(1, options.quorum ?? Math.ceil(options.judges.length / 2)));
+        const onDissent = options.onDissent ?? 'revise';
+        const budget = this.config.maxTokenBudget;
+        const defaults = {
+            defaultProvider: this.config.defaultProvider,
+            defaultBaseURL: this.config.defaultBaseURL,
+            defaultApiKey: this.config.defaultApiKey,
+            defaultCwd: this.config.defaultCwd,
+            maxConcurrency: this.config.maxConcurrency,
+        };
+        const pool = new AgentPool(Math.max(1, this.config.maxConcurrency)); // NOTE(review): assumes this.config.maxConcurrency is always a number — Math.max(1, undefined) is NaN; confirm the constructor normalises it.
+        let usage = ZERO_USAGE;
+        // Step 2: run proposer(s); accumulate usage and honour the budget before judging.
+        const candidates = [];
+        for (const proposerConfig of proposers) { // Proposers run one after another so the budget check can stop the remaining ones.
+            const r = await pool.runEphemeral(buildAgent(applyConsensusDefaults(proposerConfig, defaults)), prompt);
+            usage = addUsage(usage, r.tokenUsage);
+            if (r.success && r.output) // Failed or empty outputs are dropped but their usage is still counted.
+                candidates.push(r.output);
+            if (budget !== undefined && usage.input_tokens + usage.output_tokens > budget) {
+                this.config.onProgress?.({
+                    type: 'budget_exceeded',
+                    agent: proposerConfig.name,
+                    data: new TokenBudgetExceededError(proposerConfig.name, usage.input_tokens + usage.output_tokens, budget),
+                });
+                return {
+                    answer: candidates.join('\n\n---\n\n'), // Whatever was gathered so far; may be an empty string.
+                    verdict: 'rejected',
+                    dissent: [],
+                    rounds: 0,
+                    tokenUsage: usage,
+                };
+            }
+        }
+        // Every proposer failed or returned empty output: there is nothing to judge.
+        // Bail with a rejected verdict so an empty answer can never come back accepted.
+        if (candidates.length === 0) {
+            return { answer: '', verdict: 'rejected', dissent: [], rounds: 0, tokenUsage: usage };
+        }
+        return runConsensusCore({
+            team,
+            prompt,
+            initialAnswer: candidates.join('\n\n---\n\n'),
+            initialUsage: usage, // Proposer usage is carried in, so the returned tokenUsage covers the whole call.
+            budgetBaseTokens: 0,
+            judges: options.judges,
+            mode,
+            quorum,
+            maxRounds,
+            verdictSchema: options.verdictSchema,
+            onDissent,
+            judgePrompt: options.judgePrompt,
+            budget,
+            reviseProposer: proposers[0],
+            defaults,
+            onTrace: this.config.onTrace,
+            runId: this.config.onTrace ? generateRunId() : undefined, // A fresh run id per call, generated only when tracing is enabled.
+            pool,
+        });
+    }
+    // -------------------------------------------------------------------------
     // Observability
     // -------------------------------------------------------------------------
     /**
@@ -1398,6 +1842,9 @@ export class OpenMultiAgent {
             budgetExceededTriggered: false,
             budgetExceededReason: undefined,
             taskMetrics: new Map(),
+            modelRouting: options?.modelRouting,
+            taskById: new Map(queue.list().map((task) => [task.id, task])),
+            taskLeafById: new Map(queue.list().map((task) => [task.id, isLeafTask(task, queue.list())])),
         };
         await executeQueue(queue, ctx);
         const taskRecords = queue.list().map((task) => ({
@@ -1443,6 +1890,9 @@ export class OpenMultiAgent {
                 maxRetries: spec.maxRetries,
                 retryDelayMs: spec.retryDelayMs,
                 retryBackoff: spec.retryBackoff,
+                role: spec.role,
+                priority: spec.priority,
+                verify: spec.verify,
             });
             const titleKey = normalizeTitle(spec.title);
             if ((titleCounts.get(titleKey) ?? 0) === 1) {
@@ -1488,14 +1938,14 @@ export class OpenMultiAgent {
     buildPool(agentConfigs) {
         const pool = new AgentPool(this.config.maxConcurrency);
         for (const config of agentConfigs) {
-            const effective = {
+            const effective = applyDefaultToolPreset({
                 ...config,
                 model: config.model,
                 provider: config.provider ?? this.config.defaultProvider,
                 baseURL: config.baseURL ?? this.config.defaultBaseURL,
                 apiKey: config.apiKey ?? this.config.defaultApiKey,
                 cwd: config.cwd === undefined ? this.config.defaultCwd : config.cwd,
-            };
+            }, this.config.defaultToolPreset);
             pool.add(buildAgent(effective, { includeDelegateTool: true }));
         }
         return pool;